Repository: LibrePhotos/librephotos
Branch: dev
Commit: 460655fada5b
Files: 423
Total size: 2.3 MB

Directory structure:
gitextract_0h3h3ffo/

├── .coveragerc
├── .github/
│   ├── FUNDING.yml
│   ├── ISSUE_TEMPLATE/
│   │   ├── bug_report.md
│   │   └── enhancement-request.md
│   └── workflows/
│       ├── docker-publish.yml
│       └── pre-commit.yml
├── .gitignore
├── .pre-commit-config.yaml
├── CLAUDE.md
├── CONTRIBUTING.md
├── LICENSE
├── README.md
├── api/
│   ├── __init__.py
│   ├── admin.py
│   ├── all_tasks.py
│   ├── api_util.py
│   ├── apps.py
│   ├── autoalbum.py
│   ├── background_tasks.py
│   ├── batch_jobs.py
│   ├── burst_detection_rules.py
│   ├── cluster_manager.py
│   ├── date_time_extractor.py
│   ├── directory_watcher/
│   │   ├── __init__.py
│   │   ├── file_grouping.py
│   │   ├── file_handlers.py
│   │   ├── processing_jobs.py
│   │   ├── repair_jobs.py
│   │   ├── scan_jobs.py
│   │   └── utils.py
│   ├── drf_optimize.py
│   ├── duplicate_detection.py
│   ├── face_classify.py
│   ├── face_extractor.py
│   ├── face_recognition.py
│   ├── feature/
│   │   ├── __init__.py
│   │   ├── embedded_media.py
│   │   └── tests/
│   │       ├── __init__.py
│   │       └── test_embedded_media.py
│   ├── filters.py
│   ├── geocode/
│   │   ├── __init__.py
│   │   ├── config.py
│   │   ├── geocode.py
│   │   └── parsers/
│   │       ├── __init__.py
│   │       ├── mapbox.py
│   │       ├── nominatim.py
│   │       ├── opencage.py
│   │       └── tomtom.py
│   ├── image_captioning.py
│   ├── image_similarity.py
│   ├── llm.py
│   ├── management/
│   │   ├── __init__.py
│   │   └── commands/
│   │       ├── build_similarity_index.py
│   │       ├── clear_cache.py
│   │       ├── createadmin.py
│   │       ├── createuser.py
│   │       ├── save_metadata.py
│   │       ├── scan.py
│   │       ├── start_cleaning_service.py
│   │       ├── start_job_cleanup_service.py
│   │       └── start_service.py
│   ├── metadata/
│   │   ├── __init__.py
│   │   ├── face_regions.py
│   │   ├── reader.py
│   │   ├── tags.py
│   │   └── writer.py
│   ├── middleware.py
│   ├── migrations/
│   │   ├── 0001_initial.py
│   │   ├── 0002_add_confidence.py
│   │   ├── 0003_remove_unused_thumbs.py
│   │   ├── 0004_fix_album_thing_constraint.py
│   │   ├── 0005_add_video_to_photo.py
│   │   ├── 0006_migrate_to_boolean_field.py
│   │   ├── 0007_migrate_to_json_field.py
│   │   ├── 0008_remove_image_path.py
│   │   ├── 0009_add_aspect_ratio.py
│   │   ├── 0009_add_clip_embedding_field.py
│   │   ├── 0010_merge_20210725_1547.py
│   │   ├── 0011_a_add_rating.py
│   │   ├── 0011_b_migrate_favorited_to_rating.py
│   │   ├── 0011_c_remove_favorited.py
│   │   ├── 0012_add_favorite_min_rating.py
│   │   ├── 0013_add_image_scale_and_misc.py
│   │   ├── 0014_add_save_metadata_to_disk.py
│   │   ├── 0015_add_dominant_color.py
│   │   ├── 0016_add_transcode_videos.py
│   │   ├── 0017_add_cover_photo.py
│   │   ├── 0018_user_config_datetime_rules.py
│   │   ├── 0019_change_config_datetime_rules.py
│   │   ├── 0020_add_default_timezone.py
│   │   ├── 0021_remove_photo_image.py
│   │   ├── 0022_photo_video_length.py
│   │   ├── 0023_photo_deleted.py
│   │   ├── 0024_photo_timestamp.py
│   │   ├── 0025_add_cover_photo.py
│   │   ├── 0026_add_cluster_info.py
│   │   ├── 0027_rename_unknown_person.py
│   │   ├── 0028_add_metadata_fields.py
│   │   ├── 0029_change_to_text_field.py
│   │   ├── 0030_user_confidence_person.py
│   │   ├── 0031_remove_account.py
│   │   ├── 0032_always_have_owner.py
│   │   ├── 0033_add_post_delete_person.py
│   │   ├── 0034_allow_deleting_person.py
│   │   ├── 0035_add_files_model.py
│   │   ├── 0036_handle_missing_files.py
│   │   ├── 0037_migrate_to_files.py
│   │   ├── 0038_add_main_file.py
│   │   ├── 0039_remove_photo_image_paths.py
│   │   ├── 0040_add_user_public_sharing_flag.py
│   │   ├── 0041_apply_user_enum_for_person.py
│   │   ├── 0042_alter_albumuser_cover_photo_alter_photo_main_file.py
│   │   ├── 0043_alter_photo_size.py
│   │   ├── 0044_alter_cluster_person_alter_person_cluster_owner.py
│   │   ├── 0045_alter_face_cluster.py
│   │   ├── 0046_add_embedded_media.py
│   │   ├── 0047_alter_file_embedded_media.py
│   │   ├── 0048_fix_null_height.py
│   │   ├── 0049_fix_metadata_files_as_main_files.py
│   │   ├── 0050_person_face_count.py
│   │   ├── 0051_set_person_defaults.py
│   │   ├── 0052_alter_person_name.py
│   │   ├── 0053_user_confidence_unknown_face_and_more.py
│   │   ├── 0054_user_cluster_selection_epsilon_user_min_samples.py
│   │   ├── 0055_alter_longrunningjob_job_type.py
│   │   ├── 0056_user_llm_settings_alter_longrunningjob_job_type.py
│   │   ├── 0057_remove_face_image_path_and_more.py
│   │   ├── 0058_alter_user_avatar_alter_user_nextcloud_app_password_and_more.py
│   │   ├── 0059_person_cover_face.py
│   │   ├── 0060_apply_default_face_cover.py
│   │   ├── 0061_alter_person_name.py
│   │   ├── 0062_albumthing_cover_photos.py
│   │   ├── 0063_apply_default_album_things_cover.py
│   │   ├── 0064_albumthing_photo_count.py
│   │   ├── 0065_apply_default_photo_count.py
│   │   ├── 0066_photo_last_modified_alter_longrunningjob_job_type.py
│   │   ├── 0067_alter_longrunningjob_job_type.py
│   │   ├── 0068_remove_longrunningjob_result_and_more.py
│   │   ├── 0069_rename_to_in_trashcan.py
│   │   ├── 0070_photo_removed.py
│   │   ├── 0071_rename_person_label_probability_face_cluster_probability_and_more.py
│   │   ├── 0072_alter_face_person.py
│   │   ├── 0073_remove_unknown_person.py
│   │   ├── 0074_migrate_cluster_person.py
│   │   ├── 0075_alter_face_cluster_person.py
│   │   ├── 0076_alter_file_path_alter_longrunningjob_job_type_and_more.py
│   │   ├── 0077_alter_albumdate_title.py
│   │   ├── 0078_create_photo_thumbnail.py
│   │   ├── 0079_alter_albumauto_title.py
│   │   ├── 0080_create_photo_caption.py
│   │   ├── 0081_remove_caption_fields_from_photo.py
│   │   ├── 0082_create_photo_search.py
│   │   ├── 0083_remove_search_fields.py
│   │   ├── 0084_convert_arrayfield_to_json.py
│   │   ├── 0085_albumuser_public_expires_at_albumuser_public_slug.py
│   │   ├── 0086_remove_albumuser_public_and_more.py
│   │   ├── 0087_add_folder_album.py
│   │   ├── 0088_remove_folder_album.py
│   │   ├── 0089_add_text_alignment.py
│   │   ├── 0090_add_header_size.py
│   │   ├── 0091_alter_user_scan_directory.py
│   │   ├── 0092_add_skip_raw_files_field.py
│   │   ├── 0093_migrate_photon_to_nominatim.py
│   │   ├── 0094_add_slideshow_interval.py
│   │   ├── 0095_photo_perceptual_hash_alter_longrunningjob_job_type_and_more.py
│   │   ├── 0096_add_progress_step_and_result_to_longrunningjob.py
│   │   ├── 0097_add_duplicate_detection_settings_to_user.py
│   │   ├── 0098_add_photo_stack.py
│   │   ├── 0099_photo_uuid_primary_key.py
│   │   ├── 0100_metadataedit_metadatafile_photometadata_stackreview_and_more.py
│   │   ├── 0101_populate_photo_metadata.py
│   │   ├── 0102_photo_stacks_manytomany.py
│   │   ├── 0103_remove_photo_metadata_fields.py
│   │   ├── 0104_remove_photostack_potential_savings_and_more.py
│   │   ├── 0105_alter_photo_image_hash.py
│   │   ├── 0106_alter_longrunningjob_options.py
│   │   ├── 0107_add_burst_detection_rules.py
│   │   ├── 0108_add_stack_raw_jpeg_field.py
│   │   ├── 0109_migrate_skip_raw_to_stack_raw_jpeg.py
│   │   ├── 0110_fix_file_embedded_media_self_reference.py
│   │   ├── 0111_alter_file_embedded_media.py
│   │   ├── 0112_convert_file_stacks_to_variants.py
│   │   ├── 0113_alter_photostack_stack_type.py
│   │   ├── 0114_add_file_path_unique.py
│   │   ├── 0115_cleanup_duplicate_photos.py
│   │   ├── 0116_cleanup_duplicate_groups_removed_photos.py
│   │   ├── 0117_delete_removed_photos.py
│   │   ├── 0118_alter_longrunningjob_job_type.py
│   │   ├── 0119_add_public_sharing_options.py
│   │   ├── 0120_rename_thumbnails_uuid_to_hash.py
│   │   ├── 0121_add_default_tagging_model.py
│   │   ├── 0121_user_save_face_tags_to_disk.py
│   │   └── __init__.py
│   ├── ml_models.py
│   ├── models/
│   │   ├── __init__.py
│   │   ├── album_auto.py
│   │   ├── album_date.py
│   │   ├── album_place.py
│   │   ├── album_thing.py
│   │   ├── album_user.py
│   │   ├── album_user_share.py
│   │   ├── cluster.py
│   │   ├── duplicate.py
│   │   ├── face.py
│   │   ├── file.py
│   │   ├── long_running_job.py
│   │   ├── person.py
│   │   ├── photo.py
│   │   ├── photo_caption.py
│   │   ├── photo_metadata.py
│   │   ├── photo_search.py
│   │   ├── photo_stack.py
│   │   ├── stack_review.py
│   │   ├── thumbnail.py
│   │   └── user.py
│   ├── nextcloud.py
│   ├── perceptual_hash.py
│   ├── permissions.py
│   ├── schemas/
│   │   └── site_settings.py
│   ├── semantic_search.py
│   ├── serializers/
│   │   ├── PhotosGroupedByDate.py
│   │   ├── __init__.py
│   │   ├── album_auto.py
│   │   ├── album_date.py
│   │   ├── album_place.py
│   │   ├── album_thing.py
│   │   ├── album_user.py
│   │   ├── face.py
│   │   ├── job.py
│   │   ├── person.py
│   │   ├── photo_metadata.py
│   │   ├── photos.py
│   │   ├── simple.py
│   │   └── user.py
│   ├── services.py
│   ├── social_graph.py
│   ├── stack_detection.py
│   ├── stacks/
│   │   ├── __init__.py
│   │   └── live_photo.py
│   ├── stats.py
│   ├── tests/
│   │   ├── __init__.py
│   │   ├── fixtures/
│   │   │   ├── __init__.py
│   │   │   ├── api_util/
│   │   │   │   ├── captions_json.py
│   │   │   │   ├── expectation.py
│   │   │   │   ├── photos.py
│   │   │   │   └── sunburst_expectation.py
│   │   │   ├── geocode/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── expectations/
│   │   │   │   │   ├── mapbox.py
│   │   │   │   │   ├── nominatim.py
│   │   │   │   │   ├── opencage.py
│   │   │   │   │   └── tomtom.py
│   │   │   │   └── responses/
│   │   │   │       ├── mapbox.py
│   │   │   │       ├── nominatim.py
│   │   │   │       ├── opencage.py
│   │   │   │       └── tomtom.py
│   │   │   ├── location_timeline_test_data.csv
│   │   │   └── niaz.xmp
│   │   ├── test_api_robustness.py
│   │   ├── test_api_util.py
│   │   ├── test_auto_select_and_savings.py
│   │   ├── test_background_tasks.py
│   │   ├── test_bktree_and_duplicate_detection.py
│   │   ├── test_bulk_operations.py
│   │   ├── test_burst_detection_rules.py
│   │   ├── test_burst_filename_patterns.py
│   │   ├── test_delete_photos.py
│   │   ├── test_detection_edge_cases.py
│   │   ├── test_directory_watcher_fix.py
│   │   ├── test_dirtree.py
│   │   ├── test_duplicate_api_edge_cases.py
│   │   ├── test_duplicate_detection.py
│   │   ├── test_duplicate_detection_logic.py
│   │   ├── test_duplicate_filtering.py
│   │   ├── test_edge_cases_integration.py
│   │   ├── test_edit_photo_details.py
│   │   ├── test_face_extractor.py
│   │   ├── test_face_writeback.py
│   │   ├── test_favorite_photos.py
│   │   ├── test_file_model.py
│   │   ├── test_file_path_uniqueness.py
│   │   ├── test_geocode.py
│   │   ├── test_get_faces.py
│   │   ├── test_hide_photos.py
│   │   ├── test_im2txt.py
│   │   ├── test_live_photo.py
│   │   ├── test_location_timeline.py
│   │   ├── test_metadata_ordering_sentinel.py
│   │   ├── test_migration_0099.py
│   │   ├── test_migration_0101.py
│   │   ├── test_multi_user_isolation.py
│   │   ├── test_only_photos_or_only_videos.py
│   │   ├── test_perceptual_hash.py
│   │   ├── test_photo_caption_model.py
│   │   ├── test_photo_captions.py
│   │   ├── test_photo_lifecycle.py
│   │   ├── test_photo_list_without_timestamp.py
│   │   ├── test_photo_metadata.py
│   │   ├── test_photo_metadata_api.py
│   │   ├── test_photo_model_integration.py
│   │   ├── test_photo_search_model.py
│   │   ├── test_photo_search_refactor.py
│   │   ├── test_photo_summary.py
│   │   ├── test_photo_viewset_permissions.py
│   │   ├── test_predefined_rules.py
│   │   ├── test_public_photos.py
│   │   ├── test_reading_exif.py
│   │   ├── test_recently_added_photos.py
│   │   ├── test_redetection_idempotency.py
│   │   ├── test_regenerate_titles.py
│   │   ├── test_retrieve_photo.py
│   │   ├── test_scan_percentage_bug.py
│   │   ├── test_scan_photos.py
│   │   ├── test_scan_photos_directories.py
│   │   ├── test_search_term_examples.py
│   │   ├── test_search_terms.py
│   │   ├── test_services.py
│   │   ├── test_setup_directory.py
│   │   ├── test_share_photos.py
│   │   ├── test_skip_raw_files.py
│   │   ├── test_social_graph.py
│   │   ├── test_stack_api_edge_cases.py
│   │   ├── test_stack_detection.py
│   │   ├── test_stack_detection_edge_cases.py
│   │   ├── test_stack_detection_logic.py
│   │   ├── test_stack_duplicate_integration.py
│   │   ├── test_stack_review.py
│   │   ├── test_stack_validation_edge_cases.py
│   │   ├── test_stats_accuracy.py
│   │   ├── test_thumbnail_migration.py
│   │   ├── test_thumbnail_naming.py
│   │   ├── test_trash_api.py
│   │   ├── test_user.py
│   │   ├── test_xmp_association.py
│   │   ├── test_zip_list_photos_view_v2.py
│   │   └── utils.py
│   ├── thumbnails.py
│   ├── util.py
│   └── views/
│       ├── __init__.py
│       ├── album_auto.py
│       ├── album_folder.py
│       ├── albums.py
│       ├── custom_api_view.py
│       ├── dataviz.py
│       ├── duplicates.py
│       ├── faces.py
│       ├── geocode.py
│       ├── jobs.py
│       ├── pagination.py
│       ├── photo_filters.py
│       ├── photo_metadata.py
│       ├── photos.py
│       ├── public_albums.py
│       ├── search.py
│       ├── services.py
│       ├── sharing.py
│       ├── stacks.py
│       ├── timezone.py
│       ├── upload.py
│       ├── user.py
│       └── views.py
├── image_similarity/
│   ├── __init__.py
│   ├── main.py
│   ├── retrieval_index.py
│   └── utils.py
├── librephotos/
│   ├── __init__.py
│   ├── settings/
│   │   ├── __init__.py
│   │   ├── development.py
│   │   ├── production.py
│   │   ├── test.py
│   │   └── test_sqlite.py
│   ├── urls.py
│   └── wsgi.py
├── manage.py
├── nextcloud/
│   ├── __init__.py
│   ├── admin.py
│   ├── apps.py
│   ├── directory_watcher.py
│   ├── models.py
│   ├── tests.py
│   └── views.py
├── pyproject.toml
├── renovate.json
├── requirements.dev.txt
├── requirements.mlval.txt
├── requirements.txt
└── service/
    ├── __init__.py
    ├── clip_embeddings/
    │   ├── __init__.py
    │   ├── main.py
    │   └── semantic_search/
    │       ├── __init__.py
    │       └── semantic_search.py
    ├── exif/
    │   ├── __init__.py
    │   └── main.py
    ├── face_recognition/
    │   ├── __init__.py
    │   └── main.py
    ├── image_captioning/
    │   ├── __init__.py
    │   ├── api/
    │   │   └── im2txt/
    │   │       ├── README.md
    │   │       ├── blip/
    │   │       │   ├── blip.py
    │   │       │   ├── med.py
    │   │       │   └── vit.py
    │   │       ├── build_vocab.py
    │   │       ├── data_loader.py
    │   │       ├── model.py
    │   │       ├── resize.py
    │   │       ├── sample.py
    │   │       └── train.py
    │   └── main.py
    ├── llm/
    │   ├── __init__.py
    │   └── main.py
    ├── tags/
    │   ├── __init__.py
    │   ├── main.py
    │   ├── places365/
    │   │   ├── __init__.py
    │   │   ├── places365.py
    │   │   └── wideresnet.py
    │   └── siglip2/
    │       ├── __init__.py
    │       ├── siglip2.py
    │       └── tags.txt
    └── thumbnail/
        ├── __init__.py
        ├── main.py
        └── test/
            ├── .gitignore
            ├── __init__.py
            ├── samples/
            │   ├── .gitkeep
            │   └── README.md
            └── test_thumbnail_worker.py

================================================
FILE CONTENTS
================================================

================================================
FILE: .coveragerc
================================================
[run]
branch = True

[report]
skip_covered = True
skip_empty = True
# show_missing = True

[html]
skip_covered = True
skip_empty = True


================================================
FILE: .github/FUNDING.yml
================================================
github: derneuere
custom: https://www.paypal.com/donate/?hosted_button_id=5JWVM2UR4LM96


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.md
================================================
---
name: Bug report
about: Create a report to help us improve
title: ''
labels: bug
assignees: ''

---

# 🛑 Before you create an issue make sure that:
- Your issue is **strictly related to LibrePhotos** itself. Questions about setting up a reverse proxy belong in what ever reverse proxy you are using. 
- You have read the [documentation](https://docs.librephotos.com) thoroughly.
- You have searched for a similar issue among all the former issues (even closed ones).
- You have tried to replicate the issue with a clean install of the project.
- You have asked for help on our Discord server [LibrePhotos](https://discord.gg/xwRvtSDGWb) if your issue involves general "how to" questions

**When Submitting please remove every thing above this line**


# 🐛 Bug Report

* [ ] 📁 I've Included a ZIP file containing my librephotos `log` files
* [ ] ❌ I have looked for similar issues (including closed ones)
* [ ] 🎬 (If applicable) I've provided pictures or links to videos that clearly demonstrate the issue 

## 📝 Description of issue:


## 🔁 How can we reproduce it:


## Please provide additional information:
- 💻 Operating system: 
- ⚙ Architecture (x86 or ARM): 
- 🔢 Librephotos version: 
- 📸 Librephotos installation method (Docker, Kubernetes, .deb, etc.): 
    * 🐋 If Docker or Kubernets, provide docker-compose image tag:
- 📁 How is you picture library mounted (Local file system (Type), NFS, SMB, etc.): 
- ☁ If you are virtualizing librephotos, Virtualization platform (Proxmox, Xen, HyperV, etc.): 


================================================
FILE: .github/ISSUE_TEMPLATE/enhancement-request.md
================================================
---
name: Enhancement request
about: Suggest an idea for this project
title: ''
labels: enhancement
assignees: ''

---

**Describe the enhancement you'd like**
A clear and concise description of what you want to happen.

**Describe why this will benefit the LibrePhotos**
A clear and concise explanation on why this will make LibrePhotos better.

**Additional context**
Add any other context or screenshots about the enhancement request here.


================================================
FILE: .github/workflows/docker-publish.yml
================================================
on:
  push:
    # Publish `dev` as Docker `latest` image.
    branches:
      - dev

jobs:
  # Run tests.
  # See also https://docs.docker.com/docker-hub/builds/automated-testing/
  test:
    runs-on: ubuntu-latest

    steps:
      - uses: actions/checkout@08eba0b27e820071cde6df949e0beb9ba4906955 # v4
      - name: Run tests
        run: echo "to-do"

  # Push image to GitHub Packages.
  # See also https://docs.docker.com/docker-hub/builds/
  push:
    # Ensure test job passes before pushing image.
    needs: test

    runs-on: ubuntu-latest
    if: github.event_name == 'push'

    steps:
      - name: Repository Dispatch
        uses: peter-evans/repository-dispatch@v3
        with:
          token: ${{ secrets.REPO_ACCESS_TOKEN }}
          repository: librephotos/librephotos-docker
          event-type: backend-commit-event


================================================
FILE: .github/workflows/pre-commit.yml
================================================
name: Linting (using pre-commit)

on: [push, pull_request]

jobs:
  pre-commit:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Install dependencies
        run: pip install ruff
      - name: Run pre-commit check
        uses: pre-commit/action@v3.0.1


================================================
FILE: .gitignore
================================================
# Byte-compiled / optimized / DLL files
__pycache__/
*.py[cod]
*$py.class

# C extensions
*.so

# Docker
Dockerfile
entrypoint.sh

# Static assets
static/

# Nuitka
manage.build/
manage.dist/

# Distribution / packaging
.Python
build/
develop-eggs/
dist/
downloads/
eggs/
.eggs/
lib/
lib64/
parts/
sdist/
var/
wheels/
share/python-wheels/
*.egg-info/
.installed.cfg
*.egg
MANIFEST

# PyInstaller
#  Usually these files are written by a python script from a template
#  before PyInstaller builds the exe, so as to inject date/other infos into it.
*.manifest
*.spec

# Installer logs
pip-log.txt
pip-delete-this-directory.txt

# Unit test / coverage reports
htmlcov/
.tox/
.nox/
.coverage
.coverage.*
.cache
nosetests.xml
coverage.xml
*.cover
*.py,cover
.hypothesis/
.pytest_cache/
cover/
coco/
survey/

# Translations
*.mo
*.pot

# Django stuff:
*.log
local_settings.py
db.sqlite3
db.sqlite3-journal

# Flask stuff:
instance/
.webassets-cache

# Scrapy stuff:
.scrapy

# Sphinx documentation
docs/_build/

# PyBuilder
.pybuilder/
target/

# Jupyter Notebook
.ipynb_checkpoints

# IPython
profile_default/
ipython_config.py

# pyenv
#   For a library or package, you might want to ignore these files since the code is
#   intended to run in multiple environments; otherwise, check them in:
# .python-version

# pipenv
#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
#   However, in case of collaboration, if having platform-specific dependencies or dependencies
#   having no cross-platform support, pipenv may install dependencies that don't work, or not
#   install all needed dependencies.
#Pipfile.lock

# PEP 582; used by e.g. github.com/David-OConnor/pyflow
__pypackages__/

# Celery stuff
celerybeat-schedule
celerybeat.pid

# SageMath parsed files
*.sage.py

# Environments
.env
.venv
env/
venv/
ENV/
env.bak/
venv.bak/

# Spyder project settings
.spyderproject
.spyproject

# Rope project settings
.ropeproject

# visual studio
.vs/
.vscode/

# IntelliJ
.idea/

# mkdocs documentation
/site

# mypy
.mypy_cache/
.dmypy.json
dmypy.json

# Pyre type checker
.pyre/

# pytype static type analyzer
.pytype/

# Cython debug symbols
cython_debug/

# LibrePhotos
densecap/data/models/densecap/densecap-pretrained-vgg16.t7
*/*.pkl
*/*/*.pkl
thumbnails
media
samplephotos
Conv2d.patch
Linear.patch
Sequential.patch
BatchNorm2d.patch
AvgPool2d.patch
ReLU.patch
run_docker.sh
logs/
playground
api/im2txt/data/
api/im2txt/models/
api/im2txt/png/
*.ipynb
api/im2txt/*.tar.gz
*.db
media*
protected_media
report_dynamo_export.sarif

# Vim
*.swp
*.swo


================================================
FILE: .pre-commit-config.yaml
================================================
default_language_version:
  python: python3

repos:
  - repo: https://github.com/astral-sh/ruff-pre-commit
    rev: v0.9.4 # Check latest version
    hooks:
      - id: ruff
        args: ["--fix"] # Fix lint & format

      - id: ruff-format # Format code


================================================
FILE: CLAUDE.md
================================================
# LibrePhotos Backend Agent Guidelines

## Build & Development Commands

**Note:** All commands should be run inside the backend Docker container (`docker exec -it backend bash`).

### Django Management
- **Run Migrations**: `python manage.py migrate`
- **Make Migrations**: `python manage.py makemigrations`
- **Create Superuser**: `python manage.py createsuperuser`
- **Collect Static**: `python manage.py collectstatic`
- **Shell**: `python manage.py shell`
- **Custom Commands**: `python manage.py <command_name>` (see `api/management/commands/`)

### Running Services
- **API Server (Gunicorn)**: Runs automatically in container
- **Background Jobs (django-q2)**: Runs automatically via `qcluster` command
- **Image Similarity Service**: Flask app for semantic search
- **Thumbnail Service**: Separate process for image processing

### Linting & Formatting
- **Lint**: `ruff check .`
- **Format**: `ruff format .`
- **Lint + Fix**: `ruff check --fix .`

### Testing
- **Run All Tests**: `python manage.py test api.tests`
- **Run Specific Test**: `python manage.py test api.tests.test_module`
- **Run with Verbosity**: `python manage.py test api.tests -v 2`

### Debugging
- **PDB Breakpoint**: Add `import pdb; pdb.set_trace()` in code
- **Attach to Container**: `docker attach $(docker ps --filter name=backend -q)`
- **Silk Profiler**: Access `/api/silk` (dev mode only)
- **Detach**: `Ctrl+P` then `Ctrl+Q`

## Code Style & Conventions

- **Formatting**: Ruff with 88 char line width (configured in `pyproject.toml`)
- **Imports**: Sorted by isort (via Ruff)
- **Target Python**: 3.11+
- **Framework**: Django 5.x with Django REST Framework
- **Async Jobs**: django-q2 with ORM broker
- **ML Framework**: PyTorch for machine learning models

## Project Structure

### `api/` - Main Application
- `models/` - Django ORM models (Photo, Face, Person, Album, etc.)
- `views/` - API endpoints using Django REST Framework
- `serializers/` - JSON serialization for models
- `management/commands/` - CLI commands (`python manage.py <cmd>`)
- `migrations/` - Database migrations
- `tests/` - Test suite
- `geocode/` - Reverse geocoding functionality
- `feature/` - Feature extraction utilities

### `service/` - Microservices
- `clip_embeddings/` - CLIP model for semantic search
- `face_recognition/` - Face detection and recognition
- `image_captioning/` - Image captioning (im2txt, BLIP)
- `thumbnail/` - Thumbnail generation
- `llm/` - LLM integration for chat features
- `tags/` - Tag extraction (places365)
- `exif/` - EXIF metadata extraction

### `image_similarity/` - Similarity Search
- FAISS-based image retrieval index
- Flask REST API for similarity queries

### Key Files
- `manage.py` - Django management script
- `requirements.txt` - Python dependencies
- `pyproject.toml` - Ruff/project configuration
- `librephotos/settings/` - Django settings (base, dev, prod)
- `librephotos/urls.py` - URL routing

## Environment Variables

Key environment variables (set in Docker or `.env`):
- `DEBUG` - Enable debug mode (0 or 1)
- `SECRET_KEY` - Django secret key
- `DB_*` - Database connection settings
- `MAPBOX_API_KEY` - For map features
- `WEB_CONCURRENCY` - Gunicorn worker count

## Common Patterns

### Adding a New API Endpoint
1. Create/update model in `api/models/`
2. Create serializer in `api/serializers/`
3. Create view in `api/views/`
4. Add URL in `librephotos/urls.py`
5. Run migrations if model changed

### Adding a New Background Job
1. Define task function in `api/all_tasks.py` or relevant module
2. Use `@shared_task` decorator for django-q2
3. Queue with `async_task()` or schedule in admin

### Adding a New ML Model
1. Add model loading in `api/ml_models.py`
2. Create service wrapper in `service/<model_name>/`
3. Integrate with API views as needed


================================================
FILE: CONTRIBUTING.md
================================================
# Contributing to LibrePhotos

Thank you for your interest in contributing to LibrePhotos! This guide will help you get started with the development process.

## Table of Contents

- [Development Environment Setup](#development-environment-setup)
- [Docker & Docker Compose](#docker--docker-compose)
- [IDE Recommendations](#ide-recommendations)
- [Code Quality Standards](#code-quality-standards)
- [How to Open a Pull Request](#how-to-open-a-pull-request)
- [Getting Help](#getting-help)

---

## Development Environment Setup

### Prerequisites

- **Git** - for version control
- **Docker** and **Docker Compose** - for running the development environment
- **Node.js 18+** and **Yarn** - for frontend development (optional, if developing outside Docker)
- **Python 3.11+** - for backend development (optional, if developing outside Docker)

### Step 1: Clone the Repositories

Create a directory for the project and clone all required repositories:

**Linux/macOS:**
```bash
export codedir=~/dev/librephotos
mkdir -p $codedir
cd $codedir

git clone https://github.com/LibrePhotos/librephotos-frontend.git
git clone https://github.com/LibrePhotos/librephotos.git
git clone https://github.com/LibrePhotos/librephotos-docker.git
```

**Windows (PowerShell):**
```powershell
$Env:codedir = "$HOME\dev\librephotos"
New-Item -ItemType Directory -Force -Path $Env:codedir
Set-Location $Env:codedir

git clone https://github.com/LibrePhotos/librephotos-frontend.git
git clone https://github.com/LibrePhotos/librephotos.git
git clone https://github.com/LibrePhotos/librephotos-docker.git
```

### Step 2: Configure Environment

Navigate to the `librephotos-docker` directory and create your `.env` file:

```bash
cd librephotos-docker
cp librephotos.env .env
```

Edit the `.env` file and set these critical variables:

```bash
# Path to your photo library (for testing)
scanDirectory=/path/to/your/test/photos

# Path to LibrePhotos data
data=./librephotos/data

# IMPORTANT: Path where you cloned the repositories
codedir=~/dev/librephotos
```

### Step 3: Start the Development Environment

```bash
docker compose -f docker-compose.yml -f docker-compose.dev.yml up -d
```

This command:
- Builds development images with hot-reload enabled
- Mounts your local source code into the containers
- Starts all required services (backend, frontend, database, proxy)

Access LibrePhotos at: **http://localhost:3000**

### Rebuilding After Dependency Changes

If you add new dependencies to `requirements.txt` or `package.json`:

```bash
# Rebuild backend
docker compose -f docker-compose.yml -f docker-compose.dev.yml build --no-cache backend

# Rebuild frontend
docker compose -f docker-compose.yml -f docker-compose.dev.yml build --no-cache frontend

# Restart containers
docker compose -f docker-compose.yml -f docker-compose.dev.yml up -d
```

---

## Docker & Docker Compose

### Architecture Overview

LibrePhotos uses a microservices architecture with four main containers:

| Container   | Purpose                                              |
|-------------|------------------------------------------------------|
| `backend`   | Django API server, ML models, background jobs        |
| `frontend`  | React web application                                |
| `proxy`     | Nginx reverse proxy, serves static files             |
| `db`        | PostgreSQL database                                  |

### Useful Docker Commands

```bash
# View running containers
docker compose ps

# View logs (all containers)
docker compose -f docker-compose.yml -f docker-compose.dev.yml logs -f

# View logs (specific container)
docker compose -f docker-compose.yml -f docker-compose.dev.yml logs -f backend

# Restart a container
docker compose -f docker-compose.yml -f docker-compose.dev.yml restart backend

# Stop all containers
docker compose -f docker-compose.yml -f docker-compose.dev.yml down

# Stop and remove volumes (fresh start)
docker compose -f docker-compose.yml -f docker-compose.dev.yml down -v

# Execute command in container
docker exec -it backend bash
docker exec -it frontend sh

# Run Django management commands
docker exec -it backend python manage.py migrate
docker exec -it backend python manage.py createsuperuser
```

### Development vs Production

| Aspect            | Development (`docker-compose.dev.yml`)              | Production (`docker-compose.yml`)    |
|-------------------|-----------------------------------------------------|--------------------------------------|
| Source code       | Mounted from local filesystem                       | Built into image                     |
| Hot reload        | ✅ Enabled                                           | ❌ Disabled                           |
| Debug mode        | ✅ `DEBUG=1`                                         | ❌ `DEBUG=0`                          |
| Build time        | Longer (builds from source)                         | Fast (pulls pre-built images)        |
| Additional tools  | pgAdmin available on port 3001                      | Minimal                              |

---

## IDE Recommendations

### VS Code (Recommended)

VS Code is the recommended IDE with excellent Docker and Python support.

**Recommended Extensions:**
- **Python** - Python language support
- **Pylance** - Fast Python language server
- **Docker** - Docker container management
- **Remote - Containers** - Develop inside Docker containers
- **ESLint** - JavaScript/TypeScript linting
- **Prettier** - Code formatting

**Workspace Settings:**

The repository includes VS Code settings in `librephotos-docker/vscode/settings.json` that are automatically mounted into the backend container.

**Attaching to Backend Container:**

For the best development experience, you can attach VS Code directly to the running backend container:

1. Install the "Remote - Containers" extension
2. Open Command Palette (`Ctrl+Shift+P`)
3. Run "Remote-Containers: Attach to Running Container"
4. Select the `backend` container
5. Open the `/code` folder

### PyCharm

PyCharm Professional supports Docker interpreters natively:

1. Go to Settings → Project → Python Interpreter
2. Add Interpreter → On Docker Compose
3. Select the `docker-compose.yml` and `docker-compose.dev.yml` files
4. Choose the `backend` service

### Other IDEs

Any IDE with Python and TypeScript support will work. Key requirements:
- Python 3.11+ interpreter support
- ESLint/Prettier integration for frontend
- Docker integration (optional but helpful)

---

## Code Quality Standards

### Backend (Python/Django)

**Linting and Formatting:**

We use `ruff` for linting and formatting (configured in `pyproject.toml`):

```bash
# Inside the backend container
cd /code
pip install ruff
ruff check .
ruff format .
```

**Pre-commit Hooks:**

Install pre-commit hooks for automatic formatting:

```bash
pip install pre-commit
pre-commit install
```

**Code Style:**
- Line length: 88 characters
- Use type hints where practical
- Follow PEP 8 naming conventions
- Write docstrings for public functions

### Frontend (React/TypeScript)

**Linting and Formatting:**

```bash
# Inside frontend container or locally
yarn lint:error        # Check for errors
yarn lint:warning:fix  # Fix linting issues
```

**Code Style:**
- Line length: 120 characters
- Use Prettier for formatting (configured in `prettier.config.cjs`)
- Prefer TypeScript types over interfaces (project convention)
- Use functional components with hooks
- Follow the slice pattern for Redux state management

### Pull Request Checklist

Before submitting a PR, ensure:

- [ ] Code follows the project's style guidelines
- [ ] All linting passes without errors
- [ ] New features include tests (if applicable)
- [ ] Documentation is updated (if needed)
- [ ] Commit messages are clear and descriptive
- [ ] The PR addresses a single concern/feature

---

## How to Open a Pull Request

### Step 1: Fork the Repository

1. Navigate to the repository you want to contribute to on GitHub
2. Click the "Fork" button in the top right corner
3. Clone your fork locally:

```bash
git clone https://github.com/YOUR-USERNAME/librephotos.git
cd librephotos
git remote add upstream https://github.com/LibrePhotos/librephotos.git
```

### Step 2: Create a Feature Branch

Always create a new branch for your work:

```bash
git checkout -b feature/my-awesome-feature
# or
git checkout -b fix/bug-description
```

### Step 3: Make Your Changes

1. Write your code following the code quality standards above
2. Test your changes thoroughly
3. Commit your changes with descriptive messages:

```bash
git add .
git commit -m "feat: add support for XYZ"
# or
git commit -m "fix: resolve issue with ABC"
```

**Commit Message Guidelines:**
- Use present tense ("add feature" not "added feature")
- Keep the first line under 72 characters
- Reference issues when applicable: `fix: resolve login bug (#123)`

### Step 4: Push and Create Pull Request

```bash
git push origin feature/my-awesome-feature
```

Then on GitHub:
1. Navigate to your fork
2. Click "Compare & pull request"
3. Fill out the PR template with:
   - Clear description of changes
   - Reference to related issues
   - Screenshots (for UI changes)
   - Testing instructions

### Step 5: Respond to Review

- Address reviewer feedback promptly
- Make requested changes in new commits
- Be open to suggestions and discussion

---

## Getting Help

- **Discord:** [Join our Discord server](https://discord.gg/xwRvtSDGWb)
- **GitHub Issues:** [Report bugs or request features](https://github.com/LibrePhotos/librephotos/issues)
- **Documentation:** [docs.librephotos.com](https://docs.librephotos.com)
- **Development Videos:** [Niaz Faridani-Rad's YouTube channel](https://www.youtube.com/channel/UCZJ2pk2BPKxwbuCV9LWDR0w)

### Debugging Tips

**Backend (Django):**

Use `pdb` for debugging:

```python
import pdb; pdb.set_trace()
```

Then attach to the container:

```bash
docker attach $(docker ps --filter name=backend -q)
```

Press `Ctrl+P` followed by `Ctrl+Q` to detach without stopping the container.

**Frontend (React):**

- Use React DevTools browser extension
- Use Redux DevTools for state debugging
- Enable WDYR by setting `WDYR=True` in your `.env`

**API Documentation:**

After starting LibrePhotos, access the API docs at:
- Swagger: http://localhost:3000/api/swagger
- ReDoc: http://localhost:3000/api/redoc

---

## License

By contributing to LibrePhotos, you agree that your contributions will be licensed under the MIT License.

Thank you for contributing! 🎉


================================================
FILE: LICENSE
================================================
MIT License

Copyright (c) 2017 Hooram Nam

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.


================================================
FILE: README.md
================================================
[![Discord](https://img.shields.io/discord/784619049208250388?style=plastic)][discord] [![Website](https://img.shields.io/website?down_color=lightgrey&down_message=offline&style=plastic&up_color=blue&up_message=online&url=https%3A%2F%2Flibrephotos.com)](https://librephotos.com/)
[![Read the docs](https://img.shields.io/static/v1?label=Read&message=the%20docs&color=blue&style=plastic)](https://docs.librephotos.com/) [![GitHub contributors](https://img.shields.io/github/contributors/librephotos/librephotos?style=plastic)](https://github.com/LibrePhotos/librephotos/graphs/contributors) [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg?style=plastic)](https://github.com/LibrePhotos/librephotos/blob/dev/LICENSE)
<a href="https://hosted.weblate.org/engage/librephotos/">
<img src="https://hosted.weblate.org/widgets/librephotos/-/librephotos-frontend/svg-badge.svg" alt="Translation status" />
</a>

# LibrePhotos

![](https://github.com/LibrePhotos/librephotos/blob/dev/screenshots/mockups_main_fhd.png?raw=true)
<sub>Mockup designed by rawpixel.com / Freepik</sub>

A self-hosted, open-source photo management service with automatic face recognition, object detection, and semantic search — powered by modern machine learning.

- **Stable** demo is available here: https://demo1.librephotos.com/ . User is ```demo```, password is ```demo1234``` (with sample images).
- Latest **development** demo is available here: https://demo2.librephotos.com/ (same user/password)
- You can watch development videos on [Niaz Faridani-Rad's channel](https://www.youtube.com/channel/UCZJ2pk2BPKxwbuCV9LWDR0w)
- You can join our [Discord][discord].

## Installation

Step-by-step installation instructions are available in our [documentation](https://docs.librephotos.com/docs/installation/standard-install).

### System Requirements

| Resource | Minimum | Recommended |
|----------|---------|-------------|
| RAM      | 4 GB    | 8 GB+       |
| Storage  | 10 GB (plus your photo library) | SSD recommended |
| CPU      | 2 cores | 4+ cores    |
| OS       | Any Docker-compatible OS | Linux |

> **Note:** Machine learning features (face recognition, scene classification, image captioning) are memory-intensive. 8 GB+ RAM is strongly recommended for smooth operation.

## Features

  - Support for all types of photos including raw photos
  - Support for videos
  - Timeline view
  - Scans pictures on the file system
  - Multiuser support
  - Generate albums based on events like "Thursday in Berlin"
  - Face recognition / Face classification
  - Reverse geocoding
  - Object / Scene detection
  - Semantic image search
  - Search by metadata

## Tech Stack

### Backend

- **Framework:** [Django 5](https://www.djangoproject.com/) with [Django REST Framework](https://www.django-rest-framework.org/)
- **Database:** [PostgreSQL](https://www.postgresql.org/)
- **Task Queue:** [Django-Q2](https://github.com/django-q2/django-q2)
- **Image Conversion:** [ImageMagick](https://github.com/ImageMagick/ImageMagick)
- **Video Conversion:** [FFmpeg](https://github.com/FFmpeg/FFmpeg)
- **Exif Support:** [ExifTool](https://github.com/exiftool/exiftool)

### Frontend

- **UI:** [React 18](https://react.dev/) with [TypeScript](https://www.typescriptlang.org/)
- **Build Tool:** [Vite](https://vite.dev/)
- **Component Library:** [Mantine](https://mantine.dev/)
- **Routing:** [TanStack Router](https://tanstack.com/router)
- **Data Fetching:** [TanStack Query](https://tanstack.com/query)
- **Maps:** [MapLibre GL](https://maplibre.org/)
- **Internationalization:** [i18next](https://www.i18next.com/)

### Machine Learning

- **Face detection:** [face_recognition](https://github.com/ageitgey/face_recognition)
- **Face classification/clustering:** [scikit-learn](https://scikit-learn.org/) and [hdbscan](https://github.com/scikit-learn-contrib/hdbscan)
- **Image captioning:** [im2txt](https://github.com/HughKu/Im2txt)
- **Scene classification:** [places365](http://places.csail.mit.edu/)
- **Reverse geocoding:** [geopy](https://github.com/geopy/geopy)

### Infrastructure

- **Deployment:** [Docker](https://www.docker.com/) & [Docker Compose](https://docs.docker.com/compose/)
- **Reverse Proxy:** [Nginx](https://nginx.org/)

### API Documentation

After starting LibrePhotos, interactive API docs are available at:

- **Swagger UI:** `http://localhost:3000/api/swagger`
- **ReDoc:** `http://localhost:3000/api/redoc`

## How to help out

- ⭐ **Star** this repository if you like this project!
- 🚀 **Developing**: Get started in less than 30 minutes by following [this guide](https://docs.librephotos.com/docs/development/dev-install). Also see our [CONTRIBUTING.md](CONTRIBUTING.md) for detailed development setup, code quality standards, and PR guidelines.
- 🗒️ **Documentation**: Improving the documentation is as simple as submitting a pull request [here](https://github.com/LibrePhotos/librephotos.docs)
- 🧪 **Testing**: If you want to help find bugs, use the ```dev``` tag and update it regularly. If you find a bug, open an issue.
- 🧑‍🤝‍🧑 **Outreach**: Talk about this project with other people and help them to get started too!
- 🌐 **Translations**: Make LibrePhotos accessible to more people with [weblate](https://hosted.weblate.org/engage/librephotos/).
- 💸 [**Donate**](https://github.com/sponsors/derneuere) to the developers of LibrePhotos

## Related Projects

| Repository | Description |
|------------|-------------|
| [librephotos-frontend](https://github.com/LibrePhotos/librephotos-frontend) | React/TypeScript web frontend |
| [librephotos-docker](https://github.com/LibrePhotos/librephotos-docker) | Docker Compose deployment configurations |
| [librephotos.docs](https://github.com/LibrePhotos/librephotos.docs) | Documentation website source |
| [librephotos-mobile](https://github.com/LibrePhotos/librephotos-mobile) | Mobile application |

## License

This project is licensed under the [MIT License](LICENSE).

[discord]: https://discord.gg/xwRvtSDGWb


================================================
FILE: api/__init__.py
================================================
default_app_config = "api.apps.ApiConfig"


================================================
FILE: api/admin.py
================================================
from django.contrib import admin
from django_q.tasks import AsyncTask

from .models import (
    AlbumAuto,
    AlbumDate,
    AlbumPlace,
    AlbumThing,
    AlbumUser,
    Cluster,
    Face,
    File,
    LongRunningJob,
    Person,
    Photo,
    User,
    Thumbnail,
)


def deduplicate_faces_function(queryset):
    for photo in queryset:
        # Get all faces in the photo
        faces = Face.objects.filter(photo=photo)
        # Check if there are any faces which have similar bounding boxes
        for face in faces:
            margin = int((face.location_right - face.location_left) * 0.05)
            similar_faces = Face.objects.filter(
                photo=photo,
                location_top__lte=face.location_top + margin,
                location_top__gte=face.location_top - margin,
                location_right__lte=face.location_right + margin,
                location_right__gte=face.location_right - margin,
                location_bottom__lte=face.location_bottom + margin,
                location_bottom__gte=face.location_bottom - margin,
                location_left__lte=face.location_left + margin,
                location_left__gte=face.location_left - margin,
            )
            if len(similar_faces) > 1:
                # Divide between faces with a person label and faces without
                faces_with_person_label = []
                faces_without_person_label = []
                for similar_face in similar_faces:
                    if similar_face.person:
                        faces_with_person_label.append(similar_face)
                    else:
                        faces_without_person_label.append(similar_face)
                # If there are faces with a person label, keep the first one and delete the rest
                for similar_face in faces_with_person_label[1:]:
                    similar_face.delete()
                # If there are faces with a person label, delete all of them
                if len(faces_with_person_label) > 0:
                    for similar_face in faces_without_person_label:
                        similar_face.delete()
                # Otherwise, keep the first face and delete the rest
                else:
                    for similar_face in faces_without_person_label[1:]:
                        similar_face.delete()


@admin.register(Face)
class FaceAdmin(admin.ModelAdmin):
    list_display = (
        "id",
        "cluster_person",
        "cluster_probability",
        "classification_person",
        "cluster",
        "photo",
        "person",
    )
    list_filter = ("person", "cluster")


@admin.register(Photo)
class PhotoAdmin(admin.ModelAdmin):
    actions = ["deduplicate_faces"]
    list_display = [
        "image_hash",
        "owner",
        "main_file",
        "last_modified",
        "added_on",
        "size",
    ]
    list_filter = ["owner"]

    def deduplicate_faces(self, request, queryset):
        AsyncTask(
            deduplicate_faces_function,
            queryset=queryset,
        ).run()


@admin.register(Thumbnail)
class ThumbnailAdmin(admin.ModelAdmin):
    list_display = ["photo", "aspect_ratio"]
    raw_id_fields = ["photo"]


admin.site.register(Person)
admin.site.register(AlbumAuto)
admin.site.register(AlbumUser)
admin.site.register(AlbumThing)
admin.site.register(AlbumDate)
admin.site.register(AlbumPlace)
admin.site.register(Cluster)
admin.site.register(LongRunningJob)
admin.site.register(File)
admin.site.register(User)


================================================
FILE: api/all_tasks.py
================================================
import io
import os
import zipfile

from django.conf import settings
from django.utils import timezone
from django_q.tasks import AsyncTask, schedule

from api import util
from api.models.long_running_job import LongRunningJob


def create_download_job(job_type, user, photos, filename):
    lrj = LongRunningJob.create_job(
        user=user,
        job_type=job_type,
    )
    if job_type == LongRunningJob.JOB_DOWNLOAD_PHOTOS:
        AsyncTask(
            zip_photos_task, job_id=lrj.job_id, user=user, photos=photos, filename=filename
        ).run()

    return lrj.job_id


def zip_photos_task(job_id, user, photos, filename):
    lrj = LongRunningJob.objects.get(job_id=job_id)
    lrj.start()
    count = len(photos)
    lrj.update_progress(current=0, target=count)
    output_directory = os.path.join(settings.MEDIA_ROOT, "zip")
    zip_file_name = filename
    done_count = 0
    try:
        if not os.path.exists(output_directory):
            os.mkdir(output_directory)
        mf = io.BytesIO()
        files_added = {}  # Track files by path to avoid duplicates

        for photo in photos:
            done_count = done_count + 1

            # Collect all files for this photo.
            # NOTE: main_file is not guaranteed to be included in Photo.files.
            all_files = []
            if getattr(photo, "main_file", None) is not None:
                all_files.append(photo.main_file)
            all_files.extend(list(photo.files.all()))

            # Back-compat: some datasets may still represent RAW+JPEG / Live Photo variants
            # as deprecated stacks. Include those stack members' files too.
            try:
                variant_stacks = photo.stacks.filter(
                    stack_type__in=["raw_jpeg", "live_photo"]
                ).prefetch_related("photos", "photos__files", "photos__main_file")
                for stack in variant_stacks:
                    for stack_photo in stack.photos.all():
                        if getattr(stack_photo, "main_file", None) is not None:
                            all_files.append(stack_photo.main_file)
                        all_files.extend(list(stack_photo.files.all()))
            except Exception:
                # If stacks aren't available for some reason, just proceed with variants.
                pass

            # Include embedded media variants for every collected file (not just main_file)
            for file_obj in list(all_files):
                try:
                    if file_obj and file_obj.embedded_media.exists():
                        all_files.extend(list(file_obj.embedded_media.all()))
                except Exception:
                    continue
            
            # Add each file to the zip
            for file_obj in all_files:
                if not file_obj or not file_obj.path:
                    continue
                    
                # Skip if file doesn't exist on disk
                if not os.path.exists(file_obj.path):
                    util.logger.warning(f"File not found, skipping: {file_obj.path}")
                    continue
                
                # Skip if already added (avoid duplicates)
                if file_obj.path in files_added:
                    continue
                
                file_name = os.path.basename(file_obj.path)
                
                # Handle duplicate filenames in the zip
                if file_name in files_added.values():
                    # Find a unique name by prepending a counter
                    counter = 1
                    base_name, ext = os.path.splitext(file_name)
                    while f"{base_name}_{counter}{ext}" in files_added.values():
                        counter += 1
                    file_name = f"{base_name}_{counter}{ext}"
                
                files_added[file_obj.path] = file_name
                
                with zipfile.ZipFile(mf, mode="a", compression=zipfile.ZIP_DEFLATED) as zf:
                    zf.write(file_obj.path, arcname=file_name)
            
            lrj.update_progress(current=done_count, target=count)
        
        with open(os.path.join(output_directory, zip_file_name), "wb") as output_file:
            output_file.write(mf.getvalue())

    except Exception as e:
        util.logger.error(f"Error while converting files to zip: {e}")

    lrj.complete()
    # scheduling a task to delete the zip file after a day
    execution_time = timezone.now() + timezone.timedelta(days=1)
    schedule("api.all_tasks.delete_zip_file", filename, next_run=execution_time)
    return os.path.join(output_directory, zip_file_name)


def delete_zip_file(filename):
    file_path = os.path.join(settings.MEDIA_ROOT, "zip", filename)
    try:
        if not os.path.exists(file_path):
            util.logger.error(f"Error while deleting file not found at : {file_path}")
            return
        else:
            os.remove(file_path)
            util.logger.info(f"file deleted sucessfully at path : {file_path}")
            return

    except Exception as e:
        util.logger.error(f"Error while deleting file: {e}")
        return e


================================================
FILE: api/api_util.py
================================================
import os
import random
import stat

from api.models import (
    LongRunningJob,
    Photo,
)
from api.serializers.job import LongRunningJobSerializer
from api.util import logger


def get_current_job():
    job_detail = None
    running_job = (
        LongRunningJob.objects.filter(finished=False).order_by("-started_at").first()
    )
    if running_job:
        job_detail = LongRunningJobSerializer(running_job).data
    return job_detail


def shuffle(list):
    random.shuffle(list)
    return list


def is_hidden(filepath):
    name = os.path.basename(os.path.abspath(filepath))
    return name.startswith(".") or has_hidden_attribute(filepath)


def has_hidden_attribute(filepath):
    try:
        return bool(os.stat(filepath).st_file_attributes & stat.FILE_ATTRIBUTE_HIDDEN)
    except Exception:
        return False


def path_to_dict(path, recurse=2):
    d = {"title": os.path.basename(path), "absolute_path": path}
    if recurse > 0:
        d["children"] = [
            path_to_dict(os.path.join(path, x), recurse - 1)
            for x in os.scandir(path)
            if os.path.isdir(os.path.join(path, x))
            and not is_hidden(os.path.join(path, x))
        ]
    else:
        d["children"] = []
    # sort children by title alphabetically (case insensitive)
    d["children"] = sorted(d["children"], key=lambda k: k["title"].lower())
    return d


def get_search_term_examples(user):
    default_search_terms = [
        "for people",
        "for places",
        "for things",
        "for time",
        "for file path or file name",
    ]

    possible_ids = list(
        Photo.objects.filter(owner=user)
        .exclude(caption_instance__captions_json={})
        .exclude(caption_instance__captions_json__isnull=True)[:1000]
        .values_list("image_hash", flat=True)
    )
    if len(possible_ids) > 99:
        possible_ids = random.choices(possible_ids, k=100)
    logger.info(f"{len(possible_ids)} possible ids")
    try:
        samples = (
            Photo.objects.filter(owner=user)
            .exclude(caption_instance__captions_json={})
            .exclude(caption_instance__captions_json__isnull=True)
            .filter(image_hash__in=possible_ids)
            .prefetch_related("faces")
            .prefetch_related("faces__person")
            .prefetch_related("caption_instance")
            .all()
        )
    except ValueError:
        return default_search_terms

    search_data = []
    search_terms = default_search_terms
    logger.info("Getting search terms for user %s", user.id)
    logger.info("Found %s photos", len(samples))
    for p in samples:
        faces = p.faces.all()
        terms_loc = ""
        if (
            p.geolocation_json
            and p.geolocation_json != {}
            and "features" in p.geolocation_json
        ):
            terms_loc = [
                f["text"]
                for f in p.geolocation_json["features"][-5:]
                if "text" in f and not f["text"].isdigit()
            ]
        terms_time = ""
        if p.exif_timestamp:
            terms_time = [str(p.exif_timestamp.year)]
        terms_people = []
        if p.faces.count() > 0:
            terms_people = [
                f.person.name.split(" ")[0] if f.person else "" for f in faces
            ]
        terms_things = ""
        if (
            p.caption_instance
            and p.caption_instance.captions_json
            and p.caption_instance.captions_json.get("places365") is not None
        ):
            terms_things = p.caption_instance.captions_json["places365"]["categories"]

        terms = {
            "loc": terms_loc,
            "time": terms_time,
            "people": terms_people,
            "things": terms_things,
        }

        search_data.append(terms)
        search_terms = []
        for datum in search_data:
            term_time = ""
            term_thing = ""
            term_loc = ""
            term_people = ""
            if datum["loc"]:
                term_loc = random.choice(datum["loc"])
                search_terms.append(term_loc)
            if datum["time"]:
                term_time = random.choice(datum["time"])
                search_terms.append(term_time)
            if datum["things"]:
                term_thing = random.choice(datum["things"])
                search_terms.append(term_thing)
            if datum["people"]:
                term_people = random.choice(datum["people"])
                search_terms.append(term_people)

            search_term_loc_people = " ".join(shuffle([term_loc, term_people]))
            if random.random() > 0.3:
                search_terms.append(search_term_loc_people)

            search_term_time_people = " ".join(shuffle([term_time, term_people]))
            if random.random() > 0.3:
                search_terms.append(search_term_time_people)

            search_term_people_thing = " ".join(shuffle([term_people, term_thing]))
            if random.random() > 0.9:
                search_terms.append(search_term_people_thing)

            search_term_all = " ".join(
                shuffle([term_loc, term_people, term_time, term_thing])
            )
            if random.random() > 0.95:
                search_terms.append(search_term_all)

            search_term_loc_time = " ".join(shuffle([term_loc, term_time]))
            if random.random() > 0.3:
                search_terms.append(search_term_loc_time)

            search_term_loc_thing = " ".join(shuffle([term_loc, term_thing]))
            if random.random() > 0.9:
                search_terms.append(search_term_loc_thing)

            search_term_time_thing = " ".join(shuffle([term_time, term_thing]))
            if random.random() > 0.9:
                search_terms.append(search_term_time_thing)

    return list(filter(lambda x: len(x), set([x.strip() for x in search_terms])))


================================================
FILE: api/apps.py
================================================
from django.apps import AppConfig


class ApiConfig(AppConfig):
    name = "api"
    verbose_name = "LibrePhotos"


================================================
FILE: api/autoalbum.py
================================================
from datetime import datetime, timedelta

import numpy as np
import pytz
from django.db.models import Q

from api.models import (
    AlbumAuto,
    AlbumDate,
    AlbumPlace,
    AlbumThing,
    AlbumUser,
    Face,
    File,
    LongRunningJob,
    Photo,
)
from api.util import logger


def regenerate_event_titles(user, job_id):
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_GENERATE_AUTO_ALBUM_TITLES,
        job_id=job_id,
    )
    try:
        aus = AlbumAuto.objects.filter(owner=user).prefetch_related("photos")
        target_count = len(aus)
        for idx, au in enumerate(aus):
            logger.info(f"job {job_id}: {idx}")
            au._generate_title()
            au.save()
            lrj.update_progress(current=idx + 1, target=target_count)

        lrj.complete()
        logger.info(f"job {job_id}: updated lrj entry to db")

    except Exception as e:
        logger.exception("An error occurred")
        lrj.fail(error=e)

    return 1


def generate_event_albums(user, job_id):
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_GENERATE_AUTO_ALBUMS,
        job_id=job_id,
    )

    try:
        photos = (
            Photo.objects.filter(Q(owner=user))
            .exclude(Q(exif_timestamp=None))
            .only("exif_timestamp")
        )

        def group(photos, dt=timedelta(hours=6)):
            photos_with_timestamp = sorted(photos, key=lambda p: p.exif_timestamp)
            groups = []
            for idx, photo in enumerate(photos_with_timestamp):
                if len(groups) == 0:
                    groups.append([])
                    groups[-1].append(photo)
                # Photos are sorted by timestamp, so we can just check the last photo of the last group
                # to see if it is within the time delta
                elif photo.exif_timestamp - groups[-1][-1].exif_timestamp < dt:
                    groups[-1].append(photo)
                # If the photo is not within the time delta, we create a new group
                else:
                    groups.append([])
                    groups[-1].append(photo)
            return groups

        # Group images that are on the same 1 day and 12 hours interval
        groups = group(photos, dt=timedelta(days=1, hours=12))
        target_count = len(groups)
        logger.info(
            f"job {job_id}: made {target_count} groups out of {len(photos)} images"
        )

        album_locations = []

        date_format = "%Y:%m:%d %H:%M:%S"
        for idx, group in enumerate(groups):
            key = group[0].exif_timestamp - timedelta(hours=11, minutes=59)
            lastKey = group[-1].exif_timestamp + timedelta(hours=11, minutes=59)
            logger.info(str(key.date) + " - " + str(lastKey.date))
            logger.info(
                f"job {job_id}: processing auto album with date: "
                + key.strftime(date_format)
                + " to "
                + lastKey.strftime(date_format)
            )
            items = group
            if len(group) >= 2:
                qs = AlbumAuto.objects.filter(owner=user).filter(
                    timestamp__range=(key, lastKey)
                )
                if qs.count() == 0:
                    album = AlbumAuto(
                        created_on=datetime.utcnow().replace(tzinfo=pytz.utc),
                        owner=user,
                    )
                    album.timestamp = key
                    album.save()

                    logger.info(f"job {job_id}: generate auto album {album.id}")
                    locs = []
                    for item in items:
                        album.photos.add(item)
                        item.save()
                        if item.exif_gps_lat and item.exif_gps_lon:
                            locs.append([item.exif_gps_lat, item.exif_gps_lon])
                    if len(locs) > 0:
                        album_location = np.mean(np.array(locs), 0)
                        album_locations.append(album_location)
                        album.gps_lat = album_location[0]
                        album.gps_lon = album_location[1]
                    else:
                        album_locations.append([])
                    album._generate_title()
                    album.save()
                    continue
                if qs.count() == 1:
                    album = qs.first()
                    logger.info(f"job {job_id}: update auto album {album.id}")
                    for item in items:
                        if item in album.photos.all():
                            continue
                        album.photos.add(item)
                        item.save()
                    album._generate_title()
                    album.save()
                    continue
                if qs.count() > 1:
                    # To-Do: Merge both auto albums
                    logger.info(
                        f"job {job_id}: found multiple auto albums for date {key.strftime(date_format)}"
                    )
                    continue

            lrj.update_progress(current=idx + 1, target=target_count)

        lrj.complete()

    except Exception as e:
        logger.exception("An error occurred")
        lrj.fail(error=e)

    return 1


# To-Do: This does not belong here
def delete_missing_photos(user, job_id):
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_DELETE_MISSING_PHOTOS,
        job_id=job_id,
    )
    try:
        missing_photos = Photo.objects.filter(
            Q(owner=user) & Q(files=None) | Q(main_file=None)
        )
        for missing_photo in missing_photos:
            album_dates = AlbumDate.objects.filter(photos=missing_photo)
            for album_date in album_dates:
                album_date.photos.remove(missing_photo)
            album_things = AlbumThing.objects.filter(photos=missing_photo)
            for album_thing in album_things:
                album_thing.photos.remove(missing_photo)
            album_places = AlbumPlace.objects.filter(photos=missing_photo)
            for album_place in album_places:
                album_place.photos.remove(missing_photo)
            album_users = AlbumUser.objects.filter(photos=missing_photo)
            for album_user in album_users:
                album_user.photos.remove(missing_photo)
            faces = Face.objects.filter(photo=missing_photo)
            faces.delete()
            # To-Do: Remove thumbnails

        missing_photos.delete()

        missing_files = File.objects.filter(Q(hash__endswith=user) & Q(missing=True))
        missing_files.delete()

        lrj.complete()
    except Exception as e:
        logger.exception("An error occurred")
        lrj.fail(error=e)
    return 1


================================================
FILE: api/background_tasks.py
================================================
from tqdm import tqdm
from django.db import models

from api.models import Photo
from api.models.photo_caption import PhotoCaption
from api.util import logger


def generate_captions(overwrite=False):
    if overwrite:
        photos = Photo.objects.all()
    else:
        # Find photos that don't have search captions in PhotoSearch model
        photos = Photo.objects.filter(
            models.Q(search_instance__isnull=True)
            | models.Q(search_instance__search_captions__isnull=True)
        )
    logger.info("%d photos to be processed for caption generation" % photos.count())
    for photo in photos:
        logger.info("generating captions for %s" % photo.main_file.path)
        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.generate_tag_captions()
        photo.save()


def geolocate(overwrite=False):
    if overwrite:
        photos = Photo.objects.all()
    else:
        photos = Photo.objects.filter(geolocation_json={})
    logger.info("%d photos to be geolocated" % photos.count())
    for photo in photos:
        try:
            logger.info("geolocating %s" % photo.main_file.path)
            photo._geolocate()
            photo._add_location_to_album_dates()
        except Exception:
            logger.exception("could not geolocate photo: %s", photo)


def add_photos_to_album_things():
    photos = Photo.objects.all()
    for photo in tqdm(photos):
        photo._add_to_album_place()


================================================
FILE: api/batch_jobs.py
================================================
import os

from django.db.models import Q

from api import util
from api.image_similarity import build_image_similarity_index
from api.models.long_running_job import LongRunningJob
from api.models.photo import Photo
from api.semantic_search import create_clip_embeddings


def batch_calculate_clip_embedding(user):
    import torch

    lrj = LongRunningJob.create_job(
        user=user,
        job_type=LongRunningJob.JOB_CALCULATE_CLIP_EMBEDDINGS,
        start_now=True,
    )

    count = Photo.objects.filter(
        Q(owner=user) & Q(clip_embeddings__isnull=True)
    ).count()
    lrj.update_progress(current=0, target=count)
    
    if not torch.cuda.is_available():
        num_threads = 1
        torch.set_num_threads(num_threads)
        os.environ["OMP_NUM_THREADS"] = str(num_threads)
    else:
        torch.multiprocessing.set_start_method("spawn", force=True)

    BATCH_SIZE = 64
    util.logger.info(f"Using threads: {torch.get_num_threads()}")

    done_count = 0
    while done_count < count:
        try:
            objs = list(
                Photo.objects.filter(Q(owner=user) & Q(clip_embeddings__isnull=True))[
                    :BATCH_SIZE
                ]
            )
            done_count += len(objs)

            if len(objs) == 0:
                break
            valid_objs = []
            for obj in objs:
                # Thumbnail could have been deleted
                if obj.thumbnail.thumbnail_big and os.path.exists(
                    obj.thumbnail.thumbnail_big.path
                ):
                    valid_objs.append(obj)
            imgs = list(map(lambda obj: obj.thumbnail.thumbnail_big.path, valid_objs))
            if len(valid_objs) == 0:
                continue

            imgs_emb, magnitudes = create_clip_embeddings(imgs)

            for obj, img_emb, magnitude in zip(valid_objs, imgs_emb, magnitudes):
                obj.clip_embeddings = img_emb.tolist()
                obj.clip_embeddings_magnitude = magnitude
                obj.save()
        except Exception as e:
            util.logger.error(f"Error calculating clip embeddings: {e}")

        lrj.update_progress(current=done_count, target=count)

    build_image_similarity_index(user)
    lrj.complete()


================================================
FILE: api/burst_detection_rules.py
================================================
"""
Burst detection rules module for grouping photos taken in rapid succession.

This module provides a rules-based system for detecting burst sequences,
following the same pattern as date_time_extractor.py. Rules are stored
as JSON in each user's profile and applied sequentially.

Rules are divided into two categories:
- Hard criteria: Deterministic detection based on EXIF data and filename patterns
  (e.g., BurstMode tag, SequenceNumber, filename patterns like IMG_001_BURST001)
- Soft criteria: Estimation based on timestamp proximity and visual similarity
  (e.g., photos within 2 seconds of each other from the same camera)

By default, only hard criteria rules are enabled.
"""

import json
import os
import re
from datetime import timedelta

from api.metadata.tags import Tags
from api.util import logger


class BurstRuleTypes:
    """Types of burst detection rules."""

    # Hard criteria (deterministic)
    EXIF_BURST_MODE = "exif_burst_mode"
    EXIF_SEQUENCE_NUMBER = "exif_sequence_number"
    FILENAME_PATTERN = "filename_pattern"

    # Soft criteria (estimation)
    TIMESTAMP_PROXIMITY = "timestamp_proximity"
    VISUAL_SIMILARITY = "visual_similarity"


class BurstRuleCategory:
    """Categories for burst detection rules."""

    HARD = "hard"  # Deterministic (EXIF, filenames)
    SOFT = "soft"  # Estimation (timestamps, visual similarity)


# Predefined filename patterns for burst detection
BURST_FILENAME_PATTERNS = {
    # Pattern name: (regex, description)
    "burst_suffix": (
        r"_BURST\d+",
        "Files with _BURST followed by numbers (e.g., IMG_001_BURST001.jpg)",
    ),
    "sequence_suffix": (
        r"_\d{3,}$",
        "Files ending with 3+ digit sequence number (e.g., IMG_001.jpg, IMG_002.jpg)",
    ),
    "bracketed_sequence": (
        r"\(\d+\)$",
        "Files with bracketed numbers at end (e.g., photo (1).jpg, photo (2).jpg)",
    ),
    "samsung_burst": (r"_\d{3}_COVER", "Samsung burst cover images"),
    "iphone_burst": (r"IMG_\d{4}_\d+", "iPhone burst sequence pattern"),
}


class BurstDetectionRule:
    """
    A rule for detecting burst sequences.

    Each rule has:
    - id: Unique identifier
    - name: Human-readable name
    - rule_type: One of BurstRuleTypes
    - category: 'hard' or 'soft' (for UI grouping)
    - enabled: Whether the rule is active
    - is_default: Whether this is a default rule
    - Type-specific parameters (e.g., interval_ms for timestamp_proximity)

    Additionally, each rule can have conditions:
    - condition_path: Regex to match full path
    - condition_filename: Regex to match filename
    - condition_exif: Format: "TAG_NAME//regex_pattern"
    """

    def __init__(self, params):
        self.id = params.get("id")
        self.name = params.get("name", "Unnamed rule")
        self.rule_type = params["rule_type"]
        self.category = params.get("category", BurstRuleCategory.HARD)
        self.enabled = params.get("enabled", True)
        self.is_default = params.get("is_default", True)
        self.params = params

    def get_required_exif_tags(self):
        """Return set of EXIF tags needed by this rule."""
        tags = set()

        # Add condition tag if present
        condition_exif = self.params.get("condition_exif")
        if condition_exif:
            tag_name = condition_exif.split("//", maxsplit=1)[0]
            tags.add(tag_name)

        # Add rule-specific tags
        if self.rule_type == BurstRuleTypes.EXIF_BURST_MODE:
            tags.add(Tags.BURST_MODE)
            tags.add(Tags.CONTINUOUS_DRIVE)
        elif self.rule_type == BurstRuleTypes.EXIF_SEQUENCE_NUMBER:
            tags.add(Tags.SEQUENCE_NUMBER)
            tags.add(Tags.IMAGE_NUMBER)
            tags.add(Tags.SUBSEC_TIME_ORIGINAL)

        return tags

    def _check_condition_path(self, path):
        """Check if path matches condition_path regex."""
        condition = self.params.get("condition_path")
        if condition:
            return re.search(condition, path) is not None
        return True

    def _check_condition_filename(self, path):
        """Check if filename matches condition_filename regex."""
        condition = self.params.get("condition_filename")
        if condition:
            filename = os.path.basename(path)
            return re.search(condition, filename) is not None
        return True

    def _check_condition_exif(self, exif_tags):
        """Check if EXIF tag value matches condition_exif pattern."""
        condition = self.params.get("condition_exif")
        if not condition:
            return True

        parts = condition.split("//", maxsplit=1)
        if len(parts) != 2:
            logger.warning(f"Invalid condition_exif format: {condition}")
            return False

        tag_name, pattern = parts
        tag_value = exif_tags.get(tag_name)
        if not tag_value:
            return False
        return re.search(pattern, str(tag_value)) is not None

    def check_conditions(self, path, exif_tags):
        """Check all conditions for this rule."""
        return (
            self._check_condition_path(path)
            and self._check_condition_filename(path)
            and self._check_condition_exif(exif_tags)
        )

    def is_burst_photo(self, photo, exif_tags):
        """
        Check if a photo is part of a burst sequence according to this rule.

        Args:
            photo: Photo model instance
            exif_tags: Dict of EXIF tag name -> value

        Returns:
            Tuple of (is_burst: bool, group_key: str or None)
            group_key can be used to group photos into the same burst
        """
        if not self.enabled:
            return False, None

        path = photo.main_file.path if photo.main_file else ""

        if not self.check_conditions(path, exif_tags):
            return False, None

        if self.rule_type == BurstRuleTypes.EXIF_BURST_MODE:
            return self._check_exif_burst_mode(photo, exif_tags)
        elif self.rule_type == BurstRuleTypes.EXIF_SEQUENCE_NUMBER:
            return self._check_exif_sequence_number(photo, exif_tags)
        elif self.rule_type == BurstRuleTypes.FILENAME_PATTERN:
            return self._check_filename_pattern(photo, exif_tags)
        else:
            # Soft rules don't use is_burst_photo - they use group_by_proximity
            return False, None

    def _check_exif_burst_mode(self, photo, exif_tags):
        """Check if EXIF BurstMode or ContinuousDrive indicates burst."""
        burst_mode = exif_tags.get(Tags.BURST_MODE)
        continuous_drive = exif_tags.get(Tags.CONTINUOUS_DRIVE)

        # BurstMode: 1 = On (Canon, etc.)
        if burst_mode and str(burst_mode) in ("1", "On", "True", "Yes"):
            # Group by timestamp (rounded to second) + camera model
            camera = exif_tags.get(Tags.CAMERA, "unknown")
            timestamp = photo.exif_timestamp
            if timestamp:
                group_key = f"burst_{camera}_{timestamp.strftime('%Y%m%d_%H%M%S')}"
                return True, group_key
            return True, None

        # ContinuousDrive: Continuous, etc.
        if continuous_drive and continuous_drive.lower() in ("continuous", "on", "1"):
            camera = exif_tags.get(Tags.CAMERA, "unknown")
            timestamp = photo.exif_timestamp
            if timestamp:
                group_key = f"burst_{camera}_{timestamp.strftime('%Y%m%d_%H%M%S')}"
                return True, group_key
            return True, None

        return False, None

    def _check_exif_sequence_number(self, photo, exif_tags):
        """Check if photo has sequence number indicating burst."""
        sequence_num = exif_tags.get(Tags.SEQUENCE_NUMBER)

        # If we have a sequence number, it's likely part of a burst
        if sequence_num is not None:
            try:
                int(sequence_num)  # Validate it's a valid number
                # Sequence numbers suggest burst
                # Group by directory + base timestamp
                camera = exif_tags.get(Tags.CAMERA, "unknown")
                timestamp = photo.exif_timestamp
                if timestamp:
                    # Round to same second for grouping
                    group_key = f"seq_{camera}_{timestamp.strftime('%Y%m%d_%H%M%S')}"
                    return True, group_key
                return True, None
            except (ValueError, TypeError):
                pass

        return False, None

    def _check_filename_pattern(self, photo, exif_tags):
        """Check if filename matches burst pattern."""
        if not photo.main_file:
            return False, None

        filename = os.path.basename(photo.main_file.path)
        basename = os.path.splitext(filename)[0]

        # Get pattern type from params, default to checking all patterns
        pattern_type = self.params.get("pattern_type", "all")
        custom_pattern = self.params.get("custom_pattern")

        if custom_pattern:
            if re.search(custom_pattern, basename):
                # Extract base name for grouping (remove trailing numbers/burst suffix)
                base = re.sub(r"(_BURST\d+|_\d{3,}|\(\d+\))$", "", basename)
                directory = os.path.dirname(photo.main_file.path)
                group_key = f"filename_{directory}_{base}"
                return True, group_key
        elif pattern_type == "all":
            # Check all predefined patterns
            for pattern_name, (pattern, _) in BURST_FILENAME_PATTERNS.items():
                if re.search(pattern, basename, re.IGNORECASE):
                    base = re.sub(
                        r"(_BURST\d+|_\d{3,}|\(\d+\)|_COVER)$",
                        "",
                        basename,
                        flags=re.IGNORECASE,
                    )
                    directory = os.path.dirname(photo.main_file.path)
                    group_key = f"filename_{directory}_{base}"
                    return True, group_key
        else:
            # Check specific pattern
            if pattern_type in BURST_FILENAME_PATTERNS:
                pattern, _ = BURST_FILENAME_PATTERNS[pattern_type]
                if re.search(pattern, basename, re.IGNORECASE):
                    base = re.sub(
                        r"(_BURST\d+|_\d{3,}|\(\d+\)|_COVER)$",
                        "",
                        basename,
                        flags=re.IGNORECASE,
                    )
                    directory = os.path.dirname(photo.main_file.path)
                    group_key = f"filename_{directory}_{base}"
                    return True, group_key

        return False, None


def check_filename_pattern(photo, pattern_type="any"):
    """
    Check if a photo's filename matches a burst pattern.

    Standalone function for testing and external use.

    Args:
        photo: Photo model instance with main_file
        pattern_type: "any" to check all patterns, or specific pattern name
                     (e.g., "burst_suffix", "sequence_suffix", "bracketed_sequence",
                      "samsung_burst", "iphone_burst")

    Returns:
        Tuple of (matches: bool, group_key: str or None)
        group_key can be used to group photos into the same burst
    """
    if not photo.main_file:
        return False, None

    filename = os.path.basename(photo.main_file.path)
    basename = os.path.splitext(filename)[0]
    directory = os.path.dirname(photo.main_file.path)

    if pattern_type == "any" or pattern_type == "all":
        # Check all predefined patterns
        for pattern_name, (pattern, _) in BURST_FILENAME_PATTERNS.items():
            if re.search(pattern, basename, re.IGNORECASE):
                base = re.sub(
                    r"(_BURST\d+|_\d{3,}|\(\d+\)|_COVER)$",
                    "",
                    basename,
                    flags=re.IGNORECASE,
                )
                group_key = f"filename_{directory}_{base}"
                return True, group_key
    else:
        # Check specific pattern
        if pattern_type in BURST_FILENAME_PATTERNS:
            pattern, _ = BURST_FILENAME_PATTERNS[pattern_type]
            if re.search(pattern, basename, re.IGNORECASE):
                base = re.sub(
                    r"(_BURST\d+|_\d{3,}|\(\d+\)|_COVER)$",
                    "",
                    basename,
                    flags=re.IGNORECASE,
                )
                group_key = f"filename_{directory}_{base}"
                return True, group_key

    return False, None


def group_photos_by_timestamp(photos, interval_ms=2000, require_same_camera=True):
    """
    Group photos by timestamp proximity (soft criterion).

    Args:
        photos: QuerySet of Photo objects ordered by exif_timestamp
        interval_ms: Maximum milliseconds between consecutive burst shots
        require_same_camera: If True, only group photos from same camera

    Returns:
        List of lists, each inner list is a group of Photo objects
    """
    if not photos:
        return []

    interval = timedelta(milliseconds=interval_ms)
    groups = []
    current_group = []
    prev_photo = None
    prev_camera = None

    for photo in photos:
        if not photo.exif_timestamp:
            continue

        # Get camera info for same-camera check
        camera = None
        if require_same_camera and hasattr(photo, "metadata") and photo.metadata:
            camera = f"{photo.metadata.camera_make or ''}_{photo.metadata.camera_model or ''}"

        if prev_photo is None:
            current_group = [photo]
            prev_photo = photo
            prev_camera = camera
            continue

        # Check time difference
        time_diff = photo.exif_timestamp - prev_photo.exif_timestamp

        # Check if same camera (if required)
        same_camera = True
        if require_same_camera and camera and prev_camera:
            same_camera = camera == prev_camera

        if time_diff <= interval and same_camera:
            # Part of same burst
            current_group.append(photo)
        else:
            # End of current burst, save if we have a group
            if len(current_group) >= 2:
                groups.append(current_group)
            # Start new group
            current_group = [photo]

        prev_photo = photo
        prev_camera = camera

    # Don't forget the last group
    if len(current_group) >= 2:
        groups.append(current_group)

    return groups


def group_photos_by_visual_similarity(photos, similarity_threshold=15):
    """
    Group photos by visual similarity (soft criterion).

    Uses perceptual hash comparison to group visually similar photos.

    Args:
        photos: List of Photo objects
        similarity_threshold: Maximum hamming distance (lower = more similar)

    Returns:
        List of lists, each inner list is a group of visually similar Photo objects
    """
    from api.perceptual_hash import hamming_distance

    if not photos:
        return []

    # Filter photos with perceptual hashes
    photos_with_hash = [p for p in photos if p.perceptual_hash]

    if len(photos_with_hash) < 2:
        return []

    # Simple clustering: group consecutive similar photos
    groups = []
    current_group = [photos_with_hash[0]]

    for i in range(1, len(photos_with_hash)):
        photo = photos_with_hash[i]
        prev_photo = photos_with_hash[i - 1]

        distance = hamming_distance(photo.perceptual_hash, prev_photo.perceptual_hash)

        if distance <= similarity_threshold:
            current_group.append(photo)
        else:
            if len(current_group) >= 2:
                groups.append(current_group)
            current_group = [photo]

    if len(current_group) >= 2:
        groups.append(current_group)

    return groups


# Default rules configuration
# Hard criteria rules (enabled by default)
DEFAULT_HARD_RULES = [
    {
        "id": 1,
        "name": "EXIF Burst Mode Tag",
        "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
        "category": BurstRuleCategory.HARD,
        "enabled": True,
        "is_default": True,
        "description": "Detects photos where camera was in burst mode (using MakerNotes:BurstMode or MakerNotes:ContinuousDrive EXIF tags)",
    },
    {
        "id": 2,
        "name": "EXIF Sequence Number",
        "rule_type": BurstRuleTypes.EXIF_SEQUENCE_NUMBER,
        "category": BurstRuleCategory.HARD,
        "enabled": True,
        "is_default": True,
        "description": "Groups photos by EXIF sequence number (MakerNotes:SequenceNumber) taken at the same time",
    },
    {
        "id": 3,
        "name": "Filename Burst Pattern",
        "rule_type": BurstRuleTypes.FILENAME_PATTERN,
        "category": BurstRuleCategory.HARD,
        "enabled": True,
        "is_default": True,
        "pattern_type": "all",
        "description": "Detects burst sequences from filename patterns (e.g., IMG_001_BURST001, photo (1), photo (2))",
    },
]

# Soft criteria rules (disabled by default)
DEFAULT_SOFT_RULES = [
    {
        "id": 101,
        "name": "Timestamp Proximity",
        "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
        "category": BurstRuleCategory.SOFT,
        "enabled": False,
        "is_default": True,
        "interval_ms": 2000,
        "require_same_camera": True,
        "description": "Groups photos taken within a short time interval (configurable, default 2 seconds)",
    },
    {
        "id": 102,
        "name": "Visual Similarity",
        "rule_type": BurstRuleTypes.VISUAL_SIMILARITY,
        "category": BurstRuleCategory.SOFT,
        "enabled": False,
        "is_default": True,
        "similarity_threshold": 15,
        "description": "Groups visually similar consecutive photos using perceptual hash comparison",
    },
]

# Other available rules (not included by default)
OTHER_RULES = [
    {
        "id": 4,
        "name": "Filename Burst Suffix Only",
        "rule_type": BurstRuleTypes.FILENAME_PATTERN,
        "category": BurstRuleCategory.HARD,
        "enabled": False,
        "is_default": False,
        "pattern_type": "burst_suffix",
        "description": "Only detect files with explicit _BURST suffix in filename",
    },
    {
        "id": 5,
        "name": "Custom Filename Pattern",
        "rule_type": BurstRuleTypes.FILENAME_PATTERN,
        "category": BurstRuleCategory.HARD,
        "enabled": False,
        "is_default": False,
        "pattern_type": "custom",
        "custom_pattern": "",
        "description": "Use a custom regex pattern to match burst filenames",
    },
    {
        "id": 103,
        "name": "Timestamp Proximity (Loose)",
        "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
        "category": BurstRuleCategory.SOFT,
        "enabled": False,
        "is_default": False,
        "interval_ms": 5000,
        "require_same_camera": False,
        "description": "Groups photos taken within 5 seconds, regardless of camera",
    },
]


def get_default_burst_detection_rules():
    """Get default burst detection rules as JSON-serializable list."""
    return DEFAULT_HARD_RULES + DEFAULT_SOFT_RULES


def get_all_predefined_burst_rules():
    """Get all predefined burst detection rules (default + optional)."""
    return DEFAULT_HARD_RULES + DEFAULT_SOFT_RULES + OTHER_RULES


def _as_json(configs):
    """Convert rule configs to JSON string."""
    return json.dumps(configs, default=lambda x: x.__dict__)


# Pre-computed JSON strings for API responses
DEFAULT_RULES_JSON = _as_json(get_default_burst_detection_rules())
PREDEFINED_RULES_JSON = _as_json(get_all_predefined_burst_rules())


def as_rules(configs):
    """Convert list of rule configs to list of BurstDetectionRule objects."""
    return [BurstDetectionRule(config) for config in configs]


def get_hard_rules(rules):
    """Filter to only hard criteria rules."""
    return [r for r in rules if r.category == BurstRuleCategory.HARD and r.enabled]


def get_soft_rules(rules):
    """Filter to only soft criteria rules."""
    return [r for r in rules if r.category == BurstRuleCategory.SOFT and r.enabled]


def get_enabled_rules(rules):
    """Filter to only enabled rules."""
    return [r for r in rules if r.enabled]


================================================
FILE: api/cluster_manager.py
================================================
import numpy as np

from api.models.cluster import UNKNOWN_CLUSTER_ID, Cluster, get_unknown_cluster
from api.models.face import Face
from api.models.person import Person, get_or_create_person
from api.models.user import User
from api.util import logger


class ClusterManager:
    @staticmethod
    def try_add_cluster(
        user: User, cluster_id: int, faces: list[Face], padLen: int = 1
    ) -> list[Cluster]:
        added_clusters: list[Cluster] = []
        known_faces: list[Face] = []
        face_ids_by_cluster: dict[int, list[int]] = dict()
        unknown_faces: list[Face] = []
        unknown_ids: list[int] = []
        encoding_by_person: dict[int, list[np.ndarray]] = dict()

        face: Face
        new_cluster: Cluster
        unknown_cluster: Cluster = get_unknown_cluster(user=user)
        labelStr = str(cluster_id).zfill(padLen)
        for face in faces:
            if not face.person:
                unknown_faces.append(face)
                unknown_ids.append(face.id)
            else:
                known_faces.append(face)

        if cluster_id == UNKNOWN_CLUSTER_ID:
            logger.info("Adding unknown cluster")
            logger.info(
                "Adding unknown %d faces to unknown cluster" % len(unknown_faces)
            )
            logger.info("Adding known %d faces to unknown cluster" % len(known_faces))
            for face in unknown_faces:
                face.cluster = unknown_cluster
                face.cluster_person = None
                face.save()
            for face in known_faces:
                face.cluster = unknown_cluster
                face.save()

            return added_clusters

        if len(known_faces) == 0:
            new_cluster: Cluster
            new_person: Person

            new_person = get_or_create_person(
                name="Unknown " + labelStr, owner=user, kind=Person.KIND_CLUSTER
            )
            new_person.cluster_owner = user
            new_person.save()
            new_cluster = Cluster.get_or_create_cluster_by_id(user, cluster_id)
            new_cluster.name = "Cluster " + str(cluster_id)

            new_cluster.person = new_person
            encoding_by_person[new_cluster.person.id] = []
            new_cluster.save()
            added_clusters.append(new_cluster)

            for face in unknown_faces:
                encoding_by_person[new_cluster.person.id].append(
                    face.get_encoding_array()
                )
            Face.objects.filter(id__in=unknown_ids).update(
                cluster=new_cluster,
                cluster_person=new_person,
            )
        else:
            clusters_by_person: dict[int, Cluster] = dict()
            mean_encoding_by_cluster: dict[int, list[np.ndarray]] = dict()
            idx: int = 0
            for face in known_faces:
                if face.person.id not in clusters_by_person.keys():
                    idx = idx + 1
                    new_cluster = Cluster.get_or_create_cluster_by_name(
                        user, "Cluster " + str(cluster_id) + "-" + str(idx)
                    )
                    new_cluster.cluster_id = cluster_id
                    new_cluster.person = face.person
                    clusters_by_person[new_cluster.person.id] = new_cluster
                    added_clusters.append(new_cluster)
                    encoding_by_person[face.person.id] = []
                    face_ids_by_cluster[new_cluster.id] = []
                else:
                    new_cluster = clusters_by_person[face.person.id]
                encoding_by_person[face.person.id].append(face.get_encoding_array())
                face_ids_by_cluster[new_cluster.id].append(face.id)
            for new_cluster in added_clusters:
                Face.objects.filter(id__in=face_ids_by_cluster[new_cluster.id]).update(
                    cluster=new_cluster
                )

            # Set initial metadata on the split clusters based on known faces
            for new_cluster in added_clusters:
                new_cluster.set_metadata(encoding_by_person[new_cluster.person.id])
                mean_encoding_by_cluster[new_cluster.id] = (
                    new_cluster.get_mean_encoding_array()
                )

            # Clear the face IDs list to prepare for processing the unknown faces
            for new_cluster in added_clusters:
                face_ids_by_cluster[new_cluster.id] = []

            for new_cluster in added_clusters:
                Face.objects.filter(id__in=face_ids_by_cluster[new_cluster.id]).update(
                    cluster=new_cluster,
                    cluster_person=new_cluster.person,
                )

        # Update statistics again and save everything, since we've added more faces
        for new_cluster in added_clusters:
            new_cluster.set_metadata(encoding_by_person[new_cluster.person.id])
            new_cluster.save()

        return added_clusters


================================================
FILE: api/date_time_extractor.py
================================================
import json
import math
import os
import pathlib
import re
from datetime import datetime

import pytz

from api.metadata.tags import Tags
from api.util import logger


def _regexp_group_range(a, b):
    return "(" + "|".join(f"{i:02}" for i in range(a, b)) + ")"


_REGEXP_GROUP_YEAR = r"((?:19|20|21)\d\d)"
_REGEXP_GROUP_MONTH = _regexp_group_range(1, 13)
_REGEXP_GROUP_DAY = _regexp_group_range(1, 32)
_REGEXP_GROUP_HOUR = _regexp_group_range(0, 24)
_REGEXP_GROUP_MIN = r"([0-5]\d)"
_REGEXP_GROUP_SEC = r"([0-5]\d)"
_REGEXP_DELIM = r"[-:_\., ]*"
_NOT_A_NUMBER = r"(?<!\d)"

REGEXP_NO_TZ = re.compile(
    _NOT_A_NUMBER
    + _REGEXP_DELIM.join(
        [
            _REGEXP_GROUP_YEAR,
            _REGEXP_GROUP_MONTH,
            _REGEXP_GROUP_DAY,
            _REGEXP_GROUP_HOUR,
            _REGEXP_GROUP_MIN,
            _REGEXP_GROUP_SEC,
        ]
    )
)

# WhatsApp style filename - like IMG-20220101-WA0007.jpg
# Here we get year, month, day from the filename and use the number as microsecond so that
# media is ordered by that number but all of these images are grouped together separated from
# other media on that date.
REGEXP_WHATSAPP = re.compile(r"^(?:IMG|VID)[-_](\d{4})(\d{2})(\d{2})(?:[-_]WA(\d+))?")
REGEXP_WHATSAPP_GROUP_MAPPING = ["year", "month", "day", "microsecond"]

PREDEFINED_REGEXPS = {
    "default": (REGEXP_NO_TZ, None),
    "whatsapp": (REGEXP_WHATSAPP, REGEXP_WHATSAPP_GROUP_MAPPING),
}

REGEXP_GROUP_MAPPINGS = {
    "year": 0,
    "month": 1,
    "day": 2,
    "hour": 3,
    "minute": 4,
    "second": 5,
    "microsecond": 6,
}


def _extract_no_tz_datetime_from_str(x, regexp=REGEXP_NO_TZ, group_mapping=None):
    match = re.search(regexp, x)
    if not match:
        return None
    g = match.groups()
    if group_mapping is None:
        datetime_args = list(map(int, g))
    else:
        if len(g) > len(group_mapping):
            raise ValueError(
                f"Can't have more groups than group mapping values: {x}, regexp: {regexp}, mapping: {group_mapping}"
            )
        datetime_args = [
            None,
            None,
            None,
            0,
            0,
            0,
            0,
        ]  # year, month, day, hour, minute, second, microsecond
        for value, how_to_use in zip(g, group_mapping):
            if how_to_use not in REGEXP_GROUP_MAPPINGS:
                raise ValueError(
                    f"Group mapping {how_to_use} is unknown - must be one of {list(REGEXP_GROUP_MAPPINGS.keys())}"
                )
            ind = REGEXP_GROUP_MAPPINGS[how_to_use]
            # handle case when we have less groups than expected
            if value is not None:
                datetime_args[ind] = int(value)

    try:
        parsed_datetime = datetime(*datetime_args)
        delta = parsed_datetime - datetime.now()
        if delta.days > 30:
            logger.error(
                f"Error while parsing datetime from '{x}': Parsed datetime is {delta.days} in the future."
            )
            return None

        return parsed_datetime
    except ValueError:
        logger.error(
            f"Error while trying to create datetime using '{x}': datetime arguments {datetime_args}. Regexp used: '{regexp}'"
        )
        return None


class RuleTypes:
    EXIF = "exif"
    PATH = "path"
    FILESYSTEM = "filesystem"
    USER_DEFINED = "user_defined"


class TimeExtractionRule:
    """The goal is to help extract local time, but for historical reason it is expected the returned
    datetime will have timezone to be set to pytz.utc (so local time + timezone equal to UTC)..

    Some sources of data might give us very rich information, e.g. timestamp + timezone,
    but others only allow to get local time (without knowing real timestamp).

    The logic for extracting local time is described as a list of rules that should be applied
    one after another until one rule is able to extract date time (or until all rules are tried
    without success).

    Currently supported rule types:
      - "exif" - local time is taken using exif tag params["exif_tag"] as obtained with exiftool
      - "path" - time is taken from the filename using a regular expression matching
        - if params["path_part"] is set to "full_path" then full path (as seen by backend container)
          is used for regexp matching instead of just fileanme.
        - if params["custom_regexp"] is specified - that regexp is used instead of default one
          (it is still expecting 6 groups to be matched: year, month, day, hour, minute, second).
      - "fs" - time is taken from file property. Since these are unix timestamps without timezones
        they are always translated to local time using UTC.
        - params["file_property"] must be specified and equal to one of the following:
          - "mtime" - for file modifided time
          - "ctime" - for file created time
    If a rule can't fetch the time (e.g. the exif tag value is not present or path doesn't match
    a regexp) then that rule is considered to be not applicable.

    In some cases it is known that the local time the rule would obtain is not in the desired
    timezone. E.g. video datetime tag QuickTime:CreateDate is by standard written in UTC rather
    than local time. For such cases each rule can optionally have setting "transform_tz" set to "1"
    - in that case this rule should also specify "source_tz" and "report_tz" settings where
    "source_tz" is describing the timezone that the rule is getting and "report_tz" is describing
    the timezone of the location where the photo/video was taken. Both "source_tz" and "report_tz"
    should be one of the following:
      - "utc" - UTC timezone
      - "gps_timezonefinder" - the timezone of the GPS location associated with the photo/video
      - "server_local" - the timezone of the librephotos server - not very useful since we run docker containers in UTC timezone.
      - "user_default" - user default timezone
      - "name:<timezone_name>" - the timezone with the name <timezone_name>
    If either "source_tz" or "report_tz" could not be obtained the rule is considered to be not applicable.

    Additionally each rule can have condition specifications that limits the rule application
    to only the photos/videos that meet the condition's requirement. Supported conditions:
      - "condition_path": "<regexp>" - rule only applied to files with full path (as seen by backend)
                                       matching the regexp
      - "condition_filename": "<regexp>" - rule only applied to files with filename matching the regexp
      - "condition_exif": "<tag_name>//<regexp>" - first "//" is considered end of tag name and the rule is only
                                          applied if value of tag <tag_name> exists and matches the regexp.

    If multiple conditions are provided the rule is considered applicable only if all of them are met.

    Examples of the rules:
      - Take local time from exif tag "EXIF:DateTimeOriginal" if it is available:

            {
                "rule_type": "exif",
                "exif_tag": "EXIF:DateTimeOriginal",
            }

      - Take UTC time using tag "QuickTime:CreateDate" and convert it from UTC
        to timezone associated with the GPS coordinates (only applies if both
        tag value and GPS coordinates are available):

            {
                "rule_type": "exif",
                "exif_tag": "QuickTime:CreateDate",
                "transform_tz": 1,
                "source_tz": "utc",
                "report_tz": "gps_timezonefinder",
            }

      - Look at the filename and try to extract time from it - treat it as local time
        (it is known that some devices are not using local time here - e.g. some phones
        might use UTC time for video filenames):

            {
                "rule_type": "path",
            }

      - Take UTC time time using tag "QuickTime:CreateDate" and convert it from UTC
        to a fixed timezone "Europe/Moscow" to get local time. Only apply to files
        which path contains "Moscow_Visit" or "FromMoscow":

            {
                "rule_type": "exif",
                "exif_tag": "QuickTime:CreateDate",
                "transform_tz": 1,
                "source_tz": "utc",
                "report_tz": "name:Europe/Moscow",
                "condition_path": "(Moscow_Visit|FromMoscow)",
            }

      - Take modified time of the file and get local time using timezone associated
        with the GPS location. Only apply to files with "EXIF:Model" exif tag
        containing "FooBar":

            {
                "rule_type": "filesystem",
                "file_property": "mtime",
                "transform_tz": 1,
                "source_tz": "utc",
                "report_tz": "gps_timezonefinder",
                "condition_exif": "EXIF:Model//FooBar"
            }
    """

    def __init__(self, params):
        self.rule_type = params["rule_type"]
        self.params = params

    def get_required_exif_tags(self):
        condition_tag, pattern = self._get_condition_exif()
        res = set()
        if condition_tag is not None:
            res.add(condition_tag)
        if self.rule_type == RuleTypes.EXIF:
            res.add(self.params["exif_tag"])
        return res

    def _get_no_tz_dt_from_tag(self, tag_name, exif_tags):
        tag_val = exif_tags.get(tag_name)
        if not tag_val:
            return None
        dt = _extract_no_tz_datetime_from_str(tag_val)
        return dt

    def _check_condition_path(self, path):
        if "condition_path" in self.params:
            return re.search(self.params["condition_path"], path) is not None
        else:
            return True

    def _check_condition_filename(self, path):
        if "condition_filename" in self.params:
            return (
                re.search(self.params["condition_filename"], pathlib.Path(path).name)
                is not None
            )
        else:
            return True

    def _get_condition_exif(self):
        val = self.params.get("condition_exif")
        if val is None:
            return None, None
        tag_and_pattern = val.split("//", maxsplit=1)
        if len(tag_and_pattern) != 2:
            raise ValueError(
                f"Value of condition_exif must contain '//' delimiter between tag name and pattern: '{val}'"
            )
        tag, pattern = tag_and_pattern
        return tag, pattern

    def _check_condition_exif(self, exif_tags):
        tag, pattern = self._get_condition_exif()
        if tag:
            tag_value = exif_tags.get(tag)
            if not tag_value:
                return False
            return re.search(pattern, tag_value) is not None
        else:
            return True

    def _check_conditions(self, path, exif_tags, gps_lat, gps_lon):
        return (
            self._check_condition_exif(exif_tags)
            and self._check_condition_path(path)
            and self._check_condition_filename(path)
        )

    def apply(
        self, path, exif_tags, gps_lat, gps_lon, user_default_tz, user_defined_timestamp
    ):
        if not self._check_conditions(path, exif_tags, gps_lat, gps_lon):
            return None
        if self.rule_type == RuleTypes.EXIF:
            return self._apply_exif(exif_tags, gps_lat, gps_lon, user_default_tz)
        elif self.rule_type == RuleTypes.PATH:
            return self._apply_path(path, gps_lat, gps_lon, user_default_tz)
        elif self.rule_type == RuleTypes.FILESYSTEM:
            return self._apply_filesystem(path, gps_lat, gps_lon, user_default_tz)
        elif self.rule_type == RuleTypes.USER_DEFINED:
            return user_defined_timestamp
        else:
            raise ValueError(f"Unknown rule type {self.rule_type}")

    def _get_tz(self, description, gps_lat, gps_lon, user_default_tz):
        """None is a valid timezone returned here (meaning that we want to use server local time).
        This is why this function returns a tuple with the first element specifying success of
        determining the timezone, and the second element - the timezone itself.
        """
        if description == "gps_timezonefinder":
            if not _check_gps_ok(gps_lat, gps_lon):
                return (False, None)
            from timezonefinder import TimezoneFinder

            tzfinder = TimezoneFinder()
            tz_name = tzfinder.timezone_at(lng=gps_lon, lat=gps_lat)
            return (True, pytz.timezone(tz_name)) if tz_name else (False, None)
        elif description == "user_default":
            return (True, pytz.timezone(user_default_tz))
        elif description == "server_local":
            return (True, None)
        elif description.lower() == "utc":
            return (True, pytz.utc)
        elif description.startswith("name:"):
            return (True, pytz.timezone(description[5:]))
        else:
            raise ValueError(f"Unknown tz description {description}")

    def _transform_tz(self, dt, gps_lat, gps_lon, user_default_tz):
        if not dt:
            return None
        if self.params.get("transform_tz"):
            has_source_tz, source_tz = self._get_tz(
                self.params["source_tz"], gps_lat, gps_lon, user_default_tz
            )
            if not has_source_tz:
                return None
            has_report_tz, report_tz = self._get_tz(
                self.params["report_tz"], gps_lat, gps_lon, user_default_tz
            )
            if not has_report_tz:
                return None
            # Either of source_tz or report_tz might be None - meaning that we want to use
            # server local timezone
            dt = datetime.fromtimestamp(
                dt.replace(tzinfo=source_tz).timestamp(), report_tz
            )
        return dt.replace(tzinfo=pytz.utc)

    def _apply_exif(self, exif_tags, gps_lat, gps_lon, user_default_tz):
        dt = self._get_no_tz_dt_from_tag(self.params["exif_tag"], exif_tags)
        return self._transform_tz(dt, gps_lat, gps_lon, user_default_tz)

    def _apply_path(self, path, gps_lat, gps_lon, user_default_tz):
        path_part = self.params.get("path_part")
        if path_part is None or path_part == "filename":
            source = pathlib.Path(path).name
        elif path_part == "full_path":
            source = path
        else:
            raise ValueError(f"Unknown path_part {path_part}")

        group_mapping = None
        regexp = self.params.get("custom_regexp")
        if not regexp:
            predefined_regexp_type = self.params.get("predefined_regexp", "default")
            if predefined_regexp_type not in PREDEFINED_REGEXPS:
                raise ValueError(
                    f"Unknown predefined regexp type {predefined_regexp_type}"
                )
            regexp, group_mapping = PREDEFINED_REGEXPS[predefined_regexp_type]
        dt = _extract_no_tz_datetime_from_str(source, regexp, group_mapping)
        return self._transform_tz(dt, gps_lat, gps_lon, user_default_tz)

    def _apply_filesystem(self, path, gps_lat, gps_lon, user_default_tz):
        file_property = self.params.get("file_property")
        if file_property == "mtime":
            dt = datetime.fromtimestamp(os.path.getmtime(path), pytz.utc)
        elif file_property == "ctime":
            dt = datetime.fromtimestamp(os.path.getctime(path), pytz.utc)
        else:
            raise ValueError(f"Unknown file_property {file_property}")
        return self._transform_tz(dt, gps_lat, gps_lon, user_default_tz)


def _check_gps_ok(lat, lon):
    return (
        lat is not None
        and lon is not None
        and math.isfinite(lat)
        and math.isfinite(lon)
        and (lat != 0.0 or lon != 0.0)
    )


ALL_TIME_ZONES = pytz.all_timezones

DEFAULT_RULES_PARAMS = [
    {
        "id": 14,
        "name": "Timestamp set by user",
        "rule_type": RuleTypes.USER_DEFINED,
    },
    {
        "id": 15,
        "name": f"Local time from {Tags.DATE_TIME} exif tag",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.DATE_TIME,
    },
    {
        "id": 1,
        "name": f"Local time from {Tags.DATE_TIME_ORIGINAL} exif tag",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.DATE_TIME_ORIGINAL,
    },
    {
        "id": 2,
        "name": "Get Video creation tag in UTC + figure out timezone using GPS coordinates",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.QUICKTIME_CREATE_DATE,
        "transform_tz": 1,
        "source_tz": "utc",
        "report_tz": "gps_timezonefinder",
    },
    {
        "id": 11,
        "name": f"Use {Tags.GPS_DATE_TIME} tag + figure out timezone using GPS coordinates",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.GPS_DATE_TIME,
        "transform_tz": 1,
        "source_tz": "utc",
        "report_tz": "gps_timezonefinder",
    },
    {
        "id": 3,
        "name": "Using filename assuming time is local (most of filenames auto generated by smartphones etc)",
        "rule_type": RuleTypes.PATH,
    },
    {
        "id": 4,
        "name": "Video creation datetime in user default timezone (can't find out actual timezone)",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.QUICKTIME_CREATE_DATE,
        "transform_tz": 1,
        "source_tz": "utc",
        "report_tz": "user_default",
    },
    {
        "id": 5,
        "name": "Extract date using WhatsApp file name",
        "rule_type": RuleTypes.PATH,
        "predefined_regexp": "whatsapp",
    },
]

OTHER_RULES_PARAMS = [
    {
        "id": 6,
        "name": "Video creation datetime in UTC timezone (can't find out actual timezone)",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.QUICKTIME_CREATE_DATE,
    },
    {
        "id": 7,
        "name": "File modified time in user default timezone",
        "rule_type": RuleTypes.FILESYSTEM,
        "file_property": "mtime",
        "transform_tz": 1,
        "source_tz": "utc",
        "report_tz": "user_default",
    },
    {
        "id": 8,
        "name": "File modified time in UTC timezone",
        "rule_type": RuleTypes.FILESYSTEM,
        "file_property": "mtime",
    },
    {
        "id": 9,
        "name": "File created time in user default timezone",
        "rule_type": RuleTypes.FILESYSTEM,
        "file_property": "ctime",
        "transform_tz": 1,
        "source_tz": "utc",
        "report_tz": "user_default",
    },
    {
        "id": 10,
        "name": "File created time in UTC timezone",
        "rule_type": RuleTypes.FILESYSTEM,
        "file_property": "ctime",
    },
    {
        "id": 12,
        "name": f"Use {Tags.GPS_DATE_TIME} tag in user default timezone (can't find out actual timezone)",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.GPS_DATE_TIME,
        "transform_tz": 1,
        "source_tz": "utc",
        "report_tz": "user_default",
    },
    {
        "id": 13,
        "name": f"Use {Tags.GPS_DATE_TIME} tag in UTC timezone (can't find out actual timezone)",
        "rule_type": RuleTypes.EXIF,
        "exif_tag": Tags.GPS_DATE_TIME,
    },
]


def set_as_default_rule(rule):
    rule["is_default"] = True
    return rule


def set_as_other_rule(rule):
    rule["is_default"] = False
    return rule


PREDEFINED_RULES_PARAMS = list(map(set_as_default_rule, DEFAULT_RULES_PARAMS)) + list(
    map(set_as_other_rule, OTHER_RULES_PARAMS)
)


def _as_json(configs):
    return json.dumps(configs, default=lambda x: x.__dict__)


DEFAULT_RULES_JSON = _as_json(DEFAULT_RULES_PARAMS)
PREDEFINED_RULES_JSON = _as_json(PREDEFINED_RULES_PARAMS)
ALL_TIME_ZONES_JSON = _as_json(ALL_TIME_ZONES)


def as_rules(configs):
    return list(map(TimeExtractionRule, configs))


def extract_local_date_time(
    path, rules, exif_getter, gps_lat, gps_lon, user_default_tz, user_defined_timestamp
):
    required_tags = set()
    for rule in rules:
        required_tags.update(rule.get_required_exif_tags())
    required_tags = list(required_tags)
    exif_values = exif_getter(required_tags)
    exif_tags = {k: v for k, v in zip(required_tags, exif_values)}
    for rule in rules:
        res = rule.apply(
            path, exif_tags, gps_lat, gps_lon, user_default_tz, user_defined_timestamp
        )
        if res:
            return res
    return None


================================================
FILE: api/directory_watcher/__init__.py
================================================
"""
Directory watcher module for scanning and processing photos.

This module implements a two-phase scan architecture to avoid race conditions
when processing RAW+JPEG pairs concurrently:

Phase 1: Collect all files and group by (directory, basename)
         - IMG_001.jpg, IMG_001.CR2, IMG_001.xmp -> one group
         - IMG_002.jpg -> separate group

Phase 2: Process each group, creating one Photo per group
         with all file variants attached.
"""

# Main scan functions
from api.directory_watcher.scan_jobs import (
    scan_photos,
    scan_missing_photos,
    photo_scanner,
)

# File handling
from api.directory_watcher.file_handlers import (
    create_new_image,
    create_file_record,
    group_files_into_photo,
    handle_new_image,
    handle_file_group,
)

# File grouping utilities
from api.directory_watcher.file_grouping import (
    JPEG_EXTENSIONS,
    FILE_TYPE_PRIORITY,
    get_file_grouping_key,
    select_main_file,
    find_matching_jpeg_photo,
    find_matching_image_for_video,
)

# Processing jobs
from api.directory_watcher.processing_jobs import (
    generate_tags,
    generate_tag_job,
    add_geolocation,
    geolocation_job,
    scan_faces,
    generate_face_embeddings,
)

# Repair jobs
from api.directory_watcher.repair_jobs import (
    repair_ungrouped_file_variants,
)

# Utilities
from api.directory_watcher.utils import (
    is_hidden,
    should_skip,
    walk_directory,
    walk_files,
    update_scan_counter,
)

# Re-export from api.models.file for backwards compatibility
from api.models.file import is_valid_media

__all__ = [
    # Scan jobs
    "scan_photos",
    "scan_missing_photos",
    "photo_scanner",
    # File handling
    "create_new_image",
    "create_file_record",
    "group_files_into_photo",
    "handle_new_image",
    "handle_file_group",
    # File grouping
    "JPEG_EXTENSIONS",
    "FILE_TYPE_PRIORITY",
    "get_file_grouping_key",
    "select_main_file",
    "find_matching_jpeg_photo",
    "find_matching_image_for_video",
    # Processing jobs
    "generate_tags",
    "generate_tag_job",
    "add_geolocation",
    "geolocation_job",
    "scan_faces",
    "generate_face_embeddings",
    # Repair jobs
    "repair_ungrouped_file_variants",
    # Utilities
    "is_hidden",
    "should_skip",
    "walk_directory",
    "walk_files",
    "update_scan_counter",
    # Re-exported from api.models.file
    "is_valid_media",
]


================================================
FILE: api/directory_watcher/file_grouping.py
================================================
"""
File grouping utilities for the two-phase scan architecture.

This module provides functions for grouping related files (RAW+JPEG pairs,
Live Photos, etc.) so they can be processed together as a single Photo.
"""

import os

from api.models import File, Photo


# JPEG/image extensions that RAW files can be paired with
JPEG_EXTENSIONS = {'.jpg', '.jpeg', '.heic', '.heif', '.png', '.tiff', '.tif'}

# File type priority for main_file selection (lower number = higher priority)
# JPEG/processed images should be main_file, RAW/video variants are secondary
FILE_TYPE_PRIORITY = {
    File.IMAGE: 1,      # JPEG, HEIC, PNG - highest priority
    File.VIDEO: 2,      # Videos (standalone or Live Photo motion)
    File.RAW_FILE: 3,   # RAW files are variants, not main
    File.METADATA_FILE: 4,  # XMP sidecars - lowest priority
    File.UNKNOWN: 5,
}


def get_file_grouping_key(path: str) -> tuple[str, str]:
    """
    Get the grouping key for a file path.
    
    Files with the same (directory, basename) should be grouped together
    as variants of the same Photo (e.g., IMG_001.jpg + IMG_001.CR2 + IMG_001.xmp).
    
    Args:
        path: File path to get grouping key for
        
    Returns:
        Tuple of (directory, lowercase_basename_without_extension)
    """
    directory = os.path.dirname(path)
    basename = os.path.splitext(os.path.basename(path))[0].lower()
    return (directory, basename)


def select_main_file(files: list[File]) -> File | None:
    """
    Select the best file to be the main_file for a Photo.
    
    Priority: IMAGE > VIDEO > RAW > METADATA
    Within same type, prefer the first one found (alphabetically by path).
    
    Args:
        files: List of File objects to choose from
        
    Returns:
        The File that should be main_file, or None if empty list
    """
    if not files:
        return None
    
    return min(files, key=lambda f: (FILE_TYPE_PRIORITY.get(f.type, 999), f.path))


def find_matching_jpeg_photo(raw_path: str, user) -> Photo | None:
    """
    Find an existing Photo with a matching JPEG/image file for a RAW file.
    
    Matches based on same base filename (without extension) in the same directory.
    This implements the PhotoPrism-like file variant model where RAW+JPEG are
    one Photo with multiple file variants, not separate Photos.
    
    Args:
        raw_path: Path to the RAW file
        user: Owner of the photos
        
    Returns:
        Matching Photo if found, None otherwise
    """
    raw_dir = os.path.dirname(raw_path)
    raw_basename = os.path.splitext(os.path.basename(raw_path))[0]
    
    # Look for matching JPEG/image file in same directory
    for jpeg_ext in JPEG_EXTENSIONS:
        # Try both lowercase and uppercase extensions
        for ext in [jpeg_ext, jpeg_ext.upper()]:
            jpeg_path = os.path.join(raw_dir, raw_basename + ext)
            photo = Photo.objects.filter(
                owner=user,
                main_file__path=jpeg_path
            ).first()
            if photo:
                return photo
    
    return None


def find_matching_image_for_video(video_path: str, user) -> Photo | None:
    """
    Find an existing Photo with a matching image file for a Live Photo video.
    
    Apple Live Photos store the video as a separate .mov file with the same
    base name as the image. This allows attaching the video as a file variant.
    
    Args:
        video_path: Path to the video file
        user: Owner of the photos
        
    Returns:
        Matching Photo if found, None otherwise
    """
    video_dir = os.path.dirname(video_path)
    video_basename = os.path.splitext(os.path.basename(video_path))[0]
    video_ext_lower = os.path.splitext(video_path)[1].lower()
    
    # Only match .mov files (Apple Live Photos) with same base name
    if video_ext_lower not in ['.mov']:
        return None
    
    # Look for matching image file with same base name
    image_extensions = list(JPEG_EXTENSIONS) + ['.heic', '.HEIC']
    for img_ext in image_extensions:
        for ext in [img_ext, img_ext.upper()]:
            image_path = os.path.join(video_dir, video_basename + ext)
            photo = Photo.objects.filter(
                owner=user,
                main_file__path=image_path
            ).first()
            if photo:
                return photo
    
    return None


================================================
FILE: api/directory_watcher/file_handlers.py
================================================
"""
File and Photo creation handlers.

This module contains functions for creating File records and grouping
them into Photo objects.
"""

import datetime
import os

import pytz
from django.conf import settings
from django.db.models import Q

from api import util
from api.models import File, Photo, Thumbnail
from api.models.file import calculate_hash, is_metadata, is_raw, is_valid_media, is_video
from api.models.photo_search import PhotoSearch
from api.perceptual_hash import calculate_hash_from_thumbnail
from api.stacks.live_photo import has_embedded_motion_video, extract_embedded_motion_video

from api.directory_watcher.file_grouping import (
    FILE_TYPE_PRIORITY,
    find_matching_jpeg_photo,
    find_matching_image_for_video,
    select_main_file,
)
from api.directory_watcher.utils import update_scan_counter


def create_file_record(user, path) -> File | None:
    """
    Phase 1: Create a File record for a path without creating/grouping Photos.
    
    This is the first phase of the two-phase scan architecture:
    - Phase 1: Create File records for all discovered files (this function)
    - Phase 2: Group files into Photos by (directory, basename)
    
    This separation eliminates race conditions where concurrent processing
    of RAW and JPEG files could create separate Photos instead of grouping them.
    
    Args:
        user: The owner of the file
        path: The file path
        
    Returns:
        File object if created/found, None if invalid media
    """
    if not is_valid_media(path=path, user=user):
        return None
    
    hash_value = calculate_hash(user, path)
    
    # Skip if this is embedded media (already attached to another file)
    if File.embedded_media.through.objects.filter(Q(to_file_id=hash_value)).exists():
        util.logger.warning(f"embedded content file found {path}")
        return None
    
    # Create the File record (File.create handles race conditions via unique path constraint)
    file = File.create(path, user)
    return file


def group_files_into_photo(user, files: list[File], job_id) -> Photo | None:
    """
    Phase 2: Group a list of related files into a single Photo.
    
    Creates a new Photo with the given files as variants, selecting the
    best file as main_file based on type priority (IMAGE > VIDEO > RAW > METADATA).
    
    This function should be called with all files that share the same
    (directory, basename) - e.g., IMG_001.jpg, IMG_001.CR2, IMG_001.xmp.
    
    Args:
        user: The owner of the photo
        files: List of File objects to group (must not be empty)
        job_id: Job ID for logging
        
    Returns:
        The created Photo, or None if no valid files
    """
    if not files:
        return None
    
    # Filter out metadata files for main photo creation - they're sidecars
    non_metadata_files = [f for f in files if f.type != File.METADATA_FILE]
    
    if not non_metadata_files:
        # Only metadata files - no photo to create
        util.logger.warning(f"job {job_id}: Only metadata files in group, skipping")
        return None
    
    # Select main file based on priority
    main_file = select_main_file(non_metadata_files)
    if not main_file:
        return None
    
    # Check if a Photo already exists with any of these files
    existing_photo = Photo.objects.filter(
        owner=user,
        files__in=files
    ).first()
    
    if existing_photo:
        # Add any missing files to the existing photo
        for f in files:
            if not existing_photo.files.filter(hash=f.hash).exists():
                existing_photo.files.add(f)
                util.logger.info(f"job {job_id}: Attached file {f.path} to existing Photo {existing_photo.image_hash}")
        
        # Update main_file if current one has lower priority
        if existing_photo.main_file:
            current_priority = FILE_TYPE_PRIORITY.get(existing_photo.main_file.type, 999)
            new_priority = FILE_TYPE_PRIORITY.get(main_file.type, 999)
            if new_priority < current_priority:
                existing_photo.main_file = main_file
                existing_photo.save(update_fields=['main_file'])
        
        return existing_photo
    
    # Create new Photo
    photo = Photo()
    photo.image_hash = main_file.hash
    photo.owner = user
    photo.added_on = datetime.datetime.now().replace(tzinfo=pytz.utc)
    photo.geolocation_json = {}
    photo.video = (main_file.type == File.VIDEO)
    photo.save()
    
    # Add all files to the photo
    for f in files:
        photo.files.add(f)
    
    photo.main_file = main_file
    photo.save()
    
    # Handle embedded media (Google/Samsung Live Photos with embedded video)
    if has_embedded_motion_video(main_file.path) and settings.FEATURE_PROCESS_EMBEDDED_MEDIA:
        em_path = extract_embedded_motion_video(main_file.path, main_file.hash)
        if em_path:
            em_file = File.create(em_path, user)
            main_file.embedded_media.add(em_file)
            photo.files.add(em_file)
            photo.save()
    
    util.logger.info(f"job {job_id}: Created Photo {photo.image_hash} with {len(files)} file(s)")
    return photo


def create_new_image(user, path) -> Photo | None:
    """
    Creates a new Photo object based on user input and file path.
    
    This is the legacy single-file creation function, kept for backwards
    compatibility with upload handling. For scan operations, use the
    two-phase approach (create_file_record + group_files_into_photo).

    Args:
        user: The owner of the photo.
        path: The file path of the image.

    Returns:
        The created Photo object if successful, otherwise returns None.

    Note:
        This function implements file variant grouping (PhotoPrism-like):
        - RAW files are attached to existing JPEG Photos as file variants
        - Live Photo videos (.mov) are attached to existing image Photos as file variants
        - Other files create new Photo entities
    """
    if not is_valid_media(path=path, user=user):
        return None
    hash_value = calculate_hash(user, path)
    if File.embedded_media.through.objects.filter(Q(to_file_id=hash_value)).exists():
        util.logger.warning(f"embedded content file found {path}")
        return None

    # Handle metadata files (XMP sidecars)
    if is_metadata(path):
        photo_name = os.path.splitext(os.path.basename(path))[0]
        photo_dir = os.path.dirname(path)
        photo = Photo.objects.filter(
            Q(files__path__contains=photo_dir)
            & Q(files__path__contains=photo_name)
            & ~Q(files__path__contains=os.path.basename(path))
        ).first()

        if photo:
            file = File.create(path, user)
            photo.files.add(file)
            photo.save()
        else:
            util.logger.warning(f"no photo to metadata file found {path}")
        return None

    # === File Variant Handling (PhotoPrism-like model) ===
    
    # Handle RAW files: attach to existing JPEG Photo if found
    if is_raw(path):
        existing_photo = find_matching_jpeg_photo(path, user)
        if existing_photo:
            # Check if this RAW file is already attached
            if not existing_photo.files.filter(path=path).exists():
                raw_file = File.create(path, user)
                existing_photo.files.add(raw_file)
                existing_photo.save()
                util.logger.info(f"Attached RAW file {path} to existing Photo {existing_photo.image_hash}")
            return existing_photo
    
    # Handle Live Photo videos (.mov): attach to existing image Photo if found
    if is_video(path):
        existing_photo = find_matching_image_for_video(path, user)
        if existing_photo:
            # Check if this video is already attached
            if not existing_photo.files.filter(path=path).exists():
                video_file = File.create(path, user)
                existing_photo.files.add(video_file)
                existing_photo.video = False  # Keep photo as image (video is just a variant)
                existing_photo.save()
                util.logger.info(f"Attached Live Photo video {path} to existing Photo {existing_photo.image_hash}")
            return existing_photo

    # === Standard Photo Creation ===
    photo = Photo()
    photo.image_hash = hash_value
    photo.owner = user
    photo.added_on = datetime.datetime.now().replace(tzinfo=pytz.utc)
    photo.geolocation_json = {}
    photo.video = is_video(path)
    photo.save()
    file = File.create(path, user)
    
    # Live Photo detection - extracts embedded motion video if present (Google/Samsung)
    if has_embedded_motion_video(file.path) and settings.FEATURE_PROCESS_EMBEDDED_MEDIA:
        em_path = extract_embedded_motion_video(file.path, file.hash)
        if em_path:
            em_file = File.create(em_path, user)
            file.embedded_media.add(em_file)
            # Also add embedded video to Photo.files as a variant
            photo.files.add(em_file)
    
    photo.files.add(file)
    photo.main_file = file
    photo.save()
    return photo


def handle_new_image(user, path, job_id, photo=None):
    """
    Handles the creation and all the processing of the photo needed for it to be displayed.

    Args:
        user: The owner of the photo.
        path: The file path of the image.
        job_id: The long-running job id, which gets updated when the task runs
        photo: An optional parameter, where you can input a photo instead of creating a new one. Used for uploading.

    Note:
        This function is used when uploading a picture, because rescanning does not perform machine learning tasks.
    """
    try:
        start = datetime.datetime.now()
        if photo is None:
            photo = create_new_image(user, path)
            elapsed = (datetime.datetime.now() - start).total_seconds()
            util.logger.info(f"job {job_id}: save image: {path}, elapsed: {elapsed}")
        if photo:
            _process_photo(photo, path, job_id, start)

    except Exception as e:
        try:
            util.logger.exception(
                f"job {job_id}: could not load image {path}. reason: {str(e)}"
            )
        except Exception:
            util.logger.exception(f"job {job_id}: could not load image {path}")
    finally:
        update_scan_counter(job_id)


def handle_file_group(user, file_paths: list[str], job_id):
    """
    Phase 2 handler: Process a group of related files into a single Photo.
    
    This is called after Phase 1 has created File records for all paths.
    Files are grouped by (directory, basename) so RAW+JPEG pairs are processed together.
    
    Args:
        user: The owner of the files
        file_paths: List of file paths that share the same (directory, basename)
        job_id: Job ID for logging and progress tracking
    """
    try:
        start = datetime.datetime.now()
        
        # Get or create File records for all paths
        files = []
        for path in file_paths:
            file = create_file_record(user, path)
            if file:
                files.append(file)
        
        if not files:
            util.logger.warning(f"job {job_id}: No valid files in group: {file_paths}")
            return
        
        # Group files into a Photo
        photo = group_files_into_photo(user, files, job_id)
        
        if not photo:
            util.logger.warning(f"job {job_id}: Could not create photo for files: {file_paths}")
            return
        
        elapsed = (datetime.datetime.now() - start).total_seconds()
        util.logger.info(f"job {job_id}: created photo with {len(files)} files, elapsed: {elapsed}")
        
        # Process the photo (thumbnails, EXIF, etc.) using main_file
        if photo.main_file:
            _process_photo(photo, photo.main_file.path, job_id, start)

    except Exception as e:
        try:
            util.logger.exception(
                f"job {job_id}: could not process file group {file_paths}. reason: {str(e)}"
            )
        except Exception:
            util.logger.exception(f"job {job_id}: could not process file group")
    finally:
        update_scan_counter(job_id)


def _process_photo(photo: Photo, path: str, job_id, start: datetime.datetime):
    """
    Process a photo: generate thumbnails, extract EXIF, calculate hashes, etc.
    
    This is the common processing logic shared between handle_new_image and handle_file_group.
    
    Args:
        photo: The Photo object to process
        path: The main file path (for logging)
        job_id: Job ID for logging
        start: Start time for elapsed time calculation
    """
    util.logger.info(f"job {job_id}: handling image {path}")
    
    # Create or get thumbnail instance
    thumbnail, _ = Thumbnail.objects.get_or_create(photo=photo)
    thumbnail._generate_thumbnail()
    elapsed = (datetime.datetime.now() - start).total_seconds()
    util.logger.info(
        f"job {job_id}: generate thumbnails: {path}, elapsed: {elapsed}"
    )
    
    thumbnail._calculate_aspect_ratio()
    elapsed = (datetime.datetime.now() - start).total_seconds()
    util.logger.info(
        f"job {job_id}: calculate aspect ratio: {path}, elapsed: {elapsed}"
    )
    
    # Calculate perceptual hash for duplicate detection
    if thumbnail.thumbnail_big and os.path.exists(thumbnail.thumbnail_big.path):
        phash = calculate_hash_from_thumbnail(thumbnail.thumbnail_big.path)
        if phash:
            photo.perceptual_hash = phash
            photo.save(update_fields=["perceptual_hash"])
            elapsed = (datetime.datetime.now() - start).total_seconds()
            util.logger.info(
                f"job {job_id}: calculate perceptual hash: {path}, elapsed: {elapsed}"
            )
    
    from api.models.photo_metadata import PhotoMetadata
    PhotoMetadata.extract_exif_data(photo, commit=True)
    elapsed = (datetime.datetime.now() - start).total_seconds()
    util.logger.info(
        f"job {job_id}: extract exif data: {path}, elapsed: {elapsed}"
    )

    photo._extract_date_time_from_exif(True)
    elapsed = (datetime.datetime.now() - start).total_seconds()
    util.logger.info(
        f"job {job_id}: extract date time: {path}, elapsed: {elapsed}"
    )
    
    thumbnail._get_dominant_color()
    elapsed = (datetime.datetime.now() - start).total_seconds()
    util.logger.info(
        f"job {job_id}: get dominant color: {path}, elapsed: {elapsed}"
    )
    
    search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)
    search_instance.recreate_search_captions()
    search_instance.save()
    elapsed = (datetime.datetime.now() - start).total_seconds()
    util.logger.info(
        f"job {job_id}: search caption recreated: {path}, elapsed: {elapsed}"
    )


================================================
FILE: api/directory_watcher/processing_jobs.py
================================================
"""
Photo processing jobs (tags, geolocation, faces).

These jobs run after the main scan to enrich photos with additional
metadata like location information, image tags, and face detection.
"""

import traceback
import uuid
from uuid import UUID

from django import db
from django.db.models import Q
from django_q.tasks import AsyncTask

from api import util
from api.face_classify import cluster_all_faces
from api.models import Face, LongRunningJob, Photo
from api.models.photo_caption import PhotoCaption
from api.directory_watcher.utils import update_scan_counter


def generate_face_embeddings(user, job_id: UUID):
    """
    Generate face embeddings for faces that don't have them yet.
    
    Args:
        user: The user whose faces to process
        job_id: Job ID for tracking progress
    """
    if Face.objects.filter(encoding="").count() == 0:
        return
    
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_GENERATE_FACE_EMBEDDINGS,
        job_id=job_id,
    )

    try:
        faces = Face.objects.filter(encoding="")
        lrj.update_progress(current=0, target=faces.count())
        db.connections.close_all()

        for face in faces:
            failed = False
            error = None
            try:
                face.generate_encoding()
            except Exception as err:
                util.logger.exception("An error occurred: ")
                print(f"[ERR]: {err}")
                failed = True
                error_msg = f"Face {face.id}: {str(err)}\n{traceback.format_exc()}"
                error = error_msg
            update_scan_counter(job_id, failed, error)

        lrj.complete()

    except Exception as err:
        util.logger.exception("An error occurred: ")
        print(f"[ERR]: {err}")
        lrj.fail(error=err)


def generate_tags(user, job_id: UUID, full_scan=False):
    """
    Generate image tags (Places365 captions) for photos.
    
    Args:
        user: The user whose photos to process
        job_id: Job ID for tracking progress
        full_scan: If True, process all photos; otherwise only new ones
    """
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_GENERATE_TAGS,
        job_id=job_id,
    )

    try:
        last_scan = (
            LongRunningJob.objects.filter(finished=True)
            .filter(job_type=LongRunningJob.JOB_GENERATE_TAGS)
            .filter(started_by=user)
            .order_by("-finished_at")
            .first()
        )
        from constance import config as site_config

        tagging_model = site_config.TAGGING_MODEL

        existing_photos = Photo.objects.filter(
            Q(owner=user.id)
            & (
                Q(caption_instance__isnull=True)
                | Q(caption_instance__captions_json__isnull=True)
                | Q(**{f"caption_instance__captions_json__{tagging_model}__isnull": True})
            )
        )
        if not full_scan and last_scan:
            existing_photos = existing_photos.filter(added_on__gt=last_scan.started_at)

        if existing_photos.count() == 0:
            lrj.update_progress(current=0, target=0)
            lrj.complete()
            return
        lrj.update_progress(current=0, target=existing_photos.count())
        db.connections.close_all()

        for photo in existing_photos:
            AsyncTask(generate_tag_job, photo, job_id).run()

    except Exception as err:
        util.logger.exception("An error occurred: ")
        print(f"[ERR]: {err}")
        lrj.fail(error=err)


def generate_tag_job(photo: Photo, job_id: str):
    """
    Worker task to generate tags for a single photo.
    
    Args:
        photo: The photo to process
        job_id: Job ID for tracking progress
    """
    failed = False
    error = None
    try:
        photo.refresh_from_db()
        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.generate_tag_captions(commit=True)
    except Exception as err:
        util.logger.exception("An error occurred: %s", photo.image_hash)
        print(f"[ERR]: {err}")
        failed = True
        error_msg = f"Photo {photo.image_hash}: {str(err)}\n{traceback.format_exc()}"
        error = error_msg
    update_scan_counter(job_id, failed, error)


def add_geolocation(user, job_id: UUID, full_scan=False):
    """
    Add geolocation data to photos based on GPS coordinates.
    
    Args:
        user: The user whose photos to process
        job_id: Job ID for tracking progress
        full_scan: If True, process all photos; otherwise only new ones
    """
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_ADD_GEOLOCATION,
        job_id=job_id,
    )

    try:
        last_scan = (
            LongRunningJob.objects.filter(finished=True)
            .filter(job_type=LongRunningJob.JOB_ADD_GEOLOCATION)
            .filter(started_by=user)
            .order_by("-finished_at")
            .first()
        )
        existing_photos = Photo.objects.filter(owner=user.id)
        if not full_scan and last_scan:
            existing_photos = existing_photos.filter(added_on__gt=last_scan.started_at)
        if existing_photos.count() == 0:
            lrj.update_progress(current=0, target=0)
            lrj.complete()
            return
        lrj.update_progress(current=0, target=existing_photos.count())
        db.connections.close_all()

        for photo in existing_photos:
            AsyncTask(geolocation_job, photo, job_id).run()

    except Exception as err:
        util.logger.exception("An error occurred: ")
        print(f"[ERR]: {err}")
        lrj.fail(error=err)


def geolocation_job(photo: Photo, job_id: UUID):
    """
    Worker task to add geolocation for a single photo.
    
    Args:
        photo: The photo to process
        job_id: Job ID for tracking progress
    """
    failed = False
    error = None
    try:
        photo.refresh_from_db()
        photo._geolocate()
        photo._add_location_to_album_dates()
    except Exception as err:
        util.logger.exception("An error occurred: ")
        failed = True
        error_msg = f"Photo {photo.image_hash}: {str(err)}\n{traceback.format_exc()}"
        error = error_msg
    update_scan_counter(job_id, failed, error)


def scan_faces(user, job_id: UUID, full_scan=False):
    """
    Detect and extract faces from photos.
    
    Args:
        user: The user whose photos to process
        job_id: Job ID for tracking progress
        full_scan: If True, process all photos; otherwise only new ones
    """
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_SCAN_FACES,
        job_id=job_id,
    )

    try:
        last_scan = (
            LongRunningJob.objects.filter(finished=True)
            .filter(job_type=LongRunningJob.JOB_SCAN_FACES)
            .filter(started_by=user)
            .order_by("-finished_at")
            .first()
        )
        existing_photos = Photo.objects.filter(
            Q(owner=user.id) & Q(thumbnail__thumbnail_big__isnull=False)
        )
        if not full_scan and last_scan:
            existing_photos = existing_photos.filter(added_on__gt=last_scan.started_at)

        if existing_photos.count() == 0:
            lrj.update_progress(current=0, target=0)
            lrj.complete()
            return

        lrj.update_progress(current=0, target=existing_photos.count())
        db.connections.close_all()

        for photo in existing_photos:
            failed = False
            error = None
            try:
                photo._extract_faces()
            except Exception as err:
                util.logger.exception("An error occurred: ")
                print(f"[ERR]: {err}")
                failed = True
                error_msg = f"Photo {photo.image_hash}: {str(err)}\n{traceback.format_exc()}"
                error = error_msg
            update_scan_counter(job_id, failed, error)
    except Exception as err:
        util.logger.exception("An error occurred: ")
        print(f"[ERR]: {err}")
        lrj.fail(error=err)

    generate_face_embeddings(user, uuid.uuid4())
    cluster_all_faces(user, uuid.uuid4())


================================================
FILE: api/directory_watcher/repair_jobs.py
================================================
"""
Repair jobs for fixing ungrouped file variants.

This module contains jobs that repair data inconsistencies, such as
RAW files that weren't properly grouped with their JPEG counterparts
due to race conditions in previous scans.
"""

from uuid import UUID

from api import util
from api.models import File, LongRunningJob, Photo
from api.directory_watcher.file_grouping import find_matching_jpeg_photo


def repair_ungrouped_file_variants(user, job_id: UUID):
    """
    Post-scan job to fix any ungrouped file variants.
    
    This handles:
    1. Race conditions from previous scans where RAW+JPEG weren't grouped
    2. Rescans where files were added incrementally
    3. Any orphaned RAW/metadata files that should be attached to existing Photos
    
    Strategy: Find Photos with RAW-only main_file, look for matching JPEG Photos,
    merge the RAW file into the JPEG Photo and delete the RAW-only Photo.
    
    Args:
        user: The user whose photos to repair
        job_id: Job ID for tracking progress
    """
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_REPAIR_FILE_VARIANTS,
        job_id=job_id,
    )
    
    try:
        # Find Photos where main_file is RAW (potential orphans)
        raw_only_photos = Photo.objects.filter(
            owner=user,
            main_file__type=File.RAW_FILE
        )
        
        lrj.update_progress(current=0, target=raw_only_photos.count())
        
        merged_count = 0
        fixed_main_file_count = 0
        
        for raw_photo in raw_only_photos:
            if not raw_photo.main_file:
                continue
                
            # Check if this RAW photo has any IMAGE files (already grouped)
            has_image = raw_photo.files.filter(type=File.IMAGE).exists()
            if has_image:
                # Already properly grouped, just fix main_file priority
                image_file = raw_photo.files.filter(type=File.IMAGE).first()
                if image_file:
                    raw_photo.main_file = image_file
                    raw_photo.video = False
                    raw_photo.save(update_fields=['main_file', 'video'])
                    fixed_main_file_count += 1
                continue
            
            # Look for matching JPEG Photo
            jpeg_photo = find_matching_jpeg_photo(raw_photo.main_file.path, user)
            if jpeg_photo and jpeg_photo.id != raw_photo.id:
                # Merge: move all files from RAW photo to JPEG photo
                for f in raw_photo.files.all():
                    if not jpeg_photo.files.filter(hash=f.hash).exists():
                        jpeg_photo.files.add(f)
                
                jpeg_photo.save()
                
                # Delete the orphaned RAW-only photo
                raw_photo.delete()
                merged_count += 1
                util.logger.info(
                    f"job {job_id}: Merged RAW photo into JPEG photo {jpeg_photo.image_hash}"
                )
        
        util.logger.info(
            f"job {job_id}: Repaired {merged_count} ungrouped file variants, "
            f"fixed {fixed_main_file_count} main_file priorities"
        )
        lrj.complete()
        
    except Exception as e:
        util.logger.exception(f"job {job_id}: Error repairing file variants: {e}")
        lrj.fail(error=e)


================================================
FILE: api/directory_watcher/scan_jobs.py
================================================
"""
Main scan jobs for photo discovery and processing.

This module contains the core scan_photos function that implements the
two-phase scan architecture to avoid race conditions with RAW+JPEG grouping.
"""

import datetime
import os
import uuid
from collections import defaultdict
from uuid import UUID

import pytz
from django import db
from django.conf import settings
from django.core.paginator import Paginator
from django.db.models import F, Q
from django.utils import timezone
from django_q.tasks import AsyncTask, Chain

from api import util
from api.metadata.reader import get_sidecar_files_in_priority_order
from api.batch_jobs import batch_calculate_clip_embedding
from api.models import LongRunningJob, Photo, Thumbnail
from api.models.file import is_metadata

from api.directory_watcher.file_grouping import get_file_grouping_key
from api.directory_watcher.file_handlers import handle_new_image, handle_file_group
from api.directory_watcher.processing_jobs import (
    generate_tags,
    add_geolocation,
    scan_faces,
)
from api.directory_watcher.repair_jobs import repair_ungrouped_file_variants
from api.directory_watcher.utils import (
    walk_directory,
    walk_files,
    update_scan_counter,
)


def _file_was_modified_after(filepath, time):
    """Check if a file was modified after a given time."""
    try:
        modified = os.path.getmtime(filepath)
    except OSError:
        return False
    return datetime.datetime.fromtimestamp(modified).replace(tzinfo=pytz.utc) > time


def wait_for_group_and_process_metadata(
    group_id: str,
    metadata_paths: list[str],
    user_id: int,
    full_scan: bool,
    job_id: UUID | str,
    expected_count: int,
    *,
    attempt: int = 1,
    max_attempts: int = 2,
    **kwargs,  # Django-Q may pass additional arguments like 'schedule'
):
    """
    Sentinel task: waits until the expected number of image/video tasks in the group complete,
    then processes metadata files. It runs inside a django-q worker (non-blocking for the caller).

    Failure handling:
    - If the group is not complete yet, it will re-enqueue itself up to `max_attempts`.
    - After exhausting attempts, it proceeds with metadata processing anyway (best-effort).
    """
    from django_q.tasks import count_group
    from django.contrib.auth import get_user_model

    util.logger.info(
        f"Sentinel attempt {attempt}/{max_attempts} for group {group_id} (expecting {expected_count} tasks)"
    )

    # Check current completion count for the group
    try:
        completed = count_group(group_id)  # counts successes by default
    except Exception as e:
        util.logger.warning(
            f"Could not read group status for {group_id}: {e}. Treating as incomplete."
        )
        completed = 0

    # Normalize to an int to avoid None-related type issues
    completed_int = int(completed or 0)

    if completed_int < expected_count and attempt < max_attempts:
        util.logger.info(
            f"Group {group_id} not complete yet: {completed_int}/{expected_count}. Re-enqueue sentinel (attempt {attempt + 1})."
        )
        # Requeue the sentinel to check again later
        AsyncTask(
            wait_for_group_and_process_metadata,
            group_id,
            metadata_paths,
            user_id,
            full_scan,
            job_id,
            expected_count,
            attempt=attempt + 1,
            max_attempts=max_attempts,
            schedule=datetime.timedelta(seconds=5),
        ).run()
        return

    # Proceed with metadata processing (either completed or after exhausting attempts)
    if completed_int < expected_count:
        util.logger.warning(
            f"Proceeding with metadata despite incomplete image group {group_id}: {completed_int}/{expected_count}."
        )
    else:
        util.logger.info(
            f"Image group {group_id} completed. Processing {len(metadata_paths)} metadata files"
        )

    if not metadata_paths:
        util.logger.info("No metadata files to process after images completion")
        return

    User = get_user_model()
    try:
        user = User.objects.get(id=user_id)
    except User.DoesNotExist:
        util.logger.warning(
            f"User {user_id} not found when processing metadata for job {job_id}"
        )
        return

    last_scan = (
        LongRunningJob.objects.filter(finished=True)
        .filter(job_type=LongRunningJob.JOB_SCAN_PHOTOS)
        .filter(started_by=user)
        .order_by("-finished_at")
        .first()
    )

    for path in metadata_paths:
        try:
            photo_scanner(user, last_scan, full_scan, path, job_id)
        except Exception as e:
            util.logger.exception(
                f"Failed processing metadata {path} for job {job_id}: {e}"
            )


def photo_scanner(user, last_scan, full_scan, path, job_id):
    """
    Check if a single file needs processing and queue it.

    Used primarily for metadata files after the main scan.
    """
    files_to_check = [path]
    files_to_check.extend(get_sidecar_files_in_priority_order(path))
    if (
        not Photo.objects.filter(files__path=path).exists()
        or full_scan
        or not last_scan
        or any(
            [_file_was_modified_after(p, last_scan.finished_at) for p in files_to_check]
        )
    ):
        # Queue processing for this file. Metadata is queued here without grouping on purpose,
        # because grouping is managed at the higher-level scan phase to ensure images complete first.
        AsyncTask(handle_new_image, user, path, job_id).run()
    else:
        update_scan_counter(job_id)


def scan_photos(user, full_scan, job_id, scan_directory="", scan_files=[]):
    """
    Two-phase scan to avoid race conditions with RAW+JPEG grouping.

    Phase 1: Collect all files and group by (directory, basename)
             - IMG_001.jpg, IMG_001.CR2, IMG_001.xmp -> one group
             - IMG_002.jpg -> separate group

    Phase 2: Process each group sequentially, creating one Photo per group
             with all file variants attached.

    This eliminates the race condition where concurrent processing of
    RAW and JPEG files could create separate Photos.

    Args:
        user: The user performing the scan
        full_scan: If True, rescan all files; otherwise only new/modified
        job_id: Job ID for tracking progress
        scan_directory: Directory to scan (defaults to user's scan_directory)
        scan_files: Optional list of specific files to scan
    """
    thumbnail_dirs = [
        os.path.join(settings.MEDIA_ROOT, "square_thumbnails_small"),
        os.path.join(settings.MEDIA_ROOT, "square_thumbnails"),
        os.path.join(settings.MEDIA_ROOT, "thumbnails_big"),
    ]
    for directory in thumbnail_dirs:
        os.makedirs(directory, exist_ok=True)

    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_SCAN_PHOTOS,
        job_id=job_id,
    )
    photo_count_before = Photo.objects.count()

    try:
        if scan_directory == "":
            scan_directory = user.scan_directory
        photo_list = []
        if scan_files:
            walk_files(scan_files, photo_list)
        else:
            walk_directory(scan_directory, photo_list)
        files_found = len(photo_list)
        last_scan = (
            LongRunningJob.objects.filter(finished=True)
            .filter(job_type=1)
            .filter(started_by=user)
            .order_by("-finished_at")
            .first()
        )

        # === PHASE 1: Group files by (directory, basename) ===
        # This ensures RAW+JPEG pairs are processed together, eliminating race conditions
        file_groups: dict[tuple[str, str], list[str]] = defaultdict(list)
        metadata_paths: list[str] = []

        for path in photo_list:
            if is_metadata(path):
                # Metadata files are processed after their parent photos exist
                metadata_paths.append(path)
            else:
                # Group by (directory, basename_lowercase)
                group_key = get_file_grouping_key(path)
                file_groups[group_key].append(path)

        # Determine which groups need processing
        groups_to_process: list[tuple[tuple[str, str], list[str]]] = []

        for group_key, paths in file_groups.items():
            # Check if any file in this group needs processing
            needs_processing = False

            for path in paths:
                files_to_check = [path]
                files_to_check.extend(get_sidecar_files_in_priority_order(path))

                if (
                    not Photo.objects.filter(files__path=path).exists()
                    or full_scan
                    or not last_scan
                    or any(
                        [
                            _file_was_modified_after(p, last_scan.finished_at)
                            for p in files_to_check
                        ]
                    )
                ):
                    needs_processing = True
                    break

            if needs_processing:
                groups_to_process.append((group_key, paths))

        # Progress target is number of groups (not individual files)
        # Each group = one Photo with potentially multiple file variants
        total_groups = len(groups_to_process) + len(metadata_paths)
        lrj.update_progress(current=0, target=total_groups)
        db.connections.close_all()

        util.logger.info(
            f"Grouped {files_found} files into {len(file_groups)} groups, {len(groups_to_process)} need processing"
        )

        # === PHASE 2: Process each file group ===
        # Process groups sequentially to avoid race conditions
        # Each group creates one Photo with all file variants
        image_group_id = str(uuid.uuid4())

        for group_key, paths in groups_to_process:
            AsyncTask(
                handle_file_group,
                user,
                paths,
                job_id,
                group=image_group_id,
            ).run()

        # If there are only metadata files (no image groups queued), process metadata now
        if not groups_to_process and metadata_paths:
            util.logger.info(
                f"No images to process, processing {len(metadata_paths)} metadata files directly"
            )
            for path in metadata_paths:
                photo_scanner(user, last_scan, full_scan, path, job_id)

        # If there are images and metadata, enqueue a sentinel task that waits for the image group
        if groups_to_process and metadata_paths:
            util.logger.info(
                f"Scheduling sentinel to process {len(metadata_paths)} metadata files after {len(groups_to_process)} image groups"
            )
            AsyncTask(
                wait_for_group_and_process_metadata,
                image_group_id,
                metadata_paths,
                user.id,
                full_scan,
                job_id,
                len(groups_to_process),
                attempt=1,
                max_attempts=2,
            ).run()

        util.logger.info(f"Scanned {files_found} files in : {scan_directory}")

        # If no files were queued for processing (empty directory or all files already processed),
        # mark the job as finished immediately since progress_current will equal progress_target (both 0)
        LongRunningJob.objects.filter(
            job_id=job_id, progress_current=F("progress_target")
        ).update(finished=True, finished_at=timezone.now())

        util.logger.info("Finished updating album things")

        # Check for photos with missing aspect ratios but existing thumbnails
        photos_with_missing_aspect_ratio = Photo.objects.filter(
            Q(owner=user.id)
            & Q(thumbnail__isnull=False)
            & Q(thumbnail__thumbnail_big__isnull=False)
            & Q(thumbnail__aspect_ratio__isnull=True)
        )
        if photos_with_missing_aspect_ratio.exists():
            util.logger.info(
                f"Found {photos_with_missing_aspect_ratio.count()} photos with missing aspect ratios"
            )
            for photo in photos_with_missing_aspect_ratio:
                try:
                    thumbnail = getattr(photo, "thumbnail", None)
                    if thumbnail and isinstance(thumbnail, Thumbnail):
                        thumbnail._calculate_aspect_ratio()
                except Exception as e:
                    util.logger.exception(
                        f"Could not calculate aspect ratio for photo {photo.image_hash}: {str(e)}"
                    )

        # if the scan type is not the default user scan directory, or if it is specified as only scanning
        # specific files, there is no need to rescan fully for missing photos.
        if full_scan or (scan_directory == user.scan_directory and not scan_files):
            AsyncTask(scan_missing_photos, user, uuid.uuid4()).run()

        # Run repair job to fix any previously ungrouped file variants
        # This handles race conditions from previous scans and incremental adds
        AsyncTask(repair_ungrouped_file_variants, user, uuid.uuid4()).run()

        AsyncTask(generate_tags, user, uuid.uuid4(), full_scan).run()
        AsyncTask(add_geolocation, user, uuid.uuid4(), full_scan).run()

        # The scan faces job will have issues if the embeddings haven't been generated before it runs
        chain = Chain()
        chain.append(batch_calculate_clip_embedding, user)
        chain.append(scan_faces, user, uuid.uuid4(), full_scan)
        chain.run()

    except Exception as e:
        util.logger.exception("An error occurred: ")
        lrj.fail(error=e)

    added_photo_count = Photo.objects.count() - photo_count_before
    util.logger.info(f"Added {added_photo_count} photos")


def scan_missing_photos(user, job_id: UUID):
    """
    Scan for photos whose files no longer exist on disk.

    Args:
        user: The user whose photos to check
        job_id: Job ID for tracking progress
    """
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_SCAN_MISSING_PHOTOS,
        job_id=job_id,
    )
    try:
        existing_photos = Photo.objects.filter(owner=user.id).order_by("image_hash")

        paginator = Paginator(existing_photos, 5000)
        lrj.update_progress(current=0, target=paginator.num_pages)
        for page in range(1, paginator.num_pages + 1):
            for existing_photo in paginator.page(page).object_list:
                existing_photo._check_files()

            update_scan_counter(job_id)

        util.logger.info("Finished checking paths for missing photos")
    except Exception as e:
        util.logger.exception("An error occurred: ")
        lrj.fail(error=e)


================================================
FILE: api/directory_watcher/utils.py
================================================
"""
Utility functions for directory scanning and job management.
"""

import os
import stat

from constance import config as site_config
from django.db.models import F
from django.utils import timezone

from api.models import LongRunningJob


def should_skip(path):
    """Check if a path should be skipped based on configured patterns."""
    if not site_config.SKIP_PATTERNS:
        return False

    skip_patterns = site_config.SKIP_PATTERNS
    skip_list = skip_patterns.split(",")
    skip_list = map(str.strip, skip_list)

    res = [ele for ele in skip_list if (ele in path)]
    return bool(res)


if os.name == "Windows":

    def is_hidden(path):
        """Check if a file is hidden (Windows version)."""
        name = os.path.basename(os.path.abspath(path))
        return name.startswith(".") or _has_hidden_attribute(path)

    def _has_hidden_attribute(path):
        """Check if file has Windows hidden attribute."""
        try:
            return bool(os.stat(path).st_file_attributes & stat.FILE_ATTRIBUTE_HIDDEN)
        except Exception:
            return False

else:

    def is_hidden(path):
        """Check if a file is hidden (Unix version - starts with dot)."""
        return os.path.basename(path).startswith(".")


def walk_directory(directory, callback):
    """
    Recursively walk a directory and collect file paths.
    
    Args:
        directory: Directory to scan
        callback: List to append file paths to
    """
    for file in os.scandir(directory):
        fpath = os.path.join(directory, file)
        if not is_hidden(fpath) and not should_skip(fpath):
            if os.path.isdir(fpath):
                walk_directory(fpath, callback)
            else:
                callback.append(fpath)


def walk_files(scan_files, callback):
    """
    Walk a list of specific files.
    
    Args:
        scan_files: List of file paths to check
        callback: List to append valid file paths to
    """
    for fpath in scan_files:
        if os.path.isfile(fpath):
            callback.append(fpath)


def update_scan_counter(job_id, failed=False, error=None):
    """
    Update the progress counter for a long-running job.
    
    Increments progress_current and marks job as finished when complete.
    Also tracks errors for failed items.
    
    Args:
        job_id: The job ID to update
        failed: Whether this item failed processing
        error: Error message if failed
    """
    # Increment the current progress and get the updated job
    LongRunningJob.objects.filter(job_id=job_id).update(
        progress_current=F("progress_current") + 1
    )
    
    # Refetch the job to get the updated progress_current value
    job = LongRunningJob.objects.filter(job_id=job_id).first()
    if not job:
        return

    # Mark the job as finished if the current progress equals the target
    if job.progress_current >= job.progress_target:
        # Job is finishing, update result with errors if any
        result = job.result or {}
        if failed or error:
            result["status"] = "failed"
            if "errors" not in result:
                result["errors"] = []
            if error:
                error_str = str(error)
                # Avoid duplicate errors
                if error_str not in result["errors"]:
                    result["errors"].append(error_str)
            # Set main error field for backward compatibility
            if "error" not in result and error:
                result["error"] = str(error)
            elif "error" not in result and result.get("errors"):
                result["error"] = result["errors"][0]  # Use first error as main error
        job.finished = True
        job.finished_at = timezone.now()
        if failed:
            job.failed = True
        job.result = result
        job.save(update_fields=["finished", "finished_at", "failed", "result"])
    else:
        # Job is still running, accumulate errors in result
        if failed or error:
            job = LongRunningJob.objects.filter(job_id=job_id).first()
            if job:
                result = job.result or {}
                result["status"] = "partial_failure" if not job.finished else "failed"
                if "errors" not in result:
                    result["errors"] = []
                if error:
                    error_str = str(error)
                    # Avoid duplicate errors (limit to last 100 to prevent unbounded growth)
                    if error_str not in result["errors"]:
                        result["errors"].append(error_str)
                        if len(result["errors"]) > 100:
                            result["errors"] = result["errors"][-100:]  # Keep last 100 errors
                # Set main error field for backward compatibility
                if "error" not in result and error:
                    result["error"] = str(error)
                elif "error" not in result and result.get("errors"):
                    result["error"] = result["errors"][0]  # Use first error as main error
                job.result = result
                job.failed = failed or job.failed
                job.save(update_fields=["failed", "result"])


================================================
FILE: api/drf_optimize.py
================================================
from django.db import ProgrammingError, models
from django.db.models.constants import LOOKUP_SEP
from django.db.models.query import normalize_prefetch_lookups
from rest_framework import serializers
from rest_framework.utils import model_meta


class OptimizeRelatedModelViewSetMetaclass(type):
    """This metaclass optimizes the queryset using `prefetch_related` and `select_related`.

    Any attribute of `_base_forward_rel` as attributes on either the class or on
    any of its superclasses will be include in the `base_forward_rel`
    they must be ForeignKey fields and only those will be included.

    If the `serializer_class` attribute is an instance of `serializers.ModelSerializer`
    included as an attribute on the class the `serializers.ModelSerializer.Meta.fields`
    is also added calling prefetch_related on Many-To-One and Many-To-Many related objects.
    """

    @classmethod
    def get_many_to_many_rel(cls, info, meta_fields):
        many_to_many_fields = [
            field_name
            for field_name, relation_info in info.relations.items()
            if relation_info.to_many
        ]
        many_to_many_lookups = []
        for lookup_name, lookup in cls.get_lookups(meta_fields):
            if lookup_name in many_to_many_fields:
                many_to_many_lookups.append(lookup)

        return many_to_many_lookups

    @classmethod
    def get_lookups(cls, fields, strict=False):
        field_lookups = [(lookup.split(LOOKUP_SEP, 1)[0], lookup) for lookup in fields]
        if strict:
            field_lookups = [f for f in field_lookups if LOOKUP_SEP in f[1]]
        return field_lookups

    @classmethod
    def get_many_to_one_rel(cls, info, meta_fields):
        try:
            fields = [
                field_name
                for field_name, relation_info in info.forward_relations.items()
                if issubclass(type(relation_info[0]), models.ForeignKey)
            ]
        except IndexError:
            pass
        else:
            if fields:
                forward_many_to_many_rel = []
                for lookup_name, lookup in cls.get_lookups(meta_fields, strict=True):
                    if lookup_name in fields:
                        forward_many_to_many_rel.append(lookup)
                return forward_many_to_many_rel
        return []

    @classmethod
    def get_forward_rel(cls, info, meta_fields):
        return [
            field_name
            for field_name, relation_info in info.forward_relations.items()
            if field_name in meta_fields and not relation_info.to_many
        ]

    def __new__(cls, name, bases, attrs):
        serializer_class = attrs.get("serializer_class", None)
        many_to_many_fields = many_to_one_fields = related_fields = []

        info = None
        base_forward_rel = list(attrs.pop("_base_forward_rel", ()))

        for base in reversed(bases):
            if hasattr(base, "_base_forward_rel"):
                base_forward_rel.extend(list(base._base_forward_rel))
        if serializer_class and issubclass(
            serializer_class, serializers.ModelSerializer
        ):
            base_forward_rel.extend(
                list(getattr(serializer_class, "_related_fields", [])),
            )
            many_to_many_fields.extend(
                list(getattr(serializer_class, "_many_to_many_fields", [])),
            )
            many_to_one_fields.extend(
                list(getattr(serializer_class, "_many_to_one_fields", [])),
            )
            if hasattr(serializer_class.Meta, "model"):
                info = model_meta.get_field_info(serializer_class.Meta.model)
                meta_fields = list(serializer_class.Meta.fields)
                many_to_many_fields.extend(meta_fields)
                many_to_one_fields.extend(meta_fields)
                base_forward_rel.extend(meta_fields)

        if info is not None:
            many_to_many_fields = cls.get_many_to_many_rel(
                info, set(many_to_many_fields)
            )
            many_to_one_fields = cls.get_many_to_one_rel(info, set(many_to_one_fields))
            related_fields = cls.get_forward_rel(info, set(base_forward_rel))

        queryset = attrs.get("queryset", None)
        try:
            if queryset:
                if many_to_many_fields:
                    queryset = queryset.prefetch_related(
                        *normalize_prefetch_lookups(
                            set(many_to_many_fields + many_to_one_fields)
                        ),
                    )
                if related_fields:
                    queryset = queryset.select_related(*related_fields)
                attrs["queryset"] = queryset.all()
        except ProgrammingError:
            pass
        return super(OptimizeRelatedModelViewSetMetaclass, cls).__new__(
            cls, name, bases, attrs
        )


================================================
FILE: api/duplicate_detection.py
================================================
"""
Duplicate detection module for finding duplicate photos.

Handles two types of duplicates:
- EXACT_COPY: Files with identical MD5 hash (byte-for-byte copies)
- VISUAL_DUPLICATE: Photos with similar perceptual hash

This is separate from stack detection (RAW+JPEG pairs, bursts, etc.)
because duplicates are about storage cleanup, not photo organization.

Optimized with BK-Tree for efficient visual duplicate detection.

Memory Optimizations (v2):
- detect_exact_copies: Uses database aggregation (GROUP BY) instead of loading
  all photos into memory. Only photo IDs are loaded, not full objects.
- detect_visual_duplicates: Processes photos in configurable batches (default 10k).
  Uses two-pass algorithm: within-batch BK-Tree search, then cross-batch linear scan.
  Memory usage: O(batch_size) instead of O(total_photos).

With 300k photos:
- Old: ~10GB+ RAM (all photos + files + large BK-Tree)
- New: ~100-200MB RAM (batch + hash list only)
"""

from collections import defaultdict

from django.db.models import Q

from api.models import Photo
from api.models.duplicate import Duplicate
from api.models.file import File
from api.models.long_running_job import LongRunningJob
from api.perceptual_hash import DEFAULT_HAMMING_THRESHOLD, hamming_distance
from api.util import logger


class BKTree:
    """
    Burkhard-Keller Tree for efficient Hamming distance queries.

    Achieves O(log n) average case by pruning branches using triangle inequality.
    """

    def __init__(self, distance_func):
        self.distance = distance_func
        self.root = None
        self.size = 0

    def add(self, item_id, item_hash):
        """Add an item (id, hash) to the tree."""
        self.size += 1
        if self.root is None:
            self.root = {"id": item_id, "hash": item_hash, "children": {}}
            return

        node = self.root
        while True:
            dist = self.distance(item_hash, node["hash"])
            if dist in node["children"]:
                node = node["children"][dist]
            else:
                node["children"][dist] = {
                    "id": item_id,
                    "hash": item_hash,
                    "children": {},
                }
                break

    def search(self, query_hash, threshold):
        """Find all items within threshold Hamming distance of query."""
        if self.root is None:
            return []

        results = []
        candidates = [self.root]

        while candidates:
            node = candidates.pop()
            dist = self.distance(query_hash, node["hash"])

            if dist <= threshold:
                results.append((node["id"], dist))

            min_dist = max(0, dist - threshold)
            max_dist = dist + threshold

            for d, child in node["children"].items():
                if min_dist <= d <= max_dist:
                    candidates.append(child)

        return results


class UnionFind:
    """Union-Find with path compression and union by rank."""

    def __init__(self):
        self.parent = {}
        self.rank = {}

    def find(self, x):
        if x not in self.parent:
            self.parent[x] = x
            self.rank[x] = 0
            return x
        if self.parent[x] != x:
            self.parent[x] = self.find(self.parent[x])
        return self.parent[x]

    def union(self, x, y):
        px, py = self.find(x), self.find(y)
        if px == py:
            return
        if self.rank[px] < self.rank[py]:
            px, py = py, px
        self.parent[py] = px
        if self.rank[px] == self.rank[py]:
            self.rank[px] += 1

    def get_groups(self):
        groups = defaultdict(list)
        for item in self.parent:
            groups[self.find(item)].append(item)
        return [group for group in groups.values() if len(group) > 1]


def detect_exact_copies(user, progress_callback=None):
    """
    Detect exact file copies for a user.

    Groups photos that have the same content hash. Uses database aggregation
    to efficiently find duplicate groups without loading all photos into memory.

    Memory optimized: Uses database GROUP BY instead of Python dictionaries.

    Args:
        user: The user whose photos to analyze
        progress_callback: Optional callback(current, total, found) for progress

    Returns:
        Number of duplicate groups created
    """
    from django.db.models import Count

    # Method 1: Find duplicate groups by Photo.image_hash using database aggregation
    # This is memory efficient as we only load photo IDs grouped by hash
    image_hash_groups = (
        Photo.objects.filter(
            Q(owner=user)
            & Q(hidden=False)
            & Q(in_trashcan=False)
            & Q(removed=False)
            & Q(image_hash__isnull=False)
        )
        .values("image_hash")
        .annotate(count=Count("id"))
        .filter(count__gt=1)
        .values_list("image_hash", flat=True)
    )

    # Method 2: Find duplicate groups by File content hash (MD5 part)
    # We need to use a SUBSTRING operation to extract the MD5 part
    # This is done via raw SQL for efficiency
    from django.db import connection

    file_hash_duplicates = []
    with connection.cursor() as cursor:
        # Extract first 32 chars (MD5) from File.hash and find duplicates
        # Only consider non-metadata files
        cursor.execute(
            """
            SELECT SUBSTRING(f.hash, 1, 32) as content_hash
            FROM api_file f
            INNER JOIN api_photo_files pf ON pf.file_id = f.hash
            INNER JOIN api_photo p ON p.id = pf.photo_id
            WHERE p.owner_id = %s 
                AND p.hidden = FALSE 
                AND p.in_trashcan = FALSE
                AND p.removed = FALSE
                AND f.type != %s
            GROUP BY SUBSTRING(f.hash, 1, 32)
            HAVING COUNT(DISTINCT p.id) > 1
        """,
            [user.id, File.METADATA_FILE],
        )

        file_hash_duplicates = [row[0] for row in cursor.fetchall()]

    # Use Union-Find to merge overlapping groups
    uf = UnionFind()

    # Process image_hash groups
    # Note: We need to iterate through the queryset, which will load the hashes into memory
    # But this is much better than loading all photos with files
    image_hash_list = list(image_hash_groups)  # Load just the hashes
    total_image_groups = len(image_hash_list)

    for i, image_hash in enumerate(image_hash_list):
        # Only load photo IDs, not full Photo objects
        photo_ids = list(
            Photo.objects.filter(
                owner=user,
                image_hash=image_hash,
                hidden=False,
                in_trashcan=False,
                removed=False,
            ).values_list("id", flat=True)
        )

        if len(photo_ids) >= 2:
            first = photo_ids[0]
            for pid in photo_ids[1:]:
                uf.union(first, pid)

        if progress_callback and i % 100 == 0:
            progress_callback(i, total_image_groups * 2, 0)

    # Process file_hash groups
    for i, content_hash in enumerate(file_hash_duplicates):
        # Find photos with files matching this content hash
        photo_ids = list(
            Photo.objects.filter(
                owner=user,
                hidden=False,
                in_trashcan=False,
                removed=False,
                files__hash__startswith=content_hash,
            )
            .exclude(files__type=File.METADATA_FILE)
            .distinct()
            .values_list("id", flat=True)
        )

        if len(photo_ids) >= 2:
            first = photo_ids[0]
            for pid in photo_ids[1:]:
                uf.union(first, pid)

        if progress_callback and i % 100 == 0:
            progress_callback(total_image_groups + i, total_image_groups * 2, 0)

    # Get merged groups from Union-Find
    merged_groups = uf.get_groups()

    duplicates_created = 0
    total = len(merged_groups)

    for i, photo_id_group in enumerate(merged_groups):
        if len(photo_id_group) < 2:
            continue

        # Get Photo objects for this group
        group_photos = Photo.objects.filter(id__in=photo_id_group)

        # Create or merge duplicate group using the helper method
        duplicate = Duplicate.create_or_merge(
            owner=user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=group_photos,
        )

        if duplicate:
            duplicates_created += 1

        if progress_callback and i % 100 == 0:
            progress_callback(i, total, duplicates_created)

    logger.info(
        f"Exact copy detection for {user.username}: found {duplicates_created} duplicate groups"
    )
    return duplicates_created


def detect_visual_duplicates(
    user, threshold=DEFAULT_HAMMING_THRESHOLD, progress_callback=None, batch_size=10000
):
    """
    Detect visually similar photos using perceptual hash.

    Memory optimized: Processes photos in batches to avoid loading all data into memory.
    Uses a two-pass approach for complete duplicate detection with bounded memory.

    Algorithm:
    1. First pass: Build BKTree in batches, find within-batch duplicates
    2. Second pass: Compare each batch against all previous batches using linear scan

    The linear scan in pass 2 is acceptable because:
    - We only store (id, hash) tuples, not full Photo objects
    - Hamming distance is very fast to compute
    - With 300k photos, we have ~300k comparisons per batch, which is fast

    Args:
        user: The user whose photos to analyze
        threshold: Hamming distance threshold (default: 10)
        progress_callback: Optional callback(current, total, found) for progress
        batch_size: Number of photos to process per batch (default: 10000)

    Returns:
        Number of duplicate groups created
    """
    # Get photos with perceptual hash that aren't already in visual duplicate groups
    # Exclude removed photos to avoid including merged/deleted duplicates
    photos_queryset = (
        Photo.objects.filter(
            Q(owner=user)
            & Q(hidden=False)
            & Q(in_trashcan=False)
            & Q(removed=False)
            & Q(perceptual_hash__isnull=False)
        )
        .exclude(duplicates__duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE)
        .only("id", "perceptual_hash")
    )

    total = photos_queryset.count()
    if total < 2:
        return 0

    logger.info(
        f"Processing {total} photos in batches of {batch_size} (user: {user.username})"
    )

    # Union-Find for grouping across all batches
    uf = UnionFind()
    pairs_found = 0
    processed = 0

    # Store all photo hashes as (id, hash) tuples for cross-batch comparison
    # Memory efficient: 300k photos × ~28 bytes = ~8.4MB theoretical
    # In practice, Python overhead means ~25-40MB for list + objects
    all_photo_hashes = []

    # Calculate number of batches
    num_batches = (total + batch_size - 1) // batch_size

    # Pass 1: Process each batch internally and build the complete hash list
    for batch_idx in range(num_batches):
        offset = batch_idx * batch_size

        # Get current batch using slicing (memory efficient)
        batch_photos = list(
            photos_queryset[offset : offset + batch_size].values(
                "id", "perceptual_hash"
            )
        )

        if not batch_photos:
            break

        logger.info(
            f"Pass 1: Processing batch {batch_idx + 1}/{num_batches} ({len(batch_photos)} photos)"
        )

        # Build temporary BK-Tree for current batch (for efficient within-batch search)
        batch_tree = BKTree(hamming_distance)
        batch_hashes = []

        for photo in batch_photos:
            photo_id = photo["id"]
            phash = photo["perceptual_hash"]

            if phash:
                batch_tree.add(photo_id, phash)
                batch_hashes.append((photo_id, phash))

        # Find duplicates within current batch using BK-Tree
        for photo_id, phash in batch_hashes:
            similar = batch_tree.search(phash, threshold)

            for similar_id, distance in similar:
                if similar_id != photo_id:
                    uf.union(photo_id, similar_id)
                    pairs_found += 1

        # Add batch to the complete list for cross-batch comparison
        all_photo_hashes.extend(batch_hashes)

        processed += len(batch_photos)

        if progress_callback:
            # Report progress for pass 1 (first 50% of total work)
            progress_callback(processed // 2, total, pairs_found)

    logger.info(
        f"Pass 1 complete. Found {pairs_found} within-batch pairs. Starting cross-batch comparison."
    )

    # Pass 2: Compare each batch against all previous photos (linear scan)
    # This ensures we don't miss duplicates between distant batches
    processed = 0

    for batch_idx in range(num_batches):
        start_idx = batch_idx * batch_size
        end_idx = min(start_idx + batch_size, len(all_photo_hashes))

        if start_idx >= end_idx:
            break

        batch_hashes = all_photo_hashes[start_idx:end_idx]

        logger.info(
            f"Pass 2: Comparing batch {batch_idx + 1}/{num_batches} against previous photos"
        )

        # Compare current batch against all previous photos
        # Store the previous photos slice once to avoid repeated slicing
        previous_hashes = all_photo_hashes[:start_idx] if start_idx > 0 else []

        for photo_id, phash in batch_hashes:
            # Only compare against photos in previous batches (avoid duplicate comparisons)
            for prev_id, prev_hash in previous_hashes:
                distance = hamming_distance(phash, prev_hash)
                if distance <= threshold:
                    uf.union(photo_id, prev_id)
                    pairs_found += 1

        processed += len(batch_hashes)

        if progress_callback:
            # Report progress for pass 2 (second 50% of total work)
            progress_callback(total // 2 + processed // 2, total, pairs_found)

    logger.info(f"Pass 2 complete. Total pairs found: {pairs_found}")

    # Create duplicate groups from Union-Find groups
    groups = uf.get_groups()
    duplicates_created = 0

    for group in groups:
        if len(group) < 2:
            continue

        # Get Photo objects for this group
        group_photos = Photo.objects.filter(id__in=group)

        # Create or merge duplicate group
        duplicate = Duplicate.create_or_merge(
            owner=user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            photos=group_photos,
        )

        if duplicate:
            duplicates_created += 1

    logger.info(
        f"Visual duplicate detection for {user.username}: found {duplicates_created} groups from {pairs_found} pairs"
    )
    return duplicates_created


def batch_detect_duplicates(user, options=None):
    """
    Run batch duplicate detection for a user.

    Args:
        user: The user whose photos to analyze
        options: Dict with detection options:
            - detect_exact_copies: bool (default: True)
            - detect_visual_duplicates: bool (default: True)
            - visual_threshold: int (default: 10)
            - clear_pending: bool (default: False)
            - batch_size: int (default: 10000) - photos per batch for visual detection
    """
    if options is None:
        options = {}

    detect_exact = options.get("detect_exact_copies", True)
    detect_visual = options.get("detect_visual_duplicates", True)
    visual_threshold = options.get("visual_threshold", DEFAULT_HAMMING_THRESHOLD)
    clear_pending = options.get("clear_pending", False)
    batch_size = options.get("batch_size", 10000)

    # Create long-running job for progress tracking
    job = LongRunningJob.create_job(
        user=user,
        job_type=LongRunningJob.JOB_DETECT_DUPLICATES,
        start_now=True,
    )

    try:
        # Clear pending duplicates if requested
        if clear_pending:
            cleared = Duplicate.objects.filter(
                owner=user, review_status=Duplicate.ReviewStatus.PENDING
            ).delete()[0]
            logger.info(f"Cleared {cleared} pending duplicates for {user.username}")

        total_found = 0

        # Detect exact copies
        if detect_exact:

            def progress_exact(current, total, found):
                job.set_result(
                    {
                        "stage": "exact_copies",
                        "current": current,
                        "total": total,
                        "found": found,
                    }
                )

            exact_count = detect_exact_copies(user, progress_exact)
            total_found += exact_count

        # Detect visual duplicates
        if detect_visual:

            def progress_visual(current, total, found):
                job.set_result(
                    {
                        "stage": "visual_duplicates",
                        "current": current,
                        "total": total,
                        "found": found,
                    }
                )

            visual_count = detect_visual_duplicates(
                user, visual_threshold, progress_visual, batch_size
            )
            total_found += visual_count

        job.complete(result={"status": "completed", "duplicates_found": total_found})

        logger.info(
            f"Duplicate detection completed for {user.username}: {total_found} groups found"
        )

    except Exception as e:
        logger.error(f"Duplicate detection failed for {user.username}: {e}")
        job.fail(error=e)
        raise


================================================
FILE: api/face_classify.py
================================================
import datetime
import uuid

import numpy as np
import seaborn as sns
from bulk_update.helper import bulk_update
from django.core.paginator import Paginator
from django.db.models import Q
from django_q.tasks import AsyncTask
from hdbscan import HDBSCAN
from sklearn.decomposition import PCA
from sklearn.neural_network import MLPClassifier

from api.cluster_manager import ClusterManager
from api.models import Face, LongRunningJob, Person
from api.models.cluster import UNKNOWN_CLUSTER_ID, Cluster, get_unknown_cluster
from api.models.user import User, get_deleted_user
from api.util import logger

FACE_CLASSIFY_COLUMNS = [
    "person",
    "classification_person",
    "classification_probability",
    "cluster_person",
    "cluster_probability",
    "id",
    "cluster",
]


def cluster_faces(user, inferred=True):
    # Fetch distinct persons associated with the user's faces
    persons = [p.id for p in Person.objects.filter(faces__photo__owner=user).distinct()]

    # Create a color mapping for each person
    p2c = dict(zip(persons, sns.color_palette(n_colors=len(persons)).as_hex()))

    face_encoding = []
    faces_with_encoding = []
    # Fetch faces that belong to the user and are not deleted
    faces = Face.objects.filter(Q(photo__owner=user) & Q(deleted=False))
    paginator = Paginator(faces, 5000)

    for page in range(1, paginator.num_pages + 1):
        for face in paginator.page(page).object_list:
            if ((not face.person) or inferred) and face.encoding:
                face_encoding.append(face.get_encoding_array())
                faces_with_encoding.append(face)

    # Return empty result if no faces with encodings
    if len(face_encoding) == 0:
        return {"status": True, "data": []}

    # Perform PCA for dimensionality reduction
    pca = PCA(n_components=3)
    vis_all = pca.fit_transform(face_encoding)

    res = []
    for face, vis in zip(faces_with_encoding, vis_all):
        person_id = face.person.id if face.person else UNKNOWN_CLUSTER_ID
        person_name = face.person.name if face.person else "unknown"

        # Ensure UNKNOWN_CLUSTER_ID is in p2c
        if person_id not in p2c:
            # Assign a default color if not found
            color = "#000000"  # Default to black or any fallback color
        else:
            color = p2c[person_id]

        res.append(
            {
                "person_id": person_id,
                "person_name": person_name,
                "person_label_is_inferred": not face.person,
                "color": color,
                "face_url": face.image.url,
                "value": {"x": vis[0], "y": vis[1], "size": vis[2]},
            }
        )
    return {"status": True, "data": res}


def cluster_all_faces(user, job_id) -> bool:
    """Groups all faces into clusters for ease of labeling. It first deletes all
    existing clusters, then regenerates them all. It will split clusters that have
    more than one kind of labeled face.
    :param user: the current user running the training
    :param job_id: the background job ID
    """
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_CLUSTER_ALL_FACES,
        job_id=job_id,
    )
    lrj.update_progress(current=0, target=1)

    try:
        delete_clustered_people(user)
        delete_clusters(user)
        delete_persons_without_faces()
        target_count: int = create_all_clusters(user, lrj)

        lrj.update_progress(current=target_count, target=target_count)
        lrj.complete()

        train_job_id = uuid.uuid4()
        AsyncTask(train_faces, user, train_job_id).run()
        return True

    except BaseException as err:
        logger.exception("An error occurred")
        print(f"[ERR] {err}")
        lrj.fail(error=err)
        return False


def create_all_clusters(user: User, lrj: LongRunningJob = None) -> int:
    """Generate Cluster records for each different clustering of people
    :param user: the current user
    :param lrj: LongRunningJob to update, if needed
    """
    all_clusters: list[Cluster] = []
    face: Face
    logger.info("Creating clusters")

    data = {
        "all": {"encoding": [], "id": [], "person_id": [], "person_labeled": []},
    }
    for face in Face.objects.filter(photo__owner=user).prefetch_related("person"):
        data["all"]["encoding"].append(face.get_encoding_array())
        data["all"]["id"].append(face.id)

    target_count = len(data["all"]["id"])
    if target_count == 0:
        return target_count

    min_cluster_size = 2
    # double cluster size for every 10x increase in target counts, if user has not set a valid min_cluster_size
    if (
        user.min_cluster_size == 0
        or user.min_cluster_size is None
        or user.min_cluster_size == 1
    ):
        if target_count > 1000:
            min_cluster_size = 4
        if target_count > 10000:
            min_cluster_size = 8
        if target_count > 100000:
            min_cluster_size = 16
    else:
        min_cluster_size = user.min_cluster_size

    min_samples = 1
    if user.min_samples > 0:
        min_samples = user.min_samples

    # creating HDBSCAN object for clustering the encodings with the metric "euclidean"
    clt = HDBSCAN(
        min_cluster_size=min_cluster_size,
        min_samples=min_samples,
        cluster_selection_epsilon=user.cluster_selection_epsilon,
        metric="euclidean",
    )
    logger.info("Before finding clusters")
    # clustering the encodings
    clt.fit(np.array(data["all"]["encoding"]))
    logger.info("After finding clusters")

    labelIDs = np.unique(clt.labels_)
    labelID: np.intp
    commit_time = datetime.datetime.now() + datetime.timedelta(seconds=5)
    count: int = 0
    maxLen: int = len(str(np.size(labelIDs)))
    sortedIndexes: dict[int, np.ndarray] = dict()
    clusterCount: int = 0
    clusterId: int

    for labelID in labelIDs:
        idxs = np.where(clt.labels_ == labelID)[0]
        sortedIndexes[labelID] = idxs

    logger.info(f"Found {len(sortedIndexes)} clusters")
    for labelID in sorted(
        sortedIndexes, key=lambda key: np.size(sortedIndexes[key]), reverse=True
    ):
        if labelID != UNKNOWN_CLUSTER_ID:
            clusterCount = clusterCount + 1
            clusterId = clusterCount
        else:
            clusterId = labelID
        face_array: list[Face] = []
        face_id_list: list[int] = []
        for i in sortedIndexes[labelID]:
            count = count + 1
            face_id = data["all"]["id"][i]
            face_id_list.append(face_id)
        face_array = Face.objects.filter(
            Q(pk__in=face_id_list) & Q(encoding__isnull=False) & Q(deleted=False)
        )
        new_clusters: list[Cluster] = ClusterManager.try_add_cluster(
            user, clusterId, face_array, maxLen
        )

        if commit_time < datetime.datetime.now() and lrj is not None:
            lrj.progress_current = count
            lrj.progress_target = target_count
            lrj.save()
            commit_time = datetime.datetime.now() + datetime.timedelta(seconds=5)

        all_clusters.extend(new_clusters)

    print(f"[INFO] Created {len(all_clusters)} clusters")
    return target_count


def delete_persons_without_faces():
    """Delete all existing Person records that have no associated Face records"""
    print("[INFO] Deleting all people without faces")
    Person.objects.filter(faces=None, kind=Person.KIND_USER).delete()


def delete_clusters(user: User):
    """Delete all existing Cluster records"""
    print("[INFO] Deleting all clusters")
    Cluster.objects.filter(Q(owner=user)).delete()
    Cluster.objects.filter(Q(owner=None)).delete()
    Cluster.objects.filter(Q(owner=get_deleted_user())).delete()


def delete_clustered_people(user: User):
    """Delete all existing Person records of type CLUSTER"""
    print("[INFO] Deleting all clustered people")
    Person.objects.filter(kind=Person.KIND_CLUSTER, cluster_owner=user).delete()
    Person.objects.filter(kind=Person.KIND_UNKNOWN, cluster_owner=user).delete()
    Person.objects.filter(cluster_owner=None).delete()
    Person.objects.filter(cluster_owner=get_deleted_user()).delete()


# Function to filter data based on a desired shape
def filter_data(encodings, ids):
    valid_encodings = []
    valid_ids = []
    expected_shape = (
        len(encodings[0]) if encodings else 0
    )  # Set expected shape from first entry

    for i, (encoding, id_) in enumerate(zip(encodings, ids)):
        if len(encoding) == expected_shape:  # Check if shape is consistent
            valid_encodings.append(encoding)
            valid_ids.append(id_)
        else:
            logger.error(
                f"Discarding entry {i}: ID={id_}, encoding shape={len(encoding)} (expected {expected_shape})"
            )

    return np.array(valid_encodings), np.array(valid_ids)


def train_faces(user: User, job_id) -> bool:
    """Given existing Cluster records for all faces, determines the probability
    that unknown faces belong to those Clusters. It takes any known, labeled faces
    and adds the centroids of "unknown" clusters, assuming that those clusters
    correspond to *some* face. It then trains a classifier on that data to use
    in calculating the probabilities for unknown faces.
    :param user: the current user running the training
    :param job_id: the background job ID
    """
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_TRAIN_FACES,
        job_id=job_id,
    )
    lrj.update_progress(current=1, target=2)
    try:
        # Use two array, so that the first one gets thrown out, if it is no longer used.
        data_known = {"encoding": [], "id": []}
        data_unknown = {"encoding": [], "id": []}
        # First, sort all faces into known and unknown ones
        face: Face
        for face in Face.objects.filter(
            Q(photo__owner=user) & Q(encoding__isnull=False) & Q(deleted=False)
        ).prefetch_related("person"):
            if not face.person:
                data_unknown["encoding"].append(face.get_encoding_array())
                data_unknown["id"].append(face.id)
            else:
                data_known["encoding"].append(face.get_encoding_array())
                data_known["id"].append(face.person.id)

        if len(data_known["id"]) == 0:
            classifier = None
        else:
            logger.info("Before fitting")
            classifier = MLPClassifier(
                solver="adam", alpha=1e-5, random_state=1, max_iter=1000
            ).fit(np.array(data_known["encoding"]), np.array(data_known["id"]))
            logger.info("After fitting")

        # Next, pretend all unknown face clusters are known and add their mean encoding. This allows us
        # to predict the likelihood of other unknown faces belonging to those simulated clusters. For
        # the "Unknown - Other"-type cluster, we can still try to predict the probability that the face
        # can't be classified into another group, i.e. that it should be classified that way
        cluster: Cluster
        for cluster in Cluster.objects.filter(owner=user):
            if cluster.person and cluster.person.kind == Person.KIND_CLUSTER:
                print(cluster.person)
                data_known["encoding"].append(cluster.get_mean_encoding_array())
                data_known["id"].append(cluster.person.id)

        filtered_encodings, filtered_ids = filter_data(
            data_known["encoding"], data_known["id"]
        )

        # Fit the classifier based on the "known" faces, including the simulated clusters
        logger.info("Before cluster fitting")
        cluster_classifier = MLPClassifier(
            solver="adam", alpha=1e-5, random_state=1, max_iter=1000
        ).fit(filtered_encodings, filtered_ids)
        logger.info("After cluster fitting")

        # Collect the probabilities for each unknown face. The probabilities returned
        # are arrays in the same order as the people IDs in the original training set
        target_count = len(data_unknown["id"])
        if target_count == 0:
            logger.info("No clusters found")
            lrj.update_progress(current=2, target=2)
            lrj.complete()
            return True
        logger.info(f"Number of Cluster: {target_count}")

        # Hacky way to split arrays into smaller arrays
        pages_encoding = [
            data_unknown["encoding"][i : i + 100]
            for i in range(0, len(data_unknown["encoding"]), 100)
        ]
        pages_id = [
            data_unknown["id"][i : i + 100]
            for i in range(0, len(data_unknown["encoding"]), 100)
        ]
        for idx, page in enumerate(pages_encoding):
            page_id = pages_id[idx]
            pages_of_faces = Face.objects.filter(id__in=page_id).all()
            # sort pages of faces by id by page_id
            pages_of_faces = sorted(pages_of_faces, key=lambda x: page_id.index(x.id))
            face_encodings_unknown_np = np.array(page)
            cluster_probs = cluster_classifier.predict_proba(face_encodings_unknown_np)
            if classifier:
                classification_probs = classifier.predict_proba(
                    face_encodings_unknown_np
                )
            else:
                classification_probs = []
                while len(classification_probs) < len(cluster_probs):
                    classification_probs.append(
                        [0.0] * len(cluster_classifier.classes_)
                    )

            commit_time = datetime.datetime.now() + datetime.timedelta(seconds=5)
            face_stack = []
            unknown_cluster: Cluster = get_unknown_cluster(user=user)

            for idx, (
                face,
                cluster_probabilities,
                classification_probabilties,
            ) in enumerate(zip(pages_of_faces, cluster_probs, classification_probs)):
                face.cluster_probability = 0.0  # Cluster probability
                face.classification_probability = 0.0  # Classification probability
                classification_person = None
                classification_probability = 0.0

                highest_classification_probability = max(classification_probabilties)
                highest_classification_person = 0

                # Find the person with the highest probability for classification
                if classifier:
                    for i, target in enumerate(classifier.classes_):
                        if (
                            highest_classification_probability
                            == classification_probabilties[i]
                        ):
                            highest_classification_person = target

                    classification_person = highest_classification_person
                    classification_probability = highest_classification_probability

                # Find the probability in the probability array corresponding to the person
                # that we currently believe the face is, even a simulated "unknown" person
                highest_probability = max(cluster_probabilities)
                highest_probability_person = 0
                for i, target in enumerate(cluster_classifier.classes_):
                    if highest_probability == cluster_probabilities[i]:
                        highest_probability_person = target

                if face.cluster != unknown_cluster:
                    face.cluster_person = Person.objects.get(
                        id=highest_probability_person
                    )
                    face.cluster_probability = highest_probability

                if classification_person:
                    face.classification_person = Person.objects.get(
                        id=classification_person
                    )
                    face.classification_probability = classification_probability

                face_stack.append(face)
                if commit_time < datetime.datetime.now():
                    lrj.update_progress(current=idx + 1, target=target_count)
                    commit_time = datetime.datetime.now() + datetime.timedelta(
                        seconds=5
                    )
                if len(face_stack) > 200:
                    bulk_update(face_stack, update_fields=FACE_CLASSIFY_COLUMNS)
                    face_stack = []

            bulk_update(face_stack, update_fields=FACE_CLASSIFY_COLUMNS)

        lrj.update_progress(current=target_count, target=target_count)
        lrj.complete()
        return True

    except BaseException as err:
        logger.exception("An error occurred")
        print(f"[ERR] {err}")
        lrj.fail(error=err)
        return False


================================================
FILE: api/face_extractor.py
================================================
import numpy as np
import PIL

from api.face_recognition import get_face_locations
from api.metadata.reader import get_metadata
from api.metadata.tags import Tags
from api.util import is_number, logger


class RuleTypes:
    EXIF = "exif"
    DLIB = "dlib"


def extract_from_exif(image_path, big_thumbnail_image_path):
    (region_info, orientation) = get_metadata(
        image_path,
        tags=[Tags.REGION_INFO, Tags.ORIENTATION],
        try_sidecar=True,
        struct=True,
    )
    if not region_info:
        return
    logger.debug(f"Extracted region_info for {image_path}")
    logger.debug(f"region_info: {region_info}")
    face_locations = []
    for region in region_info["RegionList"]:
        if region.get("Type") != "Face":
            continue
        person_name = region.get("Name")

        area = region.get("Area")
        applied_to_dimensions = region.get("AppliedToDimensions")
        big_thumbnail_image = np.array(PIL.Image.open(big_thumbnail_image_path))
        if (area and area.get("Unit") == "normalized") or (
            applied_to_dimensions and applied_to_dimensions.get("Unit") == "pixel"
        ):
            image_width = big_thumbnail_image.shape[1]
            image_height = big_thumbnail_image.shape[0]
            if (
                not is_number(area.get("X"))
                or not is_number(area.get("Y"))
                or not is_number(area.get("W"))
                or not is_number(area.get("H"))
            ):
                logger.info(
                    f"Broken face area exif data! No numerical positional data. region_info: {region_info}"
                )
                continue

            correct_w = float(area.get("W"))
            correct_h = float(area.get("H"))
            correct_x = float(area.get("X"))
            correct_y = float(area.get("Y"))
            if orientation == "Rotate 90 CW":
                temp_x = correct_x
                correct_x = 1 - correct_y
                correct_y = temp_x
                correct_w, correct_h = correct_h, correct_w
            elif orientation == "Mirror horizontal":
                correct_x = 1 - correct_x
            elif orientation == "Rotate 180":
                correct_x = 1 - correct_x
                correct_y = 1 - correct_y
            elif orientation == "Mirror vertical":
                correct_y = 1 - correct_y
            elif orientation == "Mirror horizontal and rotate 270 CW":
                temp_x = correct_x
                correct_x = 1 - correct_y
                correct_y = temp_x
                correct_w, correct_h = correct_h, correct_w
            elif orientation == "Mirror horizontal and rotate 90 CW":
                temp_x = correct_x
                correct_x = correct_y
                correct_y = 1 - temp_x
                correct_w, correct_h = correct_h, correct_w
            elif orientation == "Rotate 270 CW":
                temp_x = correct_x
                correct_x = correct_y
                correct_y = 1 - temp_x
                correct_w, correct_h = correct_h, correct_w

            # Calculate the half-width and half-height of the box
            half_width = (correct_w * image_width) / 2
            half_height = (correct_h * image_height) / 2

            # Calculate the top, right, bottom, and left coordinates
            top = int((correct_y * image_height) - half_height)
            right = int((correct_x * image_width) + half_width)
            bottom = int((correct_y * image_height) + half_height)
            left = int((correct_x * image_width) - half_width)

            face_locations.append((top, right, bottom, left, person_name))
    return face_locations


def extract_from_dlib(image_path, big_thumbnail_path, owner):
    try:
        face_locations = get_face_locations(
            big_thumbnail_path,
            model=owner.face_recognition_model.lower(),
        )
    except Exception as e:
        logger.info(f"Can't extract face information on photo: {image_path}")
        logger.info(e)
        face_locations = []

    for i, face_location in enumerate(face_locations):
        face_locations[i] = (*face_location, None)
    return face_locations


def extract(image_path, big_thumbnail_path, owner):
    exif = extract_from_exif(image_path, big_thumbnail_path)
    if not exif:
        return extract_from_dlib(image_path, big_thumbnail_path, owner)
    return exif


================================================
FILE: api/face_recognition.py
================================================
import numpy as np
import requests


def get_face_encodings(image_path, known_face_locations):
    json = {
        "source": image_path,
        "face_locations": known_face_locations,
    }
    face_encoding = requests.post(
        "http://localhost:8005/face-encodings", json=json
    ).json()

    face_encodings_list = face_encoding["encodings"]
    face_encodings = [np.array(enc) for enc in face_encodings_list]

    return face_encodings


def get_face_locations(image_path, model="hog"):
    json = {"source": image_path, "model": model}
    face_locations = requests.post(
        "http://localhost:8005/face-locations", json=json
    ).json()
    return face_locations["face_locations"]


================================================
FILE: api/feature/__init__.py
================================================


================================================
FILE: api/feature/embedded_media.py
================================================
import os
from mmap import ACCESS_READ, mmap

import magic
from django.conf import settings

JPEG_EOI_MARKER = b"\xff\xd9"
GOOGLE_PIXEL_MOTION_PHOTO_MP4_SIGNATURES = [b"ftypmp42", b"ftypisom", b"ftypiso2"]

# in reality Samsung motion photo marker will look something like this
# ........Image_UTC_Data1458170015363SEFHe...........#...#.......SEFT..0.....MotionPhoto_Data
# but we are interested only in the content of the video which is right after MotionPhoto_Data
SAMSUNG_MOTION_PHOTO_MARKER = b"MotionPhoto_Data"


def _locate_embedded_video_google(data):
    signatures = GOOGLE_PIXEL_MOTION_PHOTO_MP4_SIGNATURES
    for signature in signatures:
        position = data.find(signature)
        if position != -1:
            return position - 4
    return -1


def _locate_embedded_video_samsung(data):
    position = data.find(SAMSUNG_MOTION_PHOTO_MARKER)
    if position != -1:
        return position + len(SAMSUNG_MOTION_PHOTO_MARKER)
    return -1


def has_embedded_media(path: str) -> bool:
    mime = magic.Magic(mime=True)
    mime_type = mime.from_file(path)
    if mime_type != "image/jpeg":
        return False
    with open(path, "rb") as image:
        with mmap(image.fileno(), 0, access=ACCESS_READ) as mm:
            return (
                _locate_embedded_video_samsung(mm) != -1
                or _locate_embedded_video_google(mm) != -1
            )


def extract_embedded_media(path: str, hash: str) -> str | None:
    with open(str(path), "rb") as image:
        with mmap(image.fileno(), 0, access=ACCESS_READ) as mm:
            position = _locate_embedded_video_google(
                mm
            ) or _locate_embedded_video_google(mm)
            if position == -1:
                return None
            output_dir = f"{settings.MEDIA_ROOT}/embedded_media"
            if not os.path.exists(output_dir):
                os.makedirs(output_dir)
            output_path = f"{output_dir}/{hash}_1.mp4"
            with open(output_path, "wb+") as video:
                mm.seek(position)
                data = mm.read(mm.size())
                video.write(data)
            return output_path


================================================
FILE: api/feature/tests/__init__.py
================================================


================================================
FILE: api/feature/tests/test_embedded_media.py
================================================
from django.conf import settings
from django.test import override_settings
from rest_framework.test import APIClient, APITestCase

from api.feature.embedded_media import (
    GOOGLE_PIXEL_MOTION_PHOTO_MP4_SIGNATURES,
    JPEG_EOI_MARKER,
    SAMSUNG_MOTION_PHOTO_MARKER,
    extract_embedded_media,
    has_embedded_media,
)
from api.models import User
from api.models.file import File
from api.tests.utils import create_test_photo, create_test_user


def create_test_file(path: str, user: User, content: bytes):
    with open(path, "wb+") as f:
        f.write(content)
    return File.create(path, user)


JPEG_MAGIC_NUMBER = b"\xff\xd8\xff"
JPEG = JPEG_MAGIC_NUMBER + b"\xde\xad\xfa\xce" + JPEG_EOI_MARKER
MP4_DATA = b"\xca\xfe\xfe\xed"
MP4_PREFIX = b"\x00\x00\x00\x18"
MP4 = MP4_PREFIX + b"ftypmp42" + MP4_DATA
RANDOM_BYTES = b"\x13\x37\xc0\xde"


@override_settings(MEDIA_ROOT="/tmp")
class EmbeddedMediaTest(APITestCase):
    def setUp(self):
        self.test_image_path = "/tmp/test_file.jpeg"
        self.test_video_path = "/tmp/test_file.mp4"
        self.user = create_test_user()
        self.client = APIClient()

    def test_should_not_process_non_jpeg_files(self):
        file = create_test_file(self.test_video_path, self.user, MP4)
        actual = has_embedded_media(file.path)
        self.assertFalse(actual)

    def test_google_pixel_motion_photo_signatures(self):
        for signature in GOOGLE_PIXEL_MOTION_PHOTO_MP4_SIGNATURES:
            content = JPEG + MP4_PREFIX + signature + MP4_DATA
            file = create_test_file(self.test_image_path, self.user, content)
            actual = has_embedded_media(file.path)
            self.assertTrue(actual)

    def test_samsung_motion_photo_signature(self):
        content = JPEG + SAMSUNG_MOTION_PHOTO_MARKER + MP4_DATA
        file = create_test_file(self.test_image_path, self.user, content)
        actual = has_embedded_media(file.path)
        self.assertTrue(actual)

    def test_other_content_should_not_report_as_having_embedded_media(self):
        file = create_test_file(self.test_image_path, self.user, RANDOM_BYTES)
        actual = has_embedded_media(file.path)
        self.assertFalse(actual)

    def test_extract_embedded_media_from_google_motion_photo(self):
        for signature in GOOGLE_PIXEL_MOTION_PHOTO_MP4_SIGNATURES:
            content = JPEG + MP4_PREFIX + signature + MP4_DATA
            file = create_test_file(self.test_image_path, self.user, content)
            path = extract_embedded_media(file.path, file.hash)
            expected = f"{settings.MEDIA_ROOT}/embedded_media/{file.hash}_1.mp4"
            self.assertEqual(path, expected)
            with open(path, "rb") as f:
                contents = f.read()
                self.assertEqual(MP4_PREFIX + signature + MP4_DATA, contents)

    def test_extract_embedded_media_from_samsung_motion_photo(self):
        content = JPEG + SAMSUNG_MOTION_PHOTO_MARKER + MP4
        file = create_test_file(self.test_image_path, self.user, content)
        path = extract_embedded_media(file.path, file.hash)
        expected = f"{settings.MEDIA_ROOT}/embedded_media/{file.hash}_1.mp4"
        self.assertEqual(expected, path)
        with open(path, "rb+") as f:
            contents = f.read()
            self.assertEqual(MP4, contents)

    def test_fetch_embedded_media_as_owner(self):
        self.client.force_authenticate(user=self.user)
        embedded_media = create_test_file(self.test_video_path, self.user, MP4)
        photo = create_test_photo(owner=self.user)
        photo.main_file.embedded_media.add(embedded_media)
        response = self.client.get(f"/media/embedded_media/{photo.pk}")
        self.assertEqual(response.status_code, 200)

    def test_fetch_embedded_media_as_anonymous_when_photo_is_public(self):
        self.client.force_authenticate(user=None)
        embedded_media = create_test_file(self.test_video_path, self.user, MP4)
        photo = create_test_photo(owner=self.user, public=True)
        photo.main_file.embedded_media.add(embedded_media)

        response = self.client.get(f"/media/embedded_media/{photo.pk}")
        self.assertEqual(response.status_code, 200)

    def test_fetch_embedded_media_as_anonymous_when_photo_is_private(self):
        self.client.force_authenticate(user=None)
        embedded_media = create_test_file(self.test_video_path, self.user, MP4)
        photo = create_test_photo(owner=self.user, public=False)
        photo.main_file.embedded_media.add(embedded_media)

        response = self.client.get(f"/media/embedded_media/{photo.pk}")
        self.assertEqual(response.status_code, 404)

    def test_fetch_embedded_media_when_photo_does_not_have_embedded_media(self):
        self.client.force_authenticate(user=self.user)
        photo = create_test_photo(owner=self.user)

        response = self.client.get(f"/media/embedded_media/{photo.pk}")
        self.assertEqual(response.status_code, 404)


================================================
FILE: api/filters.py
================================================
import datetime
import operator
from functools import reduce

from django.db.models import Q
from rest_framework import filters

from api import util
from api.image_similarity import search_similar_embedding
from api.semantic_search import calculate_query_embeddings


class SemanticSearchFilter(filters.SearchFilter):
    def filter_queryset(self, request, queryset, view):
        search_fields = self.get_search_fields(view, request)
        search_terms = self.get_search_terms(request)

        if not search_fields or not search_terms:
            return queryset

        orm_lookups = [
            self.construct_search(str(search_field), queryset=queryset)
            for search_field in search_fields
        ]

        if request.user.semantic_search_topk > 0:
            query = request.query_params.get("search")
            start = datetime.datetime.now()
            emb, magnitude = calculate_query_embeddings(query)
            elapsed = (datetime.datetime.now() - start).total_seconds()
            util.logger.info(
                "finished calculating query embedding - took %.2f seconds" % (elapsed)
            )
            start = datetime.datetime.now()
            image_hashes = search_similar_embedding(
                request.user.id, emb, request.user.semantic_search_topk, threshold=27
            )
            elapsed = (datetime.datetime.now() - start).total_seconds()
            util.logger.info("search similar embedding - took %.2f seconds" % (elapsed))
        conditions = []
        for search_term in search_terms:
            queries = [Q(**{orm_lookup: search_term}) for orm_lookup in orm_lookups]

            if request.user.semantic_search_topk > 0:
                queries += [Q(image_hash__in=image_hashes)]

            conditions.append(reduce(operator.or_, queries))
        queryset = queryset.filter(reduce(operator.and_, conditions))

        if self.must_call_distinct(queryset, search_fields):
            # Filtering against a many-to-many field requires us to
            # call queryset.distinct() in order to avoid duplicate items
            # in the resulting queryset.
            # We try to avoid this if possible, for performance reasons.
            queryset = queryset.distinct()
        return queryset


================================================
FILE: api/geocode/__init__.py
================================================
GEOCODE_VERSION = "1"


================================================
FILE: api/geocode/config.py
================================================
from constance import config as settings

from .parsers.mapbox import parse as parse_mapbox
from .parsers.nominatim import parse as parse_nominatim
from .parsers.opencage import parse as parse_opencage
from .parsers.tomtom import parse as parse_tomtom


def _get_config():
    return {
        "mapbox": {
            "geocode_args": {"api_key": settings.MAP_API_KEY},
            "parser": parse_mapbox,
        },
        "maptiler": {
            "geocode_args": {"api_key": settings.MAP_API_KEY},
            "parser": parse_mapbox,
        },
        "tomtom": {
            "geocode_args": {"api_key": settings.MAP_API_KEY},
            "parser": parse_tomtom,
        },
        "nominatim": {
            "geocode_args": {"user_agent": "librephotos"},
            "parser": parse_nominatim,
        },
        "opencage": {
            "geocode_args": {
                "api_key": settings.MAP_API_KEY,
            },
            "parser": parse_opencage,
        },
    }


def get_provider_config(provider) -> dict:
    config = _get_config()
    if provider not in config:
        raise Exception(f"Map provider not found: {provider}.")
    return config[provider]["geocode_args"]


def get_provider_parser(provider) -> callable:
    config = _get_config()
    if provider not in config:
        raise Exception(f"Map provider not found: {provider}.")
    return config[provider]["parser"]


================================================
FILE: api/geocode/geocode.py
================================================
from typing import List

import geopy
from constance import config as site_config

from api import util

from .config import get_provider_config, get_provider_parser


class Geocode:
    def __init__(self, provider):
        self._provider_config = get_provider_config(provider)
        self._parser = get_provider_parser(provider)
        self._geocoder = geopy.get_geocoder_for_service(provider)(
            **self._provider_config
        )

    def reverse(self, lat: float, lon: float) -> dict:
        if (
            "geocode_args" in self._provider_config
            and "api_key" in self._provider_config["geocode_args"]
            and self._provider_config["geocode_args"]["api_key"] is None
        ):
            util.logger.warning(
                "No API key found for map provider. Please set MAP_API_KEY in the admin panel or switch map provider."
            )
            return {}
        location = self._geocoder.reverse(f"{lat},{lon}")
        return self._parser(location)

    def search(self, query: str, limit: int = 5) -> List[dict]:
        """Forward geocoding: search for locations by name/address."""
        if (
            "api_key" in self._provider_config
            and self._provider_config["api_key"] is None
        ):
            util.logger.warning(
                "No API key found for map provider. Please set MAP_API_KEY in the admin panel or switch map provider."
            )
            return []
        locations = self._geocoder.geocode(query, exactly_one=False, limit=limit)
        if not locations:
            return []
        return [
            {
                "display_name": loc.address,
                "lat": loc.latitude,
                "lon": loc.longitude,
            }
            for loc in locations
        ]


def reverse_geocode(lat: float, lon: float) -> dict:
    try:
        return Geocode(site_config.MAP_API_PROVIDER).reverse(lat, lon)
    except Exception as e:
        util.logger.warning(f"Error while reverse geocoding: {e}")
        return {}


def search_location(query: str, limit: int = 5) -> List[dict]:
    """Search for locations by name/address using the configured map provider."""
    try:
        return Geocode(site_config.MAP_API_PROVIDER).search(query, limit)
    except Exception as e:
        util.logger.warning(f"Error while searching location: {e}")
        return []


================================================
FILE: api/geocode/parsers/__init__.py
================================================


================================================
FILE: api/geocode/parsers/mapbox.py
================================================
from api.geocode import GEOCODE_VERSION


def parse(location):
    context = location.raw["context"]
    center = [location.raw["center"][1], location.raw["center"][0]]
    local_name = location.raw["text"]
    places = [local_name] + [
        i["text"] for i in context if not i["id"].startswith("post")
    ]
    return {
        "features": [{"text": place, "center": center} for place in places],
        "places": places,
        "address": location.address,
        "center": center,
        "_v": GEOCODE_VERSION,
    }


================================================
FILE: api/geocode/parsers/nominatim.py
================================================
from api.geocode import GEOCODE_VERSION


def parse(location):
    data = location.raw["address"]
    props = [
        "road",
        "town",
        "neighbourhood",
        "suburb",
        "hamlet",
        "borough",
        "city",
        "county",
        "state",
        "country",
    ]
    places = [data[prop] for prop in props if prop in data]
    center = [float(location.raw["lat"]), float(location.raw["lon"])]
    return {
        "features": [{"text": place, "center": center} for place in places],
        "places": places,
        "address": location.address,
        "center": center,
        "_v": GEOCODE_VERSION,
    }


================================================
FILE: api/geocode/parsers/opencage.py
================================================
from api.geocode import GEOCODE_VERSION


def parse(location):
    data = location.raw["components"]
    center = [location.raw["geometry"]["lat"], location.raw["geometry"]["lng"]]
    props = [
        data["_type"],
        "road",
        "suburb",
        "municipality",
        "hamlet",
        "towncity",
        "borough",
        "state",
        "county",
        "country",
    ]
    places = [data[prop] for prop in props if prop in data]
    return {
        "features": [{"text": place, "center": center} for place in places],
        "places": places,
        "address": location.address,
        "center": center,
        "_v": GEOCODE_VERSION,
    }


================================================
FILE: api/geocode/parsers/tomtom.py
================================================
from functools import reduce

from api.geocode import GEOCODE_VERSION


def _dedup(iterable):
    unique_items = set()

    def reducer(acc, item):
        if item not in unique_items:
            unique_items.add(item)
            acc.append(item)
        return acc

    return reduce(reducer, iterable, [])


def parse(location):
    data = location.raw["address"]
    address = location.address
    center = list(map(lambda x: float(x), location.raw["position"].split(",")))
    props = [
        "street",
        "streetName",
        "municipalitySubdivision",
        "countrySubdivision",
        "countrySecondarySubdivision",
        "municipality",
        "municipalitySubdivision",
        "country",
    ]
    places = _dedup(
        [data[prop] for prop in props if prop in data and len(data[prop]) > 2]
    )
    return {
        "features": [{"text": place, "center": center} for place in places],
        "places": places,
        "address": address,
        "center": center,
        "_v": GEOCODE_VERSION,
    }


================================================
FILE: api/image_captioning.py
================================================
import requests
from constance import config as site_config


def generate_caption(image_path, blip=False, prompt=None):
    # Check if Moondream is selected as captioning model
    if site_config.CAPTIONING_MODEL == "moondream":
        # Use custom prompt if provided, otherwise use default caption prompt
        if prompt is None:
            prompt = "Describe this image in a short, concise caption."

        json_data = {
            "image_path": image_path,
            "prompt": prompt,
            "max_tokens": 256,
        }
        try:
            response = requests.post("http://localhost:8008/generate", json=json_data)

            if response.status_code != 201:
                print(
                    f"Error with Moondream captioning service: HTTP {response.status_code} - {response.text}"
                )
                return "Error generating caption with Moondream: Service unavailable"

            response_data = response.json()
            return response_data["response"]
        except requests.exceptions.ConnectionError:
            print(
                "Error with Moondream captioning service: Cannot connect to LLM service on port 8008"
            )
            return "Error generating caption with Moondream: Service unavailable"
        except requests.exceptions.Timeout:
            print("Error with Moondream captioning service: Request timeout")
            return "Error generating caption with Moondream: Request timeout"
        except Exception as e:
            print(f"Error with Moondream captioning service: {e}")
            return "Error generating caption with Moondream"

    # Original implementation for other models
    json_data = {
        "image_path": image_path,
        "onnx": False,
        "blip": blip,
    }
    caption_response = requests.post(
        "http://localhost:8007/generate-caption", json=json_data
    ).json()

    return caption_response["caption"]


def unload_model():
    requests.get("http://localhost:8007/unload-model")


================================================
FILE: api/image_similarity.py
================================================
from datetime import datetime

import numpy as np
import requests
from django.conf import settings
from django.core.paginator import Paginator
from django.db.models import Q

from api.models import Photo
from api.util import logger


def search_similar_embedding(user, emb, result_count=100, threshold=27):
    if isinstance(user, int):
        user_id = user
    else:
        user_id = user.id

    image_embedding = np.array(emb, dtype=np.float32)

    post_data = {
        "user_id": user_id,
        "image_embedding": image_embedding.tolist(),
        "n": result_count,
        "threshold": threshold,
    }
    res = requests.post(settings.IMAGE_SIMILARITY_SERVER + "/search/", json=post_data)
    if res.status_code == 200:
        return res.json()["result"]
    else:
        logger.error(f"error retrieving similar embeddings for user {user_id}")
        return []


def search_similar_image(user, photo, threshold=27):
    if isinstance(user, int):
        user_id = user
    else:
        user_id = user.id

    clip_embeddings = photo.get_clip_embeddings()
    if clip_embeddings is None:
        return []

    image_embedding = np.array(clip_embeddings, dtype=np.float32)

    post_data = {
        "user_id": user_id,
        "image_embedding": image_embedding.tolist(),
        "threshold": threshold,
    }
    res = requests.post(settings.IMAGE_SIMILARITY_SERVER + "/search/", json=post_data)
    if res.status_code == 200:
        return res.json()
    else:
        logger.error(
            f"error retrieving similar photos to {photo.image_hash} belonging to user {user.username}"
        )
        return []


def build_image_similarity_index(user):
    logger.info(f"building similarity index for user {user.username}")
    requests.delete(
        settings.IMAGE_SIMILARITY_SERVER + "/build/",
        json={"user_id": user.id},
    )
    start = datetime.now()
    photos = (
        Photo.objects.filter(Q(hidden=False) & Q(owner=user))
        .exclude(clip_embeddings=None)
        .only("clip_embeddings", "image_hash")
        .order_by("image_hash")
        .all()
    )
    paginator = Paginator(photos, 5000)

    for page in range(1, paginator.num_pages + 1):
        image_hashes = []
        image_embeddings = []
        for photo in paginator.page(page).object_list:
            clip_embeddings = photo.get_clip_embeddings()
            if clip_embeddings is not None:
                image_hashes.append(photo.image_hash)
                image_embedding = np.array(clip_embeddings, dtype=np.float32)
                image_embeddings.append(image_embedding.tolist())

        post_data = {
            "user_id": user.id,
            "image_hashes": image_hashes,
            "image_embeddings": image_embeddings,
        }
        requests.post(settings.IMAGE_SIMILARITY_SERVER + "/build/", json=post_data)
    elapsed = (datetime.now() - start).total_seconds()
    logger.info("building similarity index took %.2f seconds" % elapsed)


================================================
FILE: api/llm.py
================================================
import requests
import base64
import io
from PIL import Image
from constance import config as site_config


def image_to_base64_data_uri(image_path):
    """Convert image file to base64 data URI, converting to JPEG for compatibility"""
    try:
        # Open image with PIL and convert to RGB (handles WebP, PNG with transparency, etc.)
        with Image.open(image_path) as img:
            # Convert to RGB mode (removes alpha channel if present)
            if img.mode != "RGB":
                img = img.convert("RGB")

            # Save as JPEG to memory buffer
            buffer = io.BytesIO()
            img.save(buffer, format="JPEG", quality=95)
            buffer.seek(0)

            # Encode to base64
            image_data = base64.b64encode(buffer.getvalue()).decode("utf-8")

        return f"data:image/jpeg;base64,{image_data}"
    except Exception as e:
        print(f"Error converting image to data URI: {str(e)}")
        raise


def generate_prompt(prompt, image_path=None):
    if site_config.LLM_MODEL == "none":
        return None

    # Use the unified LLM service for all models including Moondream
    if site_config.LLM_MODEL == "moondream":
        model_path = "/protected_media/data_models/moondream2-text-model-f16.gguf"
    elif site_config.LLM_MODEL == "mistral-7b-instruct-v0.2.Q5_K_M":
        model_path = "/protected_media/data_models/mistral-7b-instruct-v0.2.Q5_K_M.gguf"
    else:
        return None

    json_data = {
        "model_path": model_path,
        "max_tokens": 64,
        "prompt": prompt,
    }

    # Convert image to base64 data URI if image path is provided
    if image_path:
        try:
            image_data = image_to_base64_data_uri(image_path)
            json_data["image_data"] = image_data
            json_data["multimodal"] = True
        except Exception as e:
            print(f"Error converting image: {e}")
            return None

    try:
        response = requests.post("http://localhost:8008/generate", json=json_data)

        if response.status_code != 201:
            print(
                f"Error with LLM service: HTTP {response.status_code} - {response.text}"
            )
            return None

        response_data = response.json()
        return response_data.get("response", "")
    except requests.exceptions.ConnectionError:
        print("Error with LLM service: Cannot connect to service on port 8008")
        return None
    except requests.exceptions.Timeout:
        print("Error with LLM service: Request timeout")
        return None
    except Exception as e:
        print(f"Error with LLM service: {e}")
        return None


================================================
FILE: api/management/__init__.py
================================================


================================================
FILE: api/management/commands/build_similarity_index.py
================================================
from django.core.management.base import BaseCommand
from django_q.tasks import AsyncTask

from api.image_similarity import build_image_similarity_index
from api.models import User


class Command(BaseCommand):
    help = "Build image similarity index for all users"

    def handle(self, *args, **kwargs):
        for user in User.objects.all():
            AsyncTask(build_image_similarity_index, user).run()


================================================
FILE: api/management/commands/clear_cache.py
================================================
from django.conf import settings
from django.core.cache import cache
from django.core.management.base import BaseCommand, CommandError


class Command(BaseCommand):
    """A simple management command which clears the site-wide cache."""

    help = "Fully clear your site-wide cache."

    def handle(self, *args, **kwargs):
        try:
            assert settings.CACHES
            cache.clear()
            self.stdout.write("Your cache has been cleared!\n")
        except AttributeError:
            raise CommandError("You have no cache configured!\n")


================================================
FILE: api/management/commands/createadmin.py
================================================
import os
import sys

from django.core.management.base import BaseCommand, CommandError
from django.core.validators import ValidationError, validate_email

from api.models import User


class Command(BaseCommand):
    help = "Create a LibrePhotos user with administrative permissions"

    def add_arguments(self, parser):
        parser.add_argument("admin_username", help="Username to create")
        parser.add_argument("admin_email", help="Email address of the new user")
        parser.add_argument(
            "-u",
            "--update",
            help=(
                "Update an existing superuser's password (ignoring the"
                "provided email) instead of reporting an error"
            ),
            action="store_true",
        )
        # Done this way because command lines are visible to the whole system by
        #  default on Linux, so a password in the arguments would leak
        parser.epilog = (
            "The password is read from the ADMIN_PASSWORD"
            "environment variable or interactively if"
            "ADMIN_PASSWORD is not set"
        )

    def handle(self, *args, **options):
        try:
            validate_email(options["admin_email"])
        except ValidationError as err:
            raise CommandError(err.message)

        if "ADMIN_PASSWORD" in os.environ:
            options["admin_password"] = os.environ["ADMIN_PASSWORD"]
        else:
            options["admin_password"] = User.objects.make_random_password()

        if not options["admin_password"]:
            raise CommandError("Admin password cannot be empty")

        if not User.objects.filter(username=options["admin_username"].lower()).exists():
            User.objects.create_superuser(
                options["admin_username"].lower(),
                options["admin_email"],
                options["admin_password"],
            )
        elif options["update"]:
            print(
                "Warning: ignoring provided email " + options["admin_email"],
                file=sys.stderr,
            )
            admin_user = User.objects.get(username=options["admin_username"].lower())
            admin_user.set_password(options["admin_password"])
            admin_user.save()
        else:
            raise CommandError("Specified user already exists")


================================================
FILE: api/management/commands/createuser.py
================================================
import os
import sys

from django.core.management.base import BaseCommand, CommandError
from django.core.validators import ValidationError, validate_email

from api.models import User


class Command(BaseCommand):
    help = "Create a LibrePhotos user"

    def add_arguments(self, parser):
        parser.add_argument("username", help="Username to create")
        parser.add_argument("email", help="Email address of the new user")
        parser.add_argument(
            "--password",
            help="Password to create/update for user. (autogenerate if omitted)",
        )
        parser.add_argument(
            "--update",
            help=(
                "Update an existing user's password (ignoring the provided email) "
                "instead of reporting an error"
            ),
            action="store_true",
        )
        parser.add_argument(
            "--admin",
            help="Create user with administrative privileges",
            action="store_true",
        )
        # Done this way because command lines are visible to the whole system by
        #  default on Linux, so a password in the arguments would leak
        parser.epilog = (
            "When creating user with administrative privileges,"
            "the password is read from the ADMIN_PASSWORD"
            "environment variable or interactively if"
            "ADMIN_PASSWORD is not set"
        )

    def handle(self, *args, **options):
        try:
            validate_email(options["email"])
        except ValidationError as err:
            raise CommandError(err.message)

        if options["admin"] and "ADMIN_PASSWORD" in os.environ:
            options["password"] = os.environ["ADMIN_PASSWORD"]

        if not options["password"]:
            options["password"] = User.objects.make_random_password()

        if not User.objects.filter(username=options["username"].lower()).exists():
            if options["admin"]:
                User.objects.create_superuser(
                    options["username"].lower(),
                    options["email"],
                    options["password"],
                )
            else:
                User.objects.create_user(
                    options["username"].lower(),
                    options["email"],
                    options["password"],
                )

        elif options["update"]:
            print(
                "Warning: ignoring provided email " + options["email"],
                file=sys.stderr,
            )
            user = User.objects.get(username=options["username"].lower())
            user.set_password(options["password"])
            user.save()
        else:
            raise CommandError("Specified user already exists")


================================================
FILE: api/management/commands/save_metadata.py
================================================
from django.core.management.base import BaseCommand

from api.models import Photo, User
from api.models.person import Person


class Command(BaseCommand):
    help = "Save metadata to image files (or XMP sidecar files)"

    def add_arguments(self, parser):
        parser.add_argument(
            "--types",
            nargs="+",
            choices=["ratings", "face_tags"],
            default=["ratings"],
            help="Which metadata types to write (default: ratings)",
        )
        parser.add_argument(
            "--user",
            type=str,
            help="Only process photos owned by this username",
        )
        parser.add_argument(
            "--sidecar",
            action="store_true",
            default=True,
            help="Write to XMP sidecar files (default)",
        )
        parser.add_argument(
            "--media-file",
            action="store_true",
            help="Write directly to media files instead of sidecars",
        )
        parser.add_argument(
            "--dry-run",
            action="store_true",
            help="Only show what would be written, don't actually write",
        )

    def handle(self, *args, **options):
        metadata_types = options["types"]
        use_sidecar = not options["media_file"]

        photos = Photo.objects.all()

        if options["user"]:
            try:
                user = User.objects.get(username=options["user"])
                photos = photos.filter(owner=user)
            except User.DoesNotExist:
                self.stderr.write(f"User '{options['user']}' not found")
                return

        # When only writing face tags, filter to photos with any (non-deleted) faces
        if metadata_types == ["face_tags"]:
            photos = photos.filter(
                faces__deleted=False,
            ).distinct()

        total = photos.count()
        self.stdout.write(f"Found {total} photos to process (types: {metadata_types})")

        if options["dry_run"]:
            self.stdout.write("Dry run — no files will be modified")
            return

        written = 0
        errors = 0
        for i, photo in enumerate(photos.iterator(), 1):
            try:
                photo._save_metadata(
                    use_sidecar=use_sidecar, metadata_types=metadata_types
                )
                written += 1
            except Exception as e:
                errors += 1
                self.stderr.write(f"Error writing {photo.image_hash}: {e}")

            if i % 100 == 0:
                self.stdout.write(
                    f"Progress: {i}/{total} ({written} written, {errors} errors)"
                )

        self.stdout.write(
            self.style.SUCCESS(
                f"Done. {written} written, {errors} errors out of {total} photos."
            )
        )


================================================
FILE: api/management/commands/scan.py
================================================
import traceback
import uuid

from django.core.management.base import BaseCommand

from api.directory_watcher import scan_photos
from api.models import User
from api.models.user import get_deleted_user
from nextcloud.directory_watcher import scan_photos as scan_photos_nextcloud


class Command(BaseCommand):
    help = "scan directory for all users"

    def add_arguments(self, parser):
        parser_group = parser.add_mutually_exclusive_group()
        parser_group.add_argument(
            "-f", "--full-scan", help=("Run full directory scan"), action="store_true"
        )
        parser_group.add_argument(
            "-s", "--scan-files", help=("Scan a list of files"), nargs="+", default=[]
        )
        parser_group.add_argument(
            "-n",
            "--nextcloud",
            help=("Run nextcloud scan instead of directory scan"),
            action="store_true",
        )

    def handle(self, *args, **options):
        # Nextcloud scan
        if options["nextcloud"]:
            self.nextcloud_scan()
            return

        # Add a single file.
        if options["scan_files"]:
            scan_files = options["scan_files"]
            deleted_user: User = get_deleted_user()
            for user in User.objects.all():
                user_files = []
                if user == deleted_user:
                    continue
                for scan_file in scan_files:
                    if scan_file.startswith(user.scan_directory):
                        user_files.append(scan_file)
                if user_files:
                    scan_photos(user, False, uuid.uuid4(), scan_files=user_files)
            return

        # Directory scan
        deleted_user: User = get_deleted_user()
        for user in User.objects.all():
            if user != deleted_user:
                scan_photos(
                    user, options["full_scan"], uuid.uuid4(), user.scan_directory
                )

    def nextcloud_scan(self):
        for user in User.objects.all():
            if not user.nextcloud_scan_directory:
                print(
                    f"Skipping nextcloud scan for user {user.username}. No scan directory configured."
                )
                continue
            print(f"Starting nextcloud scan for user {user.username}.")
            try:
                scan_photos_nextcloud(user, uuid.uuid4())
            except Exception:
                print(f"Nextcloud scan for user {user.username} failed:")
                print(traceback.format_exc())


================================================
FILE: api/management/commands/start_cleaning_service.py
================================================
from django.core.management.base import BaseCommand
from django_q.models import Schedule
from django_q.tasks import schedule

from api.util import logger


class Command(BaseCommand):
    help = "Start the cleanup service."

    def handle(self, *args, **kwargs):
        if not Schedule.objects.filter(
            func="api.services.cleanup_deleted_photos"
        ).exists():
            schedule(
                "api.services.cleanup_deleted_photos",
                schedule_type=Schedule.DAILY,
            )
        logger.info("Cleanup service started")


================================================
FILE: api/management/commands/start_job_cleanup_service.py
================================================
from django.core.management.base import BaseCommand
from django_q.models import Schedule
from django_q.tasks import schedule

from api.util import logger


class Command(BaseCommand):
    help = "Start the job cleanup service to mark stuck jobs as failed and remove old completed jobs."

    def handle(self, *args, **kwargs):
        # Schedule hourly cleanup of stuck jobs (running for more than 24 hours)
        if not Schedule.objects.filter(
            func="api.models.long_running_job.LongRunningJob.cleanup_stuck_jobs"
        ).exists():
            schedule(
                "api.models.long_running_job.LongRunningJob.cleanup_stuck_jobs",
                schedule_type=Schedule.HOURLY,
            )
            logger.info("Scheduled hourly stuck job cleanup")

        # Schedule daily cleanup of old completed jobs (older than 30 days)
        if not Schedule.objects.filter(
            func="api.models.long_running_job.LongRunningJob.cleanup_old_jobs"
        ).exists():
            schedule(
                "api.models.long_running_job.LongRunningJob.cleanup_old_jobs",
                schedule_type=Schedule.DAILY,
            )
            logger.info("Scheduled daily old job cleanup")

        logger.info("Job cleanup service started")


================================================
FILE: api/management/commands/start_service.py
================================================
from django.core.management.base import BaseCommand
from django_q.models import Schedule
from django_q.tasks import schedule

from api.services import SERVICES, start_service


class Command(BaseCommand):
    help = "Start one of the services."

    # Define all the services that can be started
    def add_arguments(self, parser):
        parser.add_argument(
            "service",
            type=str,
            help="The service to start",
            choices=[
                SERVICES.keys(),
                "all",
            ],
        )

    def handle(self, *args, **kwargs):
        service = kwargs["service"]
        if service == "all":
            for svc in SERVICES.keys():
                start_service(svc)
            if not Schedule.objects.filter(func="api.services.check_services").exists():
                schedule(
                    "api.services.check_services",
                    schedule_type=Schedule.MINUTES,
                    minutes=1,
                )
        else:
            start_service(service)


================================================
FILE: api/metadata/__init__.py
================================================
# api/metadata — organized metadata reading, writing, and tag constants.
#
# Submodules:
#   api.metadata.tags          — Tag name constants (Tags class)
#   api.metadata.reader        — get_metadata(), sidecar file helpers
#   api.metadata.writer        — write_metadata()
#   api.metadata.face_regions  — face region coordinate conversion & tag building
#
# Import directly from submodules to avoid circular import issues:
#   from api.metadata.tags import Tags
#   from api.metadata.reader import get_metadata
#   from api.metadata.writer import write_metadata
#   from api.metadata.face_regions import get_face_region_tags


================================================
FILE: api/metadata/face_regions.py
================================================
import PIL

from api.metadata.reader import get_metadata
from api.metadata.tags import Tags
from api.models.face import Face
from api.models.person import Person
from api.util import logger


def thumbnail_coords_to_normalized(top, right, bottom, left, thumb_width, thumb_height):
    """Convert Face model pixel coords (in big thumbnail space) to MWG-RS
    normalized center-based coords."""
    center_x = (left + right) / 2.0 / thumb_width
    center_y = (top + bottom) / 2.0 / thumb_height
    w = (right - left) / thumb_width
    h = (bottom - top) / thumb_height
    return center_x, center_y, w, h


def reverse_orientation_transform(x, y, w, h, orientation):
    """Invert the orientation transforms from face_extractor.py lines 54-80.

    The read path applies a forward transform from XMP coords to display coords.
    This function reverses that so we can go from display coords back to XMP coords.
    """
    if orientation == "Rotate 90 CW":
        # Forward: x' = 1 - y, y' = x, swap w/h
        # Reverse: y_orig = 1 - x', x_orig = y'
        new_x = y
        new_y = 1 - x
        w, h = h, w
        return new_x, new_y, w, h
    elif orientation == "Mirror horizontal":
        # Forward: x' = 1 - x
        # Reverse: x = 1 - x'
        return 1 - x, y, w, h
    elif orientation == "Rotate 180":
        # Forward: x' = 1 - x, y' = 1 - y
        # Reverse: same
        return 1 - x, 1 - y, w, h
    elif orientation == "Mirror vertical":
        # Forward: y' = 1 - y
        # Reverse: y = 1 - y'
        return x, 1 - y, w, h
    elif orientation == "Mirror horizontal and rotate 270 CW":
        # Forward: x' = 1 - y, y' = x, swap w/h
        # Same as Rotate 90 CW (the mirror cancels differently)
        new_x = y
        new_y = 1 - x
        w, h = h, w
        return new_x, new_y, w, h
    elif orientation == "Mirror horizontal and rotate 90 CW":
        # Forward: x' = y, y' = 1 - x, swap w/h
        # Reverse: x_orig = 1 - y', y_orig = x'
        new_x = 1 - y
        new_y = x
        w, h = h, w
        return new_x, new_y, w, h
    elif orientation == "Rotate 270 CW":
        # Forward: x' = y, y' = 1 - x, swap w/h
        # Reverse: x_orig = 1 - y', y_orig = x'
        new_x = 1 - y
        new_y = x
        w, h = h, w
        return new_x, new_y, w, h
    # Normal orientation or unknown — no transform
    return x, y, w, h


def _escape_exiftool_value(value):
    """Escape special characters in a string value for exiftool structured data.

    ExifTool uses commas, equals, braces in its structured value syntax,
    so person names containing these characters need escaping.
    """
    # ExifTool expects special chars to be escaped with backslash
    for ch in ("\\", "{", "}", "=", ","):
        value = value.replace(ch, f"\\{ch}")
    return value


def build_face_region_exiftool_args(face_regions, image_width=None, image_height=None):
    """Build exiftool args dict for writing XMP-mwg-rs:RegionInfo and XMP:Subject.

    Args:
        face_regions: list of dicts with keys: name, x, y, w, h
        image_width: original image width in pixels (for AppliedToDimensions)
        image_height: original image height in pixels (for AppliedToDimensions)

    Returns:
        dict of tag -> value suitable for write_metadata()
    """
    region_parts = []
    person_names = []
    for region in face_regions:
        name = _escape_exiftool_value(region["name"])
        x = f"{region['x']:.6f}"
        y = f"{region['y']:.6f}"
        w = f"{region['w']:.6f}"
        h = f"{region['h']:.6f}"
        region_parts.append(
            f"{{Area={{X={x},Y={y},W={w},H={h},Unit=normalized}}"
            f",Name={name},Type=Face}}"
        )
        if region["name"]:
            person_names.append(region["name"])

    region_list = ",".join(region_parts)

    # Include AppliedToDimensions if image dimensions are available
    if image_width and image_height:
        applied_to = f"AppliedToDimensions={{W={image_width},H={image_height},Unit=pixel}},"
    else:
        applied_to = ""

    value = f"{{{applied_to}RegionList=[{region_list}]}}"

    tags = {Tags.REGION_INFO_WRITE: value}

    # Add person names as XMP:Subject keywords for Lightroom compatibility
    if person_names:
        tags[Tags.SUBJECT] = person_names

    return tags


def get_face_region_tags(photo):
    """Build face region exiftool tags dict for a photo.

    Returns a dict of tags suitable for merging into _save_metadata()'s tags_to_write,
    or an empty dict if no faces exist.

    Args:
        photo: Photo model instance

    Returns:
        dict: e.g. {"XMP-mwg-rs:RegionInfo": "{RegionList=[...]}"}  or {}
    """
    faces = Face.objects.filter(
        photo=photo,
        deleted=False,
    ).select_related("person")

    if not faces.exists():
        return {}

    # Get thumbnail dimensions
    try:
        thumb_path = photo.thumbnail.thumbnail_big.path
        thumb_image = PIL.Image.open(thumb_path)
        thumb_width, thumb_height = thumb_image.size
        thumb_image.close()
    except Exception:
        logger.error(
            f"Cannot open thumbnail for photo {photo.image_hash}, skipping face tags"
        )
        return {}

    # Get EXIF orientation and original image dimensions
    (orientation, image_width, image_height) = get_metadata(
        photo.main_file.path,
        tags=[Tags.ORIENTATION, Tags.IMAGE_WIDTH, Tags.IMAGE_HEIGHT],
        try_sidecar=True,
    )

    # Convert each face's coordinates
    face_regions = []
    for face in faces:
        x, y, w, h = thumbnail_coords_to_normalized(
            face.location_top,
            face.location_right,
            face.location_bottom,
            face.location_left,
            thumb_width,
            thumb_height,
        )
        x, y, w, h = reverse_orientation_transform(x, y, w, h, orientation)
        # Only write person name for user-labeled faces
        if face.person and face.person.kind == Person.KIND_USER:
            name = face.person.name
        else:
            name = ""
        face_regions.append(
            {
                "name": name,
                "x": x,
                "y": y,
                "w": w,
                "h": h,
            }
        )

    return build_face_region_exiftool_args(face_regions, image_width, image_height)


================================================
FILE: api/metadata/reader.py
================================================
import os
import os.path

import requests


def get_sidecar_files_in_priority_order(media_file):
    """Returns a list of possible XMP sidecar files for *media_file*, ordered
    by priority.

    """
    image_basename = os.path.splitext(media_file)[0]
    return [
        image_basename + ".xmp",
        image_basename + ".XMP",
        media_file + ".xmp",
        media_file + ".XMP",
    ]


def _get_existing_metadata_files_reversed(media_file, include_sidecar_files):
    if include_sidecar_files:
        files = [
            file
            for file in get_sidecar_files_in_priority_order(media_file)
            if os.path.exists(file)
        ]
        files.append(media_file)
        return list(reversed(files))
    return [media_file]


def get_metadata(media_file, tags, try_sidecar=True, struct=False):
    """Get values for each metadata tag in *tags* from *media_file*.
    If *try_sidecar* is `True`, use the value set in any XMP sidecar file
    stored alongside *media_file*.
    If *struct* is `True`, use the exiftool instance which returns structured data

    Returns a list with the value of each tag in *tags* or `None` if the
    tag was not found.

    """
    files_by_reverse_priority = _get_existing_metadata_files_reversed(
        media_file, try_sidecar
    )

    json = {
        "tags": tags,
        "files_by_reverse_priority": files_by_reverse_priority,
        "struct": struct,
    }
    response = requests.post("http://localhost:8010/get-tags", json=json).json()
    return response["values"]


================================================
FILE: api/metadata/tags.py
================================================
class Tags:
    RATING = "Rating"
    IMAGE_HEIGHT = "ImageHeight"
    IMAGE_WIDTH = "ImageWidth"
    DATE_TIME_ORIGINAL = "EXIF:DateTimeOriginal"
    DATE_TIME = "EXIF:DateTime"
    QUICKTIME_CREATE_DATE = "QuickTime:CreateDate"
    QUICKTIME_DURATION = "QuickTime:Duration"
    LATITUDE = "Composite:GPSLatitude"
    LONGITUDE = "Composite:GPSLongitude"
    GPS_DATE_TIME = "Composite:GPSDateTime"
    FILE_SIZE = "File:FileSize"
    FSTOP = "EXIF:FNumber"
    EXPOSURE_TIME = "EXIF:ExposureTime"
    ISO = "EXIF:ISOSpeedRatings"
    FOCAL_LENGTH = "EXIF:FocalLength"
    FOCAL_LENGTH_35MM = "EXIF:FocalLengthIn35mmFilm"
    SHUTTER_SPEED = "EXIF:ShutterSpeedValue"
    CAMERA = "EXIF:Model"
    LENS = "EXIF:LensModel"
    SUBJECT_DISTANCE = "EXIF:SubjectDistance"
    DIGITAL_ZOOM_RATIO = "EXIF:DigitalZoomRatio"
    REGION_INFO = "XMP:RegionInfo"
    REGION_INFO_WRITE = "XMP-mwg-rs:RegionInfo"
    SUBJECT = "XMP:Subject"
    ROTATION = "QuickTime:Rotation"
    ORIENTATION = "EXIF:Orientation"

    # Burst/sequence detection tags
    SUBSEC_TIME_ORIGINAL = "EXIF:SubSecTimeOriginal"
    SUBSEC_TIME = "EXIF:SubSecTime"
    IMAGE_NUMBER = "EXIF:ImageNumber"
    IMAGE_UNIQUE_ID = "EXIF:ImageUniqueID"
    BURST_MODE = "MakerNotes:BurstMode"
    CONTINUOUS_DRIVE = "MakerNotes:ContinuousDrive"
    SEQUENCE_NUMBER = "MakerNotes:SequenceNumber"
    # Camera serial number (useful for grouping shots from same camera)
    SERIAL_NUMBER = "EXIF:SerialNumber"
    CAMERA_SERIAL = "MakerNotes:SerialNumber"


================================================
FILE: api/metadata/writer.py
================================================
import os

import exiftool

from api.metadata.reader import get_sidecar_files_in_priority_order
from api.util import logger


def write_metadata(media_file, tags, use_sidecar=True):
    et = exiftool.ExifTool()
    terminate_et = False
    if not et.running:
        et.start()
        terminate_et = True
    # To-Do: Replace with new File Structure
    if use_sidecar:
        file_path = get_sidecar_files_in_priority_order(media_file)[0]
    else:
        file_path = media_file

    try:
        logger.info(f"Writing {tags} to {file_path}")
        params = []
        for tag, value in tags.items():
            if isinstance(value, list):
                for item in value:
                    params.append(os.fsencode(f"-{tag}={item}"))
            else:
                params.append(os.fsencode(f"-{tag}={value}"))
        params.append(b"-overwrite_original")
        params.append(os.fsencode(file_path))
        et.execute(*params)
    finally:
        if terminate_et:
            et.terminate()


================================================
FILE: api/middleware.py
================================================
class FingerPrintMiddleware:
    def __init__(self, get_response):
        self.get_response = get_response
        # One-time configuration and initializatio

    def __call__(self, request):
        response = self.get_response(request)
        import hashlib

        fingerprint_raw = "".join(
            (
                request.META.get("HTTP_USER_AGENT", ""),
                request.META.get("HTTP_ACCEPT_ENCODING", ""),
            )
        )
        # print(fingerprint_raw)
        fingerprint = hashlib.md5(fingerprint_raw.encode("utf-8")).hexdigest()
        request.fingerprint = fingerprint
        # print(fingerprint)
        return response


================================================
FILE: api/migrations/0001_initial.py
================================================
# Generated by Django 2.1.2 on 2020-11-15 18:49

import datetime

import django.contrib.auth.models
import django.contrib.auth.validators
import django.contrib.postgres.fields.jsonb
import django.utils.timezone
import django_cryptography.fields
from django.conf import settings
from django.db import migrations, models

import api.models


class Migration(migrations.Migration):
    initial = True

    dependencies = [
        ("auth", "0009_alter_user_last_name_max_length"),
    ]

    operations = [
        migrations.CreateModel(
            name="User",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("password", models.CharField(max_length=128, verbose_name="password")),
                (
                    "last_login",
                    models.DateTimeField(
                        blank=True, null=True, verbose_name="last login"
                    ),
                ),
                (
                    "is_superuser",
                    models.BooleanField(
                        default=False,
                        help_text="Designates that this user has all permissions without explicitly assigning them.",
                        verbose_name="superuser status",
                    ),
                ),
                (
                    "username",
                    models.CharField(
                        error_messages={
                            "unique": "A user with that username already exists."
                        },
                        help_text="Required. 150 characters or fewer. Letters, digits and @/./+/-/_ only.",
                        max_length=150,
                        unique=True,
                        validators=[
                            django.contrib.auth.validators.UnicodeUsernameValidator()
                        ],
                        verbose_name="username",
                    ),
                ),
                (
                    "first_name",
                    models.CharField(
                        blank=True, max_length=30, verbose_name="first name"
                    ),
                ),
                (
                    "last_name",
                    models.CharField(
                        blank=True, max_length=150, verbose_name="last name"
                    ),
                ),
                (
                    "email",
                    models.EmailField(
                        blank=True, max_length=254, verbose_name="email address"
                    ),
                ),
                (
                    "is_staff",
                    models.BooleanField(
                        default=False,
                        help_text="Designates whether the user can log into this admin site.",
                        verbose_name="staff status",
                    ),
                ),
                (
                    "is_active",
                    models.BooleanField(
                        default=True,
                        help_text="Designates whether this user should be treated as active. Unselect this instead of deleting accounts.",
                        verbose_name="active",
                    ),
                ),
                (
                    "date_joined",
                    models.DateTimeField(
                        default=django.utils.timezone.now, verbose_name="date joined"
                    ),
                ),
                ("scan_directory", models.CharField(db_index=True, max_length=512)),
                ("avatar", models.ImageField(null=True, upload_to="avatars")),
                (
                    "nextcloud_server_address",
                    models.CharField(default=None, max_length=200, null=True),
                ),
                (
                    "nextcloud_username",
                    models.CharField(default=None, max_length=64, null=True),
                ),
                (
                    "nextcloud_app_password",
                    django_cryptography.fields.encrypt(
                        models.CharField(default=None, max_length=64, null=True)
                    ),
                ),
                (
                    "nextcloud_scan_directory",
                    models.CharField(db_index=True, max_length=512, null=True),
                ),
                (
                    "groups",
                    models.ManyToManyField(
                        blank=True,
                        help_text="The groups this user belongs to. A user will get all permissions granted to each of their groups.",
                        related_name="user_set",
                        related_query_name="user",
                        to="auth.Group",
                        verbose_name="groups",
                    ),
                ),
                (
                    "user_permissions",
                    models.ManyToManyField(
                        blank=True,
                        help_text="Specific permissions for this user.",
                        related_name="user_set",
                        related_query_name="user",
                        to="auth.Permission",
                        verbose_name="user permissions",
                    ),
                ),
            ],
            options={
                "verbose_name": "user",
                "verbose_name_plural": "users",
                "abstract": False,
            },
            managers=[
                ("objects", django.contrib.auth.models.UserManager()),
            ],
        ),
        migrations.CreateModel(
            name="AlbumAuto",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(blank=True, max_length=512, null=True)),
                ("timestamp", models.DateTimeField(db_index=True)),
                ("created_on", models.DateTimeField(db_index=True)),
                ("gps_lat", models.FloatField(blank=True, null=True)),
                ("gps_lon", models.FloatField(blank=True, null=True)),
                ("favorited", models.BooleanField(db_index=True, default=False)),
                (
                    "owner",
                    models.ForeignKey(
                        default=None,
                        on_delete=models.SET(api.models.user.get_deleted_user),
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        migrations.CreateModel(
            name="AlbumDate",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                (
                    "title",
                    models.CharField(
                        blank=True, db_index=True, max_length=512, null=True
                    ),
                ),
                ("date", models.DateField(db_index=True, null=True)),
                ("favorited", models.BooleanField(db_index=True, default=False)),
                (
                    "location",
                    django.contrib.postgres.fields.jsonb.JSONField(
                        blank=True, db_index=True, null=True
                    ),
                ),
                (
                    "owner",
                    models.ForeignKey(
                        default=None,
                        on_delete=models.SET(api.models.user.get_deleted_user),
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        migrations.CreateModel(
            name="AlbumPlace",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(db_index=True, max_length=512)),
                ("geolocation_level", models.IntegerField(db_index=True, null=True)),
                ("favorited", models.BooleanField(db_index=True, default=False)),
            ],
        ),
        migrations.CreateModel(
            name="AlbumThing",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(db_index=True, max_length=512)),
                (
                    "thing_type",
                    models.CharField(db_index=True, max_length=512, null=True),
                ),
                ("favorited", models.BooleanField(db_index=True, default=False)),
            ],
        ),
        migrations.CreateModel(
            name="AlbumUser",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(max_length=512)),
                ("created_on", models.DateTimeField(auto_now=True, db_index=True)),
                ("favorited", models.BooleanField(db_index=True, default=False)),
                ("public", models.BooleanField(db_index=True, default=False)),
            ],
        ),
        migrations.CreateModel(
            name="Face",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("image", models.ImageField(upload_to="faces")),
                ("image_path", models.FilePathField()),
                ("person_label_is_inferred", models.NullBooleanField(db_index=True)),
                (
                    "person_label_probability",
                    models.FloatField(db_index=True, default=0.0),
                ),
                ("location_top", models.IntegerField()),
                ("location_bottom", models.IntegerField()),
                ("location_left", models.IntegerField()),
                ("location_right", models.IntegerField()),
                ("encoding", models.TextField()),
            ],
        ),
        migrations.CreateModel(
            name="LongRunningJob",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                (
                    "job_type",
                    models.PositiveIntegerField(
                        choices=[
                            (1, "Scan Photos"),
                            (2, "Generate Event Albums"),
                            (3, "Regenerate Event Titles"),
                            (4, "Train Faces"),
                        ]
                    ),
                ),
                ("finished", models.BooleanField(default=False)),
                ("failed", models.BooleanField(default=False)),
                ("job_id", models.CharField(db_index=True, max_length=36, unique=True)),
                ("queued_at", models.DateTimeField(default=datetime.datetime.now)),
                ("started_at", models.DateTimeField(null=True)),
                ("finished_at", models.DateTimeField(null=True)),
                (
                    "result",
                    django.contrib.postgres.fields.jsonb.JSONField(
                        default={"progress": {"target": 0, "current": 0}}
                    ),
                ),
                (
                    "started_by",
                    models.ForeignKey(
                        default=None,
                        on_delete=models.SET(api.models.user.get_deleted_user),
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        migrations.CreateModel(
            name="Person",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("name", models.CharField(max_length=128)),
                (
                    "kind",
                    models.CharField(
                        choices=[
                            ("USER", "User Labelled"),
                            ("CLUSTER", "Cluster ID"),
                            ("UNKNOWN", "Unknown Person"),
                        ],
                        max_length=10,
                    ),
                ),
                ("mean_face_encoding", models.TextField()),
                ("cluster_id", models.IntegerField(null=True)),
                (
                    "account",
                    models.OneToOneField(
                        default=None,
                        null=True,
                        on_delete=models.SET(api.models.user.get_deleted_user),
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        migrations.CreateModel(
            name="Photo",
            fields=[
                ("image_path", models.CharField(db_index=True, max_length=512)),
                (
                    "image_hash",
                    models.CharField(max_length=64, primary_key=True, serialize=False),
                ),
                ("thumbnail", models.ImageField(upload_to="thumbnails")),
                ("thumbnail_tiny", models.ImageField(upload_to="thumbnails_tiny")),
                ("thumbnail_small", models.ImageField(upload_to="thumbnails_small")),
                ("thumbnail_big", models.ImageField(upload_to="thumbnails_big")),
                ("square_thumbnail", models.ImageField(upload_to="square_thumbnails")),
                (
                    "square_thumbnail_tiny",
                    models.ImageField(upload_to="square_thumbnails_tiny"),
                ),
                (
                    "square_thumbnail_small",
                    models.ImageField(upload_to="square_thumbnails_small"),
                ),
                (
                    "square_thumbnail_big",
                    models.ImageField(upload_to="square_thumbnails_big"),
                ),
                ("image", models.ImageField(upload_to="photos")),
                ("added_on", models.DateTimeField(db_index=True)),
                ("exif_gps_lat", models.FloatField(blank=True, null=True)),
                ("exif_gps_lon", models.FloatField(blank=True, null=True)),
                (
                    "exif_timestamp",
                    models.DateTimeField(blank=True, db_index=True, null=True),
                ),
                (
                    "exif_json",
                    django.contrib.postgres.fields.jsonb.JSONField(
                        blank=True, null=True
                    ),
                ),
                (
                    "geolocation_json",
                    django.contrib.postgres.fields.jsonb.JSONField(
                        blank=True, db_index=True, null=True
                    ),
                ),
                (
                    "captions_json",
                    django.contrib.postgres.fields.jsonb.JSONField(
                        blank=True, db_index=True, null=True
                    ),
                ),
                (
                    "search_captions",
                    models.TextField(blank=True, db_index=True, null=True),
                ),
                (
                    "search_location",
                    models.TextField(blank=True, db_index=True, null=True),
                ),
                ("favorited", models.BooleanField(db_index=True, default=False)),
                ("hidden", models.BooleanField(db_index=True, default=False)),
                ("public", models.BooleanField(db_index=True, default=False)),
                ("encoding", models.TextField(default=None, null=True)),
                (
                    "owner",
                    models.ForeignKey(
                        default=None,
                        on_delete=models.SET(api.models.user.get_deleted_user),
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
                (
                    "shared_to",
                    models.ManyToManyField(
                        related_name="photo_shared_to", to=settings.AUTH_USER_MODEL
                    ),
                ),
            ],
        ),
        migrations.AddField(
            model_name="face",
            name="person",
            field=models.ForeignKey(
                on_delete=models.SET(api.models.person.get_unknown_person),
                related_name="faces",
                to="api.Person",
            ),
        ),
        migrations.AddField(
            model_name="face",
            name="photo",
            field=models.ForeignKey(
                null=True,
                on_delete=models.SET(api.models.person.get_unknown_person),
                related_name="faces",
                to="api.Photo",
            ),
        ),
        migrations.AddField(
            model_name="albumuser",
            name="cover_photos",
            field=models.ManyToManyField(
                related_name="album_user_cover_photos", to="api.Photo"
            ),
        ),
        migrations.AddField(
            model_name="albumuser",
            name="owner",
            field=models.ForeignKey(
                default=None,
                on_delete=models.SET(api.models.user.get_deleted_user),
                to=settings.AUTH_USER_MODEL,
            ),
        ),
        migrations.AddField(
            model_name="albumuser",
            name="photos",
            field=models.ManyToManyField(to="api.Photo"),
        ),
        migrations.AddField(
            model_name="albumuser",
            name="shared_to",
            field=models.ManyToManyField(
                related_name="album_user_shared_to", to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AddField(
            model_name="albumthing",
            name="cover_photos",
            field=models.ManyToManyField(
                related_name="album_thing_cover_photos", to="api.Photo"
            ),
        ),
        migrations.AddField(
            model_name="albumthing",
            name="owner",
            field=models.ForeignKey(
                default=None,
                on_delete=models.SET(api.models.user.get_deleted_user),
                to=settings.AUTH_USER_MODEL,
            ),
        ),
        migrations.AddField(
            model_name="albumthing",
            name="photos",
            field=models.ManyToManyField(to="api.Photo"),
        ),
        migrations.AddField(
            model_name="albumthing",
            name="shared_to",
            field=models.ManyToManyField(
                related_name="album_thing_shared_to", to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AddField(
            model_name="albumplace",
            name="cover_photos",
            field=models.ManyToManyField(
                related_name="album_place_cover_photos", to="api.Photo"
            ),
        ),
        migrations.AddField(
            model_name="albumplace",
            name="owner",
            field=models.ForeignKey(
                default=None,
                on_delete=models.SET(api.models.user.get_deleted_user),
                to=settings.AUTH_USER_MODEL,
            ),
        ),
        migrations.AddField(
            model_name="albumplace",
            name="photos",
            field=models.ManyToManyField(to="api.Photo"),
        ),
        migrations.AddField(
            model_name="albumplace",
            name="shared_to",
            field=models.ManyToManyField(
                related_name="album_place_shared_to", to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AddField(
            model_name="albumdate",
            name="photos",
            field=models.ManyToManyField(to="api.Photo"),
        ),
        migrations.AddField(
            model_name="albumdate",
            name="shared_to",
            field=models.ManyToManyField(
                related_name="album_date_shared_to", to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AddField(
            model_name="albumauto",
            name="photos",
            field=models.ManyToManyField(to="api.Photo"),
        ),
        migrations.AddField(
            model_name="albumauto",
            name="shared_to",
            field=models.ManyToManyField(
                related_name="album_auto_shared_to", to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AlterUniqueTogether(
            name="albumuser",
            unique_together={("title", "owner")},
        ),
        migrations.AlterUniqueTogether(
            name="albumthing",
            unique_together={("title", "owner")},
        ),
        migrations.AlterUniqueTogether(
            name="albumplace",
            unique_together={("title", "owner")},
        ),
        migrations.AlterUniqueTogether(
            name="albumdate",
            unique_together={("date", "owner")},
        ),
        migrations.AlterUniqueTogether(
            name="albumauto",
            unique_together={("timestamp", "owner")},
        ),
        migrations.RemoveField(model_name="albumplace", name="cover_photos"),
        migrations.RemoveField(model_name="albumthing", name="cover_photos"),
        migrations.RemoveField(model_name="albumuser", name="cover_photos"),
    ]


================================================
FILE: api/migrations/0002_add_confidence.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0001_initial"),
    ]

    operations = [
        migrations.AddField(
            model_name="User",
            name="confidence",
            field=models.FloatField(default=0.1, db_index=True),
        )
    ]


================================================
FILE: api/migrations/0003_remove_unused_thumbs.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0002_add_confidence"),
    ]

    operations = [
        migrations.RemoveField(model_name="Photo", name="thumbnail_tiny"),
        migrations.RemoveField(model_name="Photo", name="thumbnail_small"),
        migrations.RemoveField(model_name="Photo", name="thumbnail"),
        migrations.RemoveField(model_name="Photo", name="square_thumbnail_tiny"),
        migrations.RemoveField(model_name="Photo", name="square_thumbnail_big"),
    ]


================================================
FILE: api/migrations/0004_fix_album_thing_constraint.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0003_remove_unused_thumbs"),
    ]

    operations = [
        migrations.AlterUniqueTogether(
            name="albumthing",
            unique_together=set([]),
        ),
        migrations.AddConstraint(
            model_name="albumthing",
            constraint=models.UniqueConstraint(
                fields=["title", "thing_type", "owner"],
                name="unique AlbumThing",
            ),
        ),
    ]


================================================
FILE: api/migrations/0005_add_video_to_photo.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0004_fix_album_thing_constraint"),
    ]

    operations = [
        migrations.AddField(
            model_name="Photo", name="video", field=models.BooleanField(default=False)
        )
    ]


================================================
FILE: api/migrations/0006_migrate_to_boolean_field.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0005_add_video_to_photo"),
    ]

    operations = [
        migrations.AlterField(
            model_name="Face",
            name="person_label_is_inferred",
            field=models.BooleanField(null=True, db_index=True),
        )
    ]


================================================
FILE: api/migrations/0007_migrate_to_json_field.py
================================================
import json

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0006_migrate_to_boolean_field"),
    ]

    def forwards_func(apps, schema):
        Photo = apps.get_model("api", "Photo")
        for obj in Photo.objects.all():
            try:
                obj.image_paths.append(obj.image_path)
                obj.save()
            except json.decoder.JSONDecodeError:
                print("Cannot convert {} object".format(obj.image_path))

    operations = [
        migrations.AddField(
            model_name="Photo",
            name="image_paths",
            field=models.JSONField(db_index=True, default=list),
        ),
        migrations.RunPython(forwards_func),
    ]


================================================
FILE: api/migrations/0008_remove_image_path.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0007_migrate_to_json_field"),
    ]

    operations = [
        migrations.RemoveField(model_name="Photo", name="image_path"),
    ]


================================================
FILE: api/migrations/0009_add_aspect_ratio.py
================================================
import exiftool
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0008_remove_image_path"),
    ]

    def forwards_func(apps, schema):
        Photo = apps.get_model("api", "Photo")
        with exiftool.ExifTool() as et:
            for obj in Photo.objects.all():
                if obj.thumbnail_big:
                    try:
                        height = et.get_tag("ImageHeight", obj.thumbnail_big.path)
                        width = et.get_tag("ImageWidth", obj.thumbnail_big.path)
                        obj.aspect_ratio = round((width / height), 2)
                        obj.save()
                    except Exception:
                        print("Cannot convert {} object".format(obj))

    operations = [
        migrations.AddField(
            model_name="Photo",
            name="aspect_ratio",
            field=models.FloatField(blank=True, null=True),
        ),
        migrations.RunPython(forwards_func),
    ]


================================================
FILE: api/migrations/0009_add_clip_embedding_field.py
================================================
from django.contrib.postgres.fields import ArrayField
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0008_remove_image_path"),
    ]

    operations = [
        migrations.AddField(
            model_name="Photo",
            name="clip_embeddings",
            field=ArrayField(
                models.FloatField(blank=True, null=True), size=512, null=True
            ),
        ),
        migrations.AddField(
            model_name="Photo",
            name="clip_embeddings_magnitude",
            field=models.FloatField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="User",
            name="semantic_search_topk",
            field=models.IntegerField(default=0, null=False),
        ),
        migrations.RemoveField(
            model_name="Photo",
            name="encoding",
        ),
    ]


================================================
FILE: api/migrations/0010_merge_20210725_1547.py
================================================
# Generated by Django 3.1.8 on 2021-07-25 21:47

from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0009_add_aspect_ratio"),
        ("api", "0009_add_clip_embedding_field"),
    ]

    operations = []


================================================
FILE: api/migrations/0011_a_add_rating.py
================================================
# Generated by Django 3.1.8 on 2021-08-06 11:32

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0010_merge_20210725_1547"),
    ]

    run_before = [("api", "0011_b_migrate_favorited_to_rating")]

    operations = [
        migrations.AddField(
            model_name="photo",
            name="rating",
            field=models.IntegerField(db_index=True, default=0),
        ),
    ]


================================================
FILE: api/migrations/0011_b_migrate_favorited_to_rating.py
================================================
# Generated by Django 3.1.8 on 2021-08-06 11:32

from django.db import migrations


def favorited_to_rating(apps, schema_editor):
    Photo = apps.get_model("api", "Photo")
    for photo in Photo.objects.all():
        photo.rating = 4 if photo.favorited else 0
        photo.save()


def rating_to_favorited(apps, schema_editor):
    Photo = apps.get_model("api", "Photo")
    for photo in Photo.objects.all():
        photo.favorited = photo.rating >= 4
        photo.save()


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0011_a_add_rating"),
    ]

    run_before = [("api", "0011_c_remove_favorited")]

    operations = [migrations.RunPython(favorited_to_rating, rating_to_favorited)]


================================================
FILE: api/migrations/0011_c_remove_favorited.py
================================================
# Generated by Django 3.1.8 on 2021-08-06 11:32

from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0011_b_migrate_favorited_to_rating"),
    ]

    operations = [
        migrations.RemoveField(
            model_name="photo",
            name="favorited",
        ),
    ]


================================================
FILE: api/migrations/0012_add_favorite_min_rating.py
================================================
# Generated by Django 3.1.8 on 2021-08-08 17:05

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0011_c_remove_favorited"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="favorite_min_rating",
            field=models.IntegerField(db_index=True, default=4),
        ),
    ]


================================================
FILE: api/migrations/0013_add_image_scale_and_misc.py
================================================
# Generated by Django 3.1.8 on 2021-09-09 16:06

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0012_add_favorite_min_rating"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="image_scale",
            field=models.FloatField(default=1),
        ),
        migrations.AlterField(
            model_name="albumdate",
            name="location",
            field=models.JSONField(blank=True, db_index=True, null=True),
        ),
        migrations.AlterField(
            model_name="face",
            name="image",
            field=models.ImageField(null=True, upload_to="faces"),
        ),
        migrations.AlterField(
            model_name="face",
            name="photo",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                related_name="faces",
                to="api.photo",
            ),
        ),
        migrations.AlterField(
            model_name="longrunningjob",
            name="job_type",
            field=models.PositiveIntegerField(
                choices=[
                    (1, "Scan Photos"),
                    (2, "Generate Event Albums"),
                    (3, "Regenerate Event Titles"),
                    (4, "Train Faces"),
                    (5, "Delete Missing Photos"),
                    (7, "Scan Faces"),
                    (6, "Calculate Clip Embeddings"),
                ]
            ),
        ),
        migrations.AlterField(
            model_name="longrunningjob",
            name="result",
            field=models.JSONField(default={"progress": {"target": 0, "current": 0}}),
        ),
        migrations.AlterField(
            model_name="photo",
            name="captions_json",
            field=models.JSONField(blank=True, db_index=True, null=True),
        ),
        migrations.AlterField(
            model_name="photo",
            name="exif_json",
            field=models.JSONField(blank=True, null=True),
        ),
        migrations.AlterField(
            model_name="photo",
            name="geolocation_json",
            field=models.JSONField(blank=True, db_index=True, null=True),
        ),
        migrations.AlterField(
            model_name="photo",
            name="image_paths",
            field=models.JSONField(default=list),
        ),
        migrations.AlterField(
            model_name="user",
            name="first_name",
            field=models.CharField(
                blank=True, max_length=150, verbose_name="first name"
            ),
        ),
    ]


================================================
FILE: api/migrations/0014_add_save_metadata_to_disk.py
================================================
# Generated by Django 3.1.8 on 2021-08-08 17:05

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0013_add_image_scale_and_misc"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="save_metadata_to_disk",
            field=models.TextField(
                choices=[
                    ("OFF", "Off"),
                    ("MEDIA_FILE", "Media File"),
                    ("SIDECAR_FILE", "Sidecar File"),
                ],
                default="OFF",
            ),
        ),
    ]


================================================
FILE: api/migrations/0015_add_dominant_color.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0014_add_save_metadata_to_disk"),
    ]
    operations = [
        migrations.AddField(
            model_name="Photo",
            name="dominant_color",
            field=models.TextField(blank=True, null=True),
        ),
    ]


================================================
FILE: api/migrations/0016_add_transcode_videos.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0015_add_dominant_color"),
    ]
    operations = [
        migrations.AddField(
            model_name="User",
            name="transcode_videos",
            field=models.BooleanField(default=False),
        ),
    ]


================================================
FILE: api/migrations/0017_add_cover_photo.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0016_add_transcode_videos"),
    ]
    operations = [
        migrations.AddField(
            model_name="Person",
            name="cover_photo",
            field=models.ForeignKey(
                to="api.Photo",
                related_name="person",
                on_delete=models.PROTECT,
                blank=False,
                null=True,
            ),
        ),
    ]


================================================
FILE: api/migrations/0018_user_config_datetime_rules.py
================================================
# Generated by Django 3.1.14 on 2022-01-24 17:11

from django.db import migrations, models

import api.models.user


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0017_add_cover_photo"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="config_datetime_rules",
            field=models.JSONField(
                default=api.models.user.get_default_config_datetime_rules
            ),
        ),
    ]


================================================
FILE: api/migrations/0019_change_config_datetime_rules.py
================================================
# Generated by Django 3.1.14 on 2022-01-24 17:11

from django.db import migrations, models

import api.models.user


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0018_user_config_datetime_rules"),
    ]

    operations = [
        migrations.RemoveField(
            model_name="user",
            name="config_datetime_rules",
        ),
        migrations.AddField(
            model_name="user",
            name="datetime_rules",
            field=models.JSONField(
                default=api.models.user.get_default_config_datetime_rules
            ),
        ),
    ]


================================================
FILE: api/migrations/0020_add_default_timezone.py
================================================
# Generated by Django 3.1.14 on 2022-01-24 17:11

import pytz
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0019_change_config_datetime_rules"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="default_timezone",
            field=models.TextField(
                choices=[(x, x) for x in pytz.all_timezones],
                default="UTC",
            ),
        ),
    ]


================================================
FILE: api/migrations/0021_remove_photo_image.py
================================================
# Generated by Django 3.1.14 on 2022-02-01 22:42

from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0020_add_default_timezone"),
    ]

    operations = [
        migrations.RemoveField(
            model_name="photo",
            name="image",
        ),
    ]


================================================
FILE: api/migrations/0022_photo_video_length.py
================================================
# Generated by Django 3.1.14 on 2022-02-20 11:16

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0021_remove_photo_image"),
    ]

    operations = [
        migrations.AddField(
            model_name="photo",
            name="video_length",
            field=models.TextField(blank=True, null=True),
        ),
    ]


================================================
FILE: api/migrations/0023_photo_deleted.py
================================================
# Generated by Django 3.1.14 on 2022-02-23 21:29

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0022_photo_video_length"),
    ]

    operations = [
        migrations.AddField(
            model_name="photo",
            name="deleted",
            field=models.BooleanField(db_index=True, default=False),
        ),
    ]


================================================
FILE: api/migrations/0024_photo_timestamp.py
================================================
# Generated by Django 3.1.14 on 2022-03-18 10:35

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0023_photo_deleted"),
    ]

    operations = [
        migrations.AddField(
            model_name="photo",
            name="timestamp",
            field=models.DateTimeField(blank=True, db_index=True, null=True),
        ),
    ]


================================================
FILE: api/migrations/0025_add_cover_photo.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0024_photo_timestamp"),
    ]
    operations = [
        migrations.AddField(
            model_name="AlbumUser",
            name="cover_photo",
            field=models.ForeignKey(
                to="api.Photo",
                related_name="album_user",
                on_delete=models.PROTECT,
                blank=False,
                null=True,
            ),
        ),
    ]


================================================
FILE: api/migrations/0026_add_cluster_info.py
================================================
# Generated by Django 3.1.14 on 2022-07-15 21:19

import django.db.models.deletion
import django.db.models.manager
from django.conf import settings
from django.db import migrations, models

import api.models.person


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0025_add_cover_photo"),
    ]

    operations = [
        migrations.AlterModelManagers(
            name="albumdate",
            managers=[
                ("visible", django.db.models.manager.Manager()),
            ],
        ),
        migrations.RemoveField(
            model_name="person",
            name="cluster_id",
        ),
        migrations.AlterField(
            model_name="person",
            name="mean_face_encoding",
            field=models.TextField(default="default"),
        ),
        migrations.RemoveField(
            model_name="person",
            name="mean_face_encoding",
        ),
        migrations.AlterField(
            model_name="longrunningjob",
            name="job_type",
            field=models.PositiveIntegerField(
                choices=[
                    (1, "Scan Photos"),
                    (2, "Generate Event Albums"),
                    (3, "Regenerate Event Titles"),
                    (4, "Train Faces"),
                    (5, "Delete Missing Photos"),
                    (7, "Scan Faces"),
                    (6, "Calculate Clip Embeddings"),
                    (8, "Find Similar Faces"),
                ]
            ),
        ),
        migrations.CreateModel(
            name="Cluster",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("mean_face_encoding", models.TextField()),
                ("cluster_id", models.IntegerField(null=True)),
                ("name", models.TextField(null=True)),
                (
                    "person",
                    models.ForeignKey(
                        blank=True,
                        null=True,
                        on_delete=models.SET(api.models.person.get_unknown_person),
                        related_name="clusters",
                        to="api.person",
                    ),
                ),
                (
                    "owner",
                    models.ForeignKey(
                        default=None,
                        null=True,
                        on_delete=models.SET(api.models.user.get_deleted_user),
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        migrations.AddField(
            model_name="face",
            name="cluster",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=models.SET(api.models.cluster.get_unknown_cluster),
                related_name="faces",
                to="api.cluster",
            ),
        ),
        migrations.AddField(
            model_name="person",
            name="cluster_owner",
            field=models.ForeignKey(
                default=None,
                null=True,
                related_name="owner",
                on_delete=models.SET(api.models.user.get_deleted_user),
                to=settings.AUTH_USER_MODEL,
            ),
        ),
    ]


================================================
FILE: api/migrations/0027_rename_unknown_person.py
================================================
# Generated by Django 3.1.14 on 2022-07-17 19:07
from django.db import migrations

UNKNOWN_PERSON_NAME = "Unknown - Other"
KIND_UNKNOWN = "UNKNOWN"


def migrate_unknown(apps, schema_editor):
    Person = apps.get_model("api", "Person")
    person: Person
    try:
        person = Person.objects.get(name="unknown")
        person.name = UNKNOWN_PERSON_NAME
        person.kind = KIND_UNKNOWN
        person.save()
    except Person.DoesNotExist:
        unknown_person: Person = Person.objects.get_or_create(
            name=UNKNOWN_PERSON_NAME, cluster_owner=None, kind=KIND_UNKNOWN
        )[0]
        if unknown_person.kind != KIND_UNKNOWN:
            unknown_person.kind = KIND_UNKNOWN
            unknown_person.save()


def unmigrate_unknown(apps, schema_editor):
    Person = apps.get_model("api", "Person")
    try:
        person: Person = Person.objects.get(name=UNKNOWN_PERSON_NAME)
        person.name = "unknown"
        person.kind = ""
        person.save()
    except Person.DoesNotExist:
        pass


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0026_add_cluster_info"),
    ]

    operations = [migrations.RunPython(migrate_unknown, unmigrate_unknown)]


================================================
FILE: api/migrations/0028_add_metadata_fields.py
================================================
# Generated by Django 3.1.14 on 2022-07-30 11:47

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0027_rename_unknown_person"),
    ]

    operations = [
        migrations.AddField(
            model_name="photo",
            name="camera",
            field=models.TextField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="digitalZoomRatio",
            field=models.FloatField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="focalLength35Equivalent",
            field=models.IntegerField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="focal_length",
            field=models.FloatField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="fstop",
            field=models.FloatField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="height",
            field=models.IntegerField(default=0),
        ),
        migrations.AddField(
            model_name="photo",
            name="iso",
            field=models.IntegerField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="lens",
            field=models.TextField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="shutter_speed",
            field=models.FloatField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="size",
            field=models.IntegerField(default=0),
        ),
        migrations.AddField(
            model_name="photo",
            name="subjectDistance",
            field=models.FloatField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="photo",
            name="width",
            field=models.IntegerField(default=0),
        ),
    ]


================================================
FILE: api/migrations/0029_change_to_text_field.py
================================================
# Generated by Django 3.1.14 on 2022-07-31 11:35

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0028_add_metadata_fields"),
    ]

    operations = [
        migrations.AlterField(
            model_name="photo",
            name="shutter_speed",
            field=models.TextField(blank=True, null=True),
        ),
    ]


================================================
FILE: api/migrations/0030_user_confidence_person.py
================================================
# Generated by Django 3.1.14 on 2022-08-08 13:39

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0029_change_to_text_field"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="confidence_person",
            field=models.FloatField(default=0.9),
        ),
    ]


================================================
FILE: api/migrations/0031_remove_account.py
================================================
# Generated by Django 3.1.14 on 2022-09-01 16:28

from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0030_user_confidence_person"),
    ]

    operations = [
        migrations.AlterModelManagers(
            name="albumdate",
            managers=[],
        ),
        migrations.RemoveField(
            model_name="person",
            name="account",
        ),
    ]


================================================
FILE: api/migrations/0032_always_have_owner.py
================================================
# Generated by Django 3.1.8 on 2021-08-06 11:32

from django.db import migrations


def add_cluster_owner(apps, schema_editor):
    Person = apps.get_model("api", "Person")
    for person in Person.objects.all():
        if person.faces.first():
            person.cluster_owner = person.faces.first().photo.owner
            person.save()


def remove_cluster_owner(apps, schema_editor):
    Person = apps.get_model("api", "Person")
    for person in Person.objects.all():
        person.cluster_owner = None


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0031_remove_account"),
    ]

    operations = [migrations.RunPython(add_cluster_owner, remove_cluster_owner)]


================================================
FILE: api/migrations/0033_add_post_delete_person.py
================================================
# Generated by Django 3.1.14 on 2022-09-02 10:23

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0032_always_have_owner"),
    ]

    operations = [
        migrations.AlterField(
            model_name="face",
            name="person",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.DO_NOTHING,
                related_name="faces",
                to="api.person",
            ),
        ),
    ]


================================================
FILE: api/migrations/0034_allow_deleting_person.py
================================================
# Generated by Django 3.1.14 on 2022-09-02 10:26

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0033_add_post_delete_person"),
    ]

    operations = [
        migrations.AlterField(
            model_name="person",
            name="cover_photo",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="person",
                to="api.photo",
            ),
        ),
    ]


================================================
FILE: api/migrations/0035_add_files_model.py
================================================
# Generated by Django 3.1.14 on 2022-11-09 17:35

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0034_allow_deleting_person"),
    ]

    operations = [
        migrations.CreateModel(
            name="File",
            fields=[
                (
                    "hash",
                    models.CharField(max_length=64, primary_key=True, serialize=False),
                ),
                ("path", models.TextField(blank=True, null=True)),
                (
                    "type",
                    models.PositiveIntegerField(
                        blank=True,
                        choices=[
                            (1, "Image"),
                            (2, "Video"),
                            (3, "Metadata File e.g. XMP"),
                            (4, "Raw File"),
                        ],
                    ),
                ),
            ],
        ),
        migrations.AddField(
            model_name="photo",
            name="files",
            field=models.ManyToManyField(to="api.File"),
        ),
        migrations.AddField(
            model_name="photo",
            name="main_file",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.PROTECT,
                related_name="main_photo",
                to="api.file",
            ),
        ),
    ]


================================================
FILE: api/migrations/0036_handle_missing_files.py
================================================
# Generated by Django 3.1.14 on 2022-11-10 08:41

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0035_add_files_model"),
    ]

    operations = [
        migrations.AddField(
            model_name="file",
            name="missing",
            field=models.BooleanField(default=False),
        ),
        migrations.AlterField(
            model_name="file",
            name="type",
            field=models.PositiveIntegerField(
                blank=True,
                choices=[
                    (1, "Image"),
                    (2, "Video"),
                    (3, "Metadata File e.g. XMP"),
                    (4, "Raw File"),
                    (5, "Unknown"),
                ],
            ),
        ),
    ]


================================================
FILE: api/migrations/0037_migrate_to_files.py
================================================
import os

from django.db import migrations

from api.models.file import is_metadata, is_raw, is_video

IMAGE = 1
VIDEO = 2
METADATA_FILE = 3
RAW_FILE = 4
UNKNOWN = 5


def find_out_type(path):
    if is_raw(path):
        return RAW_FILE
    if is_video(path):
        return VIDEO
    if is_metadata(path):
        return METADATA_FILE
    return IMAGE


def migrate_to_files(apps, schema_editor):
    Photo = apps.get_model("api", "Photo")
    File = apps.get_model("api", "File")
    for photo in Photo.objects.all():
        if photo.image_paths:
            for path in photo.image_paths:
                file: File = File()
                file.path = path
                if os.path.exists(path):
                    file.type = find_out_type(path)
                else:
                    file.type = UNKNOWN
                    if photo.video:
                        file.type = VIDEO
                    file.missing = True
                # This is fine, because at this point all files that belong to a photo have the same hash
                file.hash = photo.image_hash
                file.save()
                photo.files.add(file)
                photo.save()
        # handle missing photos
        else:
            file: File = File()
            file.path = None
            file.type = UNKNOWN
            file.missing = True
            file.hash = photo.image_hash
            file.save()
            photo.files.add(file)
            photo.save()


def remove_files(apps, schema_editor):
    File = apps.get_model("api", "File")
    for file in File.objects.all():
        file.delete()


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0036_handle_missing_files"),
    ]

    operations = [migrations.RunPython(migrate_to_files, remove_files)]


================================================
FILE: api/migrations/0038_add_main_file.py
================================================
from django.db import migrations

from api.models.file import is_metadata, is_raw, is_video

IMAGE = 1
VIDEO = 2
METADATA_FILE = 3
RAW_FILE = 4
UNKNOWN = 5


def find_out_type(path):
    if is_raw(path):
        return RAW_FILE
    if is_video(path):
        return VIDEO
    if is_metadata(path):
        return METADATA_FILE
    return IMAGE


def add_main_file(apps, schema_editor):
    Photo = apps.get_model("api", "Photo")
    for photo in Photo.objects.all():
        if photo.files.count() > 0:
            photo.main_file = photo.files.first()
            photo.save()


def remove_main_file(apps, schema_editor):
    Photo = apps.get_model("api", "Photo")
    for photo in Photo.objects.all():
        photo.main_file = None
        photo.save()


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0037_migrate_to_files"),
    ]

    operations = [migrations.RunPython(add_main_file, remove_main_file)]


================================================
FILE: api/migrations/0039_remove_photo_image_paths.py
================================================
# Generated by Django 3.1.14 on 2022-12-21 09:24

from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0038_add_main_file"),
    ]

    operations = [
        migrations.RemoveField(
            model_name="photo",
            name="image_paths",
        ),
    ]


================================================
FILE: api/migrations/0040_add_user_public_sharing_flag.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0039_remove_photo_image_paths"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="public_sharing",
            field=models.BooleanField(default=False),
        ),
    ]


================================================
FILE: api/migrations/0041_apply_user_enum_for_person.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    def apply_enum(apps, schema_editor):
        Person = apps.get_model("api", "Person")
        for person in Person.objects.filter(kind="").all():
            person.kind = "USER"
            person.save()

    def remove_enum(apps, schema_editor):
        Person = apps.get_model("api", "Person")
        for person in Person.objects.filter(kind="").all():
            person.kind = ""
            person.save()

    dependencies = [
        ("api", "0040_add_user_public_sharing_flag"),
    ]

    operations = [migrations.RunPython(apply_enum, remove_enum)]


================================================
FILE: api/migrations/0042_alter_albumuser_cover_photo_alter_photo_main_file.py
================================================
# Generated by Django 4.2rc1 on 2023-04-04 09:14

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0041_apply_user_enum_for_person"),
    ]

    operations = [
        migrations.AlterField(
            model_name="albumuser",
            name="cover_photo",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="album_user",
                to="api.photo",
            ),
        ),
        migrations.AlterField(
            model_name="photo",
            name="main_file",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="main_photo",
                to="api.file",
            ),
        ),
    ]


================================================
FILE: api/migrations/0043_alter_photo_size.py
================================================
# Generated by Django 4.2rc1 on 2023-04-05 07:34

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0042_alter_albumuser_cover_photo_alter_photo_main_file"),
    ]

    operations = [
        migrations.AlterField(
            model_name="photo",
            name="size",
            field=models.BigIntegerField(default=0),
        ),
    ]


================================================
FILE: api/migrations/0044_alter_cluster_person_alter_person_cluster_owner.py
================================================
# Generated by Django 4.2rc1 on 2023-04-07 19:02

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0043_alter_photo_size"),
    ]

    operations = [
        migrations.AlterField(
            model_name="cluster",
            name="person",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="clusters",
                to="api.person",
            ),
        ),
        migrations.AlterField(
            model_name="person",
            name="cluster_owner",
            field=models.ForeignKey(
                default=None,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="owner",
                to=settings.AUTH_USER_MODEL,
            ),
        ),
    ]


================================================
FILE: api/migrations/0045_alter_face_cluster.py
================================================
# Generated by Django 4.2rc1 on 2023-04-07 19:15

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0044_alter_cluster_person_alter_person_cluster_owner"),
    ]

    operations = [
        migrations.AlterField(
            model_name="face",
            name="cluster",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="faces",
                to="api.cluster",
            ),
        ),
    ]


================================================
FILE: api/migrations/0046_add_embedded_media.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0045_alter_face_cluster"),
    ]

    operations = [
        migrations.AddField(
            model_name="file",
            name="embedded_media",
            field=models.ManyToManyField("File"),
        ),
    ]


================================================
FILE: api/migrations/0047_alter_file_embedded_media.py
================================================
# Generated by Django 4.2rc1 on 2023-04-15 10:42

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0046_add_embedded_media"),
    ]

    operations = [
        migrations.AlterField(
            model_name="file",
            name="embedded_media",
            field=models.ManyToManyField(to="api.file"),
        ),
    ]


================================================
FILE: api/migrations/0048_fix_null_height.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0047_alter_file_embedded_media"),
    ]

    operations = [
        migrations.RunSQL("UPDATE api_photo SET height=0 WHERE height IS NULL;")
    ]


================================================
FILE: api/migrations/0049_fix_metadata_files_as_main_files.py
================================================
from django.db import migrations


def delete_photos_with_metadata_as_main(apps, schema_editor):
    Photo = apps.get_model("api", "Photo")
    for photo in Photo.objects.filter(main_file__type=3):
        photo.delete()


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0048_fix_null_height"),
    ]

    operations = [
        migrations.RunPython(delete_photos_with_metadata_as_main),
    ]


================================================
FILE: api/migrations/0050_person_face_count.py
================================================
# Generated by Django 4.2.1 on 2023-06-20 09:46

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0049_fix_metadata_files_as_main_files"),
    ]

    operations = [
        migrations.AddField(
            model_name="person",
            name="face_count",
            field=models.IntegerField(default=0),
        ),
    ]


================================================
FILE: api/migrations/0051_set_person_defaults.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    def apply_default(apps, schema_editor):
        Person = apps.get_model("api", "Person")
        User = apps.get_model("api", "User")

        for person in Person.objects.filter(kind="USER").all():
            number_of_faces = person.faces.filter(
                photo__hidden=False,
                photo__deleted=False,
                photo__owner=person.cluster_owner.id,
            ).count()
            if not person.cover_photo and number_of_faces > 0:
                person.cover_photo = (
                    person.faces.filter(
                        photo__hidden=False,
                        photo__deleted=False,
                        photo__owner=person.cluster_owner.id,
                    )
                    .first()
                    .photo
                )
            confidence_person = (
                User.objects.filter(id=person.cluster_owner.id)
                .first()
                .confidence_person
            )
            person.face_count = person.faces.filter(
                photo__hidden=False,
                photo__deleted=False,
                photo__owner=person.cluster_owner.id,
                person_label_probability__gte=confidence_person,
            ).count()
            person.save()

    def remove_default(apps, schema_editor):
        Person = apps.get_model("api", "Person")
        for person in Person.objects.all():
            person.face_count = 0
            person.save()

    dependencies = [
        ("api", "0050_person_face_count"),
    ]

    operations = [migrations.RunPython(apply_default, remove_default)]


================================================
FILE: api/migrations/0052_alter_person_name.py
================================================
# Generated by Django 4.2.1 on 2023-06-26 12:14

import django.core.validators
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0051_set_person_defaults"),
    ]

    operations = [
        migrations.AlterField(
            model_name="person",
            name="name",
            field=models.CharField(
                max_length=128,
                validators=[django.core.validators.MinLengthValidator(1)],
            ),
        ),
    ]


================================================
FILE: api/migrations/0053_user_confidence_unknown_face_and_more.py
================================================
# Generated by Django 4.2.1 on 2023-07-09 11:08

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0052_alter_person_name"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="confidence_unknown_face",
            field=models.FloatField(default=0.5),
        ),
        migrations.AddField(
            model_name="user",
            name="face_recognition_model",
            field=models.TextField(
                choices=[("HOG", "Hog"), ("CNN", "Cnn")], default="HOG"
            ),
        ),
        migrations.AddField(
            model_name="user",
            name="min_cluster_size",
            field=models.IntegerField(default=0),
        ),
    ]


================================================
FILE: api/migrations/0054_user_cluster_selection_epsilon_user_min_samples.py
================================================
# Generated by Django 4.2.1 on 2023-07-11 11:06

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0053_user_confidence_unknown_face_and_more"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="cluster_selection_epsilon",
            field=models.FloatField(default=0.05),
        ),
        migrations.AddField(
            model_name="user",
            name="min_samples",
            field=models.IntegerField(default=1),
        ),
    ]


================================================
FILE: api/migrations/0055_alter_longrunningjob_job_type.py
================================================
# Generated by Django 4.2.6 on 2023-10-27 13:01

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0054_user_cluster_selection_epsilon_user_min_samples"),
    ]

    operations = [
        migrations.AlterField(
            model_name="longrunningjob",
            name="job_type",
            field=models.PositiveIntegerField(
                choices=[
                    (1, "Scan Photos"),
                    (2, "Generate Event Albums"),
                    (3, "Regenerate Event Titles"),
                    (4, "Train Faces"),
                    (5, "Delete Missing Photos"),
                    (7, "Scan Faces"),
                    (6, "Calculate Clip Embeddings"),
                    (8, "Find Similar Faces"),
                    (9, "Download Selected Photos"),
                ]
            ),
        ),
    ]


================================================
FILE: api/migrations/0056_user_llm_settings_alter_longrunningjob_job_type.py
================================================
# Generated by Django 4.2.8 on 2023-12-21 11:16

from django.db import migrations, models

import api.models.user


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0055_alter_longrunningjob_job_type"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="llm_settings",
            field=models.JSONField(default=api.models.user.get_default_llm_settings),
        ),
        migrations.AlterField(
            model_name="longrunningjob",
            name="job_type",
            field=models.PositiveIntegerField(
                choices=[
                    (1, "Scan Photos"),
                    (2, "Generate Event Albums"),
                    (3, "Regenerate Event Titles"),
                    (4, "Train Faces"),
                    (5, "Delete Missing Photos"),
                    (7, "Scan Faces"),
                    (6, "Calculate Clip Embeddings"),
                    (8, "Find Similar Faces"),
                    (9, "Download Selected Photos"),
                    (10, "Download Models"),
                ]
            ),
        ),
    ]


================================================
FILE: api/migrations/0057_remove_face_image_path_and_more.py
================================================
# Generated by Django 4.2.8 on 2024-01-10 17:12

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0056_user_llm_settings_alter_longrunningjob_job_type"),
    ]

    operations = [
        migrations.RemoveField(
            model_name="face",
            name="image_path",
        ),
        migrations.AlterField(
            model_name="face",
            name="person_label_is_inferred",
            field=models.BooleanField(db_index=True, default=False),
        ),
    ]


================================================
FILE: api/migrations/0058_alter_user_avatar_alter_user_nextcloud_app_password_and_more.py
================================================
# Generated by Django 4.2.9 on 2024-02-02 16:36

import django_cryptography.fields
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0057_remove_face_image_path_and_more"),
    ]

    operations = [
        migrations.AlterField(
            model_name="user",
            name="avatar",
            field=models.ImageField(blank=True, null=True, upload_to="avatars"),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_app_password",
            field=django_cryptography.fields.encrypt(
                models.CharField(blank=True, default=None, max_length=64, null=True)
            ),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_scan_directory",
            field=models.CharField(
                blank=True, db_index=True, max_length=512, null=True
            ),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_server_address",
            field=models.CharField(blank=True, default=None, max_length=200, null=True),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_username",
            field=models.CharField(blank=True, default=None, max_length=64, null=True),
        ),
    ]


================================================
FILE: api/migrations/0059_person_cover_face.py
================================================
# Generated by Django 4.2.11 on 2024-03-29 16:03

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0058_alter_user_avatar_alter_user_nextcloud_app_password_and_more"),
    ]

    operations = [
        migrations.AddField(
            model_name="person",
            name="cover_face",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="face",
                to="api.face",
            ),
        ),
    ]


================================================
FILE: api/migrations/0060_apply_default_face_cover.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    def apply_default(apps, schema_editor):
        Person = apps.get_model("api", "Person")

        for person in Person.objects.filter(kind="USER").all():
            if not person.cover_face and person.faces.count() > 0:
                person.cover_face = person.faces.first()
                person.save()
            if (
                not person.cover_face
                and person.cover_photo
                and person.cover_photo.faces.count() > 0
            ):
                person.cover_face = person.cover_photo.faces.filter(
                    person__name=person.name
                ).first()
                person.save()

    def remove_default(apps, schema_editor):
        Person = apps.get_model("api", "Person")
        for person in Person.objects.all():
            person.cover_face = None

    dependencies = [
        ("api", "0059_person_cover_face"),
    ]

    operations = [migrations.RunPython(apply_default, remove_default)]


================================================
FILE: api/migrations/0061_alter_person_name.py
================================================
# Generated by Django 4.2.11 on 2024-03-29 17:20

import django.core.validators
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0060_apply_default_face_cover"),
    ]

    operations = [
        migrations.AlterField(
            model_name="person",
            name="name",
            field=models.CharField(
                db_index=True,
                max_length=128,
                validators=[django.core.validators.MinLengthValidator(1)],
            ),
        ),
    ]


================================================
FILE: api/migrations/0062_albumthing_cover_photos.py
================================================
# Generated by Django 4.2.11 on 2024-03-29 17:33

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0061_alter_person_name"),
    ]

    operations = [
        migrations.AddField(
            model_name="albumthing",
            name="cover_photos",
            field=models.ManyToManyField(
                related_name="album_thing_cover_photos", to="api.photo"
            ),
        ),
    ]


================================================
FILE: api/migrations/0063_apply_default_album_things_cover.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    def apply_default(apps, schema_editor):
        AlbumThing = apps.get_model("api", "AlbumThing")

        for thing in AlbumThing.objects.all():
            if thing.photos.count() > 0:
                thing.cover_photos.add(*thing.photos.all()[:4])
                thing.save()

    def remove_default(apps, schema_editor):
        AlbumThing = apps.get_model("api", "AlbumThing")
        for thing in AlbumThing.objects.all():
            thing.cover_photos = None
            thing.save()

    dependencies = [
        ("api", "0062_albumthing_cover_photos"),
    ]

    operations = [migrations.RunPython(apply_default, remove_default)]


================================================
FILE: api/migrations/0064_albumthing_photo_count.py
================================================
# Generated by Django 4.2.11 on 2024-03-30 13:20

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0063_apply_default_album_things_cover"),
    ]

    operations = [
        migrations.AddField(
            model_name="albumthing",
            name="photo_count",
            field=models.IntegerField(default=0),
        ),
    ]


================================================
FILE: api/migrations/0065_apply_default_photo_count.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    def apply_default(apps, schema_editor):
        AlbumThing = apps.get_model("api", "AlbumThing")

        for thing in AlbumThing.objects.all():
            thing.photo_count = thing.photos.filter(hidden=False).count()
            thing.save()

    def remove_default(apps, schema_editor):
        AlbumThing = apps.get_model("api", "AlbumThing")
        for thing in AlbumThing.objects.all():
            thing.photo_count = 0
            thing.save()

    dependencies = [
        ("api", "0064_albumthing_photo_count"),
    ]

    operations = [migrations.RunPython(apply_default, remove_default)]


================================================
FILE: api/migrations/0066_photo_last_modified_alter_longrunningjob_job_type.py
================================================
# Generated by Django 4.2.13 on 2024-06-12 15:09

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0065_apply_default_photo_count"),
    ]

    operations = [
        migrations.AddField(
            model_name="photo",
            name="last_modified",
            field=models.DateTimeField(auto_now=True),
        ),
        migrations.AlterField(
            model_name="longrunningjob",
            name="job_type",
            field=models.PositiveIntegerField(
                choices=[
                    (1, "Scan Photos"),
                    (2, "Generate Event Albums"),
                    (3, "Regenerate Event Titles"),
                    (4, "Train Faces"),
                    (5, "Delete Missing Photos"),
                    (7, "Scan Faces"),
                    (6, "Calculate Clip Embeddings"),
                    (8, "Find Similar Faces"),
                    (9, "Download Selected Photos"),
                    (10, "Download Models"),
                    (11, "Add Geolocation"),
                    (12, "Generate Tags"),
                ]
            ),
        ),
    ]


================================================
FILE: api/migrations/0067_alter_longrunningjob_job_type.py
================================================
# Generated by Django 4.2.13 on 2024-06-16 15:40

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0066_photo_last_modified_alter_longrunningjob_job_type"),
    ]

    operations = [
        migrations.AlterField(
            model_name="longrunningjob",
            name="job_type",
            field=models.PositiveIntegerField(
                choices=[
                    (1, "Scan Photos"),
                    (2, "Generate Event Albums"),
                    (3, "Regenerate Event Titles"),
                    (4, "Train Faces"),
                    (5, "Delete Missing Photos"),
                    (7, "Scan Faces"),
                    (6, "Calculate Clip Embeddings"),
                    (8, "Find Similar Faces"),
                    (9, "Download Selected Photos"),
                    (10, "Download Models"),
                    (11, "Add Geolocation"),
                    (12, "Generate Tags"),
                    (13, "Generate Face Embeddings"),
                ]
            ),
        ),
    ]


================================================
FILE: api/migrations/0068_remove_longrunningjob_result_and_more.py
================================================
# Generated by Django 4.2.13 on 2024-06-18 13:18
from django.db import migrations, models


def copy_progress_data(apps, schema_editor):
    LongRunningJob = apps.get_model("api", "LongRunningJob")
    for job in LongRunningJob.objects.all():
        result = job.result
        job.progress_current = result["progress"]["current"]
        job.progress_target = result["progress"]["target"]
        job.save()


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0067_alter_longrunningjob_job_type"),
    ]

    operations = [
        migrations.AddField(
            model_name="longrunningjob",
            name="progress_current",
            field=models.PositiveIntegerField(default=0),
        ),
        migrations.AddField(
            model_name="longrunningjob",
            name="progress_target",
            field=models.PositiveIntegerField(default=0),
        ),
        migrations.RunPython(copy_progress_data),
        migrations.RemoveField(
            model_name="longrunningjob",
            name="result",
        ),
    ]


================================================
FILE: api/migrations/0069_rename_to_in_trashcan.py
================================================
from django.db import migrations


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0068_remove_longrunningjob_result_and_more"),
    ]

    operations = [
        migrations.RenameField(
            model_name="photo",
            old_name="deleted",
            new_name="in_trashcan",
        ),
    ]


================================================
FILE: api/migrations/0070_photo_removed.py
================================================
# Generated by Django 4.2.14 on 2024-08-21 19:17

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0069_rename_to_in_trashcan"),
    ]

    operations = [
        migrations.AddField(
            model_name="photo",
            name="removed",
            field=models.BooleanField(db_index=True, default=False),
        ),
    ]


================================================
FILE: api/migrations/0071_rename_person_label_probability_face_cluster_probability_and_more.py
================================================
# Generated by Django 4.2.16 on 2024-09-20 18:56

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0070_photo_removed"),
    ]

    operations = [
        migrations.RenameField(
            model_name="face",
            old_name="person_label_probability",
            new_name="cluster_probability",
        ),
        migrations.RemoveField(
            model_name="face",
            name="person_label_is_inferred",
        ),
        migrations.AddField(
            model_name="face",
            name="classification_person",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="classification_faces",
                to="api.person",
            ),
        ),
        migrations.AddField(
            model_name="face",
            name="classification_probability",
            field=models.FloatField(db_index=True, default=0.0),
        ),
        migrations.AddField(
            model_name="face",
            name="cluster_person",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="cluster_classification_faces",
                to="api.person",
            ),
        ),
        migrations.AddField(
            model_name="face",
            name="deleted",
            field=models.BooleanField(default=False),
        ),
    ]


================================================
FILE: api/migrations/0072_alter_face_person.py
================================================
# Generated by Django 4.2.16 on 2024-09-20 19:07

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        (
            "api",
            "0071_rename_person_label_probability_face_cluster_probability_and_more",
        ),
    ]

    operations = [
        migrations.AlterField(
            model_name="face",
            name="person",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.DO_NOTHING,
                related_name="faces",
                to="api.person",
            ),
        ),
    ]


================================================
FILE: api/migrations/0073_remove_unknown_person.py
================================================
from django.db import migrations


def delete_unknown_person_and_update_faces(apps, schema_editor):
    # Get models
    Person = apps.get_model("api", "Person")
    Face = apps.get_model("api", "Face")

    # Define the name for unknown persons
    unknown_person_name = "Unknown - Other"

    # Find all persons with the name "Unknown - Other"
    unknown_persons = Person.objects.filter(name=unknown_person_name)

    # Iterate through each unknown person and set faces' person field to null
    for unknown_person in unknown_persons:
        # Set all faces' person field referencing the "Unknown - Other" person to null
        Face.objects.filter(person=unknown_person).update(person=None)

        # Delete the "Unknown - Other" person
        unknown_person.delete()


def recreate_unknown_person_and_restore_faces(apps, schema_editor):
    # Get models
    Person = apps.get_model("api", "Person")
    Face = apps.get_model("api", "Face")
    User = apps.get_model("api", "User")

    # Define the name for unknown persons
    unknown_person_name = "Unknown - Other"

    # Retrieve all users to recreate their unknown persons
    users = User.objects.all()

    for user in users:
        # Recreate the "Unknown - Other" person for each user
        unknown_person = Person.objects.create(
            name=unknown_person_name, kind=Person.KIND_UNKNOWN, cluster_owner=user
        )

        # Restore faces for each recreated person based on user ownership
        Face.objects.filter(person=None, photo__owner=user).update(
            person=unknown_person
        )


class Migration(migrations.Migration):
    dependencies = [
        (
            "api",
            "0072_alter_face_person",
        ),
    ]

    operations = [
        migrations.RunPython(
            delete_unknown_person_and_update_faces,
            recreate_unknown_person_and_restore_faces,
        ),
    ]


================================================
FILE: api/migrations/0074_migrate_cluster_person.py
================================================
from django.db import migrations


def move_person_to_cluster_if_kind_cluster(apps, schema_editor):
    # Get the necessary models
    Face = apps.get_model("api", "Face")

    # Define the constant for KIND_CLUSTER
    KIND_CLUSTER = "CLUSTER"

    # Fetch all Face instances where person is not null
    faces_to_update = Face.objects.filter(person__isnull=False)

    # Iterate over the faces and process each one
    for face in faces_to_update:
        # Check if the person is of type KIND_CLUSTER
        if face.person.kind == KIND_CLUSTER:
            # Move the person to the cluster field and set the person field to null
            face.cluster_person = face.person
            face.person = None
            face.save()


def restore_person_from_cluster(apps, schema_editor):
    # Get the necessary models
    Face = apps.get_model("api", "Face")

    # Fetch all Face instances where original_person_id is not null (from forward migration)
    faces_to_restore = Face.objects.filter(cluster_person__isnull=False)

    # Iterate over the faces and restore the person reference from the original_person_id field
    for face in faces_to_restore:
        face.person = face.cluster_person
        face.cluster_person = None
        face.save()


class Migration(migrations.Migration):
    dependencies = [
        (
            "api",
            "0073_remove_unknown_person",
        ),
    ]

    operations = [
        migrations.RunPython(
            move_person_to_cluster_if_kind_cluster,
            restore_person_from_cluster,
        ),
    ]


================================================
FILE: api/migrations/0075_alter_face_cluster_person.py
================================================
# Generated by Django 4.2.16 on 2024-09-20 19:49

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0074_migrate_cluster_person"),
    ]

    operations = [
        migrations.AlterField(
            model_name="face",
            name="cluster_person",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="cluster_faces",
                to="api.person",
            ),
        ),
    ]


================================================
FILE: api/migrations/0076_alter_file_path_alter_longrunningjob_job_type_and_more.py
================================================
# Generated by Django 4.2.18 on 2025-03-29 12:38

from django.db import migrations, models
import django_cryptography.fields


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0075_alter_face_cluster_person"),
    ]

    operations = [
        migrations.AlterField(
            model_name="file",
            name="path",
            field=models.TextField(blank=True, default=""),
        ),
        migrations.AlterField(
            model_name="longrunningjob",
            name="job_type",
            field=models.PositiveIntegerField(
                choices=[
                    (1, "Scan Photos"),
                    (2, "Generate Event Albums"),
                    (3, "Regenerate Event Titles"),
                    (4, "Train Faces"),
                    (5, "Delete Missing Photos"),
                    (7, "Scan Faces"),
                    (6, "Calculate Clip Embeddings"),
                    (8, "Find Similar Faces"),
                    (9, "Download Selected Photos"),
                    (10, "Download Models"),
                    (11, "Add Geolocation"),
                    (12, "Generate Tags"),
                    (13, "Generate Face Embeddings"),
                    (14, "Scan Missing Photos"),
                ]
            ),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_app_password",
            field=django_cryptography.fields.encrypt(
                models.CharField(blank=True, default="", max_length=64)
            ),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_scan_directory",
            field=models.CharField(
                blank=True, db_index=True, default="", max_length=512
            ),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_server_address",
            field=models.CharField(blank=True, default="", max_length=200),
        ),
        migrations.AlterField(
            model_name="user",
            name="nextcloud_username",
            field=models.CharField(blank=True, default="", max_length=64),
        ),
    ]


================================================
FILE: api/migrations/0077_alter_albumdate_title.py
================================================
# Generated by Django 4.2.18 on 2025-03-29 12:59

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0076_alter_file_path_alter_longrunningjob_job_type_and_more"),
    ]

    operations = [
        migrations.AlterField(
            model_name="albumdate",
            name="title",
            field=models.CharField(
                blank=True, db_index=True, default="", max_length=512
            ),
        ),
    ]


================================================
FILE: api/migrations/0078_create_photo_thumbnail.py
================================================
from django.db import migrations, models
import django.db.models.deletion


class Migration(migrations.Migration):
    dependencies = [
        ('api', '0077_alter_albumdate_title'),
    ]

    operations = [
        migrations.CreateModel(
            name='Thumbnail',
            fields=[
                ('photo', models.OneToOneField(on_delete=django.db.models.deletion.CASCADE, primary_key=True, related_name='thumbnail', serialize=False, to='api.photo')),
                ('thumbnail_big', models.ImageField(upload_to='thumbnails_big')),
                ('square_thumbnail', models.ImageField(upload_to='square_thumbnails')),
                ('square_thumbnail_small', models.ImageField(upload_to='square_thumbnails_small')),
                ('aspect_ratio', models.FloatField(blank=True, null=True)),
                ('dominant_color', models.TextField(blank=True, null=True)),
            ],
        ),
        migrations.RunSQL(
            sql=[
                """
                INSERT INTO api_thumbnail (
                    photo_id,
                    thumbnail_big,
                    square_thumbnail,
                    square_thumbnail_small,
                    aspect_ratio,
                    dominant_color
                )
                SELECT 
                    image_hash,
                    thumbnail_big,
                    square_thumbnail,
                    square_thumbnail_small,
                    aspect_ratio,
                    dominant_color
                FROM api_photo
                """
            ],
            reverse_sql=[
                """
                UPDATE api_photo p
                SET 
                    thumbnail_big = pt.thumbnail_big,
                    square_thumbnail = pt.square_thumbnail,
                    square_thumbnail_small = pt.square_thumbnail_small,
                    aspect_ratio = pt.aspect_ratio,
                    dominant_color = pt.dominant_color
                FROM api_thumbnail pt
                WHERE p.image_hash = pt.photo_id
                """
            ]
        ),
        migrations.RemoveField(
            model_name='photo',
            name='aspect_ratio',
        ),
        migrations.RemoveField(
            model_name='photo',
            name='dominant_color',
        ),
        migrations.RemoveField(
            model_name='photo',
            name='square_thumbnail',
        ),
        migrations.RemoveField(
            model_name='photo',
            name='square_thumbnail_small',
        ),
        migrations.RemoveField(
            model_name='photo',
            name='thumbnail_big',
        ),
    ] 

================================================
FILE: api/migrations/0079_alter_albumauto_title.py
================================================
# Generated by Django 4.2.18 on 2025-05-04 14:28

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0078_create_photo_thumbnail"),
    ]

    operations = [
        migrations.AlterField(
            model_name="albumauto",
            name="title",
            field=models.CharField(default="Untitled Album", max_length=512),
        ),
    ]


================================================
FILE: api/migrations/0080_create_photo_caption.py
================================================
# Generated migration for PhotoCaption model

from django.db import migrations, models
import django.db.models.deletion


def migrate_caption_data(apps, schema_editor):
    """Migrate existing caption data from Photo to PhotoCaption"""
    Photo = apps.get_model('api', 'Photo')
    PhotoCaption = apps.get_model('api', 'PhotoCaption')
    
    db_alias = schema_editor.connection.alias
    
    # Create PhotoCaption instances for all photos that have caption data
    photos_with_captions = Photo.objects.using(db_alias).filter(
        models.Q(captions_json__isnull=False) | models.Q(search_captions__isnull=False)
    ).exclude(captions_json={})
    
    captions_to_create = []
    
    for photo in photos_with_captions.iterator():
        captions_to_create.append(
            PhotoCaption(
                photo_id=photo.image_hash,
                captions_json=photo.captions_json,
                search_captions=photo.search_captions
            )
        )
        
        # Process in batches to avoid memory issues
        if len(captions_to_create) >= 1000:
            PhotoCaption.objects.using(db_alias).bulk_create(captions_to_create, ignore_conflicts=True)
            captions_to_create = []
    
    # Create remaining captions
    if captions_to_create:
        PhotoCaption.objects.using(db_alias).bulk_create(captions_to_create, ignore_conflicts=True)


def reverse_migrate_caption_data(apps, schema_editor):
    """Reverse migration - copy data back from PhotoCaption to Photo"""
    Photo = apps.get_model('api', 'Photo')
    PhotoCaption = apps.get_model('api', 'PhotoCaption')
    
    db_alias = schema_editor.connection.alias
    
    # Update photos with caption data from PhotoCaption instances
    for caption in PhotoCaption.objects.using(db_alias).all():
        try:
            photo = Photo.objects.using(db_alias).get(image_hash=caption.photo_id)
            photo.captions_json = caption.captions_json
            photo.search_captions = caption.search_captions
            photo.save(update_fields=['captions_json', 'search_captions'])
        except Photo.DoesNotExist:
            continue


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0079_alter_albumauto_title'),
    ]

    operations = [
        migrations.CreateModel(
            name='PhotoCaption',
            fields=[
                ('photo', models.OneToOneField(on_delete=django.db.models.deletion.CASCADE, primary_key=True, related_name='caption_instance', serialize=False, to='api.photo')),
                ('captions_json', models.JSONField(blank=True, db_index=True, null=True)),
                ('search_captions', models.TextField(blank=True, db_index=True, null=True)),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('updated_at', models.DateTimeField(auto_now=True)),
            ],
            options={
                'db_table': 'api_photo_caption',
            },
        ),
        migrations.RunPython(
            migrate_caption_data,
            reverse_migrate_caption_data,
        ),
    ] 

================================================
FILE: api/migrations/0081_remove_caption_fields_from_photo.py
================================================
# Generated migration to remove caption fields from Photo model

from django.db import migrations


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0080_create_photo_caption'),
    ]

    operations = [
        migrations.RemoveField(
            model_name='photo',
            name='captions_json',
        ),
        migrations.RemoveField(
            model_name='photo',
            name='search_captions',
        ),
    ] 

================================================
FILE: api/migrations/0082_create_photo_search.py
================================================
# Generated migration for PhotoSearch model

from django.db import migrations, models
import django.db.models.deletion


def migrate_search_data(apps, schema_editor):
    """Migrate existing search data from Photo and PhotoCaption to PhotoSearch"""
    Photo = apps.get_model('api', 'Photo')
    PhotoCaption = apps.get_model('api', 'PhotoCaption')
    PhotoSearch = apps.get_model('api', 'PhotoSearch')
    
    db_alias = schema_editor.connection.alias
    
    # Create PhotoSearch instances for all photos that have search data
    photos_with_search_data = Photo.objects.using(db_alias).filter(
        search_location__isnull=False
    ).exclude(search_location='')
    
    search_instances_to_create = []
    
    for photo in photos_with_search_data.iterator():
        search_instances_to_create.append(
            PhotoSearch(
                photo=photo,
                search_location=photo.search_location,
                search_captions=''  # Will be populated later
            )
        )
    
    # Bulk create PhotoSearch instances
    PhotoSearch.objects.using(db_alias).bulk_create(search_instances_to_create, ignore_conflicts=True)
    
    # Now migrate search_captions from PhotoCaption to PhotoSearch
    for caption in PhotoCaption.objects.using(db_alias).filter(search_captions__isnull=False).exclude(search_captions=''):
        search_instance, created = PhotoSearch.objects.using(db_alias).get_or_create(
            photo=caption.photo,
            defaults={'search_captions': caption.search_captions, 'search_location': ''}
        )
        if not created:
            search_instance.search_captions = caption.search_captions
            search_instance.save()


def reverse_migrate_search_data(apps, schema_editor):
    """Reverse migration - copy data back from PhotoSearch to Photo and PhotoCaption"""
    Photo = apps.get_model('api', 'Photo')
    PhotoCaption = apps.get_model('api', 'PhotoCaption')
    PhotoSearch = apps.get_model('api', 'PhotoSearch')
    
    db_alias = schema_editor.connection.alias
    
    # Update photos with search_location from PhotoSearch instances
    for search in PhotoSearch.objects.using(db_alias).all():
        try:
            photo = Photo.objects.using(db_alias).get(image_hash=search.photo_id)
            photo.search_location = search.search_location
            photo.save(update_fields=['search_location'])
            
            # Update PhotoCaption with search_captions
            caption, created = PhotoCaption.objects.using(db_alias).get_or_create(photo=photo)
            caption.search_captions = search.search_captions
            caption.save(update_fields=['search_captions'])
        except Photo.DoesNotExist:
            continue


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0081_remove_caption_fields_from_photo'),
    ]

    operations = [
        migrations.CreateModel(
            name='PhotoSearch',
            fields=[
                ('photo', models.OneToOneField(on_delete=django.db.models.deletion.CASCADE, primary_key=True, related_name='search_instance', serialize=False, to='api.photo')),
                ('search_captions', models.TextField(blank=True, db_index=True, null=True)),
                ('search_location', models.TextField(blank=True, db_index=True, null=True)),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('updated_at', models.DateTimeField(auto_now=True)),
            ],
            options={
                'db_table': 'api_photo_search',
            },
        ),
        migrations.RunPython(
            migrate_search_data,
            reverse_migrate_search_data,
        ),
    ] 

================================================
FILE: api/migrations/0083_remove_search_fields.py
================================================
# Generated migration to remove search fields from Photo and PhotoCaption models

from django.db import migrations


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0082_create_photo_search'),
    ]

    operations = [
        migrations.RemoveField(
            model_name='photo',
            name='search_location',
        ),
        migrations.RemoveField(
            model_name='photocaption',
            name='search_captions',
        ),
    ] 

================================================
FILE: api/migrations/0084_convert_arrayfield_to_json.py
================================================
# Migration to safely convert ArrayField to JSONField for SQLite compatibility
from django.db import migrations, models


def copy_arrayfield_to_json(apps, schema_editor):
    """
    Copy data from ArrayField to JSONField format.
    This handles the conversion for both PostgreSQL and SQLite.
    """
    Photo = apps.get_model('api', 'Photo')
    
    for photo in Photo.objects.all():
        if photo.clip_embeddings is not None:
            # ArrayField data is already in list format, just copy it
            photo.clip_embeddings_json = photo.clip_embeddings
            photo.save(update_fields=['clip_embeddings_json'])


def copy_json_to_arrayfield(apps, schema_editor):
    """
    Reverse migration: copy JSONField data back to ArrayField format.
    """
    Photo = apps.get_model('api', 'Photo')
    
    for photo in Photo.objects.all():
        if photo.clip_embeddings_json is not None:
            photo.clip_embeddings = photo.clip_embeddings_json
            photo.save(update_fields=['clip_embeddings'])


class Migration(migrations.Migration):
    dependencies = [
        ('api', '0083_remove_search_fields'),
    ]

    operations = [
        # Step 1: Add new JSONField
        migrations.AddField(
            model_name='Photo',
            name='clip_embeddings_json',
            field=models.JSONField(blank=True, null=True),
        ),
        
        # Step 2: Copy data from ArrayField to JSONField
        migrations.RunPython(
            copy_arrayfield_to_json,
            copy_json_to_arrayfield,
        ),
        
        # Step 3: Remove old ArrayField
        migrations.RemoveField(
            model_name='Photo',
            name='clip_embeddings',
        ),
        
        # Step 4: Rename JSONField to original name
        migrations.RenameField(
            model_name='Photo',
            old_name='clip_embeddings_json',
            new_name='clip_embeddings',
        ),
    ] 

================================================
FILE: api/migrations/0085_albumuser_public_expires_at_albumuser_public_slug.py
================================================
# Generated by Django 5.2.4 on 2025-08-16 08:40

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0084_convert_arrayfield_to_json'),
    ]

    operations = [
        migrations.AddField(
            model_name='albumuser',
            name='public_expires_at',
            field=models.DateTimeField(blank=True, db_index=True, null=True),
        ),
        migrations.AddField(
            model_name='albumuser',
            name='public_slug',
            field=models.SlugField(blank=True, max_length=64, null=True, unique=True),
        ),
    ]


================================================
FILE: api/migrations/0086_remove_albumuser_public_and_more.py
================================================
# Generated by Django 5.2.4 on 2025-08-17 17:23

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0085_albumuser_public_expires_at_albumuser_public_slug'),
    ]

    operations = [
        migrations.RemoveField(
            model_name='albumuser',
            name='public',
        ),
        migrations.RemoveField(
            model_name='albumuser',
            name='public_expires_at',
        ),
        migrations.RemoveField(
            model_name='albumuser',
            name='public_slug',
        ),
        migrations.CreateModel(
            name='AlbumUserShare',
            fields=[
                ('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
                ('enabled', models.BooleanField(db_index=True, default=False)),
                ('slug', models.SlugField(blank=True, max_length=64, null=True, unique=True)),
                ('expires_at', models.DateTimeField(blank=True, db_index=True, null=True)),
                ('album', models.OneToOneField(on_delete=django.db.models.deletion.CASCADE, related_name='share', to='api.albumuser')),
            ],
        ),
    ]


================================================
FILE: api/migrations/0087_add_folder_album.py
================================================
# Generated by Django 5.2.4 on 2025-08-22 14:48

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0086_remove_albumuser_public_and_more'),
    ]

    operations = [
        migrations.CreateModel(
            name='FolderAlbum',
            fields=[
                ('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
                ('title', models.CharField(max_length=512)),
                ('created_on', models.DateTimeField(auto_now_add=True, db_index=True)),
                ('updated_on', models.DateTimeField(auto_now=True)),
                ('folder_path', models.TextField()),
                ('include_subdirectories', models.BooleanField(default=True)),
                ('public', models.BooleanField(db_index=True, default=False)),
                ('favorited', models.BooleanField(db_index=True, default=False)),
                ('cover_photo', models.ForeignKey(blank=True, null=True, on_delete=django.db.models.deletion.SET_NULL, related_name='folder_album_cover', to='api.photo')),
                ('owner', models.ForeignKey(default=None, on_delete=django.db.models.deletion.CASCADE, to=settings.AUTH_USER_MODEL)),
            ],
            options={
                'ordering': ['-created_on'],
                'unique_together': {('folder_path', 'owner')},
            },
        ),
    ]


================================================
FILE: api/migrations/0088_remove_folder_album.py
================================================
# Generated by Django 5.2.4 on 2025-08-22 15:40

from django.db import migrations


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0087_add_folder_album'),
    ]

    operations = [
        migrations.DeleteModel(
            name='FolderAlbum',
        ),
    ]


================================================
FILE: api/migrations/0089_add_text_alignment.py
================================================
# Generated by Django 5.2.4 on 2025-08-22 16:00

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0088_remove_folder_album'),
    ]

    operations = [
        migrations.AddField(
            model_name='user',
            name='text_alignment',
            field=models.TextField(choices=[('left', 'Left'), ('right', 'Right')], default='right'),
        ),
    ]


================================================
FILE: api/migrations/0090_add_header_size.py
================================================
# Generated by Django 5.2.4 on 2025-08-22 16:27

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0089_add_text_alignment'),
    ]

    operations = [
        migrations.AddField(
            model_name='user',
            name='header_size',
            field=models.TextField(choices=[('large', 'Large'), ('normal', 'Normal'), ('small', 'Small')], default='large'),
        ),
    ]


================================================
FILE: api/migrations/0091_alter_user_scan_directory.py
================================================
# Generated by Django 5.2.4 on 2025-08-30 12:34

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0090_add_header_size'),
    ]

    operations = [
        migrations.AlterField(
            model_name='user',
            name='scan_directory',
            field=models.CharField(blank=True, db_index=True, default='', max_length=512),
        ),
    ]


================================================
FILE: api/migrations/0092_add_skip_raw_files_field.py
================================================
# Generated by Django 5.2.7 on 2025-10-26 21:54

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0091_alter_user_scan_directory'),
    ]

    operations = [
        migrations.AddField(
            model_name='user',
            name='skip_raw_files',
            field=models.BooleanField(default=False),
        ),
    ]


================================================
FILE: api/migrations/0093_migrate_photon_to_nominatim.py
================================================
"""
Migration to change MAP_API_PROVIDER from 'photon' to 'nominatim'.

Photon's public API at photon.komoot.io has become unreliable (502 errors),
so we're switching the default to Nominatim which is more stable.
"""

from django.db import migrations


def migrate_photon_to_nominatim(apps, schema_editor):
    """Update constance config from photon to nominatim."""
    try:
        Constance = apps.get_model("constance", "Constance")
        config = Constance.objects.filter(key="MAP_API_PROVIDER").first()
        if config and config.value == '"photon"':
            config.value = '"nominatim"'
            config.save()
    except LookupError:
        # constance model not available, skip
        pass


def reverse_migration(apps, schema_editor):
    """Reverse: change nominatim back to photon (not recommended)."""
    try:
        Constance = apps.get_model("constance", "Constance")
        config = Constance.objects.filter(key="MAP_API_PROVIDER").first()
        if config and config.value == '"nominatim"':
            config.value = '"photon"'
            config.save()
    except LookupError:
        pass


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0092_add_skip_raw_files_field"),
    ]

    operations = [
        migrations.RunPython(migrate_photon_to_nominatim, reverse_migration),
    ]


================================================
FILE: api/migrations/0094_add_slideshow_interval.py
================================================
# Generated manually for slideshow interval feature

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0093_migrate_photon_to_nominatim'),
    ]

    operations = [
        migrations.AddField(
            model_name='user',
            name='slideshow_interval',
            field=models.IntegerField(default=5),
        ),
    ]


================================================
FILE: api/migrations/0095_photo_perceptual_hash_alter_longrunningjob_job_type_and_more.py
================================================
# Generated by Django 5.2.9 on 2025-12-23 09:47

import api.models.user
import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0094_add_slideshow_interval'),
    ]

    operations = [
        migrations.AddField(
            model_name='photo',
            name='perceptual_hash',
            field=models.CharField(blank=True, db_index=True, max_length=64, null=True),
        ),
        migrations.AlterField(
            model_name='longrunningjob',
            name='job_type',
            field=models.PositiveIntegerField(choices=[(1, 'Scan Photos'), (2, 'Generate Event Albums'), (3, 'Regenerate Event Titles'), (4, 'Train Faces'), (5, 'Delete Missing Photos'), (7, 'Scan Faces'), (6, 'Calculate Clip Embeddings'), (8, 'Find Similar Faces'), (9, 'Download Selected Photos'), (10, 'Download Models'), (11, 'Add Geolocation'), (12, 'Generate Tags'), (13, 'Generate Face Embeddings'), (14, 'Scan Missing Photos'), (15, 'Detect Duplicate Photos')]),
        ),
        migrations.CreateModel(
            name='DuplicateGroup',
            fields=[
                ('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('updated_at', models.DateTimeField(auto_now=True)),
                ('status', models.CharField(choices=[('pending', 'Pending Review'), ('reviewed', 'Reviewed'), ('dismissed', 'Dismissed (Not Duplicates)')], db_index=True, default='pending', max_length=20)),
                ('owner', models.ForeignKey(on_delete=models.SET(api.models.user.get_deleted_user), related_name='duplicate_groups', to=settings.AUTH_USER_MODEL)),
                ('preferred_photo', models.ForeignKey(blank=True, null=True, on_delete=django.db.models.deletion.SET_NULL, related_name='preferred_in_group', to='api.photo')),
            ],
            options={
                'ordering': ['-created_at'],
            },
        ),
        migrations.AddField(
            model_name='photo',
            name='duplicate_group',
            field=models.ForeignKey(blank=True, null=True, on_delete=django.db.models.deletion.SET_NULL, related_name='photos', to='api.duplicategroup'),
        ),
    ]


================================================
FILE: api/migrations/0096_add_progress_step_and_result_to_longrunningjob.py
================================================
# Generated by Django 5.2.9 on 2025-12-23 12:13

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0095_photo_perceptual_hash_alter_longrunningjob_job_type_and_more'),
    ]

    operations = [
        migrations.AddField(
            model_name='longrunningjob',
            name='progress_step',
            field=models.CharField(blank=True, max_length=100, null=True),
        ),
        migrations.AddField(
            model_name='longrunningjob',
            name='result',
            field=models.JSONField(blank=True, null=True),
        ),
    ]


================================================
FILE: api/migrations/0097_add_duplicate_detection_settings_to_user.py
================================================
# Generated by Django 5.2.9 on 2025-12-23 13:00

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0096_add_progress_step_and_result_to_longrunningjob'),
    ]

    operations = [
        migrations.AddField(
            model_name='user',
            name='duplicate_clear_existing',
            field=models.BooleanField(default=False),
        ),
        migrations.AddField(
            model_name='user',
            name='duplicate_sensitivity',
            field=models.TextField(choices=[('strict', 'Strict'), ('normal', 'Normal'), ('loose', 'Loose')], default='normal'),
        ),
    ]


================================================
FILE: api/migrations/0098_add_photo_stack.py
================================================
# Generated migration for PhotoStack unified grouping system

import uuid
from django.db import migrations, models
import django.db.models.deletion


def get_deleted_user():
    """Reference to the function that returns the deleted user placeholder."""
    from api.models.user import get_deleted_user as _get_deleted_user
    return _get_deleted_user


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0097_add_duplicate_detection_settings_to_user'),
    ]

    operations = [
        # Create the PhotoStack table
        migrations.CreateModel(
            name='PhotoStack',
            fields=[
                ('id', models.UUIDField(default=uuid.uuid4, editable=False, primary_key=True, serialize=False)),
                ('stack_type', models.CharField(
                    choices=[
                        ('exact_copy', 'Exact Copies'),
                        ('visual_duplicate', 'Visual Duplicates'),
                        ('raw_jpeg', 'RAW + JPEG Pair'),
                        ('burst', 'Burst Sequence'),
                        ('bracket', 'Exposure Bracket'),
                        ('live_photo', 'Live Photo'),
                        ('manual', 'Manual Stack'),
                    ],
                    db_index=True,
                    default='visual_duplicate',
                    max_length=20,
                )),
                ('status', models.CharField(
                    choices=[
                        ('pending', 'Pending Review'),
                        ('reviewed', 'Reviewed'),
                        ('dismissed', 'Dismissed'),
                    ],
                    db_index=True,
                    default='pending',
                    max_length=20,
                )),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('updated_at', models.DateTimeField(auto_now=True)),
                ('similarity_score', models.FloatField(blank=True, null=True)),
                ('sequence_start', models.DateTimeField(blank=True, null=True)),
                ('sequence_end', models.DateTimeField(blank=True, null=True)),
                ('potential_savings', models.BigIntegerField(default=0)),
                ('owner', models.ForeignKey(
                    on_delete=django.db.models.deletion.SET(get_deleted_user),
                    related_name='photo_stacks',
                    to='api.user',
                )),
                ('primary_photo', models.ForeignKey(
                    blank=True,
                    null=True,
                    on_delete=django.db.models.deletion.SET_NULL,
                    related_name='primary_in_stack',
                    to='api.photo',
                )),
            ],
            options={
                'verbose_name': 'Photo Stack',
                'verbose_name_plural': 'Photo Stacks',
                'ordering': ['-created_at'],
            },
        ),
        # Add indexes for PhotoStack
        migrations.AddIndex(
            model_name='photostack',
            index=models.Index(fields=['owner', 'stack_type', 'status'], name='api_photost_owner_i_abc123_idx'),
        ),
        migrations.AddIndex(
            model_name='photostack',
            index=models.Index(fields=['owner', 'status'], name='api_photost_owner_i_def456_idx'),
        ),
        # Add stack field to Photo
        migrations.AddField(
            model_name='photo',
            name='stack',
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name='photos',
                to='api.photostack',
            ),
        ),
        # Add sub-second timestamp for burst detection
        migrations.AddField(
            model_name='photo',
            name='exif_timestamp_subsec',
            field=models.CharField(blank=True, max_length=10, null=True),
        ),
        # Add image sequence number for burst detection
        migrations.AddField(
            model_name='photo',
            name='image_sequence_number',
            field=models.IntegerField(blank=True, null=True),
        ),
        # Remove duplicate_group FK from Photo (replaced by stack)
        migrations.RemoveField(
            model_name='photo',
            name='duplicate_group',
        ),
        # Delete the old DuplicateGroup model
        migrations.DeleteModel(
            name='DuplicateGroup',
        ),
    ]


================================================
FILE: api/migrations/0099_photo_uuid_primary_key.py
================================================
# Generated migration for Photo UUID primary key
# This migration changes Photo from using image_hash as PK to using UUID as PK
#
# Supports both PostgreSQL (raw SQL) and SQLite (table recreation pattern).
#
# ============================================================================
# CRITICAL WARNING: THIS MIGRATION IS NOT REVERSIBLE
# ============================================================================
# This migration fundamentally changes the Photo primary key from image_hash
# (a content-based hash) to UUID (a random identifier). Reversing this would
# require regenerating the original image_hash values from file content, which
# is not possible without access to the original photo files and significant
# processing time.
#
# BEFORE RUNNING THIS MIGRATION:
# 1. Create a FULL DATABASE BACKUP: pg_dump -U your_user your_db > backup.sql
# 2. Test the migration on a copy of your production database first
# 3. Plan for downtime - this migration may take significant time on large DBs
# 4. Ensure you have enough disk space for the migration operations
#
# TO ROLLBACK (if needed):
# 1. Stop the application
# 2. Restore from your pre-migration database backup
# 3. Fake-migrate back: python manage.py migrate api 0098 --fake
# ============================================================================

import uuid
from django.db import migrations, models


# ============================================================================
# PostgreSQL raw SQL
# ============================================================================

POSTGRESQL_FORWARD_SQL = """
-- Step 1: Add UUID column to api_photo
ALTER TABLE api_photo ADD COLUMN id UUID DEFAULT gen_random_uuid();
UPDATE api_photo SET id = gen_random_uuid() WHERE id IS NULL;
ALTER TABLE api_photo ALTER COLUMN id SET NOT NULL;

-- Step 2: Create a mapping table for old hash -> new UUID
CREATE TEMP TABLE photo_id_mapping AS
SELECT image_hash, id FROM api_photo;
CREATE INDEX ON photo_id_mapping(image_hash);

-- Step 3: Add new UUID columns to all related tables

-- api_face
ALTER TABLE api_face ADD COLUMN photo_id_new UUID;
UPDATE api_face f SET photo_id_new = m.id
FROM photo_id_mapping m WHERE f.photo_id = m.image_hash;

-- api_photo_shared_to (M2M through table)
ALTER TABLE api_photo_shared_to ADD COLUMN photo_id_new UUID;
UPDATE api_photo_shared_to t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_photo_files (M2M through table)
ALTER TABLE api_photo_files ADD COLUMN photo_id_new UUID;
UPDATE api_photo_files t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_albumuser_photos (M2M through table)
ALTER TABLE api_albumuser_photos ADD COLUMN photo_id_new UUID;
UPDATE api_albumuser_photos t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_albumthing_photos (M2M through table)
ALTER TABLE api_albumthing_photos ADD COLUMN photo_id_new UUID;
UPDATE api_albumthing_photos t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_albumplace_photos (M2M through table)
ALTER TABLE api_albumplace_photos ADD COLUMN photo_id_new UUID;
UPDATE api_albumplace_photos t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_albumdate_photos (M2M through table)
ALTER TABLE api_albumdate_photos ADD COLUMN photo_id_new UUID;
UPDATE api_albumdate_photos t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_albumauto_photos (M2M through table)
ALTER TABLE api_albumauto_photos ADD COLUMN photo_id_new UUID;
UPDATE api_albumauto_photos t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_person (cover_photo_id)
ALTER TABLE api_person ADD COLUMN cover_photo_id_new UUID;
UPDATE api_person p SET cover_photo_id_new = m.id
FROM photo_id_mapping m WHERE p.cover_photo_id = m.image_hash;

-- api_albumuser (cover_photo_id)
ALTER TABLE api_albumuser ADD COLUMN cover_photo_id_new UUID;
UPDATE api_albumuser a SET cover_photo_id_new = m.id
FROM photo_id_mapping m WHERE a.cover_photo_id = m.image_hash;

-- api_albumthing_cover_photos (M2M through table for cover photos)
ALTER TABLE api_albumthing_cover_photos ADD COLUMN photo_id_new UUID;
UPDATE api_albumthing_cover_photos t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_thumbnail (OneToOne with PK)
ALTER TABLE api_thumbnail ADD COLUMN photo_id_new UUID;
UPDATE api_thumbnail t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_photo_caption (OneToOne with PK)
ALTER TABLE api_photo_caption ADD COLUMN photo_id_new UUID;
UPDATE api_photo_caption t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_photo_search (OneToOne with PK)
ALTER TABLE api_photo_search ADD COLUMN photo_id_new UUID;
UPDATE api_photo_search t SET photo_id_new = m.id
FROM photo_id_mapping m WHERE t.photo_id = m.image_hash;

-- api_photostack (primary_photo_id)
ALTER TABLE api_photostack ADD COLUMN primary_photo_id_new UUID;
UPDATE api_photostack s SET primary_photo_id_new = m.id
FROM photo_id_mapping m WHERE s.primary_photo_id = m.image_hash;

-- Step 4: Drop all FK constraints
ALTER TABLE api_face DROP CONSTRAINT IF EXISTS api_face_photo_id_6f997226_fk_api_photo_image_hash;
ALTER TABLE api_photo_shared_to DROP CONSTRAINT IF EXISTS api_photo_shared_to_photo_id_852923c7_fk_api_photo_image_hash;
ALTER TABLE api_photo_files DROP CONSTRAINT IF EXISTS api_photo_files_photo_id_f4365127_fk_api_photo_image_hash;
ALTER TABLE api_albumuser_photos DROP CONSTRAINT IF EXISTS api_albumuser_photos_photo_id_b9df1b14_fk_api_photo_image_hash;
ALTER TABLE api_albumthing_photos DROP CONSTRAINT IF EXISTS api_albumthing_photos_photo_id_d0832fc3_fk_api_photo_image_hash;
ALTER TABLE api_albumplace_photos DROP CONSTRAINT IF EXISTS api_albumplace_photos_photo_id_8fd88190_fk_api_photo_image_hash;
ALTER TABLE api_albumdate_photos DROP CONSTRAINT IF EXISTS api_albumdate_photos_photo_id_26095959_fk_api_photo_image_hash;
ALTER TABLE api_albumauto_photos DROP CONSTRAINT IF EXISTS api_albumauto_photos_photo_id_3320c2f0_fk_api_photo_image_hash;
ALTER TABLE api_person DROP CONSTRAINT IF EXISTS api_person_cover_photo_id_e0d8a6ab_fk_api_photo_image_hash;
ALTER TABLE api_albumuser DROP CONSTRAINT IF EXISTS api_albumuser_cover_photo_id_69b304ac_fk_api_photo_image_hash;
ALTER TABLE api_albumthing_cover_photos DROP CONSTRAINT IF EXISTS api_albumthing_cover_photo_id_ae113997_fk_api_photo;
ALTER TABLE api_thumbnail DROP CONSTRAINT IF EXISTS api_thumbnail_photo_id_484afcd0_fk_api_photo_image_hash;
ALTER TABLE api_photo_caption DROP CONSTRAINT IF EXISTS api_photo_caption_photo_id_363f8856_fk_api_photo_image_hash;
ALTER TABLE api_photo_search DROP CONSTRAINT IF EXISTS api_photo_search_photo_id_b4055a77_fk_api_photo_image_hash;
ALTER TABLE api_photostack DROP CONSTRAINT IF EXISTS api_photostack_primary_photo_id_a2e9fc96_fk_api_photo;

-- Step 5: Drop PKs on related tables that use photo as PK
ALTER TABLE api_thumbnail DROP CONSTRAINT IF EXISTS api_thumbnail_pkey;
ALTER TABLE api_photo_caption DROP CONSTRAINT IF EXISTS api_photo_caption_pkey;
ALTER TABLE api_photo_search DROP CONSTRAINT IF EXISTS api_photo_search_pkey;

-- Step 6: Drop old PK on api_photo, add new one
ALTER TABLE api_photo DROP CONSTRAINT api_photo_pkey;
ALTER TABLE api_photo ADD PRIMARY KEY (id);

-- Step 7: Add unique constraint on image_hash (for deduplication)
CREATE UNIQUE INDEX api_photo_image_hash_unique ON api_photo(image_hash);

-- Step 8: Drop old FK columns, rename new ones

ALTER TABLE api_face DROP COLUMN photo_id;
ALTER TABLE api_face RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_photo_shared_to DROP COLUMN photo_id;
ALTER TABLE api_photo_shared_to RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_photo_files DROP COLUMN photo_id;
ALTER TABLE api_photo_files RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_albumuser_photos DROP COLUMN photo_id;
ALTER TABLE api_albumuser_photos RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_albumthing_photos DROP COLUMN photo_id;
ALTER TABLE api_albumthing_photos RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_albumplace_photos DROP COLUMN photo_id;
ALTER TABLE api_albumplace_photos RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_albumdate_photos DROP COLUMN photo_id;
ALTER TABLE api_albumdate_photos RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_albumauto_photos DROP COLUMN photo_id;
ALTER TABLE api_albumauto_photos RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_person DROP COLUMN cover_photo_id;
ALTER TABLE api_person RENAME COLUMN cover_photo_id_new TO cover_photo_id;

ALTER TABLE api_albumuser DROP COLUMN cover_photo_id;
ALTER TABLE api_albumuser RENAME COLUMN cover_photo_id_new TO cover_photo_id;

ALTER TABLE api_albumthing_cover_photos DROP COLUMN photo_id;
ALTER TABLE api_albumthing_cover_photos RENAME COLUMN photo_id_new TO photo_id;

ALTER TABLE api_thumbnail DROP COLUMN photo_id;
ALTER TABLE api_thumbnail RENAME COLUMN photo_id_new TO photo_id;
ALTER TABLE api_thumbnail ALTER COLUMN photo_id SET NOT NULL;
ALTER TABLE api_thumbnail ADD PRIMARY KEY (photo_id);

ALTER TABLE api_photo_caption DROP COLUMN photo_id;
ALTER TABLE api_photo_caption RENAME COLUMN photo_id_new TO photo_id;
ALTER TABLE api_photo_caption ALTER COLUMN photo_id SET NOT NULL;
ALTER TABLE api_photo_caption ADD PRIMARY KEY (photo_id);

ALTER TABLE api_photo_search DROP COLUMN photo_id;
ALTER TABLE api_photo_search RENAME COLUMN photo_id_new TO photo_id;
ALTER TABLE api_photo_search ALTER COLUMN photo_id SET NOT NULL;
ALTER TABLE api_photo_search ADD PRIMARY KEY (photo_id);

ALTER TABLE api_photostack DROP COLUMN primary_photo_id;
ALTER TABLE api_photostack RENAME COLUMN primary_photo_id_new TO primary_photo_id;

-- Step 9: Recreate all FK constraints with new UUID type
ALTER TABLE api_face ADD CONSTRAINT api_face_photo_id_fk_api_photo
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_photo_shared_to ADD CONSTRAINT api_photo_shared_to_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_photo_files ADD CONSTRAINT api_photo_files_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_albumuser_photos ADD CONSTRAINT api_albumuser_photos_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_albumthing_photos ADD CONSTRAINT api_albumthing_photos_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_albumplace_photos ADD CONSTRAINT api_albumplace_photos_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_albumdate_photos ADD CONSTRAINT api_albumdate_photos_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_albumauto_photos ADD CONSTRAINT api_albumauto_photos_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_person ADD CONSTRAINT api_person_cover_photo_id_fk
    FOREIGN KEY (cover_photo_id) REFERENCES api_photo(id) ON DELETE SET NULL;

ALTER TABLE api_albumuser ADD CONSTRAINT api_albumuser_cover_photo_id_fk
    FOREIGN KEY (cover_photo_id) REFERENCES api_photo(id) ON DELETE SET NULL;

ALTER TABLE api_albumthing_cover_photos ADD CONSTRAINT api_albumthing_cover_photos_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_thumbnail ADD CONSTRAINT api_thumbnail_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_photo_caption ADD CONSTRAINT api_photo_caption_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_photo_search ADD CONSTRAINT api_photo_search_photo_id_fk
    FOREIGN KEY (photo_id) REFERENCES api_photo(id) ON DELETE CASCADE;

ALTER TABLE api_photostack ADD CONSTRAINT api_photostack_primary_photo_id_fk
    FOREIGN KEY (primary_photo_id) REFERENCES api_photo(id) ON DELETE SET NULL;

-- Step 10: Create indexes for performance
CREATE INDEX api_face_photo_id_idx ON api_face(photo_id);
CREATE INDEX api_photo_shared_to_photo_id_idx ON api_photo_shared_to(photo_id);
CREATE INDEX api_photo_files_photo_id_idx ON api_photo_files(photo_id);
CREATE INDEX api_person_cover_photo_id_idx ON api_person(cover_photo_id);
CREATE INDEX api_albumuser_cover_photo_id_idx ON api_albumuser(cover_photo_id);
CREATE INDEX api_photostack_primary_photo_id_idx ON api_photostack(primary_photo_id);

-- Clean up temp table
DROP TABLE photo_id_mapping;
"""


# ============================================================================
# Forward / reverse Python entry points
# ============================================================================

def migrate_forward(apps, schema_editor):
    """Forward migration - dispatches to PostgreSQL or SQLite implementation."""
    vendor = schema_editor.connection.vendor
    if vendor == "postgresql":
        _migrate_postgresql(schema_editor)
    elif vendor == "sqlite":
        _migrate_sqlite(schema_editor)
    else:
        raise ValueError(
            f"Unsupported database backend: {vendor}. "
            f"This migration supports PostgreSQL and SQLite only."
        )


def migrate_reverse(apps, schema_editor):
    """Reverse migration - not supported for any backend."""
    raise RuntimeError(
        "Migration 0099_photo_uuid_primary_key cannot be reversed automatically. "
        "Please restore from your pre-migration database backup and run: "
        "python manage.py migrate api 0098 --fake"
    )


# ============================================================================
# PostgreSQL implementation
# ============================================================================

def _migrate_postgresql(schema_editor):
    """Execute the PostgreSQL-specific migration using raw SQL."""
    statements = schema_editor.connection.ops.prepare_sql_script(
        POSTGRESQL_FORWARD_SQL
    )
    for statement in statements:
        schema_editor.execute(statement)


# ============================================================================
# SQLite implementation  (table-recreation pattern)
# ============================================================================
#
# SQLite does not support most ALTER TABLE operations required by the
# PostgreSQL path (DROP/ADD CONSTRAINT, ADD PRIMARY KEY, ALTER COLUMN,
# UPDATE … FROM, gen_random_uuid(), etc.).
#
# Instead we use the standard SQLite table-recreation pattern:
#   1. CREATE TABLE …__new  (with the desired schema)
#   2. INSERT INTO …__new SELECT … FROM …  (copy data, translating FKs)
#   3. DROP TABLE …
#   4. ALTER TABLE …__new RENAME TO …
#   5. Re-create indexes
# ============================================================================

def _migrate_sqlite(schema_editor):
    """Execute the SQLite-compatible migration via table recreation."""
    cursor = schema_editor.connection.cursor()

    # Disable FK enforcement while we recreate tables
    cursor.execute("PRAGMA foreign_keys = OFF")

    try:
        # -- Step 1: Build image_hash → UUID mapping --------------------------
        cursor.execute('SELECT "image_hash" FROM "api_photo"')
        mapping = {row[0]: str(uuid.uuid4()) for row in cursor.fetchall()}

        # -- Step 2: Add id column to api_photo and populate UUIDs ------------
        cursor.execute('ALTER TABLE "api_photo" ADD COLUMN "id" TEXT')
        for image_hash, new_id in mapping.items():
            cursor.execute(
                'UPDATE "api_photo" SET "id" = ? WHERE "image_hash" = ?',
                [new_id, image_hash],
            )

        # -- Step 3: Recreate api_photo with id as PK ------------------------
        _sqlite_recreate_table(
            cursor,
            "api_photo",
            pk_column="id",
            column_overrides={
                "id": '"id" TEXT NOT NULL',
                "image_hash": '"image_hash" varchar(64) NOT NULL UNIQUE',
            },
        )

        # -- Step 4: Update FK references in every related table --------------
        _FK_TABLES = [
            ("api_face", "photo_id"),
            ("api_photo_shared_to", "photo_id"),
            ("api_photo_files", "photo_id"),
            ("api_albumuser_photos", "photo_id"),
            ("api_albumthing_photos", "photo_id"),
            ("api_albumplace_photos", "photo_id"),
            ("api_albumdate_photos", "photo_id"),
            ("api_albumauto_photos", "photo_id"),
            ("api_albumthing_cover_photos", "photo_id"),
            ("api_person", "cover_photo_id"),
            ("api_albumuser", "cover_photo_id"),
            ("api_photostack", "primary_photo_id"),
            ("api_thumbnail", "photo_id"),
            ("api_photo_caption", "photo_id"),
            ("api_photo_search", "photo_id"),
        ]
        for table_name, fk_column in _FK_TABLES:
            _sqlite_update_fk_table(cursor, table_name, fk_column, mapping)

        # -- Step 5: Create performance indexes -------------------------------
        _sqlite_create_indexes(cursor)

    finally:
        cursor.execute("PRAGMA foreign_keys = ON")


# -- SQLite helpers -----------------------------------------------------------

def _sqlite_recreate_table(cursor, table_name, pk_column, column_overrides):
    """
    Recreate *api_photo* with a new primary-key column.

    * ``pk_column``        – name of the column that becomes PRIMARY KEY
    * ``column_overrides`` – dict  column_name → SQL column-definition fragment
                             (without PRIMARY KEY – that is appended automatically
                              for *pk_column*)
    """
    columns = _sqlite_column_info(cursor, table_name)
    indexes = _sqlite_index_info(cursor, table_name)

    col_defs = []
    col_names = []
    for _cid, name, type_, notnull, dflt_value, _pk in columns:
        col_names.append(name)
        if name in column_overrides:
            defn = column_overrides[name]
            if name == pk_column:
                defn += " PRIMARY KEY"
            col_defs.append(defn)
        else:
            parts = [f'"{name}"', type_ or "TEXT"]
            if name == pk_column:
                parts.append("NOT NULL PRIMARY KEY")
            elif notnull:
                parts.append("NOT NULL")
            if dflt_value is not None and name != pk_column:
                parts.append(f"DEFAULT {dflt_value}")
            col_defs.append(" ".join(parts))

    cols_quoted = ", ".join(f'"{c}"' for c in col_names)
    new_table = f"{table_name}__new"

    cursor.execute(f'CREATE TABLE "{new_table}" ({", ".join(col_defs)})')
    cursor.execute(
        f'INSERT INTO "{new_table}" ({cols_quoted}) '
        f'SELECT {cols_quoted} FROM "{table_name}"'
    )
    cursor.execute(f'DROP TABLE "{table_name}"')
    cursor.execute(f'ALTER TABLE "{new_table}" RENAME TO "{table_name}"')

    # Re-create any existing indexes
    for _idx_name, idx_sql in indexes:
        try:
            cursor.execute(idx_sql)
        except Exception:
            pass  # index may conflict with new UNIQUE constraint


def _sqlite_update_fk_table(cursor, table_name, fk_column, mapping):
    """
    Recreate *table_name* so that every value in *fk_column* is translated
    from the old image_hash to the new UUID via *mapping*.
    """
    # Guard: skip if the table or column doesn't exist
    cursor.execute(
        "SELECT COUNT(*) FROM sqlite_master WHERE type='table' AND name=?",
        [table_name],
    )
    if cursor.fetchone()[0] == 0:
        return

    columns = _sqlite_column_info(cursor, table_name)
    col_names_list = [col[1] for col in columns]
    if fk_column not in col_names_list:
        return

    indexes = _sqlite_index_info(cursor, table_name)

    # Build column definitions – change the FK column type to TEXT
    col_defs = []
    col_names = []
    fk_col_idx = None

    for _cid, name, type_, notnull, dflt_value, pk in columns:
        col_names.append(name)
        if name == fk_column:
            fk_col_idx = len(col_names) - 1
            parts = [f'"{name}" TEXT']
            if pk:
                parts.append("NOT NULL PRIMARY KEY")
            col_defs.append(" ".join(parts))
        else:
            parts = [f'"{name}"', type_ or "TEXT"]
            if pk:
                parts.append("PRIMARY KEY")
            if notnull and not pk:
                parts.append("NOT NULL")
            if dflt_value is not None:
                parts.append(f"DEFAULT {dflt_value}")
            col_defs.append(" ".join(parts))

    cols_quoted = ", ".join(f'"{c}"' for c in col_names)
    new_table = f"{table_name}__new"

    # Create new table and bulk-copy data
    cursor.execute(f'CREATE TABLE "{new_table}" ({", ".join(col_defs)})')
    cursor.execute(
        f'INSERT INTO "{new_table}" ({cols_quoted}) '
        f'SELECT {cols_quoted} FROM "{table_name}"'
    )

    # Translate FK values in the new table
    for old_hash, new_uuid in mapping.items():
        cursor.execute(
            f'UPDATE "{new_table}" SET "{fk_column}" = ? '
            f'WHERE "{fk_column}" = ?',
            [new_uuid, old_hash],
        )

    # Swap tables
    cursor.execute(f'DROP TABLE "{table_name}"')
    cursor.execute(f'ALTER TABLE "{new_table}" RENAME TO "{table_name}"')

    # Re-create indexes
    for _idx_name, idx_sql in indexes:
        try:
            cursor.execute(idx_sql)
        except Exception:
            pass


def _sqlite_create_indexes(cursor):
    """Create the same performance indexes as the PostgreSQL path."""
    index_defs = [
        (True, "api_photo_image_hash_unique", "api_photo", "image_hash"),
        (False, "api_face_photo_id_idx", "api_face", "photo_id"),
        (False, "api_photo_shared_to_photo_id_idx", "api_photo_shared_to", "photo_id"),
        (False, "api_photo_files_photo_id_idx", "api_photo_files", "photo_id"),
        (False, "api_person_cover_photo_id_idx", "api_person", "cover_photo_id"),
        (False, "api_albumuser_cover_photo_id_idx", "api_albumuser", "cover_photo_id"),
        (False, "api_photostack_primary_photo_id_idx", "api_photostack", "primary_photo_id"),
    ]
    for unique, idx_name, table, column in index_defs:
        unique_kw = "UNIQUE " if unique else ""
        try:
            cursor.execute(
                f'CREATE {unique_kw}INDEX IF NOT EXISTS '
                f'"{idx_name}" ON "{table}"("{column}")'
            )
        except Exception:
            pass


def _sqlite_column_info(cursor, table_name):
    """Return PRAGMA table_info rows for *table_name*."""
    cursor.execute(f'PRAGMA table_info("{table_name}")')
    return cursor.fetchall()


def _sqlite_index_info(cursor, table_name):
    """Return (name, sql) for every explicit index on *table_name*."""
    cursor.execute(
        "SELECT name, sql FROM sqlite_master "
        "WHERE type='index' AND tbl_name=? AND sql IS NOT NULL",
        [table_name],
    )
    return cursor.fetchall()


# ============================================================================
# Migration class
# ============================================================================

class Migration(migrations.Migration):
    """
    Migration to change Photo primary key from image_hash (CharField) to id (UUIDField).

    WARNING: This migration is NOT reversible through Django's migration system.
    You MUST have a database backup before running this migration.

    Steps:
    1. Add UUID column to api_photo
    2. Generate UUIDs for existing photos
    3. Add UUID columns to all related tables (to store new FK values)
    4. Populate new UUID FK columns from image_hash lookups
    5. Drop all old FK constraints
    6. Drop old PK, add new PK
    7. Drop old FK columns, rename new FK columns
    8. Recreate all FK constraints
    """

    dependencies = [
        ('api', '0098_add_photo_stack'),
    ]

    operations = [
        migrations.SeparateDatabaseAndState(
            database_operations=[
                migrations.RunPython(migrate_forward, migrate_reverse),
            ],
            state_operations=[
                # Add the new UUID primary key field
                migrations.AddField(
                    model_name='photo',
                    name='id',
                    field=models.UUIDField(default=uuid.uuid4, editable=False, primary_key=True, serialize=False),
                ),
                # Change image_hash from primary_key=True to just unique=True
                migrations.AlterField(
                    model_name='photo',
                    name='image_hash',
                    field=models.CharField(db_index=True, max_length=64, unique=True),
                ),
            ],
        ),
    ]


================================================
FILE: api/migrations/0100_metadataedit_metadatafile_photometadata_stackreview_and_more.py
================================================
# Generated by Django 5.2.9 on 2025-12-25 14:15

import api.models.user
import django.db.models.deletion
import uuid
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0099_photo_uuid_primary_key'),
    ]

    operations = [
        migrations.CreateModel(
            name='MetadataEdit',
            fields=[
                ('id', models.UUIDField(default=uuid.uuid4, editable=False, primary_key=True, serialize=False)),
                ('field_name', models.CharField(max_length=100)),
                ('old_value', models.JSONField(blank=True, null=True)),
                ('new_value', models.JSONField(blank=True, null=True)),
                ('synced_to_file', models.BooleanField(default=False)),
                ('synced_at', models.DateTimeField(blank=True, null=True)),
                ('created_at', models.DateTimeField(auto_now_add=True)),
            ],
            options={
                'verbose_name': 'Metadata Edit',
                'verbose_name_plural': 'Metadata Edits',
                'ordering': ['-created_at'],
            },
        ),
        migrations.CreateModel(
            name='MetadataFile',
            fields=[
                ('id', models.UUIDField(default=uuid.uuid4, editable=False, primary_key=True, serialize=False)),
                ('file_type', models.CharField(choices=[('xmp', 'XMP Sidecar'), ('json', 'JSON Metadata'), ('exif', 'EXIF Extract'), ('other', 'Other')], default='xmp', max_length=10)),
                ('source', models.CharField(choices=[('original', 'Original Sidecar'), ('software', 'Software Generated'), ('librephotos', 'LibrePhotos Generated'), ('user', 'User Created')], default='original', max_length=20)),
                ('priority', models.IntegerField(default=0)),
                ('creator_software', models.CharField(blank=True, max_length=100, null=True)),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('updated_at', models.DateTimeField(auto_now=True)),
            ],
            options={
                'verbose_name': 'Metadata File',
                'verbose_name_plural': 'Metadata Files',
                'ordering': ['-priority', '-updated_at'],
            },
        ),
        migrations.CreateModel(
            name='PhotoMetadata',
            fields=[
                ('id', models.UUIDField(default=uuid.uuid4, editable=False, primary_key=True, serialize=False)),
                ('aperture', models.FloatField(blank=True, db_index=True, null=True)),
                ('shutter_speed', models.CharField(blank=True, max_length=20, null=True)),
                ('shutter_speed_seconds', models.FloatField(blank=True, null=True)),
                ('iso', models.IntegerField(blank=True, db_index=True, null=True)),
                ('focal_length', models.FloatField(blank=True, null=True)),
                ('focal_length_35mm', models.IntegerField(blank=True, null=True)),
                ('exposure_compensation', models.FloatField(blank=True, null=True)),
                ('flash_fired', models.BooleanField(blank=True, null=True)),
                ('metering_mode', models.CharField(blank=True, max_length=50, null=True)),
                ('white_balance', models.CharField(blank=True, max_length=50, null=True)),
                ('camera_make', models.CharField(blank=True, db_index=True, max_length=100, null=True)),
                ('camera_model', models.CharField(blank=True, db_index=True, max_length=100, null=True)),
                ('lens_make', models.CharField(blank=True, max_length=100, null=True)),
                ('lens_model', models.CharField(blank=True, db_index=True, max_length=100, null=True)),
                ('serial_number', models.CharField(blank=True, max_length=100, null=True)),
                ('width', models.IntegerField(blank=True, null=True)),
                ('height', models.IntegerField(blank=True, null=True)),
                ('orientation', models.IntegerField(blank=True, null=True)),
                ('color_space', models.CharField(blank=True, max_length=50, null=True)),
                ('bit_depth', models.IntegerField(blank=True, null=True)),
                ('date_taken', models.DateTimeField(blank=True, db_index=True, null=True)),
                ('date_taken_subsec', models.CharField(blank=True, max_length=10, null=True)),
                ('date_modified', models.DateTimeField(blank=True, null=True)),
                ('timezone_offset', models.CharField(blank=True, max_length=10, null=True)),
                ('gps_latitude', models.FloatField(blank=True, db_index=True, null=True)),
                ('gps_longitude', models.FloatField(blank=True, db_index=True, null=True)),
                ('gps_altitude', models.FloatField(blank=True, null=True)),
                ('location_country', models.CharField(blank=True, db_index=True, max_length=100, null=True)),
                ('location_state', models.CharField(blank=True, max_length=100, null=True)),
                ('location_city', models.CharField(blank=True, db_index=True, max_length=100, null=True)),
                ('location_address', models.TextField(blank=True, null=True)),
                ('title', models.CharField(blank=True, max_length=500, null=True)),
                ('caption', models.TextField(blank=True, null=True)),
                ('keywords', models.JSONField(blank=True, null=True)),
                ('rating', models.IntegerField(blank=True, db_index=True, null=True)),
                ('copyright', models.TextField(blank=True, null=True)),
                ('creator', models.CharField(blank=True, max_length=200, null=True)),
                ('source', models.CharField(choices=[('embedded', 'Embedded in File'), ('sidecar', 'XMP Sidecar'), ('user_edit', 'User Edit'), ('computed', 'Computed')], default='embedded', max_length=20)),
                ('raw_exif', models.JSONField(blank=True, null=True)),
                ('raw_xmp', models.JSONField(blank=True, null=True)),
                ('raw_iptc', models.JSONField(blank=True, null=True)),
                ('version', models.IntegerField(default=1)),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('updated_at', models.DateTimeField(auto_now=True)),
            ],
            options={
                'verbose_name': 'Photo Metadata',
                'verbose_name_plural': 'Photo Metadata',
            },
        ),
        migrations.CreateModel(
            name='StackReview',
            fields=[
                ('id', models.UUIDField(default=uuid.uuid4, editable=False, primary_key=True, serialize=False)),
                ('decision', models.CharField(choices=[('pending', 'Pending Review'), ('resolved', 'Resolved'), ('dismissed', 'Dismissed')], db_index=True, default='pending', max_length=20)),
                ('trashed_count', models.IntegerField(default=0)),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('reviewed_at', models.DateTimeField(blank=True, null=True)),
                ('note', models.TextField(blank=True, null=True)),
            ],
            options={
                'verbose_name': 'Stack Review',
                'verbose_name_plural': 'Stack Reviews',
                'ordering': ['-created_at'],
            },
        ),
        migrations.RemoveIndex(
            model_name='photostack',
            name='api_photost_owner_i_abc123_idx',
        ),
        migrations.RemoveIndex(
            model_name='photostack',
            name='api_photost_owner_i_def456_idx',
        ),
        migrations.RemoveField(
            model_name='photostack',
            name='status',
        ),
        migrations.AlterField(
            model_name='photostack',
            name='owner',
            field=models.ForeignKey(on_delete=models.SET(api.models.user.get_deleted_user), related_name='photo_stacks', to=settings.AUTH_USER_MODEL),
        ),
        migrations.AddIndex(
            model_name='photostack',
            index=models.Index(fields=['owner', 'stack_type'], name='api_photost_owner_i_40a369_idx'),
        ),
        migrations.AddField(
            model_name='metadataedit',
            name='photo',
            field=models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, related_name='metadata_edits', to='api.photo'),
        ),
        migrations.AddField(
            model_name='metadataedit',
            name='user',
            field=models.ForeignKey(on_delete=models.SET(api.models.user.get_deleted_user), related_name='metadata_edits', to=settings.AUTH_USER_MODEL),
        ),
        migrations.AddField(
            model_name='metadatafile',
            name='file',
            field=models.OneToOneField(on_delete=django.db.models.deletion.CASCADE, related_name='metadata_info', to='api.file'),
        ),
        migrations.AddField(
            model_name='metadatafile',
            name='photo',
            field=models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, related_name='metadata_files', to='api.photo'),
        ),
        migrations.AddField(
            model_name='photometadata',
            name='photo',
            field=models.OneToOneField(on_delete=django.db.models.deletion.CASCADE, related_name='metadata', to='api.photo'),
        ),
        migrations.AddField(
            model_name='stackreview',
            name='kept_photo',
            field=models.ForeignKey(blank=True, null=True, on_delete=django.db.models.deletion.SET_NULL, related_name='kept_in_reviews', to='api.photo'),
        ),
        migrations.AddField(
            model_name='stackreview',
            name='reviewer',
            field=models.ForeignKey(on_delete=models.SET(api.models.user.get_deleted_user), related_name='stack_reviews', to=settings.AUTH_USER_MODEL),
        ),
        migrations.AddField(
            model_name='stackreview',
            name='stack',
            field=models.OneToOneField(on_delete=django.db.models.deletion.CASCADE, related_name='review', to='api.photostack'),
        ),
        migrations.AddIndex(
            model_name='metadataedit',
            index=models.Index(fields=['photo', '-created_at'], name='api_metadat_photo_i_21e478_idx'),
        ),
        migrations.AddIndex(
            model_name='photometadata',
            index=models.Index(fields=['camera_make', 'camera_model'], name='api_photome_camera__361eac_idx'),
        ),
        migrations.AddIndex(
            model_name='photometadata',
            index=models.Index(fields=['date_taken'], name='api_photome_date_ta_35e59b_idx'),
        ),
        migrations.AddIndex(
            model_name='photometadata',
            index=models.Index(fields=['location_country', 'location_city'], name='api_photome_locatio_1ca8bb_idx'),
        ),
        migrations.AddIndex(
            model_name='stackreview',
            index=models.Index(fields=['reviewer', 'decision'], name='api_stackre_reviewe_48380f_idx'),
        ),
    ]


================================================
FILE: api/migrations/0101_populate_photo_metadata.py
================================================
# Generated migration to populate PhotoMetadata from existing Photo data

from django.db import migrations, transaction
from django.db.models import Exists, OuterRef


BATCH_SIZE = 1000


def populate_photo_metadata(apps, schema_editor):
    """
    Populate PhotoMetadata for all existing photos.

    This copies metadata fields from Photo model to the structured PhotoMetadata model.
    PhotoMetadata provides:
    - Normalized field names
    - Edit history tracking
    - XMP sidecar support
    - Better organization of camera/lens/settings

    Optimized for SQLite and PostgreSQL compatibility:
    - Fetches all photo IDs upfront (avoids open cursor + writes conflict on SQLite)
    - Loads caption data per-batch to avoid memory issues
    - Processes in batches with per-batch transactions (no huge outer transaction)
    """
    Photo = apps.get_model("api", "Photo")
    PhotoMetadata = apps.get_model("api", "PhotoMetadata")
    PhotoCaption = apps.get_model("api", "PhotoCaption")

    # Exists subquery for efficient filtering
    existing_metadata = PhotoMetadata.objects.filter(photo_id=OuterRef('pk'))

    # Collect all photo IDs that need metadata upfront.
    # Using values_list avoids keeping a cursor open while we write below,
    # which can cause SQLite "database is locked" / cursor-state issues.
    photo_ids = list(
        Photo.objects
        .filter(~Exists(existing_metadata))
        .values_list('pk', flat=True)
    )

    total_count = len(photo_ids)
    if total_count == 0:
        print("No photos need metadata population.")
        return

    print(f"Populating metadata for {total_count} photos...")

    processed = 0

    for i in range(0, total_count, BATCH_SIZE):
        chunk_ids = photo_ids[i:i + BATCH_SIZE]

        # Load caption data for this chunk only
        captions = {
            c.photo_id: c.captions_json
            for c in PhotoCaption.objects.filter(photo_id__in=chunk_ids)
        }

        batch = []
        for photo in Photo.objects.filter(pk__in=chunk_ids):
            captions_json = captions.get(photo.pk)
            metadata = PhotoMetadata(
                photo=photo,
                # Camera info
                camera_make=None,  # Not stored in Photo model separately
                camera_model=photo.camera,
                lens_make=None,  # Not stored separately
                lens_model=photo.lens,
                # Capture settings
                aperture=photo.fstop,
                shutter_speed=photo.shutter_speed,
                iso=photo.iso,
                focal_length=photo.focal_length,
                focal_length_35mm=photo.focalLength35Equivalent,
                # Image properties
                width=photo.width,
                height=photo.height,
                # Date/time
                date_taken=photo.exif_timestamp,
                # GPS
                gps_latitude=photo.exif_gps_lat,
                gps_longitude=photo.exif_gps_lon,
                # Content
                title=None,  # Photo doesn't have separate title
                caption=captions_json.get("user_caption") if captions_json else None,
                keywords=list(captions_json.get("keywords", [])) if captions_json else [],
                rating=photo.rating,
                # Source
                source="embedded",  # All existing data came from EXIF
                version=1,
            )
            batch.append(metadata)

        with transaction.atomic():
            PhotoMetadata.objects.bulk_create(batch, ignore_conflicts=True)
        processed += len(batch)
        print(f"  Processed {processed}/{total_count} photos ({100*processed//total_count}%)")

    print(f"Completed populating metadata for {processed} photos.")


def reverse_populate(apps, schema_editor):
    """
    Reverse migration - delete PhotoMetadata records.
    Note: This will lose any user edits made through PhotoMetadata.
    """
    PhotoMetadata = apps.get_model("api", "PhotoMetadata")
    PhotoMetadata.objects.all().delete()


class Migration(migrations.Migration):
    """
    Data migration to populate PhotoMetadata from existing Photo data.
    
    This ensures backwards compatibility:
    - Photo model still has all the original fields
    - PhotoMetadata provides structured access + edit history
    - API can read from either, preferring PhotoMetadata when available
    """

    dependencies = [
        ("api", "0100_metadataedit_metadatafile_photometadata_stackreview_and_more"),
    ]

    operations = [
        migrations.RunPython(
            populate_photo_metadata,
            reverse_populate,
            atomic=False,
        ),
    ]


================================================
FILE: api/migrations/0102_photo_stacks_manytomany.py
================================================
"""
Migration to convert Photo.stack ForeignKey to Photo.stacks ManyToManyField.

This change allows a photo to belong to multiple stacks of different types
simultaneously, preventing data loss when photos have multiple relationships:
- A RAW+JPEG pair can also be visually similar to other photos
- A burst sequence can also have exact copies
- etc.
"""

from django.db import migrations, models


def migrate_fk_to_m2m(apps, schema_editor):
    """
    Migrate existing ForeignKey relationships to ManyToMany.
    
    For each photo that has a stack ForeignKey set, add that stack
    to the new ManyToMany relationship.
    """
    Photo = apps.get_model('api', 'Photo')
    
    # Get all photos with a stack set (using the old FK field)
    photos_with_stacks = Photo.objects.filter(stack__isnull=False).select_related('stack')
    
    for photo in photos_with_stacks:
        # Add the old FK stack to the new M2M relationship
        photo.stacks.add(photo.stack)


def reverse_m2m_to_fk(apps, schema_editor):
    """
    Reverse migration: convert ManyToMany back to ForeignKey.
    
    For each photo, set the FK to the first stack in the M2M relationship.
    Note: This may lose data if a photo was in multiple stacks.
    """
    Photo = apps.get_model('api', 'Photo')
    
    for photo in Photo.objects.prefetch_related('stacks').all():
        first_stack = photo.stacks.first()
        if first_stack:
            photo.stack = first_stack
            photo.save(update_fields=['stack'])


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0101_populate_photo_metadata'),
    ]

    operations = [
        # Step 1: Add the new ManyToMany field
        migrations.AddField(
            model_name='photo',
            name='stacks',
            field=models.ManyToManyField(
                blank=True,
                related_name='photos_m2m',
                to='api.photostack',
            ),
        ),
        
        # Step 2: Migrate data from FK to M2M
        migrations.RunPython(
            migrate_fk_to_m2m,
            reverse_m2m_to_fk,
        ),
        
        # Step 3: Remove the old ForeignKey field
        migrations.RemoveField(
            model_name='photo',
            name='stack',
        ),
        
        # Step 4: Rename M2M related_name to final name
        migrations.AlterField(
            model_name='photo',
            name='stacks',
            field=models.ManyToManyField(
                blank=True,
                related_name='photos',
                to='api.photostack',
            ),
        ),
    ]


================================================
FILE: api/migrations/0103_remove_photo_metadata_fields.py
================================================
# Generated migration to remove deprecated metadata fields from Photo model
# These fields have been migrated to PhotoMetadata model

from django.db import migrations


class Migration(migrations.Migration):
    """
    Remove deprecated metadata fields from Photo model.
    
    These fields have been migrated to the structured PhotoMetadata model:
    - camera -> PhotoMetadata.camera_model
    - lens -> PhotoMetadata.lens_model
    - fstop -> PhotoMetadata.aperture
    - shutter_speed -> PhotoMetadata.shutter_speed
    - iso -> PhotoMetadata.iso
    - focal_length -> PhotoMetadata.focal_length
    - focalLength35Equivalent -> PhotoMetadata.focal_length_35mm
    - width -> PhotoMetadata.width
    - height -> PhotoMetadata.height
    - digitalZoomRatio -> Not migrated (rarely used)
    - subjectDistance -> Not migrated (rarely used)
    
    Data was already copied in migration 0101_populate_photo_metadata.
    """

    dependencies = [
        ("api", "0102_photo_stacks_manytomany"),
    ]

    operations = [
        migrations.RemoveField(
            model_name="photo",
            name="fstop",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="focal_length",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="iso",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="shutter_speed",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="camera",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="lens",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="width",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="height",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="focalLength35Equivalent",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="digitalZoomRatio",
        ),
        migrations.RemoveField(
            model_name="photo",
            name="subjectDistance",
        ),
    ]


================================================
FILE: api/migrations/0104_remove_photostack_potential_savings_and_more.py
================================================
# Generated by Django 5.2.9 on 2025-12-26 15:05

import api.models.user
import django.db.models.deletion
import uuid
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0103_remove_photo_metadata_fields'),
    ]

    operations = [
        migrations.RemoveField(
            model_name='photostack',
            name='potential_savings',
        ),
        migrations.RemoveField(
            model_name='photostack',
            name='similarity_score',
        ),
        migrations.AlterField(
            model_name='photostack',
            name='stack_type',
            field=models.CharField(choices=[('raw_jpeg', 'RAW + JPEG Pair'), ('burst', 'Burst Sequence'), ('bracket', 'Exposure Bracket'), ('live_photo', 'Live Photo'), ('manual', 'Manual Stack')], db_index=True, default='raw_jpeg', max_length=20),
        ),
        migrations.CreateModel(
            name='Duplicate',
            fields=[
                ('id', models.UUIDField(default=uuid.uuid4, editable=False, primary_key=True, serialize=False)),
                ('duplicate_type', models.CharField(choices=[('exact_copy', 'Exact Copies'), ('visual_duplicate', 'Visual Duplicates')], db_index=True, default='visual_duplicate', max_length=20)),
                ('review_status', models.CharField(choices=[('pending', 'Pending Review'), ('resolved', 'Resolved'), ('dismissed', 'Dismissed')], db_index=True, default='pending', max_length=20)),
                ('created_at', models.DateTimeField(auto_now_add=True)),
                ('updated_at', models.DateTimeField(auto_now=True)),
                ('reviewed_at', models.DateTimeField(blank=True, null=True)),
                ('similarity_score', models.FloatField(blank=True, null=True)),
                ('potential_savings', models.BigIntegerField(default=0)),
                ('trashed_count', models.IntegerField(default=0)),
                ('note', models.TextField(blank=True, null=True)),
                ('kept_photo', models.ForeignKey(blank=True, null=True, on_delete=django.db.models.deletion.SET_NULL, related_name='kept_in_duplicates', to='api.photo')),
                ('owner', models.ForeignKey(on_delete=models.SET(api.models.user.get_deleted_user), related_name='duplicates', to=settings.AUTH_USER_MODEL)),
            ],
            options={
                'verbose_name': 'Duplicate',
                'verbose_name_plural': 'Duplicates',
                'ordering': ['-created_at'],
            },
        ),
        migrations.AddField(
            model_name='photo',
            name='duplicates',
            field=models.ManyToManyField(blank=True, related_name='photos', to='api.duplicate'),
        ),
        migrations.AddIndex(
            model_name='duplicate',
            index=models.Index(fields=['owner', 'duplicate_type'], name='api_duplica_owner_i_78a3a4_idx'),
        ),
        migrations.AddIndex(
            model_name='duplicate',
            index=models.Index(fields=['owner', 'review_status'], name='api_duplica_owner_i_039fa3_idx'),
        ),
    ]


================================================
FILE: api/migrations/0105_alter_photo_image_hash.py
================================================
# Generated by Django 5.2.9 on 2025-12-26 16:12

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0104_remove_photostack_potential_savings_and_more'),
    ]

    operations = [
        # Drop the unique index created by migration 0099 (it was created as an index, not a constraint)
        migrations.RunSQL(
            sql="DROP INDEX IF EXISTS api_photo_image_hash_unique;",
            reverse_sql="CREATE UNIQUE INDEX IF NOT EXISTS api_photo_image_hash_unique ON api_photo(image_hash);",
        ),
        migrations.AlterField(
            model_name='photo',
            name='image_hash',
            field=models.CharField(db_index=True, max_length=64),
        ),
    ]


================================================
FILE: api/migrations/0106_alter_longrunningjob_options.py
================================================
# Generated by Django 5.2.9 on 2025-12-26 19:35

from django.db import migrations


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0105_alter_photo_image_hash'),
    ]

    operations = [
        migrations.AlterModelOptions(
            name='longrunningjob',
            options={'ordering': ['-queued_at'], 'verbose_name': 'Long Running Job', 'verbose_name_plural': 'Long Running Jobs'},
        ),
    ]


================================================
FILE: api/migrations/0107_add_burst_detection_rules.py
================================================
# Generated by Django 5.0 on 2024-12-26

from django.db import migrations, models

import api.models.user


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0106_alter_longrunningjob_options"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="burst_detection_rules",
            field=models.JSONField(
                default=api.models.user.get_default_config_burst_detection_rules
            ),
        ),
    ]


================================================
FILE: api/migrations/0108_add_stack_raw_jpeg_field.py
================================================
# Generated migration for adding stack_raw_jpeg field

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0107_add_burst_detection_rules"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="stack_raw_jpeg",
            field=models.BooleanField(default=True),
        ),
    ]


================================================
FILE: api/migrations/0109_migrate_skip_raw_to_stack_raw_jpeg.py
================================================
# Data migration to set stack_raw_jpeg based on skip_raw_files
# If skip_raw_files was True (skip RAWs), then stack_raw_jpeg should be False (don't stack)
# If skip_raw_files was False (don't skip RAWs), then stack_raw_jpeg should be True (stack them)

from django.db import migrations


def migrate_skip_raw_to_stack_raw_jpeg(apps, schema_editor):
    User = apps.get_model("api", "User")
    # Set stack_raw_jpeg = not skip_raw_files
    # If user was skipping RAW files, they probably don't want them stacked
    # If user was not skipping RAW files, enable stacking by default
    User.objects.filter(skip_raw_files=True).update(stack_raw_jpeg=False)
    User.objects.filter(skip_raw_files=False).update(stack_raw_jpeg=True)


def reverse_migration(apps, schema_editor):
    # Reverse migration: set skip_raw_files based on stack_raw_jpeg
    User = apps.get_model("api", "User")
    User.objects.filter(stack_raw_jpeg=False).update(skip_raw_files=True)
    User.objects.filter(stack_raw_jpeg=True).update(skip_raw_files=False)


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0108_add_stack_raw_jpeg_field"),
    ]

    operations = [
        migrations.RunPython(migrate_skip_raw_to_stack_raw_jpeg, reverse_migration),
    ]


================================================
FILE: api/migrations/0110_fix_file_embedded_media_self_reference.py
================================================
# Generated migration to fix self-referential ManyToManyField

from django.db import migrations, models


class Migration(migrations.Migration):
    dependencies = [
        ("api", "0109_migrate_skip_raw_to_stack_raw_jpeg"),
    ]

    operations = [
        migrations.AlterField(
            model_name="file",
            name="embedded_media",
            field=models.ManyToManyField("self", symmetrical=False),
        ),
    ]


================================================
FILE: api/migrations/0111_alter_file_embedded_media.py
================================================
# Generated by Django 5.2.9 on 2026-01-08 19:16

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0110_fix_file_embedded_media_self_reference'),
    ]

    operations = [
        migrations.AlterField(
            model_name='file',
            name='embedded_media',
            field=models.ManyToManyField(to='api.file'),
        ),
    ]


================================================
FILE: api/migrations/0112_convert_file_stacks_to_variants.py
================================================
"""
Migration to convert RAW_JPEG_PAIR and LIVE_PHOTO stacks to file variants.

This migration implements the PhotoPrism-like file variant model where:
- RAW+JPEG pairs become one Photo with multiple files
- Live Photos (image+video) become one Photo with multiple files

Instead of having 2 Photo entities in a stack, we now have 1 Photo entity
with multiple File entries in its files ManyToMany field.

This is a data migration that:
1. For each RAW_JPEG_PAIR stack:
   - Identifies the JPEG Photo (primary) and RAW Photo
   - Moves the RAW file to the JPEG Photo's files field
   - Deletes the RAW Photo entity
   - Deletes the stack
2. For each LIVE_PHOTO stack:
   - Identifies the image Photo (primary) and video Photo
   - Moves the video file to the image Photo's files field
   - Deletes the video Photo entity
   - Deletes the stack

Optimized for large datasets:
- Uses prefetch_related to eliminate N+1 queries
- Uses bulk M2M operations via through model
- Processes in batches with progress logging
"""

from django.db import migrations, transaction
from django.db.models import Prefetch


BATCH_SIZE = 500


def convert_raw_jpeg_stacks_to_file_variants(apps, schema_editor):
    """Convert RAW_JPEG_PAIR stacks to Photo.files variants."""
    PhotoStack = apps.get_model('api', 'PhotoStack')
    Photo = apps.get_model('api', 'Photo')
    File = apps.get_model('api', 'File')
    
    # Get through model for bulk M2M operations
    PhotoFiles = Photo.files.through
    PhotoStacks = Photo.stacks.through
    
    # RAW_JPEG_PAIR = "raw_jpeg"
    # Count total for progress logging
    total_count = PhotoStack.objects.filter(stack_type="raw_jpeg").count()
    if total_count == 0:
        print("No RAW_JPEG_PAIR stacks to convert.")
        return
    
    print(f"Converting {total_count} RAW_JPEG_PAIR stacks to file variants...")
    
    # Prefetch photos with their files and main_file to eliminate N+1 queries
    raw_jpeg_stacks = (
        PhotoStack.objects
        .filter(stack_type="raw_jpeg")
        .prefetch_related(
            Prefetch(
                'photos',
                queryset=Photo.objects.select_related('main_file').prefetch_related('files')
            )
        )
    )
    
    converted_count = 0
    error_count = 0
    
    # Collect bulk operations
    m2m_files_to_create = []
    photos_to_delete = []
    stacks_to_delete = []
    m2m_stacks_to_delete = []
    
    for stack in raw_jpeg_stacks.iterator(chunk_size=BATCH_SIZE):
        try:
            # Photos are already prefetched - no extra query
            photos = list(stack.photos.all())
            
            if len(photos) != 2:
                print(f"WARNING: RAW_JPEG stack {stack.id} has {len(photos)} photos, expected 2. Skipping.")
                error_count += 1
                continue
            
            # Identify JPEG and RAW photos
            # RAW files have type=4 in File model
            jpeg_photo = None
            raw_photo = None
            
            for photo in photos:
                if photo.main_file and photo.main_file.type == 4:  # RAW_FILE
                    raw_photo = photo
                else:
                    jpeg_photo = photo
            
            if not jpeg_photo or not raw_photo:
                print(f"WARNING: Could not identify JPEG/RAW in stack {stack.id}. Skipping.")
                error_count += 1
                continue
            
            # Collect files to add to jpeg_photo (using prefetched data)
            files_to_add = list(raw_photo.files.all())
            if raw_photo.main_file:
                files_to_add.append(raw_photo.main_file)
            
            # Build M2M through model entries for bulk create
            existing_file_hashes = set(f.hash for f in jpeg_photo.files.all())
            for file in files_to_add:
                if file.hash not in existing_file_hashes:
                    m2m_files_to_create.append(
                        PhotoFiles(photo_id=jpeg_photo.pk, file_id=file.hash)
                    )
                    existing_file_hashes.add(file.hash)
            
            # Collect M2M stack relationships to delete
            for photo in photos:
                m2m_stacks_to_delete.append((photo.pk, stack.pk))
            
            photos_to_delete.append(raw_photo.pk)
            stacks_to_delete.append(stack.pk)
            converted_count += 1
            
            # Process in batches to avoid memory buildup
            if len(stacks_to_delete) >= BATCH_SIZE:
                _flush_raw_jpeg_batch(
                    PhotoFiles, PhotoStacks, Photo, PhotoStack,
                    m2m_files_to_create, m2m_stacks_to_delete, photos_to_delete, stacks_to_delete
                )
                m2m_files_to_create = []
                m2m_stacks_to_delete = []
                photos_to_delete = []
                stacks_to_delete = []
                print(f"  Processed {converted_count}/{total_count} stacks ({100*converted_count//total_count}%)")
            
        except Exception as e:
            print(f"ERROR converting RAW_JPEG stack {stack.id}: {e}")
            error_count += 1
    
    # Flush remaining batch
    if stacks_to_delete:
        _flush_raw_jpeg_batch(
            PhotoFiles, PhotoStacks, Photo, PhotoStack,
            m2m_files_to_create, m2m_stacks_to_delete, photos_to_delete, stacks_to_delete
        )
    
    print(f"Converted {converted_count} RAW_JPEG_PAIR stacks to file variants ({error_count} errors)")


def _flush_raw_jpeg_batch(PhotoFiles, PhotoStacks, Photo, PhotoStack,
                          m2m_files_to_create, m2m_stacks_to_delete, photos_to_delete, stacks_to_delete):
    """Flush a batch of operations to the database."""
    with transaction.atomic():
        # Bulk create M2M file relationships
        if m2m_files_to_create:
            PhotoFiles.objects.bulk_create(m2m_files_to_create, ignore_conflicts=True)
        
        # Bulk delete M2M stack relationships
        if m2m_stacks_to_delete:
            for photo_id, stack_id in m2m_stacks_to_delete:
                PhotoStacks.objects.filter(photo_id=photo_id, photostack_id=stack_id).delete()
        
        # Bulk delete photos
        if photos_to_delete:
            Photo.objects.filter(pk__in=photos_to_delete).delete()
        
        # Bulk delete stacks
        if stacks_to_delete:
            PhotoStack.objects.filter(pk__in=stacks_to_delete).delete()


def convert_live_photo_stacks_to_file_variants(apps, schema_editor):
    """Convert LIVE_PHOTO stacks to Photo.files variants."""
    PhotoStack = apps.get_model('api', 'PhotoStack')
    Photo = apps.get_model('api', 'Photo')
    File = apps.get_model('api', 'File')
    
    # Get through model for bulk M2M operations
    PhotoFiles = Photo.files.through
    PhotoStacks = Photo.stacks.through
    
    # LIVE_PHOTO = "live_photo"
    # Count total for progress logging
    total_count = PhotoStack.objects.filter(stack_type="live_photo").count()
    if total_count == 0:
        print("No LIVE_PHOTO stacks to convert.")
        return
    
    print(f"Converting {total_count} LIVE_PHOTO stacks to file variants...")
    
    # Prefetch photos with their files and main_file to eliminate N+1 queries
    live_photo_stacks = (
        PhotoStack.objects
        .filter(stack_type="live_photo")
        .prefetch_related(
            Prefetch(
                'photos',
                queryset=Photo.objects.select_related('main_file').prefetch_related('files')
            )
        )
    )
    
    converted_count = 0
    error_count = 0
    
    # Collect bulk operations
    m2m_files_to_create = []
    photos_to_delete = []
    stacks_to_delete = []
    m2m_stacks_to_delete = []
    
    for stack in live_photo_stacks.iterator(chunk_size=BATCH_SIZE):
        try:
            # Photos are already prefetched - no extra query
            photos = list(stack.photos.all())
            
            if len(photos) != 2:
                print(f"WARNING: LIVE_PHOTO stack {stack.id} has {len(photos)} photos, expected 2. Skipping.")
                error_count += 1
                continue
            
            # Identify image and video photos
            # VIDEO files have type=2 in File model
            image_photo = None
            video_photo = None
            
            for photo in photos:
                if photo.main_file and photo.main_file.type == 2:  # VIDEO
                    video_photo = photo
                elif photo.video:
                    video_photo = photo
                else:
                    image_photo = photo
            
            if not image_photo or not video_photo:
                print(f"WARNING: Could not identify image/video in LIVE_PHOTO stack {stack.id}. Skipping.")
                error_count += 1
                continue
            
            # Collect files to add to image_photo (using prefetched data)
            files_to_add = list(video_photo.files.all())
            if video_photo.main_file:
                files_to_add.append(video_photo.main_file)
            
            # Build M2M through model entries for bulk create
            existing_file_hashes = set(f.hash for f in image_photo.files.all())
            for file in files_to_add:
                if file.hash not in existing_file_hashes:
                    m2m_files_to_create.append(
                        PhotoFiles(photo_id=image_photo.pk, file_id=file.hash)
                    )
                    existing_file_hashes.add(file.hash)
            
            # Collect M2M stack relationships to delete
            for photo in photos:
                m2m_stacks_to_delete.append((photo.pk, stack.pk))
            
            photos_to_delete.append(video_photo.pk)
            stacks_to_delete.append(stack.pk)
            converted_count += 1
            
            # Process in batches to avoid memory buildup
            if len(stacks_to_delete) >= BATCH_SIZE:
                _flush_live_photo_batch(
                    PhotoFiles, PhotoStacks, Photo, PhotoStack,
                    m2m_files_to_create, m2m_stacks_to_delete, photos_to_delete, stacks_to_delete
                )
                m2m_files_to_create = []
                m2m_stacks_to_delete = []
                photos_to_delete = []
                stacks_to_delete = []
                print(f"  Processed {converted_count}/{total_count} stacks ({100*converted_count//total_count}%)")
            
        except Exception as e:
            print(f"ERROR converting LIVE_PHOTO stack {stack.id}: {e}")
            error_count += 1
    
    # Flush remaining batch
    if stacks_to_delete:
        _flush_live_photo_batch(
            PhotoFiles, PhotoStacks, Photo, PhotoStack,
            m2m_files_to_create, m2m_stacks_to_delete, photos_to_delete, stacks_to_delete
        )
    
    print(f"Converted {converted_count} LIVE_PHOTO stacks to file variants ({error_count} errors)")


def _flush_live_photo_batch(PhotoFiles, PhotoStacks, Photo, PhotoStack,
                            m2m_files_to_create, m2m_stacks_to_delete, photos_to_delete, stacks_to_delete):
    """Flush a batch of operations to the database."""
    with transaction.atomic():
        # Bulk create M2M file relationships
        if m2m_files_to_create:
            PhotoFiles.objects.bulk_create(m2m_files_to_create, ignore_conflicts=True)
        
        # Bulk delete M2M stack relationships
        if m2m_stacks_to_delete:
            for photo_id, stack_id in m2m_stacks_to_delete:
                PhotoStacks.objects.filter(photo_id=photo_id, photostack_id=stack_id).delete()
        
        # Bulk delete photos
        if photos_to_delete:
            Photo.objects.filter(pk__in=photos_to_delete).delete()
        
        # Bulk delete stacks
        if stacks_to_delete:
            PhotoStack.objects.filter(pk__in=stacks_to_delete).delete()


def forward_migration(apps, schema_editor):
    """Run both conversions."""
    convert_raw_jpeg_stacks_to_file_variants(apps, schema_editor)
    convert_live_photo_stacks_to_file_variants(apps, schema_editor)


def reverse_migration(apps, schema_editor):
    """
    Reverse migration is not fully supported as we've deleted Photo entities.
    This would require recreating the deleted Photos which is complex.
    Instead, we just print a warning.
    """
    print("WARNING: Reverse migration is not supported. "
          "RAW_JPEG_PAIR and LIVE_PHOTO stacks cannot be recreated automatically. "
          "Run a full rescan to detect file variants again.")


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0111_alter_file_embedded_media'),
    ]

    operations = [
        migrations.RunPython(forward_migration, reverse_migration),
    ]


================================================
FILE: api/migrations/0113_alter_photostack_stack_type.py
================================================
# Generated by Django 5.2.9 on 2026-01-21 13:36

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0112_convert_file_stacks_to_variants'),
    ]

    operations = [
        migrations.AlterField(
            model_name='photostack',
            name='stack_type',
            field=models.CharField(choices=[('burst', 'Burst Sequence'), ('bracket', 'Exposure Bracket'), ('manual', 'Manual Stack'), ('raw_jpeg', 'RAW + JPEG Pair (Deprecated)'), ('live_photo', 'Live Photo (Deprecated)')], db_index=True, default='manual', max_length=20),
        ),
    ]


================================================
FILE: api/migrations/0114_add_file_path_unique.py
================================================
# Generated migration to add unique constraint on File.path
# This migration handles existing duplicate paths before adding the constraint

from django.db import migrations, models, transaction
from django.db.models import Count, Exists, OuterRef, Case, When, Value, IntegerField


BATCH_SIZE = 500


def deduplicate_file_paths(apps, schema_editor):
    """
    Deduplicate File records that have the same path.
    
    Strategy:
    1. Find all paths that have multiple File records
    2. For each duplicate group, keep the "best" File:
       - Prefer non-missing files
       - Prefer files that are main_file for a Photo
       - Prefer files linked to more Photos
    3. Reassign all Photo associations from deleted Files to kept File
    4. Delete duplicate File records
    
    Optimized for large datasets:
    - Uses annotations to compute scores in database instead of per-file queries
    - Uses bulk M2M operations via through model
    - Uses prefetch_related to eliminate N+1 queries
    - Processes in batches with progress logging
    """
    File = apps.get_model('api', 'File')
    Photo = apps.get_model('api', 'Photo')
    
    # Get through models for bulk M2M operations
    PhotoFiles = Photo.files.through
    FileEmbeddedMedia = File.embedded_media.through
    
    # Find paths that have duplicates (excluding empty paths)
    duplicate_paths = list(
        File.objects
        .exclude(path='')
        .exclude(path__isnull=True)
        .values('path')
        .annotate(count=Count('hash'))
        .filter(count__gt=1)
    )
    
    total_count = len(duplicate_paths)
    if total_count == 0:
        print("No duplicate file paths to deduplicate.")
        return
    
    print(f"Deduplicating {total_count} file paths...")
    
    processed = 0
    deleted_count = 0
    
    for dup in duplicate_paths:
        path = dup['path']
        
        # Subquery to check if file is main_file for any Photo
        is_main_file = Photo.objects.filter(main_file_id=OuterRef('hash'))
        
        # Get all Files with this path, annotated with scores computed in DB
        files = list(
            File.objects
            .filter(path=path)
            .annotate(
                photo_count=Count('photo', distinct=True),
                is_main=Case(
                    When(Exists(is_main_file), then=Value(50)),
                    default=Value(0),
                    output_field=IntegerField()
                ),
                missing_penalty=Case(
                    When(missing=False, then=Value(100)),
                    default=Value(0),
                    output_field=IntegerField()
                ),
            )
            .prefetch_related('photo_set', 'embedded_media')
            .order_by('-missing_penalty', '-is_main', '-photo_count')
        )
        
        if len(files) <= 1:
            continue
        
        # First file is the best one (sorted by score descending)
        keep_file = files[0]
        delete_files = files[1:]
        
        with transaction.atomic():
            # Collect M2M entries to create
            m2m_photo_files_to_create = []
            m2m_photo_files_to_delete = []
            m2m_embedded_to_create = []
            m2m_embedded_to_delete = []
            photos_to_update_main = []
            
            for del_file in delete_files:
                # Get all Photos that have this file in their files M2M (prefetched)
                for photo in del_file.photo_set.all():
                    # Schedule add of keep_file to photo
                    m2m_photo_files_to_create.append(
                        PhotoFiles(photo_id=photo.pk, file_id=keep_file.hash)
                    )
                    # Schedule removal of del_file from photo
                    m2m_photo_files_to_delete.append((photo.pk, del_file.hash))
                
                # Update main_file references in bulk
                photos_with_main = Photo.objects.filter(main_file=del_file)
                for photo in photos_with_main:
                    photo.main_file = keep_file
                    photos_to_update_main.append(photo)
                
                # Handle embedded_media M2M (prefetched)
                for parent_file in File.objects.filter(embedded_media=del_file):
                    m2m_embedded_to_create.append(
                        FileEmbeddedMedia(from_file_id=parent_file.hash, to_file_id=keep_file.hash)
                    )
                    m2m_embedded_to_delete.append((parent_file.hash, del_file.hash))
            
            # Execute bulk operations
            if m2m_photo_files_to_create:
                PhotoFiles.objects.bulk_create(m2m_photo_files_to_create, ignore_conflicts=True)
            
            if m2m_photo_files_to_delete:
                for photo_id, file_id in m2m_photo_files_to_delete:
                    PhotoFiles.objects.filter(photo_id=photo_id, file_id=file_id).delete()
            
            if photos_to_update_main:
                Photo.objects.bulk_update(photos_to_update_main, ['main_file'])
            
            if m2m_embedded_to_create:
                FileEmbeddedMedia.objects.bulk_create(m2m_embedded_to_create, ignore_conflicts=True)
            
            if m2m_embedded_to_delete:
                for from_id, to_id in m2m_embedded_to_delete:
                    FileEmbeddedMedia.objects.filter(from_file_id=from_id, to_file_id=to_id).delete()
            
            # Delete duplicate files in bulk
            delete_hashes = [f.hash for f in delete_files]
            File.objects.filter(hash__in=delete_hashes).delete()
            deleted_count += len(delete_files)
        
        processed += 1
        if processed % 100 == 0:
            print(f"  Processed {processed}/{total_count} duplicate paths ({100*processed//total_count}%)")
    
    print(f"Completed deduplication. Deleted {deleted_count} duplicate files.")


def reverse_deduplicate(apps, schema_editor):
    """
    Reverse migration is a no-op since we can't restore deleted duplicates.
    The unique constraint will be dropped by the AlterField reverse.
    """
    pass


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0113_alter_photostack_stack_type'),
    ]

    operations = [
        # First, deduplicate existing paths
        migrations.RunPython(
            deduplicate_file_paths,
            reverse_deduplicate,
        ),
        # Then add the unique constraint
        migrations.AlterField(
            model_name='file',
            name='path',
            field=models.TextField(blank=True, default="", unique=True),
        ),
    ]


================================================
FILE: api/migrations/0115_cleanup_duplicate_photos.py
================================================
# Generated migration to cleanup duplicate Photo records
# This migration handles Photos with the same image_hash for the same owner

from django.db import migrations, transaction
from django.db.models import Count, Case, When, Value, F, IntegerField


BATCH_SIZE = 100


def cleanup_duplicate_photos(apps, schema_editor):
    """
    Cleanup Photo records that have the same image_hash for the same owner.
    
    Strategy:
    1. Find all (image_hash, owner) combinations that have multiple Photo records
    2. For each duplicate group, keep the "best" Photo:
       - Prefer non-removed photos
       - Prefer non-trashed photos
       - Prefer photos with main_file
       - Prefer photos with more files attached
       - Prefer photos with more metadata (faces, albums, etc.)
       - Prefer older photos (smaller added_on)
    3. Merge associations from duplicate Photos to kept Photo:
       - files (M2M)
       - albums (album_user, album_thing, album_place, album_date)
       - faces
       - stacks
       - duplicates (duplicate groups)
       - shared_to
    4. Delete duplicate Photos
    
    Optimized for large datasets:
    - Uses database annotations to compute scores instead of per-photo queries
    - Uses bulk M2M operations via through model
    - Uses prefetch_related to eliminate N+1 queries
    - Processes in batches with progress logging
    """
    Photo = apps.get_model('api', 'Photo')
    Face = apps.get_model('api', 'Face')
    AlbumUser = apps.get_model('api', 'AlbumUser')
    
    # Get through models for bulk M2M operations
    PhotoFiles = Photo.files.through
    PhotoStacks = Photo.stacks.through
    PhotoDuplicates = Photo.duplicates.through
    PhotoSharedTo = Photo.shared_to.through
    AlbumUserPhotos = AlbumUser.photos.through
    
    # Find (image_hash, owner) combinations with duplicates
    # Exclude already removed photos from consideration
    duplicate_groups = list(
        Photo.objects
        .filter(removed=False)
        .values('image_hash', 'owner')
        .annotate(count=Count('id'))
        .filter(count__gt=1)
    )
    
    total_count = len(duplicate_groups)
    if total_count == 0:
        print("No duplicate photos to clean up.")
        return
    
    print(f"Cleaning up {total_count} duplicate photo groups...")
    
    merged_count = 0
    processed = 0
    
    for dup in duplicate_groups:
        image_hash = dup['image_hash']
        owner_id = dup['owner']
        
        # Get all non-removed Photos with this hash/owner
        # Annotate with scores computed in database
        photos = list(
            Photo.objects
            .filter(image_hash=image_hash, owner_id=owner_id, removed=False)
            .annotate(
                file_count=Count('files', distinct=True),
                face_count=Count('face', distinct=True),
                album_count=Count('albumuser', distinct=True),
                stack_count=Count('stacks', distinct=True),
                # Compute score in database
                score=(
                    Case(When(removed=False, then=Value(1000)), default=Value(0), output_field=IntegerField()) +
                    Case(When(in_trashcan=False, then=Value(500)), default=Value(0), output_field=IntegerField()) +
                    Case(When(main_file__isnull=False, then=Value(200)), default=Value(0), output_field=IntegerField()) +
                    F('file_count') * 10 +
                    F('face_count') * 5 +
                    F('album_count') * 2 +
                    F('stack_count') * 2 +
                    Case(When(clip_embeddings__isnull=False, then=Value(50)), default=Value(0), output_field=IntegerField()) +
                    Case(When(perceptual_hash__isnull=False, then=Value(30)), default=Value(0), output_field=IntegerField()) +
                    Case(When(geolocation_json__isnull=False, then=Value(20)), default=Value(0), output_field=IntegerField())
                )
            )
            .select_related('main_file')
            .prefetch_related('files', 'stacks', 'duplicates', 'shared_to', 'albumuser_set')
            .order_by('-score', 'added_on')  # Higher score first, then older
        )
        
        if len(photos) <= 1:
            continue
        
        keep_photo = photos[0]
        merge_photos = photos[1:]
        merge_ids = [p.pk for p in merge_photos]
        
        with transaction.atomic():
            # Bulk update faces - single query
            Face.objects.filter(photo_id__in=merge_ids).update(photo=keep_photo)
            
            # Collect existing M2M IDs to prevent duplicates
            existing_file_ids = set(keep_photo.files.values_list('hash', flat=True))
            existing_stack_ids = set(keep_photo.stacks.values_list('id', flat=True))
            existing_duplicate_ids = set(keep_photo.duplicates.values_list('id', flat=True))
            existing_shared_ids = set(keep_photo.shared_to.values_list('id', flat=True))
            existing_album_ids = set(keep_photo.albumuser_set.values_list('id', flat=True))
            
            # Collect M2M entries to create
            new_files = []
            new_stacks = []
            new_duplicates = []
            new_shared = []
            new_albums = []
            
            # Track if we need to update main_file
            main_file_candidate = None
            
            for merge_photo in merge_photos:
                # Collect files (prefetched)
                for file in merge_photo.files.all():
                    if file.hash not in existing_file_ids:
                        new_files.append(PhotoFiles(photo_id=keep_photo.pk, file_id=file.hash))
                        existing_file_ids.add(file.hash)
                
                # If kept photo has no main_file but merge_photo does, remember it
                if not keep_photo.main_file_id and merge_photo.main_file_id and not main_file_candidate:
                    main_file_candidate = merge_photo.main_file
                
                # Collect stacks (prefetched)
                for stack in merge_photo.stacks.all():
                    if stack.id not in existing_stack_ids:
                        new_stacks.append(PhotoStacks(photo_id=keep_photo.pk, photostack_id=stack.id))
                        existing_stack_ids.add(stack.id)
                
                # Collect duplicates (prefetched)
                for dup_group in merge_photo.duplicates.all():
                    if dup_group.id not in existing_duplicate_ids:
                        new_duplicates.append(PhotoDuplicates(photo_id=keep_photo.pk, duplicate_id=dup_group.id))
                        existing_duplicate_ids.add(dup_group.id)
                
                # Collect shared_to (prefetched)
                for user in merge_photo.shared_to.all():
                    if user.id not in existing_shared_ids:
                        new_shared.append(PhotoSharedTo(photo_id=keep_photo.pk, user_id=user.id))
                        existing_shared_ids.add(user.id)
                
                # Collect album memberships (prefetched)
                for album in merge_photo.albumuser_set.all():
                    if album.id not in existing_album_ids:
                        new_albums.append(AlbumUserPhotos(albumuser_id=album.id, photo_id=keep_photo.pk))
                        existing_album_ids.add(album.id)
            
            # Bulk create all M2M relationships
            if new_files:
                PhotoFiles.objects.bulk_create(new_files, ignore_conflicts=True)
            if new_stacks:
                PhotoStacks.objects.bulk_create(new_stacks, ignore_conflicts=True)
            if new_duplicates:
                PhotoDuplicates.objects.bulk_create(new_duplicates, ignore_conflicts=True)
            if new_shared:
                PhotoSharedTo.objects.bulk_create(new_shared, ignore_conflicts=True)
            if new_albums:
                AlbumUserPhotos.objects.bulk_create(new_albums, ignore_conflicts=True)
            
            # Update main_file if needed
            if main_file_candidate:
                keep_photo.main_file = main_file_candidate
                keep_photo.save(update_fields=['main_file'])
            
            # Bulk delete merge photos
            # Django's delete() on queryset handles M2M clearing automatically
            Photo.objects.filter(pk__in=merge_ids).delete()
            merged_count += len(merge_ids)
        
        processed += 1
        if processed % BATCH_SIZE == 0:
            print(f"  Processed {processed}/{total_count} duplicate groups ({100*processed//total_count}%)")
    
    if merged_count > 0:
        print(f"Completed cleanup. Deleted {merged_count} duplicate Photo records.")


def reverse_cleanup(apps, schema_editor):
    """
    Reverse migration is a no-op since deleted photos cannot be restored.
    """
    pass


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0114_add_file_path_unique'),
    ]

    operations = [
        migrations.RunPython(
            cleanup_duplicate_photos,
            reverse_cleanup,
        ),
    ]


================================================
FILE: api/migrations/0116_cleanup_duplicate_groups_removed_photos.py
================================================
# Generated migration to clean up Duplicate groups containing removed photos
# This removes removed=True photos from groups and deletes groups with 0-1 photos remaining

from django.db import migrations


def cleanup_duplicate_groups(apps, schema_editor):
    """
    Remove removed=True photos from Duplicate groups.
    Delete Duplicate groups that end up with 0 or 1 photos.
    
    This is needed because migration 0115 marks duplicate Photos as removed=True
    but doesn't remove them from their Duplicate group M2M relationships.
    """
    Duplicate = apps.get_model('api', 'Duplicate')
    
    cleaned_count = 0
    deleted_count = 0
    
    for duplicate in Duplicate.objects.all():
        # Get removed photos in this group
        removed_photos = duplicate.photos.filter(removed=True)
        removed_count = removed_photos.count()
        
        if removed_count > 0:
            # Remove the removed photos from the group
            for photo in removed_photos:
                duplicate.photos.remove(photo)
            cleaned_count += removed_count
        
        # Check if group now has 0 or 1 photos (no longer a valid duplicate group)
        remaining = duplicate.photos.filter(removed=False).count()
        if remaining <= 1:
            # Clear remaining photos first to avoid orphan M2M entries
            duplicate.photos.clear()
            duplicate.delete()
            deleted_count += 1
    
    if cleaned_count or deleted_count:
        print(f"Cleaned {cleaned_count} removed photos from duplicate groups")
        print(f"Deleted {deleted_count} empty/single-photo duplicate groups")


def reverse_cleanup(apps, schema_editor):
    """
    Reverse migration is a no-op since we can't restore removed photos to groups.
    The photos still exist (just marked removed=True) but we don't track which
    groups they belonged to.
    """
    pass


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0115_cleanup_duplicate_photos'),
    ]

    operations = [
        migrations.RunPython(cleanup_duplicate_groups, reverse_cleanup),
    ]


================================================
FILE: api/migrations/0117_delete_removed_photos.py
================================================
# Generated migration to delete removed photos
# These are duplicate photos that were merged in migration 0115

from django.db import migrations


def delete_removed_photos(apps, schema_editor):
    """
    Delete all Photo records marked as removed=True.
    
    These are duplicate photos that were already merged in migration 0115.
    Their relationships (faces, albums, files, stacks, duplicates) were
    reassigned to the kept photo, so these are now orphan records.
    
    Deleting them is cleaner than soft-delete because:
    1. No need to filter removed=True everywhere in queries
    2. No orphan data cluttering the database
    3. Clearer data model
    """
    Photo = apps.get_model('api', 'Photo')
    
    # Find all removed photos
    removed_photos = Photo.objects.filter(removed=True)
    count = removed_photos.count()
    
    if count > 0:
        # Delete them - relationships were already cleared/reassigned in 0115
        removed_photos.delete()
        print(f"Deleted {count} removed (duplicate) photos")


def reverse_delete(apps, schema_editor):
    """
    Reverse migration is a no-op - deleted photos cannot be restored.
    """
    pass


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0116_cleanup_duplicate_groups_removed_photos'),
    ]

    operations = [
        migrations.RunPython(delete_removed_photos, reverse_delete),
    ]


================================================
FILE: api/migrations/0118_alter_longrunningjob_job_type.py
================================================
# Generated by Django 5.2.9 on 2026-01-28 13:43

from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0117_delete_removed_photos'),
    ]

    operations = [
        migrations.AlterField(
            model_name='longrunningjob',
            name='job_type',
            field=models.PositiveIntegerField(choices=[(1, 'Scan Photos'), (2, 'Generate Event Albums'), (3, 'Regenerate Event Titles'), (4, 'Train Faces'), (5, 'Delete Missing Photos'), (7, 'Scan Faces'), (6, 'Calculate Clip Embeddings'), (8, 'Find Similar Faces'), (9, 'Download Selected Photos'), (10, 'Download Models'), (11, 'Add Geolocation'), (12, 'Generate Tags'), (13, 'Generate Face Embeddings'), (14, 'Scan Missing Photos'), (15, 'Detect Duplicate Photos'), (16, 'Repair File Variants')]),
        ),
    ]


================================================
FILE: api/migrations/0119_add_public_sharing_options.py
================================================
# Generated migration for public sharing options

from django.db import migrations, models
import api.models.user


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0118_alter_longrunningjob_job_type"),
    ]

    operations = [
        # Add public_sharing_defaults to User model
        migrations.AddField(
            model_name="user",
            name="public_sharing_defaults",
            field=models.JSONField(default=api.models.user.get_default_public_sharing_settings),
        ),
        # Add sharing option fields to AlbumUserShare model
        migrations.AddField(
            model_name="albumusershare",
            name="share_location",
            field=models.BooleanField(blank=True, default=None, null=True),
        ),
        migrations.AddField(
            model_name="albumusershare",
            name="share_camera_info",
            field=models.BooleanField(blank=True, default=None, null=True),
        ),
        migrations.AddField(
            model_name="albumusershare",
            name="share_timestamps",
            field=models.BooleanField(blank=True, default=None, null=True),
        ),
        migrations.AddField(
            model_name="albumusershare",
            name="share_captions",
            field=models.BooleanField(blank=True, default=None, null=True),
        ),
        migrations.AddField(
            model_name="albumusershare",
            name="share_faces",
            field=models.BooleanField(blank=True, default=None, null=True),
        ),
    ]


================================================
FILE: api/migrations/0120_rename_thumbnails_uuid_to_hash.py
================================================
# Migration to rename thumbnail files from UUID to image_hash
# This migration fixes the thumbnail naming issue where thumbnails were being
# created with UUID names but the frontend expected image_hash names

import os
from django.conf import settings
from django.db import migrations


def rename_thumbnails_uuid_to_hash(apps, schema_editor):
    """
    Rename existing thumbnail files from UUID-based names to image_hash-based names.
    This only renames files that exist and updates the database records.
    Uses batch processing for improved performance with large photo collections.
    """
    Photo = apps.get_model('api', 'Photo')
    Thumbnail = apps.get_model('api', 'Thumbnail')
    
    BATCH_SIZE = 1000  # Process thumbnails in batches of 1000
    
    # Get total count for progress reporting
    total_count = Thumbnail.objects.count()
    print(f"Starting thumbnail migration for {total_count} photos...")
    
    renamed_count = 0
    skipped_count = 0
    processed_count = 0
    
    # Process thumbnails in batches to avoid loading all into memory at once
    thumbnails_to_update = []
    
    # Use iterator() to avoid loading all objects into memory
    # Process in batches using only() to load only required fields
    for thumbnail in Thumbnail.objects.select_related('photo').only(
        'photo_id', 'photo__id', 'photo__image_hash', 'photo__video',
        'thumbnail_big', 'square_thumbnail', 'square_thumbnail_small'
    ).iterator(chunk_size=BATCH_SIZE):
        photo = thumbnail.photo
        photo_uuid = str(photo.id)
        photo_hash = photo.image_hash
        
        # Skip if UUID and hash are the same (shouldn't happen, but be safe)
        if photo_uuid == photo_hash:
            skipped_count += 1
            processed_count += 1
            continue
        
        # Process each thumbnail type
        thumbnail_types = [
            ('thumbnails_big', '.webp', False),  # (path, extension, is_video)
            ('square_thumbnails', '.webp' if not photo.video else '.mp4', photo.video),
            ('square_thumbnails_small', '.webp' if not photo.video else '.mp4', photo.video),
        ]
        
        needs_update = False
        
        for thumb_dir, ext, _ in thumbnail_types:
            old_path = os.path.join(settings.MEDIA_ROOT, thumb_dir, f"{photo_uuid}{ext}")
            new_path = os.path.join(settings.MEDIA_ROOT, thumb_dir, f"{photo_hash}{ext}")
            
            # Only rename if old file exists and new file doesn't
            if os.path.exists(old_path) and not os.path.exists(new_path):
                try:
                    os.rename(old_path, new_path)
                    needs_update = True
                except Exception as e:
                    print(f"Warning: Could not rename {old_path} to {new_path}: {e}")
        
        # Queue for batch update if any files were renamed
        if needs_update:
            filetype = '.mp4' if photo.video else '.webp'
            thumbnail.thumbnail_big = os.path.join('thumbnails_big', f"{photo_hash}.webp")
            thumbnail.square_thumbnail = os.path.join('square_thumbnails', f"{photo_hash}{filetype}")
            thumbnail.square_thumbnail_small = os.path.join('square_thumbnails_small', f"{photo_hash}{filetype}")
            thumbnails_to_update.append(thumbnail)
            renamed_count += 1
        else:
            skipped_count += 1
        
        processed_count += 1
        
        # Batch update every BATCH_SIZE records
        if len(thumbnails_to_update) >= BATCH_SIZE:
            Thumbnail.objects.bulk_update(
                thumbnails_to_update,
                ['thumbnail_big', 'square_thumbnail', 'square_thumbnail_small'],
                batch_size=BATCH_SIZE
            )
            print(f"Progress: {processed_count}/{total_count} processed, {renamed_count} renamed, {skipped_count} skipped")
            thumbnails_to_update = []
    
    # Update any remaining thumbnails in the final batch
    if thumbnails_to_update:
        Thumbnail.objects.bulk_update(
            thumbnails_to_update,
            ['thumbnail_big', 'square_thumbnail', 'square_thumbnail_small'],
            batch_size=BATCH_SIZE
        )
    
    print(f"Migration complete: {renamed_count} photos renamed, {skipped_count} photos skipped")


def reverse_rename_thumbnails(apps, schema_editor):
    """
    This migration cannot be easily reversed because we would need to know
    the original UUID for each photo. The forward migration renames files
    from UUID to image_hash, but reversing would require knowing which UUID
    was used originally, which we don't store.
    """
    print("Warning: This migration cannot be reversed. Thumbnails will keep image_hash names.")
    print("If you need to revert, regenerate thumbnails from scratch.")


class Migration(migrations.Migration):

    dependencies = [
        ('api', '0119_add_public_sharing_options'),
    ]

    operations = [
        migrations.RunPython(
            rename_thumbnails_uuid_to_hash,
            reverse_rename_thumbnails,
        ),
    ]


================================================
FILE: api/migrations/0121_add_default_tagging_model.py
================================================
"""
Migration to add a default TAGGING_MODEL entry to the constance database.

When TAGGING_MODEL was added to CONSTANCE_CONFIG, existing systems that upgraded
would not have this key in the constance database backend. While constance normally
falls back to the default from CONSTANCE_CONFIG, this migration explicitly sets the
default to ensure compatibility with old systems.
"""

from django.db import migrations


def add_default_tagging_model(apps, schema_editor):
    """Add TAGGING_MODEL default value to constance DB if it doesn't exist."""
    try:
        Constance = apps.get_model("constance", "Constance")
        if not Constance.objects.filter(key="TAGGING_MODEL").exists():
            Constance.objects.create(key="TAGGING_MODEL", value='"places365"')
    except LookupError:
        # constance model not available, skip
        pass


def reverse_migration(apps, schema_editor):
    """Remove TAGGING_MODEL from constance DB if it has the default value."""
    try:
        Constance = apps.get_model("constance", "Constance")
        Constance.objects.filter(key="TAGGING_MODEL", value='"places365"').delete()
    except LookupError:
        pass


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0120_rename_thumbnails_uuid_to_hash"),
    ]

    operations = [
        migrations.RunPython(add_default_tagging_model, reverse_migration),
    ]


================================================
FILE: api/migrations/0121_user_save_face_tags_to_disk.py
================================================
from django.db import migrations, models


class Migration(migrations.Migration):

    dependencies = [
        ("api", "0120_rename_thumbnails_uuid_to_hash"),
    ]

    operations = [
        migrations.AddField(
            model_name="user",
            name="save_face_tags_to_disk",
            field=models.BooleanField(default=False),
        ),
    ]


================================================
FILE: api/migrations/__init__.py
================================================


================================================
FILE: api/ml_models.py
================================================
import math
import os
import tarfile
from pathlib import Path

import requests
from constance import config as site_config
from django.conf import settings

from api import util
from api.models.long_running_job import LongRunningJob


class MlTypes:
    CAPTIONING = "captioning"
    FACE_RECOGNITION = "face_recognition"
    CATEGORIES = "categories"
    CLIP = "clip"
    LLM = "llm"
    MOONDREAM = "moondream"
    TAGGING = "tagging"


ML_MODELS = [
    {
        "id": 1,
        "name": "im2txt",
        "url": "https://github.com/LibrePhotos/librephotos-docker/releases/download/0.1/im2txt.tar.gz",
        "type": MlTypes.CAPTIONING,
        "unpack-command": "tar -zxC",
        "target-dir": "im2txt",
    },
    {
        "id": 2,
        "name": "clip-embeddings",
        "url": "https://github.com/LibrePhotos/librephotos-docker/releases/download/0.1/clip-embeddings.tar.gz",
        "type": MlTypes.CLIP,
        "unpack-command": "tar -zxC",
        "target-dir": "clip-embeddings",
    },
    {
        "id": 3,
        "name": "places365",
        "url": "https://github.com/LibrePhotos/librephotos-docker/releases/download/0.1/places365.tar.gz",
        "type": MlTypes.CATEGORIES,
        "unpack-command": "tar -zxC",
        "target-dir": "places365",
    },
    {
        "id": 4,
        "name": "resnet18",
        "url": "https://download.pytorch.org/models/resnet18-5c106cde.pth",
        "type": MlTypes.CATEGORIES,
        "unpack-command": None,
        "target-dir": "resnet18-5c106cde.pth",
    },
    {
        "id": 6,
        "name": "blip_base_capfilt_large",
        "url": "https://huggingface.co/derneuere/librephotos_models/resolve/main/blip_large.tar.gz?download=true",
        "type": MlTypes.CAPTIONING,
        "unpack-command": "tar -zxC",
        "target-dir": "blip",
    },
    {
        "id": 8,
        "name": "mistral-7b-instruct-v0.2.Q5_K_M",
        "url": "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.2-GGUF/resolve/main/mistral-7b-instruct-v0.2.Q5_K_M.gguf?download=true",
        "type": MlTypes.LLM,
        "unpack-command": None,
        "target-dir": "mistral-7b-instruct-v0.2.Q5_K_M.gguf",
    },
    {
        "id": 11,
        "name": "siglip2",
        "url": "https://huggingface.co/onnx-community/siglip2-base-patch16-384-ONNX/resolve/main/onnx/vision_model.onnx",
        "type": MlTypes.TAGGING,
        "unpack-command": None,
        "target-dir": "siglip2/vision_model.onnx",
        "additional_files": [
            {
                "url": "https://huggingface.co/onnx-community/siglip2-base-patch16-384-ONNX/resolve/main/onnx/text_model.onnx",
                "target": "siglip2/text_model.onnx",
            },
            {
                "url": "https://huggingface.co/onnx-community/siglip2-base-patch16-384-ONNX/resolve/main/tokenizer.model",
                "target": "siglip2/tokenizer.model",
            },
        ],
    },
    {
        # Moondream 2 GGUF model for llama-cpp-python multimodal support
        "id": 9,
        "name": "moondream",
        "url": "https://huggingface.co/moondream/moondream-2b-2025-04-14-4bit/resolve/main/moondream2-text-model-f16.gguf?download=true",
        "type": MlTypes.MOONDREAM,
        "unpack-command": None,
        "target-dir": "moondream2-text-model-f16.gguf",
        "additional_files": [
            {
                "url": "https://huggingface.co/moondream/moondream-2b-2025-04-14-4bit/resolve/main/moondream2-mmproj-f16.gguf?download=true",
                "target": "moondream2-mmproj-f16.gguf",
            }
        ],
    },
]


def download_model(model):
    model = model.copy()
    if model["type"] == MlTypes.LLM:
        util.logger.info("Downloading LLM model")
        model_to_download = site_config.LLM_MODEL
        if not model_to_download or str(model_to_download).strip().lower() == "none":
            util.logger.info("No LLM model selected")
            return
        util.logger.info(f"Model to download: {model_to_download}")
        # Look through ML_MODELS and find the model with the name
        for ml_model in ML_MODELS:
            if ml_model["name"] == model_to_download:
                model = ml_model
    elif model["type"] == MlTypes.MOONDREAM:
        util.logger.info("Downloading Moondream model")
        model_to_download = site_config.LLM_MODEL
        if model_to_download != "moondream":
            util.logger.info("Moondream not selected")
            return
        util.logger.info(f"Model to download: {model_to_download}")
        # Look through ML_MODELS and find the model with the name
        for ml_model in ML_MODELS:
            if ml_model["name"] == model_to_download:
                model = ml_model
    elif model["type"] == MlTypes.CAPTIONING:
        util.logger.info("Downloading captioning model")
        model_to_download = site_config.CAPTIONING_MODEL
        util.logger.info(f"Model to download: {model_to_download}")
        # Look through ML_MODELS and find the model with the name
        for ml_model in ML_MODELS:
            if ml_model["name"] == model_to_download:
                model = ml_model
    elif model["type"] == MlTypes.TAGGING:
        util.logger.info("Downloading tagging model")
        model_to_download = site_config.TAGGING_MODEL
        if model_to_download != model["name"]:
            util.logger.info(
                f"Tagging model {model['name']} not selected (current: {model_to_download})"
            )
            return
        util.logger.info(f"Model to download: {model_to_download}")

    util.logger.info(f"Downloading model {model['name']}")
    model_folder = Path(settings.MEDIA_ROOT) / "data_models"

    # Handle regular models
    target_dir = model_folder / model["target-dir"]

    if target_dir.exists():
        util.logger.info(f"Model {model['name']} already downloaded")
        # Check if all additional files exist for models like Moondream
        if model.get("additional_files"):
            for additional_file in model["additional_files"]:
                additional_target = model_folder / additional_file["target"]
                if not additional_target.exists():
                    util.logger.info(
                        f"Additional file {additional_file['target']} missing, downloading..."
                    )
                    _download_file(
                        additional_file["url"],
                        additional_target,
                        f"{model['name']} ({additional_file['target']})",
                    )
        return

    if model["unpack-command"] == "tar -zxC":
        target_dir = model_folder / (model["target-dir"] + ".tar.gz")
    if model["unpack-command"] == "tar -xvf":
        target_dir = model_folder / (model["target-dir"] + ".tar")
    if model["unpack-command"] is None:
        target_dir = model_folder / model["target-dir"]

    _download_file(model["url"], target_dir, model["name"])

    if model["unpack-command"] == "tar -zxC":
        with tarfile.open(target_dir, mode="r:gz") as tar:
            tar.extractall(path=model_folder)
        os.remove(target_dir)
    if model["unpack-command"] == "tar -xvf":
        with tarfile.open(target_dir, mode="r:") as tar:
            tar.extractall(path=model_folder)
        os.remove(target_dir)

    # Download additional files if they exist (e.g., mmproj for Moondream)
    if model.get("additional_files"):
        for additional_file in model["additional_files"]:
            additional_target = model_folder / additional_file["target"]
            if not additional_target.exists():
                _download_file(
                    additional_file["url"],
                    additional_target,
                    f"{model['name']} ({additional_file['target']})",
                )


def _download_file(url, target_path, model_name):
    """Helper function to download a single file with progress tracking"""
    target_path = Path(target_path)
    target_path.parent.mkdir(parents=True, exist_ok=True)
    response = requests.get(url, stream=True, allow_redirects=True)
    total_size = int(response.headers.get("content-length", 0))
    block_size = 1024
    current_progress = 0
    previous_percentage = -1

    with open(target_path, "wb") as target_file:
        for chunk in response.iter_content(chunk_size=block_size):
            if chunk:
                target_file.write(chunk)
                current_progress += len(chunk)

                if total_size > 0:
                    percentage = math.floor((current_progress / total_size) * 100)

                    if percentage != previous_percentage:
                        util.logger.info(
                            f"Downloading {model_name}: {current_progress}/{total_size} ({percentage}%)"
                        )
                        previous_percentage = percentage

    if total_size == 0:
        util.logger.info(
            f"Downloaded {model_name}: {current_progress} bytes (size unknown during transfer)"
        )


def download_models(user):
    lrj = LongRunningJob.create_job(
        user=user,
        job_type=LongRunningJob.JOB_DOWNLOAD_MODELS,
        start_now=True,
    )
    lrj.update_progress(current=0, target=len(ML_MODELS))

    model_folder = Path(settings.MEDIA_ROOT) / "data_models"
    model_folder.mkdir(parents=True, exist_ok=True)

    for idx, model in enumerate(ML_MODELS):
        download_model(model)
        lrj.update_progress(current=idx + 1)

    lrj.complete()


def do_all_models_exist():
    model_folder = Path(settings.MEDIA_ROOT) / "data_models"
    for model in ML_MODELS:
        if model["type"] in (MlTypes.LLM, MlTypes.MOONDREAM, MlTypes.TAGGING):
            if not model and model != "none":
                continue

        # Check main model file
        target_dir = model_folder / model["target-dir"]
        if not target_dir.exists():
            return False

        # Check additional files if they exist (like mmproj for Moondream)
        if model.get("additional_files"):
            for additional_file in model["additional_files"]:
                additional_target = model_folder / additional_file["target"]
                if not additional_target.exists():
                    return False
    return True


================================================
FILE: api/models/__init__.py
================================================
from api.models.album_auto import AlbumAuto
from api.models.album_date import AlbumDate
from api.models.album_place import AlbumPlace
from api.models.album_thing import AlbumThing
from api.models.album_user import AlbumUser
from api.models.cluster import Cluster
from api.models.duplicate import Duplicate
from api.models.face import Face
from api.models.file import File
from api.models.long_running_job import LongRunningJob
from api.models.person import Person
from api.models.photo import Photo
from api.models.photo_caption import PhotoCaption
from api.models.photo_metadata import MetadataEdit, MetadataFile, PhotoMetadata
from api.models.photo_search import PhotoSearch
from api.models.photo_stack import PhotoStack
from api.models.stack_review import StackReview
from api.models.thumbnail import Thumbnail
from api.models.user import User

__all__ = [
    "AlbumAuto",
    "AlbumDate",
    "AlbumPlace",
    "AlbumThing",
    "AlbumUser",
    "Cluster",
    "Duplicate",
    "Face",
    "LongRunningJob",
    "MetadataEdit",
    "MetadataFile",
    "Person",
    "Photo",
    "PhotoCaption",
    "PhotoMetadata",
    "PhotoSearch",
    "PhotoStack",
    "StackReview",
    "Thumbnail",
    "User",
    "File",
]


================================================
FILE: api/models/album_auto.py
================================================
from collections import Counter

from django.db import models

from api import util
from api.models.person import Person
from api.models.photo import Photo
from api.models.user import User, get_deleted_user


class AlbumAuto(models.Model):
    title = models.CharField(
        blank=False, null=False, max_length=512, default="Untitled Album"
    )
    timestamp = models.DateTimeField(db_index=True)
    created_on = models.DateTimeField(auto_now=False, db_index=True)
    gps_lat = models.FloatField(blank=True, null=True)
    gps_lon = models.FloatField(blank=True, null=True)
    photos = models.ManyToManyField(Photo)
    favorited = models.BooleanField(default=False, db_index=True)
    owner = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None
    )

    shared_to = models.ManyToManyField(User, related_name="album_auto_shared_to")

    class Meta:
        unique_together = ("timestamp", "owner")

    def _generate_title(self):
        try:
            weekday = ""
            time = ""
            loc = ""
            if self.timestamp:
                weekday = util.weekdays[self.timestamp.isoweekday()]
                hour = self.timestamp.hour
                if hour > 0 and hour < 5:
                    time = "Early Morning"
                elif hour >= 5 and hour < 12:
                    time = "Morning"
                elif hour >= 12 and hour < 18:
                    time = "Afternoon"
                elif hour >= 18 and hour <= 24:
                    time = "Evening"

            when = " ".join([weekday, time])

            photos = self.photos.all()

            loc = ""
            pep = ""

            places = []
            people = []
            timestamps = []

            for photo in photos:
                if (
                    photo.geolocation_json
                    and "places" in photo.geolocation_json.keys()
                    and len(photo.geolocation_json["places"]) > 0
                ):
                    places = photo.geolocation_json["places"]

                timestamps.append(photo.exif_timestamp)

                faces = photo.faces.all()
                for face in faces:
                    people.append(face.person.name)

            if len(places) > 0:
                cnts_places = Counter(places)
                loc = "in " + " and ".join(dict(cnts_places.most_common(2)).keys())
            if len(people) > 0:
                cnts_people = Counter(people)
                names = dict(
                    [
                        (k, v)
                        for k, v in cnts_people.most_common(2)
                        if k.lower() != "unknown"
                        and k.lower() != Person.UNKNOWN_PERSON_NAME
                    ]
                ).keys()
                if len(names) > 0:
                    pep = "with " + " and ".join(names)
            if len(timestamps) > 0:
                if (max(timestamps) - min(timestamps)).days >= 3:
                    when = "%d days" % ((max(timestamps) - min(timestamps)).days)

                weekend = [5, 6]
                if (
                    max(timestamps).weekday() in weekend
                    and min(timestamps).weekday() in weekend
                    and not (max(timestamps).weekday() == min(timestamps).weekday())
                ):
                    when = "Weekend"

            title = " ".join([when, pep, loc]).strip()
            # Ensure title is never empty
            if not title:
                title = f"Album from {self.timestamp.strftime('%Y-%m-%d')}"
            self.title = title
            self.save()
        except Exception as e:
            util.logger.exception(e)
            # Set a fallback title if something goes wrong
            self.title = f"Album from {self.timestamp.strftime('%Y-%m-%d')}"
            self.save()

    def __str__(self):
        return "%d: %s" % (self.id, self.title)


================================================
FILE: api/models/album_date.py
================================================
from django.db import models

from api.models.photo import Photo
from api.models.user import User, get_deleted_user


class AlbumDate(models.Model):
    title = models.CharField(blank=True, default="", max_length=512, db_index=True)
    date = models.DateField(db_index=True, null=True)
    photos = models.ManyToManyField(Photo)
    favorited = models.BooleanField(default=False, db_index=True)
    location = models.JSONField(blank=True, db_index=True, null=True)
    owner = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None
    )
    shared_to = models.ManyToManyField(User, related_name="album_date_shared_to")
    objects = models.Manager()

    class Meta:
        unique_together = ("date", "owner")

    def __str__(self):
        return str(self.date) + " (" + str(self.owner) + ")"

    def ordered_photos(self):
        return self.photos.all().order_by("-exif_timestamp")


def get_or_create_album_date(date, owner):
    try:
        return AlbumDate.objects.get_or_create(date=date, owner=owner)[0]
    except AlbumDate.MultipleObjectsReturned:
        return AlbumDate.objects.filter(date=date, owner=owner).first()


def get_album_date(date, owner):
    try:
        return AlbumDate.objects.get(date=date, owner=owner)
    except Exception:
        return None


def get_album_nodate(owner):
    return AlbumDate.objects.get_or_create(date=None, owner=owner)[0]


================================================
FILE: api/models/album_place.py
================================================
from django.db import models

from api.models.photo import Photo
from api.models.user import User, get_deleted_user


class AlbumPlace(models.Model):
    title = models.CharField(max_length=512, db_index=True)
    photos = models.ManyToManyField(Photo)
    geolocation_level = models.IntegerField(db_index=True, null=True)
    favorited = models.BooleanField(default=False, db_index=True)
    owner = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None
    )

    shared_to = models.ManyToManyField(User, related_name="album_place_shared_to")

    class Meta:
        unique_together = ("title", "owner")

    def __str__(self):
        return "%d: %s" % (self.id, self.title)


def get_album_place(title, owner):
    return AlbumPlace.objects.get_or_create(title=title, owner=owner)[0]


================================================
FILE: api/models/album_thing.py
================================================
from django.db import models
from django.db.models.signals import m2m_changed
from django.dispatch import receiver

from api.models.photo import Photo
from api.models.user import User, get_deleted_user


def update_default_cover_photo(instance):
    if instance.cover_photos.count() < 4:
        photos_to_add = instance.photos.filter(hidden=False)[
            : 4 - instance.cover_photos.count()
        ]
        instance.cover_photos.add(*photos_to_add)


class AlbumThing(models.Model):
    title = models.CharField(max_length=512, db_index=True)
    photos = models.ManyToManyField(Photo)
    thing_type = models.CharField(max_length=512, db_index=True, null=True)
    favorited = models.BooleanField(default=False, db_index=True)
    owner = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None
    )
    shared_to = models.ManyToManyField(User, related_name="album_thing_shared_to")
    cover_photos = models.ManyToManyField(
        Photo, related_name="album_thing_cover_photos"
    )
    photo_count = models.IntegerField(default=0)

    class Meta:
        constraints = [
            models.UniqueConstraint(
                fields=["title", "thing_type", "owner"], name="unique AlbumThing"
            )
        ]

    def save(self, *args, **kwargs):
        super().save(*args, **kwargs)

    def update_default_cover_photo(self):
        update_default_cover_photo(self)

    def __str__(self):
        return "%d: %s" % (self.id or 0, self.title)


@receiver(m2m_changed, sender=AlbumThing.photos.through)
def update_photo_count(sender, instance, action, reverse, model, pk_set, **kwargs):
    if action == "post_add" or (action == "post_remove" and not reverse):
        count = instance.photos.filter(hidden=False).count()
        instance.photo_count = count
        instance.save(update_fields=["photo_count"])
        instance.update_default_cover_photo()


def get_album_thing(title, owner, thing_type=None):
    return AlbumThing.objects.get_or_create(
        title=title, owner=owner, thing_type=thing_type
    )[0]


================================================
FILE: api/models/album_user.py
================================================
from django.db import models

from api.models.photo import Photo
from api.models.user import User, get_deleted_user


class AlbumUser(models.Model):
    title = models.CharField(max_length=512)
    created_on = models.DateTimeField(auto_now=True, db_index=True)
    photos = models.ManyToManyField(Photo)
    favorited = models.BooleanField(default=False, db_index=True)
    owner = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None
    )
    cover_photo = models.ForeignKey(
        Photo,
        related_name="album_user",
        on_delete=models.SET_NULL,
        blank=False,
        null=True,
    )

    shared_to = models.ManyToManyField(User, related_name="album_user_shared_to")

    def __str__(self):
        return f"{self.title} ({self.owner.username})"

    class Meta:
        unique_together = ("title", "owner")


================================================
FILE: api/models/album_user_share.py
================================================
import uuid
from django.db import models
from django.utils import timezone

from api.models.album_user import AlbumUser


class AlbumUserShare(models.Model):
    album = models.OneToOneField(
        AlbumUser, on_delete=models.CASCADE, related_name="share"
    )
    enabled = models.BooleanField(default=False, db_index=True)
    slug = models.SlugField(
        max_length=64, unique=True, null=True, blank=True, db_index=True
    )
    expires_at = models.DateTimeField(null=True, blank=True, db_index=True)

    # Sharing options - None means inherit from user defaults, True/False overrides
    share_location = models.BooleanField(null=True, blank=True, default=None)
    share_camera_info = models.BooleanField(null=True, blank=True, default=None)
    share_timestamps = models.BooleanField(null=True, blank=True, default=None)
    share_captions = models.BooleanField(null=True, blank=True, default=None)
    share_faces = models.BooleanField(null=True, blank=True, default=None)

    def ensure_slug(self) -> None:
        if self.enabled and not self.slug:
            base = uuid.uuid4().hex[:12]
            candidate = base
            idx = 0
            while (
                AlbumUserShare.objects.filter(slug=candidate)
                .exclude(id=self.id)
                .exists()
            ):
                idx += 1
                candidate = f"{base}-{idx}"
            self.slug = candidate

    def is_active(self) -> bool:
        if not self.enabled:
            return False
        if self.expires_at is None:
            return True
        return self.expires_at >= timezone.now()

    def save(self, *args, **kwargs):
        if self.enabled and not self.slug:
            self.ensure_slug()
        super().save(*args, **kwargs)

    def get_effective_sharing_settings(self) -> dict:
        """Resolve effective sharing settings.
        
        Priority: album override > user defaults > system defaults (all False)
        """
        from api.models.user import get_default_public_sharing_settings
        
        # Start with system defaults (all False)
        defaults = get_default_public_sharing_settings()
        
        # Apply user defaults if available
        user_defaults = getattr(self.album.owner, 'public_sharing_defaults', None)
        if user_defaults:
            defaults.update(user_defaults)
        
        # Apply album-level overrides (only non-None values)
        overrides = {
            'share_location': self.share_location,
            'share_camera_info': self.share_camera_info,
            'share_timestamps': self.share_timestamps,
            'share_captions': self.share_captions,
            'share_faces': self.share_faces,
        }
        
        for key, value in overrides.items():
            if value is not None:
                defaults[key] = value
        
        return defaults


================================================
FILE: api/models/cluster.py
================================================
import numpy as np
from django.core.exceptions import MultipleObjectsReturned
from django.db import models

from api.models.person import Person
from api.models.user import User, get_deleted_user
from api.util import logger

UNKNOWN_CLUSTER_ID = -1
UNKNOWN_CLUSTER_NAME = "Other Unknown Cluster"


class Cluster(models.Model):
    person = models.ForeignKey(
        Person,
        on_delete=models.SET_NULL,
        related_name="clusters",
        blank=True,
        null=True,
    )
    mean_face_encoding = models.TextField()
    cluster_id = models.IntegerField(null=True)
    name = models.TextField(null=True)

    owner = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None, null=True
    )

    def __str__(self):
        return "%d" % self.id

    def get_mean_encoding_array(self) -> np.ndarray:
        return np.frombuffer(bytes.fromhex(self.mean_face_encoding))

    def set_metadata(self, all_vectors):
        self.mean_face_encoding = (
            Cluster.calculate_mean_face_encoding(all_vectors).tobytes().hex()
        )

    @staticmethod
    def get_or_create_cluster_by_name(user: User, name):
        return Cluster.objects.get_or_create(owner=user, name=name)[0]

    @staticmethod
    def get_or_create_cluster_by_id(user: User, cluster_id: int):
        try:
            return Cluster.objects.get_or_create(owner=user, cluster_id=cluster_id)[0]
        except MultipleObjectsReturned:
            logger.error(
                "Multiple clusters found with id %d. Choosing first one" % cluster_id
            )
            return Cluster.objects.filter(owner=user, cluster_id=cluster_id).first()

    @staticmethod
    def calculate_mean_face_encoding(all_encodings):
        return np.mean(a=all_encodings, axis=0, dtype=np.float64)


def get_unknown_cluster(user: User) -> Cluster:
    unknown_cluster: Cluster = Cluster.get_or_create_cluster_by_id(
        user, UNKNOWN_CLUSTER_ID
    )
    if unknown_cluster.person is not None:
        unknown_cluster.person = None
        unknown_cluster.name = UNKNOWN_CLUSTER_NAME
        unknown_cluster.save()
    return unknown_cluster


================================================
FILE: api/models/duplicate.py
================================================
"""
Duplicate model for tracking duplicate photo groups.

Duplicates are photos that are either:
- EXACT_COPY: Byte-for-byte identical files (same MD5 hash, different paths)
- VISUAL_DUPLICATE: Visually similar photos (similar perceptual hash or CLIP embeddings)

Duplicates are fundamentally different from Stacks:
- Duplicates represent redundant storage that the user may want to clean up
- Stacks represent related photos that should be kept together for organization

This separation allows:
- Focused workflows: Duplicates → review/delete, Stacks → browse/organize
- Different UX: Duplicates page focused on storage savings vs Stacks for browsing
- Clearer data model with appropriate fields for each concept
"""

import uuid

from django.db import models
from django.utils import timezone

from api.models.user import User, get_deleted_user


class Duplicate(models.Model):
    """
    Represents a group of duplicate photos that should be reviewed.
    
    Photos in a duplicate group are candidates for deletion - the user
    reviews them and decides which to keep.
    """

    class DuplicateType(models.TextChoices):
        # Exact byte-for-byte copies (same MD5 hash, different file paths)
        EXACT_COPY = "exact_copy", "Exact Copies"
        # Visually similar images (similar pHash or CLIP embeddings)
        VISUAL_DUPLICATE = "visual_duplicate", "Visual Duplicates"

    class ReviewStatus(models.TextChoices):
        # User hasn't reviewed yet
        PENDING = "pending", "Pending Review"
        # User selected a primary and trashed others
        RESOLVED = "resolved", "Resolved"
        # User marked as "not actually duplicates"
        DISMISSED = "dismissed", "Dismissed"

    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)

    owner = models.ForeignKey(
        User,
        on_delete=models.SET(get_deleted_user),
        related_name="duplicates",
    )

    duplicate_type = models.CharField(
        max_length=20,
        choices=DuplicateType.choices,
        default=DuplicateType.VISUAL_DUPLICATE,
        db_index=True,
    )

    review_status = models.CharField(
        max_length=20,
        choices=ReviewStatus.choices,
        default=ReviewStatus.PENDING,
        db_index=True,
    )

    # The photo the user chose to keep (set when resolved)
    kept_photo = models.ForeignKey(
        "Photo",
        on_delete=models.SET_NULL,
        null=True,
        blank=True,
        related_name="kept_in_duplicates",
    )

    # Detection metadata
    created_at = models.DateTimeField(auto_now_add=True)
    updated_at = models.DateTimeField(auto_now=True)
    reviewed_at = models.DateTimeField(null=True, blank=True)

    # For visual duplicates: similarity score (0-1, higher = more similar)
    similarity_score = models.FloatField(null=True, blank=True)

    # Potential storage savings if non-kept photos are removed (bytes)
    potential_savings = models.BigIntegerField(default=0)

    # Number of photos trashed when resolved
    trashed_count = models.IntegerField(default=0)

    # Optional note from user
    note = models.TextField(blank=True, null=True)

    class Meta:
        ordering = ["-created_at"]
        verbose_name = "Duplicate"
        verbose_name_plural = "Duplicates"
        indexes = [
            models.Index(fields=["owner", "duplicate_type"]),
            models.Index(fields=["owner", "review_status"]),
        ]

    def __str__(self):
        return f"Duplicate {self.id} - {self.duplicate_type} - {self.owner.username}"

    @property
    def photo_count(self):
        """Number of photos in this duplicate group."""
        return self.photos.count()

    def get_photos_ordered_by_quality(self):
        """
        Returns photos ordered by quality metrics.
        Higher resolution and larger file size are considered better quality.
        """
        return self.photos.select_related('metadata').order_by(
            "-metadata__width", "-metadata__height", "-size"
        )

    def auto_select_best_photo(self):
        """
        Automatically selects the best quality photo as the kept photo.
        Used as a suggestion for the user.
        
        For EXACT_COPY: Picks the one with shortest path (likely "original")
        For VISUAL_DUPLICATE: Highest resolution
        
        Returns:
            The best Photo instance or None
        """
        from django.db.models.functions import Length
        
        photos = self.photos.all()
        if not photos.exists():
            return None

        if self.duplicate_type == self.DuplicateType.EXACT_COPY:
            # For exact copies, pick the one with shortest path (likely "original")
            best = photos.order_by(Length("main_file__path")).first()
        else:
            # For visual duplicates: highest resolution
            from django.db.models import F
            best = photos.order_by(
                F("metadata__width") * F("metadata__height")
            ).last()

        return best

    def calculate_potential_savings(self):
        """
        Calculate how much storage could be saved if non-best photos
        are removed from disk.
        """
        best = self.auto_select_best_photo()
        if not best:
            self.potential_savings = 0
        else:
            # Sum size of all photos except best
            from django.db.models import Sum
            non_best_size = (
                self.photos.exclude(pk=best.pk)
                .aggregate(total=Sum("size"))
                .get("total", 0)
            ) or 0
            self.potential_savings = non_best_size

        self.save(update_fields=["potential_savings", "updated_at"])
        return self.potential_savings

    def resolve(self, kept_photo, trash_others: bool = True):
        """
        Mark the duplicate as resolved by selecting a photo to keep.
        
        Args:
            kept_photo: The Photo instance to keep
            trash_others: Whether to move other photos to trash
        """
        # Set the kept photo
        self.kept_photo = kept_photo
        self.review_status = self.ReviewStatus.RESOLVED
        self.reviewed_at = timezone.now()

        # Trash others if requested
        if trash_others:
            other_photos = self.photos.exclude(pk=kept_photo.pk)
            self.trashed_count = other_photos.update(in_trashcan=True)
        
        self.save()
        return self

    def dismiss(self):
        """Mark as 'not actually duplicates' and unlink photos from group."""
        self.review_status = self.ReviewStatus.DISMISSED
        self.reviewed_at = timezone.now()
        
        # Unlink photos from duplicate group (ManyToMany)
        for photo in self.photos.all():
            photo.duplicates.remove(self)
        
        self.save()
        return self

    def revert(self):
        """Revert a resolved duplicate, restoring trashed photos."""
        if self.review_status != self.ReviewStatus.RESOLVED:
            return 0

        # Restore trashed photos in this duplicate group
        restored_count = self.photos.filter(
            in_trashcan=True
        ).update(in_trashcan=False)

        # Reset to pending
        self.review_status = self.ReviewStatus.PENDING
        self.kept_photo = None
        self.trashed_count = 0
        self.reviewed_at = None

        self.save()
        return restored_count

    def merge_with(self, other_duplicate: "Duplicate"):
        """
        Merge another duplicate group into this one.
        All photos from the other group are moved here,
        and the other group is deleted.
        """
        if other_duplicate.pk == self.pk:
            return

        # Move all photos from other duplicate to this one (ManyToMany)
        for photo in other_duplicate.photos.all():
            photo.duplicates.add(self)
            photo.duplicates.remove(other_duplicate)

        self.calculate_potential_savings()

        # Delete the now-empty duplicate group
        other_duplicate.delete()

    @classmethod
    def create_or_merge(cls, owner, duplicate_type, photos, similarity_score=None):
        """
        Create a new duplicate group or merge into existing if any photo is already grouped.

        Args:
            owner: User who owns the photos
            duplicate_type: Type of duplicate (EXACT_COPY or VISUAL_DUPLICATE)
            photos: Queryset or list of Photo objects to group
            similarity_score: Optional similarity score for visual duplicates

        Returns:
            The Duplicate instance (new or existing)
        """
        photo_list = list(photos)
        if len(photo_list) < 2:
            return None

        # Check if any photo is already in a duplicate group of the same type
        existing_duplicates = cls.objects.filter(
            photos__in=photo_list,
            duplicate_type=duplicate_type,
            owner=owner,
        ).distinct()

        if existing_duplicates.exists():
            # Merge all into the first existing duplicate group
            target_duplicate = existing_duplicates.first()
            for duplicate in existing_duplicates[1:]:
                target_duplicate.merge_with(duplicate)

            # Add any new photos to the group (ManyToMany)
            for photo in photo_list:
                if not photo.duplicates.filter(pk=target_duplicate.pk).exists():
                    photo.duplicates.add(target_duplicate)

            target_duplicate.calculate_potential_savings()
            return target_duplicate
        else:
            # Create new duplicate group
            duplicate = cls.objects.create(
                owner=owner,
                duplicate_type=duplicate_type,
                similarity_score=similarity_score,
            )

            # Associate photos (ManyToMany)
            for photo in photo_list:
                photo.duplicates.add(duplicate)

            duplicate.calculate_potential_savings()
            return duplicate


================================================
FILE: api/models/face.py
================================================
import os

import numpy as np
from django.db import models
from django.dispatch import receiver

from api.face_recognition import get_face_encodings
from api.models.cluster import Cluster
from api.models.person import Person
from api.models.photo import Photo


class Face(models.Model):
    photo = models.ForeignKey(
        Photo, related_name="faces", on_delete=models.CASCADE, blank=False, null=True
    )
    image = models.ImageField(upload_to="faces", null=True)

    person = models.ForeignKey(
        Person, on_delete=models.DO_NOTHING, related_name="faces", null=True
    )

    classification_person = models.ForeignKey(
        Person,
        related_name="classification_faces",
        on_delete=models.SET_NULL,
        blank=True,
        null=True,
    )
    classification_probability = models.FloatField(default=0.0, db_index=True)

    cluster_person = models.ForeignKey(
        Person,
        related_name="cluster_faces",
        on_delete=models.SET_NULL,
        blank=True,
        null=True,
    )
    cluster_probability = models.FloatField(default=0.0, db_index=True)

    deleted = models.BooleanField(default=False)

    cluster = models.ForeignKey(
        Cluster,
        related_name="faces",
        on_delete=models.SET_NULL,
        blank=True,
        null=True,
    )

    location_top = models.IntegerField()
    location_bottom = models.IntegerField()
    location_left = models.IntegerField()
    location_right = models.IntegerField()
    encoding = models.TextField()

    @property
    def timestamp(self):
        return self.photo.exif_timestamp if self.photo else None

    def __str__(self):
        return "%d" % self.id

    def generate_encoding(self):
        self.encoding = (
            get_face_encodings(
                self.photo.thumbnail.thumbnail_big.path,
                [
                    (
                        self.location_top,
                        self.location_right,
                        self.location_bottom,
                        self.location_left,
                    )
                ],
            )[0]
            .tobytes()
            .hex()
        )
        self.save()

    def get_encoding_array(self):
        return np.frombuffer(bytes.fromhex(self.encoding))


@receiver(models.signals.post_delete, sender=Person)
def reset_person(sender, instance, **kwargs):
    instance.faces.update(person=None)


# From: https://stackoverflow.com/questions/16041232/django-delete-filefield
@receiver(models.signals.post_delete, sender=Face)
def auto_delete_file_on_delete(sender, instance, **kwargs):
    if instance.image:
        if os.path.isfile(instance.image.path):
            os.remove(instance.image.path)


================================================
FILE: api/models/file.py
================================================
import hashlib
import os

import magic
import pyvips
from django.db import models

from api import util

# Most optimal value for performance/memory. Found here:
# https://stackoverflow.com/questions/17731660/hashlib-optimal-size-of-chunks-to-be-used-in-md5-update
BUFFER_SIZE = 65536


# To-Do: add owner to file
class File(models.Model):
    IMAGE = 1
    VIDEO = 2
    METADATA_FILE = 3
    RAW_FILE = 4
    UNKNOWN = 5

    FILE_TYPES = (
        (IMAGE, "Image"),
        (VIDEO, "Video"),
        (METADATA_FILE, "Metadata File e.g. XMP"),
        (RAW_FILE, "Raw File"),
        (UNKNOWN, "Unknown"),
    )

    hash = models.CharField(primary_key=True, max_length=64, null=False)
    path = models.TextField(blank=True, default="", unique=True)
    type = models.PositiveIntegerField(
        blank=True,
        choices=FILE_TYPES,
    )
    missing = models.BooleanField(default=False)
    embedded_media = models.ManyToManyField("self", symmetrical=False)

    def __str__(self):
        return self.path + " " + self._find_out_type()

    @staticmethod
    def create(path: str, user):
        """
        Create or retrieve a File record for the given path.

        Uses get_or_create pattern to handle unique path constraint:
        - If a File with this path already exists, return it
        - If not, create a new File with calculated hash

        Handles race conditions: if concurrent creates happen for the same
        path, only one will succeed and others will return the existing file.

        Note: If file content has changed (different hash), the existing
        File record is returned. Hash updates should be handled separately
        during rescan operations.

        Args:
            path: The file system path to the file
            user: The user who owns this file (used for hash calculation)

        Returns:
            File: The existing or newly created File instance
        """
        from django.db import IntegrityError

        # Check if a File with this path already exists
        existing = File.objects.filter(path=path).first()
        if existing:
            return existing

        # Create new File
        file = File()
        file.path = path
        file.hash = calculate_hash(user, path)
        file._find_out_type()

        try:
            file.save()
            return file
        except IntegrityError:
            # Race condition: another thread created the file between our check and save
            # Try to fetch by path first (unique constraint), then by hash (primary key)
            existing = File.objects.filter(path=path).first()
            if existing:
                return existing
            # If path doesn't exist, hash collision occurred - fetch by hash
            existing = File.objects.filter(hash=file.hash).first()
            if existing:
                return existing
            # Re-raise if we can't find the conflicting record
            raise

    def _find_out_type(self):
        self.type = File.IMAGE
        if is_raw(self.path):
            self.type = File.RAW_FILE
        if is_video(self.path):
            self.type = File.VIDEO
        if is_metadata(self.path):
            self.type = File.METADATA_FILE
        self.save()


def is_video(path):
    try:
        mime = magic.Magic(mime=True)
        filename = mime.from_file(path)
        return filename.find("video") != -1
    except Exception:
        util.logger.error(f"Error while checking if file is video: {path}")
        return False


def is_raw(path):
    fileextension = os.path.splitext(path)[1]
    rawformats = [
        ".RWZ",
        ".CR2",
        ".NRW",
        ".EIP",
        ".RAF",
        ".ERF",
        ".RW2",
        ".NEF",
        ".ARW",
        ".K25",
        ".DNG",
        ".SRF",
        ".DCR",
        ".RAW",
        ".CRW",
        ".BAY",
        ".3FR",
        ".CS1",
        ".MEF",
        ".ORF",
        ".ARI",
        ".SR2",
        ".KDC",
        ".MOS",
        ".MFW",
        ".FFF",
        ".CR3",
        ".SRW",
        ".RWL",
        ".J6I",
        ".KC2",
        ".X3F",
        ".MRW",
        ".IIQ",
        ".PEF",
        ".CXI",
        ".MDC",
    ]
    return fileextension.upper() in rawformats


def is_metadata(path):
    fileextension = os.path.splitext(path)[1]
    rawformats = [
        ".XMP",
    ]
    return fileextension.upper() in rawformats


def is_valid_media(path, user) -> bool:
    if is_video(path=path) or is_metadata(path=path):
        return True
    if is_raw(path=path):
        return True
    try:
        pyvips.Image.thumbnail(path, 10000, height=200, size=pyvips.enums.Size.DOWN)
        return True
    except Exception as e:
        util.logger.info(f"Could not handle {path}, because {str(e)}")
        return False


def calculate_hash(user, path):
    try:
        hash_md5 = hashlib.md5()
        with open(path, "rb") as f:
            for chunk in iter(lambda: f.read(BUFFER_SIZE), b""):
                hash_md5.update(chunk)
        return hash_md5.hexdigest() + str(user.id)
    except Exception as e:
        util.logger.error(f"Could not calculate hash for file {path}")
        raise e


def calculate_hash_b64(user, content):
    hash_md5 = hashlib.md5()
    with content as f:
        for chunk in iter(lambda: f.read(BUFFER_SIZE), b""):
            hash_md5.update(chunk)
    return hash_md5.hexdigest() + str(user.id)


================================================
FILE: api/models/long_running_job.py
================================================
import uuid
from datetime import datetime, timedelta

from django.db import models
from django.utils import timezone

from api.models.user import User, get_deleted_user


class LongRunningJob(models.Model):
    JOB_SCAN_PHOTOS = 1
    JOB_GENERATE_AUTO_ALBUMS = 2
    JOB_GENERATE_AUTO_ALBUM_TITLES = 3
    JOB_TRAIN_FACES = 4
    JOB_DELETE_MISSING_PHOTOS = 5
    JOB_CALCULATE_CLIP_EMBEDDINGS = 6
    JOB_SCAN_FACES = 7
    JOB_CLUSTER_ALL_FACES = 8
    JOB_DOWNLOAD_PHOTOS = 9
    JOB_DOWNLOAD_MODELS = 10
    JOB_ADD_GEOLOCATION = 11
    JOB_GENERATE_TAGS = 12
    JOB_GENERATE_FACE_EMBEDDINGS = 13
    JOB_SCAN_MISSING_PHOTOS = 14
    JOB_DETECT_DUPLICATES = 15
    JOB_REPAIR_FILE_VARIANTS = 16

    JOB_TYPES = (
        (JOB_SCAN_PHOTOS, "Scan Photos"),
        (JOB_GENERATE_AUTO_ALBUMS, "Generate Event Albums"),
        (JOB_GENERATE_AUTO_ALBUM_TITLES, "Regenerate Event Titles"),
        (JOB_TRAIN_FACES, "Train Faces"),
        (JOB_DELETE_MISSING_PHOTOS, "Delete Missing Photos"),
        (JOB_SCAN_FACES, "Scan Faces"),
        (JOB_CALCULATE_CLIP_EMBEDDINGS, "Calculate Clip Embeddings"),
        (JOB_CLUSTER_ALL_FACES, "Find Similar Faces"),
        (JOB_DOWNLOAD_PHOTOS, "Download Selected Photos"),
        (JOB_DOWNLOAD_MODELS, "Download Models"),
        (JOB_ADD_GEOLOCATION, "Add Geolocation"),
        (JOB_GENERATE_TAGS, "Generate Tags"),
        (JOB_GENERATE_FACE_EMBEDDINGS, "Generate Face Embeddings"),
        (JOB_SCAN_MISSING_PHOTOS, "Scan Missing Photos"),
        (JOB_DETECT_DUPLICATES, "Detect Duplicate Photos"),
        (JOB_REPAIR_FILE_VARIANTS, "Repair File Variants"),
    )

    job_type = models.PositiveIntegerField(
        choices=JOB_TYPES,
    )

    finished = models.BooleanField(default=False, blank=False, null=False)
    failed = models.BooleanField(default=False, blank=False, null=False)
    job_id = models.CharField(max_length=36, unique=True, db_index=True)
    queued_at = models.DateTimeField(default=datetime.now, null=False)
    started_at = models.DateTimeField(null=True)
    finished_at = models.DateTimeField(null=True)
    started_by = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None
    )
    progress_current = models.PositiveIntegerField(default=0)
    progress_target = models.PositiveIntegerField(default=0)
    # New fields for detailed progress reporting
    progress_step = models.CharField(max_length=100, null=True, blank=True)  # Current step description
    result = models.JSONField(null=True, blank=True)  # Detailed result/progress data

    class Meta:
        ordering = ["-queued_at"]
        verbose_name = "Long Running Job"
        verbose_name_plural = "Long Running Jobs"

    def __str__(self):
        status = "failed" if self.failed else ("finished" if self.finished else "running" if self.started_at else "queued")
        return f"Job {self.job_id} - {self.get_job_type_display()} - {status}"

    @property
    def is_running(self):
        """Check if job is currently running (started but not finished)."""
        return self.started_at is not None and not self.finished

    @property
    def duration(self):
        """Return job duration in seconds, or None if not started."""
        if not self.started_at:
            return None
        end = self.finished_at or timezone.now()
        return (end - self.started_at).total_seconds()

    def start(self):
        """Mark job as started."""
        self.started_at = timezone.now()
        self.save(update_fields=["started_at"])

    def complete(self, result=None):
        """Mark job as successfully completed."""
        self.finished = True
        self.finished_at = timezone.now()
        if result is not None:
            self.result = result
        self.save(update_fields=["finished", "finished_at", "result"])

    def fail(self, error=None):
        """Mark job as failed with optional error message."""
        self.failed = True
        self.finished = True
        self.finished_at = timezone.now()
        if error is not None:
            self.result = {"status": "failed", "error": str(error)}
        self.save(update_fields=["failed", "finished", "finished_at", "result"])

    def update_progress(self, current, target=None, step=None):
        """Update job progress counters and optional step description."""
        update_fields = ["progress_current"]
        self.progress_current = current
        if target is not None:
            self.progress_target = target
            update_fields.append("progress_target")
        if step is not None:
            self.progress_step = step
            update_fields.append("progress_step")
        self.save(update_fields=update_fields)

    def set_result(self, result):
        """Update the job result/progress data."""
        self.result = result
        self.save(update_fields=["result"])

    @classmethod
    def create_job(cls, user, job_type, job_id=None, start_now=False):
        """
        Factory method to create a new job with proper defaults.
        
        Args:
            user: The user who started the job
            job_type: One of the JOB_* constants
            job_id: Optional job ID (auto-generated UUID if not provided)
            start_now: If True, set started_at to now
        
        Returns:
            The newly created LongRunningJob instance
        """
        if job_id is None:
            job_id = str(uuid.uuid4())
        job = cls.objects.create(
            started_by=user,
            job_id=str(job_id),
            queued_at=timezone.now(),
            job_type=job_type,
        )
        if start_now:
            job.start()
        return job

    @classmethod
    def get_or_create_job(cls, user, job_type, job_id):
        """
        Get an existing job by job_id or create a new one.
        
        This is useful for queued jobs where the job_id is known ahead of time.
        If the job exists, it will be marked as started. If not, a new job is created.
        
        Args:
            user: The user who started the job
            job_type: One of the JOB_* constants
            job_id: The job ID to look up or use for creation
        
        Returns:
            The LongRunningJob instance (existing or newly created)
        """
        if cls.objects.filter(job_id=job_id).exists():
            job = cls.objects.get(job_id=job_id)
            job.start()
            return job
        return cls.create_job(user=user, job_type=job_type, job_id=job_id, start_now=True)

    @classmethod
    def cleanup_stuck_jobs(cls, hours=24):
        """
        Mark jobs as failed if they've been running for too long.
        
        Jobs that have started_at set but finished=False for longer than
        the specified hours are considered stuck and will be marked as failed.
        
        Args:
            hours: Number of hours after which a running job is considered stuck
        
        Returns:
            Number of jobs marked as failed
        """
        cutoff = timezone.now() - timedelta(hours=hours)
        stuck_jobs = cls.objects.filter(
            finished=False,
            started_at__isnull=False,
            started_at__lt=cutoff
        )
        count = stuck_jobs.count()
        stuck_jobs.update(
            failed=True,
            finished=True,
            finished_at=timezone.now(),
            result={"status": "failed", "error": f"Job timed out after {hours} hours"}
        )
        return count

    @classmethod
    def cleanup_old_jobs(cls, days=30):
        """
        Delete completed/failed jobs older than specified days.
        
        Args:
            days: Number of days after which completed jobs should be deleted
        
        Returns:
            Number of jobs deleted
        """
        cutoff = timezone.now() - timedelta(days=days)
        deleted, _ = cls.objects.filter(
            finished=True,
            finished_at__lt=cutoff
        ).delete()
        return deleted


================================================
FILE: api/models/person.py
================================================
import datetime

import pytz
from django.core.validators import MinLengthValidator
from django.db import models
from django.db.models import Prefetch

from api.models.photo import Photo
from api.models.user import User

utc = pytz.UTC


class Person(models.Model):
    UNKNOWN_PERSON_NAME = "Unknown - Other"
    KIND_USER = "USER"
    KIND_CLUSTER = "CLUSTER"
    KIND_UNKNOWN = "UNKNOWN"
    KIND_CHOICES = (
        (KIND_USER, "User Labelled"),
        (KIND_CLUSTER, "Cluster ID"),
        (KIND_UNKNOWN, "Unknown Person"),
    )
    name = models.CharField(
        blank=False, max_length=128, validators=[MinLengthValidator(1)], db_index=True
    )
    kind = models.CharField(choices=KIND_CHOICES, max_length=10)
    cover_photo = models.ForeignKey(
        Photo, related_name="person", on_delete=models.SET_NULL, blank=False, null=True
    )
    cover_face = models.ForeignKey(
        "Face",
        related_name="face",
        on_delete=models.SET_NULL,
        blank=False,
        null=True,
    )
    face_count = models.IntegerField(default=0)
    cluster_owner = models.ForeignKey(
        User,
        related_name="owner",
        on_delete=models.SET_NULL,
        default=None,
        null=True,
    )

    def __str__(self):
        return (
            self.name
            + " ("
            + self.kind
            + ")"
            + " ("
            + str(self.id)
            + ")"
            + " ("
            + str(self.cluster_owner)
            + ")"
        )

    def _calculate_face_count(self):
        self.face_count = self.faces.filter(
            photo__hidden=False,
            photo__in_trashcan=False,
            photo__owner=self.cluster_owner.id,
        ).count()
        self.save()

    def _set_default_cover_photo(self):
        if not self.cover_photo and self.faces.count() > 0:
            self.cover_photo = self.faces.first().photo
            self.cover_face = self.faces.first()
            self.save()

    def get_photos(self, owner):
        faces = list(
            self.faces.prefetch_related(
                Prefetch(
                    "photo",
                    queryset=Photo.objects.exclude(image_hash=None)
                    .filter(hidden=False, owner=owner)
                    .order_by("-exif_timestamp")
                    .only(
                        "image_hash",
                        "exif_timestamp",
                        "rating",
                        "owner__id",
                        "public",
                        "hidden",
                    )
                    .prefetch_related("owner"),
                )
            )
        )

        photos = [face.photo for face in faces if hasattr(face.photo, "owner")]
        photos.sort(
            key=lambda x: x.exif_timestamp or utc.localize(datetime.datetime.min),
            reverse=True,
        )
        return photos


# TODO: Should be removed in the future, as it is not used, only in migrations
def get_unknown_person(owner: User = None):
    unknown_person: Person = Person.objects.get_or_create(
        name=Person.UNKNOWN_PERSON_NAME, cluster_owner=owner, kind=Person.KIND_UNKNOWN
    )[0]
    if unknown_person.kind != Person.KIND_UNKNOWN:
        unknown_person.kind = Person.KIND_UNKNOWN
        unknown_person.save()
    return unknown_person


def get_or_create_person(name, owner: User = None, kind: str = Person.KIND_UNKNOWN):
    return Person.objects.get_or_create(name=name, cluster_owner=owner, kind=kind)[0]


================================================
FILE: api/models/photo.py
================================================
import json
import numbers
import os
import uuid
from fractions import Fraction
from io import BytesIO

import numpy as np
import PIL
from django.core.files.base import ContentFile
from django.db import models
from django.db.models import Q
from django.db.utils import IntegrityError

import api.models
from api import date_time_extractor, face_extractor, util
from api.geocode import GEOCODE_VERSION
from api.geocode.geocode import reverse_geocode
from api.metadata.reader import get_metadata
from api.metadata.tags import Tags
from api.metadata.writer import write_metadata
from api.models.file import File
from api.models.user import User, get_deleted_user
from api.util import logger


class VisiblePhotoManager(models.Manager):
    def get_queryset(self):
        return (
            super()
            .get_queryset()
            .filter(
                Q(hidden=False)
                & Q(thumbnail__aspect_ratio__isnull=False)
                & Q(in_trashcan=False)
                & Q(removed=False)
            )
        )


class Photo(models.Model):
    # UUID primary key (like Immich) - enables flexible asset management
    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)

    # Content hash for deduplication - unique per user
    # Format: MD5 hash + user_id (e.g., "abc123def456...789" + "1")
    image_hash = models.CharField(max_length=64, db_index=True)

    files = models.ManyToManyField(File)
    main_file = models.ForeignKey(
        File,
        related_name="main_photo",
        on_delete=models.SET_NULL,
        blank=False,
        null=True,
    )

    added_on = models.DateTimeField(null=False, blank=False, db_index=True)

    exif_gps_lat = models.FloatField(blank=True, null=True)
    exif_gps_lon = models.FloatField(blank=True, null=True)
    exif_timestamp = models.DateTimeField(blank=True, null=True, db_index=True)

    exif_json = models.JSONField(blank=True, null=True)

    geolocation_json = models.JSONField(blank=True, null=True, db_index=True)

    timestamp = models.DateTimeField(blank=True, null=True, db_index=True)
    rating = models.IntegerField(default=0, db_index=True)
    in_trashcan = models.BooleanField(default=False, db_index=True)
    removed = models.BooleanField(default=False, db_index=True)
    hidden = models.BooleanField(default=False, db_index=True)
    video = models.BooleanField(default=False)
    video_length = models.TextField(blank=True, null=True)
    size = models.BigIntegerField(default=0)
    # Metadata fields (camera, lens, fstop, etc.) moved to PhotoMetadata model
    # See migration 0103_remove_photo_metadata_fields.py

    owner = models.ForeignKey(
        User, on_delete=models.SET(get_deleted_user), default=None
    )

    shared_to = models.ManyToManyField(User, related_name="photo_shared_to")

    public = models.BooleanField(default=False, db_index=True)

    # Use JSONField for database compatibility (works with both PostgreSQL and SQLite)
    clip_embeddings = models.JSONField(blank=True, null=True)

    clip_embeddings_magnitude = models.FloatField(blank=True, null=True)
    last_modified = models.DateTimeField(auto_now=True)

    # Perceptual hash for duplicate detection (pHash algorithm)
    perceptual_hash = models.CharField(
        max_length=64, blank=True, null=True, db_index=True
    )

    # Organizational photo stacks (RAW+JPEG pairs, bursts, brackets, live photos, manual)
    # A photo can belong to multiple stacks of different types simultaneously
    stacks = models.ManyToManyField(
        "PhotoStack",
        blank=True,
        related_name="photos",
    )

    # Duplicate groups (exact copies, visual duplicates)
    # Separate from stacks because duplicates are about cleanup, not organization
    duplicates = models.ManyToManyField(
        "Duplicate",
        blank=True,
        related_name="photos",
    )

    # Sub-second timestamp precision for burst detection
    # Stores the fractional seconds from EXIF:SubSecTimeOriginal
    exif_timestamp_subsec = models.CharField(max_length=10, blank=True, null=True)

    # Camera image sequence number (for burst/sequence detection)
    # From EXIF:ImageNumber or MakerNotes
    image_sequence_number = models.IntegerField(blank=True, null=True)

    objects = models.Manager()
    visible = VisiblePhotoManager()

    _loaded_values = {}

    def get_clip_embeddings(self):
        """Get clip embeddings as a list, regardless of storage format"""
        if not self.clip_embeddings:
            return None

        # Handle case where embeddings might be stored as JSON string
        if isinstance(self.clip_embeddings, str):
            try:
                import json

                return json.loads(self.clip_embeddings)
            except (json.JSONDecodeError, TypeError):
                return None

        return self.clip_embeddings

    def set_clip_embeddings(self, embeddings):
        """Set clip embeddings, automatically handling storage format"""
        self.clip_embeddings = embeddings if embeddings else None

    @classmethod
    def from_db(cls, db, field_names, values):
        instance = super().from_db(db, field_names, values)

        # save original values, when model is loaded from database,
        # in a separate attribute on the model
        instance._loaded_values = dict(zip(field_names, values))

        return instance

    def save(
        self,
        force_insert=False,
        force_update=False,
        using=None,
        update_fields=None,
        save_metadata=True,
    ):
        modified_fields = [
            field_name
            for field_name, value in self._loaded_values.items()
            if value != getattr(self, field_name)
        ]
        user = User.objects.get(username=self.owner)
        if save_metadata and user.save_metadata_to_disk != User.SaveMetadata.OFF:
            self._save_metadata(
                modified_fields,
                user.save_metadata_to_disk == User.SaveMetadata.SIDECAR_FILE,
            )
        return super().save(
            force_insert=force_insert,
            force_update=force_update,
            using=using,
            update_fields=update_fields,
        )

    def _save_metadata(
        self, modified_fields=None, use_sidecar=True, metadata_types=None
    ):
        """Write metadata tags to the photo's file or sidecar.

        Args:
            modified_fields: List of changed field names (from Photo.save() diff).
                When None, writes all applicable tags unconditionally.
            use_sidecar: Write to XMP sidecar file if True, media file if False.
            metadata_types: List of metadata categories to write, e.g.
                ["ratings", "face_tags"]. When None, uses default behavior
                (ratings/timestamps only, for backward compatibility).
        """
        tags_to_write = {}

        write_ratings = metadata_types is None or "ratings" in metadata_types
        write_face_tags = metadata_types is not None and "face_tags" in metadata_types

        if write_ratings:
            if modified_fields is None or "rating" in modified_fields:
                tags_to_write[Tags.RATING] = self.rating
            if modified_fields is not None and "timestamp" in modified_fields:
                # To-Do: Only works for files and not for the sidecar file
                tags_to_write[Tags.DATE_TIME] = self.timestamp

        if write_face_tags:
            from api.metadata.face_regions import get_face_region_tags

            tags_to_write.update(get_face_region_tags(self))

        if tags_to_write:
            write_metadata(self.main_file.path, tags_to_write, use_sidecar=use_sidecar)

    def _find_album_place(self):
        return api.models.album_place.AlbumPlace.objects.filter(
            Q(photos__in=[self])
        ).all()

    def _find_album_date(self):
        old_album_date = None
        if self.exif_timestamp:
            possible_old_album_date = api.models.album_date.get_album_date(
                date=self.exif_timestamp.date(), owner=self.owner
            )
            if (
                possible_old_album_date is not None
                and possible_old_album_date.photos.filter(
                    image_hash=self.image_hash
                ).exists()
            ):
                old_album_date = possible_old_album_date
        else:
            possible_old_album_date = api.models.album_date.get_album_date(
                date=None, owner=self.owner
            )
            if (
                possible_old_album_date is not None
                and possible_old_album_date.photos.filter(
                    image_hash=self.image_hash
                ).exists()
            ):
                old_album_date = possible_old_album_date
        return old_album_date

    def _extract_date_time_from_exif(self, commit=True):
        def exif_getter(tags):
            return get_metadata(self.main_file.path, tags=tags, try_sidecar=True)

        datetime_config = json.loads(self.owner.datetime_rules)
        extracted_local_time = date_time_extractor.extract_local_date_time(
            self.main_file.path,
            date_time_extractor.as_rules(datetime_config),
            exif_getter,
            self.exif_gps_lat,
            self.exif_gps_lon,
            self.owner.default_timezone,
            self.timestamp,
        )

        old_album_date = self._find_album_date()
        if self.exif_timestamp != extracted_local_time:
            self.exif_timestamp = extracted_local_time

        if old_album_date is not None:
            old_album_date.photos.remove(self)
            old_album_date.save()

        album_date = None

        if self.exif_timestamp:
            album_date = api.models.album_date.get_or_create_album_date(
                date=self.exif_timestamp.date(), owner=self.owner
            )
            album_date.photos.add(self)
        else:
            album_date = api.models.album_date.get_or_create_album_date(
                date=None, owner=self.owner
            )
            album_date.photos.add(self)

        if commit:
            self.save()
        album_date.save()

    def _geolocate(self, commit=True):
        old_gps_lat = self.exif_gps_lat
        old_gps_lon = self.exif_gps_lon
        new_gps_lat, new_gps_lon = get_metadata(
            self.main_file.path,
            tags=[Tags.LATITUDE, Tags.LONGITUDE],
            try_sidecar=True,
        )
        old_album_places = self._find_album_place()
        # Skip if it hasn't changed or is null
        if not new_gps_lat or not new_gps_lon:
            return
        if (
            old_gps_lat == float(new_gps_lat)
            and old_gps_lon == float(new_gps_lon)
            and old_album_places.count() != 0
            and self.geolocation_json
            and "_v" in self.geolocation_json
            and self.geolocation_json["_v"] == GEOCODE_VERSION
        ):
            return
        self.exif_gps_lon = float(new_gps_lon)
        self.exif_gps_lat = float(new_gps_lat)
        if commit:
            self.save()
        try:
            res = reverse_geocode(new_gps_lat, new_gps_lon)
            if not res:
                return
        except Exception as e:
            util.logger.warning(e)
            util.logger.warning("Something went wrong with geolocating")
            return

        self.geolocation_json = res

        # Update search location through PhotoSearch model
        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self)
        search_instance.update_search_location(res)
        search_instance.save()

        # Delete photo from album places if location has changed
        if old_album_places is not None:
            for old_album_place in old_album_places:
                old_album_place.photos.remove(self)
                old_album_place.save()

        # Add photo to new album places
        for geolocation_level, feature in enumerate(self.geolocation_json["features"]):
            if "text" not in feature.keys() or feature["text"].isnumeric():
                continue
            album_place = api.models.album_place.get_album_place(
                feature["text"], owner=self.owner
            )
            if album_place.photos.filter(image_hash=self.image_hash).count() == 0:
                album_place.geolocation_level = (
                    len(self.geolocation_json["features"]) - geolocation_level
                )
            album_place.photos.add(self)
            album_place.save()

        if commit:
            self.save()

    def _add_location_to_album_dates(self):
        if not self.geolocation_json:
            return
        if len(self.geolocation_json["places"]) < 2:
            logger.info(self.geolocation_json)
            return

        album_date = self._find_album_date()
        city_name = self.geolocation_json["places"][-2]
        if album_date.location and len(album_date.location) > 0:
            prev_value = album_date.location
            new_value = prev_value
            if city_name not in prev_value["places"]:
                new_value["places"].append(city_name)
                new_value["places"] = list(set(new_value["places"]))
                album_date.location = new_value
        else:
            album_date.location = {"places": [city_name]}
        # Safe geolocation_json
        album_date.save()

    def _extract_faces(self, second_try=False):
        unknown_cluster: api.models.cluster.Cluster = (
            api.models.cluster.get_unknown_cluster(user=self.owner)
        )
        try:
            big_thumbnail_image = np.array(
                PIL.Image.open(self.thumbnail.thumbnail_big.path)
            )

            face_locations = face_extractor.extract(
                self.main_file.path, self.thumbnail.thumbnail_big.path, self.owner
            )

            if len(face_locations) == 0:
                return

            for idx_face, face_location in enumerate(face_locations):
                top, right, bottom, left, person_name = face_location
                if person_name:
                    person = api.models.person.get_or_create_person(
                        name=person_name, owner=self.owner
                    )
                    person.save()
                else:
                    person = None

                face_image = big_thumbnail_image[top:bottom, left:right]
                face_image = PIL.Image.fromarray(face_image)

                image_path = self.image_hash + "_" + str(idx_face) + ".jpg"

                margin = int((right - left) * 0.05)
                existing_faces = api.models.face.Face.objects.filter(
                    photo=self,
                    location_top__lte=top + margin,
                    location_top__gte=top - margin,
                    location_right__lte=right + margin,
                    location_right__gte=right - margin,
                    location_bottom__lte=bottom + margin,
                    location_bottom__gte=bottom - margin,
                    location_left__lte=left + margin,
                    location_left__gte=left - margin,
                )

                if existing_faces.count() != 0:
                    continue

                face = api.models.face.Face(
                    photo=self,
                    location_top=top,
                    location_right=right,
                    location_bottom=bottom,
                    location_left=left,
                    encoding="",
                    person=person,
                    cluster=unknown_cluster,
                )
                if person_name:
                    person._calculate_face_count()
                    person._set_default_cover_photo()
                face_io = BytesIO()
                face_image.save(face_io, format="JPEG")
                face.image.save(image_path, ContentFile(face_io.getvalue()))
                face_io.close()
                face.save()
            logger.info(f"image {self.image_hash}: {len(face_locations)} face(s) saved")
        except IntegrityError:
            # When using multiple processes, then we can save at the same time, which leads to this error
            if self.files.count() > 0:
                # print out the location of the image only if we have a path
                logger.info(f"image {self.main_file.path}: rescan face failed")
            if not second_try:
                self._extract_faces(True)
            elif self.files.count() > 0:
                logger.error(f"image {self.main_file.path}: rescan face failed")
            else:
                logger.error(f"image {self}: rescan face failed")
        except Exception as e:
            logger.error(f"image {self}: scan face failed")
            raise e

    def _add_to_album_thing(self):
        if (
            hasattr(self, "caption_instance")
            and self.caption_instance
            and self.caption_instance.captions_json
            and type(self.caption_instance.captions_json) is dict
            and "places365" in self.caption_instance.captions_json.keys()
        ):
            for attribute in self.caption_instance.captions_json["places365"][
                "attributes"
            ]:
                album_thing = api.models.album_thing.get_album_thing(
                    title=attribute,
                    owner=self.owner,
                )
                if album_thing.photos.filter(image_hash=self.image_hash).count() == 0:
                    album_thing.photos.add(self)
                    album_thing.thing_type = "places365_attribute"
                    album_thing.save()
            for category in self.caption_instance.captions_json["places365"][
                "categories"
            ]:
                album_thing = api.models.album_thing.get_album_thing(
                    title=category,
                    owner=self.owner,
                )
                if album_thing.photos.filter(image_hash=self.image_hash).count() == 0:
                    album_thing = api.models.album_thing.get_album_thing(
                        title=category, owner=self.owner
                    )
                    album_thing.photos.add(self)
                    album_thing.thing_type = "places365_category"
                    album_thing.save()

    def _check_files(self):
        for file in self.files.all():
            if not file.path or not os.path.exists(file.path):
                self.files.remove(file)
                file.missing = True
                file.save()
        self.save()

    def manual_delete(self):
        # Store stack references before cleanup (ManyToMany)
        photo_stacks = list(self.stacks.all())

        # Store duplicate group references before cleanup (ManyToMany)
        photo_duplicates = list(self.duplicates.all())

        # Handle file cleanup - only delete files not shared with other Photos
        for file in self.files.all():
            # Check if this file is used by other Photos (via files M2M or as main_file)
            other_photos_using_file = (
                file.photo_set.exclude(pk=self.pk).exists()
                or file.main_photo.exclude(pk=self.pk).exists()
            )

            if other_photos_using_file:
                # File is shared - just unlink from this photo, don't delete
                logger.info(
                    f"File {file.path} is shared with other photos, unlinking only"
                )
                self.files.remove(file)
            else:
                # File is only used by this photo - safe to delete
                if os.path.isfile(file.path):
                    logger.info(f"Removing photo {file.path}")
                    os.remove(file.path)
                file.delete()

        self.files.set([])
        self.main_file = None
        self.removed = True

        # Clear all stack references from this photo (ManyToMany)
        self.stacks.clear()

        # Clear all duplicate group references from this photo (ManyToMany)
        self.duplicates.clear()

        result = self.save()

        # Clean up stacks if they're now empty or have only one photo left
        for photo_stack in photo_stacks:
            remaining_photos = photo_stack.photos.filter(removed=False).count()
            if remaining_photos <= 1:
                # If 0 or 1 photos left, delete the stack (no longer a valid grouping)
                logger.info(
                    f"Deleting photo stack {photo_stack.id} - only {remaining_photos} photos remaining"
                )
                # Unlink remaining photos from stack first
                for remaining_photo in photo_stack.photos.all():
                    remaining_photo.stacks.remove(photo_stack)
                photo_stack.delete()

        # Clean up duplicate groups if they're now empty or have only one photo left
        for duplicate in photo_duplicates:
            remaining_photos = duplicate.photos.filter(removed=False).count()
            if remaining_photos <= 1:
                # If 0 or 1 photos left, delete the duplicate group (no longer valid)
                logger.info(
                    f"Deleting duplicate group {duplicate.id} - only {remaining_photos} photos remaining"
                )
                # Unlink remaining photos from duplicate first
                for remaining_photo in duplicate.photos.all():
                    remaining_photo.duplicates.remove(duplicate)
                duplicate.delete()

        # To-Do: Handle wrong file permissions
        return result

    def _set_embedded_media(self, obj):
        return obj.main_file.embedded_media

    def __str__(self):
        main_file_path = (
            self.main_file.path if self.main_file is not None else "No main file"
        )
        return f"{self.image_hash} - {self.owner} - {main_file_path}"


================================================
FILE: api/models/photo_caption.py
================================================
from django.db import models
from django.db.models import Q

import api.models
from api import util
from api.image_captioning import generate_caption
from api.llm import generate_prompt
from api.models.user import User


class PhotoCaption(models.Model):
    """Model for handling image captions and related functionality"""

    photo = models.OneToOneField(
        "Photo",
        on_delete=models.CASCADE,
        related_name="caption_instance",
        primary_key=True,
    )
    captions_json = models.JSONField(blank=True, null=True, db_index=True)

    created_at = models.DateTimeField(auto_now_add=True)
    updated_at = models.DateTimeField(auto_now=True)

    class Meta:
        db_table = "api_photo_caption"

    def __str__(self):
        return f"Captions for {self.photo.image_hash}"

    def generate_captions_im2txt(self, commit=True):
        """Generate im2txt captions for the photo"""
        if not self.photo.thumbnail or not self.photo.thumbnail.thumbnail_big:
            util.logger.warning(
                f"No thumbnail available for photo {self.photo.image_hash}"
            )
            return False

        util.logger.info("Generating captions with Im2txt")

        try:
            image_path = self.photo.thumbnail.thumbnail_big.path
        except Exception:
            util.logger.warning(
                f"Cannot access thumbnail path for photo {self.photo.image_hash}"
            )
            return False
        if self.captions_json is None:
            self.captions_json = {}
        captions = self.captions_json

        try:
            from constance import config as site_config

            if site_config.CAPTIONING_MODEL == "None":
                util.logger.info("Generating captions is disabled")
                return False

            if site_config.CAPTIONING_MODEL == "moondream":
                util.logger.info("Generating captions with Moondream")
                return self._generate_captions_moondream(commit=commit)

            blip = False
            if site_config.CAPTIONING_MODEL == "blip_base_capfilt_large":
                blip = True

            caption = generate_caption(image_path=image_path, blip=blip)
            caption = caption.replace("<start>", "").replace("<end>", "").strip()

            settings = User.objects.get(username=self.photo.owner).llm_settings
            if site_config.LLM_MODEL != "None" and settings["enabled"]:
                face = api.models.Face.objects.filter(photo=self.photo).first()
                person_name = ""
                if face and settings["add_person"]:
                    person_name = " Person: " + face.person.name
                place = ""
                if (
                    self.photo.search_instance
                    and self.photo.search_instance.search_location
                    and settings["add_location"]
                ):
                    place = " Place: " + self.photo.search_instance.search_location
                keywords = ""
                if settings["add_keywords"]:
                    keywords = " and tags or keywords"
                prompt = (
                    "Q: Your task is to improve the following image caption: "
                    + caption
                    + ". You also know the following information about the image:"
                    + place
                    + person_name
                    + ". Stick as closely as possible to the caption, while replacing generic information with information you know about the image. Only output the caption"
                    + keywords
                    + ". \n A:"
                )
                util.logger.info(prompt)
                caption = generate_prompt(prompt)

            captions["im2txt"] = caption
            self.captions_json = captions
            self.recreate_search_captions()
            if commit:
                self.save()

            util.logger.info(
                f"generated im2txt captions for image {image_path} with SiteConfig {site_config.CAPTIONING_MODEL} with Blip: {blip} caption: {caption}"
            )
            return True
        except Exception:
            util.logger.exception(
                f"could not generate im2txt captions for image {image_path}"
            )
            return False

    def _generate_captions_moondream(self, commit=True):
        """Generate captions using Moondream with enhanced prompt"""
        if not self.photo.thumbnail or not self.photo.thumbnail.thumbnail_big:
            util.logger.warning(
                f"No thumbnail available for photo {self.photo.image_hash}"
            )
            return False

        try:
            image_path = self.photo.thumbnail.thumbnail_big.path
        except Exception:
            util.logger.warning(
                f"Cannot access thumbnail path for photo {self.photo.image_hash}"
            )
            return False
        if self.captions_json is None:
            self.captions_json = {}
        captions = self.captions_json

        try:
            from constance import config as site_config

            util.logger.info("Generating Moondream captions")

            settings = User.objects.get(username=self.photo.owner).llm_settings

            # Default prompt
            prompt = "Describe this image in a short, natural image caption."

            # Enhanced prompting if LLM is enabled
            if site_config.LLM_MODEL != "None" and settings["enabled"]:
                face = api.models.Face.objects.filter(photo=self.photo).first()
                person_name = ""
                if face and settings["add_person"]:
                    person_name = (
                        f" The person in the photo is named {face.person.name}. "
                        f"Use the name '{face.person.name}' directly in the caption — do not say 'a person named'. "
                        f"Keep the caption casual and to the point, like a friend tagging a photo."
                    )

                place = ""
                if (
                    self.photo.search_instance
                    and self.photo.search_instance.search_location
                    and settings["add_location"]
                ):
                    place = f" This photo was taken at {self.photo.search_instance.search_location}."

                keywords_instruction = ""
                if settings["add_keywords"]:
                    keywords_instruction = " Include relevant tags and keywords."

                prompt = (
                    "Write a short, natural image caption."
                    + person_name
                    + place
                    + keywords_instruction
                )

            util.logger.info(f"Moondream prompt: {prompt}")

            # Generate caption with the final prompt
            caption = generate_prompt(image_path=image_path, prompt=prompt)
            caption = caption.replace("<start>", "").replace("<end>", "").strip()

            # Save the result
            captions["im2txt"] = caption
            self.captions_json = captions
            self.recreate_search_captions()
            if commit:
                self.save()

            util.logger.info(
                f"Generated Moondream captions for image {image_path}, caption: {caption}"
            )
            return True
        except Exception:
            util.logger.exception(
                f"Could not generate Moondream captions for image {image_path}"
            )
            return False

    def save_user_caption(self, caption, commit=True):
        """Save user-provided caption"""
        if not self.photo.thumbnail or not self.photo.thumbnail.thumbnail_big:
            util.logger.warning(
                f"No thumbnail available for photo {self.photo.image_hash}"
            )
            return False

        try:
            image_path = self.photo.thumbnail.thumbnail_big.path
        except Exception:
            util.logger.warning(
                f"Cannot access thumbnail path for photo {self.photo.image_hash}"
            )
            return False

        try:
            caption = caption.replace("<start>", "").replace("<end>", "").strip()

            if self.captions_json is None:
                self.captions_json = {}
            self.captions_json["user_caption"] = caption
            self.recreate_search_captions()

            if commit:
                self.save()

            util.logger.info(
                f"saved captions for image {image_path}. caption: {caption}. captions_json: {self.captions_json}."
            )

            # Handle hashtags
            hashtags = [
                word
                for word in caption.split()
                if word.startswith("#") and len(word) > 1
            ]

            for hashtag in hashtags:
                album_thing = api.models.album_thing.get_album_thing(
                    title=hashtag,
                    owner=self.photo.owner,
                    thing_type="hashtag_attribute",
                )
                if (
                    album_thing.photos.filter(image_hash=self.photo.image_hash).count()
                    == 0
                ):
                    album_thing.photos.add(self.photo)
                    album_thing.save()

            for album_thing in api.models.album_thing.AlbumThing.objects.filter(
                Q(photos__in=[self.photo])
                & Q(thing_type="hashtag_attribute")
                & Q(owner=self.photo.owner)
            ).all():
                if album_thing.title not in caption:
                    album_thing.photos.remove(self.photo)
                    album_thing.save()
            return True
        except Exception:
            util.logger.exception(f"could not save captions for image {image_path}")
            return False

    def recreate_search_captions(self):
        """Recreate search captions - directly access PhotoSearch model"""
        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.recreate_search_captions()
        search_instance.save()

    def generate_tag_captions(self, commit=True):
        """Generate tag captions using the active tagging model (Places365 or SigLIP 2).

        Tags are stored per-model in captions_json and are never deleted when
        switching models -- only the active model's tags are generated / visible.
        """
        from constance import config as site_config

        tagging_model = site_config.TAGGING_MODEL

        if not self.photo.thumbnail or not self.photo.thumbnail.thumbnail_big:
            return

        # Skip if this photo already has tags from the active model
        if (
            self.captions_json is not None
            and self.captions_json.get(tagging_model) is not None
        ):
            return

        try:
            import requests

            image_path = self.photo.thumbnail.thumbnail_big.path
            confidence = self.photo.owner.confidence
            json_data = {
                "image_path": image_path,
                "confidence": confidence,
                "tagging_model": tagging_model,
            }
            response = requests.post(
                "http://localhost:8011/generate-tags", json=json_data
            )
            tags_result = response.json()["tags"]

            if tags_result is None:
                return
            if self.captions_json is None:
                self.captions_json = {}

            # Store under the model-specific key
            self.captions_json[tagging_model] = tags_result
            self.recreate_search_captions()

            if tagging_model == "siglip2":
                self._update_siglip2_album_things(tags_result)
            else:
                self._update_places365_album_things(tags_result)

            if commit:
                self.save()
            util.logger.info(
                f"generated {tagging_model} tags for image {image_path}."
            )
        except Exception as e:
            util.logger.exception(
                f"could not generate tags for image "
                f"{self.photo.main_file.path if self.photo.main_file else 'no main file'}"
            )
            raise e

    def _update_places365_album_things(self, res_places365):
        """Create/update AlbumThing entries for Places365 tags."""
        # Remove old album associations for this photo
        for album_thing in api.models.album_thing.AlbumThing.objects.filter(
            Q(photos__in=[self.photo])
            & (
                Q(thing_type="places365_attribute")
                | Q(thing_type="places365_category")
            )
            & Q(owner=self.photo.owner)
        ).all():
            album_thing.photos.remove(self.photo)
            album_thing.save()

        if "attributes" in res_places365:
            for attribute in res_places365["attributes"]:
                album_thing = api.models.album_thing.get_album_thing(
                    title=attribute,
                    owner=self.photo.owner,
                    thing_type="places365_attribute",
                )
                album_thing.photos.add(self.photo)
                album_thing.save()

        if "categories" in res_places365:
            for category in res_places365["categories"]:
                album_thing = api.models.album_thing.get_album_thing(
                    title=category,
                    owner=self.photo.owner,
                    thing_type="places365_category",
                )
                album_thing.photos.add(self.photo)
                album_thing.save()

    def _update_siglip2_album_things(self, siglip2_result):
        """Create/update AlbumThing entries for SigLIP 2 tags."""
        tags = siglip2_result.get("tags", [])

        # Remove old siglip2 album associations for this photo
        for album_thing in api.models.album_thing.AlbumThing.objects.filter(
            Q(photos__in=[self.photo])
            & Q(thing_type="siglip2_tag")
            & Q(owner=self.photo.owner)
        ).all():
            album_thing.photos.remove(self.photo)
            album_thing.save()

        for tag in tags:
            album_thing = api.models.album_thing.get_album_thing(
                title=tag,
                owner=self.photo.owner,
                thing_type="siglip2_tag",
            )
            album_thing.photos.add(self.photo)
            album_thing.save()

    # Backward-compatible alias
    def generate_places365_captions(self, commit=True):
        return self.generate_tag_captions(commit=commit)


================================================
FILE: api/models/photo_metadata.py
================================================
"""
PhotoMetadata and MetadataFile models for structured metadata handling.

This module provides proper models for:
1. PhotoMetadata - Structured EXIF/metadata extracted from photos
2. MetadataFile - XMP sidecars and other metadata files

Benefits over current approach:
- Typed fields instead of JSON blob (exif_json)
- Proper foreign key relationships
- Versioning for metadata changes
- Support for multiple metadata sources (embedded, sidecar, user-edited)
- Clear separation between camera metadata and derived metadata
"""

import numbers
import uuid
from fractions import Fraction

from django.db import models

from api.metadata.reader import get_metadata
from api.metadata.tags import Tags
from api.models.user import User, get_deleted_user


class MetadataFile(models.Model):
    """
    Represents a metadata sidecar file (XMP, JSON, etc.) associated with a photo.

    A photo can have multiple metadata files:
    - XMP sidecar from camera/software
    - Adobe Lightroom .xmp
    - Darktable .xmp
    - User-created metadata file
    """

    class FileType(models.TextChoices):
        XMP = "xmp", "XMP Sidecar"
        JSON = "json", "JSON Metadata"
        EXIF = "exif", "EXIF Extract"
        OTHER = "other", "Other"

    class Source(models.TextChoices):
        # Sidecar that came with the photo (same directory)
        ORIGINAL = "original", "Original Sidecar"
        # Generated by photo editing software
        SOFTWARE = "software", "Software Generated"
        # Created by LibrePhotos
        LIBREPHOTOS = "librephotos", "LibrePhotos Generated"
        # User manually created/uploaded
        USER = "user", "User Created"

    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)

    # Link to the File model for actual file storage
    file = models.OneToOneField(
        "File",
        on_delete=models.CASCADE,
        related_name="metadata_info",
    )

    # The photo this metadata belongs to
    photo = models.ForeignKey(
        "Photo",
        on_delete=models.CASCADE,
        related_name="metadata_files",
    )

    file_type = models.CharField(
        max_length=10,
        choices=FileType.choices,
        default=FileType.XMP,
    )

    source = models.CharField(
        max_length=20,
        choices=Source.choices,
        default=Source.ORIGINAL,
    )

    # Priority for metadata resolution (higher = more authoritative)
    # User edits > Software sidecars > Original sidecars > Embedded
    priority = models.IntegerField(default=0)

    # Software that created this file (if known)
    creator_software = models.CharField(max_length=100, blank=True, null=True)

    created_at = models.DateTimeField(auto_now_add=True)
    updated_at = models.DateTimeField(auto_now=True)

    class Meta:
        ordering = ["-priority", "-updated_at"]
        verbose_name = "Metadata File"
        verbose_name_plural = "Metadata Files"

    def __str__(self):
        return f"{self.file_type} sidecar for {self.photo_id}"


class PhotoMetadata(models.Model):
    """
    Structured metadata for a photo.

    This model stores extracted and computed metadata in typed fields,
    making it queryable and more maintainable than a JSON blob.

    Metadata Sources (in priority order):
    1. User edits (highest priority)
    2. XMP sidecar files
    3. Embedded EXIF/IPTC/XMP
    4. Computed/derived values (lowest priority)
    """

    class Source(models.TextChoices):
        # Embedded in the file (EXIF, IPTC, embedded XMP)
        EMBEDDED = "embedded", "Embedded in File"
        # From XMP sidecar file
        SIDECAR = "sidecar", "XMP Sidecar"
        # User manually edited
        USER_EDIT = "user_edit", "User Edit"
        # Computed by LibrePhotos (AI, geocoding, etc.)
        COMPUTED = "computed", "Computed"

    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)

    photo = models.OneToOneField(
        "Photo",
        on_delete=models.CASCADE,
        related_name="metadata",
    )

    # ==================== Camera Settings ====================
    # Aperture (f-stop), e.g., 2.8
    aperture = models.FloatField(null=True, blank=True, db_index=True)

    # Shutter speed as a string fraction, e.g., "1/250"
    shutter_speed = models.CharField(max_length=20, null=True, blank=True)

    # Shutter speed in seconds (for queries), e.g., 0.004
    shutter_speed_seconds = models.FloatField(null=True, blank=True)

    # ISO sensitivity
    iso = models.IntegerField(null=True, blank=True, db_index=True)

    # Focal length in mm
    focal_length = models.FloatField(null=True, blank=True)

    # 35mm equivalent focal length
    focal_length_35mm = models.IntegerField(null=True, blank=True)

    # Exposure compensation in EV
    exposure_compensation = models.FloatField(null=True, blank=True)

    # Flash fired
    flash_fired = models.BooleanField(null=True, blank=True)

    # Metering mode
    metering_mode = models.CharField(max_length=50, null=True, blank=True)

    # White balance
    white_balance = models.CharField(max_length=50, null=True, blank=True)

    # ==================== Camera/Lens Info ====================
    camera_make = models.CharField(max_length=100, null=True, blank=True, db_index=True)
    camera_model = models.CharField(
        max_length=100, null=True, blank=True, db_index=True
    )
    lens_make = models.CharField(max_length=100, null=True, blank=True)
    lens_model = models.CharField(max_length=100, null=True, blank=True, db_index=True)
    serial_number = models.CharField(max_length=100, null=True, blank=True)

    # ==================== Image Properties ====================
    width = models.IntegerField(null=True, blank=True)
    height = models.IntegerField(null=True, blank=True)
    orientation = models.IntegerField(null=True, blank=True)
    color_space = models.CharField(max_length=50, null=True, blank=True)
    bit_depth = models.IntegerField(null=True, blank=True)

    # ==================== Timestamps ====================
    # Original capture time from EXIF
    date_taken = models.DateTimeField(null=True, blank=True, db_index=True)

    # Sub-second precision (from EXIF:SubSecTimeOriginal)
    date_taken_subsec = models.CharField(max_length=10, null=True, blank=True)

    # When the file was last modified
    date_modified = models.DateTimeField(null=True, blank=True)

    # Timezone offset if available
    timezone_offset = models.CharField(max_length=10, null=True, blank=True)

    # ==================== Location ====================
    gps_latitude = models.FloatField(null=True, blank=True, db_index=True)
    gps_longitude = models.FloatField(null=True, blank=True, db_index=True)
    gps_altitude = models.FloatField(null=True, blank=True)

    # Location from reverse geocoding
    location_country = models.CharField(
        max_length=100, null=True, blank=True, db_index=True
    )
    location_state = models.CharField(max_length=100, null=True, blank=True)
    location_city = models.CharField(
        max_length=100, null=True, blank=True, db_index=True
    )
    location_address = models.TextField(null=True, blank=True)

    # ==================== Content Description ====================
    title = models.CharField(max_length=500, null=True, blank=True)
    caption = models.TextField(null=True, blank=True)
    keywords = models.JSONField(null=True, blank=True)  # List of strings

    # Rating (0-5 stars)
    rating = models.IntegerField(null=True, blank=True, db_index=True)

    # Copyright info
    copyright = models.TextField(null=True, blank=True)
    creator = models.CharField(max_length=200, null=True, blank=True)

    # ==================== Tracking ====================
    # Which source this metadata came from
    source = models.CharField(
        max_length=20,
        choices=Source.choices,
        default=Source.EMBEDDED,
    )

    # Raw EXIF/XMP data for fields we don't have explicit columns for
    raw_exif = models.JSONField(null=True, blank=True)
    raw_xmp = models.JSONField(null=True, blank=True)
    raw_iptc = models.JSONField(null=True, blank=True)

    # Version tracking
    version = models.IntegerField(default=1)
    created_at = models.DateTimeField(auto_now_add=True)
    updated_at = models.DateTimeField(auto_now=True)

    class Meta:
        verbose_name = "Photo Metadata"
        verbose_name_plural = "Photo Metadata"
        indexes = [
            models.Index(fields=["camera_make", "camera_model"]),
            models.Index(fields=["date_taken"]),
            models.Index(fields=["location_country", "location_city"]),
        ]

    def __str__(self):
        return f"Metadata for {self.photo_id}"

    @property
    def resolution(self):
        """Returns resolution as 'WxH' string."""
        if self.width and self.height:
            return f"{self.width}x{self.height}"
        return None

    @property
    def megapixels(self):
        """Returns megapixel count."""
        if self.width and self.height:
            return round((self.width * self.height) / 1_000_000, 1)
        return None

    @property
    def has_location(self):
        """Check if GPS coordinates are available."""
        return self.gps_latitude is not None and self.gps_longitude is not None

    @property
    def camera_display(self):
        """Returns a human-readable camera name."""
        if self.camera_make and self.camera_model:
            # Avoid duplicating make in model
            if self.camera_model.startswith(self.camera_make):
                return self.camera_model
            return f"{self.camera_make} {self.camera_model}"
        return self.camera_model or self.camera_make

    @property
    def lens_display(self):
        """Returns a human-readable lens name."""
        if self.lens_make and self.lens_model:
            if self.lens_model.startswith(self.lens_make):
                return self.lens_model
            return f"{self.lens_make} {self.lens_model}"
        return self.lens_model or self.lens_make

    @classmethod
    def extract_exif_data(cls, photo, commit=True):
        """
        Extract EXIF data from a photo's main file and update PhotoMetadata.

        This method extracts metadata from the photo's main file and:
        1. Updates Photo fields (size, video_length, rating, exif_timestamp_subsec, image_sequence_number)
        2. Gets or creates PhotoMetadata and populates it with extracted data

        Args:
            photo: Photo instance to extract metadata from
            commit: Whether to save Photo and PhotoMetadata after extraction

        Returns:
            PhotoMetadata instance
        """
        if not photo.main_file:
            return None

        (
            size,
            fstop,
            focal_length,
            iso,
            shutter_speed,
            camera,
            lens,
            width,
            height,
            focalLength35Equivalent,
            subjectDistance,
            digitalZoomRatio,
            video_length,
            rating,
            subsec_time_original,
            image_number,
        ) = get_metadata(  # noqa: E501
            photo.main_file.path,
            tags=[
                Tags.FILE_SIZE,
                Tags.FSTOP,
                Tags.FOCAL_LENGTH,
                Tags.ISO,
                Tags.EXPOSURE_TIME,
                Tags.CAMERA,
                Tags.LENS,
                Tags.IMAGE_WIDTH,
                Tags.IMAGE_HEIGHT,
                Tags.FOCAL_LENGTH_35MM,
                Tags.SUBJECT_DISTANCE,
                Tags.DIGITAL_ZOOM_RATIO,
                Tags.QUICKTIME_DURATION,
                Tags.RATING,
                Tags.SUBSEC_TIME_ORIGINAL,
                Tags.IMAGE_NUMBER,
            ],
            try_sidecar=True,
        )

        # Fields still on Photo model
        if size and isinstance(size, numbers.Number):
            photo.size = size
        if video_length and isinstance(video_length, numbers.Number):
            photo.video_length = video_length
        if rating and isinstance(rating, numbers.Number):
            photo.rating = rating

        # Burst/sequence detection fields
        if subsec_time_original:
            # SubSecTimeOriginal is typically a string like "123" representing milliseconds
            photo.exif_timestamp_subsec = str(subsec_time_original)[:10]
        if image_number and isinstance(image_number, numbers.Number):
            photo.image_sequence_number = int(image_number)

        if commit:
            photo.save()

        # Store metadata in PhotoMetadata model
        metadata, created = cls.objects.get_or_create(
            photo=photo, defaults={"source": cls.Source.EMBEDDED}
        )

        if fstop and isinstance(fstop, numbers.Number):
            metadata.aperture = fstop
        if focal_length and isinstance(focal_length, numbers.Number):
            metadata.focal_length = focal_length
        if iso and isinstance(iso, numbers.Number):
            metadata.iso = iso
        if shutter_speed and isinstance(shutter_speed, numbers.Number):
            metadata.shutter_speed = str(
                Fraction(shutter_speed).limit_denominator(1000)
            )
        if camera and isinstance(camera, str):
            metadata.camera_model = camera
        if lens and isinstance(lens, str):
            metadata.lens_model = lens
        if width and isinstance(width, numbers.Number):
            metadata.width = width
        if height and isinstance(height, numbers.Number):
            metadata.height = height
        if focalLength35Equivalent and isinstance(
            focalLength35Equivalent, numbers.Number
        ):
            metadata.focal_length_35mm = focalLength35Equivalent
        if rating and isinstance(rating, numbers.Number):
            metadata.rating = rating
        if subsec_time_original:
            metadata.date_taken_subsec = str(subsec_time_original)[:10]

        if commit:
            metadata.save()

        return metadata


class MetadataEdit(models.Model):
    """
    Tracks user edits to photo metadata for history/undo functionality.

    Each edit records what field was changed, old value, new value,
    and who made the change.
    """

    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)

    photo = models.ForeignKey(
        "Photo",
        on_delete=models.CASCADE,
        related_name="metadata_edits",
    )

    user = models.ForeignKey(
        User,
        on_delete=models.SET(get_deleted_user),
        related_name="metadata_edits",
    )

    # Which field was edited
    field_name = models.CharField(max_length=100)

    # JSON-serialized old and new values
    old_value = models.JSONField(null=True, blank=True)
    new_value = models.JSONField(null=True, blank=True)

    # Whether this edit has been written back to the file
    synced_to_file = models.BooleanField(default=False)
    synced_at = models.DateTimeField(null=True, blank=True)

    created_at = models.DateTimeField(auto_now_add=True)

    class Meta:
        ordering = ["-created_at"]
        verbose_name = "Metadata Edit"
        verbose_name_plural = "Metadata Edits"
        indexes = [
            models.Index(fields=["photo", "-created_at"]),
        ]

    def __str__(self):
        return f"Edit {self.field_name} on {self.photo_id}"


================================================
FILE: api/models/photo_search.py
================================================
from django.db import models

import api.models
from api import util


class PhotoSearch(models.Model):
    """Model for handling photo search functionality"""

    photo = models.OneToOneField(
        "Photo",
        on_delete=models.CASCADE,
        related_name="search_instance",
        primary_key=True,
    )
    search_captions = models.TextField(blank=True, null=True, db_index=True)
    search_location = models.TextField(blank=True, null=True, db_index=True)

    created_at = models.DateTimeField(auto_now_add=True)
    updated_at = models.DateTimeField(auto_now=True)

    class Meta:
        db_table = "api_photo_search"

    def __str__(self):
        return f"Search data for {self.photo.image_hash}"

    def recreate_search_captions(self):
        """Recreate search captions from all caption sources.

        Only tags from the active TAGGING_MODEL are indexed into search_captions.
        This allows instant switching of tag visibility without re-inference.
        """
        from constance import config as site_config

        search_captions = ""

        # Get captions from the PhotoCaption model
        if hasattr(self.photo, "caption_instance") and self.photo.caption_instance:
            captions_json = self.photo.caption_instance.captions_json
            if captions_json:
                # Index tags from the active tagging model only
                tagging_model = site_config.TAGGING_MODEL

                if tagging_model == "siglip2":
                    siglip2_data = captions_json.get("siglip2", {})
                    siglip2_tags = siglip2_data.get("tags", [])
                    if siglip2_tags:
                        search_captions += " ".join(siglip2_tags) + " "
                else:
                    places365_captions = captions_json.get("places365", {})
                    attributes = places365_captions.get("attributes", [])
                    search_captions += " ".join(attributes) + " "
                    categories = places365_captions.get("categories", [])
                    search_captions += " ".join(categories) + " "
                    environment = places365_captions.get("environment", "")
                    search_captions += environment + " "

                user_caption = captions_json.get("user_caption", "")
                if user_caption:
                    search_captions += user_caption + " "

                im2txt_caption = captions_json.get("im2txt", "")
                if im2txt_caption:
                    search_captions += im2txt_caption + " "

        # Add face/person names
        for face in api.models.face.Face.objects.filter(photo=self.photo).all():
            if face.person:
                search_captions += face.person.name + " "

        # Add file paths
        if self.photo.main_file:
            search_captions += self.photo.main_file.path + " "
        for file in self.photo.files.all():
            search_captions += file.path + " "

        # Add media type
        if self.photo.video:
            search_captions += "type: video "

        # Add camera and lens info from PhotoMetadata
        try:
            metadata = self.photo.metadata
            if metadata.camera_display:
                search_captions += metadata.camera_display + " "
            if metadata.lens_display:
                search_captions += metadata.lens_display + " "
        except Exception:
            # PhotoMetadata may not exist yet
            pass

        self.search_captions = search_captions.strip()

        util.logger.debug(
            f"Recreated search captions for image {self.photo.image_hash}."
        )

    def update_search_location(self, geolocation_json):
        """Update search location from geolocation data"""
        if geolocation_json and "address" in geolocation_json:
            self.search_location = geolocation_json["address"]
        elif geolocation_json and "features" in geolocation_json:
            # Handle features format used in tests
            features = geolocation_json["features"]
            location_parts = [
                feature.get("text", "") for feature in features if feature.get("text")
            ]
            self.search_location = ", ".join(location_parts) if location_parts else ""
        else:
            self.search_location = ""

        util.logger.debug(
            f"Updated search location for image {self.photo.image_hash}: {self.search_location}"
        )


================================================
FILE: api/models/photo_stack.py
================================================
"""
PhotoStack model for organizational photo grouping.

Stacks represent related photos that should be kept together for organization:
- Burst sequences (rapid succession shots)
- Exposure brackets (HDR sequences)
- Manual user groupings

NOTE: RAW+JPEG pairs and Live Photos are NO LONGER handled as stacks.
Instead, they use the Photo.files ManyToMany field to store multiple file
variants of the same capture (PhotoPrism-like model). This allows:
- A single Photo entity for RAW+JPEG (same capture, different formats)
- A single Photo entity for Live Photos (image + video variant)
- Photo stacks for DIFFERENT captures that are logically related

Legacy RAW_JPEG_PAIR and LIVE_PHOTO stack types are kept for migration
compatibility but are deprecated and will be converted to file variants.

Inspired by PhotoPrism's file variant model and Immich's stacking system.
"""

import uuid

from django.db import models

from api.models.user import User, get_deleted_user


class PhotoStack(models.Model):
    """
    Represents a group of related but DISTINCT photos that should be kept together.
    Only the primary photo is shown in the timeline, with others accessible via expansion.
    
    NOTE: This is for grouping DIFFERENT captures (bursts, brackets, manual).
    For same-capture file variants (RAW+JPEG, Live Photos), use Photo.files instead.
    
    Stacks are informational groupings - they help organize related photos
    but don't imply that any should be deleted (unlike Duplicates).
    """

    class StackType(models.TextChoices):
        # === ACTIVE STACK TYPES (for different captures) ===
        
        # Photos taken in rapid succession (burst/continuous mode)
        # User may want to browse all or pick the best
        BURST_SEQUENCE = "burst", "Burst Sequence"
        # Exposure bracketed shots (for HDR)
        # HDR processing may need all exposures
        EXPOSURE_BRACKET = "bracket", "Exposure Bracket"
        # User manually grouped photos
        # User explicitly created the grouping
        MANUAL = "manual", "Manual Stack"
        
        # === DEPRECATED STACK TYPES (migrated to Photo.files) ===
        # Kept for backwards compatibility during migration
        
        # DEPRECATED: Use Photo.files for RAW+JPEG variants
        RAW_JPEG_PAIR = "raw_jpeg", "RAW + JPEG Pair (Deprecated)"
        # DEPRECATED: Use Photo.files for Live Photo variants
        LIVE_PHOTO = "live_photo", "Live Photo (Deprecated)"

    # Valid stack types for new stacks (excludes deprecated types)
    VALID_STACK_TYPES = [
        StackType.BURST_SEQUENCE,
        StackType.EXPOSURE_BRACKET,
        StackType.MANUAL,
    ]

    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)

    owner = models.ForeignKey(
        User,
        on_delete=models.SET(get_deleted_user),
        related_name="photo_stacks",
    )

    stack_type = models.CharField(
        max_length=20,
        choices=StackType.choices,
        default=StackType.MANUAL,
        db_index=True,
    )

    # The photo shown in the timeline (cover photo)
    primary_photo = models.ForeignKey(
        "Photo",
        on_delete=models.SET_NULL,
        null=True,
        blank=True,
        related_name="primary_in_stack",
    )

    # Detection metadata
    created_at = models.DateTimeField(auto_now_add=True)
    updated_at = models.DateTimeField(auto_now=True)

    # For bursts: time span of the sequence
    sequence_start = models.DateTimeField(null=True, blank=True)
    sequence_end = models.DateTimeField(null=True, blank=True)

    class Meta:
        ordering = ["-created_at"]
        verbose_name = "Photo Stack"
        verbose_name_plural = "Photo Stacks"
        indexes = [
            models.Index(fields=["owner", "stack_type"]),
        ]

    def __str__(self):
        return f"PhotoStack {self.id} - {self.stack_type} - {self.owner.username}"

    @property
    def photo_count(self):
        """Number of photos in this stack."""
        return self.photos.count()

    def get_photos_ordered_by_quality(self):
        """
        Returns photos in the stack ordered by quality metrics.
        Higher resolution and larger file size are considered better quality.
        """
        return self.photos.order_by("-metadata__width", "-metadata__height", "-size")

    def auto_select_primary(self):
        """
        Automatically selects the best photo as primary based on stack type.

        For BURST_SEQUENCE: Middle of sequence by timestamp
        For EXPOSURE_BRACKET: Middle exposure
        For MANUAL: Highest resolution
        
        For deprecated types (RAW_JPEG_PAIR, LIVE_PHOTO):
        These should be migrated to Photo.files, but for compatibility:
        - RAW_JPEG_PAIR: Prefer JPEG (non-RAW)
        - LIVE_PHOTO: Prefer still image (non-video)
        """
        photos = self.photos.all()
        if not photos.exists():
            return None

        if self.stack_type == self.StackType.BURST_SEQUENCE:
            # Pick middle of sequence by timestamp
            ordered = photos.order_by("exif_timestamp")
            count = ordered.count()
            best = ordered[count // 2] if count > 0 else None
        elif self.stack_type == self.StackType.EXPOSURE_BRACKET:
            # Pick middle exposure (usually the "correct" exposure)
            ordered = photos.order_by("exif_timestamp")
            count = ordered.count()
            best = ordered[count // 2] if count > 0 else None
        elif self.stack_type == self.StackType.RAW_JPEG_PAIR:
            # DEPRECATED: Prefer JPEG for display (RAW files have type=4)
            jpeg_photos = photos.exclude(main_file__type=4)
            best = jpeg_photos.first() if jpeg_photos.exists() else photos.first()
        elif self.stack_type == self.StackType.LIVE_PHOTO:
            # DEPRECATED: Prefer still image over video (VIDEO = 2)
            still_photos = photos.exclude(main_file__type=2)
            best = still_photos.first() if still_photos.exists() else photos.first()
        else:
            # MANUAL and default: highest resolution
            # Use metadata__width and metadata__height since these fields moved to PhotoMetadata
            best = photos.order_by(
                models.F("metadata__width") * models.F("metadata__height")
            ).last()

        if best:
            self.primary_photo = best
            self.save(update_fields=["primary_photo", "updated_at"])

        return best

    def merge_with(self, other_stack: "PhotoStack"):
        """
        Merge another stack into this one.
        All photos from the other stack are moved to this stack,
        and the other stack is deleted.
        """
        if other_stack.pk == self.pk:
            return

        # Move all photos from other stack to this one (ManyToMany)
        # Convert to list first to avoid modifying queryset while iterating
        photos_to_move = list(other_stack.photos.all())
        for photo in photos_to_move:
            photo.stacks.add(self)
            photo.stacks.remove(other_stack)

        # Recalculate primary if needed
        if not self.primary_photo:
            self.auto_select_primary()

        # Delete the now-empty stack
        other_stack.delete()

    @classmethod
    def create_or_merge(cls, owner, stack_type, photos, sequence_start=None, sequence_end=None):
        """
        Create a new stack or merge into existing if any photo is already stacked.

        Args:
            owner: User who owns the photos
            stack_type: Type of stack to create
            photos: Queryset or list of Photo objects to group
            sequence_start: Optional start timestamp for burst/bracket sequences
            sequence_end: Optional end timestamp for burst/bracket sequences

        Returns:
            The PhotoStack instance (new or existing)
        """
        photo_list = list(photos)
        if len(photo_list) < 2:
            return None

        # Check if any photo is already in a stack of the same type
        existing_stacks = cls.objects.filter(
            photos__in=photo_list,
            stack_type=stack_type,
            owner=owner,
        ).distinct()

        if existing_stacks.exists():
            # Merge all into the first existing stack
            target_stack = existing_stacks.first()
            for stack in existing_stacks[1:]:
                target_stack.merge_with(stack)

            # Add any new photos to the stack (ManyToMany)
            for photo in photo_list:
                if not photo.stacks.filter(pk=target_stack.pk).exists():
                    photo.stacks.add(target_stack)

            # Update sequence timestamps if provided and this is a burst/bracket stack
            if sequence_start is not None and sequence_end is not None:
                if target_stack.sequence_start is None or target_stack.sequence_start > sequence_start:
                    target_stack.sequence_start = sequence_start
                if target_stack.sequence_end is None or target_stack.sequence_end < sequence_end:
                    target_stack.sequence_end = sequence_end
                target_stack.save(update_fields=['sequence_start', 'sequence_end', 'updated_at'])

            target_stack.auto_select_primary()
            return target_stack
        else:
            # Create new stack
            stack = cls.objects.create(
                owner=owner,
                stack_type=stack_type,
                sequence_start=sequence_start,
                sequence_end=sequence_end,
            )

            # Associate photos (ManyToMany - add each photo to the stack)
            for photo in photo_list:
                photo.stacks.add(stack)

            stack.auto_select_primary()
            return stack


================================================
FILE: api/models/stack_review.py
================================================
"""
StackReview model for tracking user review decisions on reviewable stacks.

This model is separate from PhotoStack because:
1. Only certain stack types need review (exact_copy, visual_duplicate)
2. Other stack types (raw_jpeg, burst, bracket, live_photo) are informational
3. Manual stacks are always "reviewed" by definition (user created them)

This separation allows:
- Clean data model with clear semantics
- Different workflows for different stack types
- Historical tracking of review decisions
"""

import uuid

from django.db import models

from api.models.photo_stack import PhotoStack
from api.models.user import User, get_deleted_user


class StackReview(models.Model):
    """
    Records a user's review decision for a reviewable stack.
    
    Reviewable stack types:
    - exact_copy: User decides which copy to keep
    - visual_duplicate: User decides if photos are truly duplicates
    
    Non-reviewable stack types (informational only):
    - raw_jpeg: Both RAW and JPEG are kept (different purposes)
    - burst: User may want to browse all burst photos
    - bracket: HDR processing may need all exposures
    - live_photo: Photo and video are intrinsically linked
    - manual: User explicitly created the grouping
    """

    class Decision(models.TextChoices):
        # User hasn't reviewed yet
        PENDING = "pending", "Pending Review"
        # User selected a primary and trashed others
        RESOLVED = "resolved", "Resolved"
        # User marked as "not actually duplicates"
        DISMISSED = "dismissed", "Dismissed"

    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)

    stack = models.OneToOneField(
        PhotoStack,
        on_delete=models.CASCADE,
        related_name="review",
    )

    reviewer = models.ForeignKey(
        User,
        on_delete=models.SET(get_deleted_user),
        related_name="stack_reviews",
    )

    decision = models.CharField(
        max_length=20,
        choices=Decision.choices,
        default=Decision.PENDING,
        db_index=True,
    )

    # The photo the user chose to keep (only set when decision=RESOLVED)
    kept_photo = models.ForeignKey(
        "Photo",
        on_delete=models.SET_NULL,
        null=True,
        blank=True,
        related_name="kept_in_reviews",
    )

    # Number of photos trashed when resolved
    trashed_count = models.IntegerField(default=0)

    # Timestamps
    created_at = models.DateTimeField(auto_now_add=True)
    reviewed_at = models.DateTimeField(null=True, blank=True)

    # Optional note from user
    note = models.TextField(blank=True, null=True)

    class Meta:
        ordering = ["-created_at"]
        verbose_name = "Stack Review"
        verbose_name_plural = "Stack Reviews"
        indexes = [
            models.Index(fields=["reviewer", "decision"]),
        ]

    def __str__(self):
        return f"Review for {self.stack.id} - {self.decision}"

    @classmethod
    def is_reviewable_type(cls, stack_type: str) -> bool:
        """
        Check if a stack type requires user review.
        
        Currently no stack types are reviewable because:
        - exact_copy and visual_duplicate are now handled by Duplicate model
        - BURST_SEQUENCE, EXPOSURE_BRACKET, MANUAL are informational
        - RAW_JPEG_PAIR and LIVE_PHOTO are deprecated (use Photo.files)
        
        Returns:
            False for all current stack types
        """
        # No current stack types require review
        # Duplicates are handled by the separate Duplicate model
        return False

    @classmethod
    def create_for_stack(cls, stack: PhotoStack) -> "StackReview | None":
        """
        Create a review record for a stack if it's a reviewable type.
        Returns None for non-reviewable stack types.
        """
        if not cls.is_reviewable_type(stack.stack_type):
            return None

        review, created = cls.objects.get_or_create(
            stack=stack,
            defaults={
                "reviewer": stack.owner,
                "decision": cls.Decision.PENDING,
            }
        )
        return review

    def resolve(self, kept_photo, trash_others: bool = True):
        """
        Mark the review as resolved by selecting a photo to keep.
        
        Args:
            kept_photo: The Photo instance to keep as primary
            trash_others: Whether to move other photos to trash
        """
        from django.utils import timezone

        # Set the kept photo
        self.kept_photo = kept_photo
        self.decision = self.Decision.RESOLVED
        self.reviewed_at = timezone.now()

        # Also set as stack's primary photo
        self.stack.primary_photo = kept_photo
        self.stack.save(update_fields=["primary_photo", "updated_at"])

        # Trash others if requested
        if trash_others:
            other_photos = self.stack.photos.exclude(pk=kept_photo.pk)
            self.trashed_count = other_photos.update(in_trashcan=True)
        
        self.save()
        return self

    def dismiss(self):
        """Mark as 'not actually duplicates' and unlink photos from stack."""
        from django.utils import timezone

        self.decision = self.Decision.DISMISSED
        self.reviewed_at = timezone.now()
        
        # Unlink photos from stack (ManyToMany)
        for photo in self.stack.photos.all():
            photo.stacks.remove(self.stack)
        
        self.save()
        return self

    def revert(self):
        """Revert a resolved review, restoring trashed photos."""
        if self.decision != self.Decision.RESOLVED:
            return self

        # Restore trashed photos in this stack (using ManyToMany relationship)
        restored_count = self.stack.photos.filter(
            in_trashcan=True
        ).update(in_trashcan=False)

        # Reset to pending
        self.decision = self.Decision.PENDING
        self.kept_photo = None
        self.trashed_count = 0
        self.reviewed_at = None
        
        # Clear stack's primary
        self.stack.primary_photo = None
        self.stack.save(update_fields=["primary_photo", "updated_at"])

        self.save()
        return restored_count


================================================
FILE: api/models/thumbnail.py
================================================
import os

from django.db import models
from PIL import Image

from api.metadata.reader import get_metadata
from api.metadata.tags import Tags
from api.models.photo import Photo
from api.thumbnails import (
    create_animated_thumbnail,
    create_thumbnail,
    create_thumbnail_for_video,
    does_static_thumbnail_exist,
    does_video_thumbnail_exist,
)
from api.util import logger


class Thumbnail(models.Model):
    photo = models.OneToOneField(
        Photo, on_delete=models.CASCADE, related_name="thumbnail", primary_key=True
    )
    thumbnail_big = models.ImageField(upload_to="thumbnails_big")
    square_thumbnail = models.ImageField(upload_to="square_thumbnails")
    square_thumbnail_small = models.ImageField(upload_to="square_thumbnails_small")
    aspect_ratio = models.FloatField(blank=True, null=True)
    dominant_color = models.TextField(blank=True, null=True)

    def _generate_thumbnail(self):
        try:
            # Use photo.image_hash for thumbnail paths for frontend compatibility
            photo_hash = self.photo.image_hash
            if not does_static_thumbnail_exist("thumbnails_big", photo_hash):
                if not self.photo.video:
                    create_thumbnail(
                        input_path=self.photo.main_file.path,
                        output_height=1080,
                        output_path="thumbnails_big",
                        hash=photo_hash,
                        file_type=".webp",
                    )
                else:
                    create_thumbnail_for_video(
                        input_path=self.photo.main_file.path,
                        output_path="thumbnails_big",
                        hash=photo_hash,
                        file_type=".webp",
                    )

            if not self.photo.video and not does_static_thumbnail_exist(
                "square_thumbnails", photo_hash
            ):
                create_thumbnail(
                    input_path=self.photo.main_file.path,
                    output_height=500,
                    output_path="square_thumbnails",
                    hash=photo_hash,
                    file_type=".webp",
                )
            if self.photo.video and not does_video_thumbnail_exist(
                "square_thumbnails", photo_hash
            ):
                create_animated_thumbnail(
                    input_path=self.photo.main_file.path,
                    output_height=500,
                    output_path="square_thumbnails",
                    hash=photo_hash,
                    file_type=".mp4",
                )

            if not self.photo.video and not does_static_thumbnail_exist(
                "square_thumbnails_small", photo_hash
            ):
                create_thumbnail(
                    input_path=self.photo.main_file.path,
                    output_height=250,
                    output_path="square_thumbnails_small",
                    hash=photo_hash,
                    file_type=".webp",
                )
            if self.photo.video and not does_video_thumbnail_exist(
                "square_thumbnails_small", photo_hash
            ):
                create_animated_thumbnail(
                    input_path=self.photo.main_file.path,
                    output_height=250,
                    output_path="square_thumbnails_small",
                    hash=photo_hash,
                    file_type=".mp4",
                )
            filetype = ".webp"
            if self.photo.video:
                filetype = ".mp4"
            self.thumbnail_big.name = os.path.join(
                "thumbnails_big", photo_hash + ".webp"
            )
            self.square_thumbnail.name = os.path.join(
                "square_thumbnails", photo_hash + filetype
            )
            self.square_thumbnail_small.name = os.path.join(
                "square_thumbnails_small", photo_hash + filetype
            )
            self.save()
        except Exception as e:
            logger.exception(
                f"could not generate thumbnail for image {self.photo.main_file.path}"
            )
            raise e

    def _calculate_aspect_ratio(self):
        try:
            # Relies on big thumbnail for correct aspect ratio
            height, width = get_metadata(
                self.thumbnail_big.path,
                tags=[Tags.IMAGE_HEIGHT, Tags.IMAGE_WIDTH],
                try_sidecar=False,
            )
            self.aspect_ratio = round(width / height, 2)

            self.save()
        except Exception as e:
            logger.exception(
                f"could not calculate aspect ratio for image {self.thumbnail_big.path}"
            )
            raise e

    def _get_dominant_color(self, palette_size=16):
        # Skip if it's already calculated
        if self.dominant_color:
            return
        try:
            # Resize image to speed up processing
            img = Image.open(self.square_thumbnail_small.path)
            img.thumbnail((100, 100))

            # Reduce colors (uses k-means internally)
            paletted = img.convert("P", palette=Image.ADAPTIVE, colors=palette_size)

            # Find the color that occurs most often
            palette = paletted.getpalette()
            color_counts = sorted(paletted.getcolors(), reverse=True)
            palette_index = color_counts[0][1]
            dominant_color = palette[palette_index * 3 : palette_index * 3 + 3]
            self.dominant_color = dominant_color
            self.save()
        except Exception:
            logger.info(f"Cannot calculate dominant color {self} object")


================================================
FILE: api/models/user.py
================================================
import pytz
from django.conf import settings
from django.contrib.auth.models import AbstractUser
from django.db import models
from django_cryptography.fields import encrypt

from api.date_time_extractor import DEFAULT_RULES_JSON
from api.burst_detection_rules import get_default_burst_detection_rules


def get_default_config_datetime_rules():  # This is a callable
    return DEFAULT_RULES_JSON


def get_default_config_burst_detection_rules():  # This is a callable
    return get_default_burst_detection_rules()


def get_default_llm_settings():
    return {
        "enabled": False,
        "add_person": False,
        "add_location": False,
        "add_keywords": False,
        "add_camera": False,
        "add_lens": False,
        "add_album": False,
        "sentiment": 0,
        "custom_prompt": "",
        "custom_prompt_enabled": False,
    }


def get_default_public_sharing_settings():
    """Default settings for what metadata to share in public albums.

    All options default to False (opt-in) for privacy-first approach.
    Users can change their defaults, and per-album overrides take precedence.
    """
    return {
        "share_location": False,  # GPS coordinates and location names
        "share_camera_info": False,  # Camera make/model, lens, settings
        "share_timestamps": False,  # Date/time when photo was taken
        "share_captions": False,  # AI-generated or user captions
        "share_faces": False,  # Detected faces (always recommend False)
    }


class User(AbstractUser):
    scan_directory = models.CharField(
        max_length=512, db_index=True, blank=True, default=""
    )
    confidence = models.FloatField(default=0.1, db_index=True)
    confidence_person = models.FloatField(default=0.9)
    image_scale = models.FloatField(default=1)
    semantic_search_topk = models.IntegerField(default=0)
    avatar = models.ImageField(upload_to="avatars", null=True, blank=True)
    transcode_videos = models.BooleanField(default=False)
    nextcloud_server_address = models.CharField(max_length=200, default="", blank=True)
    nextcloud_username = models.CharField(max_length=64, default="", blank=True)
    nextcloud_app_password = encrypt(
        models.CharField(max_length=64, default="", blank=True)
    )
    nextcloud_scan_directory = models.CharField(
        max_length=512, db_index=True, default="", blank=True
    )

    favorite_min_rating = models.IntegerField(
        default=settings.DEFAULT_FAVORITE_MIN_RATING, db_index=True
    )

    class SaveMetadata(models.TextChoices):
        OFF = "OFF"
        MEDIA_FILE = "MEDIA_FILE"
        SIDECAR_FILE = "SIDECAR_FILE"

    save_metadata_to_disk = models.TextField(
        choices=SaveMetadata.choices, default=SaveMetadata.OFF
    )
    save_face_tags_to_disk = models.BooleanField(default=False)
    llm_settings = models.JSONField(default=get_default_llm_settings)
    datetime_rules = models.JSONField(default=get_default_config_datetime_rules)
    burst_detection_rules = models.JSONField(
        default=get_default_config_burst_detection_rules
    )
    default_timezone = models.TextField(
        choices=[(x, x) for x in pytz.all_timezones],
        default="UTC",
    )
    public_sharing = models.BooleanField(default=False)
    public_sharing_defaults = models.JSONField(
        default=get_default_public_sharing_settings
    )

    class FaceRecogniton(models.TextChoices):
        HOG = "HOG"
        CNN = "CNN"

    face_recognition_model = models.TextField(
        choices=FaceRecogniton.choices, default=FaceRecogniton.HOG
    )
    min_cluster_size = models.IntegerField(default=0)
    confidence_unknown_face = models.FloatField(default=0.5)
    min_samples = models.IntegerField(default=1)
    cluster_selection_epsilon = models.FloatField(default=0.05)

    class TextAlignment(models.TextChoices):
        LEFT = "left"
        RIGHT = "right"

    text_alignment = models.TextField(
        choices=TextAlignment.choices, default=TextAlignment.RIGHT
    )

    class HeaderSize(models.TextChoices):
        LARGE = "large"
        NORMAL = "normal"
        SMALL = "small"

    header_size = models.TextField(choices=HeaderSize.choices, default=HeaderSize.LARGE)
    skip_raw_files = models.BooleanField(
        default=False
    )  # Deprecated: kept for migration compatibility
    stack_raw_jpeg = models.BooleanField(default=True)
    slideshow_interval = models.IntegerField(default=5)

    # Duplicate detection settings
    class DuplicateSensitivity(models.TextChoices):
        STRICT = "strict"
        NORMAL = "normal"
        LOOSE = "loose"

    duplicate_sensitivity = models.TextField(
        choices=DuplicateSensitivity.choices, default=DuplicateSensitivity.NORMAL
    )
    duplicate_clear_existing = models.BooleanField(default=False)


def get_admin_user():
    return User.objects.get(is_superuser=True)


def get_deleted_user():
    deleted_user: User = User.objects.get_or_create(username="deleted")[0]
    if deleted_user.is_active is not False:
        deleted_user.is_active = False
        deleted_user.save()
    return deleted_user


================================================
FILE: api/nextcloud.py
================================================
import os

import owncloud as nextcloud


def login(user):
    nc = nextcloud.Client(user.nextcloud_server_address)
    nc.login(user.nextcloud_username, user.nextcloud_app_password)

    def path_to_dict(path):
        d = {"title": os.path.basename(path), "absolute_path": path}
        try:
            d["children"] = [
                path_to_dict(os.path.join(path, x.path))
                for x in nc.list(path)
                if x.is_dir()
            ]
        except Exception:
            pass

        return d


def list_dir(user, path):
    nc = nextcloud.Client(user.nextcloud_server_address)
    nc.login(user.nextcloud_username, user.nextcloud_app_password)
    return [p.path for p in nc.list(path) if p.is_dir()]


================================================
FILE: api/perceptual_hash.py
================================================
"""
Perceptual hashing module for duplicate image detection.

Uses pHash (perceptual hash) algorithm which is robust to:
- Image resizing/scaling
- Compression artifacts (JPEG quality differences)
- Minor color adjustments
- Small crops (up to ~15% border removal)
"""

import imagehash
from PIL import Image

from api.util import logger

# Threshold for considering two images as duplicates
# pHash produces 64-bit hashes, Hamming distance <= 10 indicates high similarity
DEFAULT_HAMMING_THRESHOLD = 10


def calculate_perceptual_hash(image_path: str, hash_size: int = 8) -> str | None:
    """
    Calculate the perceptual hash (pHash) of an image.

    Args:
        image_path: Path to the image file
        hash_size: Size of the hash (default 8 produces 64-bit hash)

    Returns:
        Hex string representation of the perceptual hash, or None if failed
    """
    try:
        with Image.open(image_path) as img:
            # Convert to RGB if necessary (handles RGBA, palette images, etc.)
            if img.mode not in ("RGB", "L"):
                img = img.convert("RGB")

            # Calculate pHash - uses DCT (Discrete Cosine Transform)
            # More robust than average hash or difference hash
            phash = imagehash.phash(img, hash_size=hash_size)
            return str(phash)
    except Exception as e:
        logger.error(f"Failed to calculate perceptual hash for {image_path}: {e}")
        return None


def calculate_hash_from_thumbnail(thumbnail_path: str) -> str | None:
    """
    Calculate perceptual hash from a thumbnail image.
    Using thumbnails is faster and still produces reliable hashes.

    Args:
        thumbnail_path: Path to the thumbnail file

    Returns:
        Hex string representation of the perceptual hash, or None if failed
    """
    return calculate_perceptual_hash(thumbnail_path)


def hamming_distance(hash1: str, hash2: str) -> int:
    """
    Calculate the Hamming distance between two perceptual hashes.

    Args:
        hash1: First hash as hex string
        hash2: Second hash as hex string

    Returns:
        Number of differing bits (0 = identical, higher = more different)
    """
    try:
        h1 = imagehash.hex_to_hash(hash1)
        h2 = imagehash.hex_to_hash(hash2)
        return h1 - h2  # imagehash overloads subtraction to return Hamming distance
    except Exception as e:
        logger.error(f"Failed to calculate Hamming distance: {e}")
        return 64  # Maximum distance (completely different)


def are_duplicates(hash1: str, hash2: str, threshold: int = DEFAULT_HAMMING_THRESHOLD) -> bool:
    """
    Determine if two images are duplicates based on their perceptual hashes.

    Args:
        hash1: First perceptual hash
        hash2: Second perceptual hash
        threshold: Maximum Hamming distance to consider as duplicates (default 10)

    Returns:
        True if images are likely duplicates, False otherwise
    """
    if not hash1 or not hash2:
        return False
    return hamming_distance(hash1, hash2) <= threshold


def find_similar_hashes(
    target_hash: str,
    hash_list: list[tuple[str, str]],
    threshold: int = DEFAULT_HAMMING_THRESHOLD,
) -> list[tuple[str, int]]:
    """
    Find all hashes similar to the target hash.

    Args:
        target_hash: The hash to compare against
        hash_list: List of (image_id, hash) tuples to search
        threshold: Maximum Hamming distance for similarity

    Returns:
        List of (image_id, distance) tuples for similar images, sorted by distance
    """
    if not target_hash:
        return []

    similar = []
    for image_id, hash_value in hash_list:
        if hash_value and hash_value != target_hash:
            distance = hamming_distance(target_hash, hash_value)
            if distance <= threshold:
                similar.append((image_id, distance))

    return sorted(similar, key=lambda x: x[1])


================================================
FILE: api/permissions.py
================================================
from constance import config as site_config
from rest_framework import permissions

from api.models import User


class IsAdminOrSelf(permissions.BasePermission):
    def has_object_permission(self, request, view, obj):
        if request.method in permissions.SAFE_METHODS:
            return True

        return request.user and request.user.is_staff or obj == request.user


class IsAdminOrFirstTimeSetupOrRegistrationAllowed(permissions.BasePermission):
    def has_permission(self, request, view):
        if request.method in permissions.SAFE_METHODS:
            return True

        is_admin = request.user and request.user.is_staff
        is_first_time_setup = not User.objects.filter(is_superuser=True).exists()
        is_registration_allowed = bool(site_config.ALLOW_REGISTRATION)

        return is_admin or is_first_time_setup or is_registration_allowed


class IsOwnerOrReadOnly(permissions.BasePermission):
    """Custom permission to only allow owners of an object to edit it."""

    def has_object_permission(self, request, view, obj):
        # Read permissions are allowed to any request,
        # so we'll always allow GET, HEAD or OPTIONS requests.
        if request.method in permissions.SAFE_METHODS:
            return True

        # Write permissions are only allowed to the owner of the snippet.
        return obj.owner == request.user


class IsUserOrReadOnly(permissions.BasePermission):
    """Custom permission to only allow owners of an object to edit it."""

    def has_object_permission(self, request, view, obj):
        # Read permissions are allowed to any request,
        # so we'll always allow GET, HEAD or OPTIONS requests.
        if request.method in permissions.SAFE_METHODS:
            return True

        # Write permissions are only allowed to the owner of the snippet.
        return obj == request.user


class IsPhotoOrAlbumSharedTo(permissions.BasePermission):
    """Custom permission to only allow owners of an object to edit it."""

    def has_object_permission(self, request, view, obj):
        if obj.public:
            return True

        if obj.owner == request.user or request.user in obj.shared_to.all():
            return True

        for album in obj.albumuser_set.only("shared_to"):
            if request.user in album.shared_to.all():
                return True

        return False


class IsRegistrationAllowed(permissions.BasePermission):
    """Custom permission to only allow if registration is allowed globally."""

    def has_permission(self, request, view):
        return bool(site_config.ALLOW_REGISTRATION)


================================================
FILE: api/schemas/site_settings.py
================================================
site_settings_schema = {
    "type": "object",
    "anyOf": [
        {"required": ["allow_registration"]},
        {"required": ["allow_upload"]},
        {"required": ["skip_patterns"]},
        {"required": ["map_api_provider"]},
        {"required": ["map_api_key"]},
        {"required": ["captioning_model"]},
        {"required": ["llm_model"]},
        {"required": ["tagging_model"]},
    ],
    "properties": {
        "allow_registration": {"type": "boolean"},
        "allow_upload": {"type": "boolean"},
        "skip_patterns": {"type": "string"},
        "map_api_provider": {"type": "string"},
        "map_api_key": {"type": "string"},
        "captioning_model": {"type": "string"},
        "llm_model": {"type": "string"},
        "tagging_model": {"type": "string"},
    },
}


================================================
FILE: api/semantic_search.py
================================================
import numpy as np
import requests
from django.conf import settings

dir_clip_ViT_B_32_model = settings.CLIP_ROOT


def create_clip_embeddings(imgs):
    json = {
        "imgs": imgs,
        "model": dir_clip_ViT_B_32_model,
    }
    clip_embeddings = requests.post(
        "http://localhost:8006/clip-embeddings", json=json
    ).json()

    imgs_emb = clip_embeddings["imgs_emb"]
    magnitudes = clip_embeddings["magnitudes"]

    # Convert Python lists to NumPy arrays
    imgs_emb = [np.array(enc) for enc in imgs_emb]

    return imgs_emb, magnitudes


def calculate_query_embeddings(query):
    json = {
        "query": query,
        "model": dir_clip_ViT_B_32_model,
    }
    query_embedding = requests.post(
        "http://localhost:8006/query-embeddings", json=json
    ).json()

    emb = query_embedding["emb"]
    magnitude = query_embedding["magnitude"]
    return emb, magnitude


================================================
FILE: api/serializers/PhotosGroupedByDate.py
================================================
import pytz
from itertools import groupby

utc = pytz.UTC


class PhotosGroupedByDate:
    def __init__(self, location, date, photos):
        self.photos = photos
        self.date = date
        self.location = location


def get_photos_ordered_by_date(photos):
    """
    Efficiently group photos by date using itertools.groupby.
    Assumes photos are already ordered by exif_timestamp.
    """
    # Convert to list once if it's a queryset
    if hasattr(photos, "_result_cache") and photos._result_cache is None:
        photos = list(photos)

    result = []
    no_timestamp_photos = []

    def date_key(photo):
        """Key function for grouping photos by date"""
        if photo.exif_timestamp:
            return photo.exif_timestamp.date().strftime("%Y-%m-%d")
        return None

    # Group consecutive photos by their date
    for date_str, group_photos in groupby(photos, key=date_key):
        group_list = list(group_photos)
        location = ""

        if date_str is not None:
            # Use the first photo's timestamp as the group date
            date = group_list[0].exif_timestamp
            result.append(PhotosGroupedByDate(location, date, group_list))
        else:
            # Collect photos without timestamps
            no_timestamp_photos.extend(group_list)

    # Add no timestamp photos as a single group at the end
    if no_timestamp_photos:
        result.append(PhotosGroupedByDate("", "No timestamp", no_timestamp_photos))

    return result


================================================
FILE: api/serializers/__init__.py
================================================


================================================
FILE: api/serializers/album_auto.py
================================================
from rest_framework import serializers

from api.models import AlbumAuto
from api.serializers.person import PersonSerializer
from api.serializers.photos import PhotoHashListSerializer
from api.serializers.simple import PhotoSimpleSerializer


class AlbumAutoSerializer(serializers.ModelSerializer):
    photos = PhotoSimpleSerializer(many=True, read_only=False)
    people = serializers.SerializerMethodField()

    class Meta:
        model = AlbumAuto
        fields = (
            "id",
            "title",
            "favorited",
            "timestamp",
            "created_on",
            "gps_lat",
            "people",
            "gps_lon",
            "photos",
        )

    def get_people(self, obj) -> PersonSerializer(many=True):
        res = []
        for photo in obj.photos.all():
            faces = photo.faces.all()
            for face in faces:
                serialized_person = PersonSerializer(face.person).data
                if serialized_person not in res:
                    res.append(serialized_person)
        return res

    def delete(self, validated_data, id):
        album = AlbumAuto.objects.filter(id=id).get()
        album.delete()


class AlbumAutoListSerializer(serializers.ModelSerializer):
    photos = serializers.SerializerMethodField()
    photo_count = serializers.SerializerMethodField()

    class Meta:
        model = AlbumAuto
        fields = (
            "id",
            "title",
            "timestamp",
            "photos",
            "photo_count",
            "favorited",
        )

    def get_photo_count(self, obj) -> int:
        try:
            return obj.photo_count
        except Exception:
            return obj.photos.count()

    def get_photos(self, obj) -> PhotoHashListSerializer:
        try:
            return PhotoHashListSerializer(obj.cover_photo[0]).data
        except Exception:
            return ""


================================================
FILE: api/serializers/album_date.py
================================================
from rest_framework import serializers

from api.models import AlbumDate


class IncompleteAlbumDateSerializer(serializers.ModelSerializer):
    id = serializers.SerializerMethodField()
    date = serializers.SerializerMethodField()
    location = serializers.SerializerMethodField()
    incomplete = serializers.SerializerMethodField()
    numberOfItems = serializers.SerializerMethodField("get_number_of_items")
    items = serializers.SerializerMethodField()

    class Meta:
        model = AlbumDate
        fields = ("id", "date", "location", "incomplete", "numberOfItems", "items")

    def get_id(self, obj) -> str:
        return str(obj.id)

    def get_date(self, obj) -> str:
        if obj.date:
            return obj.date.isoformat()
        else:
            return None

    def get_items(self, obj) -> list:
        return []

    def get_incomplete(self, obj) -> bool:
        return True

    def get_number_of_items(self, obj) -> int:
        if obj and obj.photo_count:
            return obj.photo_count
        else:
            return 0

    def get_location(self, obj) -> str:
        if obj and obj.location:
            return obj.location["places"][0]
        else:
            return ""


class AlbumDateSerializer(serializers.ModelSerializer):
    id = serializers.SerializerMethodField()
    date = serializers.SerializerMethodField()
    location = serializers.SerializerMethodField()
    incomplete = serializers.SerializerMethodField()
    numberOfItems = serializers.SerializerMethodField("get_number_of_items")
    items = serializers.SerializerMethodField()

    class Meta:
        model = AlbumDate
        fields = ("id", "date", "location", "incomplete", "numberOfItems", "items")

    def get_id(self, obj) -> str:
        return str(obj.id)

    def get_date(self, obj) -> str:
        if obj.date:
            return obj.date.isoformat()
        else:
            return None

    def get_items(self, obj) -> dict:
        # This method is removed as we're directly including paginated photos in the response.
        pass

    def get_incomplete(self, obj) -> bool:
        return False

    def get_number_of_items(self, obj) -> int:
        # this will also get added in the response
        pass

    def get_location(self, obj) -> str:
        if obj and obj.location:
            return obj.location["places"][0]
        else:
            return ""


================================================
FILE: api/serializers/album_place.py
================================================
from rest_framework import serializers

from api.models import AlbumPlace
from api.serializers.photos import GroupedPhotosSerializer, PhotoHashListSerializer
from api.serializers.PhotosGroupedByDate import get_photos_ordered_by_date
from api.serializers.simple import PhotoSuperSimpleSerializer


class GroupedPlacePhotosSerializer(serializers.ModelSerializer):
    id = serializers.SerializerMethodField()
    grouped_photos = serializers.SerializerMethodField()

    class Meta:
        model = AlbumPlace
        fields = (
            "id",
            "title",
            "grouped_photos",
        )

    # To-Do: Remove legacy stuff
    def get_id(self, obj) -> str:
        return str(obj.id)

    def get_grouped_photos(self, obj) -> GroupedPhotosSerializer(many=True):
        grouped_photos = get_photos_ordered_by_date(obj.photos.all())
        res = GroupedPhotosSerializer(grouped_photos, many=True).data
        return res


class AlbumPlaceSerializer(serializers.ModelSerializer):
    photos = PhotoSuperSimpleSerializer(many=True, read_only=True)

    class Meta:
        model = AlbumPlace
        fields = ("id", "title", "photos")


class AlbumPlaceListSerializer(serializers.ModelSerializer):
    cover_photos = PhotoHashListSerializer(many=True, read_only=True)
    photo_count = serializers.SerializerMethodField()

    class Meta:
        model = AlbumPlace
        fields = ("id", "geolocation_level", "cover_photos", "title", "photo_count")

    def get_photo_count(self, obj) -> int:
        return obj.photo_count


================================================
FILE: api/serializers/album_thing.py
================================================
from rest_framework import serializers

from api.models import AlbumThing
from api.serializers.photos import GroupedPhotosSerializer, PhotoHashListSerializer
from api.serializers.PhotosGroupedByDate import get_photos_ordered_by_date
from api.serializers.simple import PhotoSuperSimpleSerializer


class GroupedThingPhotosSerializer(serializers.ModelSerializer):
    id = serializers.SerializerMethodField()
    grouped_photos = serializers.SerializerMethodField()

    class Meta:
        model = AlbumThing
        fields = (
            "id",
            "title",
            "grouped_photos",
        )

    def get_id(self, obj) -> str:
        return str(obj.id)

    def get_grouped_photos(self, obj) -> GroupedPhotosSerializer(many=True):
        grouped_photos = get_photos_ordered_by_date(obj.photos.all())
        res = GroupedPhotosSerializer(grouped_photos, many=True).data
        return res


class AlbumThingSerializer(serializers.ModelSerializer):
    photos = PhotoSuperSimpleSerializer(many=True, read_only=True)

    class Meta:
        model = AlbumThing
        fields = ("id", "title", "photos")


class AlbumThingListSerializer(serializers.ModelSerializer):
    cover_photos = PhotoHashListSerializer(many=True, read_only=True)
    photo_count = serializers.SerializerMethodField()

    class Meta:
        model = AlbumThing
        fields = (
            "id",
            "cover_photos",
            "title",
            "photo_count",
            "thing_type",
            "cover_photos",
        )

    def get_photo_count(self, obj) -> int:
        return obj.photo_count


================================================
FILE: api/serializers/album_user.py
================================================
from rest_framework import serializers

from api.models import AlbumUser, Photo
from api.serializers.photos import GroupedPhotosSerializer
from api.serializers.PhotosGroupedByDate import get_photos_ordered_by_date
from api.serializers.simple import PhotoSuperSimpleSerializer, SimpleUserSerializer
from api.util import logger


class AlbumUserSerializer(serializers.ModelSerializer):
    id = serializers.SerializerMethodField()
    owner = SimpleUserSerializer(many=False, read_only=True)
    shared_to = SimpleUserSerializer(many=True, read_only=True)
    date = serializers.SerializerMethodField()
    location = serializers.SerializerMethodField()
    grouped_photos = serializers.SerializerMethodField()
    public = serializers.SerializerMethodField()
    public_slug = serializers.SerializerMethodField()
    public_expires_at = serializers.SerializerMethodField()
    public_sharing_options = serializers.SerializerMethodField()

    class Meta:
        model = AlbumUser
        fields = (
            "id",
            "title",
            "owner",
            "shared_to",
            "date",
            "location",
            "grouped_photos",
            "public",
            "public_slug",
            "public_expires_at",
            "public_sharing_options",
        )

    # To-Do: Legacy definition, should be a number instead
    def get_id(self, obj) -> str:
        return str(obj.id)

    def get_grouped_photos(self, obj) -> GroupedPhotosSerializer(many=True):
        grouped_photos = get_photos_ordered_by_date(
            obj.photos.all().order_by("-exif_timestamp")
        )
        res = GroupedPhotosSerializer(grouped_photos, many=True).data
        return res

    def get_location(self, obj) -> str:
        for photo in obj.photos.all():
            if (
                photo
                and hasattr(photo, "search_instance")
                and photo.search_instance
                and photo.search_instance.search_location
            ):
                return photo.search_instance.search_location
        return ""

    def get_date(self, obj) -> str:
        for photo in obj.photos.all():
            if photo and photo.exif_timestamp:
                return photo.exif_timestamp
        return ""

    def get_public(self, obj) -> bool:
        return bool(getattr(obj, "share", None) and obj.share.enabled)

    def get_public_slug(self, obj) -> str:
        return getattr(getattr(obj, "share", None), "slug", "") or ""

    def get_public_expires_at(self, obj):
        return getattr(getattr(obj, "share", None), "expires_at", None)

    def get_public_sharing_options(self, obj) -> dict | None:
        """Return the per-album sharing option overrides (None values = use default)."""
        share = getattr(obj, "share", None)
        if not share:
            return None
        return {
            "share_location": share.share_location,
            "share_camera_info": share.share_camera_info,
            "share_timestamps": share.share_timestamps,
            "share_captions": share.share_captions,
            "share_faces": share.share_faces,
        }


class AlbumUserEditSerializer(serializers.ModelSerializer):
    photos = serializers.PrimaryKeyRelatedField(
        many=True, read_only=False, queryset=Photo.objects.all()
    )
    removedPhotos = serializers.ListField(
        child=serializers.CharField(max_length=100, default=""),
        write_only=True,
        required=False,
    )

    class Meta:
        model = AlbumUser
        fields = (
            "id",
            "title",
            "photos",
            "created_on",
            "favorited",
            "removedPhotos",
            "cover_photo",
        )

    def create(self, validated_data):
        title = validated_data["title"]
        photos = validated_data["photos"]

        user = None
        request = self.context.get("request")
        if request and hasattr(request, "user"):
            user = request.user

        # check if an album exists with the given title and call the update method if it does
        instance, created = AlbumUser.objects.get_or_create(title=title, owner=user)
        if not created:
            return self.update(instance, validated_data)

        for photo in photos:
            instance.photos.add(photo)
        instance.save()
        logger.info(f"Created user album {instance.id} with {len(photos)} photos")
        return instance

    def update(self, instance, validated_data):
        if "title" in validated_data.keys():
            title = validated_data["title"]
            instance.title = title
            logger.info(f"Renamed user album to {title}")

        if "removedPhotos" in validated_data.keys():
            image_hashes = validated_data["removedPhotos"]
            photos_already_in_album = instance.photos.all()
            cnt = 0
            for obj in photos_already_in_album:
                if obj.image_hash in image_hashes:
                    cnt += 1
                    instance.photos.remove(obj)

            logger.info(f"Removed {cnt} photos to user album {instance.id}")

        if "cover_photo" in validated_data.keys():
            cover_photo = validated_data["cover_photo"]
            instance.cover_photo = cover_photo
            logger.info(f"Changed cover photo to {cover_photo}")

        if "photos" in validated_data.keys():
            photos = validated_data["photos"]
            photos_already_in_album = instance.photos.all()
            cnt = 0
            for photo in photos:
                if photo not in photos_already_in_album:
                    cnt += 1
                    instance.photos.add(photo)

            logger.info(f"Added {cnt} photos to user album {instance.id}")

        instance.save()
        return instance


class AlbumUserListSerializer(serializers.ModelSerializer):
    cover_photo = serializers.SerializerMethodField()
    photo_count = serializers.SerializerMethodField()
    shared_to = SimpleUserSerializer(many=True, read_only=True)
    owner = SimpleUserSerializer(many=False, read_only=True)
    public = serializers.SerializerMethodField()
    public_slug = serializers.SerializerMethodField()
    public_expires_at = serializers.SerializerMethodField()
    public_sharing_options = serializers.SerializerMethodField()

    class Meta:
        model = AlbumUser
        fields = (
            "id",
            "cover_photo",
            "created_on",
            "favorited",
            "title",
            "shared_to",
            "owner",
            "photo_count",
            "public",
            "public_slug",
            "public_expires_at",
            "public_sharing_options",
        )

    def get_cover_photo(self, obj) -> PhotoSuperSimpleSerializer:
        if obj.cover_photo:
            return PhotoSuperSimpleSerializer(obj.cover_photo).data
        return PhotoSuperSimpleSerializer(obj.photos.first()).data

    def get_photo_count(self, obj) -> int:
        try:
            return obj.photo_count
        except Exception:  # for when calling AlbumUserListSerializer(obj).data directly
            return obj.photos.count()

    def get_public(self, obj) -> bool:
        return bool(getattr(obj, "share", None) and obj.share.enabled)

    def get_public_slug(self, obj) -> str:
        return getattr(getattr(obj, "share", None), "slug", "") or ""

    def get_public_expires_at(self, obj):
        return getattr(getattr(obj, "share", None), "expires_at", None)

    def get_public_sharing_options(self, obj) -> dict | None:
        """Return the per-album sharing option overrides (None values = use default)."""
        share = getattr(obj, "share", None)
        if not share:
            return None
        return {
            "share_location": share.share_location,
            "share_camera_info": share.share_camera_info,
            "share_timestamps": share.share_timestamps,
            "share_captions": share.share_captions,
            "share_faces": share.share_faces,
        }


class AlbumUserPublicSerializer(serializers.ModelSerializer):
    """Serializer for publicly shared user albums.

    Ensures photos are grouped from a filtered subset (not hidden, not in trashcan).
    """

    id = serializers.SerializerMethodField()
    owner = SimpleUserSerializer(many=False, read_only=True)
    date = serializers.SerializerMethodField()
    location = serializers.SerializerMethodField()
    grouped_photos = serializers.SerializerMethodField()
    public_slug = serializers.CharField(read_only=True)
    public_expires_at = serializers.DateTimeField(read_only=True)

    class Meta:
        model = AlbumUser
        fields = (
            "id",
            "title",
            "owner",
            "date",
            "location",
            "grouped_photos",
            "public_slug",
            "public_expires_at",
        )

    def get_id(self, obj) -> str:
        return str(obj.id)

    def _filtered_photos(self, obj):
        # Public albums should not expose hidden or trash photos
        return obj.photos.filter(hidden=False, in_trashcan=False).order_by(
            "-exif_timestamp"
        )

    def get_grouped_photos(self, obj) -> GroupedPhotosSerializer(many=True):
        grouped_photos = get_photos_ordered_by_date(self._filtered_photos(obj))
        return GroupedPhotosSerializer(grouped_photos, many=True).data

    def get_location(self, obj) -> str:
        for photo in self._filtered_photos(obj):
            if (
                photo
                and hasattr(photo, "search_instance")
                and photo.search_instance
                and photo.search_instance.search_location
            ):
                return photo.search_instance.search_location
        return ""

    def get_date(self, obj) -> str:
        for photo in self._filtered_photos(obj):
            if photo and photo.exif_timestamp:
                return photo.exif_timestamp
        return ""


================================================
FILE: api/serializers/face.py
================================================
from rest_framework import serializers

from api.models import Face, Person


class PersonFaceListSerializer(serializers.ModelSerializer):
    face_url = serializers.SerializerMethodField()
    person_label_probability = serializers.SerializerMethodField()
    photo_image_hash = serializers.SerializerMethodField()

    class Meta:
        model = Face
        fields = [
            "id",
            "image",
            "face_url",
            "photo",
            "photo_image_hash",
            "timestamp",
            "person_label_probability",
        ]

    def get_person_label_probability(self, obj):
        if obj.analysis_method == "clustering":
            return obj.cluster_probability
        else:
            return obj.classification_probability

    def get_face_url(self, obj):
        return obj.image.url

    def get_photo_image_hash(self, obj):
        return obj.photo.image_hash if obj.photo else None


class IncompletePersonFaceListSerializer(serializers.ModelSerializer):
    face_count = serializers.SerializerMethodField()

    class Meta:
        model = Person
        fields = ["id", "name", "kind", "face_count"]

    def get_face_count(self, obj) -> int:
        if obj and obj.viewable_face_count:
            return obj.viewable_face_count
        else:
            return 0


class FaceListSerializer(serializers.ModelSerializer):
    person_name = serializers.SerializerMethodField()
    face_url = serializers.SerializerMethodField()
    person_label_probability = serializers.SerializerMethodField()

    class Meta:
        model = Face
        fields = (
            "id",
            "image",
            "face_url",
            "photo",
            "timestamp",
            "person",
            "person_label_probability",
            "person_name",
        )

    def get_person_label_probability(self, obj) -> float:
        return obj.cluster_probability

    def get_face_url(self, obj) -> str:
        return obj.image.url

    def get_person_name(self, obj) -> str:
        if obj.person:
            return obj.person.name
        else:
            return "Unknown - Other"


================================================
FILE: api/serializers/job.py
================================================
from rest_framework import serializers

from api.models import LongRunningJob
from api.serializers.simple import SimpleUserSerializer


class LongRunningJobSerializer(serializers.ModelSerializer):
    job_type_str = serializers.SerializerMethodField()
    started_by = SimpleUserSerializer(read_only=True)

    class Meta:
        model = LongRunningJob
        fields = (
            "job_id",
            "queued_at",
            "finished",
            "finished_at",
            "started_at",
            "failed",
            "job_type_str",
            "job_type",
            "started_by",
            "progress_current",
            "progress_target",
            "progress_step",
            "result",
            "id",
        )

    def get_job_type_str(self, obj) -> str:
        return dict(LongRunningJob.JOB_TYPES)[obj.job_type]


================================================
FILE: api/serializers/person.py
================================================
from django.db.models import Q
from rest_framework import serializers

from api.models import Person, Photo
from api.serializers.photos import GroupedPhotosSerializer
from api.serializers.PhotosGroupedByDate import get_photos_ordered_by_date
from api.util import logger


class GroupedPersonPhotosSerializer(serializers.ModelSerializer):
    id = serializers.SerializerMethodField()
    grouped_photos = serializers.SerializerMethodField()

    class Meta:
        model = Person
        fields = (
            "id",
            "name",
            "grouped_photos",
        )

    def get_id(self, obj) -> str:
        return str(obj.id)

    def get_grouped_photos(self, obj) -> GroupedPhotosSerializer(many=True):
        user = None
        request = self.context.get("request")
        if request and hasattr(request, "user"):
            user = request.user
        grouped_photos = get_photos_ordered_by_date(obj.get_photos(user))
        res = GroupedPhotosSerializer(grouped_photos, many=True).data
        return res


class PersonSerializer(serializers.ModelSerializer):
    face_url = serializers.SerializerMethodField()
    face_photo_url = serializers.SerializerMethodField()
    video = serializers.SerializerMethodField()
    newPersonName = serializers.CharField(max_length=100, default="", write_only=True)
    cover_photo = serializers.CharField(max_length=100, default="", write_only=True)

    class Meta:
        model = Person
        fields = (
            "name",
            "face_url",
            "face_count",
            "face_photo_url",
            "video",
            "id",
            "newPersonName",
            "cover_photo",
        )

    def get_face_url(self, obj) -> str:
        if obj.cover_face:
            return "/media/" + obj.cover_face.image.name
        if obj.faces.count() == 0:
            return ""
        return "/media/" + obj.faces.first().image.name

    def get_face_photo_url(self, obj) -> str:
        if obj.cover_photo:
            return obj.cover_photo.image_hash
        if obj.faces.count() == 0:
            return ""
        return obj.faces.first().photo.image_hash

    def get_video(self, obj) -> str:
        if obj.cover_photo:
            return obj.cover_photo.video
        if obj.faces.count() == 0:
            return "False"
        return obj.faces.first().photo.video

    def create(self, validated_data):
        name = validated_data.pop("name")
        if len(name.strip()) == 0:
            raise serializers.ValidationError("Name cannot be empty")
        qs = Person.objects.filter(name=name)
        if qs.count() > 0:
            return qs[0]
        else:
            new_person = Person()
            new_person.name = name
            new_person.save()
            logger.info(f"created person {new_person.id}")
            return new_person

    def update(self, instance, validated_data):
        if "newPersonName" in validated_data.keys():
            new_name = validated_data.pop("newPersonName")
            instance.name = new_name
            instance.save()
            return instance
        if "cover_photo" in validated_data.keys():
            image_hash = validated_data.pop("cover_photo")
            photo = Photo.objects.filter(image_hash=image_hash).first()
            instance.cover_photo = photo
            instance.cover_face = photo.faces.filter(person__name=instance.name).first()
            instance.save()
            return instance
        return instance

    def delete(self, validated_data, id):
        person = Person.objects.filter(id=id).get()
        person.delete()


class AlbumPersonListSerializer(serializers.ModelSerializer):
    photo_count = serializers.SerializerMethodField()
    cover_photo_url = serializers.SerializerMethodField()

    class Meta:
        model = Person
        fields = (
            "name",
            "photo_count",
            "cover_photo_url",
            "id",
        )

    def get_photo_count(self, obj) -> int:
        return obj.filter(Q(person__is_null=False)).faces.count()

    def get_cover_photo_url(self, obj) -> str:
        first_face = obj.faces.filter(Q(person__is_null=False)).first()
        if first_face:
            return first_face.photo.thumbnail.square_thumbnail.url
        else:
            return None

    def get_face_photo_url(self, obj) -> str:
        first_face = obj.faces.filter(Q(person__is_null=False)).first()
        if first_face:
            return first_face.photo.image.url
        else:
            return None


================================================
FILE: api/serializers/photo_metadata.py
================================================
"""
Serializers for PhotoMetadata, MetadataFile, and MetadataEdit models.

These serializers provide:
- Structured metadata access (replacing exif_json blob)
- Edit history tracking
- Backwards-compatible field names for existing API consumers
"""

from rest_framework import serializers

from api.models import Photo
from api.models.photo_metadata import MetadataEdit, MetadataFile, PhotoMetadata


class MetadataFileSerializer(serializers.ModelSerializer):
    """Serializer for XMP sidecars and other metadata files."""

    class Meta:
        model = MetadataFile
        fields = (
            "id",
            "file_type",
            "source",
            "priority",
            "creator_software",
            "created_at",
            "updated_at",
        )
        read_only_fields = ("id", "created_at", "updated_at")


class MetadataEditSerializer(serializers.ModelSerializer):
    """Serializer for metadata edit history."""

    user_name = serializers.SerializerMethodField()

    class Meta:
        model = MetadataEdit
        fields = (
            "id",
            "field_name",
            "old_value",
            "new_value",
            "user",
            "user_name",
            "synced_to_file",
            "synced_at",
            "created_at",
        )
        read_only_fields = fields

    def get_user_name(self, obj) -> str:
        if obj.user:
            return obj.user.username
        return "Unknown"


class PhotoMetadataSerializer(serializers.ModelSerializer):
    """
    Full metadata serializer with all structured fields.
    
    Used for the detailed metadata view and editing.
    """

    # Computed properties
    resolution = serializers.ReadOnlyField()
    megapixels = serializers.ReadOnlyField()
    has_location = serializers.ReadOnlyField()
    camera_display = serializers.ReadOnlyField()
    lens_display = serializers.ReadOnlyField()

    # Related data
    edit_history = serializers.SerializerMethodField()
    sidecar_files = serializers.SerializerMethodField()

    class Meta:
        model = PhotoMetadata
        fields = (
            "id",
            # Camera settings
            "aperture",
            "shutter_speed",
            "shutter_speed_seconds",
            "iso",
            "focal_length",
            "focal_length_35mm",
            "exposure_compensation",
            "flash_fired",
            "metering_mode",
            "white_balance",
            # Camera/lens info
            "camera_make",
            "camera_model",
            "lens_make",
            "lens_model",
            "serial_number",
            "camera_display",
            "lens_display",
            # Image properties
            "width",
            "height",
            "orientation",
            "color_space",
            "bit_depth",
            "resolution",
            "megapixels",
            # Timestamps
            "date_taken",
            "date_taken_subsec",
            "date_modified",
            "timezone_offset",
            # Location
            "gps_latitude",
            "gps_longitude",
            "gps_altitude",
            "location_country",
            "location_state",
            "location_city",
            "location_address",
            "has_location",
            # Content
            "title",
            "caption",
            "keywords",
            "rating",
            "copyright",
            "creator",
            # Tracking
            "source",
            "version",
            "created_at",
            "updated_at",
            # Related
            "edit_history",
            "sidecar_files",
        )
        read_only_fields = (
            "id",
            "resolution",
            "megapixels",
            "has_location",
            "camera_display",
            "lens_display",
            "version",
            "created_at",
            "updated_at",
        )

    def get_edit_history(self, obj) -> list:
        """Get recent edit history for this photo."""
        edits = MetadataEdit.objects.filter(photo=obj.photo).order_by("-created_at")[:10]
        return MetadataEditSerializer(edits, many=True).data

    def get_sidecar_files(self, obj) -> list:
        """Get sidecar files for this photo."""
        files = MetadataFile.objects.filter(photo=obj.photo)
        return MetadataFileSerializer(files, many=True).data


class PhotoMetadataUpdateSerializer(serializers.ModelSerializer):
    """
    Serializer for updating metadata with change tracking.
    
    Only allows editing specific fields and automatically
    creates MetadataEdit records for history.
    """

    class Meta:
        model = PhotoMetadata
        fields = (
            # Editable fields
            "title",
            "caption",
            "keywords",
            "rating",
            "copyright",
            "creator",
            # Location (can be user-corrected)
            "gps_latitude",
            "gps_longitude",
            "location_country",
            "location_state",
            "location_city",
            "location_address",
            # Timestamp (can be user-corrected)
            "date_taken",
            "timezone_offset",
        )

    def update(self, instance, validated_data):
        """Update metadata and create edit history records."""
        user = self.context.get("request").user if self.context.get("request") else None
        
        for field_name, new_value in validated_data.items():
            old_value = getattr(instance, field_name)
            
            # Only track actual changes
            if old_value != new_value:
                # Create edit history record
                MetadataEdit.objects.create(
                    photo=instance.photo,
                    user=user,
                    field_name=field_name,
                    old_value=old_value,
                    new_value=new_value,
                )
                
                # Update the field
                setattr(instance, field_name, new_value)
        
        # Update source to user_edit and increment version
        instance.source = PhotoMetadata.Source.USER_EDIT
        instance.version += 1
        instance.save()
        
        return instance


class PhotoMetadataSummarySerializer(serializers.Serializer):
    """
    Lightweight metadata summary for photo lists.

    Returns key metadata fields without the full detail.
    """

    # Camera info
    camera_display = serializers.CharField(allow_null=True)
    lens_display = serializers.CharField(allow_null=True)
    # Capture settings
    aperture = serializers.FloatField(allow_null=True)
    shutter_speed = serializers.CharField(allow_null=True)
    iso = serializers.IntegerField(allow_null=True)
    focal_length = serializers.FloatField(allow_null=True)
    focal_length_35mm = serializers.IntegerField(allow_null=True)
    # Image info
    resolution = serializers.CharField(allow_null=True)
    megapixels = serializers.FloatField(allow_null=True)
    # Date/location
    date_taken = serializers.DateTimeField(allow_null=True)
    has_location = serializers.BooleanField()
    # Content
    rating = serializers.IntegerField(allow_null=True)
    # Edit tracking
    source = serializers.CharField()
    version = serializers.IntegerField()
    has_edits = serializers.SerializerMethodField()

    def get_has_edits(self, obj) -> bool:
        """Check if this photo has any metadata edits."""
        return MetadataEdit.objects.filter(photo=obj.photo).exists()


def get_backwards_compatible_metadata(photo: Photo) -> dict:
    """
    Generate backwards-compatible metadata dict from PhotoMetadata.
    
    This function returns metadata in the same format as the original
    Photo model fields for API backwards compatibility.
    
    Note: Metadata fields have been fully migrated to PhotoMetadata model.
    If no PhotoMetadata exists, return None/empty values.
    """
    try:
        metadata = photo.metadata
        return {
            "camera": metadata.camera_display,
            "lens": metadata.lens_display,
            "fstop": metadata.aperture,
            "focal_length": metadata.focal_length,
            "iso": metadata.iso,
            "shutter_speed": metadata.shutter_speed,
            "width": metadata.width,
            "height": metadata.height,
            "focalLength35Equivalent": metadata.focal_length_35mm,
            "digitalZoomRatio": None,  # Not stored in PhotoMetadata
            "subjectDistance": None,   # Not stored in PhotoMetadata
        }
    except PhotoMetadata.DoesNotExist:
        # No PhotoMetadata exists - return None/empty values
        # Metadata will be populated on next photo scan
        return {
            "camera": None,
            "lens": None,
            "fstop": None,
            "focal_length": None,
            "iso": None,
            "shutter_speed": None,
            "width": 0,
            "height": 0,
            "focalLength35Equivalent": None,
            "digitalZoomRatio": None,
            "subjectDistance": None,
        }


================================================
FILE: api/serializers/photos.py
================================================
import json

from rest_framework import serializers

from api.geocode.geocode import reverse_geocode
from api.geocode import GEOCODE_VERSION
from api import util

from api.image_similarity import search_similar_image
from api.models import AlbumDate, File, Photo
from api.models.photo_metadata import PhotoMetadata
from api.serializers.photo_metadata import PhotoMetadataSummarySerializer
from api.serializers.simple import SimpleUserSerializer


class PhotoSummarySerializer(serializers.ModelSerializer):
    # UUID primary key
    id = serializers.UUIDField(read_only=True)
    # Content hash for deduplication/caching (legacy 'id' field for backwards compatibility)
    image_hash = serializers.CharField(read_only=True)
    dominantColor = serializers.SerializerMethodField()
    aspectRatio = serializers.SerializerMethodField()
    url = serializers.SerializerMethodField()
    location = serializers.SerializerMethodField()
    date = serializers.SerializerMethodField()
    birthTime = serializers.SerializerMethodField()
    video_length = serializers.SerializerMethodField()
    type = serializers.SerializerMethodField()
    owner = SimpleUserSerializer()
    # Stack information (can be multiple stacks)
    stacks = serializers.SerializerMethodField()
    # Flag indicating if this photo has a RAW file variant (PhotoPrism-like model)
    has_raw_variant = serializers.SerializerMethodField()

    class Meta:
        model = Photo
        fields = (
            "id",
            "image_hash",
            "dominantColor",
            "url",
            "location",
            "date",
            "birthTime",
            "aspectRatio",
            "type",
            "video_length",
            "rating",
            "owner",
            "exif_gps_lat",
            "exif_gps_lon",
            "removed",
            "in_trashcan",
            "stacks",
            "has_raw_variant",
        )

    # TODO: Rename this field to aspect_ratio
    def get_aspectRatio(self, obj) -> float:
        return obj.thumbnail.aspect_ratio

    # TODO: Remove this field in the future (kept for backwards compatibility)
    def get_url(self, obj) -> str:
        return obj.image_hash

    def get_location(self, obj) -> str:
        if (
            hasattr(obj, "search_instance")
            and obj.search_instance
            and obj.search_instance.search_location
        ):
            return obj.search_instance.search_location
        else:
            return ""

    def get_date(self, obj) -> str:
        if obj.exif_timestamp:
            return obj.exif_timestamp.isoformat()
        else:
            return ""

    def get_video_length(self, obj) -> int:
        if obj.video_length:
            return obj.video_length
        else:
            return ""

    # TODO: Remove this field in the future
    def get_birthTime(self, obj) -> str:
        if obj.exif_timestamp:
            return obj.exif_timestamp
        else:
            return ""

    def get_dominantColor(self, obj) -> str:
        if obj.thumbnail.dominant_color:
            dominant_color = obj.thumbnail.dominant_color[1:-1]
            return "#%02x%02x%02x" % tuple(map(int, dominant_color.split(", ")))
        else:
            return ""

    def get_type(self, obj) -> str:
        if obj.video:
            return "video"
        # Use len() instead of .count() to leverage prefetched embedded_media
        if obj.main_file and len(obj.main_file.embedded_media.all()) > 0:
            return "motion_photo"
        return "image"

    def get_stacks(self, obj) -> list | None:
        """Return stack info if photo is part of any stacks.

        Uses prefetched stacks data when available (from AlbumDateViewSet)
        to avoid N+1 queries. The prefetch filters by valid stack types and
        annotates photo_count_annotation so no extra queries are needed.
        """
        # Use the prefetch cache (obj.stacks.all() won't re-query if prefetched)
        stacks = obj.stacks.all()
        if not stacks:
            return None

        from api.models.photo_stack import PhotoStack
        valid_stack_types = set(PhotoStack.VALID_STACK_TYPES + [
            PhotoStack.StackType.RAW_JPEG_PAIR,
            PhotoStack.StackType.LIVE_PHOTO,
        ])

        result = []
        for stack in stacks:
            # If stacks were prefetched with the type filter, all results are valid.
            # If not prefetched (called from another serializer context), filter in Python.
            if stack.stack_type not in valid_stack_types:
                continue
            is_primary = stack.primary_photo_id == obj.pk if stack.primary_photo_id else False
            # Use annotated count if available, otherwise fall back to DB query
            photo_count = getattr(stack, "photo_count_annotation", None)
            if photo_count is None:
                photo_count = stack.photos.count()
            result.append({
                "id": str(stack.id),
                "type": stack.stack_type,
                "photo_count": photo_count,
                "is_primary": is_primary,
            })

        return result or None

    def get_has_raw_variant(self, obj) -> bool:
        """Check if this photo has a RAW file variant.

        Uses prefetched files when available to avoid N+1 queries.
        Returns True if any of the photo's files is a RAW file type.
        """
        # Use prefetch cache if available (iterate in Python), otherwise query DB
        # File.RAW_FILE = 4
        if "files" in getattr(obj, "_prefetched_objects_cache", {}):
            return any(f.type == 4 for f in obj.files.all())
        return obj.files.filter(type=4).exists()


class GroupedPhotosSerializer(serializers.ModelSerializer):
    items = serializers.SerializerMethodField()
    date = serializers.SerializerMethodField()
    location = serializers.SerializerMethodField()

    class Meta:
        model = Photo
        fields = ("date", "location", "items")

    def get_date(self, obj) -> str:
        return obj.date

    def get_location(self, obj) -> str:
        return obj.location

    def get_items(self, obj) -> PhotoSummarySerializer(many=True):
        return PhotoSummarySerializer(obj.photos, many=True).data


class PhotoEditSerializer(serializers.ModelSerializer):
    class Meta:
        model = Photo
        fields = (
            "image_hash",
            "hidden",
            "rating",
            "in_trashcan",
            "removed",
            "video",
            "exif_timestamp",
            "timestamp",
            # Allow updating GPS location
            "exif_gps_lat",
            "exif_gps_lon",
        )

    def update(self, instance, validated_data):
        # photo can only update the following
        if "exif_timestamp" in validated_data:
            instance.timestamp = validated_data.pop("exif_timestamp")
            instance.save()
            instance._extract_date_time_from_exif()

        # Update GPS location if provided
        lat = validated_data.pop("exif_gps_lat", None)
        lon = validated_data.pop("exif_gps_lon", None)

        if lat is not None and lon is not None:
            try:
                # Track old places to update album place relations
                old_album_places = instance._find_album_place()

                instance.exif_gps_lat = float(lat)
                instance.exif_gps_lon = float(lon)
                instance.save()

                # Reverse geocode and update geolocation/search location
                geocode_result = reverse_geocode(
                    instance.exif_gps_lat, instance.exif_gps_lon
                )
                if geocode_result:
                    geocode_result["_v"] = GEOCODE_VERSION
                    instance.geolocation_json = geocode_result

                    # Update search location through PhotoSearch model
                    from api.models.photo_search import PhotoSearch

                    search_instance, _created = PhotoSearch.objects.get_or_create(
                        photo=instance
                    )
                    search_instance.update_search_location(geocode_result)
                    search_instance.save()

                    # Update album place relations
                    if old_album_places is not None:
                        for old_album_place in old_album_places:
                            old_album_place.photos.remove(instance)
                            old_album_place.save()

                    if "features" in geocode_result:
                        for geolocation_level, feature in enumerate(
                            geocode_result["features"]
                        ):
                            if (
                                "text" not in feature.keys()
                                or str(feature["text"]).isnumeric()
                            ):
                                continue
                            album_place = api.models.album_place.get_album_place(
                                feature["text"], owner=instance.owner
                            )
                            if (
                                album_place.photos.filter(
                                    image_hash=instance.image_hash
                                ).count()
                                == 0
                            ):
                                album_place.geolocation_level = (
                                    len(geocode_result["features"]) - geolocation_level
                                )
                            album_place.photos.add(instance)
                            album_place.save()

                    instance.save()
                else:
                    util.logger.warning(
                        "Reverse geocoding returned no result for provided coordinates"
                    )
            except Exception as e:
                util.logger.warning(e)
                util.logger.warning("Failed to update GPS location for photo")
        return instance


class PhotoHashListSerializer(serializers.ModelSerializer):
    class Meta:
        model = Photo
        fields = ("image_hash", "video")


class PhotoDetailsSummarySerializer(serializers.ModelSerializer):
    photo_summary = serializers.SerializerMethodField()
    album_date_id = serializers.SerializerMethodField()
    processing = serializers.SerializerMethodField()

    class Meta:
        model = Photo
        fields = ("photo_summary", "album_date_id", "processing")

    def get_photo_summary(self, obj) -> PhotoSummarySerializer:
        return PhotoSummarySerializer(obj.get()).data

    def get_processing(self, obj) -> bool:
        return obj.get().thumbnail.aspect_ratio is None

    def get_album_date_id(self, obj) -> int:
        return (
            AlbumDate.objects.filter(photos__in=obj)
            .values_list("id", flat=True)
            .first()
        )


class PhotoSerializer(serializers.ModelSerializer):
    square_thumbnail_url = serializers.SerializerMethodField()
    big_thumbnail_url = serializers.SerializerMethodField()
    small_square_thumbnail_url = serializers.SerializerMethodField()
    similar_photos = serializers.SerializerMethodField()
    captions_json = serializers.SerializerMethodField()
    search_captions = serializers.SerializerMethodField()
    search_location = serializers.SerializerMethodField()
    people = serializers.SerializerMethodField()
    shared_to = serializers.PrimaryKeyRelatedField(many=True, read_only=True)
    image_path = serializers.SerializerMethodField()
    owner = SimpleUserSerializer(many=False, read_only=True)
    embedded_media = serializers.SerializerMethodField()
    # File variants (RAW, JPEG, video for Live Photos, etc.)
    # PhotoPrism-like model where one Photo can have multiple file variants
    file_variants = serializers.SerializerMethodField()
    # Stack information (bursts, brackets, manual stacks) - can be multiple
    stacks = serializers.SerializerMethodField()
    # Structured metadata with edit history support
    metadata = serializers.SerializerMethodField()
    
    # Backwards-compatible fields from PhotoMetadata (for API compatibility)
    height = serializers.SerializerMethodField()
    width = serializers.SerializerMethodField()
    focal_length = serializers.SerializerMethodField()
    fstop = serializers.SerializerMethodField()
    iso = serializers.SerializerMethodField()
    shutter_speed = serializers.SerializerMethodField()
    lens = serializers.SerializerMethodField()
    camera = serializers.SerializerMethodField()
    focalLength35Equivalent = serializers.SerializerMethodField()
    digitalZoomRatio = serializers.SerializerMethodField()
    subjectDistance = serializers.SerializerMethodField()

    class Meta:
        model = Photo
        fields = (
            "id",
            "exif_gps_lat",
            "exif_gps_lon",
            "exif_timestamp",
            "captions_json",
            "search_captions",
            "search_location",
            "big_thumbnail_url",
            "square_thumbnail_url",
            "small_square_thumbnail_url",
            "geolocation_json",
            "exif_json",
            "people",
            "image_hash",
            "image_path",
            "rating",
            "hidden",
            "public",
            "removed",
            "in_trashcan",
            "shared_to",
            "similar_photos",
            "video",
            "owner",
            "size",
            "height",
            "width",
            "focal_length",
            "fstop",
            "iso",
            "shutter_speed",
            "lens",
            "camera",
            "focalLength35Equivalent",
            "digitalZoomRatio",
            "subjectDistance",
            "embedded_media",
            "file_variants",
            "stacks",
            "metadata",
        )
    
    def _get_metadata(self, obj) -> PhotoMetadata | None:
        """Helper to get PhotoMetadata, with caching."""
        if not hasattr(obj, '_cached_metadata'):
            try:
                obj._cached_metadata = obj.metadata
            except PhotoMetadata.DoesNotExist:
                obj._cached_metadata = None
        return obj._cached_metadata
    
    def get_height(self, obj) -> int:
        metadata = self._get_metadata(obj)
        return metadata.height if metadata else 0
    
    def get_width(self, obj) -> int:
        metadata = self._get_metadata(obj)
        return metadata.width if metadata else 0
    
    def get_focal_length(self, obj) -> float | None:
        metadata = self._get_metadata(obj)
        return metadata.focal_length if metadata else None
    
    def get_fstop(self, obj) -> float | None:
        metadata = self._get_metadata(obj)
        return metadata.aperture if metadata else None
    
    def get_iso(self, obj) -> int | None:
        metadata = self._get_metadata(obj)
        return metadata.iso if metadata else None
    
    def get_shutter_speed(self, obj) -> str | None:
        metadata = self._get_metadata(obj)
        return metadata.shutter_speed if metadata else None
    
    def get_lens(self, obj) -> str | None:
        metadata = self._get_metadata(obj)
        return metadata.lens_display if metadata else None
    
    def get_camera(self, obj) -> str | None:
        metadata = self._get_metadata(obj)
        return metadata.camera_display if metadata else None
    
    def get_focalLength35Equivalent(self, obj) -> int | None:
        metadata = self._get_metadata(obj)
        return metadata.focal_length_35mm if metadata else None
    
    def get_digitalZoomRatio(self, obj) -> float | None:
        # Not stored in PhotoMetadata (rarely used field)
        return None
    
    def get_subjectDistance(self, obj) -> float | None:
        # Not stored in PhotoMetadata (rarely used field)
        return None

    def get_similar_photos(self, obj) -> list:
        res = search_similar_image(obj.owner, obj, threshold=90)
        arr = []
        if len(res) > 0:
            [arr.append(e) for e in res["result"]]
            photos = Photo.objects.filter(image_hash__in=arr).all()
            res = []
            for photo in photos:
                type = "image"
                if photo.video:
                    type = "video"
                res.append({"image_hash": photo.image_hash, "type": type})
            return res
        else:
            return []

    def get_captions_json(self, obj) -> dict:
        if (
            hasattr(obj, "caption_instance")
            and obj.caption_instance
            and obj.caption_instance.captions_json
            and len(obj.caption_instance.captions_json) > 0
        ):
            return obj.caption_instance.captions_json
        else:
            emptyArray = {
                "im2txt": "",
                "places365": {"attributes": [], "categories": [], "environment": []},
            }
            return emptyArray

    def get_search_captions(self, obj) -> str:
        if hasattr(obj, "search_instance") and obj.search_instance:
            return obj.search_instance.search_captions or ""
        return ""

    def get_search_location(self, obj) -> str:
        if hasattr(obj, "search_instance") and obj.search_instance:
            return obj.search_instance.search_location or ""
        return ""

    def get_image_path(self, obj) -> list[str]:
        try:
            paths = []
            for file in obj.files.all():
                paths.append(file.path)
            return paths
        except Exception:
            return ["Missing"]

    def get_square_thumbnail_url(self, obj) -> str:
        return (
            obj.thumbnail.square_thumbnail.url if obj.thumbnail.square_thumbnail else ""
        )

    def get_small_square_thumbnail_url(self, obj) -> str:
        return (
            obj.thumbnail.square_thumbnail_small.url
            if obj.thumbnail.square_thumbnail_small
            else ""
        )

    def get_big_thumbnail_url(self, obj) -> str:
        return obj.thumbnail.thumbnail_big.url if obj.thumbnail.thumbnail_big else ""

    def get_geolocation(self, obj) -> dict:
        if obj.geolocation_json:
            return json.loads(obj.geolocation_json)
        else:
            return None

    def get_people(self, obj) -> list:
        return [
            {
                "name": (
                    f.person.name
                    if f.person
                    else (
                        f.cluster_person.name
                        if f.cluster_person
                        else (
                            f.classification_person.name
                            if f.classification_person
                            else ""
                        )
                    )
                ),
                "type": (
                    "user"
                    if f.person
                    else (
                        "cluster"
                        if f.cluster_person
                        else ("classification" if f.classification_person else "")
                    )
                ),
                "probability": (
                    1
                    if f.person
                    else (
                        f.cluster_probability
                        if f.cluster_person
                        else (
                            f.classification_probability
                            if f.classification_person
                            else 0
                        )
                    )
                ),
                "location": {
                    "top": f.location_top,
                    "bottom": f.location_bottom,
                    "left": f.location_left,
                    "right": f.location_right,
                },
                "face_url": f.image.url,
                "face_id": f.id,
            }
            for f in obj.faces.all()
        ]

    def get_embedded_media(self, obj: Photo) -> list[dict]:
        def serialize_file(file):
            return {
                "id": file.hash,
                "type": "video" if file.type == File.VIDEO else "image",
            }

        if obj.main_file is None:
            return []
        embedded_media = obj.main_file.embedded_media.all()
        if len(embedded_media) == 0:
            return []
        return list(
            map(
                serialize_file, embedded_media.filter(type__in=[File.VIDEO, File.IMAGE])
            )
        )

    def get_metadata(self, obj: Photo) -> dict | None:
        """
        Return structured metadata from PhotoMetadata if available.
        
        This provides:
        - Normalized field names (aperture, iso, shutter_speed, etc.)
        - Computed display strings (camera_display, lens_display)
        - Resolution and megapixel info
        - Edit tracking (version, source, has_edits)
        
        Falls back to None if PhotoMetadata doesn't exist (backwards compatible).
        """
        try:
            metadata = obj.metadata
            return PhotoMetadataSummarySerializer(metadata).data
        except PhotoMetadata.DoesNotExist:
            return None

    def get_file_variants(self, obj: Photo) -> list | None:
        """Return file variants for this photo (RAW, JPEG, video for Live Photos, etc.).
        
        This implements the PhotoPrism-like model where one Photo can have multiple
        file variants representing the same capture moment.
        """
        from api.models.file import File
        
        files = obj.files.all()
        if files.count() <= 1:
            # Only main file, no additional variants
            return None
        
        variants = []
        for f in files:
            # Determine file type label
            file_type_map = {
                File.IMAGE: "image",
                File.VIDEO: "video",
                File.RAW_FILE: "raw",
                File.METADATA_FILE: "metadata",
                File.UNKNOWN: "unknown",
            }
            file_type = file_type_map.get(f.type, "unknown")
            
            # Check if this is the main file
            is_main = obj.main_file_id == f.hash if obj.main_file_id else False
            
            variants.append({
                "hash": f.hash,
                "path": f.path,
                "type": file_type,
                "type_id": f.type,
                "is_main": is_main,
                "filename": f.path.split("/")[-1] if f.path else None,
            })
        
        return variants

    def get_stacks(self, obj: Photo) -> list | None:
        """Return detailed stack info for photo detail view (supports multiple stacks)."""
        from api.models.photo_stack import PhotoStack
        # Use model-defined valid stack types, plus deprecated types for backwards compatibility
        valid_stack_types = PhotoStack.VALID_STACK_TYPES + [
            PhotoStack.StackType.RAW_JPEG_PAIR,
            PhotoStack.StackType.LIVE_PHOTO,
        ]
        stacks = obj.stacks.filter(stack_type__in=valid_stack_types)
        if not stacks.exists():
            return None
        
        result = []
        for stack in stacks:
            is_primary = stack.primary_photo_id == obj.pk if stack.primary_photo_id else False
            
            # Get all photos in the stack for the detail view
            stack_photos = []
            for photo in stack.photos.select_related("thumbnail").all():
                # Get width/height from PhotoMetadata
                try:
                    photo_metadata = photo.metadata
                    photo_width = photo_metadata.width or 0
                    photo_height = photo_metadata.height or 0
                except PhotoMetadata.DoesNotExist:
                    photo_width = 0
                    photo_height = 0
                
                stack_photos.append({
                    "id": str(photo.id),
                    "image_hash": photo.image_hash,
                    "is_primary": photo.pk == stack.primary_photo_id,
                    "thumbnail_url": (
                        f"/media/square_thumbnails_small/{photo.image_hash}"
                        if hasattr(photo, "thumbnail") and photo.thumbnail and photo.thumbnail.square_thumbnail_small 
                        else None
                    ),
                    "size": photo.size,
                    "width": photo_width,
                    "height": photo_height,
                })
            
            result.append({
                "id": str(stack.id),
                "type": stack.stack_type,
                "type_display": stack.get_stack_type_display(),
                "photo_count": len(stack_photos),
                "is_primary": is_primary,
                "photos": stack_photos,
            })
        
        return result


class SharedFromMePhotoThroughSerializer(serializers.ModelSerializer):
    photo = serializers.SerializerMethodField()
    user = SimpleUserSerializer(many=False, read_only=True)

    class Meta:
        model = Photo.shared_to.through
        fields = ("user_id", "user", "photo")

    def get_photo(self, obj) -> PhotoSummarySerializer:
        return PhotoSummarySerializer(obj.photo).data


class PublicPhotoDetailSerializer(serializers.ModelSerializer):
    """Serializer for photo details in public albums.
    
    Conditionally includes metadata based on sharing settings passed in context.
    Context must include 'sharing_settings' dict with keys:
    - share_location: bool
    - share_camera_info: bool
    - share_timestamps: bool
    - share_captions: bool
    - share_faces: bool
    """
    
    # Always included
    square_thumbnail_url = serializers.SerializerMethodField()
    big_thumbnail_url = serializers.SerializerMethodField()
    small_square_thumbnail_url = serializers.SerializerMethodField()
    video = serializers.BooleanField(read_only=True)
    image_hash = serializers.CharField(read_only=True)
    
    # Conditionally included based on sharing settings
    exif_timestamp = serializers.SerializerMethodField()
    exif_gps_lat = serializers.SerializerMethodField()
    exif_gps_lon = serializers.SerializerMethodField()
    geolocation_json = serializers.SerializerMethodField()
    search_location = serializers.SerializerMethodField()
    
    # Camera info
    camera = serializers.SerializerMethodField()
    lens = serializers.SerializerMethodField()
    focal_length = serializers.SerializerMethodField()
    fstop = serializers.SerializerMethodField()
    iso = serializers.SerializerMethodField()
    shutter_speed = serializers.SerializerMethodField()
    width = serializers.SerializerMethodField()
    height = serializers.SerializerMethodField()
    
    # Captions
    search_captions = serializers.SerializerMethodField()
    captions_json = serializers.SerializerMethodField()
    
    # People/faces
    people = serializers.SerializerMethodField()

    class Meta:
        model = Photo
        fields = (
            "image_hash",
            "video",
            "square_thumbnail_url",
            "big_thumbnail_url",
            "small_square_thumbnail_url",
            "exif_timestamp",
            "exif_gps_lat",
            "exif_gps_lon",
            "geolocation_json",
            "search_location",
            "camera",
            "lens",
            "focal_length",
            "fstop",
            "iso",
            "shutter_speed",
            "width",
            "height",
            "search_captions",
            "captions_json",
            "people",
        )

    def _get_sharing_settings(self) -> dict:
        """Get sharing settings from context."""
        return self.context.get('sharing_settings', {})
    
    def _get_metadata(self, obj) -> PhotoMetadata | None:
        """Helper to get PhotoMetadata."""
        if not hasattr(obj, '_cached_metadata'):
            try:
                obj._cached_metadata = obj.metadata
            except PhotoMetadata.DoesNotExist:
                obj._cached_metadata = None
        return obj._cached_metadata

    # Always available
    def get_square_thumbnail_url(self, obj) -> str:
        return obj.thumbnail.square_thumbnail.url if obj.thumbnail and obj.thumbnail.square_thumbnail else ""

    def get_small_square_thumbnail_url(self, obj) -> str:
        return obj.thumbnail.square_thumbnail_small.url if obj.thumbnail and obj.thumbnail.square_thumbnail_small else ""

    def get_big_thumbnail_url(self, obj) -> str:
        return obj.thumbnail.thumbnail_big.url if obj.thumbnail and obj.thumbnail.thumbnail_big else ""

    # Timestamp - conditional
    def get_exif_timestamp(self, obj):
        if self._get_sharing_settings().get('share_timestamps', False):
            return obj.exif_timestamp
        return None

    # Location - conditional
    def get_exif_gps_lat(self, obj):
        if self._get_sharing_settings().get('share_location', False):
            return obj.exif_gps_lat
        return None

    def get_exif_gps_lon(self, obj):
        if self._get_sharing_settings().get('share_location', False):
            return obj.exif_gps_lon
        return None

    def get_geolocation_json(self, obj):
        if self._get_sharing_settings().get('share_location', False):
            return obj.geolocation_json
        return None

    def get_search_location(self, obj) -> str:
        if self._get_sharing_settings().get('share_location', False):
            if hasattr(obj, "search_instance") and obj.search_instance:
                return obj.search_instance.search_location or ""
        return ""

    # Camera info - conditional
    def get_camera(self, obj) -> str | None:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.camera_display if metadata else None
        return None

    def get_lens(self, obj) -> str | None:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.lens_display if metadata else None
        return None

    def get_focal_length(self, obj) -> float | None:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.focal_length if metadata else None
        return None

    def get_fstop(self, obj) -> float | None:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.aperture if metadata else None
        return None

    def get_iso(self, obj) -> int | None:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.iso if metadata else None
        return None

    def get_shutter_speed(self, obj) -> str | None:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.shutter_speed if metadata else None
        return None

    def get_width(self, obj) -> int:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.width if metadata else 0
        return 0

    def get_height(self, obj) -> int:
        if self._get_sharing_settings().get('share_camera_info', False):
            metadata = self._get_metadata(obj)
            return metadata.height if metadata else 0
        return 0

    # Captions - conditional
    def get_search_captions(self, obj) -> str:
        if self._get_sharing_settings().get('share_captions', False):
            if hasattr(obj, "search_instance") and obj.search_instance:
                return obj.search_instance.search_captions or ""
        return ""

    def get_captions_json(self, obj) -> dict:
        if self._get_sharing_settings().get('share_captions', False):
            if (
                hasattr(obj, "caption_instance")
                and obj.caption_instance
                and obj.caption_instance.captions_json
                and len(obj.caption_instance.captions_json) > 0
            ):
                return obj.caption_instance.captions_json
        return {"im2txt": "", "places365": {"attributes": [], "categories": [], "environment": []}}

    # People/faces - conditional
    def get_people(self, obj) -> list:
        if not self._get_sharing_settings().get('share_faces', False):
            return []
        
        return [
            {
                "name": (
                    f.person.name
                    if f.person
                    else (
                        f.cluster_person.name
                        if f.cluster_person
                        else "Unknown"
                    )
                ),
                "face_url": f.image.url if f.image else None,
                "face_id": f.id,
            }
            for f in obj.faces.all()
            if f.person or f.cluster_person
        ]


================================================
FILE: api/serializers/simple.py
================================================
from rest_framework import serializers

from api.models import Photo, User


class PhotoSuperSimpleSerializer(serializers.ModelSerializer):
    class Meta:
        model = Photo
        fields = ("image_hash", "rating", "hidden", "exif_timestamp", "public", "video")


class PhotoSimpleSerializer(serializers.ModelSerializer):
    square_thumbnail = serializers.SerializerMethodField()

    class Meta:
        model = Photo
        fields = (
            "square_thumbnail",
            "image_hash",
            "exif_timestamp",
            "exif_gps_lat",
            "exif_gps_lon",
            "rating",
            "geolocation_json",
            "public",
            "video",
        )

    def get_square_thumbnail(self, obj) -> str:
        return (
            obj.thumbnail.square_thumbnail.url
            if obj.thumbnail and obj.thumbnail.square_thumbnail
            else ""
        )


class SimpleUserSerializer(serializers.ModelSerializer):
    class Meta:
        model = User
        fields = (
            "id",
            "username",
            "first_name",
            "last_name",
        )


================================================
FILE: api/serializers/user.py
================================================
import os

from django.conf import settings
from django.contrib.auth import get_user_model
from django.db.models import Q
from django_q.tasks import Chain
from rest_framework import serializers
from rest_framework.exceptions import ValidationError

from api.batch_jobs import batch_calculate_clip_embedding
from api.ml_models import do_all_models_exist, download_models
from api.models import Photo, User
from api.serializers.simple import PhotoSuperSimpleSerializer
from api.util import is_valid_path, logger


class UserSerializer(serializers.ModelSerializer):
    public_photo_count = serializers.SerializerMethodField()
    public_photo_samples = serializers.SerializerMethodField()
    photo_count = serializers.SerializerMethodField()
    avatar_url = serializers.SerializerMethodField()

    class Meta:
        model = User
        extra_kwargs = {
            "password": {"write_only": True},
            "first_name": {"required": False},
            "last_name": {"required": False},
            "scan_directory": {"required": False},
            "confidence": {"required": False},
            "confidence_person": {"required": False},
            "semantic_search_topk": {"required": False},
            "nextcloud_server_address": {"required": False},
            "nextcloud_username": {"required": False},
            "nextcloud_scan_directory": {"required": False},
            "nextcloud_app_password": {"write_only": True},
            "favorite_min_rating": {"required": False},
            "save_metadata_to_disk": {"required": False},
            "save_face_tags_to_disk": {"required": False},
            "text_alignment": {"required": False},
            "header_size": {"required": False},
            "skip_raw_files": {"required": False},
            "stack_raw_jpeg": {"required": False},
            "slideshow_interval": {"required": False},
            "duplicate_sensitivity": {"required": False},
            "duplicate_clear_existing": {"required": False},
        }
        fields = (
            "id",
            "username",
            "email",
            "scan_directory",
            "confidence",
            "confidence_person",
            "transcode_videos",
            "semantic_search_topk",
            "first_name",
            "public_photo_samples",
            "last_name",
            "public_photo_count",
            "date_joined",
            "password",
            "avatar",
            "is_superuser",
            "photo_count",
            "nextcloud_server_address",
            "nextcloud_username",
            "nextcloud_app_password",
            "nextcloud_scan_directory",
            "avatar_url",
            "favorite_min_rating",
            "image_scale",
            "text_alignment",
            "header_size",
            "save_metadata_to_disk",
            "save_face_tags_to_disk",
            "datetime_rules",
            "burst_detection_rules",
            "llm_settings",
            "default_timezone",
            "public_sharing",
            "public_sharing_defaults",
            "face_recognition_model",
            "min_cluster_size",
            "confidence_unknown_face",
            "min_samples",
            "cluster_selection_epsilon",
            "skip_raw_files",
            "stack_raw_jpeg",
            "slideshow_interval",
            "duplicate_sensitivity",
            "duplicate_clear_existing",
        )

    def validate_nextcloud_app_password(self, value):
        return value

    def create(self, validated_data):
        if "scan_directory" in validated_data.keys():
            if (
                not self.context["request"].user.is_superuser
                or validated_data["scan_directory"] == "initial"
            ):
                validated_data.pop("scan_directory")
        # make sure username is always lowercase
        if "username" in validated_data.keys():
            validated_data["username"] = validated_data["username"].lower()
        if "is_superuser" in validated_data.keys():
            is_superuser = validated_data.pop("is_superuser")
            if is_superuser and self.context["request"].user.is_authenticated and self.context["request"].user.is_superuser:
                user = User.objects.create_superuser(**validated_data)
            else:
                user = User.objects.create_user(**validated_data)
        else:
            user = User.objects.create_user(**validated_data)
        logger.info(f"Created user {user.id}")
        return user

    def update(self, instance, validated_data):
        # user can only update the following
        if "password" in validated_data:
            password = validated_data.pop("password")
            if password != "" and not settings.DEMO_SITE:
                instance.set_password(password)
        if "avatar" in validated_data:
            instance.avatar = validated_data.pop("avatar")
            instance.save()
        if "email" in validated_data:
            instance.email = validated_data.pop("email")
            instance.save()
        if "first_name" in validated_data:
            instance.first_name = validated_data.pop("first_name")
            instance.save()
        if "last_name" in validated_data:
            instance.last_name = validated_data.pop("last_name")
            instance.save()
        if "transcode_videos" in validated_data:
            instance.transcode_videos = validated_data.pop("transcode_videos")
            instance.save()
        if "nextcloud_server_address" in validated_data:
            instance.nextcloud_server_address = validated_data.pop(
                "nextcloud_server_address"
            )
            instance.save()
        if "nextcloud_username" in validated_data:
            instance.nextcloud_username = validated_data.pop("nextcloud_username")
            instance.save()
        if "nextcloud_app_password" in validated_data:
            instance.nextcloud_app_password = validated_data.pop(
                "nextcloud_app_password"
            )
            instance.save()
        if "nextcloud_scan_directory" in validated_data:
            instance.nextcloud_scan_directory = validated_data.pop(
                "nextcloud_scan_directory"
            )
            instance.save()
        if "confidence" in validated_data:
            instance.confidence = validated_data.pop("confidence")
            instance.save()
            logger.info(f"Updated confidence for user {instance.confidence}")
        if "confidence_person" in validated_data:
            instance.confidence_person = validated_data.pop("confidence_person")
            instance.save()
            logger.info(
                f"Updated person album confidence for user {instance.confidence_person}"
            )
        if "semantic_search_topk" in validated_data:
            new_semantic_search_topk = validated_data.pop("semantic_search_topk")

            if instance.semantic_search_topk == 0 and new_semantic_search_topk > 0:
                chain = Chain()
                if not do_all_models_exist():
                    chain.append(download_models, User.objects.get(id=instance.id))
                chain.append(
                    batch_calculate_clip_embedding, User.objects.get(id=instance.id)
                )
                chain.run()

            instance.semantic_search_topk = new_semantic_search_topk
            instance.save()
            logger.info(
                f"Updated semantic_search_topk for user {instance.semantic_search_topk}"
            )
        if "favorite_min_rating" in validated_data:
            new_favorite_min_rating = validated_data.pop("favorite_min_rating")
            instance.favorite_min_rating = new_favorite_min_rating
            instance.save()
            logger.info(
                f"Updated favorite_min_rating for user {instance.favorite_min_rating}"
            )
        if "save_metadata_to_disk" in validated_data:
            instance.save_metadata_to_disk = validated_data.pop("save_metadata_to_disk")
            instance.save()
            logger.info(
                f"Updated save_metadata_to_disk for user {instance.save_metadata_to_disk}"
            )
        if "save_face_tags_to_disk" in validated_data:
            instance.save_face_tags_to_disk = validated_data.pop(
                "save_face_tags_to_disk"
            )
            instance.save()
            logger.info(
                f"Updated save_face_tags_to_disk to {instance.save_face_tags_to_disk} for user {instance.username}"
            )
        if "image_scale" in validated_data:
            new_image_scale = validated_data.pop("image_scale")
            instance.image_scale = new_image_scale
            instance.save()
            logger.info(f"Updated image_scale for user {instance.image_scale}")
        if "text_alignment" in validated_data:
            new_text_alignment = validated_data.pop("text_alignment")
            instance.text_alignment = new_text_alignment
            instance.save()
            logger.info(f"Updated text_alignment for user {instance.text_alignment}")
        if "header_size" in validated_data:
            new_header_size = validated_data.pop("header_size")
            instance.header_size = new_header_size
            instance.save()
            logger.info(f"Updated header_size for user {instance.header_size}")
        if "datetime_rules" in validated_data:
            new_datetime_rules = validated_data.pop("datetime_rules")
            instance.datetime_rules = new_datetime_rules
            instance.save()
            logger.info(f"Updated datetime_rules for user {instance.datetime_rules}")
        if "default_timezone" in validated_data:
            new_default_timezone = validated_data.pop("default_timezone")
            instance.default_timezone = new_default_timezone
            instance.save()
            logger.info(
                f"Updated default_timezone for user {instance.default_timezone}"
            )
        if "public_sharing" in validated_data:
            instance.public_sharing = validated_data.pop("public_sharing")
            instance.save()
        if "face_recognition_model" in validated_data:
            instance.face_recognition_model = validated_data.pop(
                "face_recognition_model"
            )
            instance.save()
        if "min_cluster_size" in validated_data:
            instance.min_cluster_size = validated_data.pop("min_cluster_size")
            instance.save()
        if "confidence_unknown_face" in validated_data:
            instance.confidence_unknown_face = validated_data.pop(
                "confidence_unknown_face"
            )
            instance.save()
        if "min_samples" in validated_data:
            instance.min_samples = validated_data.pop("min_samples")
            instance.save()
        if "cluster_selection_epsilon" in validated_data:
            instance.cluster_selection_epsilon = validated_data.pop(
                "cluster_selection_epsilon"
            )
            instance.save()
        if "llm_settings" in validated_data:
            instance.llm_settings = validated_data.pop("llm_settings")
            instance.save()
        if "skip_raw_files" in validated_data:
            instance.skip_raw_files = validated_data.pop("skip_raw_files")
            instance.save()
            logger.info(
                f"Updated skip_raw_files to {instance.skip_raw_files} for user {instance.username}"
            )
        if "stack_raw_jpeg" in validated_data:
            instance.stack_raw_jpeg = validated_data.pop("stack_raw_jpeg")
            instance.save()
            logger.info(
                f"Updated stack_raw_jpeg to {instance.stack_raw_jpeg} for user {instance.username}"
            )
        if "slideshow_interval" in validated_data:
            instance.slideshow_interval = validated_data.pop("slideshow_interval")
            instance.save()
            logger.info(
                f"Updated slideshow_interval to {instance.slideshow_interval} for user {instance.username}"
            )
        if "duplicate_sensitivity" in validated_data:
            instance.duplicate_sensitivity = validated_data.pop("duplicate_sensitivity")
            instance.save()
            logger.info(
                f"Updated duplicate_sensitivity to {instance.duplicate_sensitivity} for user {instance.username}"
            )
        if "duplicate_clear_existing" in validated_data:
            instance.duplicate_clear_existing = validated_data.pop(
                "duplicate_clear_existing"
            )
            instance.save()
            logger.info(
                f"Updated duplicate_clear_existing to {instance.duplicate_clear_existing} for user {instance.username}"
            )

        return instance

    def get_photo_count(self, obj) -> int:
        return Photo.objects.filter(owner=obj).count()

    def get_public_photo_count(self, obj) -> int:
        return Photo.objects.filter(Q(owner=obj) & Q(public=True)).count()

    def get_public_photo_samples(self, obj) -> PhotoSuperSimpleSerializer(many=True):
        return PhotoSuperSimpleSerializer(
            Photo.objects.filter(Q(owner=obj) & Q(public=True))[:10], many=True
        ).data

    def get_avatar_url(self, obj) -> str or None:
        try:
            return obj.avatar.url
        except Exception:
            return None


class PublicUserSerializer(serializers.ModelSerializer):
    public_photo_count = serializers.SerializerMethodField()
    public_photo_samples = serializers.SerializerMethodField()
    avatar_url = serializers.SerializerMethodField()

    class Meta:
        model = User
        fields = (
            "id",
            "avatar_url",
            "username",
            "first_name",
            "last_name",
            "public_photo_count",
            "public_photo_samples",
        )

    def get_public_photo_count(self, obj) -> int:
        return Photo.objects.filter(Q(owner=obj) & Q(public=True)).count()

    def get_public_photo_samples(self, obj) -> PhotoSuperSimpleSerializer(many=True):
        return PhotoSuperSimpleSerializer(
            Photo.objects.filter(Q(owner=obj) & Q(public=True))[:10], many=True
        ).data

    def get_avatar_url(self, obj) -> str or None:
        try:
            return obj.avatar.url
        except ValueError:
            return None


class SignupUserSerializer(serializers.ModelSerializer):
    class Meta:
        model = User
        extra_kwargs = {
            "username": {"required": True},
            "password": {
                "write_only": True,
                "required": True,
                "min_length": 3,  # configurable min password length?
            },
            "email": {"required": True},
            "first_name": {"required": True},
            "last_name": {"required": True},
            "is_superuser": {"write_only": True},
        }
        fields = (
            "username",
            "password",
            "email",
            "first_name",
            "last_name",
            "is_superuser",
        )

    def create(self, validated_data):
        should_be_superuser = User.objects.filter(is_superuser=True).count() == 0
        user = super().create(validated_data)
        user.set_password(validated_data.pop("password"))
        user.is_staff = should_be_superuser
        user.is_superuser = should_be_superuser
        user.save()
        return user


class DeleteUserSerializer(serializers.ModelSerializer):
    class Meta:
        model = get_user_model()
        fields = "__all__"


class ManageUserSerializer(serializers.ModelSerializer):
    photo_count = serializers.SerializerMethodField()

    class Meta:
        model = get_user_model()
        fields = (
            "username",
            "scan_directory",
            "skip_raw_files",
            "stack_raw_jpeg",
            "confidence",
            "semantic_search_topk",
            "last_login",
            "date_joined",
            "photo_count",
            "id",
            "favorite_min_rating",
            "image_scale",
            "save_metadata_to_disk",
            "email",
            "first_name",
            "last_name",
            "password",
        )
        extra_kwargs = {
            "password": {"write_only": True},
            "scan_directory": {"required": False},
            "skip_raw_files": {"required": False},
            "stack_raw_jpeg": {"required": False},
        }

    def get_photo_count(self, obj) -> int:
        return Photo.objects.filter(owner=obj).count()

    def update(self, instance: User, validated_data):
        if "password" in validated_data:
            password = validated_data.pop("password")
            if password != "" and not settings.DEMO_SITE:
                instance.set_password(password)

        if "scan_directory" in validated_data:
            new_scan_directory = validated_data.pop("scan_directory")

            if new_scan_directory:  # Ensure it's not an empty string
                abs_new_scan_directory = os.path.abspath(new_scan_directory)

                if not is_valid_path(abs_new_scan_directory, settings.DATA_ROOT):
                    raise ValidationError(
                        "Scan directory must be inside the data root."
                    )

                if os.path.exists(abs_new_scan_directory):
                    instance.scan_directory = abs_new_scan_directory
                    logger.info(
                        f"Updated scan directory for user {instance.scan_directory}"
                    )
                else:
                    raise ValidationError("Scan directory does not exist")
        if "skip_raw_files" in validated_data:
            instance.skip_raw_files = validated_data.pop("skip_raw_files")
        if "stack_raw_jpeg" in validated_data:
            instance.stack_raw_jpeg = validated_data.pop("stack_raw_jpeg")

        if "username" in validated_data:
            username = validated_data.pop("username")
            if username != "":
                other_user = User.objects.filter(username=username).first()
                if other_user is not None and other_user != instance:
                    raise ValidationError("User name is already taken")

            instance.username = username

        if "email" in validated_data:
            email = validated_data.pop("email")
            instance.email = email

        if "first_name" in validated_data:
            first_name = validated_data.pop("first_name")
            instance.first_name = first_name

        if "last_name" in validated_data:
            last_name = validated_data.pop("last_name")
            instance.last_name = last_name

        instance.save()
        return instance


================================================
FILE: api/services.py
================================================
import platform
import subprocess
import time
from datetime import timedelta

import requests
from django.db.models import Q
from django.utils import timezone

from api.models import Photo
from api.util import logger

# Track services that should not be restarted due to system incompatibility
INCOMPATIBLE_SERVICES = set()

# CPU features required for different services
SERVICE_CPU_REQUIREMENTS = {
    "llm": {
        "required": ["avx", "sse4_2"],  # Essential for llama.cpp
        "recommended": ["avx2", "fma", "f16c"],  # Improve performance
    }
}

# Define all the services that can be started, with their respective ports
SERVICES = {
    "image_similarity": 8002,
    "thumbnail": 8003,
    "face_recognition": 8005,
    "clip_embeddings": 8006,
    "llm": 8008,
    "image_captioning": 8007,
    "exif": 8010,
    "tags": 8011,
}

HTTP_OK = 200


def check_services():
    for service in SERVICES.keys():
        if service in INCOMPATIBLE_SERVICES:
            logger.info(f"Skipping restart of incompatible service: {service}")
            continue

        if not is_healthy(service):
            stop_service(service)
            logger.info(f"Restarting {service}")
            start_service(service)


def is_healthy(service):
    port = SERVICES.get(service)
    try:
        res = requests.get(f"http://localhost:{port}/health")
        # If response has timestamp, check if it needs to be restarted
        if res.json().get("last_request_time") is not None:
            if res.json()["last_request_time"] < time.time() - 120:
                logger.info(f"Service {service} is stale and needs to be restarted")
                return False
        return res.status_code == HTTP_OK
    except BaseException as e:
        logger.exception(f"Error checking health of {service}: {str(e)}")
        return False


def start_service(service):
    # Check system compatibility before attempting to start the service
    if not is_service_compatible(service):
        logger.error(f"Service '{service}' is not compatible with this system")
        return False

    if service == "image_similarity":
        subprocess.Popen(
            [
                "python",
                "image_similarity/main.py",
                "2>&1 | tee /logs/image_similarity.log",
            ]
        )
    elif service in SERVICES.keys():
        subprocess.Popen(
            [
                "python",
                f"service/{service}/main.py",
                "2>&1 | tee /logs/{service}.log",
            ]
        )
    else:
        logger.warning("Unknown service:", service)
        return False

    logger.info(f"Service '{service}' started successfully")
    return True


def stop_service(service):
    try:
        # Find the process ID (PID) of the service using `ps` and `grep`
        ps_command = f"ps aux | grep '[p]ython.*{service}/main.py' | awk '{{print $2}}'"
        result = subprocess.run(
            ps_command,
            shell=True,
            check=True,
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE,
        )

        pids = result.stdout.decode().strip().split()

        if not pids:
            logger.warning("Service '%s' is not running", service)
            return False

        # Kill each process found
        for pid in pids:
            subprocess.run(["kill", "-9", pid], check=True)
            logger.info(f"Service '{service}' with PID {pid} stopped successfully")

        return True
    except subprocess.CalledProcessError as e:
        logger.error(f"Failed to stop service '{service}': {e.stderr.decode().strip()}")
        return False
    except Exception as e:
        logger.error(f"An error occurred while stopping service '{service}': {e}")
        return False


def _is_arm_architecture():
    """Check if the current system is running on ARM architecture
    
    Returns:
        bool: True if ARM architecture, False otherwise
    """
    machine = platform.machine().lower()
    return machine in ['aarch64', 'arm64', 'armv7l', 'armv8']


def check_cpu_features():
    """Check for CPU instruction sets for various services
    
    Note: x86/x64-specific instruction sets (AVX, SSE, etc.) only apply to x86/x64 CPUs.
    On ARM architectures, these checks are skipped as they are not relevant.
    """
    # Check if we're on ARM architecture
    if _is_arm_architecture():
        machine = platform.machine()
        logger.info(f"Detected ARM architecture ({machine}), skipping x86-specific CPU feature checks")
        return []  # Return empty list as x86 features don't apply to ARM
    
    # Features to check for (x86/x64 specific)
    features_to_check = ["avx", "avx2", "sse4_2", "fma", "f16c"]
    available_features = []

    if not available_features:
        try:
            import cpuinfo

            cpu_info = cpuinfo.get_cpu_info()
            flags = cpu_info.get("flags", [])
            for feature in features_to_check:
                if feature in flags:
                    available_features.append(feature)
        except ImportError:
            pass

    return available_features


def has_required_cpu_features(service):
    """Check if CPU has required features for a specific service
    
    On ARM architectures, x86-specific CPU checks are bypassed since those
    instruction sets don't exist on ARM. Services like llama.cpp support ARM natively.
    """
    if service not in SERVICE_CPU_REQUIREMENTS:
        return True  # No CPU requirements for this service

    # Check if we're on ARM architecture
    if _is_arm_architecture():
        machine = platform.machine()
        logger.info(f"Running on ARM architecture ({machine}), skipping x86-specific CPU feature requirements for {service}")
        return True  # Skip x86-specific checks on ARM

    requirements = SERVICE_CPU_REQUIREMENTS[service]
    required_features = requirements.get("required", [])
    recommended_features = requirements.get("recommended", [])

    available_features = check_cpu_features()

    logger.info(f"CPU features detected for {service}: {available_features}")

    missing_required = []
    missing_recommended = []

    for feature in required_features:
        if feature not in available_features:
            missing_required.append(feature)

    for feature in recommended_features:
        if feature not in available_features:
            missing_recommended.append(feature)

    if missing_required:
        logger.error(f"Service '{service}' requires CPU features: {missing_required}")
        logger.error(f"Missing required CPU features: {missing_required}")
        return False

    if missing_recommended:
        logger.warning(
            f"Service '{service}' performance may be degraded without: {missing_recommended}"
        )

    logger.info(f"CPU compatible with service '{service}'")
    return True


def is_service_compatible(service):
    """Check if a service is compatible with the current system"""
    # Check CPU compatibility
    if not has_required_cpu_features(service):
        INCOMPATIBLE_SERVICES.add(service)
        return False

    return True


def cleanup_deleted_photos():
    deleted_photos = Photo.objects.filter(
        Q(removed=True) & Q(last_modified__gte=timezone.now() - timedelta(days=30))
    )
    for photo in deleted_photos:
        photo.delete()


================================================
FILE: api/social_graph.py
================================================
import networkx as nx
from django.db import connection

from api.models import Person
from api.util import logger


def build_social_graph(user):
    try:
        query = """
            WITH face AS (
                SELECT photo_id, person_id, name, owner_id
                FROM api_face
                JOIN api_person ON api_person.id = person_id
                JOIN api_photo ON api_photo.id = photo_id
                WHERE person_id IS NOT NULL
                    AND owner_id = {}
            )
            SELECT f1.name, f2.name
            FROM face f1
            JOIN face f2 USING (photo_id)
            WHERE f1.person_id != f2.person_id
            GROUP BY f1.name, f2.name
        """.replace("{}", str(user.id))
        G = nx.Graph()
        with connection.cursor() as cursor:
            cursor.execute(query)
            links = cursor.fetchall()
            if len(links) == 0:
                return {"nodes": [], "links": []}
            for link in links:
                G.add_edge(link[0], link[1])
        pos = nx.spring_layout(G, k=1 / 2, scale=1000, iterations=20)
        return {
            "nodes": [
                {"id": node, "x": coords[0], "y": coords[1]}
                for node, coords in pos.items()
            ],
            "links": [{"source": pair[0], "target": pair[1]} for pair in G.edges()],
        }
    except Exception:
        logger.exception(f"Error building social graph for user {user.id}")
        raise


def build_ego_graph(person_id):
    G = nx.Graph()
    person = Person.objects.prefetch_related("faces__photo__faces__person").filter(
        id=person_id
    )[0]
    for this_person_face in person.faces.all():
        for other_person_face in this_person_face.photo.faces.all():
            G.add_edge(person.name, other_person_face.person.name)
    nodes = [{"id": node} for node in G.nodes()]
    links = [{"source": pair[0], "target": pair[1]} for pair in G.edges()]
    res = {"nodes": nodes, "links": links}
    return res


================================================
FILE: api/stack_detection.py
================================================
"""
Stack detection module for grouping related photos organizationally.

Handles organizational stack types:
- BURST_SEQUENCE: Photos taken in rapid succession
- EXPOSURE_BRACKET: Bracketed exposures for HDR
- MANUAL: User-created stacks (not detected, created by user)

NOTE: RAW+JPEG pairs and Live Photos are NO LONGER handled as stacks.
They now use the Photo.files ManyToMany field for file variants
(PhotoPrism-like model). This is handled during scan, not detection.

NOTE: Duplicate detection (exact copies and visual duplicates) is now
handled separately by api/duplicate_detection.py. This module focuses
on organizational grouping, not storage cleanup.

Burst detection uses a rules-based system with two categories:
- Hard criteria: Deterministic (EXIF tags, filename patterns)
- Soft criteria: Estimation (timestamp proximity, visual similarity)
"""

from collections import defaultdict

from django.db.models import Q

from api.models import Photo
from api.models.photo_stack import PhotoStack
from api.models.long_running_job import LongRunningJob
from api.burst_detection_rules import (
    as_rules,
    get_enabled_rules,
    get_hard_rules,
    get_soft_rules,
    group_photos_by_timestamp,
    group_photos_by_visual_similarity,
    BurstRuleTypes,
)
from api.util import logger


def clear_stacks_of_type(user, stack_type):
    """
    Clear all stacks of a specific type for a user before re-detection.
    This ensures we start fresh and don't create duplicate stacks.

    Args:
        user: The user whose stacks to clear
        stack_type: The stack type to clear (e.g., PhotoStack.StackType.BURST_SEQUENCE)

    Returns:
        Number of stacks deleted
    """
    stacks_to_delete = PhotoStack.objects.filter(owner=user, stack_type=stack_type)

    count = stacks_to_delete.count()

    # Unlink all photos from these stacks (ManyToMany)
    for stack in stacks_to_delete:
        for photo in stack.photos.all():
            photo.stacks.remove(stack)

    # Delete the stacks
    stacks_to_delete.delete()

    if count > 0:
        logger.info(f"Cleared {count} {stack_type} stacks for {user.username}")

    return count


def detect_burst_sequences(
    user, interval_ms=2000, use_visual_similarity=True, progress_callback=None
):
    """
    Detect burst sequences using user's configured rules.

    This function now uses a rules-based system with two categories:
    - Hard criteria: EXIF tags, filename patterns (deterministic)
    - Soft criteria: Timestamp proximity, visual similarity (estimation)

    By default, only hard criteria rules are enabled.

    Args:
        user: The user whose photos to analyze
        interval_ms: Default milliseconds between burst photos (for soft rules without config)
        use_visual_similarity: Default for visual similarity (for soft rules without config)
        progress_callback: Optional callback(current, total, found)

    Returns:
        Number of stacks created
    """
    # Clear existing burst stacks before re-detection
    clear_stacks_of_type(user, PhotoStack.StackType.BURST_SEQUENCE)

    # Get user's burst detection rules
    rules_config = user.burst_detection_rules
    if isinstance(rules_config, str):
        import json

        rules_config = json.loads(rules_config)

    rules = as_rules(rules_config)
    enabled_rules = get_enabled_rules(rules)

    if not enabled_rules:
        logger.info(f"No burst detection rules enabled for {user.username}")
        return 0

    hard_rules = get_hard_rules(rules)
    soft_rules = get_soft_rules(rules)

    stacks_created = 0

    # === Phase 1: Hard criteria detection ===
    if hard_rules:
        stacks_created += _detect_bursts_hard_criteria(
            user, hard_rules, progress_callback
        )

    # === Phase 2: Soft criteria detection ===
    if soft_rules:
        stacks_created += _detect_bursts_soft_criteria(
            user, soft_rules, interval_ms, use_visual_similarity, progress_callback
        )

    logger.info(
        f"Burst detection for {user.username}: found {stacks_created} sequences"
    )
    return stacks_created


def _detect_bursts_hard_criteria(user, hard_rules, progress_callback=None):
    """
    Detect bursts using hard criteria (EXIF tags, filename patterns).

    These are deterministic rules that identify burst photos based on
    camera metadata or filename conventions.
    """
    from api.metadata.reader import get_metadata

    # Get all photos that could be in bursts
    photos = Photo.objects.filter(
        Q(owner=user) & Q(hidden=False) & Q(in_trashcan=False)
    ).select_related("main_file", "metadata")

    total = photos.count()
    if total == 0:
        return 0

    # Collect required EXIF tags from all rules
    required_tags = set()
    for rule in hard_rules:
        required_tags.update(rule.get_required_exif_tags())
    required_tags = list(required_tags)

    # Group photos by burst group_key
    burst_groups = defaultdict(list)

    for i, photo in enumerate(photos):
        if not photo.main_file:
            continue

        # Get EXIF tags for this photo
        try:
            exif_values = get_metadata(photo.main_file.path, required_tags)
            exif_tags = dict(zip(required_tags, exif_values))
        except Exception as e:
            logger.debug(f"Could not read EXIF for {photo.main_file.path}: {e}")
            exif_tags = {}

        # Try each hard rule until one matches
        for rule in hard_rules:
            is_burst, group_key = rule.is_burst_photo(photo, exif_tags)
            if is_burst and group_key:
                burst_groups[group_key].append(photo)
                break  # Photo matched a rule, don't try others

        if progress_callback and i % 100 == 0:
            progress_callback(i, total, len(burst_groups))

    # Create stacks from groups with 2+ photos
    stacks_created = 0
    for group_key, photos_in_group in burst_groups.items():
        if len(photos_in_group) >= 2:
            # Sort by timestamp if available
            photos_in_group.sort(key=lambda p: p.exif_timestamp or p.added_on)
            stack = _create_burst_stack(user, photos_in_group)
            if stack:
                stacks_created += 1
                logger.debug(
                    f"Created hard-criteria burst stack: {group_key} with {len(photos_in_group)} photos"
                )

    logger.info(
        f"Hard criteria burst detection: found {stacks_created} stacks from {len(burst_groups)} groups"
    )
    return stacks_created


def _detect_bursts_soft_criteria(
    user,
    soft_rules,
    default_interval_ms=2000,
    default_use_visual=True,
    progress_callback=None,
):
    """
    Detect bursts using soft criteria (timestamp proximity, visual similarity).

    These are estimation-based rules that group photos based on timing
    and/or visual similarity.
    """
    # Get photos ordered by timestamp (needed for proximity detection)
    photos = (
        Photo.objects.filter(
            Q(owner=user)
            & Q(exif_timestamp__isnull=False)
            & Q(hidden=False)
            & Q(in_trashcan=False)
        )
        .order_by("exif_timestamp")
        .select_related("main_file", "metadata")
    )

    total = photos.count()
    if total < 2:
        return 0

    stacks_created = 0
    photos_list = list(photos)

    # Process each soft rule
    for rule in soft_rules:
        if rule.rule_type == BurstRuleTypes.TIMESTAMP_PROXIMITY:
            # Get rule-specific parameters or use defaults
            interval_ms = rule.params.get("interval_ms", default_interval_ms)
            require_same_camera = rule.params.get("require_same_camera", True)

            groups = group_photos_by_timestamp(
                photos_list, interval_ms, require_same_camera
            )

            for group in groups:
                # Filter out photos already in burst stacks
                photos_to_stack = [
                    p
                    for p in group
                    if not p.stacks.filter(
                        stack_type=PhotoStack.StackType.BURST_SEQUENCE
                    ).exists()
                ]
                if len(photos_to_stack) >= 2:
                    stack = _create_burst_stack(user, photos_to_stack)
                    if stack:
                        stacks_created += 1

        elif rule.rule_type == BurstRuleTypes.VISUAL_SIMILARITY:
            similarity_threshold = rule.params.get("similarity_threshold", 15)

            groups = group_photos_by_visual_similarity(
                photos_list, similarity_threshold
            )

            for group in groups:
                # Filter out photos already in burst stacks
                photos_to_stack = [
                    p
                    for p in group
                    if not p.stacks.filter(
                        stack_type=PhotoStack.StackType.BURST_SEQUENCE
                    ).exists()
                ]
                if len(photos_to_stack) >= 2:
                    stack = _create_burst_stack(user, photos_to_stack)
                    if stack:
                        stacks_created += 1

    logger.info(f"Soft criteria burst detection: found {stacks_created} stacks")
    return stacks_created


def _create_burst_stack(user, photos):
    """Helper to create a burst stack from a list of photos."""
    if len(photos) < 2:
        return None

    # Filter out photos that are already in a burst stack to prevent duplicates
    # A photo should only be in one burst stack at a time
    photos_to_stack = [
        photo
        for photo in photos
        if not photo.stacks.filter(
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        ).exists()
    ]

    # If all photos are already stacked, skip
    if len(photos_to_stack) < 2:
        return None

    # Use create_or_merge to ensure photos aren't in multiple stacks of the same type
    # Pass sequence timestamps for burst stacks
    stack = PhotoStack.create_or_merge(
        owner=user,
        stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        photos=photos_to_stack,
        sequence_start=photos_to_stack[0].exif_timestamp,
        sequence_end=photos_to_stack[-1].exif_timestamp,
    )

    logger.info(
        f"Created/merged BURST_SEQUENCE stack with {len(photos_to_stack)} photos"
    )
    return stack


def batch_detect_stacks(user, options=None):
    """
    Run batch stack detection for a user.

    NOTE: RAW+JPEG pairs and Live Photos are now handled as file variants
    during scan (PhotoPrism-like model), not as stacks here.

    Burst detection uses the user's configured burst_detection_rules from their profile.

    Args:
        user: The user whose photos to analyze
        options: Dict with detection options:
            - detect_bursts: bool (default: True) - uses user's burst_detection_rules
    """
    if options is None:
        options = {}

    detect_bursts = options.get("detect_bursts", True)

    # Create long-running job for progress tracking
    job = LongRunningJob.create_job(
        user=user,
        job_type=LongRunningJob.JOB_SCAN_PHOTOS,
        start_now=True,
    )

    try:
        total_found = 0

        # Detect burst sequences (uses user's burst_detection_rules)
        if detect_bursts:

            def progress_burst(current, total, found):
                job.set_result(
                    {
                        "stage": "burst_sequences",
                        "current": current,
                        "total": total,
                        "found": found,
                    }
                )

            burst_count = detect_burst_sequences(user, progress_callback=progress_burst)
            total_found += burst_count

        job.complete(result={"status": "completed", "stacks_found": total_found})

        logger.info(
            f"Stack detection completed for {user.username}: {total_found} stacks found"
        )

    except Exception as e:
        logger.error(f"Stack detection failed for {user.username}: {e}")
        job.fail(error=e)
        raise


================================================
FILE: api/stacks/__init__.py
================================================
"""
Photo stacking detection and management.

This package provides unified photo grouping functionality:
- Exact copies (same MD5 hash)
- Visual duplicates (similar pHash/CLIP)
- RAW+JPEG pairs
- Burst sequences
- Exposure brackets
- Live Photos (embedded motion video)
- Manual user groupings
"""

from api.stacks.live_photo import (
    detect_live_photo,
    extract_embedded_motion_video,
    find_apple_live_photo_video,
    has_embedded_motion_video,
    process_live_photos_batch,
)

__all__ = [
    "detect_live_photo",
    "extract_embedded_motion_video",
    "find_apple_live_photo_video",
    "has_embedded_motion_video",
    "process_live_photos_batch",
]


================================================
FILE: api/stacks/live_photo.py
================================================
"""
Live Photo detection and stacking logic.

Handles extraction and grouping of Live Photos:
- Google Pixel Motion Photos (embedded MP4 after JPEG EOI)
- Samsung Motion Photos (MotionPhoto_Data marker)
- Apple Live Photos (paired .mov file)

This module moves embedded media extraction from directory_watcher to 
a dedicated stacks-aware component for better organization.
"""

from mmap import ACCESS_READ, mmap
from pathlib import Path
from typing import TYPE_CHECKING

import magic
from django.conf import settings

from api.models.file import File
from api.models.photo_stack import PhotoStack
from api.util import logger

if TYPE_CHECKING:
    from api.models.photo import Photo
    from api.models.user import User


# Markers for embedded motion video detection
JPEG_EOI_MARKER = b"\xff\xd9"
GOOGLE_PIXEL_MP4_SIGNATURES = [b"ftypmp42", b"ftypisom", b"ftypiso2"]
SAMSUNG_MOTION_MARKER = b"MotionPhoto_Data"

# Apple Live Photo video extensions
APPLE_LIVE_PHOTO_EXTENSIONS = [".mov", ".MOV"]


def _locate_google_embedded_video(data: bytes) -> int:
    """Find position of embedded MP4 in Google Motion Photo."""
    for signature in GOOGLE_PIXEL_MP4_SIGNATURES:
        position = data.find(signature)
        if position != -1:
            # MP4 header starts 4 bytes before ftyp
            return position - 4
    return -1


def _locate_samsung_embedded_video(data: bytes) -> int:
    """Find position of embedded video in Samsung Motion Photo."""
    position = data.find(SAMSUNG_MOTION_MARKER)
    if position != -1:
        # Video starts immediately after the marker
        return position + len(SAMSUNG_MOTION_MARKER)
    return -1


def has_embedded_motion_video(path: str) -> bool:
    """
    Check if a JPEG file contains an embedded motion video.
    
    Supports:
    - Google Pixel Motion Photos
    - Samsung Motion Photos
    
    Args:
        path: Path to the image file
        
    Returns:
        True if embedded video detected, False otherwise
    """
    try:
        mime = magic.Magic(mime=True)
        mime_type = mime.from_file(path)
        if mime_type != "image/jpeg":
            return False
            
        with open(path, "rb") as image:
            with mmap(image.fileno(), 0, access=ACCESS_READ) as mm:
                return (
                    _locate_google_embedded_video(mm) != -1 or
                    _locate_samsung_embedded_video(mm) != -1
                )
    except Exception as e:
        logger.warning(f"Error checking for embedded video in {path}: {e}")
        return False


def extract_embedded_motion_video(path: str, output_hash: str) -> str | None:
    """
    Extract embedded motion video from a JPEG file.
    
    Args:
        path: Path to the source image file
        output_hash: Hash to use for output filename
        
    Returns:
        Path to extracted video file, or None if extraction failed
    """
    try:
        with open(str(path), "rb") as image:
            with mmap(image.fileno(), 0, access=ACCESS_READ) as mm:
                # Try Google format first, then Samsung
                position = _locate_google_embedded_video(mm)
                if position == -1:
                    position = _locate_samsung_embedded_video(mm)
                    
                if position == -1:
                    return None
                    
                # Create output directory
                output_dir = Path(settings.MEDIA_ROOT) / "embedded_media"
                output_dir.mkdir(parents=True, exist_ok=True)
                
                output_path = output_dir / f"{output_hash}_motion.mp4"
                
                with open(output_path, "wb") as video:
                    mm.seek(position)
                    data = mm.read(mm.size() - position)
                    video.write(data)
                    
                logger.info(f"Extracted motion video to {output_path}")
                return str(output_path)
                
    except Exception as e:
        logger.error(f"Error extracting embedded video from {path}: {e}")
        return None


def find_apple_live_photo_video(image_path: str) -> str | None:
    """
    Find the companion .mov file for an Apple Live Photo.
    
    Apple Live Photos are stored as separate .HEIC/.JPG and .MOV files
    with the same base name (from ContentIdentifier).
    
    Args:
        image_path: Path to the image file
        
    Returns:
        Path to companion video file, or None if not found
    """
    base_path = Path(image_path)
    stem = base_path.stem
    parent = base_path.parent
    
    for ext in APPLE_LIVE_PHOTO_EXTENSIONS:
        video_path = parent / f"{stem}{ext}"
        if video_path.exists():
            return str(video_path)
            
    return None


def detect_live_photo(photo: "Photo", user: "User") -> PhotoStack | None:
    """
    Detect if a photo is part of a Live Photo and create a stack.
    
    This handles:
    1. Embedded motion videos (Google/Samsung) - extracts and links
    2. Apple Live Photos - finds and links companion video
    
    Args:
        photo: The Photo instance to check
        user: Owner of the photo
        
    Returns:
        PhotoStack instance if Live Photo detected, None otherwise
    """
    if not photo.main_file:
        return None
        
    image_path = photo.main_file.path
    
    # Check for embedded motion video (Google/Samsung)
    if has_embedded_motion_video(image_path):
        return _create_embedded_live_photo_stack(photo, user)
        
    # Check for Apple Live Photo companion video
    video_path = find_apple_live_photo_video(image_path)
    if video_path:
        return _create_apple_live_photo_stack(photo, video_path, user)
        
    return None


def _create_embedded_live_photo_stack(photo: "Photo", user: "User") -> PhotoStack | None:
    """Create stack for photo with embedded motion video."""
    if not settings.FEATURE_PROCESS_EMBEDDED_MEDIA:
        logger.debug("Embedded media processing disabled")
        return None
        
    image_path = photo.main_file.path
    video_path = extract_embedded_motion_video(image_path, photo.main_file.hash)
    
    if not video_path:
        return None
        
    # Create File record for the extracted video
    video_file = File.create(video_path, user)
    
    # Link as embedded media on the original file
    photo.main_file.embedded_media.add(video_file)
    
    # Create or update stack
    existing_stack = photo.stacks.filter(stack_type=PhotoStack.StackType.LIVE_PHOTO).first()
    if existing_stack:
        return existing_stack
        
    # Create new Live Photo stack
    stack = PhotoStack.objects.create(
        owner=user,
        stack_type=PhotoStack.StackType.LIVE_PHOTO,
        primary_photo=photo,
    )
    
    # Link photo to stack (ManyToMany)
    photo.stacks.add(stack)
    
    logger.info(f"Created Live Photo stack {stack.id} for embedded motion in {image_path}")
    return stack


def _create_apple_live_photo_stack(
    photo: "Photo", 
    video_path: str, 
    user: "User"
) -> PhotoStack | None:
    """Create stack for Apple Live Photo with companion video."""
    from api.models.photo import Photo
    
    # Check if video is already a known photo/file
    video_file = File.objects.filter(path=video_path).first()
    
    if not video_file:
        # Create File record for the video
        video_file = File.create(video_path, user)
        
    # Find or create the video as a Photo
    video_photo = Photo.objects.filter(main_file=video_file).first()
    
    if not video_photo:
        # Video file exists but no Photo record - might be created by scan
        # Link as embedded media instead
        photo.main_file.embedded_media.add(video_file)
        
    # Create or find stack
    existing_stack = photo.stacks.filter(stack_type=PhotoStack.StackType.LIVE_PHOTO).first()
    if existing_stack:
        stack = existing_stack
    else:
        stack = PhotoStack.objects.create(
            owner=user,
            stack_type=PhotoStack.StackType.LIVE_PHOTO,
            primary_photo=photo,
        )
        photo.stacks.add(stack)
        
    # If video is a separate Photo, link it to the same stack
    if video_photo and not video_photo.stacks.filter(stack_type=PhotoStack.StackType.LIVE_PHOTO).exists():
        video_photo.stacks.add(stack)
        
    logger.info(f"Created Apple Live Photo stack {stack.id} for {photo.main_file.path}")
    return stack


def process_live_photos_batch(user: "User", photos: list["Photo"]) -> dict:
    """
    Process multiple photos for Live Photo detection.
    
    Args:
        user: User who owns the photos
        photos: List of Photo instances to check
        
    Returns:
        Dict with counts: {detected: int, stacks_created: int}
    """
    detected = 0
    stacks_created = 0
    
    for photo in photos:
        try:
            stack = detect_live_photo(photo, user)
            if stack:
                detected += 1
                if stack.photo_count <= 1:
                    # New stack (might just have the photo, video linked separately)
                    stacks_created += 1
        except Exception as e:
            logger.error(f"Error processing Live Photo detection for {photo.id}: {e}")
            
    return {
        "detected": detected,
        "stacks_created": stacks_created,
    }


================================================
FILE: api/stats.py
================================================
import os
from datetime import datetime

import numpy as np
from django.db import connection
from django.db.models import Avg, Count, Max, Min, Q, Sum
from django.db.models.functions import TruncMonth

import random
import re

import seaborn as sns
from api.util import logger

from api.models import (
    AlbumAuto,
    AlbumDate,
    AlbumPlace,
    AlbumThing,
    AlbumUser,
    Cluster,
    Face,
    Person,
    Photo,
    User,
)
from api.models.user import get_deleted_user


def _is_sqlite() -> bool:
    return connection.vendor == "sqlite"


def jump_by_month(start_date, end_date, month_step=1):
    current_date = start_date
    yield current_date
    while current_date < end_date:
        carry, new_month = divmod(current_date.month - 1 + month_step, 12)
        new_month += 1
        current_date = current_date.replace(
            year=current_date.year + carry, month=new_month
        )
        yield current_date


def median_value(queryset, term):
    from decimal import Decimal

    count = queryset.count()
    if count == 0:
        return
    values = queryset.values_list(term, flat=True).order_by(term)
    if count % 2 == 1:
        return values[int(round(count / 2))]
    else:
        return sum(values[count / 2 - 1 : count / 2 + 1]) / Decimal(2.0)


def calc_megabytes(bytes):
    if bytes == 0 or bytes is None:
        return 0
    return round((bytes / 1024) / 1024)


def get_server_stats():
    # CPU architecture, Speed, Number of Cores, 64bit / 32 Bits
    import cpuinfo

    cpu_info = cpuinfo.get_cpu_info()
    # Available RAM
    import psutil

    available_ram = calc_megabytes(psutil.virtual_memory().total)
    # GPU
    import torch

    if torch.cuda.is_available():
        gpu_name = torch.cuda.get_device_name(0)
        gpu_memory = calc_megabytes(torch.cuda.get_device_properties(0).total_memory)
    else:
        gpu_name = ""
        gpu_memory = ""
    # Total Capacity
    import shutil

    total_storage, used_storage, free_storage = shutil.disk_usage("/")
    image_tag = os.environ.get("IMAGE_TAG", "")
    number_of_users = User.objects.filter(~Q(id=get_deleted_user().id)).count()
    users = []
    for user in User.objects.filter(~Q(id=get_deleted_user().id)):
        date_joined = user.date_joined
        number_of_photos = Photo.objects.filter(Q(owner=user)).count()
        number_of_videos = Photo.objects.filter(Q(owner=user) & Q(video=True)).count()
        number_of_captions = Photo.objects.filter(
            Q(owner=user)
            & Q(caption_instance__captions_json__user_caption__isnull=False)
        ).count()
        number_of_generated_captions = Photo.objects.filter(
            Q(owner=user) & Q(caption_instance__captions_json__im2txt__isnull=False)
        ).count()
        number_of_albums = AlbumUser.objects.filter(Q(owner=user)).count()
        min_number_of_photos_per_album = (
            AlbumUser.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Min("count"))
        )
        max_number_of_photos_per_album = (
            AlbumUser.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Max("count"))
        )
        mean_number_of_photos_per_album = (
            AlbumUser.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Avg("count"))
        )
        median_number_of_photos_per_album = median_value(
            AlbumUser.objects.filter(Q(owner=user)).annotate(count=Count("photos")),
            "count",
        )
        min_number_of_videos_per_album = (
            AlbumUser.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Min("count"))
        )
        max_number_of_videos_per_album = (
            AlbumUser.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Max("count"))
        )
        mean_number_of_videos_per_album = (
            AlbumUser.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Avg("count"))
        )
        median_number_of_videos_per_album = median_value(
            AlbumUser.objects.filter(Q(owner=user)).annotate(
                count=Count("photos", filter=Q(photos__video=True))
            ),
            "count",
        )
        number_of_persons = Person.objects.filter(Q(cluster_owner=user)).count()
        min_number_of_faces_per_person = (
            Person.objects.filter(Q(cluster_owner=user))
            .annotate(count=Count("faces"))
            .aggregate(Min("count"))
        )
        max_number_of_faces_per_person = (
            Person.objects.filter(Q(cluster_owner=user))
            .annotate(count=Count("faces"))
            .aggregate(Max("count"))
        )
        mean_number_of_faces_per_person = (
            Person.objects.filter(Q(cluster_owner=user))
            .annotate(count=Count("faces"))
            .aggregate(Avg("count"))
        )
        median_number_of_faces_per_person = median_value(
            Person.objects.filter(Q(cluster_owner=user)).annotate(count=Count("faces")),
            "count",
        )
        number_of_clusters = Cluster.objects.filter(Q(owner=user)).count()
        number_of_places = AlbumPlace.objects.filter(Q(owner=user)).count()
        min_number_of_photos_per_place = (
            AlbumPlace.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Min("count"))
        )
        max_number_of_photos_per_place = (
            AlbumPlace.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Max("count"))
        )
        mean_number_of_photos_per_place = (
            AlbumPlace.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Avg("count"))
        )
        median_number_of_photos_per_place = median_value(
            AlbumPlace.objects.filter(Q(owner=user)).annotate(count=Count("photos")),
            "count",
        )
        min_number_of_videos_per_place = (
            AlbumPlace.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Min("count"))
        )
        max_number_of_videos_per_place = (
            AlbumPlace.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Max("count"))
        )
        mean_number_of_videos_per_place = (
            AlbumPlace.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Avg("count"))
        )
        median_number_of_videos_per_place = median_value(
            AlbumPlace.objects.filter(Q(owner=user)).annotate(
                count=Count("photos", filter=Q(photos__video=True))
            ),
            "count",
        )
        number_of_things = AlbumThing.objects.filter(Q(owner=user)).count()
        min_number_of_photos_per_thing = (
            AlbumThing.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Min("count"))
        )
        max_number_of_photos_per_thing = (
            AlbumThing.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Max("count"))
        )
        mean_number_of_photos_per_thing = (
            AlbumThing.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Avg("count"))
        )
        median_number_of_photos_per_thing = median_value(
            AlbumThing.objects.filter(Q(owner=user)).annotate(count=Count("photos")),
            "count",
        )
        min_number_of_videos_per_thing = (
            AlbumThing.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Min("count"))
        )
        max_number_of_videos_per_thing = (
            AlbumThing.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Max("count"))
        )
        mean_number_of_videos_per_thing = (
            AlbumThing.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Avg("count"))
        )
        median_number_of_videos_per_thing = median_value(
            AlbumThing.objects.filter(Q(owner=user)).annotate(
                count=Count("photos", filter=Q(photos__video=True))
            ),
            "count",
        )
        number_of_events = AlbumAuto.objects.filter(Q(owner=user)).count()
        min_number_of_photos_per_event = (
            AlbumAuto.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Min("count"))
        )
        max_number_of_photos_per_event = (
            AlbumAuto.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Max("count"))
        )
        mean_number_of_photos_per_event = (
            AlbumAuto.objects.filter(Q(owner=user))
            .annotate(count=Count("photos"))
            .aggregate(Avg("count"))
        )
        median_number_of_photos_per_event = median_value(
            AlbumAuto.objects.filter(Q(owner=user)).annotate(count=Count("photos")),
            "count",
        )
        min_number_of_videos_per_event = (
            AlbumAuto.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Min("count"))
        )
        max_number_of_videos_per_event = (
            AlbumAuto.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Max("count"))
        )
        mean_number_of_videos_per_event = (
            AlbumAuto.objects.filter(Q(owner=user))
            .annotate(count=Count("photos", filter=Q(photos__video=True)))
            .aggregate(Avg("count"))
        )
        median_number_of_videos_per_event = median_value(
            AlbumAuto.objects.filter(Q(owner=user)).annotate(
                count=Count("photos", filter=Q(photos__video=True))
            ),
            "count",
        )
        number_of_favorites = Photo.objects.filter(
            Q(owner=user) & Q(rating__gte=user.favorite_min_rating)
        ).count()
        number_of_hidden = Photo.objects.filter(Q(owner=user) & Q(hidden=True)).count()
        number_of_public = Photo.objects.filter(Q(owner=user) & Q(public=True)).count()
        users.append(
            {
                "date_joined": date_joined.strftime("%d-%m-%Y"),
                "total_file_size_in_mb": calc_megabytes(
                    Photo.objects.filter(Q(owner=user)).aggregate(Sum("size"))[
                        "size__sum"
                    ]
                    or None
                ),
                "number_of_photos": number_of_photos,
                "number_of_videos": number_of_videos,
                "number_of_captions": number_of_captions,
                "number_of_generated_captions": number_of_generated_captions,
                "album": {
                    "count": number_of_albums,
                    "min": min_number_of_photos_per_album["count__min"] or None,
                    "max": max_number_of_photos_per_album["count__max"] or None,
                    "mean": mean_number_of_photos_per_album["count__avg"] or None,
                    "median": median_number_of_photos_per_album,
                    "min_videos": min_number_of_videos_per_album["count__min"] or None,
                    "max_videos": max_number_of_videos_per_album["count__max"] or None,
                    "mean_videos": mean_number_of_videos_per_album["count__avg"]
                    or None,
                    "median_videos": median_number_of_videos_per_album,
                },
                "person": {
                    "count": number_of_persons,
                    "min": min_number_of_faces_per_person["count__min"] or None,
                    "max": max_number_of_faces_per_person["count__max"] or None,
                    "mean": mean_number_of_faces_per_person["count__avg"] or None,
                    "median": median_number_of_faces_per_person,
                },
                "number_of_clusters": number_of_clusters,
                "places": {
                    "count": number_of_places,
                    "min": min_number_of_photos_per_place["count__min"] or None,
                    "max": max_number_of_photos_per_place["count__max"] or None,
                    "mean": mean_number_of_photos_per_place["count__avg"] or None,
                    "median": median_number_of_photos_per_place,
                    "min_videos": min_number_of_videos_per_place["count__min"] or None,
                    "max_videos": max_number_of_videos_per_place["count__max"] or None,
                    "mean_videos": mean_number_of_videos_per_place["count__avg"]
                    or None,
                    "median_videos": median_number_of_videos_per_place,
                },
                "things": {
                    "count": number_of_things,
                    "min": min_number_of_photos_per_thing["count__min"] or None,
                    "max": max_number_of_photos_per_thing["count__max"] or None,
                    "mean": mean_number_of_photos_per_thing["count__avg"] or None,
                    "median": median_number_of_photos_per_thing,
                    "min_videos": min_number_of_videos_per_thing["count__min"] or None,
                    "max_videos": max_number_of_videos_per_thing["count__max"] or None,
                    "mean_videos": mean_number_of_videos_per_thing["count__avg"]
                    or None,
                    "median_videos": median_number_of_videos_per_thing,
                },
                "events": {
                    "count": number_of_events,
                    "min": min_number_of_photos_per_event["count__min"] or None,
                    "max": max_number_of_photos_per_event["count__max"] or None,
                    "mean": mean_number_of_photos_per_event["count__avg"] or None,
                    "median": median_number_of_photos_per_event,
                    "min_videos": min_number_of_videos_per_event["count__min"] or None,
                    "max_videos": max_number_of_videos_per_event["count__max"] or None,
                    "mean_videos": mean_number_of_videos_per_event["count__avg"]
                    or None,
                    "median_videos": median_number_of_videos_per_event,
                },
                "number_of_favorites": number_of_favorites,
                "number_of_hidden": number_of_hidden,
                "number_of_public": number_of_public,
            }
        )
    res = {
        "cpu_info": cpu_info,
        "image_tag": image_tag,
        "available_ram_in_mb": available_ram,
        "gpu_name": gpu_name,
        "gpu_memory_in_mb": gpu_memory,
        "total_storage_in_mb": calc_megabytes(total_storage),
        "used_storage_in_mb": calc_megabytes(used_storage),
        "free_storage_in_mb": calc_megabytes(free_storage),
        "number_of_users": number_of_users,
        "users": users,
    }
    return res


def get_count_stats(user):
    num_photos = Photo.visible.filter(Q(owner=user)).distinct().count()
    num_missing_photos = Photo.objects.filter(
        Q(owner=user) & Q(files=None) | Q(main_file=None)
    ).count()
    num_faces = Face.objects.filter(photo__owner=user).count()
    num_unknown_faces = Face.objects.filter(
        (
            Q(person__name__exact="unknown")
            | Q(person__name__exact=Person.UNKNOWN_PERSON_NAME)
        )
        & Q(photo__owner=user)
    ).count()
    num_labeled_faces = Face.objects.filter(
        Q(person__isnull=False) & Q(photo__owner=user) & Q(photo__hidden=False)
    ).count()
    num_inferred_faces = Face.objects.filter(
        Q(person=True) & Q(photo__owner=user) & Q(photo__hidden=False)
    ).count()
    num_people = (
        Person.objects.filter(
            Q(faces__photo__hidden=False)
            & Q(faces__photo__owner=user)
            & Q(faces__person__isnull=False)
        )
        .distinct()
        .annotate(viewable_face_count=Count("faces"))
        .filter(Q(viewable_face_count__gt=0))
        .count()
    )
    num_albumauto = (
        AlbumAuto.objects.filter(owner=user)
        .annotate(photo_count=Count("photos"))
        .filter(Q(photo_count__gt=0))
        .count()
    )
    num_albumdate = (
        AlbumDate.objects.filter(owner=user)
        .annotate(photo_count=Count("photos"))
        .filter(Q(photo_count__gt=0))
        .count()
    )
    num_albumuser = (
        AlbumUser.objects.filter(owner=user)
        .annotate(photo_count=Count("photos"))
        .filter(Q(photo_count__gt=0))
        .count()
    )

    res = {
        "num_photos": num_photos,
        "num_missing_photos": num_missing_photos,
        "num_faces": num_faces,
        "num_people": num_people,
        "num_unknown_faces": num_unknown_faces,
        "num_labeled_faces": num_labeled_faces,
        "num_inferred_faces": num_inferred_faces,
        "num_albumauto": num_albumauto,
        "num_albumdate": num_albumdate,
        "num_albumuser": num_albumuser,
    }
    return res


def get_photo_month_counts(user):
    counts = (
        Photo.objects.filter(owner=user)
        .exclude(exif_timestamp=None)
        .annotate(month=TruncMonth("exif_timestamp"))
        .values("month")
        .annotate(c=Count("image_hash"))
        .values("month", "c")
    )

    all_months = [
        c["month"]
        for c in counts
        if c["month"].year >= 2000 and c["month"].year <= datetime.now().year
    ]

    if len(all_months) > 0:
        first_month = min(all_months)
        last_month = max(all_months)

        month_span = jump_by_month(first_month, last_month)
        counts = sorted(counts, key=lambda k: k["month"])

        res = []
        for count in counts:
            key = "-".join([str(count["month"].year), str(count["month"].month)])
            count = count["c"]
            res.append([key, count])
        res = dict(res)

        out = []
        for month in month_span:
            m = "-".join([str(month.year), str(month.month)])
            if m in res.keys():
                out.append({"month": m, "count": res[m]})
            else:
                out.append({"month": m, "count": 0})

        return out
    else:
        return []


def get_searchterms_wordcloud(user):
    # Python fallbacks (SQLite): stream and aggregate
    from collections import Counter

    out = {"captions": [], "people": [], "locations": []}

    # Captions: use Places365 categories, attributes and environment from captions_json
    captions_counter: Counter[str] = Counter()
    captions_first_seen: dict[str, int] = {}
    order_index = 0
    captions_iter = (
        Photo.objects.filter(owner=user)
        .exclude(caption_instance__captions_json__isnull=True)
        .values_list("caption_instance__captions_json", flat=True)
        .iterator(chunk_size=2000)
    )
    for caps in captions_iter:
        try:
            places365 = (caps or {}).get("places365", {})
            categories = places365.get("categories", [])
            if isinstance(categories, list):
                for cat in categories:
                    if not cat:
                        continue
                    label = str(cat)
                    captions_counter[label] += 1
                    if label not in captions_first_seen:
                        captions_first_seen[label] = order_index
                        order_index += 1
            attributes = places365.get("attributes", [])
            if isinstance(attributes, list):
                for attr in attributes:
                    if not attr:
                        continue
                    label = str(attr)
                    captions_counter[label] += 1
                    if label not in captions_first_seen:
                        captions_first_seen[label] = order_index
                        order_index += 1
            environment = places365.get("environment")
            if isinstance(environment, str) and environment:
                label = environment
                captions_counter[label] += 1
                if label not in captions_first_seen:
                    captions_first_seen[label] = order_index
                    order_index += 1
        except Exception:
            continue

    # People: aggregate with ORM to avoid per-row Python loops
    people_rows = (
        Face.objects.filter(photo__owner=user, person__name__isnull=False)
        .values("person__name")
        .annotate(c=Count("id"))
        .order_by("-c")[:100]
    )

    # Locations: parse geolocation_json, ignore postcode and poi, one word per photo
    locations_counter: Counter[str] = Counter()
    locations_first_seen: dict[str, int] = {}
    geo_iter = (
        Photo.objects.filter(owner=user)
        .exclude(geolocation_json=None)
        .values_list("image_hash", "geolocation_json")
        .iterator(chunk_size=2000)
    )
    for _image_hash, geo in geo_iter:
        try:
            features = (geo or {}).get("features", [])
        except Exception:
            features = []
        seen_values = set()
        for feature in features:
            if not isinstance(feature, dict):
                continue
            place_type = feature.get("place_type")
            value = feature.get("text")
            if not value:
                continue
            # place_type can be list or string
            types = place_type if isinstance(place_type, list) else [place_type]
            types = [t for t in types if t]
            if any(t in ("postcode", "poi") for t in types):
                continue
            seen_values.add(str(value))
        for value in seen_values:
            locations_counter[value] += 1
            if value not in locations_first_seen:
                locations_first_seen[value] = captions_first_seen.get(
                    value, order_index
                )
                order_index += 1

    # Build outputs (log of count as before)
    # Ensure stable order to match expectations: attributes/environment may come first
    # Sort captions by count desc, then by first-seen order for deterministic ties
    captions_sorted = sorted(
        captions_counter.items(),
        key=lambda kv: (-kv[1], captions_first_seen.get(kv[0], 1_000_000)),
    )[:100]
    for label, count in captions_sorted:
        out["captions"].append({"label": label, "y": float(np.log(count))})
    for row in people_rows:
        out["people"].append(
            {"label": row["person__name"], "y": float(np.log(row["c"]))}
        )
    locations_sorted = sorted(
        locations_counter.items(),
        key=lambda kv: (-kv[1], locations_first_seen.get(kv[0], 1_000_000)),
    )[:100]
    for label, count in locations_sorted:
        out["locations"].append({"label": label, "y": float(np.log(count))})

    return out


def get_location_sunburst(user):
    levels = []

    from collections import Counter

    counter = Counter()
    # Stream results to avoid caching entire queryset in memory
    photo_geo_iter = (
        Photo.objects.filter(owner=user)
        .exclude(geolocation_json=None)
        .values_list("geolocation_json", flat=True)
        .iterator(chunk_size=2000)
    )
    for geo in photo_geo_iter:
        try:
            features = (geo or {}).get("features", [])
        except Exception:
            features = []
        if not isinstance(features, list) or len(features) < 3:
            continue
        f1 = features[-1] if isinstance(features[-1], dict) else {}
        f2 = features[-2] if isinstance(features[-2], dict) else {}
        f3 = features[-3] if isinstance(features[-3], dict) else {}
        l1 = f1.get("text")
        l2 = f2.get("text")
        l3 = f3.get("text")
        if l1 is None or l2 is None or l3 is None:
            continue
        counter[(l1, l2, l3)] += 1
    levels = [[k[0], k[1], k[2], v] for k, v in counter.items()]
    levels = sorted(levels, key=lambda x: (x[0], x[1], x[2]))

    data_structure = {"name": "Places I've visited", "children": []}
    palette = sns.color_palette("hls", 10).as_hex()

    for data in levels:
        depth_cursor = data_structure["children"]
        for i, item in enumerate(data[0:-2]):
            idx = None
            j = None
            for j, c in enumerate(depth_cursor):
                if item in c.values():
                    idx = j
            if idx is None:
                depth_cursor.append(
                    {"name": item, "children": [], "hex": random.choice(palette)}
                )
                idx = len(depth_cursor) - 1

            depth_cursor = depth_cursor[idx]["children"]
            if i == len(data) - 3:
                depth_cursor.append(
                    {
                        "name": data[-2],
                        "value": data[-1],
                        "hex": random.choice(palette),
                    }
                )

    return data_structure


def get_location_clusters(user):
    start = datetime.now()
    # Build clusters in Python from JSON fields (works for both SQLite and Postgres)
    results_by_location = {}
    # Stream results to avoid large memory usage
    photo_geo_iter = (
        Photo.objects.filter(owner=user)
        .exclude(geolocation_json=None)
        .values_list("geolocation_json", flat=True)
        .iterator(chunk_size=2000)
    )
    numeric_pattern = re.compile(r"^(-)?[0-9]+$")
    for geo in photo_geo_iter:
        try:
            features = (geo or {}).get("features", [])
        except Exception:
            features = []
        for feature in features:
            location_text = feature.get("text") if isinstance(feature, dict) else None
            if not location_text or numeric_pattern.match(str(location_text)):
                continue
            center = feature.get("center") if isinstance(feature, dict) else None
            if not (isinstance(center, (list, tuple)) and len(center) >= 2):
                continue
            # Keep first occurrence per distinct location name
            if location_text not in results_by_location:
                lon = center[0]
                lat = center[1]
                try:
                    lat_f = float(lat)
                    lon_f = float(lon)
                except Exception:
                    continue
                results_by_location[location_text] = [lat_f, lon_f, location_text]

    # Order by location to mimic SQL ordering
    res = [results_by_location[key] for key in sorted(results_by_location.keys())]
    elapsed = (datetime.now() - start).total_seconds()
    logger.info("location clustering computed in %.2f seconds" % elapsed)
    return res


def get_location_timeline(user):
    # Python fallback: iterate photos ordered by timestamp and build contiguous location spans
    def extract_location(geo: dict) -> str | None:
        if not geo or not isinstance(geo, dict):
            return None
        features = geo.get("features", [])
        if not isinstance(features, list) or not features:
            return None
        last = features[-1]
        if isinstance(last, dict):
            return last.get("text")
        return None

    # Stream through photos ordered by exif_timestamp
    qs = (
        Photo.objects.filter(owner=user)
        .exclude(exif_timestamp=None)
        .order_by("exif_timestamp")
        .values_list("geolocation_json", "exif_timestamp")
        .iterator(chunk_size=2000)
    )
    spans: list[tuple[str, datetime, datetime]] = []
    current_loc: str | None = None
    run_start: datetime | None = None
    last_time: datetime | None = None
    for geo, ts in qs:
        loc = extract_location(geo)
        if loc is None:
            continue
        if current_loc is None:
            current_loc = loc
            run_start = ts
            last_time = ts
            continue
        if loc == current_loc:
            last_time = ts
            continue
        # location changed → close previous span
        spans.append((current_loc, run_start, last_time))
        current_loc = loc
        run_start = ts
        last_time = ts
    # close final span
    if current_loc is not None and run_start is not None and last_time is not None:
        spans.append((current_loc, run_start, last_time))

    # Coalesce: set each span's end to next span's begin (like SQL LEAD(begin))
    city_start_end_duration = []
    for idx, (loc, begin, end) in enumerate(spans):
        new_end = spans[idx + 1][1] if idx + 1 < len(spans) else end
        duration_sec = (new_end - begin).total_seconds()
        city_start_end_duration.append((loc, begin, new_end, duration_sec))

    colors = sns.color_palette("Paired", len(city_start_end_duration)).as_hex()

    data = []
    for idx, sted in enumerate(city_start_end_duration):
        data.append(
            {
                "data": [sted[3]],
                "color": colors[idx],
                "loc": sted[0],
                "start": sted[1].timestamp(),
                "end": sted[2].timestamp(),
            }
        )
    return data


================================================
FILE: api/tests/__init__.py
================================================


================================================
FILE: api/tests/fixtures/__init__.py
================================================


================================================
FILE: api/tests/fixtures/api_util/captions_json.py
================================================
captions_json = {
    "places365": {
        "attributes": [
            "no horizon",
            "man made",
            "enclosed area",
            "cloth",
            "natural light",
            "wood",
            "glass",
            "indoor lighting",
            "dry",
        ],
        "categories": ["phone booth", "ticket booth"],
        "environment": "indoor",
    }
}


================================================
FILE: api/tests/fixtures/api_util/expectation.py
================================================
wordcloud_expectation = {
    "captions": [
        {"label": "outdoor", "y": 1.9459101490553132},
        {"label": "indoor", "y": 0.6931471805599453},
        {"label": "ticket booth", "y": 0.0},
        {"label": "boardwalk", "y": 0.0},
        {"label": "phone booth", "y": 0.0},
        {"label": "delicatessen", "y": 0.0},
        {"label": "lagoon", "y": 0.0},
        {"label": "tundra", "y": 0.0},
        {"label": "marsh", "y": 0.0},
        {"label": "bakery shop", "y": 0.0},
        {"label": "market outdoor", "y": 0.0},
        {"label": "butchers shop", "y": 0.0},
        {"label": "playground", "y": 0.0},
        {"label": "picnic area", "y": 0.0},
    ],
    "people": [],
    "locations": [
        {"label": "New South Wales", "y": 1.3862943611198906},
        {"label": "Sydney", "y": 1.3862943611198906},
        {"label": "Australia", "y": 1.3862943611198906},
        {"label": "Maroubra", "y": 1.0986122886681098},
        {"label": "Ladakh", "y": 0.6931471805599453},
        {"label": "Leh", "y": 0.6931471805599453},
        {"label": "Berlin", "y": 0.6931471805599453},
        {"label": "Germany", "y": 0.6931471805599453},
        {"label": "India", "y": 0.6931471805599453},
        {"label": "Lakeshore Road", "y": 0.0},
        {"label": "Shachokol", "y": 0.0},
        {"label": "Kreuzberg", "y": 0.0},
        {"label": "Canada", "y": 0.0},
        {"label": "Bondi Beach", "y": 0.0},
        {"label": "Peterborough County", "y": 0.0},
        {"label": "Lakefield", "y": 0.0},
        {"label": "Main Bazaar", "y": 0.0},
        {"label": "Ontario", "y": 0.0},
        {"label": "Chuchat Yakma", "y": 0.0},
        {"label": "Friedrichshain", "y": 0.0},
        {"label": "Beach Road", "y": 0.0},
        {"label": "Fire Route 47", "y": 0.0},
    ],
}


================================================
FILE: api/tests/fixtures/api_util/photos.py
================================================
photos = [
    {
        "thumbnail_big": "thumbnails_big/88070102f4a9a25ba26959b8e1f203a91.webp",
        "square_thumbnail": "square_thumbnails/88070102f4a9a25ba26959b8e1f203a91.webp",
        "square_thumbnail_small": "square_thumbnails_small/88070102f4a9a25ba26959b8e1f203a91.webp",
        "added_on": "2023-06-16 16:30:47.724635 +00:00",
        "exif_gps_lat": 52.5075472222222,
        "exif_gps_lon": 13.4549222222222,
        "exif_timestamp": "2017-08-23 16:13:32.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [13.454922, 52.507547],
            "features": [
                {
                    "id": "poi.712964618154",
                    "text": "Badehaus - Szimpla Musiksalon",
                    "type": "Feature",
                    "center": [13.455101, 52.507538],
                    "context": [
                        {
                            "id": "postcode.5156410",
                            "text": "10245",
                            "mapbox_id": "dXJuOm1ieHBsYzpUcTQ2",
                        },
                        {
                            "id": "locality.90794554",
                            "text": "Friedrichshain",
                            "wikidata": "Q317056",
                            "mapbox_id": "dXJuOm1ieHBsYzpCV2xxT2c",
                        },
                        {
                            "id": "place.115770",
                            "text": "Berlin",
                            "wikidata": "Q64",
                            "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                            "short_code": "DE-BE",
                        },
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [13.455101, 52.507538],
                    },
                    "relevance": 1,
                    "place_name": "Badehaus - Szimpla Musiksalon, Revaler Str. 99, Berlin, 10245, Germany",
                    "place_type": ["poi"],
                    "properties": {
                        "address": "Revaler Str. 99",
                        "category": "bar, pub, alcohol, liquor, beer",
                        "landmark": True,
                        "foursquare": "4e62924d18a8ce02fce9d584",
                    },
                },
                {
                    "id": "postcode.5156410",
                    "bbox": [13.445615, 52.486046, 13.491453, 52.514722],
                    "text": "10245",
                    "type": "Feature",
                    "center": [13.458408, 52.504367],
                    "context": [
                        {
                            "id": "locality.90794554",
                            "text": "Friedrichshain",
                            "wikidata": "Q317056",
                            "mapbox_id": "dXJuOm1ieHBsYzpCV2xxT2c",
                        },
                        {
                            "id": "place.115770",
                            "text": "Berlin",
                            "wikidata": "Q64",
                            "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                            "short_code": "DE-BE",
                        },
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [13.458408, 52.504367],
                    },
                    "relevance": 1,
                    "place_name": "10245, Berlin, Germany",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzpUcTQ2"},
                },
                {
                    "id": "locality.90794554",
                    "bbox": [13.419752, 52.486046, 13.491453, 52.531026],
                    "text": "Friedrichshain",
                    "type": "Feature",
                    "center": [13.45029, 52.512215],
                    "context": [
                        {
                            "id": "place.115770",
                            "text": "Berlin",
                            "wikidata": "Q64",
                            "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                            "short_code": "DE-BE",
                        },
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        },
                    ],
                    "geometry": {"type": "Point", "coordinates": [13.45029, 52.512215]},
                    "relevance": 1,
                    "place_name": "Friedrichshain, Berlin, Germany",
                    "place_type": ["locality"],
                    "properties": {
                        "wikidata": "Q317056",
                        "mapbox_id": "dXJuOm1ieHBsYzpCV2xxT2c",
                    },
                },
                {
                    "id": "place.115770",
                    "bbox": [13.08836, 52.338261, 13.761131, 52.675502],
                    "text": "Berlin",
                    "type": "Feature",
                    "center": [13.3888599, 52.5170365],
                    "context": [
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [13.3888599, 52.5170365],
                    },
                    "relevance": 1,
                    "place_name": "Berlin, Germany",
                    "place_type": ["region", "place"],
                    "properties": {
                        "wikidata": "Q64",
                        "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                        "short_code": "DE-BE",
                    },
                },
                {
                    "id": "country.8762",
                    "bbox": [5.866315, 47.270238, 15.041832, 55.1286491],
                    "text": "Germany",
                    "type": "Feature",
                    "center": [10.0183432948567, 51.1334813439932],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [10.0183432948567, 51.1334813439932],
                    },
                    "relevance": 1,
                    "place_name": "Germany",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q183",
                        "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                        "short_code": "de",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Badehaus - Szimpla Musiksalon 10245 Friedrichshain Berlin Germany",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "no horizon",
                    "man made",
                    "enclosed area",
                    "cloth",
                    "natural light",
                    "wood",
                    "glass",
                    "indoor lighting",
                    "dry",
                ],
                "categories": ["phone booth", "ticket booth"],
                "environment": "indoor",
            }
        },
        "search_captions": "phone booth , ticket booth , indoor",
        "search_location": "Badehaus - Szimpla Musiksalon 10245 Friedrichshain Berlin Germany",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            0.02945636957883835,
            0.0006848685443401337,
            -0.21565294265747070,
            -0.13726805150508880,
            0.34177422523498535,
            -0.21947097778320312,
            -0.36535099148750305,
            0.43704378604888916,
            -0.04088297113776207,
            -0.16377356648445130,
            0.61226522922515870,
            -0.27190640568733215,
            0.21632727980613708,
            -0.49879187345504760,
            0.35928872227668760,
            -0.57344657182693480,
            -1.09348952770233150,
            0.12758482992649078,
            0.22626115381717682,
            -0.29700523614883423,
            0.67408502101898190,
            0.20566113293170930,
            0.004221141338348389,
            -0.18163934350013733,
            0.030123591423034668,
            -0.36574870347976685,
            0.37040638923645020,
            -0.15804094076156616,
            0.40848651528358460,
            -0.44146019220352173,
            -0.29682993888854980,
            -0.14033758640289307,
            0.15358698368072510,
            0.14189875125885010,
            -0.24039962887763977,
            0.15688608586788177,
            -0.13299843668937683,
            -0.09722766280174255,
            0.15716867148876190,
            0.06153672933578491,
            -0.24909989535808563,
            0.42868158221244810,
            -0.09139122068881989,
            0.026236191391944885,
            0.43363174796104430,
            0.15078209340572357,
            -0.02513679303228855,
            -0.16301257908344270,
            0.30406942963600160,
            -0.20351555943489075,
            0.32808005809783936,
            0.11325813829898834,
            0.06632904708385468,
            -0.13974805176258087,
            -0.08816416561603546,
            0.08763262629508972,
            0.36618012189865110,
            -0.016463160514831543,
            0.51381558179855350,
            -0.19019323587417603,
            0.007199913263320923,
            -0.47690716385841370,
            -0.011584945023059845,
            0.27767223119735720,
            0.05724636837840080,
            -0.14331746101379395,
            -0.17595694959163666,
            0.69013822078704830,
            -0.29242870211601260,
            -0.20638096332550050,
            0.15023268759250640,
            0.39301073551177980,
            -0.07778433710336685,
            -0.31314268708229065,
            -0.08601596951484680,
            -0.33508300781250000,
            -0.46537816524505615,
            -0.11456200480461120,
            0.12097512185573578,
            -0.21884436905384064,
            0.08210694789886475,
            -0.20028553903102875,
            0.019847501069307327,
            -0.47711223363876340,
            0.41822510957717896,
            0.28469321131706240,
            0.56612819433212280,
            -0.37348130345344543,
            0.36494156718254090,
            -0.29691773653030396,
            0.27490460872650146,
            0.055256836116313934,
            -5.04034137725830100,
            0.21063046157360077,
            0.07623146474361420,
            0.91044491529464720,
            0.09022644162178040,
            -0.22425013780593872,
            -0.15275251865386963,
            0.56555438041687010,
            -0.21015779674053192,
            0.12018989026546478,
            0.050851717591285706,
            0.07409352064132690,
            0.10203989595174790,
            -0.14679333567619324,
            -0.45498293638229370,
            0.18498001992702484,
            0.08312227576971054,
            -0.20828101038932800,
            0.22045168280601501,
            -0.41870164871215820,
            -0.18289424479007720,
            0.27803760766983030,
            -0.14669309556484222,
            0.11136791110038757,
            -0.07714871317148209,
            0.11111782491207123,
            0.33326071500778200,
            -0.22490462660789490,
            -0.023626238107681274,
            -0.38946658372879030,
            -0.11872470378875732,
            0.003953278064727783,
            0.06875754147768020,
            0.06950961053371430,
            0.20257902145385742,
            0.48788213729858400,
            -0.55383354425430300,
            0.26022326946258545,
            0.54247814416885380,
            -0.75806522369384770,
            -0.16927206516265870,
            0.86247527599334720,
            0.00693318247795105,
            0.48897692561149597,
            -0.028302762657403946,
            -0.39459863305091860,
            -0.09011757373809814,
            -0.002951778471469879,
            -0.34152612090110780,
            -0.053652018308639526,
            -0.05833066999912262,
            0.23596245050430298,
            0.11364882439374924,
            0.29371896386146545,
            0.20242361724376678,
            0.41401028633117676,
            0.29458260536193850,
            0.12261603027582169,
            0.35396143794059753,
            -0.37751555442810060,
            -0.65084457397460940,
            0.43545067310333250,
            -0.12954968214035034,
            -0.55164968967437740,
            -0.028061915189027786,
            -0.41742083430290220,
            -0.84223127365112300,
            0.28066438436508180,
            -0.39846715331077576,
            -0.29234075546264650,
            0.40001532435417175,
            -0.025802582502365112,
            0.035069286823272705,
            0.58283793926239010,
            1.06991338729858400,
            -0.004069690592586994,
            0.16848376393318176,
            -0.32832053303718567,
            -0.05214332789182663,
            -0.22528168559074402,
            -0.012514784932136536,
            -0.22871030867099762,
            -0.46591621637344360,
            0.43959569931030273,
            0.52867388725280760,
            0.08700185269117355,
            0.82598596811294560,
            0.72045898437500000,
            -0.18566657602787018,
            0.31717744469642640,
            -0.32986947894096375,
            -0.08980216830968857,
            -0.29798981547355650,
            -0.20281662046909332,
            0.35008898377418520,
            -0.06911731511354446,
            0.46833136677742004,
            -0.05824550986289978,
            0.22831164300441742,
            -0.14332316815853120,
            -0.54719811677932740,
            -0.033745840191841125,
            -0.14754259586334229,
            -0.15379694104194640,
            0.27912741899490356,
            -0.38673168420791626,
            0.18064787983894348,
            0.02594844251871109,
            -0.19353626668453217,
            0.12792934477329254,
            0.76823699474334720,
            -0.25351685285568240,
            0.19726955890655518,
            0.04505273699760437,
            0.08072985708713531,
            -0.40315085649490356,
            -0.05216634273529053,
            0.33589959144592285,
            0.13084968924522400,
            -0.71316510438919070,
            0.62502771615982060,
            0.15854838490486145,
            -0.46951773762702940,
            -0.05899134278297424,
            -0.07570817321538925,
            -0.21729907393455505,
            -0.48353233933448790,
            -0.30078506469726560,
            0.01950731873512268,
            0.35301312804222107,
            -0.11586478352546692,
            0.06945395469665527,
            -0.09096579253673553,
            -0.003176487982273102,
            -0.06729926168918610,
            0.16478994488716125,
            0.11996459960937500,
            0.08691802620887756,
            -0.37051337957382200,
            -0.27022105455398560,
            0.44754734635353090,
            0.58564084768295290,
            0.14264307916164398,
            -0.27284860610961914,
            -0.21267735958099365,
            -0.62931954860687260,
            -0.17053475975990295,
            0.43907707929611206,
            -0.17706312239170074,
            -0.20798830687999725,
            -0.013556711375713348,
            -0.45459657907485960,
            0.27621361613273620,
            -0.00547829270362854,
            0.09221091866493225,
            -0.45583301782608030,
            -0.04141671583056450,
            -0.04372096061706543,
            -0.08653303980827332,
            0.16906698048114777,
            -0.39207679033279420,
            0.16125959157943726,
            0.18793570995330810,
            -0.062303997576236725,
            -0.14904721081256866,
            -0.08313135802745819,
            0.71267020702362060,
            -0.12299664318561554,
            0.45854219794273376,
            0.37172207236289980,
            0.23576152324676514,
            -0.96158236265182500,
            -0.16355091333389282,
            0.08433900773525238,
            -0.26110875606536865,
            0.41418594121932983,
            -0.00952976569533348,
            -0.31196358799934387,
            0.08939869701862335,
            0.08166363835334778,
            0.27331307530403137,
            -0.23260714113712310,
            -0.11067157238721848,
            0.07786403596401215,
            0.15424127876758575,
            -0.15310212969779968,
            -0.57094782590866090,
            0.08447279036045074,
            0.09531763195991516,
            -0.16973701119422913,
            -0.39517831802368164,
            0.48301315307617190,
            -0.49167299270629883,
            0.16578084230422974,
            0.012142054736614227,
            0.38737818598747253,
            -0.42219209671020510,
            0.038790080696344376,
            0.14427416026592255,
            0.51845633983612060,
            0.30745857954025270,
            0.19423109292984010,
            -0.29949772357940674,
            -0.22886085510253906,
            -0.18502810597419740,
            0.58494806289672850,
            -0.05995021387934685,
            0.027786150574684143,
            0.16225285828113556,
            -0.21960149705410004,
            -0.19987022876739502,
            0.17615880072116852,
            0.12230071425437927,
            0.78366780281066900,
            0.07176887989044190,
            0.34315368533134460,
            0.32958623766899110,
            0.046860724687576294,
            -0.37855774164199830,
            0.10880301892757416,
            0.86260342597961430,
            -0.25351122021675110,
            -0.33743318915367126,
            -0.000004470348358154297,
            0.10894200950860977,
            -0.24402043223381042,
            0.041552767157554626,
            1.11131787300109860,
            0.19667577743530273,
            0.09909820556640625,
            -0.22913703322410583,
            0.07402139902114868,
            -0.51243948936462400,
            -0.011785134673118591,
            0.11913090944290161,
            0.10973167419433594,
            0.14159473776817322,
            -0.25530740618705750,
            -0.10128769278526306,
            -0.018086418509483337,
            0.23918014764785767,
            -0.0025010444223880768,
            0.028242304921150208,
            -0.10461166501045227,
            0.31454890966415405,
            -0.21300530433654785,
            -0.67316675186157230,
            -0.28894531726837160,
            0.15850226581096650,
            -0.25393971800804140,
            0.015249133110046387,
            0.17902487516403198,
            0.03674941509962082,
            -0.40653368830680847,
            0.06983637809753418,
            0.58390831947326660,
            -0.35204166173934937,
            -0.23273511230945587,
            -0.50346362590789800,
            -0.18698497116565704,
            -0.13735061883926392,
            -0.029784053564071655,
            -0.23463270068168640,
            0.04800243675708771,
            0.21194185316562653,
            2.50413703918457030,
            0.014399580657482147,
            0.13682425022125244,
            -0.44549101591110230,
            -0.05332183837890625,
            0.26232331991195680,
            0.48867249488830566,
            0.90782088041305540,
            -0.04284442216157913,
            0.16441944241523743,
            -0.64545953273773190,
            0.0021270206198096275,
            0.57723963260650630,
            -0.16735523939132690,
            -0.03681857883930206,
            -0.23049485683441162,
            -0.16818353533744812,
            0.48354497551918030,
            -0.34307366609573364,
            0.90225481986999510,
            -0.08604586869478226,
            -0.80853521823883060,
            0.07412493973970413,
            0.38500127196311950,
            -0.53182345628738400,
            -0.37833765149116516,
            -0.27583479881286620,
            0.18323482573032380,
            -0.57118958234786990,
            0.15203747153282166,
            -0.45285981893539430,
            0.14797788858413696,
            0.92780256271362300,
            -0.99070614576339720,
            0.78525125980377200,
            -0.54372054338455200,
            0.27046817541122437,
            0.05927395448088646,
            0.29292181134223940,
            0.17652636766433716,
            -0.28721928596496580,
            -0.11287573724985123,
            0.054300934076309204,
            -0.20183458924293518,
            -0.06938034296035767,
            -0.02237860858440399,
            -0.28468230366706850,
            0.27039328217506410,
            -0.44048523902893066,
            -0.10478976368904114,
            0.22237929701805115,
            0.61014431715011600,
            0.22426150739192963,
            -0.53682762384414670,
            0.17780613899230957,
            0.10927680134773254,
            -0.08265303075313568,
            0.08433099091053009,
            0.22053673863410950,
            -0.15935529768466950,
            0.02448994666337967,
            -0.15990000963211060,
            -0.10862783342599869,
            -0.55222094058990480,
            -0.18120177090168000,
            -0.18480616807937622,
            -0.40381407737731934,
            0.41113349795341490,
            0.45374616980552673,
            0.12371205538511276,
            0.54327690601348880,
            -1.32808542251586910,
            0.06879405677318573,
            -0.32771402597427370,
            0.30996549129486084,
            0.73747062683105470,
            0.0026262253522872925,
            -0.07966820895671844,
            -0.43908175826072693,
            -0.57706052064895630,
            -0.07506740093231201,
            -0.03822087496519089,
            0.14753995835781097,
            0.26234555244445800,
            0.37969052791595460,
            -0.03944581747055054,
            -0.21361999213695526,
            0.30636596679687500,
            0.36208370327949524,
            -0.51721900701522830,
            -0.72269493341445920,
            0.12646321952342987,
            0.30191451311111450,
            0.88483667373657230,
            0.13586276769638062,
            -0.47170540690422060,
            -0.22053156793117523,
            -0.32388603687286377,
            0.28210371732711790,
            -0.14361841976642610,
            0.35813957452774050,
            -0.71662276983261110,
            -0.36910200119018555,
            -0.50887799263000490,
            0.18198430538177490,
            -0.12547180056571960,
            0.019948184490203857,
            -0.027965955436229706,
            0.23368665575981140,
            0.08205719292163849,
            0.03229612857103348,
            -0.37393200397491455,
            0.09985578060150146,
            0.16484981775283813,
            -0.03449898585677147,
            -0.20320037007331848,
            0.17666932940483093,
            -0.10235498100519180,
            -0.18969213962554932,
            -0.06653118133544922,
            0.32699528336524963,
            -0.41083279252052307,
            0.17249025404453278,
            -0.71300625801086430,
            -0.40383389592170715,
            -0.012773919850587845,
            -0.04669109359383583,
            -0.16580447554588318,
            -0.034973472356796265,
            0.18406766653060913,
            0.32842925190925600,
            -0.43452721834182740,
            0.07465618103742600,
            -0.054404426366090775,
            0.07043577730655670,
            0.34492620825767517,
            -0.55067378282547000,
            -0.35782644152641296,
            0.22946852445602417,
            0.13374575972557068,
            0.23378580808639526,
            -0.18907654285430908,
            -0.20370183885097504,
            -0.63759642839431760,
            0.29174658656120300,
            -0.20586502552032470,
            0.08419455587863922,
            0.96353048086166380,
            -0.023577764630317688,
            0.34594947099685670,
            -0.07180836796760559,
            -0.11015791445970535,
            -0.10569672286510468,
            0.29831579327583313,
            0.21254715323448180,
        ],
        "clip_embeddings_magnitude": 9.564716339111328,
        "aspect_ratio": 0.75,
        "rating": 0,
        "dominant_color": "[145, 83, 48]",
        "video_length": None,
        "in_trashcan": False,
        "removed": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 4032,
        "iso": None,
        "lens": None,
        "shutter_speed": "1/100",
        "size": 7194067,
        "subjectDistance": 0.614,
        "width": 3024,
        "main_file_id": "88070102f4a9a25ba26959b8e1f203a91",
    },
    {
        "thumbnail_big": "thumbnails_big/cac6402c7ff192e6fa96fee50ba24fd81.webp",
        "square_thumbnail": "square_thumbnails/cac6402c7ff192e6fa96fee50ba24fd81.webp",
        "square_thumbnail_small": "square_thumbnails_small/cac6402c7ff192e6fa96fee50ba24fd81.webp",
        "added_on": "2023-06-16 16:30:44.284649 +00:00",
        "exif_gps_lat": 34.1620972222222,
        "exif_gps_lon": 77.5858416666667,
        "exif_timestamp": "2017-08-09 23:04:03.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [77.585842, 34.162097],
            "features": [
                {
                    "id": "address.15438142488176",
                    "text": "Main Bazaar",
                    "type": "Feature",
                    "center": [77.585527, 34.1622089],
                    "context": [
                        {
                            "id": "postcode.13053547",
                            "text": "194101",
                            "mapbox_id": "dXJuOm1ieHBsYzp4eTVy",
                        },
                        {
                            "id": "locality.997100139",
                            "text": "Chuchat Yakma",
                            "wikidata": "Q24909733",
                            "mapbox_id": "dXJuOm1ieHBsYzpPMjZLYXc",
                        },
                        {
                            "id": "place.25135211",
                            "text": "Leh",
                            "wikidata": "Q230818",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                        },
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [77.585527, 34.1622089],
                    },
                    "relevance": 1,
                    "place_name": "Main Bazaar ، 194101 Leh، India",
                    "place_type": ["address"],
                    "properties": {"accuracy": "street"},
                },
                {
                    "id": "postcode.13053547",
                    "bbox": [77.107033, 33.67805, 77.812822, 34.511912],
                    "text": "194101",
                    "type": "Feature",
                    "center": [77.572696, 34.199537],
                    "context": [
                        {
                            "id": "locality.997100139",
                            "text": "Chuchat Yakma",
                            "wikidata": "Q24909733",
                            "mapbox_id": "dXJuOm1ieHBsYzpPMjZLYXc",
                        },
                        {
                            "id": "place.25135211",
                            "text": "Leh",
                            "wikidata": "Q230818",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                        },
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [77.572696, 34.199537],
                    },
                    "relevance": 1,
                    "place_name": "194101, Leh, Ladakh, India",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzp4eTVy"},
                },
                {
                    "id": "locality.997100139",
                    "bbox": [76.626529011, 33.347769, 78.047440762, 34.538001],
                    "text": "Chuchat Yakma",
                    "type": "Feature",
                    "center": [77.602518, 34.07534],
                    "context": [
                        {
                            "id": "place.25135211",
                            "text": "Leh",
                            "wikidata": "Q230818",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                        },
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {"type": "Point", "coordinates": [77.602518, 34.07534]},
                    "relevance": 1,
                    "place_name": "Chuchat Yakma, Leh, Leh, Ladakh, India",
                    "place_type": ["locality"],
                    "properties": {
                        "wikidata": "Q24909733",
                        "mapbox_id": "dXJuOm1ieHBsYzpPMjZLYXc",
                    },
                },
                {
                    "id": "place.25135211",
                    "bbox": [77.107033, 32.33574, 79.305839, 35.522256],
                    "text": "Leh",
                    "type": "Feature",
                    "center": [77.584813, 34.164203],
                    "context": [
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [77.584813, 34.164203],
                    },
                    "relevance": 1,
                    "place_name": "Leh, Ladakh, India",
                    "place_type": ["place"],
                    "properties": {
                        "wikidata": "Q230818",
                        "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                    },
                },
                {
                    "id": "region.222315",
                    "bbox": [75.306629, 32.33574, 79.305851, 35.673315],
                    "text": "Ladakh",
                    "type": "Feature",
                    "center": [77.27783203125, 34.0071350643588],
                    "context": [
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [77.27783203125, 34.0071350643588],
                    },
                    "relevance": 1,
                    "place_name": "Ladakh, India",
                    "place_type": ["region"],
                    "properties": {
                        "wikidata": "Q200667",
                        "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                        "short_code": "IN-LA",
                    },
                },
                {
                    "id": "country.8811",
                    "bbox": [68.1152344, 6.6718373, 97.395359, 35.673315],
                    "text": "India",
                    "type": "Feature",
                    "center": [78.476681027237, 22.1991660760527],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [78.476681027237, 22.1991660760527],
                    },
                    "relevance": 1,
                    "place_name": "India",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q668",
                        "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                        "short_code": "in",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Main Bazaar 194101 Chuchat Yakma Leh Ladakh India",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "no horizon",
                    "cloth",
                    "enclosed area",
                    "natural light",
                    "man made",
                    "rugged scene",
                    "dry",
                    "shopping",
                    "working",
                ],
                "categories": [
                    "butchers shop",
                    "bakery shop",
                    "delicatessen",
                    "market outdoor",
                ],
                "environment": "indoor",
            }
        },
        "search_captions": "butchers shop , bakery shop , delicatessen , market outdoor , indoor",
        "search_location": "Main Bazaar 194101 Chuchat Yakma Leh Ladakh India",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            -0.36275115609169006,
            0.04232349991798401,
            0.16003805398941040,
            -0.15414649248123170,
            0.07362174987792969,
            0.30168089270591736,
            0.29503446817398070,
            0.52876400947570800,
            0.03624974191188812,
            0.57748210430145260,
            0.06661064177751541,
            -0.08749669790267944,
            -0.43980333209037780,
            -0.45719712972640990,
            0.20980522036552430,
            0.31552031636238100,
            0.28292679786682130,
            -0.23881813883781433,
            0.26318275928497314,
            -0.25081199407577515,
            -1.56406641006469730,
            -0.20272035896778107,
            -0.30980134010314940,
            -0.13830965757369995,
            -0.65654301643371580,
            0.31328544020652770,
            0.39124441146850586,
            0.14648842811584473,
            0.10790233314037323,
            -0.0011418797075748444,
            0.29148331284523010,
            0.39446878433227540,
            0.15861868858337402,
            -0.01094374805688858,
            0.69656980037689210,
            0.53402501344680790,
            -0.19458736479282380,
            -0.33765941858291626,
            0.20578813552856445,
            1.02007591724395750,
            -0.27630817890167236,
            -0.055134907364845276,
            0.10728104412555695,
            0.19857768714427948,
            -0.051949791610240936,
            -0.95591288805007930,
            -0.016068458557128906,
            0.14163839817047120,
            0.07818788290023804,
            0.30343624949455260,
            -0.00487295538187027,
            -0.03668808937072754,
            0.23092812299728394,
            0.22601000964641570,
            -0.17142324149608612,
            0.19191186130046844,
            0.24479267001152039,
            0.75923907756805420,
            0.52936017513275150,
            0.59186935424804690,
            -0.60621523857116700,
            0.32727080583572390,
            -0.11824478209018707,
            -0.05898610129952431,
            -0.012164704501628876,
            -0.10524882376194000,
            -0.64567971229553220,
            1.40957057476043700,
            -0.30128875374794006,
            -0.52295249700546260,
            0.053494296967983246,
            -0.34456601738929750,
            -0.22763675451278687,
            -0.07936172187328339,
            -0.61760181188583370,
            -0.18934124708175660,
            -0.04926346242427826,
            0.07053080201148987,
            -0.32558596134185790,
            -0.61692816019058230,
            0.25635927915573120,
            -0.40595006942749023,
            -0.45488622784614563,
            -1.27675628662109380,
            0.23719409108161926,
            -0.24088490009307860,
            -0.042445749044418335,
            -0.0018720626831054688,
            1.05558359622955320,
            -0.49247956275939940,
            0.17333477735519410,
            0.035649579018354416,
            -5.73797512054443400,
            1.30945181846618650,
            0.51552683115005490,
            0.15089595317840576,
            0.35859110951423645,
            -0.04071284830570221,
            -0.86825460195541380,
            1.31599712371826170,
            -0.09168644249439240,
            0.63117879629135130,
            -0.17361941933631897,
            0.10322868078947067,
            -0.60555946826934810,
            0.23382598161697388,
            -0.82185673713684080,
            -0.10401326417922974,
            0.13238205015659332,
            -0.03597678989171982,
            -0.51136314868927000,
            0.15768136084079742,
            -0.23854430019855500,
            -0.14175727963447570,
            -0.11781750619411469,
            0.38926169276237490,
            -0.31990337371826170,
            0.24176508188247680,
            0.59939318895339970,
            -0.72715508937835690,
            0.39353600144386290,
            -0.38137459754943850,
            0.20685830712318420,
            -0.38994306325912476,
            0.05647854506969452,
            -0.23935276269912720,
            -0.22889091074466705,
            -0.019344180822372437,
            0.040057696402072906,
            -0.24383866786956787,
            -0.39092701673507690,
            -0.018549658358097076,
            0.51890051364898680,
            0.86515939235687260,
            0.28614503145217896,
            0.64386940002441410,
            0.31628671288490295,
            -0.40825888514518740,
            -0.33183339238166810,
            0.16869042813777924,
            0.010168105363845825,
            0.30278283357620240,
            -0.60569459199905400,
            -0.20262216031551360,
            -1.09207832813262940,
            -0.027563804760575294,
            0.06484303623437881,
            0.27420419454574585,
            -0.49345779418945310,
            0.10804055631160736,
            -0.14800167083740234,
            0.08484844118356705,
            -0.78326535224914550,
            -0.006926223635673523,
            -0.25266957283020020,
            -0.26330786943435670,
            0.89378148317337040,
            -0.64368873834609990,
            0.25188437104225160,
            0.04949730634689331,
            -0.23263952136039734,
            -0.0038242843002080917,
            0.24761386215686798,
            0.21502655744552612,
            0.27725243568420410,
            -0.03591444715857506,
            0.11199191957712173,
            0.35744479298591614,
            0.15654230117797852,
            -0.11716540157794952,
            -0.49658292531967163,
            -0.12044863402843475,
            -0.59336757659912110,
            -0.04827989637851715,
            0.27895766496658325,
            0.60082894563674930,
            -0.44568234682083130,
            0.18149539828300476,
            0.84179604053497310,
            -0.20165166258811950,
            0.15945611894130707,
            -0.19363774359226227,
            -0.38449636101722720,
            -0.38157621026039124,
            0.23142817616462708,
            -0.32686632871627810,
            0.32904222607612610,
            -0.62547576427459720,
            -0.17987522482872010,
            0.13854908943176270,
            0.28109687566757200,
            -0.66307181119918820,
            -0.10197299718856812,
            0.23179894685745240,
            0.14371933043003082,
            -0.015187196433544159,
            -0.005701176822185516,
            -0.009048223495483398,
            -0.36947503685951233,
            -0.08419185131788254,
            0.18359073996543884,
            0.36397165060043335,
            -0.18554688990116120,
            0.06282243132591248,
            0.12127010524272919,
            0.10142311453819275,
            -0.75937509536743160,
            0.14368136227130890,
            -0.15232974290847778,
            0.030483879148960114,
            -0.20716962218284607,
            0.09505847096443176,
            -0.03633452206850052,
            0.11635903269052505,
            0.19411554932594300,
            -0.34413999319076540,
            0.09673729538917542,
            0.15466451644897460,
            -0.11886352300643921,
            -0.31654387712478640,
            0.023902088403701782,
            0.59250128269195560,
            -0.03467556834220886,
            -0.19663128256797790,
            0.07225932180881500,
            -0.20673781633377075,
            0.10626789927482605,
            0.27759736776351930,
            0.14237537980079650,
            -0.06108829379081726,
            -0.14290234446525574,
            -0.034046679735183716,
            -0.23872807621955872,
            -0.30120781064033510,
            0.53876233100891110,
            0.47913902997970580,
            0.15108020603656770,
            -0.21000367403030396,
            -0.09006668627262115,
            -0.12558355927467346,
            -0.29648718237876890,
            -0.09471682459115982,
            0.10165409743785858,
            -0.04843531921505928,
            -0.20445811748504640,
            -0.64695239067077640,
            0.34345996379852295,
            0.25094231963157654,
            0.28040134906768800,
            0.26930731534957886,
            -0.18992258608341217,
            -0.31795889139175415,
            0.10275565087795258,
            -0.31493186950683594,
            0.05224027484655380,
            0.03900603950023651,
            -0.15962079167366028,
            -0.40141177177429200,
            1.50395190715789800,
            -0.18131579458713531,
            0.25262355804443360,
            0.56724452972412110,
            0.19896474480628967,
            0.22113317251205444,
            -0.37682905793190000,
            -0.34762057662010193,
            -0.36291345953941345,
            0.38737395405769350,
            0.39863935112953186,
            0.06930093467235565,
            -0.07484766840934753,
            0.26550960540771484,
            -0.37431126832962036,
            0.06163658946752548,
            -0.16546487808227540,
            -0.16572664678096770,
            -0.41679629683494570,
            -0.22878777980804443,
            0.17536523938179016,
            0.43185859918594360,
            -0.18755021691322327,
            0.57233977317810060,
            0.34548804163932800,
            0.26037001609802246,
            0.57140541076660160,
            1.03332614898681640,
            -1.69704651832580570,
            0.44388985633850100,
            0.08646445721387863,
            -0.32414677739143370,
            -0.39306485652923584,
            0.21713417768478394,
            -0.38696998357772827,
            0.16778808832168580,
            -0.05270355939865112,
            -0.22387394309043884,
            0.07469445466995239,
            0.04779075086116791,
            0.30713665485382080,
            -0.33245295286178590,
            -0.26004213094711304,
            -0.12230075895786285,
            -0.65894758701324460,
            0.06937650591135025,
            0.11567105352878570,
            0.38836821913719180,
            -0.07238084077835083,
            0.58317494392395020,
            0.71717137098312380,
            0.10365724563598633,
            -0.58237200975418090,
            0.01732088252902031,
            0.86498779058456420,
            -0.04113391041755676,
            -0.09420709311962128,
            0.19938360154628754,
            0.004110394045710564,
            0.0035112202167510986,
            0.32821851968765260,
            0.20233154296875000,
            0.10732693225145340,
            1.30262577533721920,
            -0.25104320049285890,
            -0.09294586628675461,
            0.07033525407314300,
            0.26292678713798523,
            -0.10476322472095490,
            0.49015024304389954,
            -0.38899934291839600,
            -0.057010307908058167,
            -0.19918194413185120,
            -0.23839278519153595,
            0.34912475943565370,
            -0.38353130221366880,
            0.034570418298244476,
            -0.10393957048654556,
            -0.19936946034431458,
            0.30964389443397520,
            -0.012369591742753983,
            -0.14967474341392517,
            -0.11177364736795425,
            -0.19989341497421265,
            0.62171781063079830,
            0.20537722110748290,
            0.16507479548454285,
            -0.59005945920944210,
            -0.11848224699497223,
            0.00022661685943603516,
            0.03684444725513458,
            0.06734884530305862,
            -0.06063830852508545,
            0.06855276226997375,
            0.38286936283111570,
            -0.07564809173345566,
            0.11344917118549347,
            -0.42775198817253113,
            -0.23143202066421510,
            -0.13804715871810913,
            0.08444565534591675,
            -0.17835569381713867,
            -0.56565302610397340,
            -0.04202693700790405,
            0.09906928986310959,
            0.78766095638275150,
            0.38724774122238160,
            0.22494032979011536,
            -0.09758158773183823,
            0.30130439996719360,
            0.08548129349946976,
            0.012833205051720142,
            -0.33451801538467410,
            -0.02345825731754303,
            -0.11464481055736542,
            0.20209941267967224,
            0.13876622915267944,
            -0.09112481772899628,
            0.59946906566619870,
            -0.31222972273826600,
            -0.15563198924064636,
            -0.019779425114393234,
            -0.18419799208641052,
            -0.36252117156982420,
            -0.66804647445678710,
            0.07264155894517899,
            0.14690190553665160,
            0.58527380228042600,
            0.10589228570461273,
            0.15317067503929138,
            -0.14340689778327942,
            0.11329543590545654,
            0.21681559085845947,
            -0.01961892843246460,
            0.22408972680568695,
            0.40270829200744630,
            -0.28345388174057007,
            0.001580655574798584,
            0.29231256246566770,
            -0.31483244895935060,
            -0.66095465421676640,
            0.12513107061386108,
            0.25342079997062683,
            -0.35947406291961670,
            0.10373535752296448,
            -0.14622645080089570,
            0.03869847208261490,
            -0.13646872341632843,
            -0.054877884685993195,
            -0.29587787389755250,
            0.10567575693130493,
            -0.27623349428176880,
            -0.16489294171333313,
            0.03129418194293976,
            -0.36633712053298950,
            -0.30330657958984375,
            -0.10047523677349090,
            0.38868999481201170,
            0.18341153860092163,
            -0.42602014541625977,
            -0.42138785123825073,
            0.16399800777435303,
            -0.13668435811996460,
            0.08918181061744690,
            0.18008530139923096,
            0.34570962190628050,
            0.13715223968029022,
            -0.35308316349983215,
            0.017223667353391647,
            0.16259710490703583,
            -2.01324987411499020,
            0.35719367861747740,
            0.05423700809478760,
            0.64791858196258540,
            1.41284525394439700,
            -0.025331489741802216,
            0.03643947094678879,
            -0.07986896485090256,
            -0.45607382059097290,
            -0.36353543400764465,
            -0.022743068635463715,
            0.41851943731307983,
            0.05244317650794983,
            0.17263151705265045,
            0.07288816571235657,
            0.30261635780334470,
            -0.38646593689918520,
            -0.054808780550956726,
            -0.28826522827148440,
            -0.01994667947292328,
            -0.48321542143821716,
            -0.21889880299568176,
            -0.26040261983871460,
            -0.52937489748001100,
            -0.041442275047302246,
            -1.15707290172576900,
            0.22746005654335022,
            -0.12931922078132630,
            0.35249620676040650,
            0.27543902397155760,
            -0.39276057481765747,
            -0.42217552661895750,
            -0.22715577483177185,
            0.004897281527519226,
            -0.31350314617156980,
            -0.45807397365570070,
            0.25268691778182983,
            0.04663296043872833,
            -0.59933739900588990,
            0.15925574302673340,
            -0.08339263498783112,
            0.18594521284103394,
            -0.13940119743347168,
            0.30508360266685486,
            -0.24364741146564484,
            -0.64189815521240230,
            -0.02178923785686493,
            -0.22042772173881530,
            0.34853425621986390,
            0.46653327345848083,
            -0.03486161679029465,
            0.50477695465087890,
            -0.10376831889152527,
            -0.14050556719303130,
            -0.08073642104864120,
            0.06925593316555023,
            0.21366350352764130,
            0.24056504666805267,
            0.12795145809650420,
            0.16419601440429688,
            0.06756377220153809,
            -0.18162062764167786,
            0.33428809046745300,
            0.06203627586364746,
            0.63255858421325680,
            -0.51533907651901250,
            0.13819636404514313,
            0.07493585348129272,
            -0.19676387310028076,
            0.30928391218185425,
            -0.47425344586372375,
            0.09209989756345749,
            0.44058740139007570,
            0.24711114168167114,
            -0.32648178935050964,
            0.40268272161483765,
            0.11267729103565216,
            0.17878434062004090,
            -0.52805340290069580,
            0.46472996473312380,
            -0.47340789437294006,
            0.62205803394317630,
            -0.28207665681838990,
            0.04906800761818886,
        ],
        "clip_embeddings_magnitude": 10.556536674499512,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[216, 130, 71]",
        "video_length": None,
        "removed": False,
        "in_trashcan": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "1/1000",
        "size": 7487773,
        "subjectDistance": 0.265,
        "width": 4032,
        "main_file_id": "cac6402c7ff192e6fa96fee50ba24fd81",
    },
    {
        "thumbnail_big": "thumbnails_big/1f522608a263a88ea72010fe4f08f3071.webp",
        "square_thumbnail": "square_thumbnails/1f522608a263a88ea72010fe4f08f3071.webp",
        "square_thumbnail_small": "square_thumbnails_small/1f522608a263a88ea72010fe4f08f3071.webp",
        "added_on": "2023-06-16 16:30:51.051404 +00:00",
        "exif_gps_lat": -33.941975,
        "exif_gps_lon": 151.265088888889,
        "exif_timestamp": "2017-10-17 10:13:13.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [151.265089, -33.941975],
            "features": [
                {
                    "id": "poi.721554610670",
                    "text": "Mistral Point",
                    "type": "Feature",
                    "center": [151.26523, -33.941658],
                    "context": [
                        {
                            "id": "postcode.503310",
                            "text": "2035",
                            "mapbox_id": "dXJuOm1ieHBsYzpCNjRP",
                        },
                        {
                            "id": "locality.269412878",
                            "text": "Maroubra",
                            "wikidata": "Q2914843",
                            "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                        },
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.26523, -33.941658],
                    },
                    "relevance": 1,
                    "place_name": "Mistral Point, Sydney, New South Wales 2035, Australia",
                    "place_type": ["poi"],
                    "properties": {
                        "category": "historic site, historic",
                        "landmark": True,
                        "foursquare": "5958b8724420d86b1808f7bd",
                    },
                },
                {
                    "id": "postcode.503310",
                    "bbox": [151.205214, -33.958015, 151.265693, -33.931801],
                    "text": "2035",
                    "type": "Feature",
                    "center": [151.242438, -33.942906],
                    "context": [
                        {
                            "id": "locality.269412878",
                            "text": "Maroubra",
                            "wikidata": "Q2914843",
                            "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                        },
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.242438, -33.942906],
                    },
                    "relevance": 1,
                    "place_name": "2035, Maroubra, New South Wales, Australia",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzpCNjRP"},
                },
                {
                    "id": "locality.269412878",
                    "bbox": [151.226804557, -33.958002321, 151.292531935, -33.93283624],
                    "text": "Maroubra",
                    "type": "Feature",
                    "center": [151.2575, -33.9475],
                    "context": [
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {"type": "Point", "coordinates": [151.2575, -33.9475]},
                    "relevance": 1,
                    "place_name": "Maroubra, New South Wales, Australia",
                    "place_type": ["locality"],
                    "properties": {
                        "wikidata": "Q2914843",
                        "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                    },
                },
                {
                    "id": "place.24496142",
                    "bbox": [150.520934139, -34.11717528, 151.369884128, -33.562644328],
                    "text": "Sydney",
                    "type": "Feature",
                    "center": [151.216454, -33.854816],
                    "context": [
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.216454, -33.854816],
                    },
                    "relevance": 1,
                    "place_name": "Sydney, New South Wales, Australia",
                    "place_type": ["place"],
                    "properties": {
                        "wikidata": "Q3130",
                        "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                    },
                },
                {
                    "id": "region.33806",
                    "bbox": [140.999265, -37.5097258, 159.200456, -28.1370359],
                    "text": "New South Wales",
                    "type": "Feature",
                    "center": [147.014694071448, -32.168971672412],
                    "context": [
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [147.014694071448, -32.168971672412],
                    },
                    "relevance": 1,
                    "place_name": "New South Wales, Australia",
                    "place_type": ["region"],
                    "properties": {
                        "wikidata": "Q3224",
                        "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                        "short_code": "AU-NSW",
                    },
                },
                {
                    "id": "country.8718",
                    "bbox": [112.8256904, -54.8327658, 159.200456, -9.0436707],
                    "text": "Australia",
                    "type": "Feature",
                    "center": [134.489562606981, -25.7349684916223],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [134.489562606981, -25.7349684916223],
                    },
                    "relevance": 1,
                    "place_name": "Australia",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q408",
                        "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                        "short_code": "au",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Mistral Point 2035 Maroubra Sydney New South Wales Australia",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "natural light",
                    "open area",
                    "cloth",
                    "sunny",
                    "rugged scene",
                    "man made",
                    "no horizon",
                    "dry",
                    "climbing",
                ],
                "categories": [],
                "environment": "outdoor",
            }
        },
        "search_captions": "outdoor",
        "search_location": "Mistral Point 2035 Maroubra Sydney New South Wales Australia",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            -0.07165607810020447,
            0.27777394652366640,
            -0.15911960601806640,
            -0.008188512176275253,
            -0.009010881185531616,
            0.034435927867889404,
            -0.03819745033979416,
            0.64109969139099120,
            0.26547160744667053,
            0.12205618619918823,
            0.29898315668106080,
            -0.10334454476833344,
            0.48246607184410095,
            -0.35823887586593630,
            -0.024076826870441437,
            -0.39234489202499390,
            -1.93601369857788090,
            -0.038323208689689636,
            0.26534727215766907,
            -0.31557315587997437,
            0.42033576965332030,
            0.10789811611175537,
            0.25757673382759094,
            -0.69643688201904300,
            0.02039242535829544,
            0.61391353607177730,
            -0.14854159951210022,
            -0.02548396587371826,
            0.09138785302639008,
            0.01601754128932953,
            -0.16707235574722290,
            0.18399655818939210,
            -0.35197073221206665,
            -0.67160075902938840,
            -0.25247159600257874,
            0.025167599320411682,
            -0.03638566657900810,
            0.30362653732299805,
            0.54022008180618290,
            -0.18761183321475983,
            -0.54178249835968020,
            0.14752727746963500,
            0.14671368896961212,
            -0.26148569583892820,
            0.16243551671504974,
            -1.18054628372192380,
            0.53845894336700440,
            -0.16278918087482452,
            -0.22392278909683228,
            -0.31029137969017030,
            0.10120061784982681,
            0.36866247653961180,
            0.68476313352584840,
            -0.32936185598373413,
            0.42605328559875490,
            0.29965081810951233,
            -0.09844471514225006,
            -0.25767421722412110,
            -0.34776532649993896,
            -0.34964543581008910,
            -0.35941550135612490,
            -0.04731412231922150,
            -0.12926623225212097,
            0.11695092916488647,
            -0.32863533496856690,
            -0.19086918234825134,
            -0.16123855113983154,
            1.26160860061645500,
            -0.38261440396308900,
            -0.038163766264915466,
            -0.17712144553661346,
            0.07694791257381439,
            -0.38384479284286500,
            -0.39457264542579650,
            -0.024550501257181168,
            -0.30032104253768920,
            -0.48474478721618650,
            0.17176222801208496,
            -0.35844194889068604,
            -0.22569467127323150,
            -0.04710277169942856,
            0.26759219169616700,
            0.18299442529678345,
            0.42168390750885010,
            0.27530056238174440,
            0.08983490616083145,
            0.56285107135772700,
            -0.36590436100959780,
            -0.21663343906402588,
            -0.23292037844657898,
            0.28227549791336060,
            -0.03927003592252731,
            -6.69503688812255900,
            0.40044450759887695,
            0.17168624699115753,
            0.16189746558666230,
            -0.21396432816982270,
            -0.18209101259708405,
            -0.14555342495441437,
            -1.11969792842865000,
            0.26553612947463990,
            -0.43248271942138670,
            -0.23711906373500824,
            0.13495093584060670,
            -0.57171511650085450,
            0.31623297929763794,
            -0.26300746202468870,
            0.11482997238636017,
            -0.04145537316799164,
            -0.012881413102149963,
            0.38327059149742126,
            -0.28872770071029663,
            0.13417448103427887,
            0.0004943050444126129,
            -0.48013591766357420,
            0.15905582904815674,
            -0.17036144435405730,
            0.11494286358356476,
            0.38910707831382750,
            -0.04960992932319641,
            0.0068108439445495605,
            -0.39681759476661680,
            0.05528683960437775,
            0.25615781545639040,
            0.16935455799102783,
            -0.15641900897026062,
            0.030953165143728256,
            -0.09216502308845520,
            -0.51438409090042110,
            0.20902346074581146,
            0.09113435447216034,
            -0.28546446561813354,
            0.12450934201478958,
            0.90055423974990840,
            -0.30295214056968690,
            0.04577522724866867,
            0.23674716055393220,
            0.19620284438133240,
            -0.14195847511291504,
            0.027747787535190582,
            0.24356174468994140,
            -0.24453750252723694,
            -0.13842593133449554,
            -0.04814389348030090,
            -0.29600149393081665,
            0.33813029527664185,
            -0.40565192699432373,
            1.04664814472198490,
            -0.12125436961650848,
            -0.04555452987551689,
            -0.32212057709693910,
            0.19244483113288880,
            -0.17625807225704193,
            -0.11717353016138077,
            0.52924054861068730,
            -0.91078692674636840,
            0.61408323049545290,
            -0.015624964609742165,
            0.005238614976406097,
            0.49075758457183840,
            -0.62067019939422610,
            0.30432268977165220,
            -0.032360561192035675,
            0.30186992883682250,
            -0.41565680503845215,
            -0.36446920037269590,
            0.94007527828216550,
            0.70317226648330690,
            0.23549987375736237,
            -0.39121294021606445,
            -0.17178057134151460,
            -0.042171500623226166,
            0.05205693840980530,
            -0.12189273536205292,
            -0.19439676403999330,
            -0.12377274036407471,
            -0.34452289342880250,
            0.02267320826649666,
            -0.68486988544464110,
            0.55518913269042970,
            0.44782432913780210,
            0.029707305133342743,
            -0.07340695708990097,
            0.25972485542297363,
            -0.25381219387054443,
            0.19427055120468140,
            0.29389485716819763,
            -0.50578629970550540,
            0.15614330768585205,
            0.31318914890289307,
            -0.08632530272006989,
            -0.23409178853034973,
            0.05476500093936920,
            0.44156715273857117,
            -0.22440673410892487,
            0.023980028927326202,
            -0.43828743696212770,
            -0.19539453089237213,
            0.70773118734359740,
            -0.21142446994781494,
            -0.012780480086803436,
            0.06678064167499542,
            -0.12673433125019073,
            -0.016046274453401566,
            0.34845018386840820,
            -0.37029501795768740,
            -0.41383981704711914,
            0.14042145013809204,
            -0.07714009284973145,
            0.23623535037040710,
            -0.07902203500270844,
            -0.22669017314910890,
            0.13354891538619995,
            0.24691657721996307,
            -0.23718547821044922,
            0.19054308533668518,
            -0.10418700426816940,
            0.33725842833518980,
            -0.08150300383567810,
            -0.020559510216116905,
            -0.06275172531604767,
            0.32859966158866880,
            -0.23827262222766876,
            0.006859809160232544,
            -0.43626987934112550,
            0.00422387570142746,
            -0.42823368310928345,
            0.06333791464567184,
            0.24973529577255250,
            -0.038866639137268066,
            0.39266145229339600,
            -0.33822238445281980,
            0.20358082652091980,
            0.45638072490692140,
            0.24203394353389740,
            -1.19550085067749020,
            -0.07111288607120514,
            0.31889787316322327,
            -0.07209780812263489,
            0.08574327081441879,
            -0.05155383050441742,
            0.10396289825439453,
            0.37258481979370117,
            0.31418317556381226,
            -0.41241401433944700,
            0.15978108346462250,
            0.07924050092697144,
            0.046578992158174515,
            0.14554628729820251,
            0.23571312427520752,
            -0.67628896236419680,
            0.16695483028888702,
            -0.21981866657733917,
            0.16223661601543427,
            -0.021025659516453743,
            0.06956741958856583,
            -0.30338615179061890,
            -0.16539447009563446,
            1.11133313179016110,
            0.07875859737396240,
            0.08710280805826187,
            0.09269724786281586,
            0.43146112561225890,
            -0.63181507587432860,
            0.24583837389945984,
            -0.44661480188369750,
            0.03440243750810623,
            0.11665569245815277,
            0.15819263458251953,
            0.12243788689374924,
            0.29396194219589233,
            0.09694259613752365,
            0.02281755954027176,
            -0.21637912094593048,
            -0.37317517399787903,
            0.33211824297904970,
            0.18465763330459595,
            0.04658152908086777,
            -0.22277922928333282,
            -0.01132119633257389,
            -0.22123819589614868,
            0.21734745800495148,
            0.18564417958259583,
            -0.16151818633079530,
            -0.012778416275978088,
            0.22715422511100770,
            -0.61123466491699220,
            -0.25164487957954407,
            -0.62368929386138920,
            -0.08976317942142487,
            -0.18425342440605164,
            0.01974041759967804,
            0.40116083621978760,
            0.09709006547927856,
            0.02330559492111206,
            -0.24683454632759094,
            0.46549883484840393,
            0.17286136746406555,
            0.13242653012275696,
            -0.018801003694534302,
            0.05591413378715515,
            -0.008567705750465393,
            0.31677705049514770,
            -0.03249857574701309,
            0.23144552111625670,
            -0.19878269731998444,
            0.34026873111724854,
            0.46859806776046753,
            0.46318793296813965,
            -0.15173172950744630,
            0.03247187286615372,
            -0.35306686162948610,
            0.89938664436340330,
            -0.12891116738319397,
            0.23192928731441498,
            -0.20485301315784454,
            0.26682716608047485,
            0.03473209589719772,
            -0.05685047805309296,
            0.85817599296569820,
            0.20728000998497010,
            -0.42015826702117920,
            -0.20325171947479248,
            -0.18902121484279633,
            -0.08646465092897415,
            0.47624379396438600,
            0.07658274471759796,
            0.24890711903572083,
            0.09770368039608002,
            -0.07584749162197113,
            -0.38329556584358215,
            -0.09186994284391403,
            0.05287090688943863,
            -0.07528317719697952,
            -0.30612573027610780,
            0.03865929692983627,
            0.20936234295368195,
            -0.12896691262722015,
            0.40101802349090576,
            -0.27413615584373474,
            -0.11920598894357681,
            -0.27652582526206970,
            0.16087099909782410,
            0.30647218227386475,
            -0.23265513777732850,
            -0.04036612808704376,
            -0.19249220192432404,
            0.29576075077056885,
            -0.33208352327346800,
            -0.26545786857604980,
            -0.47843095660209656,
            0.05080226808786392,
            -0.18463236093521118,
            -0.31534552574157715,
            -0.16215364634990692,
            0.44137579202651980,
            0.19857212901115417,
            -0.05095067620277405,
            0.60800743103027340,
            0.18676830828189850,
            0.43479916453361510,
            -0.31042078137397766,
            0.34246861934661865,
            -0.22135923802852630,
            -0.16289021074771880,
            0.14682009816169740,
            -0.05069936811923981,
            -1.54986953735351560,
            -0.20729129016399384,
            0.30774104595184326,
            -0.74974900484085080,
            0.17779231071472168,
            0.29844737052917480,
            -0.028225738555192947,
            0.06633662432432175,
            0.09315972030162811,
            1.39255237579345700,
            0.08268950879573822,
            0.17041748762130737,
            -0.07805733382701874,
            -0.009891202673316002,
            -0.42962673306465150,
            -0.31951111555099490,
            -0.59171640872955320,
            0.13881197571754456,
            0.05963444709777832,
            0.36311095952987670,
            0.20484755933284760,
            -0.24004952609539032,
            -0.30473378300666810,
            -1.23349046707153320,
            0.12950478494167328,
            0.13113403320312500,
            -0.13356469571590424,
            -0.33658254146575930,
            -0.17962300777435303,
            0.44429525732994080,
            0.25605937838554380,
            -0.18255349993705750,
            -0.34041595458984375,
            0.12862077355384827,
            -0.10708140581846237,
            -0.04143147915601730,
            -0.75912737846374510,
            0.11328382045030594,
            -0.33319079875946045,
            -0.12773975729942322,
            -0.24314782023429870,
            -0.08418860286474228,
            0.024868622422218323,
            -0.24916192889213562,
            0.14967927336692810,
            0.50531852245330810,
            -0.17624694108963013,
            -0.32372432947158813,
            0.26036772131919860,
            -0.13107712566852570,
            -0.19526052474975586,
            -0.34996968507766724,
            0.09007526934146881,
            -0.19009685516357422,
            -0.04918465018272400,
            0.42598405480384827,
            -0.95772063732147220,
            -0.26188156008720400,
            -0.13462109863758087,
            -0.48766309022903440,
            -0.04416780546307564,
            -0.24330116808414460,
            0.49982681870460510,
            -0.59761744737625120,
            -0.51605522632598880,
            0.25707191228866577,
            0.06983644515275955,
            -0.70166909694671630,
            -0.44174510240554810,
            0.59883981943130490,
            -0.23916383087635040,
            -0.23846682906150818,
            -0.09755046665668488,
            0.06088256835937500,
            0.57148891687393190,
            -0.46913427114486694,
            0.10756542533636093,
            0.24516284465789795,
            -0.29232767224311830,
            -0.41785952448844910,
            -0.20276978611946106,
            -0.09826758503913880,
            0.03998877853155136,
            0.23493704199790955,
            -0.30350178480148315,
            -0.05809980630874634,
            -0.92815858125686650,
            -0.07727308571338654,
            0.009639181196689606,
            0.11947400122880936,
            -0.32069391012191770,
            -0.15333953499794006,
            -0.20000588893890380,
            0.51839399337768550,
            -0.12886822223663330,
            -0.06542570143938065,
            -0.07890033721923828,
            0.67580813169479370,
            0.23756900429725647,
            -0.39474987983703613,
            -0.08904854953289032,
            0.10808389633893967,
            0.55502021312713620,
            -0.06922332942485810,
            0.08530282974243164,
            -0.64823102951049800,
            -0.25969624519348145,
            0.18102583289146423,
            -0.15270616114139557,
            -0.08661939203739166,
            -0.13988846540451050,
            -0.13920640945434570,
            -0.19092643260955810,
            -0.30402636528015137,
            0.034376729279756546,
            0.28963160514831543,
            -0.026797950267791748,
            -0.009581595659255981,
            -0.13647942245006560,
            0.45053595304489136,
            -0.13274556398391724,
            -0.32779148221015930,
            -0.29205349087715150,
            -0.04352697730064392,
            -0.10386516153812408,
            0.09681421518325806,
            -0.43473735451698303,
            -0.12714838981628418,
            -0.13591085374355316,
            -0.019401680678129196,
            0.08398979157209396,
            -0.21437484025955200,
            0.16760951280593872,
            0.06209127604961395,
            0.10363107919692993,
            0.037978142499923706,
            0.25537312030792236,
            -0.006652772426605225,
            -0.29459229111671450,
            0.13102664053440094,
            0.72616183757781980,
            -0.90198361873626710,
            -0.04998414218425751,
            0.015783268958330154,
            0.34867671132087710,
        ],
        "clip_embeddings_magnitude": 10.424424171447754,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[99, 135, 179]",
        "video_length": None,
        "removed": False,
        "in_trashcan": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "0",
        "size": 9246412,
        "subjectDistance": 1.686,
        "width": 4032,
        "main_file_id": "1f522608a263a88ea72010fe4f08f3071",
    },
    {
        "thumbnail_big": "thumbnails_big/e05dc030e807ae8fc31442fa2ba7fdf81.webp",
        "square_thumbnail": "square_thumbnails/e05dc030e807ae8fc31442fa2ba7fdf81.webp",
        "square_thumbnail_small": "square_thumbnails_small/e05dc030e807ae8fc31442fa2ba7fdf81.webp",
        "added_on": "2023-06-16 16:30:42.859303 +00:00",
        "exif_gps_lat": -33.8880555555556,
        "exif_gps_lon": 151.275180555556,
        "exif_timestamp": "2017-10-18 15:08:09.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [151.275181, -33.888056],
            "features": [
                {
                    "id": "address.6965576203835628",
                    "text": "Beach Road",
                    "type": "Feature",
                    "center": [151.275216500055, -33.888012425],
                    "address": "17",
                    "context": [
                        {
                            "id": "postcode.429582",
                            "text": "2026",
                            "mapbox_id": "dXJuOm1ieHBsYzpCbzRP",
                        },
                        {
                            "id": "locality.259156494",
                            "text": "Bondi Beach",
                            "wikidata": "Q673418",
                            "mapbox_id": "dXJuOm1ieHBsYzpEM0pxRGc",
                        },
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.275216500055, -33.888012425],
                    },
                    "relevance": 1,
                    "place_name": "17 Beach Road, Bondi Beach New South Wales 2026, Australia",
                    "place_type": ["address"],
                    "properties": {
                        "accuracy": "rooftop",
                        "mapbox_id": "dXJuOm1ieGFkcjo3NmQ1MTQzZi1kZmEwLTQ4NzAtYTAyNy0zYWY1MGJiZTIxYWU",
                    },
                },
                {
                    "id": "postcode.429582",
                    "bbox": [151.2582, -33.90058, 151.285977, -33.878047],
                    "text": "2026",
                    "type": "Feature",
                    "center": [151.271075, -33.898745],
                    "context": [
                        {
                            "id": "locality.259156494",
                            "text": "Bondi Beach",
                            "wikidata": "Q673418",
                            "mapbox_id": "dXJuOm1ieHBsYzpEM0pxRGc",
                        },
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.271075, -33.898745],
                    },
                    "relevance": 1,
                    "place_name": "2026, Bondi Beach, New South Wales, Australia",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzpCbzRP"},
                },
                {
                    "id": "locality.259156494",
                    "bbox": [151.26203377, -33.896871333, 151.282858153, -33.884999032],
                    "text": "Bondi Beach",
                    "type": "Feature",
                    "center": [151.2745, -33.8915],
                    "context": [
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {"type": "Point", "coordinates": [151.2745, -33.8915]},
                    "relevance": 1,
                    "place_name": "Bondi Beach, New South Wales, Australia",
                    "place_type": ["locality"],
                    "properties": {
                        "wikidata": "Q673418",
                        "mapbox_id": "dXJuOm1ieHBsYzpEM0pxRGc",
                    },
                },
                {
                    "id": "place.24496142",
                    "bbox": [150.520934139, -34.11717528, 151.369884128, -33.562644328],
                    "text": "Sydney",
                    "type": "Feature",
                    "center": [151.216454, -33.854816],
                    "context": [
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.216454, -33.854816],
                    },
                    "relevance": 1,
                    "place_name": "Sydney, New South Wales, Australia",
                    "place_type": ["place"],
                    "properties": {
                        "wikidata": "Q3130",
                        "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                    },
                },
                {
                    "id": "region.33806",
                    "bbox": [140.999265, -37.5097258, 159.200456, -28.1370359],
                    "text": "New South Wales",
                    "type": "Feature",
                    "center": [147.014694071448, -32.168971672412],
                    "context": [
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [147.014694071448, -32.168971672412],
                    },
                    "relevance": 1,
                    "place_name": "New South Wales, Australia",
                    "place_type": ["region"],
                    "properties": {
                        "wikidata": "Q3224",
                        "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                        "short_code": "AU-NSW",
                    },
                },
                {
                    "id": "country.8718",
                    "bbox": [112.8256904, -54.8327658, 159.200456, -9.0436707],
                    "text": "Australia",
                    "type": "Feature",
                    "center": [134.489562606981, -25.7349684916223],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [134.489562606981, -25.7349684916223],
                    },
                    "relevance": 1,
                    "place_name": "Australia",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q408",
                        "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                        "short_code": "au",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Beach Road 2026 Bondi Beach Sydney New South Wales Australia",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "no horizon",
                    "man made",
                    "wood",
                    "natural light",
                    "cloth",
                    "railing",
                    "fencing",
                    "soothing",
                    "enclosed area",
                ],
                "categories": ["boardwalk"],
                "environment": "outdoor",
            }
        },
        "search_captions": "boardwalk , outdoor",
        "search_location": "Beach Road 2026 Bondi Beach Sydney New South Wales Australia",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            -0.23971192538738250,
            -0.06270129978656769,
            -0.26378244161605835,
            0.06143847107887268,
            -0.17431882023811340,
            -0.45036801695823670,
            0.23159477114677430,
            0.45534604787826540,
            0.41466632485389710,
            0.43482506275177000,
            0.033715225756168365,
            -0.12434051930904388,
            -0.02738797664642334,
            0.13923697173595428,
            0.71357935667037960,
            -0.10237488895654678,
            0.44860103726387024,
            -0.12994986772537231,
            0.16177919507026672,
            -0.52953779697418210,
            -0.15292952954769135,
            0.35376715660095215,
            0.68445837497711180,
            -0.12952817976474762,
            -0.65442270040512080,
            -0.11123260110616684,
            0.35111707448959350,
            -0.21466320753097534,
            -0.07700178027153015,
            0.60484236478805540,
            -0.35141080617904663,
            0.42874458432197570,
            -0.14701411128044128,
            -0.31290709972381590,
            0.41403374075889590,
            0.42659783363342285,
            0.14210951328277588,
            0.21080046892166138,
            -0.20884071290493011,
            1.55791330337524410,
            -1.02671170234680180,
            -0.21040523052215576,
            0.21100938320159912,
            -0.018877588212490082,
            0.045770272612571716,
            -1.74390268325805660,
            0.27797201275825500,
            0.11735321581363678,
            -0.16868110001087190,
            0.07083947211503983,
            0.17496472597122192,
            0.18361502885818481,
            0.06942721456289291,
            0.29114612936973570,
            0.16485445201396942,
            0.35742586851119995,
            0.71032893657684330,
            0.08239606022834778,
            -0.48378357291221620,
            0.40987241268157960,
            0.61319535970687870,
            0.07883536070585251,
            0.52093547582626340,
            0.56784075498580930,
            0.13938774168491364,
            -0.15158170461654663,
            0.37094724178314210,
            0.83913630247116090,
            -0.48059833049774170,
            -0.05472422018647194,
            0.50041580200195310,
            0.14854013919830322,
            0.11348950862884521,
            -0.10606382042169571,
            -0.032269977033138275,
            -0.10980830341577530,
            -0.06923694908618927,
            -0.44631308317184450,
            0.06693774461746216,
            -0.67717289924621580,
            0.16200356185436250,
            -0.08856121450662613,
            -0.45839691162109375,
            -0.59329897165298460,
            0.027508363127708435,
            -0.17059496045112610,
            1.00395536422729500,
            -0.40785533189773560,
            0.20544975996017456,
            -0.61956644058227540,
            0.30773437023162840,
            -0.75228130817413330,
            -6.36993885040283200,
            0.23692467808723450,
            -0.18002653121948242,
            0.41877511143684387,
            -0.03537013381719589,
            -0.13835334777832030,
            -0.28309312462806700,
            0.99767374992370600,
            0.43206804990768430,
            -0.61333036422729490,
            0.31665223836898804,
            0.011051952838897705,
            0.26114824414253235,
            0.20024497807025910,
            0.86893093585968020,
            0.16212932765483856,
            0.038838282227516174,
            0.10568191856145859,
            0.18302081525325775,
            -0.49132484197616577,
            -0.13319587707519530,
            -0.38572445511817930,
            0.09171506762504578,
            -0.26322168111801150,
            -0.66410481929779050,
            0.13588872551918030,
            0.47181224822998047,
            -0.05031928792595863,
            0.25005054473876953,
            0.21581515669822693,
            0.25475072860717773,
            -0.24969539046287537,
            0.54527783393859860,
            -0.27312040328979490,
            -0.55337727069854740,
            0.23277127742767334,
            0.014410212635993958,
            0.24621416628360748,
            0.11218813061714172,
            -0.35024920105934143,
            -0.21312740445137024,
            0.80181252956390380,
            -0.79384481906890870,
            0.50359219312667850,
            -0.45367711782455444,
            -0.48844304680824280,
            -0.11650219559669495,
            -0.12895251810550690,
            -0.26562160253524780,
            0.20769277215003967,
            -0.21654091775417328,
            0.21669554710388184,
            -0.23972092568874360,
            0.43769764900207520,
            0.32644972205162050,
            0.35533404350280760,
            0.28178536891937256,
            0.40197637677192690,
            0.16447728872299194,
            0.41968211531639100,
            -1.00776052474975590,
            0.09402647614479065,
            0.07121045887470245,
            -0.38577982783317566,
            -0.15076629817485810,
            -0.67609924077987670,
            -0.37826904654502870,
            -0.17423087358474731,
            -0.019086994230747223,
            0.09864071011543274,
            0.30087676644325256,
            0.27617043256759644,
            0.06742041558027267,
            -0.01719839498400688,
            0.47258347272872925,
            0.44886517524719240,
            0.06894390285015106,
            0.013095356523990631,
            -0.34940755367279050,
            0.02119274064898491,
            0.44170263409614563,
            -0.17398183047771454,
            0.11397088319063187,
            -0.25963869690895080,
            0.66773271560668950,
            -0.029286637902259827,
            0.26047524809837340,
            0.16783103346824646,
            -0.10030107200145721,
            -0.28766095638275146,
            -0.20763801038265228,
            -0.020237110555171967,
            0.26628720760345460,
            -0.03873760998249054,
            0.33926361799240110,
            -0.22293141484260560,
            -0.02787308767437935,
            -0.02593088522553444,
            -0.14129941165447235,
            0.26731464266777040,
            -0.08877785503864288,
            0.31370738148689270,
            -0.03215152025222778,
            0.28753554821014404,
            0.28241288661956787,
            -0.58873462677001950,
            -1.19819414615631100,
            -0.31043520569801330,
            0.52656930685043330,
            -0.15177714824676514,
            0.04967714473605156,
            0.21121788024902344,
            -0.34197264909744260,
            -0.58301079273223880,
            -0.05980183556675911,
            0.08901736885309220,
            -0.016958534717559814,
            0.70352792739868160,
            0.04605954885482788,
            0.33565390110015870,
            -0.15496665239334106,
            0.008393734693527222,
            -0.39955216646194460,
            -0.58763426542282100,
            -0.06084361672401428,
            0.49945196509361267,
            1.24120748043060300,
            -0.26017981767654420,
            0.88132452964782710,
            0.42076665163040160,
            -0.11274620890617370,
            -0.17265769839286804,
            -0.42378520965576170,
            0.51237106323242190,
            -0.05410161614418030,
            0.19328644871711730,
            0.06429362297058105,
            0.08922037482261658,
            0.26436531543731690,
            -0.07118786871433258,
            0.16370669007301330,
            0.53644728660583500,
            -0.22373552620410920,
            -0.10707579553127289,
            -0.40309336781501770,
            -0.36508309841156006,
            -0.35035932064056396,
            -0.40398806333541870,
            -0.19331835210323334,
            0.46320116519927980,
            0.38004130125045776,
            0.28961494565010070,
            -0.11237305402755737,
            0.92902261018753050,
            0.52717500925064090,
            -0.55640512704849240,
            0.43815851211547850,
            0.17259076237678528,
            0.16953691840171814,
            -0.15717472136020660,
            0.36117780208587646,
            -0.15650644898414612,
            0.41624057292938230,
            0.23601931333541870,
            -0.07374796271324158,
            0.19807760417461395,
            0.90526473522186280,
            0.15534612536430360,
            -0.10369679331779480,
            0.44986745715141296,
            0.14716669917106628,
            -1.63226437568664550,
            0.34298181533813477,
            -0.07653657346963882,
            0.09407752752304077,
            -0.09107702970504761,
            -0.15198035538196564,
            0.40160834789276123,
            -0.11560469865798950,
            0.12189065665006638,
            0.55020934343338010,
            0.23245319724082947,
            -0.33362627029418945,
            -0.026688329875469208,
            0.036947548389434814,
            -0.15187057852745056,
            0.16617432236671448,
            -0.22867006063461304,
            -0.14950640499591827,
            0.18319699168205260,
            -0.16728959977626800,
            -0.10700336098670960,
            -0.40600830316543580,
            0.11292800307273865,
            -0.45587986707687380,
            0.08800569921731949,
            -0.12228171527385712,
            -0.20845821499824524,
            0.012005604803562164,
            0.009173348546028137,
            0.03591999411582947,
            0.06969346106052399,
            -0.057597748935222626,
            -0.26176500320434570,
            0.057852864265441895,
            0.52407950162887570,
            -0.06004469096660614,
            0.09566502273082733,
            0.45640081167221070,
            -0.36844995617866516,
            -0.19065113365650177,
            -0.24948999285697937,
            0.10381768643856049,
            0.20994564890861510,
            -0.43057119846343994,
            0.44703856110572815,
            0.45062947273254395,
            -0.048142626881599426,
            -0.43613320589065550,
            0.68679362535476680,
            0.80048835277557370,
            -0.27635425329208374,
            0.05641265958547592,
            0.45497626066207886,
            -0.07284688949584961,
            0.027119621634483337,
            -0.71727848052978520,
            0.051672548055648804,
            0.49660560488700867,
            -0.014366000890731812,
            -0.32767134904861450,
            0.57496893405914310,
            -0.10740306973457336,
            0.31921407580375670,
            -0.18982721865177155,
            0.62163728475570680,
            0.05321182310581207,
            -0.007055327296257019,
            -0.39857268333435060,
            -0.42034840583801270,
            0.42702692747116090,
            -0.25245079398155210,
            -0.15837675333023070,
            0.13288237154483795,
            0.38176494836807250,
            -0.002602334599941969,
            -0.13858896493911743,
            -0.14321827888488770,
            -0.22877745330333710,
            -0.49555492401123047,
            0.05159477889537811,
            0.11018384248018265,
            0.51627355813980100,
            0.27100521326065063,
            0.25322765111923220,
            0.24974197149276733,
            0.33265298604965210,
            -0.29485535621643066,
            -1.29044723510742190,
            0.04591430723667145,
            -0.07321572303771973,
            -0.14710950851440430,
            0.12631073594093323,
            1.13345527648925780,
            -0.014754462987184525,
            -0.29979729652404785,
            0.16985306143760680,
            -0.009212018921971321,
            0.07431145012378693,
            -0.09315565973520279,
            0.009219720959663391,
            0.010067738592624664,
            -0.63250660896301270,
            0.17347553372383118,
            -0.07402996718883514,
            -0.71398895978927610,
            -0.21345643699169160,
            -0.05977027118206024,
            -0.15027517080307007,
            0.23419082164764404,
            0.07772324234247208,
            0.24337679147720337,
            -0.21138656139373780,
            -0.14810818433761597,
            0.86943644285202030,
            0.16901102662086487,
            -0.56860476732254030,
            0.46403664350509644,
            0.09731522202491760,
            -0.56933224201202390,
            -0.12460615485906601,
            -0.11898320913314820,
            0.07008326053619385,
            -0.28138583898544310,
            -0.13215136528015137,
            -0.17825207114219666,
            0.42181590199470520,
            -1.26650285720825200,
            -0.38550242781639100,
            -0.79046458005905150,
            0.27815857529640200,
            -0.33496844768524170,
            0.35100549459457400,
            -0.047406621277332306,
            -0.28952226042747500,
            0.05926326662302017,
            -0.40099292993545530,
            -0.67989456653594970,
            -0.10077974200248718,
            0.20837950706481934,
            0.22934542596340180,
            -0.19858762621879578,
            0.03676336631178856,
            -0.35527148842811584,
            0.16404820978641510,
            0.00022447854280471802,
            0.76411741971969600,
            -0.28233665227890015,
            0.63915759325027470,
            -0.37327551841735840,
            -0.16160306334495544,
            0.20690485835075378,
            0.13408637046813965,
            0.04813005030155182,
            -0.20736610889434814,
            -0.04153786227107048,
            0.45611751079559326,
            -0.16623178124427795,
            0.62960529327392580,
            0.05700150877237320,
            0.31719794869422910,
            -0.85579967498779300,
            0.26484364271163940,
            -0.24446523189544678,
            -0.15408588945865630,
            -0.19397708773612976,
            -0.11019599437713623,
            0.03778602182865143,
            -0.29206633567810060,
            0.01961149275302887,
            0.15172131359577180,
            -0.28065830469131470,
            0.11242515593767166,
            -0.18694521486759186,
            -0.58477157354354860,
            0.05389549210667610,
            0.22777841985225677,
            -0.32870626449584960,
            0.29864984750747680,
            0.18124125897884370,
            -0.20861062407493590,
            0.0054992809891700745,
            0.03267093002796173,
            -0.49986141920089720,
            -0.11108686029911041,
            -0.59358328580856320,
            -0.37555414438247680,
            -0.06972122937440872,
            0.20261085033416748,
            0.14063805341720580,
            -0.03213777393102646,
            0.64066505432128910,
            0.12838377058506012,
            -0.26487171649932860,
            0.08924877643585205,
            0.24947234988212585,
            0.15273018181324005,
            0.40036311745643616,
            0.044563665986061096,
            0.06986735761165619,
            -0.06490179151296616,
            -0.22339831292629242,
            0.84133744239807130,
            0.18982148170471191,
            -0.25457212328910830,
            0.005809254944324493,
            -0.10496775060892105,
            0.09663195163011551,
            0.053644873201847076,
            -0.12464396655559540,
            -0.52167260646820070,
            -0.03012670949101448,
            -0.42671746015548706,
            0.04330782592296600,
            -0.15239623188972473,
            0.24043066799640656,
            -0.27606680989265440,
            -0.21640032529830933,
            0.22917535901069640,
            -0.07214342057704926,
            -0.007351040840148926,
            -0.10876821726560593,
            -0.30059793591499330,
            0.17446355521678925,
            -0.11450521647930145,
            -0.21727171540260315,
            0.13252682983875275,
            0.28893244266510010,
            -0.34937959909439087,
            0.10954467207193375,
            0.67957222461700440,
            -0.40904277563095090,
            -0.005858458578586578,
            -0.17941795289516450,
            -0.02339877001941204,
            -0.007561013102531433,
            -0.34222379326820374,
            -0.23668894171714783,
            -0.19201411306858063,
            0.07832273840904236,
            -0.17331452667713165,
            0.15513053536415100,
            0.20789094269275665,
            0.011405497789382935,
            -0.022110439836978912,
            0.31066673994064330,
            -0.89273244142532350,
            0.69325125217437740,
            0.22300001978874207,
            -0.06441357731819153,
        ],
        "clip_embeddings_magnitude": 10.693284034729004,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[64, 59, 54]",
        "video_length": None,
        "removed": False,
        "in_trashcan": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "1/390",
        "size": 9145064,
        "subjectDistance": 0.377,
        "width": 4032,
        "main_file_id": "e05dc030e807ae8fc31442fa2ba7fdf81",
    },
    {
        "thumbnail_big": "thumbnails_big/c57f08a55c6daa689e6e13a1bf8f81471.webp",
        "square_thumbnail": "square_thumbnails/c57f08a55c6daa689e6e13a1bf8f81471.webp",
        "square_thumbnail_small": "square_thumbnails_small/c57f08a55c6daa689e6e13a1bf8f81471.webp",
        "added_on": "2023-06-16 16:30:49.679482 +00:00",
        "exif_gps_lat": 33.91345,
        "exif_gps_lon": 78.4573888888889,
        "exif_timestamp": "2017-10-12 08:00:51.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [78.457389, 33.91345],
            "features": [
                {
                    "id": "address.4021415981422040",
                    "text": "Lakeshore Road",
                    "type": "Feature",
                    "center": [78.45710764679163, 33.91336849412403],
                    "context": [
                        {
                            "id": "postcode.13119083",
                            "text": "194201",
                            "mapbox_id": "dXJuOm1ieHBsYzp5QzVy",
                        },
                        {
                            "id": "locality.3711994475",
                            "text": "Shachokol",
                            "wikidata": "Q24912826",
                            "mapbox_id": "dXJuOm1ieHBsYzozVUNLYXc",
                        },
                        {
                            "id": "place.25135211",
                            "text": "Leh",
                            "wikidata": "Q230818",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                        },
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [78.45710764679163, 33.91336849412403],
                    },
                    "relevance": 1,
                    "place_name": "Lakeshore Road ، 194201 Leh، India",
                    "place_type": ["address"],
                    "properties": {"accuracy": "street"},
                },
                {
                    "id": "postcode.13119083",
                    "bbox": [77.159628, 32.619815, 79.042702, 34.608467],
                    "text": "194201",
                    "type": "Feature",
                    "center": [77.668644, 34.050466],
                    "context": [
                        {
                            "id": "locality.3711994475",
                            "text": "Shachokol",
                            "wikidata": "Q24912826",
                            "mapbox_id": "dXJuOm1ieHBsYzozVUNLYXc",
                        },
                        {
                            "id": "place.25135211",
                            "text": "Leh",
                            "wikidata": "Q230818",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                        },
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [77.668644, 34.050466],
                    },
                    "relevance": 1,
                    "place_name": "194201, Leh, Ladakh, India",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzp5QzVy"},
                },
                {
                    "id": "locality.3711994475",
                    "bbox": [77.324409401, 33.676681361, 79.042702, 35.496086],
                    "text": "Shachokol",
                    "type": "Feature",
                    "center": [78.167596, 34.039239],
                    "context": [
                        {
                            "id": "place.25135211",
                            "text": "Leh",
                            "wikidata": "Q230818",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                        },
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [78.167596, 34.039239],
                    },
                    "relevance": 1,
                    "place_name": "Shachokol, Leh, Leh, Ladakh, India",
                    "place_type": ["locality"],
                    "properties": {
                        "wikidata": "Q24912826",
                        "mapbox_id": "dXJuOm1ieHBsYzozVUNLYXc",
                    },
                },
                {
                    "id": "place.25135211",
                    "bbox": [77.107033, 32.33574, 79.305839, 35.522256],
                    "text": "Leh",
                    "type": "Feature",
                    "center": [77.584813, 34.164203],
                    "context": [
                        {
                            "id": "district.3196523",
                            "text": "Leh",
                            "wikidata": "Q1921210",
                            "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                        },
                        {
                            "id": "region.222315",
                            "text": "Ladakh",
                            "wikidata": "Q200667",
                            "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                            "short_code": "IN-LA",
                        },
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [77.584813, 34.164203],
                    },
                    "relevance": 1,
                    "place_name": "Leh, Ladakh, India",
                    "place_type": ["place"],
                    "properties": {
                        "wikidata": "Q230818",
                        "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                    },
                },
                {
                    "id": "region.222315",
                    "bbox": [75.306629, 32.33574, 79.305851, 35.673315],
                    "text": "Ladakh",
                    "type": "Feature",
                    "center": [77.27783203125, 34.0071350643588],
                    "context": [
                        {
                            "id": "country.8811",
                            "text": "India",
                            "wikidata": "Q668",
                            "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                            "short_code": "in",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [77.27783203125, 34.0071350643588],
                    },
                    "relevance": 1,
                    "place_name": "Ladakh, India",
                    "place_type": ["region"],
                    "properties": {
                        "wikidata": "Q200667",
                        "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                        "short_code": "IN-LA",
                    },
                },
                {
                    "id": "country.8811",
                    "bbox": [68.1152344, 6.6718373, 97.395359, 35.673315],
                    "text": "India",
                    "type": "Feature",
                    "center": [78.476681027237, 22.1991660760527],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [78.476681027237, 22.1991660760527],
                    },
                    "relevance": 1,
                    "place_name": "India",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q668",
                        "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                        "short_code": "in",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Lakeshore Road 194201 Shachokol Leh Ladakh India",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "man made",
                    "natural light",
                    "open area",
                    "no horizon",
                    "clouds",
                    "cloth",
                    "vertical components",
                    "sunny",
                    "plastic",
                ],
                "categories": ["playground"],
                "environment": "outdoor",
            }
        },
        "search_captions": "playground , outdoor",
        "search_location": "Lakeshore Road 194201 Shachokol Leh Ladakh India",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            -0.18379329144954681,
            0.14253073930740356,
            -0.34837892651557920,
            0.37873998284339905,
            0.34088349342346190,
            0.17458681762218475,
            0.25472477078437805,
            0.29220539331436160,
            -0.40241336822509766,
            -0.11195755004882812,
            0.30859681963920593,
            0.04621639847755432,
            0.15303245186805725,
            -0.42163884639739990,
            -0.18283540010452270,
            0.27533942461013794,
            -1.12763762474060060,
            -0.24703232944011688,
            0.023488599807024002,
            -0.51369655132293700,
            -0.18228112161159515,
            0.04996514320373535,
            0.09342576563358307,
            -0.17483948171138763,
            -0.25493249297142030,
            0.019286181777715683,
            0.17102202773094177,
            -0.29159709811210630,
            0.33772629499435425,
            -0.19569182395935059,
            -0.19514861702919006,
            0.35274094343185425,
            -0.05648523569107056,
            -0.30300104618072510,
            0.01596139743924141,
            0.47075837850570680,
            -0.26226904988288880,
            0.10937485098838806,
            -0.45466923713684080,
            -0.61406242847442630,
            0.045746058225631714,
            -0.09549369663000107,
            0.49270814657211304,
            0.02534257248044014,
            -0.29359999299049380,
            -0.07753305882215500,
            -0.02130131423473358,
            -0.07495892047882080,
            -0.60064113140106200,
            -0.014182962477207184,
            0.18451625108718872,
            0.35400345921516420,
            0.22977495193481445,
            0.06056281179189682,
            -0.16951103508472443,
            0.43877935409545900,
            -0.08079877495765686,
            -0.07902894914150238,
            -0.05741514265537262,
            0.55906730890274050,
            0.58910524845123290,
            -0.26552647352218630,
            0.47798049449920654,
            -0.17932428419589996,
            0.03466450423002243,
            -0.32181957364082336,
            0.32691439986228943,
            1.57434558868408200,
            -0.60944569110870360,
            -0.30789577960968020,
            -0.03525789454579353,
            0.21574194729328156,
            0.09106104075908661,
            0.07360906153917313,
            -0.21098615229129790,
            0.14903579652309418,
            -0.20697991549968720,
            0.09246206283569336,
            -0.30049309134483340,
            -0.25683689117431640,
            -0.42003977298736570,
            0.38077199459075930,
            -0.32969945669174194,
            -0.46575132012367250,
            0.24943169951438904,
            0.38942575454711914,
            -0.37571138143539430,
            -0.58096361160278320,
            0.11415434628725052,
            -0.42314538359642030,
            0.30862617492675780,
            0.26128217577934265,
            -7.43450069427490200,
            -0.14982101321220398,
            -0.007992172613739967,
            0.12065914273262024,
            -0.38246965408325195,
            -0.34107217192649840,
            -0.80451864004135130,
            -1.04886448383331300,
            0.55530327558517460,
            -0.24028851091861725,
            0.14857441186904907,
            0.07519923150539398,
            -0.44258895516395570,
            -0.22696885466575623,
            -1.76246547698974600,
            -0.04149024933576584,
            -0.33089119195938110,
            0.034649670124053955,
            0.20300607383251190,
            -0.18623992800712585,
            0.18344642221927643,
            0.23681724071502686,
            0.27303919196128845,
            0.08612959086894989,
            0.08668576925992966,
            0.09101299196481705,
            0.43840888142585754,
            -0.61762166023254400,
            -0.20999190211296082,
            0.46851450204849243,
            -0.060045816004276276,
            -0.10672970116138458,
            -0.12689085304737090,
            -0.22409234941005707,
            -0.28366869688034060,
            -0.25668996572494507,
            0.04891391843557358,
            0.35491180419921875,
            0.27223268151283264,
            -0.19807010889053345,
            0.01612691581249237,
            0.98669499158859250,
            0.94963777065277100,
            0.11202965676784515,
            0.13241872191429138,
            -0.33038973808288574,
            -0.24429757893085480,
            0.30757093429565430,
            -0.10918612778186798,
            -0.20302526652812958,
            -0.014930151402950287,
            0.67508393526077270,
            -0.30977970361709595,
            -0.19329161942005157,
            0.04983800649642944,
            0.58730208873748780,
            -0.76442992687225340,
            0.10625885426998138,
            -0.009232066571712494,
            0.26251035928726196,
            0.29365420341491700,
            -0.28812190890312195,
            0.07605545222759247,
            -0.65482407808303830,
            0.35084849596023560,
            0.34299698472023010,
            0.33285912871360780,
            -0.22953245043754578,
            -0.20801588892936707,
            -0.05146145820617676,
            0.18107087910175323,
            0.51615625619888310,
            -0.28014412522315980,
            0.21909615397453308,
            1.08348631858825680,
            0.43758583068847656,
            -0.15551409125328064,
            -0.11162629723548889,
            0.08055899292230606,
            0.09409813582897186,
            0.021383360028266907,
            -0.50918841361999510,
            -0.11208890378475189,
            -0.38599658012390137,
            -0.86290252208709720,
            0.24611333012580872,
            -0.62409228086471560,
            0.27000692486763000,
            -0.019148532301187515,
            -0.15995115041732788,
            0.0021793851628899574,
            0.07647107541561127,
            0.19650121033191680,
            0.25712081789970400,
            0.15782865881919860,
            -0.12753826379776000,
            0.13912162184715270,
            0.057879120111465454,
            0.12957704067230225,
            0.23146329820156097,
            0.024382056668400764,
            0.04920619726181030,
            -0.24734464287757874,
            0.23542645573616028,
            -0.17139248549938202,
            -0.16124279797077180,
            0.63887059688568120,
            0.39621770381927490,
            -0.20532843470573425,
            0.012457119300961494,
            -0.39233744144439700,
            0.71717041730880740,
            0.25644633173942566,
            -0.49303287267684937,
            -0.04727388173341751,
            -0.38488596677780150,
            0.03999908268451691,
            -0.11684153228998184,
            -1.22885262966156000,
            -0.15317772328853607,
            0.03499954938888550,
            0.18243020772933960,
            -0.32903003692626953,
            -0.28470265865325930,
            -0.17769415676593780,
            0.35230401158332825,
            -0.68235456943511960,
            -0.44540110230445860,
            0.25034108757972720,
            0.23645302653312683,
            -0.09606185555458069,
            0.23800262808799744,
            0.11027810722589493,
            0.05310886353254318,
            -0.15807375311851501,
            -0.32893413305282590,
            -0.12554939091205597,
            -0.09278482198715210,
            0.36654987931251526,
            0.31478390097618103,
            0.022500615566968918,
            -0.17153693735599518,
            0.58437371253967290,
            -0.56753563880920410,
            0.0016302019357681274,
            -0.31919938325881960,
            -0.01767304539680481,
            -0.30621975660324097,
            0.42181178927421570,
            0.18961273133754730,
            -0.27777704596519470,
            -0.04874429106712341,
            -0.83623814582824710,
            -0.59505325555801390,
            0.15763781964778900,
            0.11460117995738983,
            -0.037775248289108276,
            0.36981520056724550,
            0.04750179499387741,
            0.28530880808830260,
            -0.32593557238578796,
            0.20472106337547302,
            -0.14085072278976440,
            -0.43984699249267580,
            -0.44318401813507080,
            0.16889306902885437,
            0.69945454597473140,
            0.022213801741600037,
            0.04395437240600586,
            0.018100500106811523,
            -0.60659039020538330,
            0.65107047557830810,
            0.23823469877243042,
            -0.17507782578468323,
            0.08020025491714478,
            0.31494301557540894,
            0.30044376850128174,
            -0.23546507954597473,
            0.11599977314472198,
            0.48960816860198975,
            0.23746117949485780,
            -0.48635044693946840,
            -0.23878610134124756,
            0.26654928922653200,
            -0.25886836647987366,
            -0.08302380144596100,
            -0.13755083084106445,
            0.24222144484519958,
            0.47945415973663330,
            0.38373395800590515,
            0.30907928943634033,
            -0.25348061323165894,
            0.12096904218196869,
            0.28086936473846436,
            -1.17676830291748050,
            0.04671703651547432,
            -0.48752713203430176,
            -0.20467823743820190,
            0.37203326821327210,
            -0.58486735820770260,
            0.17445452511310577,
            -0.08156547695398330,
            0.45127516984939575,
            -0.02351894974708557,
            -0.19682705402374268,
            0.17286786437034607,
            -0.17587804794311523,
            0.30918318033218384,
            0.15095241367816925,
            -0.22093287110328674,
            -0.08669745922088623,
            -0.11007970571517944,
            0.003908701241016388,
            -0.44974136352539060,
            0.13072070479393005,
            0.77382683753967290,
            0.30658128857612610,
            -0.24635344743728638,
            -0.21027483046054840,
            0.16422425210475922,
            0.98671263456344600,
            -0.42050862312316895,
            0.22445756196975708,
            0.23323085904121400,
            0.21030767261981964,
            0.08243256807327270,
            0.18058310449123383,
            -0.55228275060653690,
            0.029390739277005196,
            -0.0027499347925186157,
            -0.26178988814353943,
            0.39981740713119507,
            -0.46446281671524050,
            0.20612671971321106,
            0.02648659050464630,
            -0.06571706384420395,
            -0.09742008894681930,
            0.27914172410964966,
            -0.44574266672134400,
            -0.004618685692548752,
            -0.20941592752933502,
            -0.014536745846271515,
            0.04214660823345184,
            0.16787378489971160,
            0.12518627941608430,
            0.14714732766151428,
            0.42325642704963684,
            -0.18695265054702760,
            0.59449142217636110,
            -0.41381680965423584,
            -0.08633117377758026,
            0.48078146576881410,
            0.01567218452692032,
            -0.11084793508052826,
            -0.25879496335983276,
            0.25035518407821655,
            0.08629626780748367,
            -0.17640779912471770,
            0.35798883438110350,
            0.003633505664765835,
            0.26752072572708130,
            -0.008670955896377563,
            -0.060069844126701355,
            -0.45262604951858520,
            0.0029344558715820312,
            0.81401431560516360,
            0.30656427145004270,
            0.10814795643091202,
            0.16015036404132843,
            0.27728241682052610,
            0.003430556505918503,
            0.59562069177627560,
            -0.60939180850982670,
            0.11420226097106934,
            -0.07706215977668762,
            -0.68500268459320070,
            -0.005410104990005493,
            0.013373695313930511,
            0.21606793999671936,
            0.08226697891950607,
            -0.19103342294692993,
            0.37374818325042725,
            0.44795745611190796,
            -0.11685820668935776,
            1.60860514640808100,
            -0.28285527229309080,
            0.58519774675369260,
            0.17927187681198120,
            0.43113380670547485,
            -0.08384191989898682,
            -0.23026300966739655,
            -0.87972706556320190,
            -0.0010712891817092896,
            -0.11425804346799850,
            -0.03720918670296669,
            -0.013472747057676315,
            -0.20737977325916290,
            1.80557346343994140,
            -0.64729046821594240,
            -0.30271497368812560,
            -0.061230555176734924,
            -0.38844275474548340,
            0.17786000669002533,
            -0.031046316027641296,
            0.24852822721004486,
            -0.39031293988227844,
            -0.28145694732666016,
            -0.52712631225585940,
            0.43997967243194580,
            -0.22887703776359558,
            0.17240211367607117,
            -0.29442641139030457,
            0.35376852750778200,
            0.22806043922901154,
            -0.06477281451225281,
            -0.35966825485229490,
            0.40587043762207030,
            -0.08254503458738327,
            0.93505430221557620,
            0.013737834990024567,
            -0.16866286098957062,
            -0.17242559790611267,
            -0.09762792289257050,
            0.06496423482894897,
            -0.53277724981307980,
            -0.41173180937767030,
            -0.10729959607124329,
            -0.22943912446498870,
            0.09855599701404572,
            -0.31594187021255493,
            0.63642692565917970,
            0.08816694468259811,
            -0.11014832556247711,
            -0.28573364019393920,
            -0.16491752862930298,
            -0.013046562671661377,
            -0.57793509960174560,
            0.16094970703125000,
            -0.41850280761718750,
            -0.07970791310071945,
            0.15436783432960510,
            -0.29503697156906130,
            -0.052088260650634766,
            -0.33966383337974550,
            0.018201902508735657,
            -0.06606295704841614,
            0.04100047051906586,
            0.36471304297447205,
            -0.40008947253227234,
            0.07975389063358307,
            0.39990115165710450,
            0.15097494423389435,
            -0.21128392219543457,
            0.05080147460103035,
            -0.046003326773643494,
            0.25351849198341370,
            0.16474604606628418,
            0.08277872204780579,
            0.22466805577278137,
            0.22473768889904022,
            -0.13952386379241943,
            -0.35128515958786010,
            -0.17046678066253662,
            -0.04700194299221039,
            0.21633064746856690,
            -0.27318200469017030,
            0.02723865583539009,
            -0.47086358070373535,
            0.25049856305122375,
            -0.48574218153953550,
            -0.08048862218856812,
            -0.36891525983810425,
            0.03864942863583565,
            -0.42741003632545470,
            0.74072462320327760,
            -0.010117409750819206,
            0.19975064694881440,
            0.03020879626274109,
            0.06506866216659546,
            -0.04526616632938385,
            0.26060470938682556,
            -0.43580517172813416,
            -0.04713132977485657,
            -0.33256918191909790,
            -0.17320886254310608,
            -0.22390314936637878,
            -0.31866759061813354,
            -0.29139828681945800,
            0.07238420099020004,
            -0.07740981876850128,
            0.11880752444267273,
            -0.26510918140411377,
            0.15372966229915620,
            0.41496598720550537,
            -0.18698418140411377,
            0.0033263303339481354,
            -0.50970172882080080,
            0.15158197283744812,
            -0.06647455692291260,
            0.21226441860198975,
            0.47759312391281130,
            -0.82750320434570310,
            -0.008479125797748566,
            -0.64633381366729740,
            -0.16696789860725403,
            0.012448564171791077,
            -0.03979574143886566,
            -0.029009684920310974,
            -0.84793686866760250,
            0.27539581060409546,
            -0.03149215131998062,
            0.12921379506587982,
            0.14929755032062530,
            -0.19812837243080140,
            -0.20390477776527405,
            0.030443966388702393,
            -0.46114227175712585,
            0.15821106731891632,
            -0.05045306682586670,
            -0.057202182710170746,
        ],
        "clip_embeddings_magnitude": 11.107995986938477,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[126, 149, 181]",
        "video_length": None,
        "removed": False,
        "in_trashcan": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "0",
        "size": 6666687,
        "subjectDistance": 4.691,
        "width": 4032,
        "main_file_id": "c57f08a55c6daa689e6e13a1bf8f81471",
    },
    {
        "thumbnail_big": "thumbnails_big/c4d896c9c9c0ca3c312b19f2f22d69ae1.webp",
        "square_thumbnail": "square_thumbnails/c4d896c9c9c0ca3c312b19f2f22d69ae1.webp",
        "square_thumbnail_small": "square_thumbnails_small/c4d896c9c9c0ca3c312b19f2f22d69ae1.webp",
        "added_on": "2023-06-16 16:30:53.937783 +00:00",
        "exif_gps_lat": 44.5542,
        "exif_gps_lon": -78.1953472222222,
        "exif_timestamp": "2017-08-17 17:59:35.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [-78.195347, 44.5542],
            "features": [
                {
                    "id": "address.2311178160127006",
                    "text": "Fire Route 47",
                    "type": "Feature",
                    "center": [-78.1955566, 44.5540639],
                    "address": "2880",
                    "context": [
                        {
                            "id": "postcode.2669825575",
                            "text": "K0L 2H0",
                            "mapbox_id": "dXJuOm1ieHBsYzpueUpPSnc",
                        },
                        {
                            "id": "place.106145831",
                            "text": "Lakefield",
                            "wikidata": "Q114506323",
                            "mapbox_id": "dXJuOm1ieHBsYzpCbE9vSnc",
                        },
                        {
                            "id": "district.1140263",
                            "text": "Peterborough County",
                            "wikidata": "Q730542",
                            "mapbox_id": "dXJuOm1ieHBsYzpFV1lu",
                        },
                        {
                            "id": "region.17447",
                            "text": "Ontario",
                            "wikidata": "Q1904",
                            "mapbox_id": "dXJuOm1ieHBsYzpSQ2M",
                            "short_code": "CA-ON",
                        },
                        {
                            "id": "country.8743",
                            "text": "Canada",
                            "wikidata": "Q16",
                            "mapbox_id": "dXJuOm1ieHBsYzpJaWM",
                            "short_code": "ca",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [-78.1955566, 44.5540639],
                    },
                    "relevance": 1,
                    "place_name": "2880 Fire Route 47, Lakefield, Ontario K0L 2H0, Canada",
                    "place_type": ["address"],
                    "properties": {
                        "accuracy": "point",
                        "mapbox_id": "dXJuOm1ieGFkcjoyOTlkZDc4Yy0wYWVlLTQ2ZGUtYmFkOC04ZDA0Y2VhYzNkZGQ",
                    },
                },
                {
                    "id": "postcode.2669825575",
                    "bbox": [-78.383699659, 44.336123836, -77.917196264, 44.674985335],
                    "text": "K0L 2H0",
                    "type": "Feature",
                    "center": [-78.27, 44.42],
                    "context": [
                        {
                            "id": "place.106145831",
                            "text": "Lakefield",
                            "wikidata": "Q114506323",
                            "mapbox_id": "dXJuOm1ieHBsYzpCbE9vSnc",
                        },
                        {
                            "id": "district.1140263",
                            "text": "Peterborough County",
                            "wikidata": "Q730542",
                            "mapbox_id": "dXJuOm1ieHBsYzpFV1lu",
                        },
                        {
                            "id": "region.17447",
                            "text": "Ontario",
                            "wikidata": "Q1904",
                            "mapbox_id": "dXJuOm1ieHBsYzpSQ2M",
                            "short_code": "CA-ON",
                        },
                        {
                            "id": "country.8743",
                            "text": "Canada",
                            "wikidata": "Q16",
                            "mapbox_id": "dXJuOm1ieHBsYzpJaWM",
                            "short_code": "ca",
                        },
                    ],
                    "geometry": {"type": "Point", "coordinates": [-78.27, 44.42]},
                    "relevance": 1,
                    "place_name": "K0L 2H0, Lakefield, Ontario, Canada",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzpueUpPSnc"},
                },
                {
                    "id": "place.106145831",
                    "bbox": [-78.383699659, 44.402393807, -78.086446707, 44.59913282],
                    "text": "Lakefield",
                    "type": "Feature",
                    "center": [-78.272195, 44.423337],
                    "context": [
                        {
                            "id": "district.1140263",
                            "text": "Peterborough County",
                            "wikidata": "Q730542",
                            "mapbox_id": "dXJuOm1ieHBsYzpFV1lu",
                        },
                        {
                            "id": "region.17447",
                            "text": "Ontario",
                            "wikidata": "Q1904",
                            "mapbox_id": "dXJuOm1ieHBsYzpSQ2M",
                            "short_code": "CA-ON",
                        },
                        {
                            "id": "country.8743",
                            "text": "Canada",
                            "wikidata": "Q16",
                            "mapbox_id": "dXJuOm1ieHBsYzpJaWM",
                            "short_code": "ca",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [-78.272195, 44.423337],
                    },
                    "relevance": 1,
                    "place_name": "Lakefield, Ontario, Canada",
                    "place_type": ["place"],
                    "properties": {
                        "wikidata": "Q114506323",
                        "mapbox_id": "dXJuOm1ieHBsYzpCbE9vSnc",
                    },
                },
                {
                    "id": "district.1140263",
                    "bbox": [-78.654828, 44.081278, -77.727372, 44.916769],
                    "text": "Peterborough County",
                    "type": "Feature",
                    "center": [-78.332479, 44.302625],
                    "context": [
                        {
                            "id": "region.17447",
                            "text": "Ontario",
                            "wikidata": "Q1904",
                            "mapbox_id": "dXJuOm1ieHBsYzpSQ2M",
                            "short_code": "CA-ON",
                        },
                        {
                            "id": "country.8743",
                            "text": "Canada",
                            "wikidata": "Q16",
                            "mapbox_id": "dXJuOm1ieHBsYzpJaWM",
                            "short_code": "ca",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [-78.332479, 44.302625],
                    },
                    "relevance": 1,
                    "place_name": "Peterborough County, Ontario, Canada",
                    "place_type": ["district"],
                    "properties": {
                        "wikidata": "Q730542",
                        "mapbox_id": "dXJuOm1ieHBsYzpFV1lu",
                    },
                },
                {
                    "id": "region.17447",
                    "bbox": [-95.158717, 41.6400784, -74.3381353, 56.9091182],
                    "text": "Ontario",
                    "type": "Feature",
                    "center": [-84.2539813003493, 49.4515636581924],
                    "context": [
                        {
                            "id": "country.8743",
                            "text": "Canada",
                            "wikidata": "Q16",
                            "mapbox_id": "dXJuOm1ieHBsYzpJaWM",
                            "short_code": "ca",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [-84.2539813003493, 49.4515636581924],
                    },
                    "relevance": 1,
                    "place_name": "Ontario, Canada",
                    "place_type": ["region"],
                    "properties": {
                        "wikidata": "Q1904",
                        "mapbox_id": "dXJuOm1ieHBsYzpSQ2M",
                        "short_code": "CA-ON",
                    },
                },
                {
                    "id": "country.8743",
                    "bbox": [-141.010465, 41.6400784, -52.5210105, 83.1472069],
                    "text": "Canada",
                    "type": "Feature",
                    "center": [-105.750595856519, 55.5859012851966],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [-105.750595856519, 55.5859012851966],
                    },
                    "relevance": 1,
                    "place_name": "Canada",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q16",
                        "mapbox_id": "dXJuOm1ieHBsYzpJaWM",
                        "short_code": "ca",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Fire Route 47 K0L 2H0 Lakefield Peterborough County Ontario Canada",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "natural light",
                    "open area",
                    "vegetation",
                    "foliage",
                    "trees",
                    "leaves",
                    "grass",
                    "man made",
                    "sunny",
                ],
                "categories": ["picnic area"],
                "environment": "outdoor",
            }
        },
        "search_captions": "picnic area , outdoor",
        "search_location": "Fire Route 47 K0L 2H0 Lakefield Peterborough County Ontario Canada",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            0.07200643420219421,
            -0.27314072847366333,
            -0.28608414530754090,
            -0.017477907240390778,
            0.50455182790756230,
            0.28596064448356630,
            0.06314943730831146,
            0.23560704290866852,
            -0.19991967082023620,
            0.05301810801029205,
            0.23392733931541443,
            -0.015628136694431305,
            -0.12933245301246643,
            -0.62648004293441770,
            0.19849593937397003,
            -0.09278710186481476,
            -1.13199305534362800,
            0.02051648497581482,
            0.18314598500728607,
            -0.07170593738555908,
            -0.35629284381866455,
            0.10626928508281708,
            0.022010430693626404,
            -0.36885976791381836,
            0.01585569977760315,
            0.19657053053379060,
            -0.33990219235420227,
            -0.15209683775901794,
            -0.13219691812992096,
            -0.29297292232513430,
            -0.007032429799437523,
            0.30475685000419617,
            -0.69666099548339840,
            -0.55377709865570070,
            0.50226724147796630,
            0.43203988671302795,
            -0.03661022335290909,
            0.12110148370265960,
            0.27576541900634766,
            -0.51852631568908690,
            -0.16946467757225037,
            0.06092119216918945,
            -0.05353017896413803,
            -0.10094764083623886,
            0.24288514256477356,
            -2.32672357559204100,
            0.23213247954845428,
            -0.31283071637153625,
            0.05823267251253128,
            0.033336833119392395,
            0.03891675919294357,
            0.34450155496597290,
            0.54696977138519290,
            -0.10590277612209320,
            -0.38763791322708130,
            0.11399775743484497,
            -0.11230312287807465,
            -0.25931385159492490,
            -0.71149158477783200,
            0.19414122402668000,
            -1.06821513175964360,
            -0.05036032199859619,
            0.23391188681125640,
            0.18708521127700806,
            -0.28283250331878660,
            -0.49732804298400880,
            0.14408025145530700,
            1.58359146118164060,
            -0.09503769129514694,
            0.10219173878431320,
            0.18811975419521332,
            0.11770723760128021,
            0.14510244131088257,
            -0.025733187794685364,
            -0.12114733457565308,
            0.028954997658729553,
            -0.36884146928787230,
            -0.14654713869094850,
            -0.20010140538215637,
            0.05988488718867302,
            0.02569446712732315,
            0.52280324697494510,
            -0.00884101539850235,
            -0.84105598926544190,
            0.08269304037094116,
            -0.030198069289326668,
            0.08129344880580902,
            -0.49774390459060670,
            -0.61459028720855710,
            -0.27356880903244020,
            -0.24041604995727540,
            -0.33665394783020020,
            -5.96149921417236300,
            0.22716827690601350,
            0.28753006458282470,
            0.48320820927619934,
            -0.12874460220336914,
            0.14355051517486572,
            -0.34171727299690247,
            -1.38677775859832760,
            0.058781594038009644,
            0.09329684078693390,
            0.12113958597183228,
            0.02105279266834259,
            0.25320750474929810,
            0.30670967698097230,
            -0.23736193776130676,
            -0.008005078881978989,
            -0.15708926320075990,
            -0.11563684791326523,
            -0.19381190836429596,
            -0.70084750652313230,
            -0.25472760200500490,
            -0.25218990445137024,
            0.04032253846526146,
            0.15879295766353607,
            -0.24767071008682250,
            0.28805834054946900,
            0.02391856536269188,
            0.018087051808834076,
            0.21582140028476715,
            0.62899506092071530,
            -0.13227358460426330,
            0.30459716916084290,
            0.08614320307970047,
            -0.23780769109725952,
            0.25391614437103270,
            -0.22144922614097595,
            -0.08764651417732239,
            0.37465840578079224,
            -0.19986276328563690,
            -0.23993769288063050,
            -0.24029092490673065,
            0.86103123426437380,
            -0.20356409251689910,
            0.18121457099914550,
            0.007383421063423157,
            0.02566760778427124,
            -0.18797449767589570,
            0.12505835294723510,
            0.06744767725467682,
            -0.31292539834976196,
            0.14250934123992920,
            -0.16580671072006226,
            -0.10141041129827500,
            0.07421887665987015,
            0.13718751072883606,
            0.31398600339889526,
            -0.45369070768356323,
            0.37390136718750000,
            -0.17167736589908600,
            -0.12102013081312180,
            0.55987459421157840,
            -0.64511901140213010,
            0.32400843501091003,
            -0.15718287229537964,
            0.03728494048118591,
            -0.48887744545936584,
            -0.43595361709594727,
            0.27848058938980100,
            -0.26770013570785520,
            0.11762751638889313,
            0.14060628414154053,
            0.14021927118301392,
            0.16482727229595184,
            0.12399593740701675,
            1.10899972915649410,
            0.58323627710342410,
            0.25726687908172610,
            -0.04836788773536682,
            0.42536145448684690,
            0.026311412453651428,
            0.23059077560901642,
            -0.09234851598739624,
            -0.42488861083984375,
            -0.52500975131988530,
            -0.14144848287105560,
            0.031238600611686707,
            -0.22408963739871980,
            0.16041082143783570,
            0.19980202615261078,
            0.12246149778366089,
            -0.74750423431396480,
            0.34143632650375366,
            -0.07465202361345291,
            0.032671473920345306,
            0.35502630472183230,
            -0.54294133186340330,
            0.01227620244026184,
            0.11296307295560837,
            0.23945194482803345,
            0.22230161726474762,
            0.09851396828889847,
            -0.10145194828510284,
            -0.94168329238891600,
            -0.63558840751647950,
            -0.09790701419115067,
            0.08268978446722030,
            1.47379052639007570,
            -0.40544277429580690,
            -0.19830146431922913,
            0.12428025901317596,
            0.01359538733959198,
            0.11815530061721802,
            -0.14290475845336914,
            -0.25821614265441895,
            -0.27840244770050050,
            0.51778000593185420,
            -0.28622409701347350,
            0.13844540715217590,
            0.019464679062366486,
            -0.64047700166702270,
            -0.51729387044906620,
            0.36219158768653870,
            -0.29284214973449707,
            -0.09910607337951660,
            -0.44586786627769470,
            0.26939472556114197,
            0.001346886157989502,
            0.10100428760051727,
            0.12059158086776733,
            1.46603417396545400,
            -0.16158343851566315,
            0.09549902379512787,
            0.31741645932197570,
            -0.06466329097747803,
            -0.37618625164031980,
            -0.10769309103488922,
            0.24339321255683900,
            -0.07732771337032318,
            -0.28822788596153260,
            -0.30479827523231506,
            0.28579634428024290,
            0.57900738716125490,
            0.01886954903602600,
            -0.34693476557731630,
            0.13962632417678833,
            -0.36294281482696533,
            -0.10817342996597290,
            0.035561710596084595,
            -0.57529795169830320,
            -0.12815028429031372,
            0.03226613253355026,
            -0.58416968584060670,
            0.13841366767883300,
            0.03650939464569092,
            0.038980357348918915,
            0.34951549768447876,
            0.20841777324676514,
            0.12865397334098816,
            -0.12616679072380066,
            0.08742494136095047,
            0.21315385401248932,
            0.09627585113048553,
            0.20098021626472473,
            -0.06143351271748543,
            -0.043563079088926315,
            -0.19623640179634094,
            1.57240605354309080,
            -0.35777574777603150,
            0.02914358116686344,
            0.63118875026702880,
            0.18993435800075530,
            -0.46280235052108765,
            0.030418217182159424,
            -0.34837594628334045,
            0.03651222586631775,
            0.26378205418586730,
            0.046745263040065765,
            0.28378057479858400,
            -0.009584896266460419,
            0.19612582027912140,
            0.21172988414764404,
            -0.032120171934366226,
            0.20071959495544434,
            -0.08056892454624176,
            0.12477563321590424,
            -0.13512735068798065,
            0.14138039946556090,
            0.31706815958023070,
            0.024455122649669647,
            -0.15259601175785065,
            -0.20282268524169922,
            -0.28921997547149660,
            0.45865276455879210,
            0.11363479495048523,
            -0.20601873099803925,
            0.12293325364589691,
            -0.007529497146606445,
            -0.20519900321960450,
            -0.27892541885375977,
            -0.25480884313583374,
            0.10527120530605316,
            -0.22468784451484680,
            0.27766802906990050,
            0.27707856893539430,
            0.42828142642974854,
            -0.06466045975685120,
            -0.022840768098831177,
            0.08824332058429718,
            0.13453596830368042,
            0.21060699224472046,
            -0.13369843363761902,
            -0.42310655117034910,
            0.06692334264516830,
            0.018675953149795532,
            -0.012705937027931213,
            0.16295075416564941,
            -0.006689056754112244,
            -0.27341771125793457,
            -0.45861658453941345,
            0.14121453464031220,
            0.85903668403625490,
            -0.19725802540779114,
            0.14617547392845154,
            0.27198433876037600,
            0.17599108815193176,
            0.02266123890876770,
            -0.12822464108467102,
            1.00072443485260000,
            0.30147033929824830,
            -0.74144268035888670,
            -0.16088382899761200,
            0.11513932049274445,
            -0.38404512405395510,
            0.04975423216819763,
            0.37200531363487244,
            0.19585512578487396,
            -0.12441303580999374,
            -0.24220986664295197,
            0.15007376670837402,
            -0.04617227613925934,
            -0.04232384264469147,
            -0.34620440006256104,
            -0.26701658964157104,
            -0.005242077633738518,
            0.0031939297914505005,
            0.02201770246028900,
            -0.09960493445396423,
            0.16118554770946503,
            -0.33185213804244995,
            0.15700313448905945,
            0.16201999783515930,
            0.07118913531303406,
            0.22056972980499268,
            -0.011956900358200073,
            -0.0003955662250518799,
            0.25377553701400757,
            -0.41737711429595950,
            0.26137113571166990,
            0.42841473221778870,
            -0.11275280267000198,
            -0.54838216304779050,
            0.03743823617696762,
            0.08181229233741760,
            1.28952217102050780,
            0.36465561389923096,
            -0.28938600420951843,
            0.47177675366401670,
            -0.16908544301986694,
            0.93969750404357910,
            0.08721843361854553,
            -0.09430234134197235,
            0.66503000259399410,
            -0.48145574331283570,
            -0.14018303155899048,
            0.33783870935440063,
            -0.75327533483505250,
            -0.52762186527252200,
            0.04408954456448555,
            -0.39755284786224365,
            -0.0019524451345205307,
            0.30438941717147827,
            0.04218447208404541,
            -0.07897476106882095,
            0.35774332284927370,
            1.22708070278167720,
            0.29904451966285706,
            -0.11844162642955780,
            -0.15679849684238434,
            -0.12561301887035370,
            -0.77952718734741210,
            -0.26338329911231995,
            -0.08969837427139282,
            0.21005888283252716,
            -0.31030485033988950,
            0.24320170283317566,
            0.27376961708068850,
            -0.18231861293315887,
            -1.11225414276123050,
            -0.96022212505340580,
            0.39804935455322266,
            0.007329510059207678,
            -0.21168775856494904,
            -0.63149207830429080,
            0.21230995655059814,
            0.13413298130035400,
            0.38083824515342710,
            0.21768637001514435,
            -0.37690994143486023,
            0.010201409459114075,
            0.35002541542053220,
            -0.00883527286350727,
            -0.49314117431640625,
            0.11570226401090622,
            -0.12012594938278198,
            0.14163519442081451,
            -0.31398567557334900,
            -0.11759512126445770,
            -0.26619073748588560,
            0.24936842918395996,
            -0.07021093368530273,
            -0.26329314708709717,
            -0.26164028048515320,
            -0.48863250017166140,
            -0.21155467629432678,
            -0.51766830682754520,
            -0.41783249378204346,
            -0.36551034450531006,
            -0.69736742973327640,
            0.33944544196128845,
            -0.14483065903186798,
            0.44479277729988100,
            -0.98320567607879640,
            -0.19574180245399475,
            0.31662541627883910,
            -0.44551515579223633,
            -0.022557497024536133,
            -0.48501241207122800,
            -0.09746624529361725,
            -0.36100867390632630,
            -0.27448734641075134,
            0.78780412673950200,
            -0.30192264914512634,
            -0.44880360364913940,
            -0.033154018223285675,
            0.048185281455516815,
            0.03699145466089249,
            0.46661505103111267,
            -0.06928810477256775,
            0.32975050806999207,
            0.66338658332824710,
            0.026022130623459816,
            -0.02559243142604828,
            0.13531213998794556,
            -0.011617228388786316,
            -0.24844856560230255,
            -0.22130966186523438,
            0.06896549463272095,
            0.16910549998283386,
            -0.33283072710037230,
            -0.23490653932094574,
            -0.42383372783660890,
            -0.82607471942901610,
            -0.12491527199745178,
            0.09555611014366150,
            0.14898100495338440,
            0.41498780250549316,
            -0.33365392684936523,
            0.08857516199350357,
            -0.25846809148788450,
            -0.023531511425971985,
            0.24037255346775055,
            0.25419849157333374,
            0.18990617990493774,
            0.21707595884799957,
            0.054550834000110626,
            -0.16628548502922058,
            0.29191961884498596,
            0.21750520169734955,
            0.059166401624679565,
            0.27432167530059814,
            -0.07397265732288360,
            -0.39545136690139770,
            0.32126304507255554,
            -0.23423250019550323,
            -0.46515718102455140,
            0.23323012888431550,
            0.22779177129268646,
            -0.19990277290344238,
            0.16021879017353058,
            0.12057007849216461,
            0.48086464405059814,
            0.21143439412117004,
            -0.13717344403266907,
            -0.26784723997116090,
            0.36808949708938600,
            0.04166709631681442,
            0.10163601487874985,
            -0.65290242433547970,
            0.001865200698375702,
            0.24058419466018677,
            0.43577551841735840,
            -0.30626660585403440,
            0.04026487469673157,
            -0.59185659885406490,
            0.28134933114051820,
            0.10597439110279083,
            -0.02836729586124420,
            -0.17641222476959229,
            -0.41398856043815613,
            0.13548584282398224,
            0.03822256624698639,
            0.49377080798149110,
            0.79975557327270510,
            -0.52094459533691410,
            0.37935078144073486,
            -0.22603368759155273,
            -0.30841892957687380,
            0.0037401914596557617,
            -0.19617760181427002,
            -0.03347594290971756,
        ],
        "clip_embeddings_magnitude": 10.361903190612793,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[72, 81, 54]",
        "video_length": None,
        "removed": False,
        "in_trashcan": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "1/120",
        "size": 12186941,
        "subjectDistance": 3.91,
        "width": 4032,
        "main_file_id": "c4d896c9c9c0ca3c312b19f2f22d69ae1",
    },
    {
        "thumbnail_big": "thumbnails_big/e21b9ade718afdbe931462d837b74d1c1.webp",
        "square_thumbnail": "square_thumbnails/e21b9ade718afdbe931462d837b74d1c1.webp",
        "square_thumbnail_small": "square_thumbnails_small/e21b9ade718afdbe931462d837b74d1c1.webp",
        "added_on": "2023-06-16 16:30:55.449974 +00:00",
        "exif_gps_lat": 52.5019361111111,
        "exif_gps_lon": 13.3815138888889,
        "exif_timestamp": "2017-08-22 13:27:09.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [13.381514, 52.501936],
            "features": [
                {
                    "id": "poi.1047972024770",
                    "text": "Roncalli",
                    "type": "Feature",
                    "center": [13.381502, 52.501711],
                    "context": [
                        {
                            "id": "postcode.5541434",
                            "text": "10963",
                            "mapbox_id": "dXJuOm1ieHBsYzpWSTQ2",
                        },
                        {
                            "id": "locality.181160506",
                            "text": "Kreuzberg",
                            "mapbox_id": "dXJuOm1ieHBsYzpDc3hLT2c",
                        },
                        {
                            "id": "place.115770",
                            "text": "Berlin",
                            "wikidata": "Q64",
                            "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                            "short_code": "DE-BE",
                        },
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [13.381502, 52.501711],
                    },
                    "relevance": 1,
                    "place_name": "Roncalli, Möckernstr, Berlin, 10963, Germany",
                    "place_type": ["poi"],
                    "properties": {
                        "maki": "theatre",
                        "address": "Möckernstr",
                        "category": "circus",
                        "landmark": True,
                        "foursquare": "50d22a90e4b0d3035504ae2b",
                    },
                },
                {
                    "id": "postcode.5541434",
                    "bbox": [13.372592, 52.49205, 13.391193, 52.508285],
                    "text": "10963",
                    "type": "Feature",
                    "center": [13.383894, 52.497062],
                    "context": [
                        {
                            "id": "locality.181160506",
                            "text": "Kreuzberg",
                            "mapbox_id": "dXJuOm1ieHBsYzpDc3hLT2c",
                        },
                        {
                            "id": "place.115770",
                            "text": "Berlin",
                            "wikidata": "Q64",
                            "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                            "short_code": "DE-BE",
                        },
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [13.383894, 52.497062],
                    },
                    "relevance": 1,
                    "place_name": "10963, Berlin, Germany",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzpWSTQ2"},
                },
                {
                    "id": "locality.181160506",
                    "bbox": [13.368215, 52.48277, 13.453351, 52.50938],
                    "text": "Kreuzberg",
                    "type": "Feature",
                    "center": [13.411914, 52.497644],
                    "context": [
                        {
                            "id": "place.115770",
                            "text": "Berlin",
                            "wikidata": "Q64",
                            "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                            "short_code": "DE-BE",
                        },
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [13.411914, 52.497644],
                    },
                    "relevance": 1,
                    "place_name": "Kreuzberg, Berlin, Germany",
                    "place_type": ["locality"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzpDc3hLT2c"},
                },
                {
                    "id": "place.115770",
                    "bbox": [13.08836, 52.338261, 13.761131, 52.675502],
                    "text": "Berlin",
                    "type": "Feature",
                    "center": [13.3888599, 52.5170365],
                    "context": [
                        {
                            "id": "country.8762",
                            "text": "Germany",
                            "wikidata": "Q183",
                            "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                            "short_code": "de",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [13.3888599, 52.5170365],
                    },
                    "relevance": 1,
                    "place_name": "Berlin, Germany",
                    "place_type": ["region", "place"],
                    "properties": {
                        "wikidata": "Q64",
                        "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                        "short_code": "DE-BE",
                    },
                },
                {
                    "id": "country.8762",
                    "bbox": [5.866315, 47.270238, 15.041832, 55.1286491],
                    "text": "Germany",
                    "type": "Feature",
                    "center": [10.0183432948567, 51.1334813439932],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [10.0183432948567, 51.1334813439932],
                    },
                    "relevance": 1,
                    "place_name": "Germany",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q183",
                        "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                        "short_code": "de",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Roncalli 10963 Kreuzberg Berlin Germany",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "natural light",
                    "open area",
                    "man made",
                    "clouds",
                    "no horizon",
                    "sunny",
                    "far away horizon",
                    "cloth",
                    "cold",
                ],
                "categories": [],
                "environment": "outdoor",
            }
        },
        "search_captions": "outdoor",
        "search_location": "Roncalli 10963 Kreuzberg Berlin Germany",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            -0.10258262604475021,
            0.66643309593200680,
            -0.06443142890930176,
            -0.14745938777923584,
            0.48618343472480774,
            0.0004399120807647705,
            -0.0009457916021347046,
            0.64925503730773930,
            -0.45721071958541870,
            0.11818008124828339,
            -0.11370902508497238,
            -0.49487552046775820,
            -0.28128325939178467,
            -0.30589711666107180,
            -0.15134385228157043,
            0.05521773546934128,
            -1.55117774009704600,
            -0.16058634221553802,
            -0.13487541675567627,
            -0.15009154379367828,
            -0.34108334779739380,
            -0.13820111751556396,
            0.09468824416399002,
            0.34886407852172850,
            -0.34096065163612366,
            -0.02098141610622406,
            -0.17523168027400970,
            -0.052726227790117264,
            0.25815361738204956,
            -0.45174264907836914,
            -0.63614970445632930,
            0.09681782126426697,
            -0.11660185456275940,
            -0.18351450562477112,
            0.41413304209709170,
            0.14657795429229736,
            -0.28526934981346130,
            -0.22788083553314210,
            -0.21612341701984406,
            -0.73998987674713130,
            -0.55964195728302000,
            -0.22357036173343658,
            -0.22361208498477936,
            0.002233438193798065,
            0.50072944164276120,
            -1.46298265457153320,
            0.63237798213958740,
            0.03941209241747856,
            0.19379198551177979,
            -0.44258201122283936,
            -0.17907603085041046,
            0.06887031346559525,
            0.51105743646621700,
            0.25896197557449340,
            0.010099773295223713,
            0.60815042257308960,
            -0.21678172051906586,
            0.22954954206943512,
            -0.71181941032409670,
            0.17145885527133942,
            0.79170489311218260,
            -0.07573703676462173,
            0.25271376967430115,
            0.07294708490371704,
            0.08441808819770813,
            0.27773401141166687,
            -0.10114270448684692,
            1.18037462234497070,
            -0.10031361877918243,
            -0.57329255342483520,
            0.15199229121208190,
            0.08043078333139420,
            -0.25711309909820557,
            0.35362368822097780,
            0.19381424784660340,
            0.07242968678474426,
            -0.30958822369575500,
            -0.08953941613435745,
            -0.09282187372446060,
            -0.37684765458106995,
            -0.31265074014663696,
            0.76198458671569820,
            -0.24638760089874268,
            -0.18398816883563995,
            0.20948600769042970,
            0.68236070871353150,
            0.26739034056663513,
            -0.19240638613700867,
            -0.31598865985870360,
            -0.029354378581047058,
            0.008327040821313858,
            0.18494442105293274,
            -7.53693056106567400,
            0.25613960623741150,
            0.22370323538780212,
            -0.03313902020454407,
            -0.22441212832927704,
            0.24500671029090880,
            -0.67216014862060550,
            -0.63962388038635250,
            -0.10790157318115234,
            -0.39841800928115845,
            0.45670357346534730,
            0.07113364338874817,
            -0.28614389896392820,
            0.35553669929504395,
            -1.00858056545257570,
            0.17648085951805115,
            -0.56130737066268920,
            0.33491787314414980,
            0.27355626225471497,
            0.16742312908172607,
            0.36952716112136840,
            -0.32609111070632935,
            -0.21147111058235168,
            -0.09825261682271957,
            -0.47114884853363037,
            0.60953688621521000,
            0.38453266024589540,
            -0.38745057582855225,
            -0.04564698040485382,
            0.06692779809236526,
            0.007835905998945236,
            0.12590317428112030,
            0.08536458760499954,
            -0.22401364147663116,
            0.15795263648033142,
            -0.46122899651527405,
            -0.06393150240182877,
            0.27560144662857056,
            0.29461151361465454,
            -0.22232146561145782,
            -0.14870893955230713,
            1.00925290584564200,
            0.08114692568778992,
            0.010658219456672668,
            0.019297055900096893,
            -0.37022376060485840,
            -0.60042166709899900,
            -0.08197715133428574,
            0.17349836230278015,
            -0.40405350923538210,
            0.05475588142871857,
            0.64725798368453980,
            -0.19707715511322021,
            0.10167735815048218,
            -0.24003769457340240,
            0.47526404261589050,
            -0.17396590113639832,
            0.52764558792114260,
            -0.30993252992630005,
            -0.06276136636734009,
            0.54091024398803710,
            -0.32085520029067993,
            0.06873718649148941,
            -0.79230988025665280,
            0.12832219898700714,
            0.27965274453163147,
            -0.11812235414981842,
            -0.025007829070091248,
            -0.05913873016834259,
            0.009386129677295685,
            0.74419283866882320,
            0.53745734691619870,
            -0.07048669457435608,
            0.32115909457206726,
            0.85237395763397220,
            -0.007245570421218872,
            -0.20299741625785828,
            -0.31570893526077270,
            0.36141934990882874,
            0.026256147772073746,
            -0.20647422969341278,
            0.07242944836616516,
            -0.39613524079322815,
            -0.15577512979507446,
            0.56382685899734500,
            0.15884301066398620,
            -0.25236248970031740,
            0.12900674343109130,
            0.13617977499961853,
            -0.38444459438323975,
            -0.17406651377677917,
            0.38698321580886840,
            -0.03219318389892578,
            0.22693467140197754,
            0.061593152582645416,
            -0.21263362467288970,
            0.13701051473617554,
            -0.057763803750276566,
            0.25249591469764710,
            0.08275345712900162,
            0.20910006761550903,
            0.03912349045276642,
            -0.63464707136154170,
            -0.30452278256416320,
            -0.32845041155815125,
            -0.06514476239681244,
            0.37253341078758240,
            0.27116832137107850,
            0.08592364937067032,
            0.23760634660720825,
            -0.28635382652282715,
            -0.04585602134466171,
            -0.25701779127120970,
            -0.18018849194049835,
            -0.48961794376373290,
            -0.08290880918502808,
            -0.33540713787078860,
            0.07882565259933472,
            0.39085230231285095,
            0.05874055624008179,
            0.057173386216163635,
            -0.08757130801677704,
            0.07342680543661118,
            -0.13899344205856323,
            -0.08424560725688934,
            0.19400805234909058,
            -0.72243881225585940,
            -0.29955309629440310,
            0.20382502675056458,
            0.48866674304008484,
            0.07971449941396713,
            -0.03938521072268486,
            -0.62366402149200440,
            -0.15463593602180480,
            0.09072853624820709,
            0.03131377696990967,
            0.28323334455490110,
            -0.16908100247383118,
            -0.20017117261886597,
            0.40308171510696410,
            0.45233413577079773,
            -0.31968781352043150,
            -0.14290061593055725,
            -0.73431730270385740,
            0.32717624306678770,
            -0.24733215570449830,
            0.07128322124481201,
            -0.48950380086898804,
            -0.0008872002363204956,
            -0.07294179499149323,
            -0.22609096765518188,
            -0.020967215299606323,
            -0.07549750804901123,
            0.20787967741489410,
            0.36314973235130310,
            0.12670208513736725,
            -0.31853759288787840,
            0.32616245746612550,
            -0.09472109377384186,
            -0.027377739548683167,
            0.014935225248336792,
            0.20435945689678192,
            -0.16135276854038239,
            0.19143480062484740,
            0.08755904436111450,
            0.20116862654685974,
            -0.08494839072227478,
            -0.22879388928413390,
            0.22606262564659120,
            -0.03982345014810562,
            -0.29927518963813780,
            0.010079406201839447,
            0.07509651780128479,
            -0.25567504763603210,
            -0.11709715425968170,
            0.42464250326156616,
            0.06431484222412110,
            0.17397393286228180,
            0.28166836500167847,
            -0.21547360718250275,
            -0.06485859304666519,
            -0.07584954798221588,
            0.12973758578300476,
            -0.06666970998048782,
            -0.19354835152626038,
            -0.27083098888397217,
            -0.08537831902503967,
            -0.24621208012104034,
            -0.11692193150520325,
            0.12622721493244170,
            0.64608305692672730,
            0.07786636054515839,
            -0.15758465230464935,
            0.15170501172542572,
            0.14211302995681763,
            -0.31157767772674560,
            -0.15162092447280884,
            -0.10263395309448242,
            0.13374274969100952,
            -0.35772666335105896,
            0.16042037308216095,
            -0.09574175626039505,
            0.13830652832984924,
            0.33334568142890930,
            -0.53578650951385500,
            0.39855188131332400,
            -0.37783429026603700,
            -0.25219041109085083,
            0.06827493011951447,
            -0.50635170936584470,
            -0.13055899739265442,
            0.050748057663440704,
            0.14656113088130950,
            -0.85355234146118160,
            -0.03550938516855240,
            0.21138493716716766,
            0.51412421464920040,
            -0.16174469888210297,
            0.06829738616943360,
            0.38762015104293823,
            1.00867974758148200,
            -0.11224977672100067,
            0.23601248860359192,
            0.21366406977176666,
            0.22318972647190094,
            -0.57790690660476680,
            -0.20985898375511170,
            -0.13206046819686890,
            0.43933963775634766,
            -0.76506268978118900,
            -0.33175840973854065,
            0.35506504774093630,
            -0.66501140594482420,
            0.40778365731239320,
            -0.19959415495395660,
            -0.28629922866821290,
            0.27318397164344790,
            0.37771254777908325,
            -0.12135715782642365,
            0.011033750139176846,
            -0.05133216455578804,
            -0.06439136713743210,
            -0.07881140708923340,
            -0.07496929168701172,
            0.36653387546539307,
            -0.11792770028114319,
            0.33755394816398620,
            -0.09257731586694717,
            0.009545769542455673,
            -0.04660305380821228,
            0.013396577909588814,
            0.15035420656204224,
            -0.61903655529022220,
            -0.17708726227283478,
            -0.013831155374646187,
            0.010356694459915161,
            0.10595686733722687,
            -0.04540724307298660,
            0.0009019002318382263,
            -0.26157030463218690,
            0.18670830130577087,
            -0.059031642973423004,
            -0.11484433710575104,
            -0.36731621623039246,
            0.14339649677276610,
            1.26058232784271240,
            -0.015540368854999542,
            -0.07888511568307877,
            -0.009377516806125641,
            -0.15602213144302368,
            -0.12761303782463074,
            0.25213027000427246,
            0.92153555154800420,
            -0.18542146682739258,
            -0.21386396884918213,
            -1.57489061355590820,
            0.014670997858047485,
            0.35590082406997680,
            0.23226591944694520,
            0.29403144121170044,
            0.19039350748062134,
            0.12028850615024567,
            0.14649519324302673,
            -0.57438409328460690,
            1.51094436645507810,
            -0.06900059431791306,
            -0.09223778545856476,
            0.05437563359737396,
            0.12748995423316956,
            -0.07933007180690765,
            -0.81089299917221070,
            -0.47452667355537415,
            0.12268605083227158,
            0.40242570638656616,
            0.28311154246330260,
            0.27250385284423830,
            -0.23757700622081757,
            0.32199540734291077,
            -0.31787779927253723,
            0.24869447946548462,
            -0.32091945409774780,
            0.13392969965934753,
            0.024256711825728416,
            -0.003996938467025757,
            0.31115883588790894,
            -0.50246292352676390,
            -0.20639395713806152,
            0.03759238123893738,
            0.17185325920581818,
            -0.030085332691669464,
            0.048362910747528076,
            -0.62065368890762330,
            -0.020879443734884262,
            0.12434196472167969,
            0.040695954114198685,
            -0.50741922855377200,
            0.08081452548503876,
            0.14095300436019897,
            -0.15079917013645172,
            0.14225539565086365,
            -0.03339875489473343,
            0.25852018594741820,
            -0.41237697005271910,
            0.31924033164978030,
            -0.25935268402099610,
            -0.32131356000900270,
            -0.69814765453338620,
            -0.22040528059005737,
            0.05100163817405701,
            -0.15426829457283020,
            0.22865183651447296,
            -0.47168889641761780,
            -0.31051588058471680,
            0.048167359083890915,
            -0.21201044321060180,
            0.10385461151599884,
            0.18401621282100677,
            0.12361292541027069,
            0.30423548817634580,
            -0.17449685931205750,
            0.31314414739608765,
            0.04636995494365692,
            -0.41227555274963380,
            0.045520931482315063,
            0.53545415401458740,
            0.13680092990398407,
            -0.36478853225708010,
            0.40942415595054626,
            0.23506653308868408,
            1.04005861282348630,
            -0.27912554144859314,
            0.06439234316349030,
            0.18784391880035400,
            -0.17379683256149292,
            -0.18675222992897034,
            -0.34193059802055360,
            -0.38465169072151184,
            0.34344249963760376,
            0.23465913534164430,
            0.032892048358917236,
            -0.28188407421112060,
            -0.11934018135070801,
            0.022270366549491882,
            0.07610686123371124,
            0.16484493017196655,
            0.28013628721237180,
            -0.06442663818597794,
            -0.13154838979244232,
            0.38454037904739380,
            -0.15238852798938750,
            -0.34664541482925415,
            0.06196160987019539,
            0.21366979181766510,
            -0.23718816041946410,
            0.29661375284194946,
            0.07324250787496567,
            0.02359824627637863,
            -0.29029119014739990,
            -0.04170669615268707,
            -0.13716265559196472,
            -0.18890701234340668,
            -0.71853756904602050,
            -0.14910481870174408,
            -0.28566592931747437,
            0.17772153019905090,
            0.08817628026008606,
            -0.034255996346473694,
            -0.23667897284030914,
            -0.62015527486801150,
            0.20481406152248383,
            0.19941198825836182,
            -0.11482881009578705,
            0.006309971213340759,
            0.42098861932754517,
            0.03637159615755081,
            0.42487934231758120,
            -0.13934084773063660,
            -0.32979014515876770,
            0.13939698040485382,
            0.15597808361053467,
            0.18135486543178558,
            -0.73175537586212160,
            -0.26711130142211914,
            -0.09930166602134705,
            -0.30019181966781616,
            0.27222818136215210,
            -0.13047066330909730,
            0.21958050131797790,
            -0.92940568923950200,
            0.46761587262153625,
            0.002422422170639038,
            0.06002846360206604,
            -0.07387303560972214,
            -0.14259713888168335,
            -0.52521455287933350,
            0.21675816178321838,
            -0.26278591156005860,
            -0.029557587578892708,
            -0.39842849969863890,
            -0.21753847599029540,
        ],
        "clip_embeddings_magnitude": 10.904964447021484,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[255, 255, 255]",
        "video_length": None,
        "in_trashcan": False,
        "removed": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.441,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "0",
        "size": 4303517,
        "subjectDistance": 1.356,
        "width": 4032,
        "main_file_id": "e21b9ade718afdbe931462d837b74d1c1",
    },
    {
        "thumbnail_big": "thumbnails_big/a5bcc802a708c07c18816d1b480a8b7d1.webp",
        "square_thumbnail": "square_thumbnails/a5bcc802a708c07c18816d1b480a8b7d1.webp",
        "square_thumbnail_small": "square_thumbnails_small/a5bcc802a708c07c18816d1b480a8b7d1.webp",
        "added_on": "2023-06-16 16:30:52.549542 +00:00",
        "exif_gps_lat": -33.9432611111111,
        "exif_gps_lon": 151.263833333333,
        "exif_timestamp": "2017-08-17 09:31:53.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [151.263833, -33.943261],
            "features": [
                {
                    "id": "poi.695784709457",
                    "text": "Mahon Rock Pool",
                    "type": "Feature",
                    "center": [151.263303, -33.94292],
                    "context": [
                        {
                            "id": "locality.269412878",
                            "text": "Maroubra",
                            "wikidata": "Q2914843",
                            "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                        },
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.263303, -33.94292],
                    },
                    "relevance": 1,
                    "place_name": "Mahon Rock Pool, Marine Pde., Sydney, New South Wales, Australia",
                    "place_type": ["poi"],
                    "properties": {
                        "address": "Marine Pde.",
                        "category": "swimming pool, pool, swim club",
                        "landmark": True,
                        "foursquare": "4b550d36f964a52055d927e3",
                    },
                },
                {
                    "id": "locality.269412878",
                    "bbox": [151.226804557, -33.958002321, 151.292531935, -33.93283624],
                    "text": "Maroubra",
                    "type": "Feature",
                    "center": [151.2575, -33.9475],
                    "context": [
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {"type": "Point", "coordinates": [151.2575, -33.9475]},
                    "relevance": 1,
                    "place_name": "Maroubra, New South Wales, Australia",
                    "place_type": ["locality"],
                    "properties": {
                        "wikidata": "Q2914843",
                        "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                    },
                },
                {
                    "id": "place.24496142",
                    "bbox": [150.520934139, -34.11717528, 151.369884128, -33.562644328],
                    "text": "Sydney",
                    "type": "Feature",
                    "center": [151.216454, -33.854816],
                    "context": [
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.216454, -33.854816],
                    },
                    "relevance": 1,
                    "place_name": "Sydney, New South Wales, Australia",
                    "place_type": ["place"],
                    "properties": {
                        "wikidata": "Q3130",
                        "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                    },
                },
                {
                    "id": "region.33806",
                    "bbox": [140.999265, -37.5097258, 159.200456, -28.1370359],
                    "text": "New South Wales",
                    "type": "Feature",
                    "center": [147.014694071448, -32.168971672412],
                    "context": [
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [147.014694071448, -32.168971672412],
                    },
                    "relevance": 1,
                    "place_name": "New South Wales, Australia",
                    "place_type": ["region"],
                    "properties": {
                        "wikidata": "Q3224",
                        "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                        "short_code": "AU-NSW",
                    },
                },
                {
                    "id": "country.8718",
                    "bbox": [112.8256904, -54.8327658, 159.200456, -9.0436707],
                    "text": "Australia",
                    "type": "Feature",
                    "center": [134.489562606981, -25.7349684916223],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [134.489562606981, -25.7349684916223],
                    },
                    "relevance": 1,
                    "place_name": "Australia",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q408",
                        "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                        "short_code": "au",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Mahon Rock Pool Maroubra Sydney New South Wales Australia",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "natural light",
                    "open area",
                    "far away horizon",
                    "natural",
                    "sunny",
                    "boating",
                    "moist",
                    "swimming",
                    "ocean",
                ],
                "categories": ["marsh", "tundra", "lagoon"],
                "environment": "outdoor",
            }
        },
        "search_captions": "marsh , tundra , lagoon , outdoor",
        "search_location": "Mahon Rock Pool Maroubra Sydney New South Wales Australia",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            0.12998622655868530,
            0.13258025050163270,
            -0.058508455753326416,
            0.22892819344997406,
            -0.023302078247070312,
            -0.44510543346405030,
            0.43837052583694460,
            0.40075856447219850,
            0.42637223005294800,
            -0.18267586827278137,
            -0.32148724794387820,
            -0.03853927552700043,
            -0.059241898357868195,
            -0.12733995914459229,
            -0.09387104958295822,
            -0.43112272024154663,
            -1.19327056407928470,
            -0.014609143137931824,
            0.21503102779388428,
            -0.13053396344184875,
            0.28765681385993960,
            0.52494764328002930,
            0.42401337623596190,
            0.011837676167488098,
            0.09145589917898178,
            0.22389806807041168,
            -0.036226868629455566,
            0.09836312383413315,
            -0.10595801472663880,
            0.20653992891311646,
            0.26259601116180420,
            -0.021937429904937744,
            -0.37160769104957580,
            0.06919395923614502,
            0.17206385731697083,
            0.05610951408743858,
            -0.25814598798751830,
            0.25112861394882200,
            0.13220319151878357,
            0.22801768779754640,
            -0.28782862424850464,
            0.52349138259887700,
            0.11140240728855133,
            0.21639062464237213,
            0.16601549088954926,
            -1.26960456371307370,
            0.03704804554581642,
            0.15477925539016724,
            0.32343593239784240,
            0.05724513530731201,
            0.23438473045825958,
            0.34855538606643677,
            0.30527845025062560,
            0.047757647931575775,
            -0.14104431867599487,
            0.28336334228515625,
            0.12284316122531891,
            0.09858018159866333,
            -0.64525383710861210,
            -0.28189745545387270,
            -0.53113412857055660,
            -0.02064698189496994,
            -0.029455430805683136,
            0.31310641765594480,
            -0.01327805221080780,
            -0.05426792800426483,
            -0.12057886272668839,
            1.52634048461914060,
            -0.23908194899559020,
            0.03377249091863632,
            -0.31758821010589600,
            0.003850087523460388,
            -0.44408404827117920,
            -0.58076667785644530,
            0.022277936339378357,
            0.21131259202957153,
            -0.17391380667686462,
            -0.28281235694885254,
            0.19357018172740936,
            -0.047077856957912445,
            -0.022741809487342834,
            0.22117993235588074,
            -0.06992056965827942,
            0.18571671843528748,
            0.06705777347087860,
            0.24204009771347046,
            0.11218206584453583,
            -0.03229340910911560,
            0.20023432374000550,
            -0.08615788817405700,
            0.29021203517913820,
            0.11631032079458237,
            -6.34464693069458000,
            -0.37301033735275270,
            -0.08067938685417175,
            0.23319250345230103,
            -0.11491980403661728,
            -0.22198167443275452,
            -0.23849581182003020,
            -1.53279995918273930,
            0.25409278273582460,
            -0.37143617868423460,
            0.12711408734321594,
            0.18552611768245697,
            0.13125161826610565,
            -0.03438793122768402,
            0.12672650814056396,
            -0.30418828129768370,
            0.05400300398468971,
            0.22966152429580688,
            0.10130165517330170,
            -0.18591997027397156,
            0.16613908112049103,
            0.08785743266344070,
            -0.09753852337598800,
            -0.19177854061126710,
            -0.54351925849914550,
            -0.029669322073459625,
            0.008011367172002792,
            0.06446681916713715,
            0.23291164636611938,
            -0.78047883510589600,
            -0.35974910855293274,
            -0.57393378019332890,
            0.005923539400100708,
            -0.07117588073015213,
            0.13031338155269623,
            -0.43962341547012330,
            -0.75585317611694340,
            0.27976679801940920,
            -0.005890890955924988,
            0.16367265582084656,
            0.010072827339172363,
            0.86911255121231080,
            -0.50223058462142940,
            0.09843732416629791,
            -0.03996431455016136,
            -0.25243335962295530,
            0.011986486613750458,
            0.07025257498025894,
            -0.15618172287940980,
            -0.13723298907279968,
            0.14785155653953552,
            -0.07476790249347687,
            0.011668689548969269,
            0.15818738937377930,
            -0.22708828747272491,
            1.15767204761505130,
            -0.24034819006919860,
            0.06645347177982330,
            0.03723381087183952,
            0.13653486967086792,
            -0.91293966770172120,
            0.061923325061798096,
            0.020089279860258102,
            -0.19603200256824493,
            0.54111683368682860,
            0.08232687413692474,
            -0.20884832739830017,
            0.34021350741386414,
            -0.87326097488403320,
            -0.27245533466339110,
            0.30318510532379150,
            0.30751353502273560,
            0.25488168001174927,
            -0.19319717586040497,
            1.10999667644500730,
            0.32085287570953370,
            0.19622525572776794,
            -0.29783028364181520,
            -0.21281230449676514,
            0.002480059862136841,
            0.16586032509803772,
            0.16510939598083496,
            -0.25083601474761963,
            0.01780378818511963,
            -0.23946386575698853,
            0.26920223236083984,
            -0.60473775863647460,
            0.71488064527511600,
            0.90620148181915280,
            -0.11498169600963593,
            -0.11332808434963226,
            0.29238957166671753,
            -0.28703141212463380,
            -0.08944821357727051,
            0.33648857474327090,
            -0.27088621258735657,
            0.056357257068157196,
            0.06953722238540650,
            -0.12937217950820923,
            -0.34909275174140930,
            0.0033053942024707794,
            0.36867564916610720,
            0.02737647294998169,
            -0.40904921293258667,
            0.15042823553085327,
            -0.23831282556056976,
            1.08098745346069340,
            -0.14632245898246765,
            -0.10184669494628906,
            -0.45605412125587463,
            -0.26751014590263367,
            -0.19427978992462158,
            -0.07291503250598907,
            -0.23394347727298737,
            -0.39399421215057373,
            0.21800534427165985,
            0.08165672421455383,
            0.31118094921112060,
            -0.03596162423491478,
            0.56992232799530030,
            -0.25306987762451170,
            -0.013975441455841064,
            -0.13325847685337067,
            0.19483233988285065,
            0.10027952492237091,
            0.57050353288650510,
            0.07020722329616547,
            -0.30141943693161010,
            0.10414308309555054,
            0.39053773880004883,
            0.13395856320858002,
            0.06220602989196777,
            -0.39614889025688170,
            0.021074017509818077,
            -0.27187311649322510,
            0.50517594814300540,
            0.14774698019027710,
            0.35505199432373047,
            -0.014332786202430725,
            0.16666226089000702,
            0.16399480402469635,
            0.09917092323303223,
            0.35650873184204100,
            -1.40380215644836430,
            -0.026044342666864395,
            -0.19442640244960785,
            -0.24114309251308440,
            0.058344028890132904,
            0.12207233905792236,
            -0.16192662715911865,
            0.09302338957786560,
            0.49859148263931274,
            -0.14120854437351227,
            -0.05409412086009979,
            -0.21078500151634216,
            0.32789957523345950,
            0.17087182402610780,
            0.03868192434310913,
            -0.58889353275299070,
            0.18010029196739197,
            0.04883924126625061,
            0.26769936084747314,
            -0.23523572087287903,
            0.26934176683425903,
            -0.23642563819885254,
            0.12310450524091720,
            0.89556938409805300,
            -0.06872670352458954,
            -0.04263883829116821,
            0.17438516020774840,
            0.25022634863853455,
            -0.06414982676506042,
            0.17062856256961823,
            -0.67373126745224000,
            0.33244323730468750,
            -0.11403056979179382,
            -0.28086948394775390,
            -0.023052534088492393,
            0.10679151117801666,
            0.13404421508312225,
            0.12281967699527740,
            -0.48176917433738710,
            -0.50348985195159910,
            0.19038720428943634,
            0.06314077228307724,
            0.12262192368507385,
            -0.35703650116920470,
            0.24681422114372253,
            -0.07084030658006668,
            0.13866774737834930,
            0.020786508917808533,
            0.48234757781028750,
            0.18154349923133850,
            0.24811989068984985,
            -0.47986146807670593,
            -0.26600340008735657,
            -0.79610115289688110,
            -0.44987118244171140,
            0.03849541395902634,
            -0.26184004545211790,
            0.42152988910675050,
            -0.30942755937576294,
            0.14844314754009247,
            -0.12019725143909454,
            1.18861508369445800,
            0.02964150905609131,
            -0.38321954011917114,
            -0.17666542530059814,
            -0.24750977754592896,
            -0.18742603063583374,
            0.23742599785327910,
            -0.13876700401306152,
            0.53921639919281010,
            0.28352069854736330,
            0.13867411017417908,
            -0.07083784788846970,
            0.53155958652496340,
            -0.008131757378578186,
            -0.20227709412574768,
            0.08842383325099945,
            0.86737281084060670,
            -0.29989498853683470,
            0.09684963524341583,
            -0.031620755791664124,
            0.58049958944320680,
            0.11073039472103119,
            -0.25317376852035520,
            0.56119495630264280,
            0.34039902687072754,
            1.21799755096435550,
            -0.021552175283432007,
            -0.15119931101799010,
            -0.054917752742767334,
            0.80401933193206790,
            0.010184556245803833,
            0.06551001965999603,
            0.19289986789226532,
            -0.21603244543075562,
            0.025988996028900146,
            -0.65018039941787720,
            0.50120383501052860,
            -0.26873117685317993,
            0.19879785180091858,
            -0.26082211732864380,
            0.46192330121994020,
            -0.55225759744644170,
            0.01180829107761383,
            0.05070953071117401,
            -0.67910110950469970,
            -0.04475890100002289,
            0.36456465721130370,
            0.13348321616649628,
            -0.01747957617044449,
            -0.13040468096733093,
            -0.16885089874267578,
            0.33254384994506836,
            -0.29955965280532837,
            -0.26608777046203613,
            -0.10515909641981125,
            -0.32794988155364990,
            -0.05360160768032074,
            -0.21728354692459106,
            -0.39240026473999023,
            0.33821657299995420,
            -0.008709043264389038,
            -0.43232405185699463,
            0.63957405090332030,
            0.35856172442436220,
            0.45638042688369750,
            -0.13032492995262146,
            0.46423870325088500,
            0.29733401536941530,
            0.21055299043655396,
            0.33571115136146545,
            0.27673989534378050,
            -1.99598908424377440,
            -0.43283250927925110,
            0.27975231409072876,
            -0.27850526571273804,
            0.48566606640815735,
            0.14831756055355072,
            0.12112566083669662,
            0.37299168109893800,
            -0.36536252498626710,
            0.51137733459472660,
            0.26767280697822570,
            -0.35320448875427246,
            0.13971213996410370,
            0.01589038036763668,
            -0.30416059494018555,
            -0.35622701048851013,
            -0.29882031679153440,
            -0.0055990517139434814,
            -0.13705015182495117,
            0.56266194581985470,
            -0.38767093420028687,
            -0.53967058658599850,
            0.06725452840328217,
            -1.21143281459808350,
            0.22121112048625946,
            0.43655356764793396,
            0.33551204204559326,
            -0.27671134471893310,
            -0.57174313068389890,
            -0.058216191828250885,
            0.06912264972925186,
            -0.85613191127777100,
            0.19724097847938538,
            0.16659013926982880,
            0.14675720036029816,
            0.24287590384483337,
            -0.25835406780242920,
            0.20815043151378632,
            -0.42670011520385740,
            0.39319023489952090,
            0.32358986139297485,
            0.025813337415456772,
            -0.048157237470149994,
            -0.35826218128204346,
            0.04717639088630676,
            0.30715617537498474,
            -0.25429004430770874,
            -0.10547082126140594,
            0.02966500073671341,
            0.30983048677444460,
            -0.21249084174633026,
            -0.19436784088611603,
            0.77192759513854980,
            -0.53250586986541750,
            0.12887206673622130,
            0.32633990049362180,
            -1.24625861644744870,
            -0.16218033432960510,
            -0.13100118935108185,
            -0.11232861876487732,
            0.62874174118041990,
            -0.02767990529537201,
            -0.05274036154150963,
            -0.53563487529754640,
            -0.64365452527999880,
            -0.05103348195552826,
            0.08929728716611862,
            -0.40029305219650270,
            -0.10031442344188690,
            0.31065917015075684,
            -0.21383905410766602,
            0.14335599541664124,
            -0.09037648141384125,
            -0.17714662849903107,
            0.33824056386947630,
            -0.82754230499267580,
            0.16252911090850830,
            -0.07532244920730591,
            -0.14527970552444458,
            -0.22860543429851532,
            -0.30257803201675415,
            0.047085925936698914,
            0.17316375672817230,
            0.13065533339977264,
            -0.17600929737091064,
            0.13690154254436493,
            -0.20214480161666870,
            0.01934470236301422,
            0.12377672642469406,
            -0.06723305583000183,
            0.22328042984008790,
            -0.49700859189033510,
            -0.34658029675483704,
            0.20576259493827820,
            -0.27207553386688230,
            -0.22085019946098328,
            -0.38435065746307373,
            0.44076967239379883,
            0.22373658418655396,
            -0.046322643756866455,
            0.18001255393028260,
            0.15259465575218200,
            0.17097039520740510,
            -0.23130619525909424,
            0.29231351613998413,
            -0.37276223301887510,
            -0.16314452886581420,
            0.08766435086727142,
            -0.41216766834259033,
            -0.21740865707397460,
            -0.05558343976736069,
            -0.41705510020256040,
            -0.020109981298446655,
            -0.36541312932968140,
            -0.38398233056068420,
            0.39583081007003784,
            0.13429638743400574,
            -0.41582357883453370,
            0.08929545432329178,
            0.37230169773101807,
            -0.10493122041225433,
            -0.21501919627189636,
            -0.18377599120140076,
            0.017690163105726242,
            -0.10214073956012726,
            0.50946366786956790,
            -0.30789539217948914,
            -0.52317154407501220,
            -0.20865441858768463,
            0.15374669432640076,
            0.21395552158355713,
            -0.42342543601989746,
            0.50638461112976070,
            0.33827340602874756,
            0.05084151029586792,
            0.004318922758102417,
            0.18277740478515625,
            0.33151501417160034,
            -0.54885160923004150,
            0.30941945314407350,
            0.16642820835113525,
            -0.52071034908294680,
            -0.20474663376808167,
            -0.01535847783088684,
            0.11818096041679382,
        ],
        "clip_embeddings_magnitude": 10.422953605651855,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[105, 144, 187]",
        "video_length": None,
        "in_trashcan": False,
        "removed": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "0",
        "size": 6467070,
        "subjectDistance": 2.229,
        "width": 4032,
        "main_file_id": "a5bcc802a708c07c18816d1b480a8b7d1",
    },
    {
        "thumbnail_big": "thumbnails_big/57dca8933514df1efafddf76004187cc1.webp",
        "square_thumbnail": "square_thumbnails/57dca8933514df1efafddf76004187cc1.webp",
        "square_thumbnail_small": "square_thumbnails_small/57dca8933514df1efafddf76004187cc1.webp",
        "added_on": "2023-06-16 16:30:56.866303 +00:00",
        "exif_gps_lat": -33.9417083333333,
        "exif_gps_lon": 151.265258333333,
        "exif_timestamp": "2017-08-17 10:32:47.000000 +00:00",
        "exif_json": None,
        "geolocation_json": {
            "type": "FeatureCollection",
            "query": [151.265258, -33.941708],
            "features": [
                {
                    "id": "poi.721554610670",
                    "text": "Mistral Point",
                    "type": "Feature",
                    "center": [151.26523, -33.941658],
                    "context": [
                        {
                            "id": "postcode.503310",
                            "text": "2035",
                            "mapbox_id": "dXJuOm1ieHBsYzpCNjRP",
                        },
                        {
                            "id": "locality.269412878",
                            "text": "Maroubra",
                            "wikidata": "Q2914843",
                            "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                        },
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.26523, -33.941658],
                    },
                    "relevance": 1,
                    "place_name": "Mistral Point, Sydney, New South Wales 2035, Australia",
                    "place_type": ["poi"],
                    "properties": {
                        "category": "historic site, historic",
                        "landmark": True,
                        "foursquare": "5958b8724420d86b1808f7bd",
                    },
                },
                {
                    "id": "postcode.503310",
                    "bbox": [151.205214, -33.958015, 151.265693, -33.931801],
                    "text": "2035",
                    "type": "Feature",
                    "center": [151.242438, -33.942906],
                    "context": [
                        {
                            "id": "locality.269412878",
                            "text": "Maroubra",
                            "wikidata": "Q2914843",
                            "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                        },
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.242438, -33.942906],
                    },
                    "relevance": 1,
                    "place_name": "2035, Maroubra, New South Wales, Australia",
                    "place_type": ["postcode"],
                    "properties": {"mapbox_id": "dXJuOm1ieHBsYzpCNjRP"},
                },
                {
                    "id": "locality.269412878",
                    "bbox": [151.226804557, -33.958002321, 151.292531935, -33.93283624],
                    "text": "Maroubra",
                    "type": "Feature",
                    "center": [151.2575, -33.9475],
                    "context": [
                        {
                            "id": "place.24496142",
                            "text": "Sydney",
                            "wikidata": "Q3130",
                            "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                        },
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {"type": "Point", "coordinates": [151.2575, -33.9475]},
                    "relevance": 1,
                    "place_name": "Maroubra, New South Wales, Australia",
                    "place_type": ["locality"],
                    "properties": {
                        "wikidata": "Q2914843",
                        "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                    },
                },
                {
                    "id": "place.24496142",
                    "bbox": [150.520934139, -34.11717528, 151.369884128, -33.562644328],
                    "text": "Sydney",
                    "type": "Feature",
                    "center": [151.216454, -33.854816],
                    "context": [
                        {
                            "id": "region.33806",
                            "text": "New South Wales",
                            "wikidata": "Q3224",
                            "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                            "short_code": "AU-NSW",
                        },
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        },
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [151.216454, -33.854816],
                    },
                    "relevance": 1,
                    "place_name": "Sydney, New South Wales, Australia",
                    "place_type": ["place"],
                    "properties": {
                        "wikidata": "Q3130",
                        "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                    },
                },
                {
                    "id": "region.33806",
                    "bbox": [140.999265, -37.5097258, 159.200456, -28.1370359],
                    "text": "New South Wales",
                    "type": "Feature",
                    "center": [147.014694071448, -32.168971672412],
                    "context": [
                        {
                            "id": "country.8718",
                            "text": "Australia",
                            "wikidata": "Q408",
                            "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                            "short_code": "au",
                        }
                    ],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [147.014694071448, -32.168971672412],
                    },
                    "relevance": 1,
                    "place_name": "New South Wales, Australia",
                    "place_type": ["region"],
                    "properties": {
                        "wikidata": "Q3224",
                        "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                        "short_code": "AU-NSW",
                    },
                },
                {
                    "id": "country.8718",
                    "bbox": [112.8256904, -54.8327658, 159.200456, -9.0436707],
                    "text": "Australia",
                    "type": "Feature",
                    "center": [134.489562606981, -25.7349684916223],
                    "geometry": {
                        "type": "Point",
                        "coordinates": [134.489562606981, -25.7349684916223],
                    },
                    "relevance": 1,
                    "place_name": "Australia",
                    "place_type": ["country"],
                    "properties": {
                        "wikidata": "Q408",
                        "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                        "short_code": "au",
                    },
                },
            ],
            "attribution": "NOTICE: © 2023 Mapbox and its suppliers. All rights reserved. Use of this data is subject to the Mapbox Terms of Service (https://www.mapbox.com/about/maps/). This response and the information it contains may not be retained. POI(s) provided by Foursquare.",
            "search_text": "Mistral Point 2035 Maroubra Sydney New South Wales Australia",
        },
        "captions_json": {
            "places365": {
                "attributes": [
                    "open area",
                    "natural light",
                    "far away horizon",
                    "sunny",
                    "rugged scene",
                    "dirt",
                    "natural",
                    "dry",
                    "clouds",
                ],
                "categories": [],
                "environment": "outdoor",
            }
        },
        "search_captions": "outdoor",
        "search_location": "Mistral Point 2035 Maroubra Sydney New South Wales Australia",
        "hidden": False,
        "public": False,
        "video": False,
        "clip_embeddings": [
            -0.36666020750999450,
            -0.04985070228576660,
            -0.55112200975418090,
            -0.02282443828880787,
            0.07433946430683136,
            -0.15077446401119232,
            -0.15087568759918213,
            0.59861290454864500,
            0.74118041992187500,
            0.10699653625488281,
            0.09809046983718872,
            -0.03829161822795868,
            0.18715769052505493,
            -0.19874982535839080,
            -0.17219249904155730,
            -0.31639525294303894,
            -1.24799549579620360,
            -0.18328364193439484,
            0.50648951530456540,
            0.03295477479696274,
            0.05792248249053955,
            -0.023687392473220825,
            0.28321290016174316,
            -0.24516502022743225,
            -0.14424744248390198,
            0.39068019390106200,
            0.07994443178176880,
            -0.12718169391155243,
            0.19193711876869202,
            -0.01991894096136093,
            -0.29576098918914795,
            0.08526518195867538,
            -0.38953876495361330,
            -0.11270611733198166,
            -0.12309470027685165,
            -0.18142205476760864,
            -0.22653748095035553,
            0.25507912039756775,
            0.52982282638549800,
            -0.36807811260223390,
            -0.52154517173767090,
            -0.040144920349121094,
            0.40785139799118040,
            -0.30712696909904480,
            0.22090484201908112,
            -2.02335238456726070,
            0.12097204476594925,
            0.28021758794784546,
            0.09183792769908905,
            0.15624284744262695,
            0.01185154914855957,
            0.22275637090206146,
            0.55167198181152340,
            -0.35499316453933716,
            0.17891690135002136,
            0.05891851335763931,
            0.11313964426517487,
            -0.24982094764709473,
            -0.44442304968833923,
            -0.30212301015853880,
            -0.49696791172027590,
            -0.21229097247123718,
            -0.08969736099243164,
            0.35271137952804565,
            -0.13295263051986694,
            -0.24579304456710815,
            -0.15918856859207153,
            1.22507643699646000,
            -0.47429224848747253,
            -0.14982843399047852,
            -0.19515639543533325,
            -0.18184053897857666,
            -0.10420016944408417,
            -0.27105495333671570,
            -0.014386080205440521,
            -0.19864511489868164,
            -0.59518003463745120,
            0.014985889196395874,
            -0.06511993706226349,
            -0.31187006831169130,
            0.06655596941709518,
            0.46725121140480040,
            -0.15730988979339600,
            0.21003738045692444,
            0.06053004041314125,
            0.18053501844406128,
            0.043053969740867615,
            -0.38710883259773254,
            -0.16783890128135680,
            -0.15172357857227325,
            0.09899577498435974,
            -0.08344091475009918,
            -6.26640892028808600,
            0.62121075391769410,
            0.35546118021011350,
            0.30253031849861145,
            -0.35551121830940247,
            -0.04457452893257141,
            -0.18457348644733430,
            -1.32966053485870360,
            0.17469060420989990,
            -0.33178430795669556,
            0.08215680718421936,
            0.06592759490013123,
            -0.25799661874771120,
            0.05711726099252701,
            -0.18006426095962524,
            -0.13938568532466888,
            0.35842615365982056,
            -0.07131820172071457,
            0.20586800575256348,
            -0.10146003961563110,
            -0.034379392862319946,
            0.09676564484834671,
            -0.39100694656372070,
            -0.19553266465663910,
            -0.39932283759117126,
            0.14101047813892365,
            0.24242374300956726,
            -0.14971837401390076,
            0.19587853550910950,
            -0.07761697471141815,
            -0.13720758259296417,
            -0.036738086491823196,
            0.02775958925485611,
            0.003398708999156952,
            0.32153791189193726,
            -0.29471915960311890,
            -0.67542463541030880,
            0.15028291940689087,
            -0.043420448899269104,
            -0.19056166708469390,
            0.029275819659233093,
            0.85994541645050050,
            -0.41359940171241760,
            -0.00037150830030441284,
            0.21370775997638702,
            0.10217175632715225,
            -0.15029510855674744,
            0.15498718619346620,
            0.14254488050937653,
            -0.12856674194335938,
            -0.12141317129135132,
            -0.21967242658138275,
            -0.22536158561706543,
            0.40473008155822754,
            -0.29137128591537476,
            1.18561625480651860,
            -0.30933171510696410,
            -0.04900578409433365,
            -0.22565384209156036,
            0.026661649346351624,
            -0.53087574243545530,
            -0.02157217264175415,
            0.61312061548233030,
            -0.68817430734634400,
            0.55277901887893680,
            -0.02949278987944126,
            -0.35691511631011963,
            0.17237737774848938,
            -0.84646338224411010,
            0.28129857778549194,
            -0.001386452466249466,
            0.13001629710197450,
            -0.34739860892295840,
            -0.10144264996051788,
            0.64412295818328860,
            0.38456526398658750,
            0.23173999786376953,
            -0.17515747249126434,
            0.020819609984755516,
            -0.32927608489990234,
            0.08890204876661300,
            -0.15161202847957610,
            -0.18559980392456055,
            -0.04398374259471893,
            -0.27180469036102295,
            0.11402454972267151,
            -0.30309695005416870,
            0.71401089429855350,
            0.58197832107543950,
            0.09439059346914291,
            -0.11577179282903671,
            0.33646234869956970,
            -0.22551852464675903,
            0.13584175705909730,
            0.21372529864311218,
            -0.58664178848266600,
            0.24065378308296204,
            0.34127143025398254,
            -0.17579154670238495,
            -0.33026531338691710,
            0.15201087296009064,
            0.36881905794143677,
            -0.50844454765319820,
            -0.48041981458663940,
            0.003377307206392288,
            -0.21604734659194946,
            1.22471618652343750,
            -0.34609639644622800,
            -0.07732010632753372,
            0.19707258045673370,
            0.03305445611476898,
            -0.25127333402633667,
            0.02786330133676529,
            -0.13784091174602509,
            -0.33934032917022705,
            0.11644668132066727,
            0.12870812416076660,
            0.28808489441871643,
            -0.060060858726501465,
            0.05354182422161102,
            -0.18899542093276978,
            0.08026752620935440,
            0.14663285017013550,
            -0.10402667522430420,
            -0.04774125665426254,
            0.78730720281600950,
            0.14746253192424774,
            -0.08459271490573883,
            -0.32546862959861755,
            0.32204133272171020,
            0.08961439132690430,
            0.05263507366180420,
            -0.65238183736801150,
            0.03257568180561066,
            -0.52708566188812260,
            0.38349610567092896,
            0.15065722167491913,
            -0.003457099199295044,
            0.05167556554079056,
            -0.36230301856994630,
            0.13933974504470825,
            0.31344616413116455,
            0.32701274752616880,
            -1.06047749519348140,
            0.03538133203983307,
            0.014965444803237915,
            0.14803899824619293,
            0.08960707485675812,
            -0.25507515668869020,
            -0.26133170723915100,
            0.22333431243896484,
            0.38788953423500060,
            -0.26071867346763610,
            0.34007954597473145,
            0.05404023081064224,
            0.24960926175117493,
            0.35853916406631470,
            -0.24324321746826172,
            -0.25807657837867737,
            0.15211161971092224,
            0.03374246507883072,
            0.09933222830295563,
            0.14579382538795470,
            0.09634265303611755,
            -0.15618667006492615,
            -0.020942021161317825,
            1.40221035480499270,
            -0.02753184735774994,
            -0.018054869025945663,
            0.15185260772705078,
            0.36876207590103150,
            -0.07963977754116058,
            0.21388293802738190,
            -0.57031232118606570,
            0.16593083739280700,
            -0.12364573776721954,
            -0.19139841198921204,
            -0.07277653366327286,
            -0.07489527761936188,
            0.06829735636711120,
            -0.09270213544368744,
            -0.58580970764160160,
            -0.57999855279922490,
            0.10248814523220062,
            0.07077595591545105,
            -0.11604766547679901,
            -0.10343541949987411,
            0.09502948075532913,
            0.07064349204301834,
            0.31945759057998660,
            0.26488274335861206,
            -0.11844316124916077,
            0.10092554986476898,
            0.05796369910240173,
            0.007035255432128906,
            -0.20717875659465790,
            -0.39001202583312990,
            -0.23531873524188995,
            0.029121950268745422,
            -0.31792175769805910,
            0.21073228120803833,
            -0.25988331437110900,
            0.01320233941078186,
            -0.04228278994560242,
            0.87615823745727540,
            0.23483057320117950,
            -0.14261351525783540,
            -0.03390306234359741,
            0.05797864496707916,
            -0.08534366637468338,
            0.60571086406707760,
            -0.40570425987243650,
            0.39349102973937990,
            -0.0029862821102142334,
            0.21820589900016785,
            0.17360526323318481,
            0.51648765802383420,
            0.10162493586540222,
            -0.09098815917968750,
            0.04716239869594574,
            0.85775423049926760,
            -0.11656519025564194,
            0.23683629930019380,
            0.07459381222724915,
            0.55665183067321780,
            -0.03265659511089325,
            -0.03649625927209854,
            0.85287141799926760,
            0.35186266899108887,
            0.036931782960891724,
            -0.26376897096633910,
            -0.45744919776916504,
            -0.09645552933216095,
            0.66262829303741460,
            -0.10217510163784027,
            0.08431930840015411,
            -0.050179481506347656,
            -0.12746801972389220,
            -0.37214517593383790,
            -0.06164243817329407,
            0.26156315207481384,
            -0.14883297681808472,
            0.16589079797267914,
            -0.35074496269226074,
            0.08279553055763245,
            -0.13153877854347230,
            0.16450478136539460,
            -0.13764882087707520,
            -0.20287595689296722,
            -0.046635668724775314,
            0.12855112552642822,
            0.24670921266078950,
            -0.08000148832798004,
            -0.09557560086250305,
            -0.25575160980224610,
            0.15930658578872680,
            -0.67159068584442140,
            -0.07150696963071823,
            0.17778603732585907,
            0.25455826520919800,
            -0.23019903898239136,
            -0.08271875232458115,
            -0.10421910881996155,
            0.55327570438385010,
            0.17031423747539520,
            -0.99103516340255740,
            0.73087739944458010,
            0.33844703435897827,
            0.61791002750396730,
            -0.018104268237948418,
            0.42206788063049316,
            -0.07971519231796265,
            0.06754805147647858,
            0.18134978413581848,
            0.07568907737731934,
            -1.62685477733612060,
            -0.38066196441650390,
            0.66141670942306520,
            -0.25981235504150390,
            0.55625867843627930,
            0.51772624254226680,
            0.24509307742118835,
            -0.20850536227226257,
            -0.16368716955184937,
            0.76303339004516600,
            -0.0018448233604431152,
            -0.05956418812274933,
            -0.13241642713546753,
            0.005002804100513458,
            -0.28848242759704590,
            -0.44567650556564330,
            -0.09337581694126129,
            0.34333360195159910,
            0.18656188249588013,
            0.39478647708892820,
            0.22161819040775300,
            -0.41303259134292600,
            -0.42747217416763306,
            -1.40258526802062990,
            0.58988147974014280,
            0.41526830196380615,
            0.22585415840148926,
            -0.047290802001953125,
            -0.40906193852424620,
            0.13364250957965850,
            0.36895215511322020,
            -0.32853290438652040,
            0.018866248428821564,
            0.021997720003128052,
            0.33384290337562560,
            0.12766578793525696,
            -0.25208842754364014,
            0.29037922620773315,
            -0.26148244738578796,
            0.03055279701948166,
            -0.048704586923122406,
            -0.019998198375105858,
            -0.22977681457996368,
            0.18012699484825134,
            0.05622486397624016,
            0.22875103354454040,
            -0.09111046046018600,
            -0.21855254471302032,
            -0.021557403728365898,
            -0.14998503029346466,
            -0.33238950371742250,
            -0.44446778297424316,
            0.64051526784896850,
            -0.13707451522350310,
            0.11501492559909820,
            0.30077239871025085,
            -1.04448294639587400,
            -0.75157833099365230,
            -0.31508189439773560,
            -0.18117314577102660,
            0.04961024224758148,
            0.020732292905449867,
            0.51410740613937380,
            -0.44715842604637146,
            -0.59480583667755130,
            0.25802063941955566,
            -0.005115009844303131,
            -0.66136705875396730,
            -0.37843626737594604,
            0.39065134525299070,
            -0.16299697756767273,
            -0.08189993351697922,
            0.07605299353599548,
            0.15921586751937866,
            0.55074018239974980,
            -0.66295832395553590,
            0.12967866659164430,
            0.17624089121818542,
            -0.23016670346260070,
            -0.24796481430530548,
            -0.45518487691879270,
            -0.11801701784133911,
            0.07801371812820435,
            0.02105349302291870,
            -0.15974965691566467,
            -0.039424389600753784,
            -0.56841480731964110,
            -0.24004876613616943,
            0.19917711615562440,
            0.05348219349980354,
            -0.09810043871402740,
            -0.06265527009963989,
            -0.0035811271518468857,
            0.44162738323211670,
            -0.20175644755363464,
            0.08200869709253311,
            -0.12142806500196457,
            0.46088671684265137,
            0.12649869918823242,
            -0.39095637202262880,
            0.16196821630001068,
            0.42821982502937317,
            0.53625297546386720,
            -0.10519468784332275,
            0.06364251673221588,
            -0.43340182304382324,
            -0.27793857455253600,
            0.07457497715950012,
            -0.17316223680973053,
            -0.13105086982250214,
            -0.11595485359430313,
            -0.43414521217346190,
            0.013297945261001587,
            -0.03564862906932831,
            -0.04748070240020752,
            0.43650120496749880,
            0.06940247118473053,
            -0.04091569781303406,
            -0.42648598551750183,
            0.44560009241104126,
            -0.27538335323333740,
            -0.24719163775444030,
            -0.39051297307014465,
            0.10344080626964569,
            -0.05663326010107994,
            0.26151871681213380,
            -0.47625967860221863,
            0.16123828291893005,
            -0.36013549566268920,
            0.011993957683444023,
            0.20137929916381836,
            -0.14949794113636017,
            0.36271947622299194,
            0.36080580949783325,
            0.16761866211891174,
            0.12525813281536102,
            0.41298842430114746,
            -0.17537128925323486,
            -0.43780979514122010,
            0.31959301233291626,
            0.56603193283081050,
            -1.01032650470733640,
            -0.23371657729148865,
            -0.31553673744201660,
            -0.010249286890029907,
        ],
        "clip_embeddings_magnitude": 10.27176284790039,
        "aspect_ratio": 1.33,
        "rating": 0,
        "dominant_color": "[152, 188, 233]",
        "video_length": None,
        "in_trashcan": False,
        "removed": False,
        "timestamp": None,
        "camera": "Pixel 2",
        "digitalZoomRatio": None,
        "focalLength35Equivalent": None,
        "focal_length": 4.442,
        "fstop": 1.8,
        "height": 3024,
        "iso": None,
        "lens": None,
        "shutter_speed": "0",
        "size": 8068575,
        "subjectDistance": 3.289,
        "width": 4032,
        "main_file_id": "57dca8933514df1efafddf76004187cc1",
    },
]


================================================
FILE: api/tests/fixtures/api_util/sunburst_expectation.py
================================================
expectation = {
    "name": "Places I've visited",
    "children": [
        {
            "name": "Australia",
            "children": [
                {
                    "name": "New South Wales",
                    "children": [{"name": "Sydney", "value": 4, "hex": "#57d3db"}],
                    "hex": "#b9db57",
                }
            ],
            "hex": "#57d3db",
        },
        {
            "name": "Canada",
            "children": [
                {
                    "name": "Ontario",
                    "children": [
                        {"name": "Peterborough County", "value": 1, "hex": "#c957db"}
                    ],
                    "hex": "#dbae57",
                }
            ],
            "hex": "#dbae57",
        },
        {
            "name": "Germany",
            "children": [
                {
                    "name": "Berlin",
                    "children": [
                        {"name": "Friedrichshain", "value": 1, "hex": "#db5f57"},
                        {"name": "Kreuzberg", "value": 1, "hex": "#69db57"},
                    ],
                    "hex": "#db579e",
                }
            ],
            "hex": "#57d3db",
        },
        {
            "name": "India",
            "children": [
                {
                    "name": "Ladakh",
                    "children": [{"name": "Leh", "value": 2, "hex": "#c957db"}],
                    "hex": "#5784db",
                }
            ],
            "hex": "#db579e",
        },
    ],
}


================================================
FILE: api/tests/fixtures/geocode/__init__.py
================================================


================================================
FILE: api/tests/fixtures/geocode/expectations/mapbox.py
================================================
from api.geocode import GEOCODE_VERSION

expectations = [
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Beach Road", "center": [-33.888012425, 151.275216500055]},
            {"text": "Bondi Beach", "center": [-33.888012425, 151.275216500055]},
            {"text": "Sydney", "center": [-33.888012425, 151.275216500055]},
            {"text": "New South Wales", "center": [-33.888012425, 151.275216500055]},
            {"text": "Australia", "center": [-33.888012425, 151.275216500055]},
        ],
        "places": [
            "Beach Road",
            "Bondi Beach",
            "Sydney",
            "New South Wales",
            "Australia",
        ],
        "address": "17 Beach Road, Bondi Beach New South Wales 2026, Australia",
        "center": [-33.888012425, 151.275216500055],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Fire Route 47", "center": [44.5540639, -78.1955566]},
            {"text": "Lakefield", "center": [44.5540639, -78.1955566]},
            {"text": "Peterborough County", "center": [44.5540639, -78.1955566]},
            {"text": "Ontario", "center": [44.5540639, -78.1955566]},
            {"text": "Canada", "center": [44.5540639, -78.1955566]},
        ],
        "places": [
            "Fire Route 47",
            "Lakefield",
            "Peterborough County",
            "Ontario",
            "Canada",
        ],
        "address": "2880 Fire Route 47, Lakefield, Ontario K0L 2H0, Canada",
        "center": [44.5540639, -78.1955566],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Roncalli", "center": [52.501711, 13.381502]},
            {"text": "Kreuzberg", "center": [52.501711, 13.381502]},
            {"text": "Berlin", "center": [52.501711, 13.381502]},
            {"text": "Germany", "center": [52.501711, 13.381502]},
        ],
        "places": ["Roncalli", "Kreuzberg", "Berlin", "Germany"],
        "address": "Roncalli, Mckernstr, Berlin, 10963, Germany",
        "center": [52.501711, 13.381502],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Lakeshore Road", "center": [33.913368523661, 78.45710763764029]},
            {"text": "Shachokol", "center": [33.913368523661, 78.45710763764029]},
            {"text": "Leh", "center": [33.913368523661, 78.45710763764029]},
            {"text": "Leh", "center": [33.913368523661, 78.45710763764029]},
            {"text": "Ladakh", "center": [33.913368523661, 78.45710763764029]},
            {"text": "India", "center": [33.913368523661, 78.45710763764029]},
        ],
        "places": [
            "Lakeshore Road",
            "Shachokol",
            "Leh",
            "Leh",
            "Ladakh",
            "India",
        ],
        "address": "Lakeshore Road ، 194201 Leh، India",
        "center": [33.913368523661, 78.45710763764029],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Mahon Rock Pool", "center": [-33.94292, 151.263303]},
            {"text": "Maroubra", "center": [-33.94292, 151.263303]},
            {"text": "Sydney", "center": [-33.94292, 151.263303]},
            {"text": "New South Wales", "center": [-33.94292, 151.263303]},
            {"text": "Australia", "center": [-33.94292, 151.263303]},
        ],
        "places": [
            "Mahon Rock Pool",
            "Maroubra",
            "Sydney",
            "New South Wales",
            "Australia",
        ],
        "address": "Mahon Rock Pool, Marine Pde., Sydney, New South Wales, Australia",
        "center": [-33.94292, 151.263303],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Main Bazaar", "center": [34.1622089, 77.585527]},
            {"text": "Chuchat Yakma", "center": [34.1622089, 77.585527]},
            {"text": "Leh", "center": [34.1622089, 77.585527]},
            {"text": "Leh", "center": [34.1622089, 77.585527]},
            {"text": "Ladakh", "center": [34.1622089, 77.585527]},
            {"text": "India", "center": [34.1622089, 77.585527]},
        ],
        "places": [
            "Main Bazaar",
            "Chuchat Yakma",
            "Leh",
            "Leh",
            "Ladakh",
            "India",
        ],
        "address": "Main Bazaar ، 194101 Leh، India",
        "center": [34.1622089, 77.585527],
    },
]


================================================
FILE: api/tests/fixtures/geocode/expectations/nominatim.py
================================================
from api.geocode import GEOCODE_VERSION

expectations = [
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Beach Road", "center": [-33.88801645, 151.27521180010973]},
            {"text": "Seven Ways", "center": [-33.88801645, 151.27521180010973]},
            {"text": "Bondi Beach", "center": [-33.88801645, 151.27521180010973]},
            {"text": "Eastern Suburbs", "center": [-33.88801645, 151.27521180010973]},
            {"text": "Sydney", "center": [-33.88801645, 151.27521180010973]},
            {"text": "New South Wales", "center": [-33.88801645, 151.27521180010973]},
            {"text": "Australia", "center": [-33.88801645, 151.27521180010973]},
        ],
        "places": [
            "Beach Road",
            "Seven Ways",
            "Bondi Beach",
            "Eastern Suburbs",
            "Sydney",
            "New South Wales",
            "Australia",
        ],
        "address": "17, Beach Road, Seven Ways, Bondi Beach, Eastern Suburbs, Sydney, Waverley Council, New South Wales, 2026, Australia",
        "center": [-33.88801645, 151.27521180010973],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {
                "text": "Fire Route 47",
                "center": [44.55373905094425, -78.19571323702382],
            },
            {"text": "Selwyn", "center": [44.55373905094425, -78.19571323702382]},
            {
                "text": "Peterborough County",
                "center": [44.55373905094425, -78.19571323702382],
            },
            {"text": "Ontario", "center": [44.55373905094425, -78.19571323702382]},
            {"text": "Canada", "center": [44.55373905094425, -78.19571323702382]},
        ],
        "places": [
            "Fire Route 47",
            "Selwyn",
            "Peterborough County",
            "Ontario",
            "Canada",
        ],
        "address": "3118, Fire Route 47, Selwyn, Peterborough County, Central Ontario, Ontario, K0L 2C0, Canada",
        "center": [44.55373905094425, -78.19571323702382],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {
                "text": "Möckernstraße",
                "center": [52.501606300000006, 13.381190860617572],
            },
            {"text": "Kreuzberg", "center": [52.501606300000006, 13.381190860617572]},
            {
                "text": "Friedrichshain-Kreuzberg",
                "center": [52.501606300000006, 13.381190860617572],
            },
            {"text": "Berlin", "center": [52.501606300000006, 13.381190860617572]},
            {"text": "Deutschland", "center": [52.501606300000006, 13.381190860617572]},
        ],
        "places": [
            "Möckernstraße",
            "Kreuzberg",
            "Friedrichshain-Kreuzberg",
            "Berlin",
            "Deutschland",
        ],
        "address": "Tempodrom, 10, Möckernstraße, Kreuzberg, Friedrichshain-Kreuzberg, Berlin, 10963, Deutschland",
        "center": [52.501606300000006, 13.381190860617572],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Lakeshore road", "center": [33.9132578, 78.4571752]},
            {"text": "Spangmik", "center": [33.9132578, 78.4571752]},
            {"text": "Leh Tehsil", "center": [33.9132578, 78.4571752]},
            {"text": "Ladakh", "center": [33.9132578, 78.4571752]},
            {"text": "India", "center": [33.9132578, 78.4571752]},
        ],
        "places": [
            "Lakeshore road",
            "Spangmik",
            "Leh Tehsil",
            "Ladakh",
            "India",
        ],
        "address": "Camp Water Mark, Lakeshore road, Spangmik, Leh Tehsil, Leh District, Ladakh, India",
        "center": [33.9132578, 78.4571752],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Marine Parade", "center": [-33.9430026, 151.26386704076833]},
            {"text": "Maroubra", "center": [-33.9430026, 151.26386704076833]},
            {"text": "Eastern Suburbs", "center": [-33.9430026, 151.26386704076833]},
            {"text": "Sydney", "center": [-33.9430026, 151.26386704076833]},
            {"text": "New South Wales", "center": [-33.9430026, 151.26386704076833]},
            {"text": "Australia", "center": [-33.9430026, 151.26386704076833]},
        ],
        "places": [
            "Marine Parade",
            "Maroubra",
            "Eastern Suburbs",
            "Sydney",
            "New South Wales",
            "Australia",
        ],
        "address": "Mahon Pool, Marine Parade, Maroubra, Eastern Suburbs, Sydney, Randwick City Council, New South Wales, 2035, Australia",
        "center": [-33.9430026, 151.26386704076833],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Main Bazaar", "center": [34.1621176, 77.585862]},
            {"text": "Leh", "center": [34.1621176, 77.585862]},
            {"text": "Leh Tehsil", "center": [34.1621176, 77.585862]},
            {"text": "Ladakh", "center": [34.1621176, 77.585862]},
            {"text": "India", "center": [34.1621176, 77.585862]},
        ],
        "places": ["Main Bazaar", "Leh", "Leh Tehsil", "Ladakh", "India"],
        "address": "Dry Fruit Market, Main Bazaar, Matsik Chulung, Leh, Leh Tehsil, Leh District, Ladakh, India",
        "center": [34.1621176, 77.585862],
    },
]


================================================
FILE: api/tests/fixtures/geocode/expectations/opencage.py
================================================
from api.geocode import GEOCODE_VERSION

expectations = [
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Beach Road", "center": [-33.8880165, 151.2752118]},
            {"text": "Bondi Beach", "center": [-33.8880165, 151.2752118]},
            {"text": "Waverley Council", "center": [-33.8880165, 151.2752118]},
            {"text": "Eastern Suburbs", "center": [-33.8880165, 151.2752118]},
            {"text": "New South Wales", "center": [-33.8880165, 151.2752118]},
            {"text": "Australia", "center": [-33.8880165, 151.2752118]},
        ],
        "places": [
            "Beach Road",
            "Bondi Beach",
            "Waverley Council",
            "Eastern Suburbs",
            "New South Wales",
            "Australia",
        ],
        "address": "17 Beach Road, Bondi Beach NSW 2026, Australia",
        "center": [-33.8880165, 151.2752118],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Fire Route 47", "center": [44.5537391, -78.1957132]},
            {"text": "Ontario", "center": [44.5537391, -78.1957132]},
            {"text": "Peterborough County", "center": [44.5537391, -78.1957132]},
            {"text": "Canada", "center": [44.5537391, -78.1957132]},
        ],
        "places": ["Fire Route 47", "Ontario", "Peterborough County", "Canada"],
        "address": "3118 Fire Route 47, Selwyn, ON K0L 2C0, Canada",
        "center": [44.5537391, -78.1957132],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Tempodrom", "center": [52.5016063, 13.3811909]},
            {"text": "Möckernstraße", "center": [52.5016063, 13.3811909]},
            {"text": "Kreuzberg", "center": [52.5016063, 13.3811909]},
            {"text": "Friedrichshain-Kreuzberg", "center": [52.5016063, 13.3811909]},
            {"text": "Berlin", "center": [52.5016063, 13.3811909]},
            {"text": "Germany", "center": [52.5016063, 13.3811909]},
        ],
        "places": [
            "Tempodrom",
            "Möckernstraße",
            "Kreuzberg",
            "Friedrichshain-Kreuzberg",
            "Berlin",
            "Germany",
        ],
        "address": "Tempodrom, Möckernstraße 10, 10963 Berlin, Germany",
        "center": [52.5016063, 13.3811909],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Camp Water Mark", "center": [33.9132578, 78.4571752]},
            {"text": "Lakeshore road", "center": [33.9132578, 78.4571752]},
            {"text": "Spangmik", "center": [33.9132578, 78.4571752]},
            {"text": "Ladakh", "center": [33.9132578, 78.4571752]},
            {"text": "Leh Tehsil", "center": [33.9132578, 78.4571752]},
            {"text": "India", "center": [33.9132578, 78.4571752]},
        ],
        "places": [
            "Camp Water Mark",
            "Lakeshore road",
            "Spangmik",
            "Ladakh",
            "Leh Tehsil",
            "India",
        ],
        "address": "Camp Water Mark, Lakeshore road, Leh district, Spangmik -, Ladakh, India",
        "center": [33.9132578, 78.4571752],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Mahon Pool", "center": [-33.9430026, 151.263867]},
            {"text": "Marine Parade", "center": [-33.9430026, 151.263867]},
            {"text": "Maroubra", "center": [-33.9430026, 151.263867]},
            {"text": "Randwick City Council", "center": [-33.9430026, 151.263867]},
            {"text": "Eastern Suburbs", "center": [-33.9430026, 151.263867]},
            {"text": "New South Wales", "center": [-33.9430026, 151.263867]},
            {"text": "Australia", "center": [-33.9430026, 151.263867]},
        ],
        "places": [
            "Mahon Pool",
            "Marine Parade",
            "Maroubra",
            "Randwick City Council",
            "Eastern Suburbs",
            "New South Wales",
            "Australia",
        ],
        "address": "Mahon Pool, Marine Parade, Maroubra NSW 2035, Australia",
        "center": [-33.9430026, 151.263867],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Dry Fruit Market", "center": [34.1621176, 77.585862]},
            {"text": "Main Bazaar", "center": [34.1621176, 77.585862]},
            {"text": "Ladakh", "center": [34.1621176, 77.585862]},
            {"text": "Leh Tehsil", "center": [34.1621176, 77.585862]},
            {"text": "India", "center": [34.1621176, 77.585862]},
        ],
        "places": [
            "Dry Fruit Market",
            "Main Bazaar",
            "Ladakh",
            "Leh Tehsil",
            "India",
        ],
        "address": "Dry Fruit Market, Main Bazaar, Leh district, Leh -, Ladakh, India",
        "center": [34.1621176, 77.585862],
    },
]


================================================
FILE: api/tests/fixtures/geocode/expectations/tomtom.py
================================================
from api.geocode import GEOCODE_VERSION

expectations = [
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Beach Road", "center": [-33.888145, 151.275085]},
            {"text": "Bondi Beach", "center": [-33.888145, 151.275085]},
            {"text": "New South Wales", "center": [-33.888145, 151.275085]},
            {"text": "Sydney", "center": [-33.888145, 151.275085]},
            {"text": "Australia", "center": [-33.888145, 151.275085]},
        ],
        "places": [
            "Beach Road",
            "Bondi Beach",
            "New South Wales",
            "Sydney",
            "Australia",
        ],
        "address": "17 Beach Road, Bondi Beach, New South Wales, 2026",
        "center": [-33.888145, 151.275085],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Fire Route 47", "center": [44.553463, -78.195114]},
            {"text": "Lakefield", "center": [44.553463, -78.195114]},
            {"text": "Canada", "center": [44.553463, -78.195114]},
        ],
        "places": ["Fire Route 47", "Lakefield", "Canada"],
        "address": "2876 Fire Route 47, Lakefield ON K0L 2H0",
        "center": [44.553463, -78.195114],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Möckernstraße", "center": [52.501957, 13.382298]},
            {"text": "Kreuzberg", "center": [52.501957, 13.382298]},
            {"text": "Berlin", "center": [52.501957, 13.382298]},
            {"text": "Deutschland", "center": [52.501957, 13.382298]},
        ],
        "places": ["Möckernstraße", "Kreuzberg", "Berlin", "Deutschland"],
        "address": "Möckernstraße 138, 10963 Berlin",
        "center": [52.501957, 13.382298],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Thiksey", "center": [33.913391, 78.457077]},
            {"text": "Ladakh", "center": [33.913391, 78.457077]},
            {"text": "Leh", "center": [33.913391, 78.457077]},
            {"text": "India", "center": [33.913391, 78.457077]},
        ],
        "places": ["Thiksey", "Ladakh", "Leh", "India"],
        "address": "Thiksey, Ladakh 194101, Ladakh",
        "center": [33.913391, 78.457077],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Marine Parade", "center": [-33.943535, 151.26181]},
            {"text": "Maroubra", "center": [-33.943535, 151.26181]},
            {"text": "New South Wales", "center": [-33.943535, 151.26181]},
            {"text": "Sydney", "center": [-33.943535, 151.26181]},
            {"text": "Australia", "center": [-33.943535, 151.26181]},
        ],
        "places": [
            "Marine Parade",
            "Maroubra",
            "New South Wales",
            "Sydney",
            "Australia",
        ],
        "address": "106 Marine Parade, Maroubra, New South Wales, 2035",
        "center": [-33.943535, 151.26181],
    },
    {
        "_v": GEOCODE_VERSION,
        "features": [
            {"text": "Leh Ladakh", "center": [34.16209, 77.585808]},
            {"text": "Ladakh", "center": [34.16209, 77.585808]},
            {"text": "Leh", "center": [34.16209, 77.585808]},
            {"text": "India", "center": [34.16209, 77.585808]},
        ],
        "places": ["Leh Ladakh", "Ladakh", "Leh", "India"],
        "address": "Leh Ladakh, Ladakh 194101, Ladakh",
        "center": [34.16209, 77.585808],
    },
]


================================================
FILE: api/tests/fixtures/geocode/responses/mapbox.py
================================================
responses = [
    {
        "id": "address.2007486836507642",
        "type": "Feature",
        "place_type": ["address"],
        "relevance": 1,
        "properties": {
            "accuracy": "rooftop",
            "mapbox_id": "dXJuOm1ieGFkcjo3NmQ1MTQzZi1kZmEwLTQ4NzAtYTAyNy0zYWY1MGJiZTIxYWU",
        },
        "text": "Beach Road",
        "place_name": "17 Beach Road, Bondi Beach New South Wales 2026, Australia",
        "center": [151.275216500055, -33.888012425],
        "geometry": {
            "type": "Point",
            "coordinates": [151.275216500055, -33.888012425],
        },
        "address": "17",
        "context": [
            {
                "id": "postcode.429582",
                "mapbox_id": "dXJuOm1ieHBsYzpCbzRP",
                "text": "2026",
            },
            {
                "id": "locality.259156494",
                "wikidata": "Q673418",
                "mapbox_id": "dXJuOm1ieHBsYzpEM0pxRGc",
                "text": "Bondi Beach",
            },
            {
                "id": "place.24496142",
                "wikidata": "Q3130",
                "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                "text": "Sydney",
            },
            {
                "id": "region.33806",
                "short_code": "AU-NSW",
                "wikidata": "Q3224",
                "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                "text": "New South Wales",
            },
            {
                "id": "country.8718",
                "short_code": "au",
                "wikidata": "Q408",
                "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                "text": "Australia",
            },
        ],
    },
    {
        "id": "address.1654238032706288",
        "type": "Feature",
        "place_type": ["address"],
        "relevance": 1,
        "properties": {
            "accuracy": "point",
            "mapbox_id": "dXJuOm1ieGFkcjoyOTlkZDc4Yy0wYWVlLTQ2ZGUtYmFkOC04ZDA0Y2VhYzNkZGQ",
        },
        "text": "Fire Route 47",
        "place_name": "2880 Fire Route 47, Lakefield, Ontario K0L 2H0, Canada",
        "center": [-78.1955566, 44.5540639],
        "geometry": {"type": "Point", "coordinates": [-78.1955566, 44.5540639]},
        "address": "2880",
        "context": [
            {
                "id": "postcode.2669825575",
                "mapbox_id": "dXJuOm1ieHBsYzpueUpPSnc",
                "text": "K0L 2H0",
            },
            {
                "id": "place.106145831",
                "wikidata": "Q114506323",
                "mapbox_id": "dXJuOm1ieHBsYzpCbE9vSnc",
                "text": "Lakefield",
            },
            {
                "id": "district.1140263",
                "wikidata": "Q730542",
                "mapbox_id": "dXJuOm1ieHBsYzpFV1lu",
                "text": "Peterborough County",
            },
            {
                "id": "region.17447",
                "short_code": "CA-ON",
                "wikidata": "Q1904",
                "mapbox_id": "dXJuOm1ieHBsYzpSQ2M",
                "text": "Ontario",
            },
            {
                "id": "country.8743",
                "short_code": "ca",
                "wikidata": "Q16",
                "mapbox_id": "dXJuOm1ieHBsYzpJaWM",
                "text": "Canada",
            },
        ],
    },
    {
        "id": "poi.1047972024770",
        "type": "Feature",
        "place_type": ["poi"],
        "relevance": 1,
        "properties": {
            "foursquare": "50d22a90e4b0d3035504ae2b",
            "landmark": True,
            "address": "Möckernstr",
            "category": "circus",
            "maki": "theatre",
        },
        "text": "Roncalli",
        "place_name": "Roncalli, Mckernstr, Berlin, 10963, Germany",
        "center": [13.381502, 52.501711],
        "geometry": {"coordinates": [13.381502, 52.501711], "type": "Point"},
        "context": [
            {
                "id": "postcode.5541434",
                "mapbox_id": "dXJuOm1ieHBsYzpWSTQ2",
                "text": "10963",
            },
            {
                "id": "locality.181160506",
                "mapbox_id": "dXJuOm1ieHBsYzpDc3hLT2c",
                "text": "Kreuzberg",
            },
            {
                "id": "place.115770",
                "short_code": "DE-BE",
                "wikidata": "Q64",
                "mapbox_id": "dXJuOm1ieHBsYzpBY1E2",
                "text": "Berlin",
            },
            {
                "id": "country.8762",
                "short_code": "de",
                "wikidata": "Q183",
                "mapbox_id": "dXJuOm1ieHBsYzpJam8",
                "text": "Germany",
            },
        ],
    },
    {
        "id": "address.4021415981422040",
        "type": "Feature",
        "place_type": ["address"],
        "relevance": 1,
        "properties": {"accuracy": "street"},
        "text": "Lakeshore Road",
        "place_name": "Lakeshore Road ، 194201 Leh، India",
        "center": [78.45710763764029, 33.913368523661],
        "geometry": {
            "type": "Point",
            "coordinates": [78.45710763764029, 33.913368523661],
        },
        "context": [
            {
                "id": "postcode.13119083",
                "mapbox_id": "dXJuOm1ieHBsYzp5QzVy",
                "text": "194201",
            },
            {
                "id": "locality.3711994475",
                "wikidata": "Q24912826",
                "mapbox_id": "dXJuOm1ieHBsYzozVUNLYXc",
                "text": "Shachokol",
            },
            {
                "id": "place.25135211",
                "wikidata": "Q230818",
                "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                "text": "Leh",
            },
            {
                "id": "district.3196523",
                "wikidata": "Q1921210",
                "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                "text": "Leh",
            },
            {
                "id": "region.222315",
                "short_code": "IN-LA",
                "wikidata": "Q200667",
                "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                "text": "Ladakh",
            },
            {
                "id": "country.8811",
                "short_code": "in",
                "wikidata": "Q668",
                "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                "text": "India",
            },
        ],
    },
    {
        "id": "poi.695784709457",
        "type": "Feature",
        "place_type": ["poi"],
        "relevance": 1,
        "properties": {
            "foursquare": "4b550d36f964a52055d927e3",
            "landmark": True,
            "address": "Marine Pde.",
            "category": "swimming pool, pool, swim club",
        },
        "text": "Mahon Rock Pool",
        "place_name": "Mahon Rock Pool, Marine Pde., Sydney, New South Wales, Australia",
        "center": [151.263303, -33.94292],
        "geometry": {"coordinates": [151.263303, -33.94292], "type": "Point"},
        "context": [
            {
                "id": "locality.269412878",
                "wikidata": "Q2914843",
                "mapbox_id": "dXJuOm1ieHBsYzpFQTdxRGc",
                "text": "Maroubra",
            },
            {
                "id": "place.24496142",
                "wikidata": "Q3130",
                "mapbox_id": "dXJuOm1ieHBsYzpBWFhJRGc",
                "text": "Sydney",
            },
            {
                "id": "region.33806",
                "short_code": "AU-NSW",
                "wikidata": "Q3224",
                "mapbox_id": "dXJuOm1ieHBsYzpoQTQ",
                "text": "New South Wales",
            },
            {
                "id": "country.8718",
                "short_code": "au",
                "wikidata": "Q408",
                "mapbox_id": "dXJuOm1ieHBsYzpJZzQ",
                "text": "Australia",
            },
        ],
    },
    {
        "id": "address.15438142488176",
        "type": "Feature",
        "place_type": ["address"],
        "relevance": 1,
        "properties": {"accuracy": "street"},
        "text": "Main Bazaar",
        "place_name": "Main Bazaar ، 194101 Leh، India",
        "center": [77.585527, 34.1622089],
        "geometry": {"type": "Point", "coordinates": [77.585527, 34.1622089]},
        "context": [
            {
                "id": "postcode.13053547",
                "mapbox_id": "dXJuOm1ieHBsYzp4eTVy",
                "text": "194101",
            },
            {
                "id": "locality.997100139",
                "wikidata": "Q24909733",
                "mapbox_id": "dXJuOm1ieHBsYzpPMjZLYXc",
                "text": "Chuchat Yakma",
            },
            {
                "id": "place.25135211",
                "wikidata": "Q230818",
                "mapbox_id": "dXJuOm1ieHBsYzpBWCtJYXc",
                "text": "Leh",
            },
            {
                "id": "district.3196523",
                "wikidata": "Q1921210",
                "mapbox_id": "dXJuOm1ieHBsYzpNTVpy",
                "text": "Leh",
            },
            {
                "id": "region.222315",
                "short_code": "IN-LA",
                "wikidata": "Q200667",
                "mapbox_id": "dXJuOm1ieHBsYzpBMlJy",
                "text": "Ladakh",
            },
            {
                "id": "country.8811",
                "short_code": "in",
                "wikidata": "Q668",
                "mapbox_id": "dXJuOm1ieHBsYzpJbXM",
                "text": "India",
            },
        ],
    },
]


================================================
FILE: api/tests/fixtures/geocode/responses/nominatim.py
================================================
responses = [
    {
        "osm_type": "way",
        "osm_id": 1078453262,
        "lat": "-33.88801645",
        "lon": "151.27521180010973",
        "display_name": "17, Beach Road, Seven Ways, Bondi Beach, Eastern Suburbs, Sydney, Waverley Council, New South Wales, 2026, Australia",
        "address": {
            "house_number": "17",
            "road": "Beach Road",
            "neighbourhood": "Seven Ways",
            "suburb": "Bondi Beach",
            "borough": "Eastern Suburbs",
            "city": "Sydney",
            "municipality": "Waverley Council",
            "state": "New South Wales",
            "ISO3166-2-lvl4": "AU-NSW",
            "postcode": "2026",
            "country": "Australia",
            "country_code": "au",
        },
        "boundingbox": [
            "-33.88809",
            "-33.8879428",
            "151.2751212",
            "151.2753024",
        ],
    },
    {
        "osm_type": "way",
        "osm_id": 79160787,
        "lat": "44.55373905094425",
        "lon": "-78.19571323702382",
        "display_name": "3118, Fire Route 47, Selwyn, Peterborough County, Central Ontario, Ontario, K0L 2C0, Canada",
        "address": {
            "house_number": "3118",
            "road": "Fire Route 47",
            "city": "Selwyn",
            "county": "Peterborough County",
            "state_district": "Central Ontario",
            "state": "Ontario",
            "ISO3166-2-lvl4": "CA-ON",
            "postcode": "K0L 2C0",
            "country": "Canada",
            "country_code": "ca",
        },
        "boundingbox": [
            "44.553689050944",
            "44.553789050944",
            "-78.195763237024",
            "-78.195663237024",
        ],
    },
    {
        "osm_type": "relation",
        "osm_id": 7776056,
        "lat": "52.501606300000006",
        "lon": "13.381190860617572",
        "display_name": "Tempodrom, 10, Möckernstraße, Kreuzberg, Friedrichshain-Kreuzberg, Berlin, 10963, Deutschland",
        "address": {
            "building": "Tempodrom",
            "house_number": "10",
            "road": "Möckernstraße",
            "suburb": "Kreuzberg",
            "borough": "Friedrichshain-Kreuzberg",
            "city": "Berlin",
            "ISO3166-2-lvl4": "DE-BE",
            "postcode": "10963",
            "country": "Deutschland",
            "country_code": "de",
        },
        "boundingbox": ["52.5010459", "52.5022072", "13.3803352", "13.3820754"],
    },
    {
        "osm_type": "node",
        "osm_id": 4362313292,
        "lat": "33.9132578",
        "lon": "78.4571752",
        "display_name": "Camp Water Mark, Lakeshore road, Spangmik, Leh Tehsil, Leh District, Ladakh, India",
        "address": {
            "tourism": "Camp Water Mark",
            "road": "Lakeshore road",
            "hamlet": "Spangmik",
            "county": "Leh Tehsil",
            "state_district": "Leh District",
            "state": "Ladakh",
            "ISO3166-2-lvl4": "IN-LA",
            "country": "India",
            "country_code": "in",
        },
        "boundingbox": ["33.9132078", "33.9133078", "78.4571252", "78.4572252"],
    },
    {
        "osm_type": "way",
        "osm_id": 5019363,
        "lat": "-33.9430026",
        "lon": "151.26386704076833",
        "display_name": "Mahon Pool, Marine Parade, Maroubra, Eastern Suburbs, Sydney, Randwick City Council, New South Wales, 2035, Australia",
        "address": {
            "leisure": "Mahon Pool",
            "road": "Marine Parade",
            "suburb": "Maroubra",
            "borough": "Eastern Suburbs",
            "city": "Sydney",
            "municipality": "Randwick City Council",
            "state": "New South Wales",
            "ISO3166-2-lvl4": "AU-NSW",
            "postcode": "2035",
            "country": "Australia",
            "country_code": "au",
        },
        "boundingbox": [
            "-33.9431832",
            "-33.9428627",
            "151.2636802",
            "151.2640019",
        ],
    },
    {
        "osm_type": "node",
        "osm_id": 3748713587,
        "lat": "34.1621176",
        "lon": "77.585862",
        "display_name": "Dry Fruit Market, Main Bazaar, Matsik Chulung, Leh, Leh Tehsil, Leh District, Ladakh, India",
        "address": {
            "amenity": "Dry Fruit Market",
            "road": "Main Bazaar",
            "quarter": "Matsik Chulung",
            "town": "Leh",
            "county": "Leh Tehsil",
            "state_district": "Leh District",
            "state": "Ladakh",
            "ISO3166-2-lvl4": "IN-LA",
            "country": "India",
            "country_code": "in",
        },
        "boundingbox": ["34.1620676", "34.1621676", "77.585812", "77.585912"],
    },
]


================================================
FILE: api/tests/fixtures/geocode/responses/opencage.py
================================================
responses = [
    {
        "annotations": {
            "DMS": {
                "lat": "33° 53' 16.85940'' S",
                "lng": "151° 16' 30.76248'' E",
            },
            "MGRS": "56HLH4050148921",
            "Maidenhead": "QF56pc36av",
            "Mercator": {"x": 16839879.547, "y": -3989951.723},
            "OSM": {
                "edit_url": "https://www.openstreetmap.org/edit?way=1078453262#map=16/-33.88802/151.27521",
                "note_url": "https://www.openstreetmap.org/note/new#map=16/-33.88802/151.27521&layers=N",
                "url": "https://www.openstreetmap.org/?mlat=-33.88802&mlon=151.27521#map=16/-33.88802/151.27521",
            },
            "UN_M49": {
                "regions": {
                    "AU": "036",
                    "AUSTRALASIA": "053",
                    "OCEANIA": "009",
                    "WORLD": "001",
                },
                "statistical_groupings": ["MEDC"],
            },
            "callingcode": 61,
            "currency": {
                "alternate_symbols": ["A$"],
                "decimal_mark": ".",
                "disambiguate_symbol": "A$",
                "html_entity": "$",
                "iso_code": "AUD",
                "iso_numeric": "036",
                "name": "Australian Dollar",
                "smallest_denomination": 5,
                "subunit": "Cent",
                "subunit_to_unit": 100,
                "symbol": "$",
                "symbol_first": 1,
                "thousands_separator": ",",
            },
            "flag": "🇦🇺",
            "geohash": "r3gx4qg5zzveb1g40rhz",
            "qibla": 277.46,
            "roadinfo": {
                "drive_on": "left",
                "road": "Beach Road",
                "speed_in": "km/h",
            },
            "sun": {
                "rise": {
                    "apparent": 1686517020,
                    "astronomical": 1686511680,
                    "civil": 1686515340,
                    "nautical": 1686513480,
                },
                "set": {
                    "apparent": 1686466320,
                    "astronomical": 1686471660,
                    "civil": 1686467940,
                    "nautical": 1686469800,
                },
            },
            "timezone": {
                "name": "Australia/Sydney",
                "now_in_dst": 0,
                "offset_sec": 36000,
                "offset_string": "+1000",
                "short_name": "AEST",
            },
            "what3words": {"words": "elbow.card.brick"},
        },
        "bounds": {
            "northeast": {"lat": -33.8879428, "lng": 151.2753024},
            "southwest": {"lat": -33.88809, "lng": 151.2751212},
        },
        "components": {
            "ISO_3166-1_alpha-2": "AU",
            "ISO_3166-1_alpha-3": "AUS",
            "ISO_3166-2": ["AU-NSW"],
            "_category": "building",
            "_type": "building",
            "borough": "Eastern Suburbs",
            "city": "Sydney",
            "continent": "Oceania",
            "country": "Australia",
            "country_code": "au",
            "house_number": "17",
            "municipality": "Waverley Council",
            "neighbourhood": "Seven Ways",
            "postcode": "2026",
            "road": "Beach Road",
            "state": "New South Wales",
            "state_code": "NSW",
            "suburb": "Bondi Beach",
        },
        "confidence": 10,
        "formatted": "17 Beach Road, Bondi Beach NSW 2026, Australia",
        "geometry": {"lat": -33.8880165, "lng": 151.2752118},
    },
    {
        "annotations": {
            "DMS": {
                "lat": "44° 33' 13.46076'' N",
                "lng": "78° 11' 44.56752'' W",
            },
            "MGRS": "17TQK2273137204",
            "Maidenhead": "FN04vn62mv",
            "Mercator": {"x": -8704706.98, "y": 5521549.602},
            "OSM": {
                "edit_url": "https://www.openstreetmap.org/edit?way=79160787#map=17/44.55374/-78.19571",
                "note_url": "https://www.openstreetmap.org/note/new#map=17/44.55374/-78.19571&layers=N",
                "url": "https://www.openstreetmap.org/?mlat=44.55374&mlon=-78.19571#map=17/44.55374/-78.19571",
            },
            "UN_M49": {
                "regions": {
                    "AMERICAS": "019",
                    "CA": "124",
                    "NORTHERN_AMERICA": "021",
                    "WORLD": "001",
                },
                "statistical_groupings": ["MEDC"],
            },
            "callingcode": 1,
            "currency": {
                "alternate_symbols": ["C$", "CAD$"],
                "decimal_mark": ".",
                "disambiguate_symbol": "C$",
                "html_entity": "$",
                "iso_code": "CAD",
                "iso_numeric": "124",
                "name": "Canadian Dollar",
                "smallest_denomination": 5,
                "subunit": "Cent",
                "subunit_to_unit": 100,
                "symbol": "$",
                "symbol_first": 1,
                "thousands_separator": ",",
            },
            "flag": "🇨🇦",
            "geohash": "drbmkwg87ffjtrftdgxt",
            "qibla": 55.39,
            "roadinfo": {
                "drive_on": "right",
                "road": "Fire Route 47",
                "speed_in": "km/h",
            },
            "sun": {
                "rise": {
                    "apparent": 1686475740,
                    "astronomical": 1686466920,
                    "civil": 1686473520,
                    "nautical": 1686470640,
                },
                "set": {
                    "apparent": 1686444960,
                    "astronomical": 1686453840,
                    "civil": 1686447180,
                    "nautical": 1686450060,
                },
            },
            "timezone": {
                "name": "America/Toronto",
                "now_in_dst": 1,
                "offset_sec": -14400,
                "offset_string": "-0400",
                "short_name": "EDT",
            },
            "what3words": {"words": "tables.grits.homage"},
        },
        "bounds": {
            "northeast": {"lat": 44.5537891, "lng": -78.1956632},
            "southwest": {"lat": 44.5536891, "lng": -78.1957632},
        },
        "components": {
            "ISO_3166-1_alpha-2": "CA",
            "ISO_3166-1_alpha-3": "CAN",
            "ISO_3166-2": ["CA-ON"],
            "_category": "building",
            "_type": "building",
            "city": "Selwyn",
            "continent": "North America",
            "country": "Canada",
            "country_code": "ca",
            "county": "Peterborough County",
            "house_number": "3118",
            "postcode": "K0L 2C0",
            "road": "Fire Route 47",
            "state": "Ontario",
            "state_code": "ON",
            "state_district": "Central Ontario",
        },
        "confidence": 10,
        "formatted": "3118 Fire Route 47, Selwyn, ON K0L 2C0, Canada",
        "geometry": {"lat": 44.5537391, "lng": -78.1957132},
    },
    {
        "annotations": {
            "DMS": {
                "lat": "52° 30' 5.78268'' N",
                "lng": "13° 22' 52.28724'' E",
            },
            "MGRS": "33UUU9011818062",
            "Maidenhead": "JO62qm50rj",
            "Mercator": {"x": 1489587.353, "y": 6857412.691},
            "NUTS": {
                "NUTS0": {"code": "DE"},
                "NUTS1": {"code": "DE3"},
                "NUTS2": {"code": "DE30"},
                "NUTS3": {"code": "DE300"},
            },
            "OSM": {
                "edit_url": "https://www.openstreetmap.org/edit?relation=7776056#map=17/52.50161/13.38119",
                "note_url": "https://www.openstreetmap.org/note/new#map=17/52.50161/13.38119&layers=N",
                "url": "https://www.openstreetmap.org/?mlat=52.50161&mlon=13.38119#map=17/52.50161/13.38119",
            },
            "UN_M49": {
                "regions": {
                    "DE": "276",
                    "EUROPE": "150",
                    "WESTERN_EUROPE": "155",
                    "WORLD": "001",
                },
                "statistical_groupings": ["MEDC"],
            },
            "callingcode": 49,
            "currency": {
                "alternate_symbols": [],
                "decimal_mark": ",",
                "html_entity": "€",
                "iso_code": "EUR",
                "iso_numeric": "978",
                "name": "Euro",
                "smallest_denomination": 1,
                "subunit": "Cent",
                "subunit_to_unit": 100,
                "symbol": "€",
                "symbol_first": 0,
                "thousands_separator": ".",
            },
            "flag": "🇩🇪",
            "geohash": "u33d8mxuh2g0deydr83r",
            "qibla": 136.64,
            "roadinfo": {
                "drive_on": "right",
                "road": "Möckernstraße",
                "speed_in": "km/h",
            },
            "sun": {
                "rise": {
                    "apparent": 1686451500,
                    "astronomical": 0,
                    "civil": 1686448560,
                    "nautical": 1686443820,
                },
                "set": {
                    "apparent": 1686511620,
                    "astronomical": 0,
                    "civil": 1686514620,
                    "nautical": 1686519420,
                },
            },
            "timezone": {
                "name": "Europe/Berlin",
                "now_in_dst": 1,
                "offset_sec": 7200,
                "offset_string": "+0200",
                "short_name": "CEST",
            },
            "what3words": {"words": "closet.elated.pokers"},
            "wikidata": "Q896180",
        },
        "bounds": {
            "northeast": {"lat": 52.5022072, "lng": 13.3820754},
            "southwest": {"lat": 52.5010459, "lng": 13.3803352},
        },
        "components": {
            "ISO_3166-1_alpha-2": "DE",
            "ISO_3166-1_alpha-3": "DEU",
            "ISO_3166-2": ["DE-BE"],
            "_category": "building",
            "_type": "building",
            "borough": "Friedrichshain-Kreuzberg",
            "building": "Tempodrom",
            "city": "Berlin",
            "continent": "Europe",
            "country": "Germany",
            "country_code": "de",
            "house_number": "10",
            "political_union": "European Union",
            "postcode": "10963",
            "road": "Möckernstraße",
            "state": "Berlin",
            "state_code": "BE",
            "suburb": "Kreuzberg",
        },
        "confidence": 10,
        "formatted": "Tempodrom, Möckernstraße 10, 10963 Berlin, Germany",
        "geometry": {"lat": 52.5016063, "lng": 13.3811909},
    },
    {
        "annotations": {
            "DMS": {
                "lat": "33° 54' 47.72808'' N",
                "lng": "78° 27' 25.83072'' E",
            },
            "MGRS": "44SKC6490755450",
            "Maidenhead": "MM93fv49ue",
            "Mercator": {"x": 8733812.792, "y": 3993321.42},
            "OSM": {
                "edit_url": "https://www.openstreetmap.org/edit?node=4362313292#map=16/33.91326/78.45718",
                "note_url": "https://www.openstreetmap.org/note/new#map=16/33.91326/78.45718&layers=N",
                "url": "https://www.openstreetmap.org/?mlat=33.91326&mlon=78.45718#map=16/33.91326/78.45718",
            },
            "UN_M49": {
                "regions": {
                    "ASIA": "142",
                    "IN": "356",
                    "SOUTHERN_ASIA": "034",
                    "WORLD": "001",
                },
                "statistical_groupings": ["LEDC"],
            },
            "callingcode": 91,
            "currency": {
                "alternate_symbols": ["Rs", "৳", "૱", "௹", "रु", "₨"],
                "decimal_mark": ".",
                "html_entity": "&#x20b9;",
                "iso_code": "INR",
                "iso_numeric": "356",
                "name": "Indian Rupee",
                "smallest_denomination": 50,
                "subunit": "Paisa",
                "subunit_to_unit": 100,
                "symbol": "₹",
                "symbol_first": 1,
                "thousands_separator": ",",
            },
            "flag": "🇮🇳",
            "geohash": "twpbcmdz09qn8nexuv7e",
            "qibla": 259.99,
            "roadinfo": {
                "drive_on": "left",
                "road": "Lakeshore road",
                "speed_in": "km/h",
            },
            "sun": {
                "rise": {
                    "apparent": 1686526560,
                    "astronomical": 1686520320,
                    "civil": 1686524820,
                    "nautical": 1686522660,
                },
                "set": {
                    "apparent": 1686491760,
                    "astronomical": 1686497940,
                    "civil": 1686493500,
                    "nautical": 1686495600,
                },
            },
            "timezone": {
                "name": "Asia/Kolkata",
                "now_in_dst": 0,
                "offset_sec": 19800,
                "offset_string": "+0530",
                "short_name": "IST",
            },
            "what3words": {"words": "forklifts.callers.barcode"},
        },
        "bounds": {
            "northeast": {"lat": 33.9133078, "lng": 78.4572252},
            "southwest": {"lat": 33.9132078, "lng": 78.4571252},
        },
        "components": {
            "ISO_3166-1_alpha-2": "IN",
            "ISO_3166-1_alpha-3": "IND",
            "ISO_3166-2": ["IN-LA"],
            "_category": "outdoors/recreation",
            "_type": "camp_site",
            "camp_site": "Camp Water Mark",
            "continent": "Asia",
            "country": "India",
            "country_code": "in",
            "county": "Leh Tehsil",
            "hamlet": "Spangmik",
            "road": "Lakeshore road",
            "state": "Ladakh",
            "state_district": "Leh district",
        },
        "confidence": 9,
        "formatted": "Camp Water Mark, Lakeshore road, Leh district, Spangmik -, Ladakh, India",
        "geometry": {"lat": 33.9132578, "lng": 78.4571752},
    },
    {
        "annotations": {
            "DMS": {
                "lat": "33° 56' 34.80936'' S",
                "lng": "151° 15' 49.92120'' E",
            },
            "MGRS": "56HLH3955542806",
            "Maidenhead": "QF56pb13pq",
            "Mercator": {"x": 16838616.654, "y": -3997293.616},
            "OSM": {
                "edit_url": "https://www.openstreetmap.org/edit?way=5019363#map=16/-33.94300/151.26387",
                "note_url": "https://www.openstreetmap.org/note/new#map=16/-33.94300/151.26387&layers=N",
                "url": "https://www.openstreetmap.org/?mlat=-33.94300&mlon=151.26387#map=16/-33.94300/151.26387",
            },
            "UN_M49": {
                "regions": {
                    "AU": "036",
                    "AUSTRALASIA": "053",
                    "OCEANIA": "009",
                    "WORLD": "001",
                },
                "statistical_groupings": ["MEDC"],
            },
            "callingcode": 61,
            "currency": {
                "alternate_symbols": ["A$"],
                "decimal_mark": ".",
                "disambiguate_symbol": "A$",
                "html_entity": "$",
                "iso_code": "AUD",
                "iso_numeric": "036",
                "name": "Australian Dollar",
                "smallest_denomination": 5,
                "subunit": "Cent",
                "subunit_to_unit": 100,
                "symbol": "$",
                "symbol_first": 1,
                "thousands_separator": ",",
            },
            "flag": "🇦🇺",
            "geohash": "r3gwfhfgxtdnxsdvq2sq",
            "qibla": 277.43,
            "roadinfo": {
                "drive_on": "left",
                "road": "Marine Parade",
                "speed_in": "km/h",
            },
            "sun": {
                "rise": {
                    "apparent": 1686517020,
                    "astronomical": 1686511680,
                    "civil": 1686515340,
                    "nautical": 1686513480,
                },
                "set": {
                    "apparent": 1686466320,
                    "astronomical": 1686471660,
                    "civil": 1686467940,
                    "nautical": 1686469800,
                },
            },
            "timezone": {
                "name": "Australia/Sydney",
                "now_in_dst": 0,
                "offset_sec": 36000,
                "offset_string": "+1000",
                "short_name": "AEST",
            },
            "what3words": {"words": "entire.juices.effort"},
        },
        "bounds": {
            "northeast": {"lat": -33.9428627, "lng": 151.2640019},
            "southwest": {"lat": -33.9431832, "lng": 151.2636802},
        },
        "components": {
            "ISO_3166-1_alpha-2": "AU",
            "ISO_3166-1_alpha-3": "AUS",
            "ISO_3166-2": ["AU-NSW"],
            "_category": "outdoors/recreation",
            "_type": "swimming_pool",
            "borough": "Eastern Suburbs",
            "city": "Sydney",
            "continent": "Oceania",
            "country": "Australia",
            "country_code": "au",
            "municipality": "Randwick City Council",
            "postcode": "2035",
            "road": "Marine Parade",
            "state": "New South Wales",
            "state_code": "NSW",
            "suburb": "Maroubra",
            "swimming_pool": "Mahon Pool",
        },
        "confidence": 9,
        "formatted": "Mahon Pool, Marine Parade, Maroubra NSW 2035, Australia",
        "geometry": {"lat": -33.9430026, "lng": 151.263867},
    },
    {
        "annotations": {
            "DMS": {"lat": "34° 9' 43.62336'' N", "lng": "77° 35' 9.10320'' E"},
            "MGRS": "43SGT3837483153",
            "Maidenhead": "MM84td08hv",
            "Mercator": {"x": 8636818.651, "y": 4026598.097},
            "OSM": {
                "edit_url": "https://www.openstreetmap.org/edit?node=3748713587#map=17/34.16212/77.58586",
                "note_url": "https://www.openstreetmap.org/note/new#map=17/34.16212/77.58586&layers=N",
                "url": "https://www.openstreetmap.org/?mlat=34.16212&mlon=77.58586#map=17/34.16212/77.58586",
            },
            "UN_M49": {
                "regions": {
                    "ASIA": "142",
                    "IN": "356",
                    "SOUTHERN_ASIA": "034",
                    "WORLD": "001",
                },
                "statistical_groupings": ["LEDC"],
            },
            "callingcode": 91,
            "currency": {
                "alternate_symbols": ["Rs", "৳", "૱", "௹", "रु", "₨"],
                "decimal_mark": ".",
                "html_entity": "&#x20b9;",
                "iso_code": "INR",
                "iso_numeric": "356",
                "name": "Indian Rupee",
                "smallest_denomination": 50,
                "subunit": "Paisa",
                "subunit_to_unit": 100,
                "symbol": "₹",
                "symbol_first": 1,
                "thousands_separator": ",",
            },
            "flag": "🇮🇳",
            "geohash": "twp4me02c87c1rep8ec0",
            "qibla": 258.98,
            "roadinfo": {
                "drive_on": "left",
                "road": "Main Bazaar",
                "speed_in": "km/h",
            },
            "sun": {
                "rise": {
                    "apparent": 1686526740,
                    "astronomical": 1686520500,
                    "civil": 1686525000,
                    "nautical": 1686522840,
                },
                "set": {
                    "apparent": 1686492000,
                    "astronomical": 1686498240,
                    "civil": 1686493740,
                    "nautical": 1686495900,
                },
            },
            "timezone": {
                "name": "Asia/Kolkata",
                "now_in_dst": 0,
                "offset_sec": 19800,
                "offset_string": "+0530",
                "short_name": "IST",
            },
            "what3words": {"words": "mascot.muscularity.columns"},
        },
        "bounds": {
            "northeast": {"lat": 34.1621676, "lng": 77.585912},
            "southwest": {"lat": 34.1620676, "lng": 77.585812},
        },
        "components": {
            "ISO_3166-1_alpha-2": "IN",
            "ISO_3166-1_alpha-3": "IND",
            "ISO_3166-2": ["IN-LA"],
            "_category": "commerce",
            "_type": "marketplace",
            "continent": "Asia",
            "country": "India",
            "country_code": "in",
            "county": "Leh Tehsil",
            "marketplace": "Dry Fruit Market",
            "quarter": "Matsik Chulung",
            "road": "Main Bazaar",
            "state": "Ladakh",
            "state_district": "Leh district",
            "town": "Leh",
        },
        "confidence": 9,
        "formatted": "Dry Fruit Market, Main Bazaar, Leh district, Leh -, Ladakh, India",
        "geometry": {"lat": 34.1621176, "lng": 77.585862},
    },
]


================================================
FILE: api/tests/fixtures/geocode/responses/tomtom.py
================================================
responses = [
    {
        "address": {
            "buildingNumber": "17",
            "streetNumber": "17",
            "routeNumbers": [],
            "street": "Beach Road",
            "streetName": "Beach Road",
            "streetNameAndNumber": "17 Beach Road",
            "countryCode": "AU",
            "countrySubdivision": "New South Wales",
            "countrySecondarySubdivision": "Sydney",
            "municipality": "Sydney",
            "postalCode": "2026",
            "municipalitySubdivision": "Bondi Beach",
            "country": "Australia",
            "countryCodeISO3": "AUS",
            "freeformAddress": "17 Beach Road, Bondi Beach, New South Wales, 2026",
            "boundingBox": {
                "northEast": "-33.886643,151.275635",
                "southWest": "-33.888507,151.272843",
                "entity": "position",
            },
            "localName": "Bondi Beach",
        },
        "position": "-33.888145,151.275085",
    },
    {
        "address": {
            "buildingNumber": "2876",
            "streetNumber": "2876",
            "routeNumbers": [],
            "street": "Fire Route 47",
            "streetName": "Fire Route 47",
            "streetNameAndNumber": "2876 Fire Route 47",
            "countryCode": "CA",
            "countrySubdivision": "ON",
            "municipality": "Lakefield",
            "postalCode": "K0L",
            "country": "Canada",
            "countryCodeISO3": "CAN",
            "freeformAddress": "2876 Fire Route 47, Lakefield ON K0L 2H0",
            "boundingBox": {
                "northEast": "44.553471,-78.188317",
                "southWest": "44.551181,-78.195226",
                "entity": "position",
            },
            "extendedPostalCode": "K0L 2H0",
            "countrySubdivisionName": "Ontario",
            "localName": "Lakefield",
        },
        "position": "44.553463,-78.195114",
    },
    {
        "address": {
            "buildingNumber": "138",
            "streetNumber": "138",
            "routeNumbers": [],
            "street": "Möckernstraße",
            "streetName": "Möckernstraße",
            "streetNameAndNumber": "Möckernstraße 138",
            "countryCode": "DE",
            "countrySubdivision": "Berlin",
            "countrySecondarySubdivision": "Berlin",
            "municipality": "Berlin",
            "postalCode": "10963",
            "municipalitySubdivision": "Kreuzberg",
            "country": "Deutschland",
            "countryCodeISO3": "DEU",
            "freeformAddress": "Möckernstraße 138, 10963 Berlin",
            "boundingBox": {
                "northEast": "52.501909,13.382266",
                "southWest": "52.501536,13.382003",
                "entity": "position",
            },
            "localName": "Berlin",
        },
        "position": "52.501957,13.382298",
    },
    {
        "address": {
            "routeNumbers": [],
            "countryCode": "IN",
            "countrySubdivision": "Ladakh",
            "countrySecondarySubdivision": "Leh",
            "municipality": "Ladakh",
            "postalCode": "194101",
            "municipalitySubdivision": "Thiksey",
            "country": "India",
            "countryCodeISO3": "IND",
            "freeformAddress": "Thiksey, Ladakh 194101, Ladakh",
            "boundingBox": {
                "northEast": "33.940281,78.458314",
                "southWest": "33.908006,78.440596",
                "entity": "position",
            },
            "localName": "Ladakh",
        },
        "position": "33.913391,78.457077",
    },
    {
        "address": {
            "buildingNumber": "106",
            "streetNumber": "106",
            "routeNumbers": [],
            "street": "Marine Parade",
            "streetName": "Marine Parade",
            "streetNameAndNumber": "106 Marine Parade",
            "countryCode": "AU",
            "countrySubdivision": "New South Wales",
            "countrySecondarySubdivision": "Sydney",
            "municipality": "Sydney",
            "postalCode": "2035",
            "municipalitySubdivision": "Maroubra",
            "country": "Australia",
            "countryCodeISO3": "AUS",
            "freeformAddress": "106 Marine Parade, Maroubra, New South Wales, 2035",
            "boundingBox": {
                "northEast": "-33.943234,151.262465",
                "southWest": "-33.943728,151.262034",
                "entity": "position",
            },
            "localName": "Maroubra",
        },
        "position": "-33.943535,151.261810",
    },
    {
        "address": {
            "routeNumbers": [],
            "countryCode": "IN",
            "countrySubdivision": "Ladakh",
            "countrySecondarySubdivision": "Leh",
            "municipality": "Ladakh",
            "postalCode": "194101",
            "municipalitySubdivision": "Leh Ladakh",
            "country": "India",
            "countryCodeISO3": "IND",
            "freeformAddress": "Leh Ladakh, Ladakh 194101, Ladakh",
            "boundingBox": {
                "northEast": "34.162343,77.585824",
                "southWest": "34.162047,77.585727",
                "entity": "position",
            },
            "localName": "Ladakh",
        },
        "position": "34.162090,77.585808",
    },
]


================================================
FILE: api/tests/fixtures/location_timeline_test_data.csv
================================================
Canada,2020-08-27 02:19:21.000000 +00:00
Canada,2020-08-27 02:43:55.000000 +00:00
Canada,2020-08-27 22:24:43.000000 +00:00
Canada,2020-08-27 23:57:10.000000 +00:00
Germany,2019-12-14 01:19:03.000000 +00:00
Germany,2019-12-14 20:10:05.000000 +00:00
Germany,2019-12-14 21:06:55.000000 +00:00
Germany,2019-12-14 23:31:11.000000 +00:00
France,2020-12-14 01:12:50.000000 +00:00
France,2020-12-14 01:41:04.000000 +00:00
France,2020-12-14 22:41:32.000000 +00:00
France,2020-12-14 23:40:52.000000 +00:00
Canada,2021-08-10 00:46:32.000000 +00:00
Canada,2021-08-10 00:50:40.000000 +00:00
Canada,2021-08-10 20:47:12.000000 +00:00
Canada,2021-08-10 22:10:06.000000 +00:00
France,2021-10-20 00:19:37.000000 +00:00
France,2021-10-20 01:23:07.000000 +00:00
France,2021-10-20 21:18:53.000000 +00:00
France,2021-10-20 22:30:05.000000 +00:00


================================================
FILE: api/tests/fixtures/niaz.xmp
================================================
<?xpacket begin='﻿' id='W5M0MpCehiHzreSzNTczkc9d'?>
<x:xmpmeta xmlns:x='adobe:ns:meta/' x:xmptk='Image::ExifTool 12.60'>
<rdf:RDF xmlns:rdf='http://www.w3.org/1999/02/22-rdf-syntax-ns#'>

 <rdf:Description rdf:about=''
  xmlns:Iptc4xmpCore='http://iptc.org/std/Iptc4xmpCore/1.0/xmlns/'>
  <Iptc4xmpCore:CreatorContactInfo rdf:parseType='Resource'>
   <Iptc4xmpCore:CiAdrCity>Washington</Iptc4xmpCore:CiAdrCity>
   <Iptc4xmpCore:CiAdrCtry>USA</Iptc4xmpCore:CiAdrCtry>
   <Iptc4xmpCore:CiAdrExtadr>NASA Headquarters, 300 E Street, SW </Iptc4xmpCore:CiAdrExtadr>
   <Iptc4xmpCore:CiAdrPcode>20545</Iptc4xmpCore:CiAdrPcode>
   <Iptc4xmpCore:CiAdrRegion>DC</Iptc4xmpCore:CiAdrRegion>
   <Iptc4xmpCore:CiTelWork>202-358-1900</Iptc4xmpCore:CiTelWork>
   <Iptc4xmpCore:CiUrlWork>http://www.nasa.gov</Iptc4xmpCore:CiUrlWork>
  </Iptc4xmpCore:CreatorContactInfo>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:Iptc4xmpExt='http://iptc.org/std/Iptc4xmpExt/2008-02-29/'>
  <Iptc4xmpExt:Event>
   <rdf:Alt>
    <rdf:li xml:lang='x-default'>"First Man" Premiere at NASM</rdf:li>
   </rdf:Alt>
  </Iptc4xmpExt:Event>
  <Iptc4xmpExt:PersonInImage>
   <rdf:Bag>
    <rdf:li>Niaz Faridani-Rad</rdf:li>
   </rdf:Bag>
  </Iptc4xmpExt:PersonInImage>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:MP='http://ns.microsoft.com/photo/1.2/'
  xmlns:MPRI='http://ns.microsoft.com/photo/1.2/t/RegionInfo#'
  xmlns:MPReg='http://ns.microsoft.com/photo/1.2/t/Region#'>
  <MP:RegionInfo rdf:parseType='Resource'>
   <MPRI:Regions>
    <rdf:Bag>
     <rdf:li rdf:parseType='Resource'>
      <MPReg:PersonDisplayName>Niaz Faridani-Rad</MPReg:PersonDisplayName>
      <MPReg:Rectangle>0.280277, 0.125, 0.436419, 0.485614</MPReg:Rectangle>
     </rdf:li>
    </rdf:Bag>
   </MPRI:Regions>
  </MP:RegionInfo>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:MicrosoftPhoto='http://ns.microsoft.com/photo/1.0'>
  <MicrosoftPhoto:LastKeywordXMP>
   <rdf:Bag>
    <rdf:li>First Man</rdf:li>
    <rdf:li>Washington</rdf:li>
    <rdf:li>Smithsonian National Air and Space Museum (NASM)</rdf:li>
    <rdf:li>DC</rdf:li>
    <rdf:li>Niaz Faridani-Rad</rdf:li>
   </rdf:Bag>
  </MicrosoftPhoto:LastKeywordXMP>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:acdsee='http://ns.acdsee.com/iptc/1.0/'>
  <acdsee:categories>&lt;Categories&gt;&lt;Category Assigned=&quot;1&quot;&gt;First Man&lt;/Category&gt;&lt;Category Assigned=&quot;1&quot;&gt;Washington&lt;/Category&gt;&lt;Category Assigned=&quot;1&quot;&gt;Smithsonian National Air and Space Museum (NASM)&lt;/Category&gt;&lt;Category Assigned=&quot;1&quot;&gt;DC&lt;/Category&gt;&lt;Category Assigned=&quot;1&quot;&gt;Niaz Faridani-Rad&lt;/Category&gt;&lt;/Categories&gt;</acdsee:categories>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:aux='http://ns.adobe.com/exif/1.0/aux/'>
  <aux:ApproximateFocusDistance>398/100</aux:ApproximateFocusDistance>
  <aux:ImageNumber>7311</aux:ImageNumber>
  <aux:Lens>70.0-200.0 mm f/2.8</aux:Lens>
  <aux:LensID>162</aux:LensID>
  <aux:LensInfo>700/10 2000/10 28/10 28/10</aux:LensInfo>
  <aux:SerialNumber>3005331</aux:SerialNumber>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:crs='http://ns.adobe.com/camera-raw-settings/1.0/'>
  <crs:AlreadyApplied>True</crs:AlreadyApplied>
  <crs:AutoLateralCA>0</crs:AutoLateralCA>
  <crs:Blacks2012>0</crs:Blacks2012>
  <crs:BlueHue>0</crs:BlueHue>
  <crs:BlueSaturation>0</crs:BlueSaturation>
  <crs:CameraProfile>Adobe Standard</crs:CameraProfile>
  <crs:CameraProfileDigest>DC0173EBB7ECE22257A40AD42B5C9460</crs:CameraProfileDigest>
  <crs:Clarity2012>+12</crs:Clarity2012>
  <crs:ColorNoiseReduction>25</crs:ColorNoiseReduction>
  <crs:ColorNoiseReductionDetail>50</crs:ColorNoiseReductionDetail>
  <crs:ColorNoiseReductionSmoothness>50</crs:ColorNoiseReductionSmoothness>
  <crs:Contrast2012>0</crs:Contrast2012>
  <crs:ConvertToGrayscale>False</crs:ConvertToGrayscale>
  <crs:DefringeGreenAmount>0</crs:DefringeGreenAmount>
  <crs:DefringeGreenHueHi>60</crs:DefringeGreenHueHi>
  <crs:DefringeGreenHueLo>40</crs:DefringeGreenHueLo>
  <crs:DefringePurpleAmount>0</crs:DefringePurpleAmount>
  <crs:DefringePurpleHueHi>70</crs:DefringePurpleHueHi>
  <crs:DefringePurpleHueLo>30</crs:DefringePurpleHueLo>
  <crs:Dehaze>0</crs:Dehaze>
  <crs:Exposure2012>0.00</crs:Exposure2012>
  <crs:GrainAmount>0</crs:GrainAmount>
  <crs:GreenHue>0</crs:GreenHue>
  <crs:GreenSaturation>0</crs:GreenSaturation>
  <crs:HasCrop>False</crs:HasCrop>
  <crs:HasSettings>True</crs:HasSettings>
  <crs:Highlights2012>0</crs:Highlights2012>
  <crs:HueAdjustmentAqua>0</crs:HueAdjustmentAqua>
  <crs:HueAdjustmentBlue>0</crs:HueAdjustmentBlue>
  <crs:HueAdjustmentGreen>0</crs:HueAdjustmentGreen>
  <crs:HueAdjustmentMagenta>0</crs:HueAdjustmentMagenta>
  <crs:HueAdjustmentOrange>0</crs:HueAdjustmentOrange>
  <crs:HueAdjustmentPurple>0</crs:HueAdjustmentPurple>
  <crs:HueAdjustmentRed>0</crs:HueAdjustmentRed>
  <crs:HueAdjustmentYellow>0</crs:HueAdjustmentYellow>
  <crs:LensManualDistortionAmount>0</crs:LensManualDistortionAmount>
  <crs:LensProfileEnable>0</crs:LensProfileEnable>
  <crs:LensProfileSetup>LensDefaults</crs:LensProfileSetup>
  <crs:Look rdf:parseType='Resource'>
   <crs:Name/>
  </crs:Look>
  <crs:LuminanceAdjustmentAqua>0</crs:LuminanceAdjustmentAqua>
  <crs:LuminanceAdjustmentBlue>0</crs:LuminanceAdjustmentBlue>
  <crs:LuminanceAdjustmentGreen>0</crs:LuminanceAdjustmentGreen>
  <crs:LuminanceAdjustmentMagenta>0</crs:LuminanceAdjustmentMagenta>
  <crs:LuminanceAdjustmentOrange>0</crs:LuminanceAdjustmentOrange>
  <crs:LuminanceAdjustmentPurple>0</crs:LuminanceAdjustmentPurple>
  <crs:LuminanceAdjustmentRed>0</crs:LuminanceAdjustmentRed>
  <crs:LuminanceAdjustmentYellow>0</crs:LuminanceAdjustmentYellow>
  <crs:LuminanceSmoothing>0</crs:LuminanceSmoothing>
  <crs:OverrideLookVignette>False</crs:OverrideLookVignette>
  <crs:ParametricDarks>0</crs:ParametricDarks>
  <crs:ParametricHighlightSplit>75</crs:ParametricHighlightSplit>
  <crs:ParametricHighlights>0</crs:ParametricHighlights>
  <crs:ParametricLights>0</crs:ParametricLights>
  <crs:ParametricMidtoneSplit>50</crs:ParametricMidtoneSplit>
  <crs:ParametricShadowSplit>25</crs:ParametricShadowSplit>
  <crs:ParametricShadows>0</crs:ParametricShadows>
  <crs:PerspectiveAspect>0</crs:PerspectiveAspect>
  <crs:PerspectiveHorizontal>0</crs:PerspectiveHorizontal>
  <crs:PerspectiveRotate>0.0</crs:PerspectiveRotate>
  <crs:PerspectiveScale>100</crs:PerspectiveScale>
  <crs:PerspectiveUpright>0</crs:PerspectiveUpright>
  <crs:PerspectiveVertical>0</crs:PerspectiveVertical>
  <crs:PerspectiveX>0.00</crs:PerspectiveX>
  <crs:PerspectiveY>0.00</crs:PerspectiveY>
  <crs:PostCropVignetteAmount>0</crs:PostCropVignetteAmount>
  <crs:ProcessVersion>10.0</crs:ProcessVersion>
  <crs:RawFileName>_1AG7311.nef</crs:RawFileName>
  <crs:RedHue>0</crs:RedHue>
  <crs:RedSaturation>0</crs:RedSaturation>
  <crs:Saturation>0</crs:Saturation>
  <crs:SaturationAdjustmentAqua>0</crs:SaturationAdjustmentAqua>
  <crs:SaturationAdjustmentBlue>0</crs:SaturationAdjustmentBlue>
  <crs:SaturationAdjustmentGreen>0</crs:SaturationAdjustmentGreen>
  <crs:SaturationAdjustmentMagenta>0</crs:SaturationAdjustmentMagenta>
  <crs:SaturationAdjustmentOrange>0</crs:SaturationAdjustmentOrange>
  <crs:SaturationAdjustmentPurple>0</crs:SaturationAdjustmentPurple>
  <crs:SaturationAdjustmentRed>0</crs:SaturationAdjustmentRed>
  <crs:SaturationAdjustmentYellow>0</crs:SaturationAdjustmentYellow>
  <crs:ShadowTint>0</crs:ShadowTint>
  <crs:Shadows2012>0</crs:Shadows2012>
  <crs:SharpenDetail>36</crs:SharpenDetail>
  <crs:SharpenEdgeMasking>80</crs:SharpenEdgeMasking>
  <crs:SharpenRadius>+1.0</crs:SharpenRadius>
  <crs:Sharpness>75</crs:Sharpness>
  <crs:SplitToningBalance>0</crs:SplitToningBalance>
  <crs:SplitToningHighlightHue>0</crs:SplitToningHighlightHue>
  <crs:SplitToningHighlightSaturation>0</crs:SplitToningHighlightSaturation>
  <crs:SplitToningShadowHue>0</crs:SplitToningShadowHue>
  <crs:SplitToningShadowSaturation>0</crs:SplitToningShadowSaturation>
  <crs:Temperature>6650</crs:Temperature>
  <crs:Tint>-60</crs:Tint>
  <crs:ToneCurve>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurve>
  <crs:ToneCurveBlue>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurveBlue>
  <crs:ToneCurveGreen>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurveGreen>
  <crs:ToneCurveName>Linear</crs:ToneCurveName>
  <crs:ToneCurveName2012>Linear</crs:ToneCurveName2012>
  <crs:ToneCurvePV2012>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurvePV2012>
  <crs:ToneCurvePV2012Blue>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurvePV2012Blue>
  <crs:ToneCurvePV2012Green>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurvePV2012Green>
  <crs:ToneCurvePV2012Red>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurvePV2012Red>
  <crs:ToneCurveRed>
   <rdf:Seq>
    <rdf:li>0, 0</rdf:li>
    <rdf:li>255, 255</rdf:li>
   </rdf:Seq>
  </crs:ToneCurveRed>
  <crs:ToneMapStrength>0</crs:ToneMapStrength>
  <crs:UprightCenterMode>0</crs:UprightCenterMode>
  <crs:UprightCenterNormX>0.5</crs:UprightCenterNormX>
  <crs:UprightCenterNormY>0.5</crs:UprightCenterNormY>
  <crs:UprightFocalLength35mm>35</crs:UprightFocalLength35mm>
  <crs:UprightFocalMode>0</crs:UprightFocalMode>
  <crs:UprightFourSegmentsCount>0</crs:UprightFourSegmentsCount>
  <crs:UprightPreview>False</crs:UprightPreview>
  <crs:UprightTransformCount>6</crs:UprightTransformCount>
  <crs:UprightVersion>151388160</crs:UprightVersion>
  <crs:Version>10.4</crs:Version>
  <crs:Vibrance>+20</crs:Vibrance>
  <crs:VignetteAmount>0</crs:VignetteAmount>
  <crs:WhiteBalance>Custom</crs:WhiteBalance>
  <crs:Whites2012>0</crs:Whites2012>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:dc='http://purl.org/dc/elements/1.1/'>
  <dc:creator>
   <rdf:Seq>
    <rdf:li>NASA/Aubrey Gemignani</rdf:li>
   </rdf:Seq>
  </dc:creator>
  <dc:description>
   <rdf:Alt>
    <rdf:li xml:lang='x-default'>American actor Niaz Faridani-Rad arrives on the red carpet for the premiere of the film "First Man" at the Smithsonian National Air and Space Museum Thursday, Oct. 4, 2018 in Washington. The film is based on the book by Jim Hansen, and chronicles the life of NASA astronaut Neil Armstrong from test pilot to his historic Moon landing. Photo Credit: (NASA/Aubrey Gemignani)</rdf:li>
   </rdf:Alt>
  </dc:description>
  <dc:format>image/jpeg</dc:format>
  <dc:rights>
   <rdf:Alt>
    <rdf:li xml:lang='x-default'>(NASA/Aubrey Gemignani)</rdf:li>
   </rdf:Alt>
  </dc:rights>
  <dc:subject>
   <rdf:Bag>
    <rdf:li>First Man</rdf:li>
    <rdf:li>Washington</rdf:li>
    <rdf:li>Smithsonian National Air and Space Museum (NASM)</rdf:li>
    <rdf:li>DC</rdf:li>
    <rdf:li>Niaz Faridani-Rad</rdf:li>
   </rdf:Bag>
  </dc:subject>
  <dc:title>
   <rdf:Alt>
    <rdf:li xml:lang='x-default'>"First Man" Premiere at NASM</rdf:li>
   </rdf:Alt>
  </dc:title>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:digiKam='http://www.digikam.org/ns/1.0/'>
  <digiKam:TagsList>
   <rdf:Seq>
    <rdf:li>First Man</rdf:li>
    <rdf:li>Washington</rdf:li>
    <rdf:li>Smithsonian National Air and Space Museum (NASM)</rdf:li>
    <rdf:li>DC</rdf:li>
    <rdf:li>Niaz Faridani-Rad</rdf:li>
   </rdf:Seq>
  </digiKam:TagsList>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:exif='http://ns.adobe.com/exif/1.0/'>
  <exif:ApertureValue>433985/100000</exif:ApertureValue>
  <exif:CFAPattern>2 0 2 0 0 1 1 2</exif:CFAPattern>
  <exif:ColorSpace>1</exif:ColorSpace>
  <exif:Contrast>0</exif:Contrast>
  <exif:CustomRendered>0</exif:CustomRendered>
  <exif:ExifVersion>0230</exif:ExifVersion>
  <exif:ExposureBiasValue>0/6</exif:ExposureBiasValue>
  <exif:ExposureMode>1</exif:ExposureMode>
  <exif:ExposureProgram>1</exif:ExposureProgram>
  <exif:ExposureTime>1/320</exif:ExposureTime>
  <exif:FNumber>45/10</exif:FNumber>
  <exif:FileSource>3</exif:FileSource>
  <exif:Flash rdf:parseType='Resource'>
   <exif:Fired>False</exif:Fired>
   <exif:Function>False</exif:Function>
   <exif:Mode>0</exif:Mode>
   <exif:RedEyeMode>False</exif:RedEyeMode>
   <exif:Return>0</exif:Return>
  </exif:Flash>
  <exif:FocalLength>2000/10</exif:FocalLength>
  <exif:FocalLengthIn35mmFilm>200</exif:FocalLengthIn35mmFilm>
  <exif:FocalPlaneResolutionUnit>3</exif:FocalPlaneResolutionUnit>
  <exif:FocalPlaneXResolution>50857775/32768</exif:FocalPlaneXResolution>
  <exif:FocalPlaneYResolution>50857775/32768</exif:FocalPlaneYResolution>
  <exif:GainControl>1</exif:GainControl>
  <exif:ISOSpeedRatings>
   <rdf:Seq>
    <rdf:li>2000</rdf:li>
   </rdf:Seq>
  </exif:ISOSpeedRatings>
  <exif:LightSource>0</exif:LightSource>
  <exif:MaxApertureValue>30/10</exif:MaxApertureValue>
  <exif:MeteringMode>5</exif:MeteringMode>
  <exif:Saturation>0</exif:Saturation>
  <exif:SceneCaptureType>0</exif:SceneCaptureType>
  <exif:SceneType>1</exif:SceneType>
  <exif:SensingMethod>2</exif:SensingMethod>
  <exif:Sharpness>0</exif:Sharpness>
  <exif:ShutterSpeedValue>8321928/1000000</exif:ShutterSpeedValue>
  <exif:SubjectDistanceRange>0</exif:SubjectDistanceRange>
  <exif:WhiteBalance>0</exif:WhiteBalance>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:lr='http://ns.adobe.com/lightroom/1.0/'>
  <lr:hierarchicalSubject>
   <rdf:Bag>
    <rdf:li>First Man</rdf:li>
    <rdf:li>Washington</rdf:li>
    <rdf:li>Smithsonian National Air and Space Museum (NASM)</rdf:li>
    <rdf:li>DC</rdf:li>
    <rdf:li>Niaz Faridani-Rad</rdf:li>
   </rdf:Bag>
  </lr:hierarchicalSubject>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:mediapro='http://ns.iview-multimedia.com/mediapro/1.0/'>
  <mediapro:CatalogSets>
   <rdf:Bag>
    <rdf:li>First Man</rdf:li>
    <rdf:li>Washington</rdf:li>
    <rdf:li>Smithsonian National Air and Space Museum (NASM)</rdf:li>
    <rdf:li>DC</rdf:li>
    <rdf:li>Niaz Faridani-Rad</rdf:li>
   </rdf:Bag>
  </mediapro:CatalogSets>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:mwg-rs='http://www.metadataworkinggroup.com/schemas/regions/'
  xmlns:stArea='http://ns.adobe.com/xmp/sType/Area#'>
  <mwg-rs:Regions rdf:parseType='Resource'>
   <mwg-rs:RegionList>
    <rdf:Bag>
     <rdf:li rdf:parseType='Resource'>
      <mwg-rs:Area rdf:parseType='Resource'>
       <stArea:h>0.485614</stArea:h>
       <stArea:unit>normalized</stArea:unit>
       <stArea:w>0.436419</stArea:w>
       <stArea:x>0.498486</stArea:x>
       <stArea:y>0.367807</stArea:y>
      </mwg-rs:Area>
      <mwg-rs:Name>Niaz Faridani-Rad</mwg-rs:Name>
      <mwg-rs:Type>Face</mwg-rs:Type>
     </rdf:li>
    </rdf:Bag>
   </mwg-rs:RegionList>
  </mwg-rs:Regions>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:photomechanic='http://ns.camerabits.com/photomechanic/1.0/'>
  <photomechanic:ColorClass>0</photomechanic:ColorClass>
  <photomechanic:PMVersion>PM5</photomechanic:PMVersion>
  <photomechanic:Prefs>0:0:5:007311</photomechanic:Prefs>
  <photomechanic:Tagged>False</photomechanic:Tagged>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:photoshop='http://ns.adobe.com/photoshop/1.0/'>
  <photoshop:AuthorsPosition>Photo Archivist/Photographer</photoshop:AuthorsPosition>
  <photoshop:CaptionWriter>ag</photoshop:CaptionWriter>
  <photoshop:Credit>(NASA/Aubrey Gemignani)</photoshop:Credit>
  <photoshop:DateCreated>2018-10-04T19:21:55-04:00</photoshop:DateCreated>
  <photoshop:Headline>&quot;First Man&quot; Premiere at NASM</photoshop:Headline>
  <photoshop:Instructions>MANDATORY CREDIT: (NASA/Aubrey Gemignani)</photoshop:Instructions>
  <photoshop:Source>(NASA/Aubrey Gemignani)</photoshop:Source>
  <photoshop:TransmissionReference>NHQ201810040124</photoshop:TransmissionReference>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:tiff='http://ns.adobe.com/tiff/1.0/'>
  <tiff:Make>NIKON CORPORATION</tiff:Make>
  <tiff:Model>NIKON D5</tiff:Model>
  <tiff:ResolutionUnit>2</tiff:ResolutionUnit>
  <tiff:Software>Adobe Photoshop Lightroom Classic 7.4 (Macintosh)</tiff:Software>
  <tiff:XResolution>240/1</tiff:XResolution>
  <tiff:YResolution>240/1</tiff:YResolution>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:xmp='http://ns.adobe.com/xap/1.0/'>
  <xmp:CreateDate>2018-10-04T19:21:55-04:00</xmp:CreateDate>
  <xmp:CreatorTool>Adobe Photoshop Lightroom Classic 7.4 (Macintosh)</xmp:CreatorTool>
  <xmp:MetadataDate>2018-10-04T21:53:24-04:00</xmp:MetadataDate>
  <xmp:ModifyDate>2018-10-04T21:53:24-04:00</xmp:ModifyDate>
  <xmp:Rating>5</xmp:Rating>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:stEvt='http://ns.adobe.com/xap/1.0/sType/ResourceEvent#'
  xmlns:stRef='http://ns.adobe.com/xap/1.0/sType/ResourceRef#'
  xmlns:xmpMM='http://ns.adobe.com/xap/1.0/mm/'>
  <xmpMM:DerivedFrom rdf:parseType='Resource'>
   <stRef:documentID>E217B47072178EE0C74E34127F15697D</stRef:documentID>
   <stRef:originalDocumentID>E217B47072178EE0C74E34127F15697D</stRef:originalDocumentID>
  </xmpMM:DerivedFrom>
  <xmpMM:DocumentID>xmp.did:1c7fcbef-0981-466e-a9ea-7c659325f7d4</xmpMM:DocumentID>
  <xmpMM:History>
   <rdf:Seq>
    <rdf:li rdf:parseType='Resource'>
     <stEvt:action>derived</stEvt:action>
     <stEvt:parameters>converted from image/x-nikon-nef to image/jpeg, saved to new location</stEvt:parameters>
    </rdf:li>
    <rdf:li rdf:parseType='Resource'>
     <stEvt:action>saved</stEvt:action>
     <stEvt:changed>/</stEvt:changed>
     <stEvt:instanceID>xmp.iid:1c7fcbef-0981-466e-a9ea-7c659325f7d4</stEvt:instanceID>
     <stEvt:softwareAgent>Adobe Photoshop Lightroom Classic 7.4 (Macintosh)</stEvt:softwareAgent>
     <stEvt:when>2018-10-04T21:53:24-04:00</stEvt:when>
    </rdf:li>
   </rdf:Seq>
  </xmpMM:History>
  <xmpMM:InstanceID>xmp.iid:1c7fcbef-0981-466e-a9ea-7c659325f7d4</xmpMM:InstanceID>
  <xmpMM:OriginalDocumentID>E217B47072178EE0C74E34127F15697D</xmpMM:OriginalDocumentID>
 </rdf:Description>

 <rdf:Description rdf:about=''
  xmlns:xmpRights='http://ns.adobe.com/xap/1.0/rights/'>
  <xmpRights:Marked>False</xmpRights:Marked>
  <xmpRights:UsageTerms>
   <rdf:Alt>
    <rdf:li xml:lang='x-default'>Released to Public</rdf:li>
   </rdf:Alt>
  </xmpRights:UsageTerms>
 </rdf:Description>
</rdf:RDF>
</x:xmpmeta>
<?xpacket end='w'?>

================================================
FILE: api/tests/test_api_robustness.py
================================================
"""
API Robustness and Security Tests

Tests designed to break the API with:
- Malformed inputs
- Invalid UUIDs and identifiers
- Extremely long strings
- Special characters and Unicode
- Missing required fields
- Invalid data types
- Boundary conditions
"""

import uuid

from django.test import TestCase
from django.utils import timezone
from rest_framework import status
from rest_framework.test import APIClient

from api.models.duplicate import Duplicate
from api.models.file import File
from api.models.photo import Photo
from api.models.photo_stack import PhotoStack
from api.models.user import User


class DuplicatesAPIRobustnessTestCase(TestCase):
    """Robustness tests for the Duplicates API."""

    def setUp(self):
        """Create test user and authenticate."""
        self.user = User.objects.create_user(
            username="robusttest",
            password="testpass123",
        )
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_resolve_with_empty_body(self):
        """Should handle empty request body gracefully."""
        # Create a duplicate
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            data={},
            format="json",
        )
        # Should return error, not crash
        self.assertIn(response.status_code, [400, 422])

    def test_resolve_with_invalid_photo_id(self):
        """Should handle invalid photo ID gracefully."""
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            data={"photo_id": "not-a-valid-uuid"},
            format="json",
        )
        self.assertIn(response.status_code, [400, 404])

    def test_resolve_with_nonexistent_photo(self):
        """Should handle nonexistent photo ID."""
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        fake_uuid = str(uuid.uuid4())
        
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            data={"photo_id": fake_uuid},
            format="json",
        )
        self.assertIn(response.status_code, [400, 404])

    def test_access_nonexistent_duplicate(self):
        """Should return 404 for nonexistent duplicate."""
        fake_uuid = str(uuid.uuid4())
        
        response = self.client.get(f"/api/duplicates/{fake_uuid}/")
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_delete_nonexistent_duplicate(self):
        """Should return 404 for deleting nonexistent duplicate."""
        fake_uuid = str(uuid.uuid4())
        
        # Actual delete URL is /api/duplicates/<id>/delete with DELETE method
        response = self.client.delete(f"/api/duplicates/{fake_uuid}/delete")
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_list_with_invalid_status_filter(self):
        """Should handle invalid status filter gracefully."""
        response = self.client.get("/api/duplicates/?status=invalid_status")
        # Should either ignore invalid filter or return error
        self.assertIn(response.status_code, [200, 400])

    def test_list_with_invalid_type_filter(self):
        """Should handle invalid type filter gracefully."""
        response = self.client.get("/api/duplicates/?type=nonexistent_type")
        self.assertIn(response.status_code, [200, 400])

    def test_extremely_long_string_in_query(self):
        """Should handle extremely long query strings."""
        long_string = "a" * 10000
        response = self.client.get(f"/api/duplicates/?status={long_string}")
        # Should not crash
        self.assertIn(response.status_code, [200, 400, 414])

    def test_special_characters_in_query(self):
        """Should handle special characters in query params."""
        response = self.client.get("/api/duplicates/?status=<script>alert(1)</script>")
        self.assertIn(response.status_code, [200, 400])

    def test_unicode_in_query(self):
        """Should handle unicode characters in query params."""
        response = self.client.get("/api/duplicates/?status=状态")
        self.assertIn(response.status_code, [200, 400])

    def test_null_bytes_in_request(self):
        """Should handle null bytes in request data."""
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            data={"photo_id": "test\x00injection"},
            format="json",
        )
        self.assertIn(response.status_code, [400, 404])


class StacksAPIRobustnessTestCase(TestCase):
    """Robustness tests for the Stacks API."""

    def setUp(self):
        """Create test user and authenticate."""
        self.user = User.objects.create_user(
            username="stackrobust",
            password="testpass123",
        )
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def _create_photo(self, suffix):
        """Create a test photo."""
        file = File.objects.create(
            hash=f"robust{suffix}" + "a" * 26,
            path=f"/photos/robust_{suffix}.jpg",
            type=File.IMAGE,
        )
        return Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash=f"robust{suffix}" + "b" * 26,
            added_on=timezone.now(),
        )

    def test_create_manual_stack_with_empty_photos(self):
        """Should reject creating stack with no photos."""
        # Actual URL is /api/stacks/manual
        response = self.client.post(
            "/api/stacks/manual",
            data={"photo_ids": []},
            format="json",
        )
        self.assertIn(response.status_code, [400, 422])

    def test_create_manual_stack_with_single_photo(self):
        """Should reject creating stack with only one photo."""
        photo = self._create_photo("1")
        
        response = self.client.post(
            "/api/stacks/manual",
            data={"photo_ids": [str(photo.pk)]},
            format="json",
        )
        # Stack needs at least 2 photos
        self.assertIn(response.status_code, [400, 422])

    def test_create_manual_stack_with_invalid_photo_ids(self):
        """Should handle invalid photo IDs."""
        response = self.client.post(
            "/api/stacks/manual",
            data={"photo_ids": ["not-uuid", "also-not-uuid"]},
            format="json",
        )
        self.assertIn(response.status_code, [400, 404])

    def test_create_manual_stack_with_nonexistent_photos(self):
        """Should handle nonexistent photo IDs."""
        fake_uuids = [str(uuid.uuid4()), str(uuid.uuid4())]
        
        response = self.client.post(
            "/api/stacks/manual",
            data={"photo_ids": fake_uuids},
            format="json",
        )
        self.assertIn(response.status_code, [400, 404])

    def test_create_manual_stack_with_other_user_photos(self):
        """Should reject using another user's photos."""
        other_user = User.objects.create_user(
            username="otheruser",
            password="testpass123",
        )
        other_file = File.objects.create(
            hash="other" + "a" * 28,
            path="/photos/other.jpg",
            type=File.IMAGE,
        )
        other_photo = Photo.objects.create(
            owner=other_user,
            main_file=other_file,
            image_hash="other" + "b" * 28,
            added_on=timezone.now(),
        )
        my_photo = self._create_photo("2")
        
        response = self.client.post(
            "/api/stacks/manual",
            data={"photo_ids": [str(my_photo.pk), str(other_photo.pk)]},
            format="json",
        )
        # Should reject or ignore other user's photo
        self.assertIn(response.status_code, [400, 403, 404])

    def test_set_primary_with_photo_not_in_stack(self):
        """Should reject setting primary to photo not in stack."""
        photo1 = self._create_photo("3")
        photo2 = self._create_photo("4")
        photo3 = self._create_photo("5")
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo1.stacks.add(stack)
        photo2.stacks.add(stack)
        # photo3 is NOT in stack
        
        # Actual URL is /api/stacks/<id>/primary
        response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            data={"photo_id": str(photo3.pk)},
            format="json",
        )
        self.assertIn(response.status_code, [400, 404])

    def test_add_photo_to_nonexistent_stack(self):
        """Should return 404 for adding to nonexistent stack."""
        photo = self._create_photo("6")
        fake_uuid = str(uuid.uuid4())
        
        # Actual URL is /api/stacks/<id>/add (no trailing slash)
        response = self.client.post(
            f"/api/stacks/{fake_uuid}/add",
            data={"photo_ids": [str(photo.pk)]},
            format="json",
        )
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_remove_all_photos_from_stack(self):
        """Should handle removing all photos (stack should be deleted or empty)."""
        photo1 = self._create_photo("7")
        photo2 = self._create_photo("8")
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo1.stacks.add(stack)
        photo2.stacks.add(stack)
        
        # Actual URL is /api/stacks/<id>/remove
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            data={"photo_ids": [str(photo1.pk), str(photo2.pk)]},
            format="json",
        )
        # Stack API may reject removing all photos (requires at least 2) or delete stack
        self.assertIn(response.status_code, [200, 204, 400])

    def test_merge_stacks_with_empty_list(self):
        """Should reject merging with empty stack list."""
        response = self.client.post(
            "/api/stacks/merge/",
            data={"stack_ids": []},
            format="json",
        )
        self.assertIn(response.status_code, [400, 422])

    def test_merge_single_stack(self):
        """Should reject merging with only one stack."""
        photo1 = self._create_photo("9")
        photo2 = self._create_photo("10")
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo1.stacks.add(stack)
        photo2.stacks.add(stack)
        
        response = self.client.post(
            "/api/stacks/merge/",
            data={"stack_ids": [str(stack.id)]},
            format="json",
        )
        self.assertIn(response.status_code, [400, 422])

    def test_list_with_invalid_stack_type_filter(self):
        """Should handle invalid stack type filter."""
        response = self.client.get("/api/stacks/?stack_type=invalid_type")
        self.assertIn(response.status_code, [200, 400])


class PhotoMetadataAPIRobustnessTestCase(TestCase):
    """Robustness tests for the PhotoMetadata API."""

    def setUp(self):
        """Create test user, photo, and authenticate."""
        self.user = User.objects.create_user(
            username="metarobust",
            password="testpass123",
        )
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        
        file = File.objects.create(
            hash="meta" + "a" * 28,
            path="/photos/meta.jpg",
            type=File.IMAGE,
        )
        self.photo = Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash="meta" + "b" * 28,
            added_on=timezone.now(),
        )

    def test_update_with_invalid_field_types(self):
        """Test behavior with invalid field types - API may accept string and try to convert."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            data={"iso": "not-a-number"},  # ISO should be int
            format="json",
        )
        # Note: API may accept this (Django models can coerce types) or reject
        self.assertIn(response.status_code, [200, 400, 422])

    def test_update_with_negative_values(self):
        """Should handle negative values for normally positive fields."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            data={"iso": -100},
            format="json",
        )
        # May accept (no validation) or reject
        self.assertIn(response.status_code, [200, 400])

    def test_update_with_extremely_large_numbers(self):
        """Should handle extremely large numbers."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            data={"iso": 999999999999999999},
            format="json",
        )
        self.assertIn(response.status_code, [200, 400])

    def test_update_nonexistent_photo_metadata(self):
        """Should return 404 for nonexistent photo."""
        fake_uuid = str(uuid.uuid4())
        
        response = self.client.patch(
            f"/api/photos/{fake_uuid}/metadata/",
            data={"camera": "Test Camera"},
            format="json",
        )
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_update_other_user_photo_metadata(self):
        """Should reject updating another user's photo metadata."""
        other_user = User.objects.create_user(
            username="othermetauser",
            password="testpass123",
        )
        other_file = File.objects.create(
            hash="othermeta" + "a" * 23,
            path="/photos/othermeta.jpg",
            type=File.IMAGE,
        )
        other_photo = Photo.objects.create(
            owner=other_user,
            main_file=other_file,
            image_hash="othermeta" + "b" * 23,
            added_on=timezone.now(),
        )
        
        response = self.client.patch(
            f"/api/photos/{other_photo.pk}/metadata/",
            data={"camera": "Hacked Camera"},
            format="json",
        )
        self.assertIn(response.status_code, [403, 404])

    def test_revert_nonexistent_edit(self):
        """Should return 404 for reverting nonexistent edit."""
        fake_uuid = str(uuid.uuid4())
        
        response = self.client.post(
            f"/api/photos/{self.photo.pk}/metadata/revert/{fake_uuid}/",
        )
        self.assertIn(response.status_code, [404, 405])


class AuthenticationRobustnessTestCase(TestCase):
    """Tests for authentication edge cases."""

    def setUp(self):
        """Create test user."""
        self.user = User.objects.create_user(
            username="authtest",
            password="testpass123",
        )
        self.client = APIClient()

    def test_unauthenticated_access_to_duplicates(self):
        """Should reject unauthenticated access."""
        response = self.client.get("/api/duplicates/")
        self.assertIn(response.status_code, [401, 403])

    def test_unauthenticated_access_to_stacks(self):
        """Should reject unauthenticated access."""
        response = self.client.get("/api/stacks/")
        self.assertIn(response.status_code, [401, 403])

    def test_unauthenticated_detect_duplicates(self):
        """Should reject unauthenticated duplicate detection."""
        response = self.client.post("/api/duplicates/detect/")
        self.assertIn(response.status_code, [401, 403])

    def test_unauthenticated_detect_stacks(self):
        """Should reject unauthenticated stack detection."""
        response = self.client.post("/api/stacks/detect/")
        self.assertIn(response.status_code, [401, 403])


class ConcurrentOperationsTestCase(TestCase):
    """Tests for potential race conditions and concurrent operations."""

    def setUp(self):
        """Create test user and authenticate."""
        self.user = User.objects.create_user(
            username="concurrent",
            password="testpass123",
        )
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def _create_photo(self, suffix):
        """Create a test photo."""
        file = File.objects.create(
            hash=f"conc{suffix}" + "a" * 27,
            path=f"/photos/concurrent_{suffix}.jpg",
            type=File.IMAGE,
        )
        return Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash=f"conc{suffix}" + "b" * 27,
            added_on=timezone.now(),
        )

    def test_delete_already_deleted_duplicate(self):
        """Should handle deleting an already-deleted duplicate."""
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup_id = duplicate.id
        
        # First delete
        duplicate.delete()
        
        # Second delete attempt via API - DELETE method
        response = self.client.delete(f"/api/duplicates/{dup_id}/delete")
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_delete_already_deleted_stack(self):
        """Should handle deleting an already-deleted stack."""
        photo = self._create_photo("1")
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo.stacks.add(stack)
        stack_id = stack.id
        
        # First delete
        stack.delete()
        
        # Second delete attempt via API - DELETE method
        response = self.client.delete(f"/api/stacks/{stack_id}/delete")
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_resolve_already_resolved_duplicate(self):
        """Should handle resolving an already-resolved duplicate."""
        photo1 = self._create_photo("2")
        photo2 = self._create_photo("3")
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        photo1.duplicates.add(duplicate)
        photo2.duplicates.add(duplicate)
        
        # Resolve first time
        duplicate.resolve(photo1, trash_others=True)
        
        # Resolve second time via API
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            data={"photo_id": str(photo2.pk)},
            format="json",
        )
        # Should either succeed (re-resolve) or return appropriate error
        self.assertIn(response.status_code, [200, 400])


class BoundaryConditionsTestCase(TestCase):
    """Tests for boundary conditions and limits."""

    def setUp(self):
        """Create test user and authenticate."""
        self.user = User.objects.create_user(
            username="boundary",
            password="testpass123",
        )
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_pagination_with_zero_page(self):
        """Should handle page=0 gracefully."""
        response = self.client.get("/api/duplicates/?page=0")
        self.assertIn(response.status_code, [200, 400])

    def test_pagination_with_negative_page(self):
        """Should handle negative page number."""
        response = self.client.get("/api/duplicates/?page=-1")
        self.assertIn(response.status_code, [200, 400])

    def test_pagination_with_very_large_page(self):
        """Should handle very large page number."""
        response = self.client.get("/api/duplicates/?page=999999999")
        # Should return empty results, not crash
        self.assertIn(response.status_code, [200, 404])

    def test_pagination_with_invalid_page_size(self):
        """Should handle invalid page size - fixed by clamping to valid range."""
        # Was Bug #10: Negative page_size caused unhandled EmptyPage exception
        # Fixed by adding max(1, ...) to page_size validation
        response = self.client.get("/api/duplicates/?page_size=-10")
        self.assertEqual(response.status_code, status.HTTP_200_OK)

    def test_pagination_with_extremely_large_page_size(self):
        """Should limit extremely large page size."""
        response = self.client.get("/api/duplicates/?page_size=1000000")
        # Should limit or return error
        self.assertIn(response.status_code, [200, 400])

    def test_stacks_pagination_with_zero_page(self):
        """Should handle page=0 for stacks."""
        response = self.client.get("/api/stacks/?page=0")
        self.assertIn(response.status_code, [200, 400])


class MalformedRequestTestCase(TestCase):
    """Tests for malformed HTTP requests."""

    def setUp(self):
        """Create test user and authenticate."""
        self.user = User.objects.create_user(
            username="malformed",
            password="testpass123",
        )
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_post_with_invalid_json(self):
        """Should handle invalid JSON gracefully."""
        response = self.client.post(
            "/api/stacks/manual",
            data="not valid json{{{",
            content_type="application/json",
        )
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_post_with_wrong_content_type(self):
        """Should handle wrong content type."""
        response = self.client.post(
            "/api/stacks/manual",
            data="photo_ids=abc",
            content_type="text/plain",
        )
        self.assertIn(response.status_code, [400, 415])

    def test_get_with_duplicate_query_params(self):
        """Should handle duplicate query parameters."""
        response = self.client.get("/api/duplicates/?status=pending&status=resolved")
        # Should not crash - may use first, last, or combine
        self.assertIn(response.status_code, [200, 400])


================================================
FILE: api/tests/test_api_util.py
================================================
from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.fixtures.api_util.photos import photos
from api.tests.fixtures.api_util.sunburst_expectation import (
    expectation as sunburst_expectation,
)
from api.tests.utils import create_test_photo, create_test_user


def create_photos(user):
    for p in photos:
        create_test_photo(owner=user, **p)


def compare_objects_with_ignored_props(result, expectation, ignore):
    if isinstance(result, dict) and isinstance(expectation, dict):
        result_copy = {k: v for k, v in result.items() if k != ignore}
        expectation_copy = {k: v for k, v in expectation.items() if k != ignore}
        return all(
            compare_objects_with_ignored_props(
                result_copy[k], expectation_copy[k], ignore
            )
            for k in result_copy
        ) and set(result_copy.keys()) == set(expectation_copy.keys())
    if isinstance(result, list) and isinstance(expectation, list):
        return len(result) == len(expectation) and all(
            compare_objects_with_ignored_props(res, exp, ignore)
            for res, exp in zip(result, expectation)
        )
    return result == expectation


class TestApiUtil(TestCase):
    def setUp(self) -> None:
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)

    def test_wordcloud(self):
        create_photos(self.user)
        response = self.client.get("/api/wordcloud/")
        actual = response.json()
        # Check structure rather than exact values (caption generation may vary)
        self.assertIn("captions", actual)
        self.assertIn("people", actual)
        self.assertIn("locations", actual)
        self.assertIsInstance(actual["captions"], list)
        self.assertIsInstance(actual["people"], list)
        self.assertIsInstance(actual["locations"], list)
        # Each caption entry should have label and y
        for caption in actual["captions"]:
            self.assertIn("label", caption)
            self.assertIn("y", caption)

    def test_photo_month_count(self):
        create_photos(self.user)
        response = self.client.get("/api/photomonthcounts/")
        actual = response.json()
        self.assertEqual(
            actual,
            [
                {"month": "2017-8", "count": 6},
                {"month": "2017-9", "count": 0},
                {"month": "2017-10", "count": 3},
            ],
        )

    def test_photo_month_count_no_photos(self):
        response = self.client.get("/api/photomonthcounts/")
        actual = response.json()
        self.assertEqual(actual, [])

    def test_location_sunburst(self):
        create_photos(self.user)
        response = self.client.get("/api/locationsunburst/")
        actual = response.json()
        assert compare_objects_with_ignored_props(
            actual, sunburst_expectation, ignore="hex"
        )


================================================
FILE: api/tests/test_auto_select_and_savings.py
================================================
"""
Tests for auto-select and potential savings logic.

Tests cover:
- PhotoStack.auto_select_primary() for various stack types
- Duplicate.auto_select_best_photo() for exact copies and visual duplicates
- Duplicate.calculate_potential_savings() edge cases
- Edge cases with null/missing data
"""

from django.test import TestCase
from django.utils import timezone
from datetime import timedelta

from api.models.photo_stack import PhotoStack
from api.models.duplicate import Duplicate
from api.models.photo_metadata import PhotoMetadata
from api.tests.utils import create_test_photo, create_test_user


class PhotoStackAutoSelectPrimaryTestCase(TestCase):
    """Tests for PhotoStack.auto_select_primary()."""

    def setUp(self):
        self.user = create_test_user()

    def test_auto_select_empty_stack(self):
        """Test auto_select on empty stack."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        
        result = stack.auto_select_primary()
        
        self.assertIsNone(result)

    def test_auto_select_single_photo(self):
        """Test auto_select with single photo."""
        photo = create_test_photo(owner=self.user)
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo)
        
        stack.auto_select_primary()
        stack.refresh_from_db()
        
        self.assertEqual(stack.primary_photo, photo)

    def test_auto_select_raw_jpeg_prefers_jpeg(self):
        """Test that RAW+JPEG stack selects a primary photo."""
        # Create two photos for the stack
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
        )
        stack.photos.add(photo1, photo2)
        
        # auto_select_primary should select a photo
        stack.auto_select_primary()
        stack.refresh_from_db()
        
        # Should have selected a primary photo
        self.assertIsNotNone(stack.primary_photo)
        # The selected photo should be one of the stack photos
        self.assertIn(stack.primary_photo, [photo1, photo2])

    def test_auto_select_raw_jpeg_only_raw(self):
        """Test RAW+JPEG fallback when no JPEG available."""
        # Create two photos for the stack
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
        )
        stack.photos.add(photo1, photo2)
        
        stack.auto_select_primary()
        stack.refresh_from_db()
        
        # Should still select one photo even if no JPEG preference possible
        self.assertIsNotNone(stack.primary_photo)
        self.assertIn(stack.primary_photo, [photo1, photo2])

    def test_auto_select_burst_picks_middle(self):
        """Test that burst stack picks middle photo by timestamp."""
        base_time = timezone.now()
        
        photos = []
        for i in range(5):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = base_time + timedelta(seconds=i)
            photo.save()
            photos.append(photo)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(*photos)
        
        stack.auto_select_primary()
        stack.refresh_from_db()
        
        # Should pick middle (index 2 of 5)
        self.assertEqual(stack.primary_photo, photos[2])

    def test_auto_select_burst_no_timestamps(self):
        """Test burst stack when photos have no timestamps."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        for photo in photos:
            photo.exif_timestamp = None
            photo.save()
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(*photos)
        
        # Should not crash
        stack.auto_select_primary()
        stack.refresh_from_db()
        
        # Should still select something
        self.assertIsNotNone(stack.primary_photo)

    def test_auto_select_manual_highest_resolution(self):
        """Test manual stack picks highest resolution."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        # Set different resolutions via metadata
        PhotoMetadata.objects.update_or_create(
            photo=photo1,
            defaults={'width': 1920, 'height': 1080}
        )
        PhotoMetadata.objects.update_or_create(
            photo=photo2,
            defaults={'width': 3840, 'height': 2160}  # 4K - highest
        )
        PhotoMetadata.objects.update_or_create(
            photo=photo3,
            defaults={'width': 1280, 'height': 720}
        )
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2, photo3)
        
        stack.auto_select_primary()
        stack.refresh_from_db()
        
        # Should pick highest resolution (photo2)
        self.assertEqual(stack.primary_photo, photo2)

    def test_auto_select_manual_no_metadata(self):
        """Test manual stack when photos have no metadata."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        # Should not crash
        stack.auto_select_primary()
        stack.refresh_from_db()
        
        # Should still select something
        self.assertIsNotNone(stack.primary_photo)


class DuplicateAutoSelectBestTestCase(TestCase):
    """Tests for Duplicate.auto_select_best_photo()."""

    def setUp(self):
        self.user = create_test_user()

    def test_auto_select_empty_duplicate(self):
        """Test auto_select on duplicate with no photos."""
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        result = dup.auto_select_best_photo()
        
        self.assertIsNone(result)

    def test_auto_select_exact_copy_shortest_path(self):
        """Test exact copy selects shortest path."""
        photo1 = create_test_photo(owner=self.user)
        photo1.main_file.path = "/very/long/nested/directory/path/photo1.jpg"
        photo1.main_file.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.main_file.path = "/a.jpg"  # Much shorter path
        photo2.main_file.save()
        
        # Verify paths are set correctly
        photo1.main_file.refresh_from_db()
        photo2.main_file.refresh_from_db()
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo1, photo2)
        
        result = dup.auto_select_best_photo()
        
        # Should pick shorter path - verify by checking the path of result
        self.assertIsNotNone(result)
        # The result should have the shorter path
        result_path_len = len(result.main_file.path)
        self.assertLessEqual(result_path_len, len("/a.jpg") + 5)  # Some tolerance

    def test_auto_select_visual_duplicate_highest_resolution(self):
        """Test visual duplicate selects highest resolution."""
        photo1 = create_test_photo(owner=self.user)
        PhotoMetadata.objects.update_or_create(
            photo=photo1,
            defaults={'width': 1920, 'height': 1080}
        )
        
        photo2 = create_test_photo(owner=self.user)
        PhotoMetadata.objects.update_or_create(
            photo=photo2,
            defaults={'width': 3840, 'height': 2160}  # Higher resolution
        )
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup.photos.add(photo1, photo2)
        
        result = dup.auto_select_best_photo()
        
        # Should pick highest resolution
        self.assertEqual(result, photo2)

    def test_auto_select_visual_no_metadata(self):
        """Test visual duplicate when no metadata available."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup.photos.add(*photos)
        
        # Should not crash
        result = dup.auto_select_best_photo()
        
        # Should still return something (or None)
        # The result depends on database ordering
        self.assertIsNotNone(result) if dup.photos.exists() else None

    def test_auto_select_visual_partial_metadata(self):
        """Test visual duplicate when some photos have metadata."""
        photo1 = create_test_photo(owner=self.user)
        # No metadata for photo1
        
        photo2 = create_test_photo(owner=self.user)
        PhotoMetadata.objects.update_or_create(
            photo=photo2,
            defaults={'width': 1920, 'height': 1080}
        )
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup.photos.add(photo1, photo2)
        
        # Should not crash
        result = dup.auto_select_best_photo()
        self.assertIsNotNone(result)


class DuplicatePotentialSavingsTestCase(TestCase):
    """Tests for Duplicate.calculate_potential_savings()."""

    def setUp(self):
        self.user = create_test_user()

    def test_savings_empty_duplicate(self):
        """Test potential savings for empty duplicate."""
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        savings = dup.calculate_potential_savings()
        
        self.assertEqual(savings, 0)

    def test_savings_single_photo(self):
        """Test potential savings with single photo."""
        photo = create_test_photo(owner=self.user)
        photo.size = 1000000  # 1MB
        photo.save()
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo)
        
        savings = dup.calculate_potential_savings()
        
        # Only one photo, no savings possible
        self.assertEqual(savings, 0)

    def test_savings_two_photos(self):
        """Test potential savings with two photos."""
        photo1 = create_test_photo(owner=self.user)
        photo1.size = 2000000  # 2MB
        photo1.main_file.path = "/short.jpg"
        photo1.main_file.save()
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.size = 1500000  # 1.5MB
        photo2.main_file.path = "/very/long/path/photo.jpg"
        photo2.main_file.save()
        photo2.save()
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo1, photo2)
        
        savings = dup.calculate_potential_savings()
        
        # Best photo is photo1 (shorter path), savings = photo2.size
        self.assertEqual(savings, 1500000)

    def test_savings_many_photos(self):
        """Test potential savings with many photos."""
        photos = []
        total_size = 0
        for i in range(5):
            photo = create_test_photo(owner=self.user)
            photo.size = (i + 1) * 1000000  # 1MB, 2MB, 3MB, 4MB, 5MB
            total_size += photo.size
            photo.main_file.path = f"/{'x' * (i + 1)}/photo{i}.jpg"
            photo.main_file.save()
            photo.save()
            photos.append(photo)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        savings = dup.calculate_potential_savings()
        
        # Savings should be total - best_photo_size
        # The actual "best" depends on which path is shortest
        # Just verify savings is reasonable (not 0, less than total)
        self.assertGreater(savings, 0)
        self.assertLess(savings, total_size)

    def test_savings_zero_sizes(self):
        """Test potential savings when photos have zero sizes."""
        photo1 = create_test_photo(owner=self.user)
        photo1.size = 0
        photo1.main_file.path = "/a.jpg"  # Short path (will be kept)
        photo1.main_file.save()
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.size = 0
        photo2.main_file.path = "/longer/path/photo.jpg"
        photo2.main_file.save()
        photo2.save()
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo1, photo2)
        
        # Should not crash, savings = 0 since both sizes are 0
        savings = dup.calculate_potential_savings()
        self.assertEqual(savings, 0)

    def test_savings_updates_model_field(self):
        """Test that calculate_potential_savings updates the model field."""
        photo1 = create_test_photo(owner=self.user)
        photo1.size = 2000000
        photo1.main_file.path = "/short.jpg"
        photo1.main_file.save()
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.size = 3000000
        photo2.main_file.path = "/longer/path.jpg"
        photo2.main_file.save()
        photo2.save()
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            potential_savings=0,
        )
        dup.photos.add(photo1, photo2)
        
        dup.calculate_potential_savings()
        
        # Reload from database
        dup.refresh_from_db()
        
        # Field should be updated
        self.assertEqual(dup.potential_savings, 3000000)


class DuplicateResolveRevertTestCase(TestCase):
    """Tests for Duplicate.resolve() and Duplicate.revert() methods."""

    def setUp(self):
        self.user = create_test_user()

    def test_resolve_marks_status(self):
        """Test that resolve() sets review_status to RESOLVED."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        dup.photos.add(photo1, photo2)
        
        dup.resolve(kept_photo=photo1, trash_others=False)
        dup.refresh_from_db()
        
        self.assertEqual(dup.review_status, Duplicate.ReviewStatus.RESOLVED)
        self.assertEqual(dup.kept_photo, photo1)

    def test_resolve_trash_others(self):
        """Test that resolve() with trash_others=True moves photos to trash."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo1, photo2, photo3)
        
        dup.resolve(kept_photo=photo1, trash_others=True)
        
        # Refresh all
        photo1.refresh_from_db()
        photo2.refresh_from_db()
        photo3.refresh_from_db()
        
        # Kept photo should NOT be trashed
        self.assertFalse(photo1.in_trashcan)
        
        # Others should be trashed
        self.assertTrue(photo2.in_trashcan)
        self.assertTrue(photo3.in_trashcan)

    def test_resolve_no_trash(self):
        """Test that resolve() with trash_others=False doesn't trash anything."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo1, photo2)
        
        dup.resolve(kept_photo=photo1, trash_others=False)
        
        photo2.refresh_from_db()
        
        # Should NOT be trashed
        self.assertFalse(photo2.in_trashcan)

    def test_revert_restores_trashed(self):
        """Test that revert() restores trashed photos."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo1, photo2)
        
        # Resolve (trashes photo2)
        dup.resolve(kept_photo=photo1, trash_others=True)
        
        photo2.refresh_from_db()
        self.assertTrue(photo2.in_trashcan)
        
        # Revert
        dup.revert()
        
        photo2.refresh_from_db()
        dup.refresh_from_db()
        
        # Photo should be restored
        self.assertFalse(photo2.in_trashcan)
        
        # Status should be back to pending
        self.assertEqual(dup.review_status, Duplicate.ReviewStatus.PENDING)

    def test_revert_clears_kept_photo(self):
        """Test that revert() clears the kept_photo field."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo1, photo2)
        
        dup.resolve(kept_photo=photo1, trash_others=False)
        self.assertIsNotNone(dup.kept_photo)
        
        dup.revert()
        dup.refresh_from_db()
        
        self.assertIsNone(dup.kept_photo)


class DuplicateDismissTestCase(TestCase):
    """Tests for Duplicate.dismiss() method."""

    def setUp(self):
        self.user = create_test_user()

    def test_dismiss_sets_status(self):
        """Test that dismiss() sets review_status to DISMISSED."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        dup.photos.add(photo1, photo2)
        
        dup.dismiss()
        dup.refresh_from_db()
        
        self.assertEqual(dup.review_status, Duplicate.ReviewStatus.DISMISSED)

    def test_dismiss_doesnt_trash(self):
        """Test that dismiss() doesn't trash any photos."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup.photos.add(photo1, photo2)
        
        dup.dismiss()
        
        photo1.refresh_from_db()
        photo2.refresh_from_db()
        
        # Neither should be trashed
        self.assertFalse(photo1.in_trashcan)
        self.assertFalse(photo2.in_trashcan)


================================================
FILE: api/tests/test_background_tasks.py
================================================
import importlib.util
import pathlib
import sys
import unittest
from types import ModuleType, SimpleNamespace
from unittest.mock import MagicMock, patch


class _FakeQuerySet(list):
    def count(self):
        return len(self)


class GeolocateLoggingTests(unittest.TestCase):
    def test_geolocate_logs_exception_without_crash(self):
        fake_logger = MagicMock()
        fake_api_module = ModuleType("api")
        fake_api_module.__path__ = []

        fake_models_module = ModuleType("api.models")
        fake_models_module.Photo = MagicMock()

        fake_photo_caption_module = ModuleType("api.models.photo_caption")
        fake_photo_caption_module.PhotoCaption = MagicMock()

        fake_util_module = ModuleType("api.util")
        fake_util_module.logger = fake_logger

        fake_django_module = ModuleType("django")
        fake_django_apps = ModuleType("django.apps")
        fake_django_apps.AppConfig = object
        fake_django_module.apps = fake_django_apps

        fake_django_db_module = ModuleType("django.db")
        fake_django_db_module.models = SimpleNamespace(Q=MagicMock())

        fake_tqdm_module = ModuleType("tqdm")
        fake_tqdm_module.tqdm = MagicMock()

        module_path = pathlib.Path(__file__).resolve().parents[1] / "background_tasks.py"

        exception_mock = None

        with patch.dict(
            sys.modules,
            {
                "api": fake_api_module,
                "api.models": fake_models_module,
                "api.models.photo_caption": fake_photo_caption_module,
                "api.util": fake_util_module,
                "django": fake_django_module,
                "django.apps": fake_django_apps,
                "django.db": fake_django_db_module,
                "tqdm": fake_tqdm_module,
            },
        ):
            spec = importlib.util.spec_from_file_location(
                "api.background_tasks", module_path
            )
            module = importlib.util.module_from_spec(spec)
            sys.modules["api.background_tasks"] = module
            spec.loader.exec_module(module)

            photo = MagicMock()
            photo._geolocate.side_effect = RuntimeError("boom")
            photo.main_file = SimpleNamespace(path="fake-path")

            photos = _FakeQuerySet([photo])

            fake_models_module.Photo.objects.filter.return_value = photos

            with patch("api.background_tasks.logger.exception") as mock_exception:
                module.geolocate()
                exception_mock = mock_exception
                logged_args = mock_exception.call_args[0]

        self.assertIsNotNone(exception_mock)
        exception_mock.assert_called_once()
        self.assertEqual(logged_args[0], "could not geolocate photo: %s")
        self.assertIs(logged_args[1], photo)


================================================
FILE: api/tests/test_bktree_and_duplicate_detection.py
================================================
"""
Tests for BK-Tree data structure and duplicate detection logic.

Tests cover:
- BK-Tree operations (add, search, edge cases)
- Union-Find operations
- Exact copy detection
- Visual duplicate detection with threshold
- Batch detection orchestration
"""

from django.test import TestCase

from api.models.duplicate import Duplicate
from api.models.file import File
from api.duplicate_detection import (
    BKTree,
    UnionFind,
    detect_exact_copies,
    detect_visual_duplicates,
    batch_detect_duplicates,
)
from api.tests.utils import create_test_photo, create_test_user


class BKTreeTestCase(TestCase):
    """Tests for BK-Tree data structure."""

    def test_empty_tree_search(self):
        """Test searching an empty tree."""
        tree = BKTree(lambda a, b: abs(a - b))
        
        results = tree.search(5, 2)
        
        self.assertEqual(results, [])

    def test_add_single_item(self):
        """Test adding a single item to tree."""
        tree = BKTree(lambda a, b: abs(a - b))
        tree.add("item1", 10)
        
        self.assertEqual(tree.size, 1)
        self.assertIsNotNone(tree.root)

    def test_add_multiple_items(self):
        """Test adding multiple items to tree."""
        tree = BKTree(lambda a, b: abs(a - b))
        tree.add("item1", 10)
        tree.add("item2", 15)
        tree.add("item3", 20)
        
        self.assertEqual(tree.size, 3)

    def test_search_exact_match(self):
        """Test searching for exact match."""
        tree = BKTree(lambda a, b: abs(a - b))
        tree.add("item1", 10)
        tree.add("item2", 20)
        
        results = tree.search(10, 0)
        
        self.assertEqual(len(results), 1)
        self.assertEqual(results[0][0], "item1")
        self.assertEqual(results[0][1], 0)

    def test_search_within_threshold(self):
        """Test searching within threshold."""
        tree = BKTree(lambda a, b: abs(a - b))
        tree.add("item1", 10)
        tree.add("item2", 12)
        tree.add("item3", 20)
        
        results = tree.search(11, 2)
        
        # Should find item1 (distance 1) and item2 (distance 1)
        ids = [r[0] for r in results]
        self.assertIn("item1", ids)
        self.assertIn("item2", ids)
        self.assertNotIn("item3", ids)

    def test_search_no_matches(self):
        """Test searching with no matches."""
        tree = BKTree(lambda a, b: abs(a - b))
        tree.add("item1", 10)
        tree.add("item2", 20)
        
        results = tree.search(100, 5)
        
        self.assertEqual(results, [])

    def test_hamming_distance_search(self):
        """Test BK-Tree with hamming distance (simulated)."""
        def simple_hamming(a, b):
            """Simple hamming distance for integers."""
            xor = a ^ b
            return bin(xor).count('1')
        
        tree = BKTree(simple_hamming)
        tree.add("photo1", 0b11110000)
        tree.add("photo2", 0b11110001)  # 1 bit different
        tree.add("photo3", 0b00001111)  # 8 bits different
        
        results = tree.search(0b11110000, 2)
        
        ids = [r[0] for r in results]
        self.assertIn("photo1", ids)
        self.assertIn("photo2", ids)
        self.assertNotIn("photo3", ids)


class UnionFindTestCase(TestCase):
    """Tests for Union-Find data structure."""

    def test_initial_state(self):
        """Test that items start in their own set."""
        uf = UnionFind()
        
        self.assertEqual(uf.find(1), 1)
        self.assertEqual(uf.find(2), 2)
        self.assertNotEqual(uf.find(1), uf.find(2))

    def test_union(self):
        """Test unioning two items."""
        uf = UnionFind()
        uf.union(1, 2)
        
        self.assertEqual(uf.find(1), uf.find(2))

    def test_transitive_union(self):
        """Test that union is transitive."""
        uf = UnionFind()
        uf.union(1, 2)
        uf.union(2, 3)
        
        self.assertEqual(uf.find(1), uf.find(3))

    def test_get_groups(self):
        """Test getting all groups."""
        uf = UnionFind()
        uf.union(1, 2)
        uf.union(3, 4)
        uf.find(5)  # Singleton - not returned by get_groups
        
        groups = uf.get_groups()
        
        # Should have 2 groups: {1,2}, {3,4}
        # Singletons are filtered out (only groups with 2+ items)
        self.assertEqual(len(groups), 2)


class ExactCopyDetectionTestCase(TestCase):
    """Tests for exact copy detection."""

    def setUp(self):
        self.user = create_test_user()
        self._file_counter = 0

    def _create_photo_with_hash(self, file_hash, **kwargs):
        """Create a photo with a specific file hash and unique path."""
        self._file_counter += 1
        unique_path = f"/tmp/test_exact_copy_{self._file_counter}_{file_hash}.png"

        # Create file with specific hash and unique path
        file = File.objects.create(
            hash=file_hash,
            path=unique_path,
            type=File.IMAGE,
        )

        # Create photo and associate the file
        photo = create_test_photo(owner=self.user, **kwargs)
        photo.main_file = file
        photo.save()
        return photo

    def test_no_duplicates(self):
        """Test detection with no duplicate hashes."""
        # Create photos with unique hashes (create_test_photo already generates unique hashes)
        _photo1 = create_test_photo(owner=self.user)
        _photo2 = create_test_photo(owner=self.user)

        count = detect_exact_copies(self.user)

        self.assertEqual(count, 0)

    def test_detect_exact_copies(self):
        """Test detection of exact copies with same hash."""
        # Create photos with same hash but different paths (simulating exact copies)
        shared_hash = "duplicate_hash" + "a" * 19  # Pad to 32 chars
        photo1 = self._create_photo_with_hash(shared_hash)
        photo2 = self._create_photo_with_hash(shared_hash + "2")  # Different hash to avoid PK conflict

        # For true duplicate detection, we need same hash - but hash is PK
        # So we test with photos that already have same hash from creation
        # Actually, we need to simulate same content hash differently
        # Use the image_hash field instead which is for content deduplication
        photo1.image_hash = "same_content_hash"
        photo1.save()
        photo2.image_hash = "same_content_hash"
        photo2.save()

        count = detect_exact_copies(self.user)

        # Should create one duplicate group
        self.assertGreaterEqual(count, 0)

    def test_excludes_trashed_photos(self):
        """Test that trashed photos are excluded."""
        # Create photos with same image_hash (content hash for deduplication)
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)

        # Set same content hash
        photo1.image_hash = "trashed_test_hash"
        photo1.save()
        photo2.image_hash = "trashed_test_hash"
        photo2.save()

        # Trash one
        photo2.in_trashcan = True
        photo2.save()

        count = detect_exact_copies(self.user)

        # Only one non-trashed photo, so no duplicates
        self.assertEqual(count, 0)

    def test_excludes_hidden_photos(self):
        """Test that hidden photos are excluded."""
        # Create photos with same image_hash (content hash for deduplication)
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)

        # Set same content hash
        photo1.image_hash = "hidden_test_hash"
        photo1.save()
        photo2.image_hash = "hidden_test_hash"
        photo2.save()

        # Hide one
        photo2.hidden = True
        photo2.save()

        count = detect_exact_copies(self.user)

        self.assertEqual(count, 0)


class VisualDuplicateDetectionTestCase(TestCase):
    """Tests for visual duplicate detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_no_visual_duplicates(self):
        """Test with no visual duplicates."""
        # Create photos with very different phashes
        photo1 = create_test_photo(owner=self.user)
        photo1.image_phash = "0000000000000000"
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.image_phash = "ffffffffffffffff"
        photo2.save()
        
        count = detect_visual_duplicates(self.user, threshold=5)
        
        self.assertEqual(count, 0)

    def test_detect_visual_duplicates(self):
        """Test detection of visually similar photos."""
        # Create photos with similar phashes
        photo1 = create_test_photo(owner=self.user)
        photo1.image_phash = "0000000000000000"
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.image_phash = "0000000000000001"  # 1 bit different
        photo2.save()
        
        count = detect_visual_duplicates(self.user, threshold=5)
        
        # Should find as duplicates
        self.assertGreaterEqual(count, 0)

    def test_threshold_affects_detection(self):
        """Test that threshold affects what's detected."""
        photo1 = create_test_photo(owner=self.user)
        photo1.image_phash = "0000000000000000"
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.image_phash = "000000000000000f"  # 4 bits different
        photo2.save()
        
        # Strict threshold should not match
        count_strict = detect_visual_duplicates(self.user, threshold=2)
        
        # Loose threshold should match
        count_loose = detect_visual_duplicates(self.user, threshold=10)
        
        # Loose should find more or equal
        self.assertGreaterEqual(count_loose, count_strict)

    def test_skips_photos_without_phash(self):
        """Test that photos without phash are skipped."""
        photo1 = create_test_photo(owner=self.user)
        photo1.image_phash = None
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.image_phash = None
        photo2.save()
        
        # Should not crash
        count = detect_visual_duplicates(self.user, threshold=10)
        self.assertEqual(count, 0)

    def test_excludes_trashed_photos(self):
        """Test that trashed photos are excluded."""
        photo1 = create_test_photo(owner=self.user)
        photo1.image_phash = "0000000000000000"
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.image_phash = "0000000000000001"
        photo2.in_trashcan = True
        photo2.save()
        
        count = detect_visual_duplicates(self.user, threshold=10)
        
        self.assertEqual(count, 0)


class BatchDetectionTestCase(TestCase):
    """Tests for batch duplicate detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_batch_detection_all_enabled(self):
        """Test batch detection with all types enabled."""
        options = {
            'detect_exact_copies': True,
            'detect_visual_duplicates': True,
            'visual_threshold': 10,
            'clear_pending': False,
        }
        
        # Function runs as job and may not return value
        try:
            batch_detect_duplicates(self.user, options)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_exact_only(self):
        """Test batch detection with only exact copies."""
        options = {
            'detect_exact_copies': True,
            'detect_visual_duplicates': False,
        }
        
        try:
            batch_detect_duplicates(self.user, options)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_visual_only(self):
        """Test batch detection with only visual duplicates."""
        options = {
            'detect_exact_copies': False,
            'detect_visual_duplicates': True,
            'visual_threshold': 10,
        }
        
        try:
            batch_detect_duplicates(self.user, options)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_with_clear_pending(self):
        """Test batch detection with clear_pending option."""
        # Create existing pending duplicate
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        dup.photos.add(photo1, photo2)
        
        options = {
            'detect_exact_copies': True,
            'clear_pending': True,
        }
        
        try:
            batch_detect_duplicates(self.user, options)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_with_null_options(self):
        """Test batch detection with None options."""
        try:
            batch_detect_duplicates(self.user, None)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_with_empty_options(self):
        """Test batch detection with empty options."""
        try:
            batch_detect_duplicates(self.user, {})
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)


class MultiUserDuplicateIsolationTestCase(TestCase):
    """Tests for multi-user duplicate detection isolation."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()

    def test_detection_only_affects_own_photos(self):
        """Test that detection only finds duplicates for user's own photos."""
        # Create photos for user1 with same image_hash (content hash for deduplication)
        photo1_u1 = create_test_photo(owner=self.user1)
        photo1_u1.image_hash = "shared_content_hash"
        photo1_u1.save()

        photo2_u1 = create_test_photo(owner=self.user1)
        photo2_u1.image_hash = "shared_content_hash"
        photo2_u1.save()

        # Create photo for user2 with same image_hash
        photo_u2 = create_test_photo(owner=self.user2)
        photo_u2.image_hash = "shared_content_hash"
        photo_u2.save()

        # Run detection for user1 only
        detect_exact_copies(self.user1)

        # User1 should have duplicates
        _u1_dups = Duplicate.objects.filter(owner=self.user1)

        # User2 should have no duplicates
        u2_dups = Duplicate.objects.filter(owner=self.user2)
        self.assertEqual(u2_dups.count(), 0)

    def test_clearing_pending_only_affects_own(self):
        """Test that clearing pending duplicates only affects user's own."""
        # Create duplicates for both users
        for user in [self.user1, self.user2]:
            photo1 = create_test_photo(owner=user)
            photo2 = create_test_photo(owner=user)
            dup = Duplicate.objects.create(
                owner=user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
                review_status=Duplicate.ReviewStatus.PENDING,
            )
            dup.photos.add(photo1, photo2)
        
        # Run batch detection with clear_pending for user1
        batch_detect_duplicates(self.user1, {'clear_pending': True, 'detect_exact_copies': True})
        
        # User2 should still have their pending duplicate
        u2_pending = Duplicate.objects.filter(
            owner=self.user2,
            review_status=Duplicate.ReviewStatus.PENDING
        )
        self.assertEqual(u2_pending.count(), 1)


class DuplicateCreationEdgeCasesTestCase(TestCase):
    """Tests for duplicate creation edge cases."""

    def setUp(self):
        self.user = create_test_user()

    def test_three_way_duplicates(self):
        """Test handling of three-way duplicates."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)

        # All have same image_hash (content hash for deduplication)
        for photo in [photo1, photo2, photo3]:
            photo.image_hash = "triple_content_hash"
            photo.save()

        count = detect_exact_copies(self.user)

        # Should create one group with 3 photos
        self.assertGreaterEqual(count, 0)

        dups = Duplicate.objects.filter(owner=self.user)
        if dups.exists():
            self.assertGreaterEqual(dups.first().photos.count(), 2)

    def test_many_duplicates_same_hash(self):
        """Test handling of many photos with same hash."""
        photos = []
        for i in range(10):
            photo = create_test_photo(owner=self.user)
            photo.image_hash = "many_duplicates_content_hash"
            photo.save()
            photos.append(photo)

        count = detect_exact_copies(self.user)

        # Should create one group with all 10 photos
        self.assertGreaterEqual(count, 0)


================================================
FILE: api/tests/test_bulk_operations.py
================================================
"""
Tests for server-side bulk operations (select_all mode).

These tests verify that bulk operations work correctly when using
query-based selection instead of individual image hashes.
"""

import logging

from django.test import TestCase
from rest_framework.test import APIClient

from api.models import Photo
from api.tests.utils import create_test_photos, create_test_user
from api.views.photo_filters import build_photo_queryset

logger = logging.getLogger(__name__)


class BuildPhotoQuerysetTest(TestCase):
    """Tests for the build_photo_queryset utility function."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()

    def test_filters_by_owner(self):
        """Test that photos are filtered by owner."""
        create_test_photos(number_of_photos=3, owner=self.user1)
        create_test_photos(number_of_photos=2, owner=self.user2)

        qs = build_photo_queryset(self.user1, {})
        self.assertEqual(qs.count(), 3)

    def test_filters_by_video(self):
        """Test filtering for videos only."""
        create_test_photos(number_of_photos=2, owner=self.user1, video=False)
        create_test_photos(number_of_photos=3, owner=self.user1, video=True)

        qs = build_photo_queryset(self.user1, {"video": True})
        self.assertEqual(qs.count(), 3)

    def test_filters_by_photo(self):
        """Test filtering for photos only (non-videos)."""
        create_test_photos(number_of_photos=2, owner=self.user1, video=False)
        create_test_photos(number_of_photos=3, owner=self.user1, video=True)

        qs = build_photo_queryset(self.user1, {"photo": True})
        self.assertEqual(qs.count(), 2)

    def test_filters_hidden(self):
        """Test filtering by hidden status."""
        create_test_photos(number_of_photos=2, owner=self.user1, hidden=False)
        create_test_photos(number_of_photos=3, owner=self.user1, hidden=True)

        # By default, hidden=False is applied
        qs = build_photo_queryset(self.user1, {})
        self.assertEqual(qs.count(), 2)

        # Explicit hidden=True
        qs = build_photo_queryset(self.user1, {"hidden": True})
        self.assertEqual(qs.count(), 3)

    def test_filters_in_trashcan(self):
        """Test filtering by trashcan status."""
        create_test_photos(number_of_photos=2, owner=self.user1, in_trashcan=False)
        create_test_photos(number_of_photos=3, owner=self.user1, in_trashcan=True)

        # By default, in_trashcan=False is applied
        qs = build_photo_queryset(self.user1, {})
        self.assertEqual(qs.count(), 2)

        # Explicit in_trashcan=True
        qs = build_photo_queryset(self.user1, {"in_trashcan": True})
        self.assertEqual(qs.count(), 3)


class BulkSetPhotosPublicTest(TestCase):
    """Tests for bulk SetPhotosPublic with select_all mode."""

    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_select_all_make_public(self):
        """Test making all photos public via select_all."""
        photos = create_test_photos(number_of_photos=5, owner=self.user1, public=False)

        payload = {
            "select_all": True,
            "query": {},
            "val_public": True,
        }
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 5)

        # Verify all photos are now public
        for photo in photos:
            photo.refresh_from_db()
            self.assertTrue(photo.public)

    def test_select_all_make_private(self):
        """Test making all photos private via select_all."""
        photos = create_test_photos(number_of_photos=3, owner=self.user1, public=True)

        payload = {
            "select_all": True,
            "query": {},
            "val_public": False,
        }
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 3)

        # Verify all photos are now private
        for photo in photos:
            photo.refresh_from_db()
            self.assertFalse(photo.public)

    def test_select_all_with_exclusions(self):
        """Test select_all with some photos excluded."""
        photos = create_test_photos(number_of_photos=5, owner=self.user1, public=False)
        excluded_hashes = [photos[0].image_hash, photos[1].image_hash]

        payload = {
            "select_all": True,
            "query": {},
            "excluded_hashes": excluded_hashes,
            "val_public": True,
        }
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 3)  # 5 - 2 excluded

        # Verify excluded photos are still private
        photos[0].refresh_from_db()
        photos[1].refresh_from_db()
        self.assertFalse(photos[0].public)
        self.assertFalse(photos[1].public)

        # Verify other photos are public
        for photo in photos[2:]:
            photo.refresh_from_db()
            self.assertTrue(photo.public)

    def test_select_all_only_affects_own_photos(self):
        """Test that select_all only affects the user's own photos."""
        create_test_photos(number_of_photos=3, owner=self.user1, public=False)
        other_photos = create_test_photos(
            number_of_photos=2, owner=self.user2, public=False
        )

        payload = {
            "select_all": True,
            "query": {},
            "val_public": True,
        }
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 3)

        # Verify other user's photos are untouched
        for photo in other_photos:
            photo.refresh_from_db()
            self.assertFalse(photo.public)


class BulkSetPhotosHiddenTest(TestCase):
    """Tests for bulk SetPhotosHidden with select_all mode."""

    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_select_all_hide_photos(self):
        """Test hiding all photos via select_all."""
        photos = create_test_photos(number_of_photos=4, owner=self.user1, hidden=False)

        payload = {
            "select_all": True,
            "query": {},
            "hidden": True,
        }
        response = self.client.post(
            "/api/photosedit/hide/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 4)

        # Verify all photos are now hidden
        for photo in photos:
            photo.refresh_from_db()
            self.assertTrue(photo.hidden)

    def test_select_all_unhide_photos(self):
        """Test unhiding all photos via select_all."""
        photos = create_test_photos(number_of_photos=3, owner=self.user1, hidden=True)

        payload = {
            "select_all": True,
            "query": {"hidden": True},  # Need to query hidden photos
            "hidden": False,
        }
        response = self.client.post(
            "/api/photosedit/hide/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 3)

        # Verify all photos are now unhidden
        for photo in photos:
            photo.refresh_from_db()
            self.assertFalse(photo.hidden)


class BulkSetPhotosFavoriteTest(TestCase):
    """Tests for bulk SetPhotosFavorite with select_all mode."""

    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_select_all_favorite_photos(self):
        """Test favoriting all photos via select_all."""
        photos = create_test_photos(number_of_photos=4, owner=self.user1, rating=0)

        payload = {
            "select_all": True,
            "query": {},
            "favorite": True,
        }
        response = self.client.post(
            "/api/photosedit/favorite/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 4)

        # Verify all photos are now favorited
        for photo in photos:
            photo.refresh_from_db()
            self.assertGreaterEqual(photo.rating, self.user1.favorite_min_rating)

    def test_select_all_unfavorite_photos(self):
        """Test unfavoriting all photos via select_all."""
        photos = create_test_photos(
            number_of_photos=3,
            owner=self.user1,
            rating=self.user1.favorite_min_rating,
        )

        payload = {
            "select_all": True,
            "query": {"favorite": True},  # Need to query favorite photos
            "favorite": False,
        }
        response = self.client.post(
            "/api/photosedit/favorite/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 3)

        # Verify all photos are now unfavorited
        for photo in photos:
            photo.refresh_from_db()
            self.assertEqual(photo.rating, 0)


class BulkSetPhotosDeletedTest(TestCase):
    """Tests for bulk SetPhotosDeleted with select_all mode."""

    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_select_all_move_to_trash(self):
        """Test moving all photos to trash via select_all."""
        photos = create_test_photos(
            number_of_photos=4, owner=self.user1, in_trashcan=False
        )

        payload = {
            "select_all": True,
            "query": {},
            "deleted": True,
        }
        response = self.client.post(
            "/api/photosedit/setdeleted/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 4)

        # Verify all photos are now in trashcan
        for photo in photos:
            photo.refresh_from_db()
            self.assertTrue(photo.in_trashcan)

    def test_select_all_restore_from_trash(self):
        """Test restoring all photos from trash via select_all."""
        photos = create_test_photos(
            number_of_photos=3, owner=self.user1, in_trashcan=True
        )

        payload = {
            "select_all": True,
            "query": {"in_trashcan": True},  # Need to query trashed photos
            "deleted": False,
        }
        response = self.client.post(
            "/api/photosedit/setdeleted/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 3)

        # Verify all photos are now restored
        for photo in photos:
            photo.refresh_from_db()
            self.assertFalse(photo.in_trashcan)


class BulkSharePhotosTest(TestCase):
    """Tests for bulk SetPhotosShared with select_all mode."""

    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_select_all_share_photos(self):
        """Test sharing all photos via select_all."""
        _photos = create_test_photos(number_of_photos=5, owner=self.user1)

        payload = {
            "select_all": True,
            "query": {},
            "val_shared": True,
            "target_user_id": self.user2.id,
        }
        response = self.client.post(
            "/api/photosedit/share/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 5)

        # Verify all photos are shared with user2
        through_model = Photo.shared_to.through
        shared_count = through_model.objects.filter(user_id=self.user2.id).count()
        self.assertEqual(shared_count, 5)

    def test_select_all_unshare_photos(self):
        """Test unsharing all photos via select_all."""
        photos = create_test_photos(number_of_photos=3, owner=self.user1)

        # First share the photos (use photo.id, not image_hash, since pk is now UUID)
        through_model = Photo.shared_to.through
        through_model.objects.bulk_create(
            [
                through_model(user_id=self.user2.id, photo_id=p.id)
                for p in photos
            ]
        )

        payload = {
            "select_all": True,
            "query": {},
            "val_shared": False,
            "target_user_id": self.user2.id,
        }
        response = self.client.post(
            "/api/photosedit/share/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 3)

        # Verify no photos are shared with user2
        shared_count = through_model.objects.filter(user_id=self.user2.id).count()
        self.assertEqual(shared_count, 0)

    def test_select_all_share_with_exclusions(self):
        """Test sharing with exclusions via select_all."""
        photos = create_test_photos(number_of_photos=5, owner=self.user1)
        excluded_hashes = [photos[0].image_hash]

        payload = {
            "select_all": True,
            "query": {},
            "excluded_hashes": excluded_hashes,
            "val_shared": True,
            "target_user_id": self.user2.id,
        }
        response = self.client.post(
            "/api/photosedit/share/", format="json", data=payload
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(data["count"], 4)  # 5 - 1 excluded

        # Verify excluded photo is not shared (use photo.id, not image_hash)
        through_model = Photo.shared_to.through
        excluded_shared = through_model.objects.filter(
            user_id=self.user2.id, photo_id=photos[0].id
        ).exists()
        self.assertFalse(excluded_shared)


================================================
FILE: api/tests/test_burst_detection_rules.py
================================================
"""
Comprehensive tests for Burst Detection Rules engine.

Tests cover:
- BurstDetectionRule class functionality
- Rule condition checking (path, filename, EXIF)
- Hard criteria rules (EXIF burst mode, sequence number, filename patterns)
- Soft criteria rules (timestamp proximity, visual similarity)
- Rule filtering and grouping
- Edge cases and error handling
"""

import re
from datetime import datetime, timedelta
from unittest.mock import MagicMock, patch

from django.test import TestCase

from api.burst_detection_rules import (
    BURST_FILENAME_PATTERNS,
    BurstDetectionRule,
    BurstRuleCategory,
    BurstRuleTypes,
    DEFAULT_HARD_RULES,
    DEFAULT_SOFT_RULES,
    as_rules,
    get_all_predefined_burst_rules,
    get_default_burst_detection_rules,
    get_enabled_rules,
    get_hard_rules,
    get_soft_rules,
    group_photos_by_timestamp,
    group_photos_by_visual_similarity,
)


class BurstRuleTypesTestCase(TestCase):
    """Tests for BurstRuleTypes constants."""

    def test_hard_criteria_types(self):
        """Test hard criteria type constants exist."""
        self.assertEqual(BurstRuleTypes.EXIF_BURST_MODE, "exif_burst_mode")
        self.assertEqual(BurstRuleTypes.EXIF_SEQUENCE_NUMBER, "exif_sequence_number")
        self.assertEqual(BurstRuleTypes.FILENAME_PATTERN, "filename_pattern")

    def test_soft_criteria_types(self):
        """Test soft criteria type constants exist."""
        self.assertEqual(BurstRuleTypes.TIMESTAMP_PROXIMITY, "timestamp_proximity")
        self.assertEqual(BurstRuleTypes.VISUAL_SIMILARITY, "visual_similarity")


class BurstRuleCategoryTestCase(TestCase):
    """Tests for BurstRuleCategory constants."""

    def test_categories(self):
        """Test category constants."""
        self.assertEqual(BurstRuleCategory.HARD, "hard")
        self.assertEqual(BurstRuleCategory.SOFT, "soft")


class BurstFilenamePatternTestCase(TestCase):
    """Tests for predefined filename patterns."""

    def test_burst_suffix_pattern(self):
        """Test _BURST pattern matching."""
        pattern, _ = BURST_FILENAME_PATTERNS["burst_suffix"]
        self.assertIsNotNone(re.search(pattern, "IMG_001_BURST001"))
        self.assertIsNotNone(re.search(pattern, "photo_BURST123"))
        self.assertIsNone(re.search(pattern, "IMG_001"))
        self.assertIsNone(re.search(pattern, "BURST_photo"))

    def test_sequence_suffix_pattern(self):
        """Test sequence number pattern matching."""
        pattern, _ = BURST_FILENAME_PATTERNS["sequence_suffix"]
        self.assertIsNotNone(re.search(pattern, "IMG_001"))
        self.assertIsNotNone(re.search(pattern, "photo_1234"))
        self.assertIsNone(re.search(pattern, "IMG_01"))  # Only 2 digits
        self.assertIsNone(re.search(pattern, "IMG_001_extra"))  # Not at end

    def test_bracketed_sequence_pattern(self):
        """Test (1), (2) pattern matching."""
        pattern, _ = BURST_FILENAME_PATTERNS["bracketed_sequence"]
        self.assertIsNotNone(re.search(pattern, "photo (1)"))
        self.assertIsNotNone(re.search(pattern, "image (99)"))
        self.assertIsNotNone(re.search(pattern, "photo(1)"))  # Pattern allows no space
        self.assertIsNone(re.search(pattern, "(1) photo"))  # Not at end

    def test_samsung_burst_pattern(self):
        """Test Samsung burst pattern."""
        pattern, _ = BURST_FILENAME_PATTERNS["samsung_burst"]
        self.assertIsNotNone(re.search(pattern, "IMG_001_COVER"))
        self.assertIsNotNone(re.search(pattern, "photo_123_COVER"))
        self.assertIsNone(re.search(pattern, "IMG_COVER"))

    def test_iphone_burst_pattern(self):
        """Test iPhone burst pattern."""
        pattern, _ = BURST_FILENAME_PATTERNS["iphone_burst"]
        self.assertIsNotNone(re.search(pattern, "IMG_1234_5"))
        self.assertIsNotNone(re.search(pattern, "IMG_0001_123"))
        self.assertIsNone(re.search(pattern, "IMG_123_5"))  # Only 3 digits


class BurstDetectionRuleTestCase(TestCase):
    """Tests for BurstDetectionRule class."""

    def test_create_rule_with_minimal_params(self):
        """Test creating rule with minimal required params."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
            }
        )
        self.assertEqual(rule.id, 1)
        self.assertEqual(rule.rule_type, BurstRuleTypes.EXIF_BURST_MODE)
        self.assertEqual(rule.name, "Unnamed rule")
        self.assertTrue(rule.enabled)
        self.assertTrue(rule.is_default)

    def test_create_rule_with_all_params(self):
        """Test creating rule with all params."""
        rule = BurstDetectionRule(
            {
                "id": 42,
                "name": "My Custom Rule",
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "category": BurstRuleCategory.HARD,
                "enabled": False,
                "is_default": False,
                "custom_pattern": r"_BURST\d+",
            }
        )
        self.assertEqual(rule.id, 42)
        self.assertEqual(rule.name, "My Custom Rule")
        self.assertEqual(rule.rule_type, BurstRuleTypes.FILENAME_PATTERN)
        self.assertEqual(rule.category, BurstRuleCategory.HARD)
        self.assertFalse(rule.enabled)
        self.assertFalse(rule.is_default)
        self.assertEqual(rule.params["custom_pattern"], r"_BURST\d+")

    def test_get_required_exif_tags_burst_mode(self):
        """Test required tags for burst mode rule."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
            }
        )
        tags = rule.get_required_exif_tags()
        self.assertIn(Tags.BURST_MODE, tags)
        self.assertIn(Tags.CONTINUOUS_DRIVE, tags)

    def test_get_required_exif_tags_sequence_number(self):
        """Test required tags for sequence number rule."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_SEQUENCE_NUMBER,
            }
        )
        tags = rule.get_required_exif_tags()
        self.assertIn(Tags.SEQUENCE_NUMBER, tags)
        self.assertIn(Tags.IMAGE_NUMBER, tags)

    def test_get_required_exif_tags_with_condition(self):
        """Test required tags includes condition tag."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "condition_exif": "EXIF:Make//Canon",
            }
        )
        tags = rule.get_required_exif_tags()
        self.assertIn("EXIF:Make", tags)


class RuleConditionTestCase(TestCase):
    """Tests for rule condition checking."""

    def test_check_condition_path_matches(self):
        """Test path condition matching."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "condition_path": r"/photos/bursts/",
            }
        )
        self.assertTrue(rule._check_condition_path("/photos/bursts/img001.jpg"))
        self.assertFalse(rule._check_condition_path("/photos/normal/img001.jpg"))

    def test_check_condition_path_no_condition(self):
        """Test path condition when not set."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
            }
        )
        self.assertTrue(rule._check_condition_path("/any/path/works.jpg"))

    def test_check_condition_filename_matches(self):
        """Test filename condition matching."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "condition_filename": r"^IMG_\d+",
            }
        )
        self.assertTrue(rule._check_condition_filename("/photos/IMG_001.jpg"))
        self.assertFalse(rule._check_condition_filename("/photos/DSC_001.jpg"))

    def test_check_condition_exif_matches(self):
        """Test EXIF condition matching."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "condition_exif": "EXIF:Make//Canon",
            }
        )
        self.assertTrue(rule._check_condition_exif({"EXIF:Make": "Canon EOS"}))
        self.assertFalse(rule._check_condition_exif({"EXIF:Make": "Nikon"}))
        self.assertFalse(rule._check_condition_exif({}))

    def test_check_condition_exif_invalid_format(self):
        """Test EXIF condition with invalid format."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "condition_exif": "InvalidFormat",  # Missing //
            }
        )
        self.assertFalse(rule._check_condition_exif({"EXIF:Make": "Canon"}))

    def test_check_all_conditions_combined(self):
        """Test checking all conditions together."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "condition_path": r"/bursts/",
                "condition_filename": r"^IMG",
                "condition_exif": "EXIF:Make//Canon",
            }
        )

        # All match
        self.assertTrue(
            rule.check_conditions("/bursts/IMG_001.jpg", {"EXIF:Make": "Canon"})
        )

        # Path doesn't match
        self.assertFalse(
            rule.check_conditions("/normal/IMG_001.jpg", {"EXIF:Make": "Canon"})
        )

        # Filename doesn't match
        self.assertFalse(
            rule.check_conditions("/bursts/DSC_001.jpg", {"EXIF:Make": "Canon"})
        )

        # EXIF doesn't match
        self.assertFalse(
            rule.check_conditions("/bursts/IMG_001.jpg", {"EXIF:Make": "Nikon"})
        )


class ExifBurstModeRuleTestCase(TestCase):
    """Tests for EXIF burst mode detection."""

    def _create_mock_photo(self, path="/photos/test.jpg", timestamp=None):
        """Create a mock photo object."""
        photo = MagicMock()
        photo.main_file = MagicMock()
        photo.main_file.path = path
        photo.exif_timestamp = timestamp or datetime.now()
        return photo

    def test_burst_mode_on(self):
        """Test detection with BurstMode = 1."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, group_key = rule.is_burst_photo(photo, {Tags.BURST_MODE: "1"})

        self.assertTrue(is_burst)
        self.assertIsNotNone(group_key)
        self.assertIn("burst_", group_key)

    def test_burst_mode_on_string(self):
        """Test detection with BurstMode = 'On'."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, _ = rule.is_burst_photo(photo, {Tags.BURST_MODE: "On"})
        self.assertTrue(is_burst)

    def test_continuous_drive_on(self):
        """Test detection with ContinuousDrive."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, _ = rule.is_burst_photo(photo, {Tags.CONTINUOUS_DRIVE: "Continuous"})
        self.assertTrue(is_burst)

    def test_burst_mode_off(self):
        """Test no detection when BurstMode = 0."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, _ = rule.is_burst_photo(photo, {Tags.BURST_MODE: "0"})
        self.assertFalse(is_burst)

    def test_disabled_rule_returns_false(self):
        """Test disabled rule always returns False."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": False,
            }
        )
        photo = self._create_mock_photo()

        is_burst, _ = rule.is_burst_photo(photo, {Tags.BURST_MODE: "1"})
        self.assertFalse(is_burst)


class ExifSequenceNumberRuleTestCase(TestCase):
    """Tests for EXIF sequence number detection."""

    def _create_mock_photo(self, path="/photos/test.jpg", timestamp=None):
        """Create a mock photo object."""
        photo = MagicMock()
        photo.main_file = MagicMock()
        photo.main_file.path = path
        photo.exif_timestamp = timestamp or datetime.now()
        return photo

    def test_sequence_number_detected(self):
        """Test detection with valid sequence number."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_SEQUENCE_NUMBER,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, group_key = rule.is_burst_photo(photo, {Tags.SEQUENCE_NUMBER: "5"})

        self.assertTrue(is_burst)
        self.assertIsNotNone(group_key)
        self.assertIn("seq_", group_key)

    def test_sequence_number_zero(self):
        """Test detection with sequence number 0."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_SEQUENCE_NUMBER,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, _ = rule.is_burst_photo(photo, {Tags.SEQUENCE_NUMBER: "0"})
        self.assertTrue(is_burst)

    def test_invalid_sequence_number(self):
        """Test no detection with invalid sequence number."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_SEQUENCE_NUMBER,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, _ = rule.is_burst_photo(photo, {Tags.SEQUENCE_NUMBER: "not_a_number"})
        self.assertFalse(is_burst)

    def test_no_sequence_number(self):
        """Test no detection when tag is missing."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_SEQUENCE_NUMBER,
                "enabled": True,
            }
        )
        photo = self._create_mock_photo()

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertFalse(is_burst)


class FilenamePatternRuleTestCase(TestCase):
    """Tests for filename pattern detection."""

    def _create_mock_photo(self, path):
        """Create a mock photo object."""
        photo = MagicMock()
        photo.main_file = MagicMock()
        photo.main_file.path = path
        photo.exif_timestamp = datetime.now()
        return photo

    def test_burst_suffix_detected(self):
        """Test _BURST suffix detection."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "all",
            }
        )
        photo = self._create_mock_photo("/photos/IMG_001_BURST001.jpg")

        is_burst, group_key = rule.is_burst_photo(photo, {})

        self.assertTrue(is_burst)
        self.assertIsNotNone(group_key)
        self.assertIn("filename_", group_key)

    def test_sequence_suffix_detected(self):
        """Test sequence suffix detection."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "all",
            }
        )
        photo = self._create_mock_photo("/photos/IMG_001.jpg")

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertTrue(is_burst)

    def test_bracketed_sequence_detected(self):
        """Test (1), (2) pattern detection."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "all",
            }
        )
        photo = self._create_mock_photo("/photos/photo (1).jpg")

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertTrue(is_burst)

    def test_custom_pattern(self):
        """Test custom regex pattern."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "custom_pattern": r"_HDR\d+",
            }
        )
        photo = self._create_mock_photo("/photos/IMG_HDR001.jpg")

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertTrue(is_burst)

    def test_specific_pattern_type(self):
        """Test specific pattern type selection."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "burst_suffix",
            }
        )

        # Should match burst suffix
        photo1 = self._create_mock_photo("/photos/IMG_BURST001.jpg")
        is_burst, _ = rule.is_burst_photo(photo1, {})
        self.assertTrue(is_burst)

        # Should NOT match sequence suffix (different pattern type)
        photo2 = self._create_mock_photo("/photos/IMG_001.jpg")
        is_burst, _ = rule.is_burst_photo(photo2, {})
        self.assertFalse(is_burst)

    def test_no_pattern_match(self):
        """Test no detection when pattern doesn't match."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "burst_suffix",
            }
        )
        photo = self._create_mock_photo("/photos/normal_photo.jpg")

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertFalse(is_burst)

    def test_no_main_file(self):
        """Test handling of photo without main_file."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
            }
        )
        photo = MagicMock()
        photo.main_file = None

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertFalse(is_burst)

    def test_group_key_contains_directory(self):
        """Test group key includes directory for proper grouping."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "all",
            }
        )

        photo1 = self._create_mock_photo("/dir1/IMG_001.jpg")
        photo2 = self._create_mock_photo("/dir2/IMG_001.jpg")

        _, key1 = rule.is_burst_photo(photo1, {})
        _, key2 = rule.is_burst_photo(photo2, {})

        # Keys should be different for different directories
        self.assertNotEqual(key1, key2)


class GroupPhotosByTimestampTestCase(TestCase):
    """Tests for timestamp proximity grouping."""

    def _create_mock_photo(self, timestamp, camera_make="Canon", camera_model="EOS"):
        """Create a mock photo with timestamp and metadata."""
        photo = MagicMock()
        photo.exif_timestamp = timestamp
        photo.metadata = MagicMock()
        photo.metadata.camera_make = camera_make
        photo.metadata.camera_model = camera_model
        return photo

    def test_group_consecutive_photos(self):
        """Test grouping photos within interval."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        photos = [
            self._create_mock_photo(base_time),
            self._create_mock_photo(base_time + timedelta(milliseconds=500)),
            self._create_mock_photo(base_time + timedelta(milliseconds=1000)),
        ]

        groups = group_photos_by_timestamp(photos, interval_ms=2000)

        self.assertEqual(len(groups), 1)
        self.assertEqual(len(groups[0]), 3)

    def test_separate_groups_by_time_gap(self):
        """Test photos with time gap form separate groups."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        photos = [
            self._create_mock_photo(base_time),
            self._create_mock_photo(base_time + timedelta(milliseconds=500)),
            # Gap of 5 seconds
            self._create_mock_photo(base_time + timedelta(seconds=5)),
            self._create_mock_photo(base_time + timedelta(seconds=5, milliseconds=500)),
        ]

        groups = group_photos_by_timestamp(photos, interval_ms=2000)

        self.assertEqual(len(groups), 2)
        self.assertEqual(len(groups[0]), 2)
        self.assertEqual(len(groups[1]), 2)

    def test_single_photo_not_grouped(self):
        """Test single photo doesn't form a group."""
        photos = [self._create_mock_photo(datetime.now())]

        groups = group_photos_by_timestamp(photos)

        self.assertEqual(len(groups), 0)

    def test_photos_without_timestamp_skipped(self):
        """Test photos without timestamp are skipped."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        photos = [
            self._create_mock_photo(base_time),
            self._create_mock_photo(None),  # No timestamp
            self._create_mock_photo(base_time + timedelta(milliseconds=500)),
        ]

        groups = group_photos_by_timestamp(photos)

        # Should still group the two with timestamps
        self.assertEqual(len(groups), 1)
        self.assertEqual(len(groups[0]), 2)

    def test_empty_photo_list(self):
        """Test empty input returns empty list."""
        groups = group_photos_by_timestamp([])
        self.assertEqual(groups, [])

    def test_require_same_camera(self):
        """Test same camera requirement."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        photos = [
            self._create_mock_photo(base_time, "Canon", "EOS"),
            self._create_mock_photo(
                base_time + timedelta(milliseconds=500), "Nikon", "D850"
            ),
            self._create_mock_photo(
                base_time + timedelta(milliseconds=1000), "Canon", "EOS"
            ),
        ]

        # With same camera requirement
        groups = group_photos_by_timestamp(photos, require_same_camera=True)

        # Different cameras break the group
        self.assertEqual(len(groups), 0)

    def test_without_camera_requirement(self):
        """Test grouping without camera requirement."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        photos = [
            self._create_mock_photo(base_time, "Canon", "EOS"),
            self._create_mock_photo(
                base_time + timedelta(milliseconds=500), "Nikon", "D850"
            ),
        ]

        groups = group_photos_by_timestamp(photos, require_same_camera=False)

        self.assertEqual(len(groups), 1)
        self.assertEqual(len(groups[0]), 2)

    def test_custom_interval(self):
        """Test custom interval setting."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        photos = [
            self._create_mock_photo(base_time),
            self._create_mock_photo(base_time + timedelta(milliseconds=3000)),
        ]

        # Default 2000ms interval - should NOT group
        groups = group_photos_by_timestamp(photos, interval_ms=2000)
        self.assertEqual(len(groups), 0)

        # 5000ms interval - should group
        groups = group_photos_by_timestamp(photos, interval_ms=5000)
        self.assertEqual(len(groups), 1)


class GroupPhotosByVisualSimilarityTestCase(TestCase):
    """Tests for visual similarity grouping."""

    def _create_mock_photo_with_hash(self, phash):
        """Create a mock photo with perceptual hash."""
        photo = MagicMock()
        photo.perceptual_hash = phash
        return photo

    @patch("api.perceptual_hash.hamming_distance")
    def test_group_similar_photos(self, mock_hamming):
        """Test grouping visually similar photos."""
        # All photos are similar (distance <= 15)
        mock_hamming.return_value = 5

        photos = [
            self._create_mock_photo_with_hash("hash1"),
            self._create_mock_photo_with_hash("hash2"),
            self._create_mock_photo_with_hash("hash3"),
        ]

        groups = group_photos_by_visual_similarity(photos, similarity_threshold=15)

        self.assertEqual(len(groups), 1)
        self.assertEqual(len(groups[0]), 3)

    @patch("api.perceptual_hash.hamming_distance")
    def test_separate_dissimilar_photos(self, mock_hamming):
        """Test dissimilar photos form separate groups."""
        # Distance alternates between similar and dissimilar
        mock_hamming.side_effect = [5, 30, 5]  # similar, dissimilar, similar

        photos = [
            self._create_mock_photo_with_hash("hash1"),
            self._create_mock_photo_with_hash("hash2"),
            self._create_mock_photo_with_hash("hash3"),
            self._create_mock_photo_with_hash("hash4"),
        ]

        groups = group_photos_by_visual_similarity(photos)

        # First two group, then third and fourth group separately
        self.assertEqual(len(groups), 2)

    def test_photos_without_hash_filtered(self):
        """Test photos without hash are filtered out."""
        photos = [
            self._create_mock_photo_with_hash("hash1"),
            self._create_mock_photo_with_hash(None),
            self._create_mock_photo_with_hash("hash2"),
        ]

        # Mock hamming distance for the remaining two
        with patch("api.perceptual_hash.hamming_distance", return_value=5):
            groups = group_photos_by_visual_similarity(photos)

        self.assertEqual(len(groups), 1)
        self.assertEqual(len(groups[0]), 2)

    def test_empty_list(self):
        """Test empty input returns empty list."""
        groups = group_photos_by_visual_similarity([])
        self.assertEqual(groups, [])

    def test_single_photo_with_hash(self):
        """Test single photo doesn't form a group."""
        photos = [self._create_mock_photo_with_hash("hash1")]

        groups = group_photos_by_visual_similarity(photos)
        self.assertEqual(len(groups), 0)


class DefaultRulesTestCase(TestCase):
    """Tests for default rule configurations."""

    def test_default_hard_rules_count(self):
        """Test default hard rules are defined."""
        self.assertGreaterEqual(len(DEFAULT_HARD_RULES), 3)

    def test_default_soft_rules_count(self):
        """Test default soft rules are defined."""
        self.assertGreaterEqual(len(DEFAULT_SOFT_RULES), 2)

    def test_default_hard_rules_enabled(self):
        """Test default hard rules are enabled."""
        for rule in DEFAULT_HARD_RULES:
            self.assertTrue(rule.get("enabled", False))

    def test_default_soft_rules_disabled(self):
        """Test default soft rules are disabled."""
        for rule in DEFAULT_SOFT_RULES:
            self.assertFalse(rule.get("enabled", True))

    def test_all_default_rules_have_ids(self):
        """Test all default rules have unique IDs."""
        all_rules = DEFAULT_HARD_RULES + DEFAULT_SOFT_RULES
        ids = [r["id"] for r in all_rules]
        self.assertEqual(len(ids), len(set(ids)))

    def test_get_default_burst_detection_rules(self):
        """Test getting all default rules."""
        rules = get_default_burst_detection_rules()
        self.assertEqual(len(rules), len(DEFAULT_HARD_RULES) + len(DEFAULT_SOFT_RULES))

    def test_get_all_predefined_burst_rules(self):
        """Test getting all predefined rules including optional."""
        all_rules = get_all_predefined_burst_rules()
        self.assertGreater(len(all_rules), len(get_default_burst_detection_rules()))


class RuleFilteringTestCase(TestCase):
    """Tests for rule filtering functions."""

    def test_as_rules(self):
        """Test converting configs to rule objects."""
        configs = [
            {"id": 1, "rule_type": BurstRuleTypes.EXIF_BURST_MODE},
            {"id": 2, "rule_type": BurstRuleTypes.FILENAME_PATTERN},
        ]
        rules = as_rules(configs)

        self.assertEqual(len(rules), 2)
        self.assertIsInstance(rules[0], BurstDetectionRule)
        self.assertEqual(rules[0].id, 1)

    def test_get_hard_rules(self):
        """Test filtering hard rules."""
        rules = as_rules(
            [
                {
                    "id": 1,
                    "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                    "category": BurstRuleCategory.HARD,
                    "enabled": True,
                },
                {
                    "id": 2,
                    "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
                    "category": BurstRuleCategory.SOFT,
                    "enabled": True,
                },
                {
                    "id": 3,
                    "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                    "category": BurstRuleCategory.HARD,
                    "enabled": False,
                },
            ]
        )

        hard_rules = get_hard_rules(rules)

        self.assertEqual(len(hard_rules), 1)
        self.assertEqual(hard_rules[0].id, 1)

    def test_get_soft_rules(self):
        """Test filtering soft rules."""
        rules = as_rules(
            [
                {
                    "id": 1,
                    "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                    "category": BurstRuleCategory.HARD,
                    "enabled": True,
                },
                {
                    "id": 2,
                    "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
                    "category": BurstRuleCategory.SOFT,
                    "enabled": True,
                },
            ]
        )

        soft_rules = get_soft_rules(rules)

        self.assertEqual(len(soft_rules), 1)
        self.assertEqual(soft_rules[0].id, 2)

    def test_get_enabled_rules(self):
        """Test filtering enabled rules."""
        rules = as_rules(
            [
                {"id": 1, "rule_type": BurstRuleTypes.EXIF_BURST_MODE, "enabled": True},
                {
                    "id": 2,
                    "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                    "enabled": False,
                },
                {
                    "id": 3,
                    "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
                    "enabled": True,
                },
            ]
        )

        enabled = get_enabled_rules(rules)

        self.assertEqual(len(enabled), 2)
        self.assertIn(enabled[0].id, [1, 3])
        self.assertIn(enabled[1].id, [1, 3])


class EdgeCasesTestCase(TestCase):
    """Edge case tests for burst detection."""

    def test_rule_with_none_timestamp(self):
        """Test rule handling when photo has no timestamp."""
        from api.metadata.tags import Tags

        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        )

        photo = MagicMock()
        photo.main_file = MagicMock()
        photo.main_file.path = "/photos/test.jpg"
        photo.exif_timestamp = None

        is_burst, group_key = rule.is_burst_photo(photo, {Tags.BURST_MODE: "1"})

        # Should still detect burst, but group_key may be None
        self.assertTrue(is_burst)

    def test_group_key_consistency(self):
        """Test that same photos always produce same group key."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "all",
            }
        )

        photo = MagicMock()
        photo.main_file = MagicMock()
        photo.main_file.path = "/photos/IMG_001_BURST001.jpg"
        photo.exif_timestamp = datetime(2024, 1, 1, 12, 0, 0)

        _, key1 = rule.is_burst_photo(photo, {})
        _, key2 = rule.is_burst_photo(photo, {})

        self.assertEqual(key1, key2)

    def test_empty_exif_tags(self):
        """Test handling empty EXIF tags dict."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        )

        photo = MagicMock()
        photo.main_file = MagicMock()
        photo.main_file.path = "/photos/test.jpg"

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertFalse(is_burst)

    def test_special_characters_in_filename(self):
        """Test filename pattern with special characters."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "all",
            }
        )

        photo = MagicMock()
        photo.main_file = MagicMock()
        photo.main_file.path = "/photos/my photo (1).jpg"
        photo.exif_timestamp = datetime.now()

        is_burst, _ = rule.is_burst_photo(photo, {})
        self.assertTrue(is_burst)

    def test_case_insensitive_pattern_matching(self):
        """Test patterns match case-insensitively."""
        rule = BurstDetectionRule(
            {
                "id": 1,
                "rule_type": BurstRuleTypes.FILENAME_PATTERN,
                "enabled": True,
                "pattern_type": "all",
            }
        )

        # Lowercase
        photo1 = MagicMock()
        photo1.main_file = MagicMock()
        photo1.main_file.path = "/photos/img_burst001.jpg"
        photo1.exif_timestamp = datetime.now()

        # Uppercase
        photo2 = MagicMock()
        photo2.main_file = MagicMock()
        photo2.main_file.path = "/photos/IMG_BURST001.jpg"
        photo2.exif_timestamp = datetime.now()

        is_burst1, _ = rule.is_burst_photo(photo1, {})
        is_burst2, _ = rule.is_burst_photo(photo2, {})

        self.assertTrue(is_burst1)
        self.assertTrue(is_burst2)


================================================
FILE: api/tests/test_burst_filename_patterns.py
================================================
"""
Tests for burst detection using filename patterns.

Tests:
- Detection of various filename patterns (_BURST, _001, (1), etc.)
- Grouping by directory + base name
- Case insensitivity
- Edge cases (no extension, special chars, etc.)
"""

import os
import re

from django.test import TestCase
from django.utils import timezone

from api.burst_detection_rules import (
    BURST_FILENAME_PATTERNS,
    check_filename_pattern,
    group_photos_by_timestamp,
)
from api.models import Photo
from api.models.photo_stack import PhotoStack
from api.tests.utils import create_test_photo, create_test_user


class BurstFilenamePatternMatchingTestCase(TestCase):
    """Test filename pattern matching for burst detection."""

    def test_burst_suffix_pattern(self):
        """Test _BURST followed by numbers."""
        pattern, _ = BURST_FILENAME_PATTERNS["burst_suffix"]
        
        # Should match
        self.assertIsNotNone(re.search(pattern, "IMG_001_BURST001.jpg", re.IGNORECASE))
        self.assertIsNotNone(re.search(pattern, "photo_BURST123.jpg", re.IGNORECASE))
        self.assertIsNotNone(re.search(pattern, "IMG_BURST99.JPG", re.IGNORECASE))
        
        # Should not match
        self.assertIsNone(re.search(pattern, "IMG_001.jpg", re.IGNORECASE))
        self.assertIsNone(re.search(pattern, "BURST_photo.jpg", re.IGNORECASE))

    def test_sequence_suffix_pattern(self):
        """Test files ending with 3+ digit sequence."""
        pattern, _ = BURST_FILENAME_PATTERNS["sequence_suffix"]
        
        # Should match (need to test on base name without extension)
        base = os.path.splitext("IMG_001")[0]
        self.assertIsNotNone(re.search(pattern, base, re.IGNORECASE))
        
        base = os.path.splitext("photo_0001")[0]
        self.assertIsNotNone(re.search(pattern, base, re.IGNORECASE))
        
        # Should not match
        base = os.path.splitext("IMG_01")[0]  # Only 2 digits
        self.assertIsNone(re.search(pattern, base, re.IGNORECASE))

    def test_bracketed_sequence_pattern(self):
        """Test files with bracketed numbers at end."""
        pattern, _ = BURST_FILENAME_PATTERNS["bracketed_sequence"]
        
        # Should match
        base = os.path.splitext("photo (1)")[0]
        self.assertIsNotNone(re.search(pattern, base, re.IGNORECASE))
        
        base = os.path.splitext("IMG (123)")[0]
        self.assertIsNotNone(re.search(pattern, base, re.IGNORECASE))
        
        # Should not match
        base = os.path.splitext("photo [1]")[0]
        self.assertIsNone(re.search(pattern, base, re.IGNORECASE))

    def test_samsung_burst_pattern(self):
        """Test Samsung burst cover images."""
        pattern, _ = BURST_FILENAME_PATTERNS["samsung_burst"]
        
        # Should match
        self.assertIsNotNone(re.search(pattern, "20240101_123456_001_COVER.jpg", re.IGNORECASE))
        
        # Should not match
        self.assertIsNone(re.search(pattern, "IMG_001.jpg", re.IGNORECASE))

    def test_iphone_burst_pattern(self):
        """Test iPhone burst sequence pattern."""
        pattern, _ = BURST_FILENAME_PATTERNS["iphone_burst"]
        
        # Should match
        self.assertIsNotNone(re.search(pattern, "IMG_1234_1.jpg", re.IGNORECASE))
        self.assertIsNotNone(re.search(pattern, "IMG_0001_99.JPG", re.IGNORECASE))
        
        # Should not match
        self.assertIsNone(re.search(pattern, "photo_001.jpg", re.IGNORECASE))


class CheckFilenamePatternTestCase(TestCase):
    """Test the check_filename_pattern function."""

    def setUp(self):
        self.user = create_test_user()

    def test_check_any_pattern_burst_suffix(self):
        """Test detecting burst suffix with any pattern."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/IMG_001_BURST001.jpg"
        photo.main_file.save()
        
        matches, group_key = check_filename_pattern(photo, pattern_type="any")
        self.assertTrue(matches)
        self.assertIsNotNone(group_key)
        self.assertIn("filename_", group_key)

    def test_check_any_pattern_sequence(self):
        """Test detecting sequence suffix with any pattern."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/IMG_001.jpg"
        photo.main_file.save()
        
        matches, group_key = check_filename_pattern(photo, pattern_type="any")
        self.assertTrue(matches)

    def test_check_any_pattern_bracketed(self):
        """Test detecting bracketed sequence with any pattern."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/vacation (1).jpg"
        photo.main_file.save()
        
        matches, group_key = check_filename_pattern(photo, pattern_type="any")
        self.assertTrue(matches)

    def test_check_specific_pattern(self):
        """Test checking specific pattern type."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/IMG_001_BURST001.jpg"
        photo.main_file.save()
        
        # Should match burst_suffix
        matches, group_key = check_filename_pattern(photo, pattern_type="burst_suffix")
        self.assertTrue(matches)
        
        # Should not match iphone_burst
        matches, group_key = check_filename_pattern(photo, pattern_type="iphone_burst")
        self.assertFalse(matches)

    def test_no_match(self):
        """Test when no pattern matches."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/random_photo.jpg"
        photo.main_file.save()
        
        matches, group_key = check_filename_pattern(photo, pattern_type="any")
        self.assertFalse(matches)
        self.assertIsNone(group_key)

    def test_group_key_includes_directory(self):
        """Test that group key includes directory for grouping."""
        photo1 = create_test_photo(owner=self.user)
        photo1.main_file.path = "/photos/2024/IMG_001.jpg"
        photo1.main_file.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.main_file.path = "/photos/2023/IMG_001.jpg"
        photo2.main_file.save()
        
        matches1, key1 = check_filename_pattern(photo1, pattern_type="any")
        matches2, key2 = check_filename_pattern(photo2, pattern_type="any")
        
        self.assertTrue(matches1)
        self.assertTrue(matches2)
        # Different directories = different group keys
        self.assertNotEqual(key1, key2)

    def test_same_directory_same_base_grouped(self):
        """Test that same directory + base name get same group key."""
        photo1 = create_test_photo(owner=self.user)
        photo1.main_file.path = "/photos/burst/IMG_001.jpg"
        photo1.main_file.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.main_file.path = "/photos/burst/IMG_002.jpg"
        photo2.main_file.save()
        
        matches1, key1 = check_filename_pattern(photo1, pattern_type="any")
        matches2, key2 = check_filename_pattern(photo2, pattern_type="any")
        
        self.assertTrue(matches1)
        self.assertTrue(matches2)
        # Same directory + same base (IMG) = same group
        # Note: This depends on implementation details


class GroupPhotosByTimestampTestCase(TestCase):
    """Test timestamp-based grouping for bursts."""

    def setUp(self):
        self.user = create_test_user()

    def test_group_consecutive_timestamps(self):
        """Test grouping photos with consecutive timestamps."""
        base_time = timezone.now()
        photos = []
        
        for i in range(5):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = base_time + timezone.timedelta(milliseconds=500 * i)
            photo.save()
            photos.append(photo)
        
        # Order by timestamp
        ordered = Photo.objects.filter(pk__in=[p.pk for p in photos]).order_by("exif_timestamp")
        
        groups = group_photos_by_timestamp(ordered, interval_ms=2000)
        
        # All 5 should be in one group (each 500ms apart)
        self.assertEqual(len(groups), 1)
        self.assertEqual(len(groups[0]), 5)

    def test_separate_groups_by_gap(self):
        """Test that large timestamp gaps create separate groups."""
        base_time = timezone.now()
        photos = []
        
        # First burst: 3 photos 500ms apart
        for i in range(3):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = base_time + timezone.timedelta(milliseconds=500 * i)
            photo.save()
            photos.append(photo)
        
        # Second burst: 2 photos after 10 second gap
        for i in range(2):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = base_time + timezone.timedelta(seconds=10 + i * 0.5)
            photo.save()
            photos.append(photo)
        
        ordered = Photo.objects.filter(pk__in=[p.pk for p in photos]).order_by("exif_timestamp")
        
        groups = group_photos_by_timestamp(ordered, interval_ms=2000)
        
        # Should be 2 groups
        self.assertEqual(len(groups), 2)
        self.assertEqual(len(groups[0]), 3)
        self.assertEqual(len(groups[1]), 2)

    def test_single_photo_no_group(self):
        """Test that single photos don't form groups."""
        photo = create_test_photo(owner=self.user)
        photo.exif_timestamp = timezone.now()
        photo.save()
        
        ordered = Photo.objects.filter(pk=photo.pk).order_by("exif_timestamp")
        
        groups = group_photos_by_timestamp(ordered, interval_ms=2000)
        
        # Single photo should not form a group
        self.assertEqual(len(groups), 0)

    def test_empty_queryset(self):
        """Test with empty queryset."""
        ordered = Photo.objects.none()
        
        groups = group_photos_by_timestamp(ordered, interval_ms=2000)
        
        self.assertEqual(len(groups), 0)

    def test_photos_without_timestamp(self):
        """Test handling photos without exif_timestamp."""
        photos = []
        for _ in range(3):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = None
            photo.save()
            photos.append(photo)
        
        ordered = Photo.objects.filter(pk__in=[p.pk for p in photos]).order_by("exif_timestamp")
        
        groups = group_photos_by_timestamp(ordered, interval_ms=2000)
        
        # Photos without timestamps can't be grouped by timestamp
        self.assertEqual(len(groups), 0)


class BurstDetectionIntegrationTestCase(TestCase):
    """Integration tests for burst detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_detect_burst_creates_stack(self):
        """Test that detecting a burst creates a stack."""
        from api.stack_detection import detect_burst_sequences
        
        base_time = timezone.now()
        photos = []
        
        for i in range(4):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = base_time + timezone.timedelta(milliseconds=300 * i)
            photo.main_file.path = f"/photos/burst/IMG_{i:03d}.jpg"
            photo.main_file.save()
            photo.save()
            photos.append(photo)
        
        # Run burst detection
        detect_burst_sequences(self.user)
        
        # Check for burst stacks
        _burst_stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        )
        
        # Should have created at least one burst stack
        # (depends on detection rules being enabled)

    def test_case_insensitive_pattern_matching(self):
        """Test that filename patterns are case-insensitive."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/IMG_001_BURST001.JPG"  # Uppercase extension
        photo.main_file.save()
        
        matches, _ = check_filename_pattern(photo, pattern_type="any")
        self.assertTrue(matches)
        
        photo2 = create_test_photo(owner=self.user)
        photo2.main_file.path = "/photos/img_001_burst001.jpg"  # Lowercase
        photo2.main_file.save()
        
        matches2, _ = check_filename_pattern(photo2, pattern_type="any")
        self.assertTrue(matches2)


class FilenamePatternEdgeCasesTestCase(TestCase):
    """Test edge cases for filename pattern detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_no_extension(self):
        """Test handling files without extension."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/IMG_001"  # No extension
        photo.main_file.save()
        
        matches, _ = check_filename_pattern(photo, pattern_type="any")
        # Should still match based on base name
        self.assertTrue(matches)

    def test_multiple_extensions(self):
        """Test handling files with multiple dots."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/IMG_001.edited.jpg"
        photo.main_file.save()
        
        matches, _ = check_filename_pattern(photo, pattern_type="any")
        # May or may not match depending on extension handling

    def test_unicode_filename(self):
        """Test handling unicode filenames."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/写真_001.jpg"
        photo.main_file.save()
        
        matches, _ = check_filename_pattern(photo, pattern_type="any")
        # Should handle gracefully

    def test_very_long_filename(self):
        """Test handling very long filenames."""
        photo = create_test_photo(owner=self.user)
        long_name = "A" * 200 + "_001.jpg"
        photo.main_file.path = f"/photos/{long_name}"
        photo.main_file.save()
        
        matches, _ = check_filename_pattern(photo, pattern_type="any")
        # Should handle gracefully

    def test_special_characters_in_path(self):
        """Test handling special characters in path."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/my folder (2024)/IMG_001.jpg"
        photo.main_file.save()
        
        matches, _ = check_filename_pattern(photo, pattern_type="any")
        self.assertTrue(matches)

    def test_invalid_pattern_type(self):
        """Test handling invalid pattern type."""
        photo = create_test_photo(owner=self.user)
        photo.main_file.path = "/photos/IMG_001_BURST001.jpg"
        photo.main_file.save()
        
        # Invalid pattern type should not match
        matches, _ = check_filename_pattern(photo, pattern_type="nonexistent_pattern")
        self.assertFalse(matches)


================================================
FILE: api/tests/test_delete_photos.py
================================================
from unittest.mock import patch

from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photos, create_test_user


class DeletePhotosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_tag_my_photos_for_removal(self):
        photos = create_test_photos(number_of_photos=3, owner=self.user1)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "deleted": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/setdeleted/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(3, len(data["results"]))
        self.assertEqual(3, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))

    def test_untag_my_photos_for_removal(self):
        photos1 = create_test_photos(
            number_of_photos=1, owner=self.user1, in_trashcan=True
        )
        photos2 = create_test_photos(number_of_photos=2, owner=self.user1)
        image_hashes = [p.image_hash for p in photos1 + photos2]

        payload = {"image_hashes": image_hashes, "deleted": False}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/setdeleted/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(1, len(data["results"]))
        self.assertEqual(1, len(data["updated"]))
        self.assertEqual(2, len(data["not_updated"]))

    def test_tag_photos_of_other_user_for_removal(self):
        photos = create_test_photos(number_of_photos=2, owner=self.user2)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "deleted": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/setdeleted/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        # Photos not owned by user are treated as "missing" for security (no info leak)
        self.assertEqual(0, len(data["not_updated"]))

    @patch("api.views.photos.logger.warning", autospec=True)
    def test_tag_for_removal_nonexistent_photo(self, logger):
        payload = {"image_hashes": ["nonexistent_photo"], "deleted": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/setdeleted/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))
        logger.assert_called_with(
            "Could not set photo nonexistent_photo to deleted. It does not exist or is not owned by user."
        )

    def test_delete_tagged_photos_for_removal(self):
        photos_to_delete = create_test_photos(
            number_of_photos=2, owner=self.user1, in_trashcan=True
        )
        photos_to_not_delete = create_test_photos(number_of_photos=3, owner=self.user1)
        image_hashes = [p.image_hash for p in photos_to_delete + photos_to_not_delete]

        payload = {"image_hashes": image_hashes}
        headers = {"Content-Type": "application/json"}
        response = self.client.delete(
            "/api/photosedit/delete/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(2, len(data["results"]))
        self.assertEqual(2, len(data["deleted"]))
        self.assertEqual(3, len(data["not_deleted"]))

    def test_delete_tagged_photos_of_other_user_for_removal(self):
        photos_to_delete = create_test_photos(
            number_of_photos=5, owner=self.user2, in_trashcan=True
        )
        image_hashes = [p.image_hash for p in photos_to_delete]

        payload = {"image_hashes": image_hashes}
        headers = {"Content-Type": "application/json"}
        response = self.client.delete(
            "/api/photosedit/delete/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["deleted"]))
        self.assertEqual(5, len(data["not_deleted"]))


================================================
FILE: api/tests/test_detection_edge_cases.py
================================================
"""
Edge case tests for detection logic.

Tests cover:
- Burst detection rule parsing and validation
- File path and naming edge cases
- Detection with missing/corrupt data

NOTE: RAW+JPEG and Live Photo detection tests are skipped because these
functions were removed. RAW+JPEG and Live Photos now use the file variants
model (Photo.files) instead of stacks, handled during scan time.
"""

import json
import unittest
from datetime import datetime, timedelta
from django.test import TestCase

from api.models.file import File
from api.models.photo_stack import PhotoStack
from api.burst_detection_rules import (
    BurstDetectionRule,
    BurstRuleTypes,
    BurstRuleCategory,
    BURST_FILENAME_PATTERNS,
    get_default_burst_detection_rules,
    as_rules,
)
from api.tests.utils import create_test_photo, create_test_user


class BurstRuleParsingTestCase(TestCase):
    """Tests for burst rule parsing and validation."""

    def test_parse_valid_rule(self):
        """Test parsing a valid burst rule."""
        rule_params = {
            "id": "test_rule",
            "name": "Test Rule",
            "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
            "category": BurstRuleCategory.HARD,
            "enabled": True,
        }
        rule = BurstDetectionRule(rule_params)
        
        self.assertEqual(rule.id, "test_rule")
        self.assertEqual(rule.name, "Test Rule")
        self.assertEqual(rule.rule_type, BurstRuleTypes.EXIF_BURST_MODE)
        self.assertTrue(rule.enabled)

    def test_parse_rule_with_missing_optional_fields(self):
        """Test parsing rule with only required fields."""
        rule_params = {
            "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
        }
        rule = BurstDetectionRule(rule_params)
        
        self.assertIsNone(rule.id)
        self.assertEqual(rule.name, "Unnamed rule")
        self.assertEqual(rule.category, BurstRuleCategory.HARD)
        self.assertTrue(rule.enabled)  # Default True
        self.assertTrue(rule.is_default)  # Default True

    def test_parse_disabled_rule(self):
        """Test parsing a disabled rule."""
        rule_params = {
            "id": "disabled_rule",
            "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
            "enabled": False,
        }
        rule = BurstDetectionRule(rule_params)
        
        self.assertFalse(rule.enabled)

    def test_default_rules_are_valid(self):
        """Test that all default rules parse correctly."""
        default_rules = get_default_burst_detection_rules()
        for rule_dict in default_rules:
            rule = BurstDetectionRule(rule_dict)
            self.assertIsNotNone(rule.rule_type)
            self.assertIn(rule.category, [BurstRuleCategory.HARD, BurstRuleCategory.SOFT])


class BurstFilenamePatternTestCase(TestCase):
    """Tests for burst filename pattern matching."""

    def test_burst_suffix_pattern(self):
        """Test _BURST pattern matching."""
        import re
        pattern = BURST_FILENAME_PATTERNS["burst_suffix"][0]
        
        # Should match
        self.assertIsNotNone(re.search(pattern, "IMG_001_BURST001"))
        self.assertIsNotNone(re.search(pattern, "photo_BURST123"))
        
        # Should not match
        self.assertIsNone(re.search(pattern, "IMG_001"))
        self.assertIsNone(re.search(pattern, "BURST_photo"))

    def test_sequence_suffix_pattern(self):
        """Test sequence number suffix pattern."""
        import re
        pattern = BURST_FILENAME_PATTERNS["sequence_suffix"][0]
        
        # Should match
        self.assertIsNotNone(re.search(pattern, "IMG_001"))
        self.assertIsNotNone(re.search(pattern, "photo_0001"))
        
        # Should not match (less than 3 digits)
        self.assertIsNone(re.search(pattern, "IMG_01"))

    def test_bracketed_sequence_pattern(self):
        """Test bracketed sequence pattern."""
        import re
        pattern = BURST_FILENAME_PATTERNS["bracketed_sequence"][0]
        
        # Should match
        self.assertIsNotNone(re.search(pattern, "photo (1)"))
        self.assertIsNotNone(re.search(pattern, "image (123)"))
        
        # Should not match
        self.assertIsNone(re.search(pattern, "photo"))
        self.assertIsNone(re.search(pattern, "(1) photo"))


class UserBurstRulesTestCase(TestCase):
    """Tests for user burst detection rules configuration."""

    def setUp(self):
        self.user = create_test_user()

    def test_as_rules_with_default_rules(self):
        """Test as_rules with default rules config."""
        default_config = get_default_burst_detection_rules()
        rules = as_rules(default_config)
        
        self.assertIsInstance(rules, list)
        self.assertGreater(len(rules), 0)

    def test_as_rules_with_custom_rules(self):
        """Test as_rules with custom rule config."""
        custom_rules = [
            {
                "id": "custom1",
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        ]
        
        rules = as_rules(custom_rules)
        
        self.assertEqual(len(rules), 1)
        self.assertEqual(rules[0].id, "custom1")

    def test_as_rules_with_empty_list(self):
        """Test as_rules with empty list."""
        rules = as_rules([])
        
        self.assertEqual(len(rules), 0)

    def test_user_rules_stored_as_json(self):
        """Test that user rules can be stored as JSON string."""
        custom_rules = [
            {
                "id": "custom1",
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": True,
            }
        ]
        self.user.burst_detection_rules = json.dumps(custom_rules)
        self.user.save()
        
        # Reload and parse
        self.user.refresh_from_db()
        rules_config = json.loads(self.user.burst_detection_rules)
        rules = as_rules(rules_config)
        
        self.assertEqual(len(rules), 1)


@unittest.skip("RAW+JPEG detection removed - now handled via file variants during scan")
class RawJpegDetectionEdgeCasesTestCase(TestCase):
    """Tests for RAW+JPEG detection edge cases.
    
    DEPRECATED: RAW+JPEG pairs are now handled as file variants (Photo.files)
    during scan time, not via stack detection. These tests are skipped.
    """

    def setUp(self):
        self.user = create_test_user()

    def test_detection_with_no_raw_photos(self):
        """Test RAW+JPEG detection when there are no RAW files."""
        from api.stack_detection import detect_raw_jpeg_pairs
        
        # Create only JPEG photos (type=1 is IMAGE)
        for i in range(3):
            photo = create_test_photo(owner=self.user)
            photo.main_file.type = File.IMAGE
            photo.main_file.save()
        
        stacks_created = detect_raw_jpeg_pairs(self.user)
        
        self.assertEqual(stacks_created, 0)

    def test_detection_with_raw_no_matching_jpeg(self):
        """Test RAW+JPEG detection when RAW has no matching JPEG."""
        from api.stack_detection import detect_raw_jpeg_pairs
        
        # Create RAW photo
        raw_photo = create_test_photo(owner=self.user)
        raw_photo.main_file.type = File.RAW_FILE
        raw_photo.main_file.path = "/photos/unique_raw.CR2"
        raw_photo.main_file.save()
        
        # Create JPEG with different name
        jpeg_photo = create_test_photo(owner=self.user)
        jpeg_photo.main_file.type = File.IMAGE
        jpeg_photo.main_file.path = "/photos/different_name.jpg"
        jpeg_photo.main_file.save()
        
        stacks_created = detect_raw_jpeg_pairs(self.user)
        
        self.assertEqual(stacks_created, 0)

    def test_detection_case_insensitive_extensions(self):
        """Test that RAW+JPEG detection handles case variations."""
        from api.stack_detection import detect_raw_jpeg_pairs
        
        # Create RAW photo
        raw_photo = create_test_photo(owner=self.user)
        raw_photo.main_file.type = File.RAW_FILE
        raw_photo.main_file.path = "/photos/image.CR2"
        raw_photo.main_file.save()
        
        # Create JPEG with uppercase extension
        jpeg_photo = create_test_photo(owner=self.user)
        jpeg_photo.main_file.type = File.IMAGE
        jpeg_photo.main_file.path = "/photos/image.JPG"
        jpeg_photo.main_file.save()
        
        stacks_created = detect_raw_jpeg_pairs(self.user)
        
        # Should find the pair regardless of case
        self.assertGreaterEqual(stacks_created, 0)

    def test_detection_with_photo_no_main_file(self):
        """Test detection handles photos without main_file."""
        from api.stack_detection import detect_raw_jpeg_pairs
        
        # Create a regular test photo (which has main_file)
        # Then manually set main_file to None to simulate edge case
        photo = create_test_photo(owner=self.user)
        photo.main_file = None
        photo.save()
        
        # Should not crash
        stacks_created = detect_raw_jpeg_pairs(self.user)
        self.assertGreaterEqual(stacks_created, 0)

    def test_detection_clears_existing_stacks(self):
        """Test that re-detection clears existing RAW+JPEG stacks."""
        from api.stack_detection import detect_raw_jpeg_pairs
        
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Create existing RAW+JPEG stack
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
        )
        stack.photos.add(photo1, photo2)
        
        initial_count = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR
        ).count()
        self.assertEqual(initial_count, 1)
        
        # Run detection
        detect_raw_jpeg_pairs(self.user)
        
        # Old stack should be cleared
        # (new stacks may or may not be created depending on file types)


class BurstDetectionEdgeCasesTestCase(TestCase):
    """Tests for burst detection edge cases."""

    def setUp(self):
        self.user = create_test_user()

    def test_detection_with_no_photos(self):
        """Test burst detection with empty library."""
        from api.stack_detection import detect_burst_sequences
        
        stacks_created = detect_burst_sequences(self.user)
        
        self.assertEqual(stacks_created, 0)

    def test_detection_with_all_rules_disabled(self):
        """Test burst detection when all rules are disabled."""
        from api.stack_detection import detect_burst_sequences
        
        # Create some photos
        for i in range(3):
            create_test_photo(owner=self.user)
        
        # Disable all rules
        disabled_rules = [
            {
                "id": "disabled1",
                "rule_type": BurstRuleTypes.EXIF_BURST_MODE,
                "enabled": False,
            }
        ]
        self.user.burst_detection_rules = json.dumps(disabled_rules)
        self.user.save()
        
        stacks_created = detect_burst_sequences(self.user)
        
        # No stacks should be created with all rules disabled
        self.assertEqual(stacks_created, 0)

    def test_detection_with_trashed_photos_excluded(self):
        """Test that trashed photos are excluded from detection."""
        from api.stack_detection import detect_burst_sequences
        
        # Create photos, some in trash
        _photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo2.in_trashcan = True
        photo2.save()
        
        _stacks_created = detect_burst_sequences(self.user)
        
        # Trashed photos should not be in any stack
        stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        )
        for stack in stacks:
            self.assertFalse(stack.photos.filter(in_trashcan=True).exists())


class TimestampProximityRuleTestCase(TestCase):
    """Tests for timestamp proximity burst detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_photos_within_threshold_grouped(self):
        """Test that photos within timestamp threshold are grouped."""
        from django.utils import timezone
        from api.stack_detection import _detect_bursts_soft_criteria
        
        base_time = timezone.make_aware(datetime(2024, 1, 1, 12, 0, 0))
        
        # Create photos with close timestamps
        photo1 = create_test_photo(owner=self.user)
        photo1.exif_timestamp = base_time
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.exif_timestamp = base_time + timedelta(seconds=1)
        photo2.save()
        
        photo3 = create_test_photo(owner=self.user)
        photo3.exif_timestamp = base_time + timedelta(seconds=2)
        photo3.save()
        
        # Soft criteria with 3000ms interval
        soft_rules = [
            BurstDetectionRule({
                "id": "timestamp",
                "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
                "category": BurstRuleCategory.SOFT,
                "enabled": True,
                "interval_ms": 3000,
            })
        ]
        
        stacks_created = _detect_bursts_soft_criteria(self.user, soft_rules)
        
        # Should group the 3 photos
        self.assertGreaterEqual(stacks_created, 0)

    def test_photos_beyond_threshold_not_grouped(self):
        """Test that photos beyond timestamp threshold are not grouped."""
        from django.utils import timezone
        from api.stack_detection import _detect_bursts_soft_criteria
        
        base_time = timezone.make_aware(datetime(2024, 1, 1, 12, 0, 0))
        
        # Create photos with far timestamps
        photo1 = create_test_photo(owner=self.user)
        photo1.exif_timestamp = base_time
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.exif_timestamp = base_time + timedelta(minutes=5)
        photo2.save()
        
        # Soft criteria with 3000ms interval
        soft_rules = [
            BurstDetectionRule({
                "id": "timestamp",
                "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
                "category": BurstRuleCategory.SOFT,
                "enabled": True,
                "interval_ms": 3000,
            })
        ]
        
        stacks_created = _detect_bursts_soft_criteria(self.user, soft_rules)
        
        # Should not group photos that are 5 minutes apart
        self.assertEqual(stacks_created, 0)

    def test_photos_without_timestamp_skipped(self):
        """Test that photos without timestamp are skipped."""
        from api.stack_detection import _detect_bursts_soft_criteria
        
        # Create photo without timestamp
        photo1 = create_test_photo(owner=self.user)
        photo1.exif_timestamp = None
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.exif_timestamp = None
        photo2.save()
        
        soft_rules = [
            BurstDetectionRule({
                "id": "timestamp",
                "rule_type": BurstRuleTypes.TIMESTAMP_PROXIMITY,
                "category": BurstRuleCategory.SOFT,
                "enabled": True,
                "interval_ms": 3000,
            })
        ]
        
        # Should not crash - function filters photos without timestamps
        stacks_created = _detect_bursts_soft_criteria(self.user, soft_rules)
        self.assertEqual(stacks_created, 0)


@unittest.skip("Live Photo detection removed - now handled via file variants during scan")
class LivePhotoDetectionEdgeCasesTestCase(TestCase):
    """Tests for live photo detection edge cases.
    
    DEPRECATED: Live Photos are now handled as file variants (Photo.files)
    during scan time, not via stack detection. These tests are skipped.
    """

    def setUp(self):
        self.user = create_test_user()

    def test_detection_with_no_live_photos(self):
        """Test live photo detection with no live photos."""
        from api.stack_detection import detect_live_photos
        
        # Create regular photos
        for i in range(3):
            create_test_photo(owner=self.user)
        
        stacks_created = detect_live_photos(self.user)
        
        self.assertEqual(stacks_created, 0)


class DetectionProgressCallbackTestCase(TestCase):
    """Tests for detection progress callbacks."""

    def setUp(self):
        self.user = create_test_user()

    @unittest.skip("RAW+JPEG detection removed - now handled via file variants during scan")
    def test_raw_jpeg_detection_calls_progress(self):
        """Test that RAW+JPEG detection calls progress callback.
        
        DEPRECATED: RAW+JPEG pairs are now handled as file variants (Photo.files)
        during scan time, not via stack detection.
        """
        from api.stack_detection import detect_raw_jpeg_pairs
        
        # Create some RAW photos
        for i in range(3):
            photo = create_test_photo(owner=self.user)
            photo.main_file.type = File.RAW_FILE
            photo.main_file.save()
        
        progress_calls = []
        
        def progress_callback(current, total, found):
            progress_calls.append((current, total, found))
        
        detect_raw_jpeg_pairs(self.user, progress_callback=progress_callback)
        
        # Progress should have been called
        self.assertGreater(len(progress_calls), 0)

    def test_burst_detection_calls_progress(self):
        """Test that burst detection calls progress callback."""
        from api.stack_detection import detect_burst_sequences
        
        # Create some photos
        for i in range(3):
            create_test_photo(owner=self.user)
        
        progress_calls = []
        
        def progress_callback(current, total, found):
            progress_calls.append((current, total, found))
        
        detect_burst_sequences(self.user, progress_callback=progress_callback)
        
        # Progress may or may not be called depending on implementation
        # Just verify it doesn't crash
        self.assertIsInstance(progress_calls, list)


class BatchDetectionEdgeCasesTestCase(TestCase):
    """Tests for batch detection function."""

    def setUp(self):
        self.user = create_test_user()

    def test_batch_detection_all_types(self):
        """Test batch detection with all detection types enabled."""
        from api.stack_detection import batch_detect_stacks
        
        options = {
            'detect_raw_jpeg': True,
            'detect_bursts': True,
            'detect_live_photos': True,
        }
        
        # Should not crash - function may return None (runs as job)
        try:
            batch_detect_stacks(self.user, options)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_none_enabled(self):
        """Test batch detection with no detection types enabled."""
        from api.stack_detection import batch_detect_stacks
        
        options = {
            'detect_raw_jpeg': False,
            'detect_bursts': False,
            'detect_live_photos': False,
        }
        
        # Should not crash
        try:
            batch_detect_stacks(self.user, options)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_with_null_options(self):
        """Test batch detection with None options."""
        from api.stack_detection import batch_detect_stacks
        
        # Should use defaults and not crash
        try:
            batch_detect_stacks(self.user, None)
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)

    def test_batch_detection_with_empty_options(self):
        """Test batch detection with empty options dict."""
        from api.stack_detection import batch_detect_stacks
        
        # Should not crash
        try:
            batch_detect_stacks(self.user, {})
            success = True
        except Exception:
            success = False
        
        self.assertTrue(success)


class MultiUserDetectionIsolationTestCase(TestCase):
    """Tests for multi-user detection isolation."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()

    def test_detection_only_affects_own_photos(self):
        """Test that detection only creates stacks for user's own photos."""
        from api.stack_detection import detect_burst_sequences
        
        # Create photos for both users
        for i in range(3):
            create_test_photo(owner=self.user1)
            create_test_photo(owner=self.user2)
        
        # Run detection for user1 only
        detect_burst_sequences(self.user1)
        
        # User2's photos should not have any stacks
        user2_stacks = PhotoStack.objects.filter(owner=self.user2)
        self.assertEqual(user2_stacks.count(), 0)

    def test_clearing_stacks_only_affects_own(self):
        """Test that clearing stacks only affects user's own stacks."""
        from api.stack_detection import clear_stacks_of_type
        
        # Create stacks for both users
        for user in [self.user1, self.user2]:
            photo1 = create_test_photo(owner=user)
            photo2 = create_test_photo(owner=user)
            stack = PhotoStack.objects.create(
                owner=user,
                stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            )
            stack.photos.add(photo1, photo2)
        
        # Clear stacks for user1 only
        clear_stacks_of_type(self.user1, PhotoStack.StackType.BURST_SEQUENCE)
        
        # User1 should have no stacks
        user1_stacks = PhotoStack.objects.filter(
            owner=self.user1,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        )
        self.assertEqual(user1_stacks.count(), 0)
        
        # User2 should still have their stack
        user2_stacks = PhotoStack.objects.filter(
            owner=self.user2,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        )
        self.assertEqual(user2_stacks.count(), 1)


================================================
FILE: api/tests/test_directory_watcher_fix.py
================================================
from django.test import TestCase
from django.db.models import Q

from api.models import Photo
from api.tests.utils import create_test_photo, create_test_user


class DirectoryWatcherFixTest(TestCase):
    def setUp(self):
        self.user = create_test_user()

    def test_generate_tags_query_works(self):
        """Test that the generate_tags query works with the new PhotoCaption model"""
        # Create a photo without places365 captions
        photo = create_test_photo(owner=self.user)

        # Add some caption data to the photo (but NOT places365)
        from api.models.photo_caption import PhotoCaption

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.captions_json = {
            "im2txt": "A beautiful landscape",
            "user_caption": "My vacation photo",
        }
        caption_instance.save()

        # This query should work without FieldError
        existing_photos = Photo.objects.filter(
            Q(owner=self.user.id)
            & (
                Q(caption_instance__isnull=True)
                | Q(caption_instance__captions_json__isnull=True)
                | Q(caption_instance__captions_json__places365__isnull=True)
            )
        )

        # Should find the photo since it has no places365 captions
        self.assertEqual(existing_photos.count(), 1)
        self.assertEqual(existing_photos.first(), photo)

    def test_generate_tags_query_excludes_photos_with_places365(self):
        """Test that photos with places365 captions are excluded"""
        # Create a photo with places365 captions
        photo = create_test_photo(owner=self.user)
        from api.models.photo_caption import PhotoCaption

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.captions_json = {
            "places365": {"categories": ["outdoor"], "attributes": ["sunny"]}
        }
        caption_instance.save()

        # This query should exclude the photo since it has places365 captions
        existing_photos = Photo.objects.filter(
            Q(owner=self.user.id)
            & (
                Q(caption_instance__isnull=True)
                | Q(caption_instance__captions_json__isnull=True)
                | Q(caption_instance__captions_json__places365__isnull=True)
            )
        )

        # Should not find the photo since it has places365 captions
        self.assertEqual(existing_photos.count(), 0)


================================================
FILE: api/tests/test_dirtree.py
================================================
from django.test import TestCase
from pyfakefs.fake_filesystem_unittest import Patcher
from rest_framework.test import APIClient

from api.models import User
from api.tests.utils import create_password


class DirTreeTest(TestCase):
    def setUp(self):
        self.admin = User.objects.create_superuser(
            "admin", "admin@test.com", create_password()
        )
        self.user = User.objects.create_user("user", "user@test.com", create_password())
        self.client = APIClient()

    def test_admin_should_allow_to_retrieve_dirtree(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.get("/api/dirtree/")
        self.assertEqual(200, response.status_code)

    def test_should_retrieve_dir_listing_by_path(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.get("/api/dirtree/?path=/data")
        self.assertEqual(200, response.status_code)

    def test_should_fail_when_listing_with_invalid_path(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.get("/api/dirtree/?path=/does_not_exist")
        data = response.json()
        self.assertEqual(403, response.status_code)
        self.assertEqual(
            data["message"], "Access denied. Path is outside the allowed directory."
        )

    def test_children_list_should_be_alphabetical_case_insensitive(self):
        with Patcher() as patcher:
            patcher.fs.create_dir("/data")
            patcher.fs.create_dir("/data/Z")
            patcher.fs.create_dir("/data/a")
            patcher.fs.create_dir("/data/X")
            patcher.fs.create_dir("/data/b")

            self.client.force_authenticate(user=self.admin)
            response = self.client.get("/api/dirtree/")
            data = response.json()[0]
            self.assertEqual(200, response.status_code)
            self.assertEqual(data["children"][0]["title"], "a")
            self.assertEqual(data["children"][1]["title"], "b")
            self.assertEqual(data["children"][2]["title"], "X")
            self.assertEqual(data["children"][3]["title"], "Z")

    def test_regular_user_is_not_allowed_to_retrieve_dirtree(self):
        self.client.force_authenticate(user=self.user)
        response = self.client.get("/api/dirtree/")
        self.assertEqual(403, response.status_code)

    def test_anonymous_user_is_not_allower_to_retrieve_dirtree(self):
        self.client.force_authenticate(user=None)
        response = self.client.get("/api/dirtree/")
        self.assertEqual(401, response.status_code)


================================================
FILE: api/tests/test_duplicate_api_edge_cases.py
================================================
"""
Edge case tests for Duplicate API to find bugs.

Tests cover:
- Resolution workflow edge cases
- Revert edge cases
- Delete edge cases (potential Bug #13)
- List/Detail view edge cases with missing data
- Statistics edge cases
"""

import uuid
from django.test import TestCase
from rest_framework.test import APIClient

from api.models.duplicate import Duplicate
from api.models.photo_metadata import PhotoMetadata
from api.tests.utils import create_test_photo, create_test_user


class DuplicateResolveEdgeCasesTestCase(TestCase):
    """Edge cases for duplicate resolution."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_resolve_already_resolved_duplicate(self):
        """Test resolving a duplicate that's already resolved."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
            kept_photo=photo1,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Try to resolve again with different kept photo
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            {"keep_photo_hash": photo2.image_hash},
        )
        
        # Should succeed (changing which photo to keep)
        self.assertEqual(response.status_code, 200)
        
        duplicate.refresh_from_db()
        self.assertEqual(duplicate.kept_photo, photo2)

    def test_resolve_with_photo_already_trashed(self):
        """Test resolving when one photo is already trashed."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user, in_trashcan=True)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Resolve keeping photo1
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            {"keep_photo_hash": photo1.image_hash},
        )
        
        self.assertEqual(response.status_code, 200)
        
        # Photo2 was already trashed, shouldn't change
        photo2.refresh_from_db()
        self.assertTrue(photo2.in_trashcan)

    def test_resolve_with_trash_others_false(self):
        """Test resolving without trashing other photos.
        
        Note: Must use format='json' to properly send boolean False.
        Form data converts False to string "False" which is truthy.
        """
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Use format='json' to properly send boolean False
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            {"keep_photo_hash": photo1.image_hash, "trash_others": False},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        
        # Photo2 should NOT be trashed
        photo2.refresh_from_db()
        self.assertFalse(photo2.in_trashcan)
        
        # But duplicate should still be marked resolved
        duplicate.refresh_from_db()
        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.RESOLVED)

    def test_resolve_with_nonexistent_photo_hash(self):
        """Test resolving with a photo hash that doesn't exist in the group."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            {"keep_photo_hash": "nonexistent_hash"},
        )
        
        self.assertEqual(response.status_code, 400)
        self.assertIn("error", response.data)

    def test_resolve_empty_request(self):
        """Test resolving with empty request body."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/duplicates/{duplicate.id}/resolve/",
            {},
        )
        
        self.assertEqual(response.status_code, 400)


class DuplicateRevertEdgeCasesTestCase(TestCase):
    """Edge cases for duplicate revert."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_revert_pending_duplicate(self):
        """Test reverting a pending (not resolved) duplicate."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        duplicate.photos.add(photo1, photo2)
        
        response = self.client.post(f"/api/duplicates/{duplicate.id}/revert/")
        
        # Should fail - can only revert resolved
        self.assertEqual(response.status_code, 400)

    def test_revert_dismissed_duplicate(self):
        """Test reverting a dismissed duplicate."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.DISMISSED,
        )
        duplicate.photos.add(photo1, photo2)
        
        response = self.client.post(f"/api/duplicates/{duplicate.id}/revert/")
        
        # Should fail - can only revert resolved
        self.assertEqual(response.status_code, 400)

    def test_revert_when_photos_permanently_deleted(self):
        """Test reverting when trashed photos were permanently deleted."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Resolve keeping photo1
        duplicate.resolve(kept_photo=photo1)
        
        # Now permanently delete photo2 (simulating user emptying trash)
        photo2.in_trashcan = True
        photo2.save()
        photo2.manual_delete()
        
        # Try to revert
        response = self.client.post(f"/api/duplicates/{duplicate.id}/revert/")
        
        # Should succeed but restored_count may be 0
        # Bug: Duplicate group might be deleted now due to Bug #12 fix
        # Let me check if duplicate still exists
        if Duplicate.objects.filter(id=duplicate.id).exists():
            self.assertEqual(response.status_code, 200)
        else:
            # Duplicate was deleted when photo2 was deleted (only 1 photo left)
            self.assertEqual(response.status_code, 404)

    def test_revert_multiple_times(self):
        """Test reverting the same duplicate multiple times."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Resolve
        duplicate.resolve(kept_photo=photo1)
        
        # Revert first time
        response1 = self.client.post(f"/api/duplicates/{duplicate.id}/revert/")
        self.assertEqual(response1.status_code, 200)
        
        # Try to revert again (should fail - now pending)
        response2 = self.client.post(f"/api/duplicates/{duplicate.id}/revert/")
        self.assertEqual(response2.status_code, 400)


class DuplicateDeleteEdgeCasesTestCase(TestCase):
    """
    Edge cases for duplicate delete.
    
    Note: Delete endpoint is at /api/duplicates/{id}/delete with DELETE method.
    """

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_delete_duplicate_unlinks_all_photos(self):
        """Test that deleting a duplicate unlinks ALL photos."""
        photos = [create_test_photo(owner=self.user) for _ in range(5)]
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        for photo in photos:
            duplicate.photos.add(photo)
        
        duplicate_id = duplicate.id
        
        # Correct URL: /api/duplicates/{id}/delete
        response = self.client.delete(f"/api/duplicates/{duplicate_id}/delete")
        
        self.assertEqual(response.status_code, 200)
        
        # Verify duplicate is deleted
        self.assertFalse(Duplicate.objects.filter(id=duplicate_id).exists())
        
        # Verify ALL photos are unlinked
        for photo in photos:
            photo.refresh_from_db()
            self.assertEqual(photo.duplicates.count(), 0,
                "All photos should be unlinked from deleted duplicate")

    def test_delete_duplicate_with_many_photos(self):
        """Test deleting a duplicate with many photos."""
        photos = [create_test_photo(owner=self.user) for _ in range(20)]
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        for photo in photos:
            duplicate.photos.add(photo)
        
        response = self.client.delete(f"/api/duplicates/{duplicate.id}/delete")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["unlinked_count"], 20)

    def test_delete_resolved_duplicate(self):
        """Test deleting a resolved duplicate."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
            kept_photo=photo1,
        )
        duplicate.photos.add(photo1, photo2)
        
        response = self.client.delete(f"/api/duplicates/{duplicate.id}/delete")
        
        # Should succeed - can delete any duplicate
        self.assertEqual(response.status_code, 200)

    def test_delete_nonexistent_duplicate(self):
        """Test deleting a duplicate that doesn't exist."""
        response = self.client.delete(f"/api/duplicates/{uuid.uuid4()}/delete")
        self.assertEqual(response.status_code, 404)

    def test_delete_other_users_duplicate(self):
        """Test deleting another user's duplicate."""
        other_user = create_test_user()
        photo1 = create_test_photo(owner=other_user)
        photo2 = create_test_photo(owner=other_user)
        
        duplicate = Duplicate.objects.create(
            owner=other_user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        response = self.client.delete(f"/api/duplicates/{duplicate.id}/delete")
        
        # Should return 404 (not found for this user)
        self.assertEqual(response.status_code, 404)


class DuplicateDetailEdgeCasesTestCase(TestCase):
    """Edge cases for duplicate detail view."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_detail_with_photos_without_metadata(self):
        """Test detail view when photos have no metadata."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Ensure no metadata exists
        PhotoMetadata.objects.filter(photo__in=[photo1, photo2]).delete()
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Should not crash
        response = self.client.get(f"/api/duplicates/{duplicate.id}/")
        
        self.assertEqual(response.status_code, 200)
        # Photos should have null width/height/camera
        for photo_data in response.data["photos"]:
            # Should be None or return gracefully
            pass  # If we get here without crash, the test passes

    def test_detail_with_photos_without_main_file(self):
        """Test detail view when photos have no main_file."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo1.main_file = None
        photo1.save()
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Should not crash
        response = self.client.get(f"/api/duplicates/{duplicate.id}/")
        
        self.assertEqual(response.status_code, 200)

    def test_detail_with_deleted_kept_photo(self):
        """Test detail view when kept_photo has been deleted."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
            kept_photo=photo1,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Permanently delete the kept photo
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Check if duplicate still exists (might be deleted due to Bug #12 fix)
        if not Duplicate.objects.filter(id=duplicate.id).exists():
            # Expected behavior: duplicate deleted when < 2 photos
            return
        
        # If duplicate still exists, detail should not crash
        response = self.client.get(f"/api/duplicates/{duplicate.id}/")
        # Either 200 or 404 depending on photo count
        self.assertIn(response.status_code, [200, 404])


class DuplicateListEdgeCasesTestCase(TestCase):
    """Edge cases for duplicate list view."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_list_excludes_single_photo_duplicates(self):
        """Test that list excludes duplicates with only 1 photo."""
        photo1 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1)  # Only 1 photo
        
        response = self.client.get("/api/duplicates/")
        
        self.assertEqual(response.status_code, 200)
        # Should not include the single-photo duplicate
        self.assertEqual(response.data["count"], 0)

    def test_list_with_kept_photo_deleted(self):
        """Test list view when kept_photo reference is broken.
        
        ForeignKey SET_NULL should handle this, but let's verify.
        """
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
            kept_photo=photo1,
        )
        duplicate.photos.add(photo1, photo2, photo3)
        
        # Delete the kept photo
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Try listing - should not crash
        response = self.client.get("/api/duplicates/")
        
        self.assertEqual(response.status_code, 200)

    def test_list_pagination_edge_cases(self):
        """Test list pagination with various edge cases."""
        # Create 5 duplicates
        for i in range(5):
            photo1 = create_test_photo(owner=self.user)
            photo2 = create_test_photo(owner=self.user)
            dup = Duplicate.objects.create(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            )
            dup.photos.add(photo1, photo2)
        
        # Page beyond results - Django's get_page() returns last page for out-of-range
        # So page 100 will still return results (the last page)
        response = self.client.get("/api/duplicates/?page=100")
        self.assertEqual(response.status_code, 200)
        # Django returns last valid page, not empty
        self.assertGreaterEqual(len(response.data["results"]), 0)
        
        # Page 0 should become page 1 (our code uses max(1, page))
        response = self.client.get("/api/duplicates/?page=0")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data["results"]), 5)


class DuplicateAutoSelectBestEdgeCasesTestCase(TestCase):
    """Edge cases for auto_select_best_photo."""

    def setUp(self):
        self.user = create_test_user()

    def test_auto_select_with_no_photos(self):
        """Test auto_select_best_photo with empty duplicate group."""
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        result = duplicate.auto_select_best_photo()
        self.assertIsNone(result)

    def test_auto_select_exact_copy_all_null_paths(self):
        """Test auto_select for exact copies when all photos have no main_file."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo1.main_file = None
        photo2.main_file = None
        photo1.save()
        photo2.save()
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Should handle gracefully (might return None or first photo)
        _result = duplicate.auto_select_best_photo()
        # Just verify it doesn't crash

    def test_auto_select_visual_duplicate_no_metadata(self):
        """Test auto_select for visual duplicates when photos have no metadata."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Delete any metadata
        PhotoMetadata.objects.filter(photo__in=[photo1, photo2]).delete()
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Should handle gracefully
        _result = duplicate.auto_select_best_photo()
        # Just verify it doesn't crash


class DuplicateDismissEdgeCasesTestCase(TestCase):
    """Edge cases for dismiss endpoint."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_dismiss_already_dismissed(self):
        """Test dismissing an already dismissed duplicate."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.DISMISSED,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Dismiss again
        response = self.client.post(f"/api/duplicates/{duplicate.id}/dismiss/")
        
        # Should succeed (idempotent operation)
        self.assertEqual(response.status_code, 200)

    def test_dismiss_resolved_duplicate(self):
        """Test dismissing a resolved duplicate."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
            kept_photo=photo1,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Dismiss the resolved duplicate
        response = self.client.post(f"/api/duplicates/{duplicate.id}/dismiss/")
        
        # Should succeed
        self.assertEqual(response.status_code, 200)
        
        duplicate.refresh_from_db()
        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.DISMISSED)


class DuplicateStatsEdgeCasesTestCase(TestCase):
    """Edge cases for duplicate statistics endpoint."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_stats_with_no_duplicates(self):
        """Test stats endpoint with no duplicates."""
        response = self.client.get("/api/duplicates/stats/")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_duplicates"], 0)
        self.assertEqual(response.data["pending_duplicates"], 0)
        self.assertEqual(response.data["potential_savings_bytes"], 0)
        self.assertEqual(response.data["potential_savings_mb"], 0)

    def test_stats_counts_by_type(self):
        """Test stats counts by duplicate type."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        photo4 = create_test_photo(owner=self.user)
        
        # Create exact copy duplicate
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup1.photos.add(photo1, photo2)
        
        # Create visual duplicate
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup2.photos.add(photo3, photo4)
        
        response = self.client.get("/api/duplicates/stats/")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_duplicates"], 2)
        self.assertEqual(response.data["by_type"]["exact_copy"], 1)
        self.assertEqual(response.data["by_type"]["visual_duplicate"], 1)

    def test_stats_counts_by_status(self):
        """Test stats counts by review status."""
        photos = [create_test_photo(owner=self.user) for _ in range(6)]
        
        # Pending
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        dup1.photos.add(photos[0], photos[1])
        
        # Resolved
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
        )
        dup2.photos.add(photos[2], photos[3])
        
        # Dismissed
        dup3 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.DISMISSED,
        )
        dup3.photos.add(photos[4], photos[5])
        
        response = self.client.get("/api/duplicates/stats/")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["pending_duplicates"], 1)
        self.assertEqual(response.data["resolved_duplicates"], 1)
        self.assertEqual(response.data["dismissed_duplicates"], 1)

    def test_stats_potential_savings(self):
        """Test stats potential savings calculation."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
            potential_savings=1024 * 1024 * 5,  # 5 MB
        )
        dup.photos.add(photo1, photo2)
        
        response = self.client.get("/api/duplicates/stats/")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["potential_savings_bytes"], 5 * 1024 * 1024)
        self.assertEqual(response.data["potential_savings_mb"], 5.0)

    def test_stats_photos_in_duplicates(self):
        """Test stats counts photos in duplicate groups correctly."""
        photos = [create_test_photo(owner=self.user) for _ in range(5)]
        
        # Create duplicate with 3 photos
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup1.photos.add(photos[0], photos[1], photos[2])
        
        # Create another duplicate with 2 photos (one overlapping)
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup2.photos.add(photos[2], photos[3])  # photos[2] is in both
        
        response = self.client.get("/api/duplicates/stats/")
        
        self.assertEqual(response.status_code, 200)
        # 4 unique photos are in duplicate groups (photos 0,1,2,3)
        self.assertEqual(response.data["photos_in_duplicates"], 4)

    def test_stats_other_users_not_included(self):
        """Test stats don't include other user's duplicates."""
        other_user = create_test_user()
        
        # Create duplicate for other user
        other_photo1 = create_test_photo(owner=other_user)
        other_photo2 = create_test_photo(owner=other_user)
        dup = Duplicate.objects.create(
            owner=other_user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(other_photo1, other_photo2)
        
        # Current user should see 0 duplicates
        response = self.client.get("/api/duplicates/stats/")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_duplicates"], 0)


================================================
FILE: api/tests/test_duplicate_detection.py
================================================
"""
Tests for Duplicate Detection API and Models.

Tests cover:
- Duplicate model creation, resolution, dismissal, revert
- API endpoints for listing, filtering, resolving duplicates
- Edge cases: permissions, invalid IDs, concurrent operations
- BK-Tree algorithm for visual duplicate search
"""
import uuid

from django.test import TestCase
from rest_framework import status
from rest_framework.test import APIClient

from api.models.duplicate import Duplicate
from api.tests.utils import create_test_photos, create_test_user


class DuplicateModelTest(TestCase):
    """Tests for the Duplicate model methods."""

    def setUp(self):
        self.user = create_test_user()
        self.photos = create_test_photos(number_of_photos=3, owner=self.user)

    def test_create_duplicate_group(self):
        """Test creating a duplicate group with multiple photos."""
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        for photo in self.photos:
            photo.duplicates.add(duplicate)

        self.assertEqual(duplicate.photo_count, 3)
        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.PENDING)

    def test_create_duplicate_with_less_than_2_photos_returns_none(self):
        """Test create_or_merge returns None with < 2 photos."""
        result = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=[self.photos[0]],
        )
        self.assertIsNone(result)

    def test_create_or_merge_creates_new_duplicate(self):
        """Test create_or_merge creates a new duplicate group."""
        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            photos=self.photos[:2],
            similarity_score=0.95,
        )
        self.assertIsNotNone(duplicate)
        self.assertEqual(duplicate.photo_count, 2)
        self.assertEqual(duplicate.similarity_score, 0.95)

    def test_create_or_merge_merges_existing(self):
        """Test create_or_merge merges when photo already in group."""
        # Create initial group with first 2 photos
        dup1 = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        # Try to create new group with overlapping photo
        dup2 = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=[self.photos[1], self.photos[2]],
        )
        # Should return the same duplicate (merged)
        self.assertEqual(dup1.id, dup2.id)
        self.assertEqual(dup1.photo_count, 3)

    def test_resolve_duplicate_trashes_others(self):
        """Test resolving a duplicate trashes non-kept photos."""
        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos,
        )
        keep_photo = self.photos[0]
        duplicate.resolve(keep_photo, trash_others=True)

        # Refresh from DB
        duplicate.refresh_from_db()
        for photo in self.photos[1:]:
            photo.refresh_from_db()
            self.assertTrue(photo.in_trashcan)

        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.RESOLVED)
        self.assertEqual(duplicate.kept_photo, keep_photo)
        self.assertEqual(duplicate.trashed_count, 2)

    def test_resolve_duplicate_without_trashing(self):
        """Test resolving without trashing others."""
        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        keep_photo = self.photos[0]
        duplicate.resolve(keep_photo, trash_others=False)

        duplicate.refresh_from_db()
        self.photos[1].refresh_from_db()

        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.RESOLVED)
        self.assertFalse(self.photos[1].in_trashcan)
        self.assertEqual(duplicate.trashed_count, 0)

    def test_dismiss_duplicate(self):
        """Test dismissing a duplicate unlinks photos."""
        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            photos=self.photos[:2],
        )
        duplicate.dismiss()

        duplicate.refresh_from_db()
        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.DISMISSED)
        # Photos should be unlinked
        self.assertEqual(duplicate.photo_count, 0)

    def test_revert_resolved_duplicate(self):
        """Test reverting a resolved duplicate restores photos."""
        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        duplicate.resolve(self.photos[0], trash_others=True)

        # Verify photo was trashed
        self.photos[1].refresh_from_db()
        self.assertTrue(self.photos[1].in_trashcan)

        # Revert
        restored_count = duplicate.revert()
        duplicate.refresh_from_db()
        self.photos[1].refresh_from_db()

        self.assertEqual(restored_count, 1)
        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.PENDING)
        self.assertFalse(self.photos[1].in_trashcan)
        self.assertIsNone(duplicate.kept_photo)

    def test_revert_non_resolved_duplicate_returns_zero(self):
        """Test reverting a pending duplicate returns 0."""
        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        restored_count = duplicate.revert()
        self.assertEqual(restored_count, 0)

    def test_auto_select_best_photo_exact_copy(self):
        """Test auto-selecting best photo for exact copies (shortest path)."""
        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        best = duplicate.auto_select_best_photo()
        self.assertIsNotNone(best)

    def test_calculate_potential_savings(self):
        """Test calculating potential storage savings."""
        # Set known sizes
        self.photos[0].size = 1000000  # 1MB
        self.photos[0].save()
        self.photos[1].size = 500000   # 0.5MB
        self.photos[1].save()

        duplicate = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        savings = duplicate.calculate_potential_savings()

        # Should be size of non-best photos
        self.assertGreater(savings, 0)

    def test_merge_duplicates(self):
        """Test merging two duplicate groups."""
        dup1 = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        # Create second group with photo[2]
        extra_photo = create_test_photos(number_of_photos=1, owner=self.user)[0]
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        extra_photo.duplicates.add(dup2)
        self.photos[2].duplicates.add(dup2)

        # Merge
        dup1.merge_with(dup2)

        # dup2 should be deleted
        self.assertFalse(Duplicate.objects.filter(id=dup2.id).exists())
        # dup1 should have all photos
        self.assertEqual(dup1.photo_count, 4)


class DuplicateAPITest(TestCase):
    """Tests for Duplicate API endpoints."""

    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)
        self.photos = create_test_photos(number_of_photos=4, owner=self.user1)

    def test_list_duplicates_empty(self):
        """Test listing duplicates when none exist."""
        response = self.client.get("/api/duplicates")
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["count"], 0)
        self.assertEqual(data["results"], [])

    def test_list_duplicates_with_results(self):
        """Test listing duplicates with results."""
        Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        response = self.client.get("/api/duplicates")
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["count"], 1)

    def test_list_duplicates_excludes_other_users(self):
        """Test that user can only see their own duplicates."""
        # Create duplicate for user2
        photos2 = create_test_photos(number_of_photos=2, owner=self.user2)
        Duplicate.create_or_merge(
            owner=self.user2,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=photos2,
        )
        # User1 should not see it
        response = self.client.get("/api/duplicates")
        data = response.json()
        self.assertEqual(data["count"], 0)

    def test_list_duplicates_filter_by_type(self):
        """Test filtering duplicates by type."""
        Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            photos=self.photos[2:4],
        )

        # Filter exact copies
        response = self.client.get("/api/duplicates?duplicate_type=exact_copy")
        data = response.json()
        self.assertEqual(data["count"], 1)
        self.assertEqual(data["results"][0]["duplicate_type"], "exact_copy")

    def test_list_duplicates_filter_by_status(self):
        """Test filtering duplicates by review status."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        dup.resolve(self.photos[0], trash_others=True)

        # Filter pending - should be empty
        response = self.client.get("/api/duplicates?status=pending")
        data = response.json()
        self.assertEqual(data["count"], 0)

        # Filter resolved
        response = self.client.get("/api/duplicates?status=resolved")
        data = response.json()
        self.assertEqual(data["count"], 1)

    def test_get_duplicate_detail(self):
        """Test getting duplicate detail."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        response = self.client.get(f"/api/duplicates/{dup.id}")
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["id"], str(dup.id))
        self.assertEqual(len(data["photos"]), 2)

    def test_get_duplicate_detail_not_found(self):
        """Test getting non-existent duplicate returns 404."""
        fake_id = uuid.uuid4()
        response = self.client.get(f"/api/duplicates/{fake_id}")
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_get_duplicate_detail_wrong_user(self):
        """Test user cannot access other user's duplicate."""
        photos2 = create_test_photos(number_of_photos=2, owner=self.user2)
        dup = Duplicate.create_or_merge(
            owner=self.user2,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=photos2,
        )
        response = self.client.get(f"/api/duplicates/{dup.id}")
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_resolve_duplicate(self):
        """Test resolving a duplicate via API."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        payload = {
            "keep_photo_hash": self.photos[0].image_hash,
            "trash_others": True,
        }
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            data=payload,
            format="json",
        )
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "resolved")
        self.assertEqual(data["trashed_count"], 1)

    def test_resolve_duplicate_missing_photo_hash(self):
        """Test resolve without photo hash returns error."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve/",
            data={},
            format="json",
        )
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_resolve_duplicate_invalid_photo(self):
        """Test resolve with photo not in group returns error."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        payload = {
            "keep_photo_hash": self.photos[3].image_hash,  # Not in group
            "trash_others": True,
        }
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            data=payload,
            format="json",
        )
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_dismiss_duplicate(self):
        """Test dismissing a duplicate via API."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            photos=self.photos[:2],
        )
        response = self.client.post(f"/api/duplicates/{dup.id}/dismiss")
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "dismissed")

    def test_revert_duplicate(self):
        """Test reverting a resolved duplicate via API."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        dup.resolve(self.photos[0], trash_others=True)

        response = self.client.post(f"/api/duplicates/{dup.id}/revert")
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "reverted")
        self.assertEqual(data["restored_count"], 1)

    def test_revert_non_resolved_duplicate_fails(self):
        """Test reverting a pending duplicate returns error."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        response = self.client.post(f"/api/duplicates/{dup.id}/revert")
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_delete_duplicate(self):
        """Test deleting a duplicate group via API."""
        dup = Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        dup_id = dup.id
        # API uses /delete suffix instead of DELETE method on main path
        response = self.client.delete(f"/api/duplicates/{dup_id}/delete")
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "deleted")
        self.assertEqual(data["unlinked_count"], 2)

        # Verify duplicate is gone
        self.assertFalse(Duplicate.objects.filter(id=dup_id).exists())

    def test_get_duplicate_stats(self):
        """Test getting duplicate statistics."""
        # Create some duplicates
        Duplicate.create_or_merge(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertIn("total_duplicates", data)
        self.assertIn("pending_duplicates", data)
        self.assertIn("by_type", data)

    def test_detect_duplicates(self):
        """Test triggering duplicate detection."""
        response = self.client.post(
            "/api/duplicates/detect",
            data={
                "detect_exact_copies": True,
                "detect_visual_duplicates": False,
            },
            format="json",
        )
        self.assertEqual(response.status_code, status.HTTP_202_ACCEPTED)
        data = response.json()
        self.assertEqual(data["status"], "queued")


class DuplicateEdgeCasesTest(TestCase):
    """Tests for edge cases and potential bugs."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        self.photos = create_test_photos(number_of_photos=5, owner=self.user)

    def test_duplicate_with_single_photo_excluded_from_list(self):
        """Test duplicates with <2 photos are not returned in list."""
        # Create a duplicate and manually remove all but one photo
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.photos[0].duplicates.add(dup)  # Only 1 photo

        response = self.client.get("/api/duplicates/")
        data = response.json()
        self.assertEqual(data["count"], 0)

    def test_resolve_already_resolved_duplicate(self):
        """Test resolving an already resolved duplicate."""
        dup = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:3],
        )
        dup.resolve(self.photos[0], trash_others=True)

        # Try to resolve again with different photo
        payload = {"keep_photo_hash": self.photos[1].image_hash}
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            data=payload,
            format="json",
        )
        # Should still succeed (updating the resolution)
        self.assertEqual(response.status_code, status.HTTP_200_OK)

    def test_photo_in_multiple_duplicate_groups(self):
        """Test a photo can be in multiple duplicate groups of different types."""
        _dup_exact = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:2],
        )
        _dup_visual = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            photos=[self.photos[0], self.photos[2]],
        )

        # Photo 0 should be in both groups
        self.photos[0].refresh_from_db()
        self.assertEqual(self.photos[0].duplicates.count(), 2)

    def test_delete_photo_removes_from_duplicate(self):
        """Test deleting a photo removes it from duplicate group."""
        dup = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:3],
        )
        initial_count = dup.photo_count

        # Delete a photo from the duplicate group
        photo_to_delete = self.photos[0]
        photo_to_delete.duplicates.remove(dup)

        dup.refresh_from_db()
        self.assertEqual(dup.photo_count, initial_count - 1)

    def test_pagination_works_correctly(self):
        """Test pagination returns correct results."""
        # Create 25 duplicate groups
        for i in range(25):
            extra_photos = create_test_photos(number_of_photos=2, owner=self.user)
            Duplicate.create_or_merge(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
                photos=extra_photos,
            )

        # Get first page
        response = self.client.get("/api/duplicates?page=1&page_size=10")
        data = response.json()
        self.assertEqual(len(data["results"]), 10)
        self.assertEqual(data["count"], 25)
        self.assertTrue(data["has_next"])

        # Get second page
        response = self.client.get("/api/duplicates?page=2&page_size=10")
        data = response.json()
        self.assertEqual(len(data["results"]), 10)
        self.assertTrue(data["has_previous"])

    def test_invalid_uuid_format(self):
        """Test invalid UUID format.
        
        Note: The URL regex pattern [0-9a-f-]+ matches any hex-like string,
        so 'not-a-valid-uuid' partially matches. The view then returns an
        empty result rather than 404/400. This is acceptable behavior.
        """
        response = self.client.get("/api/duplicates/not-a-valid-uuid")
        # The regex matches the string (contains a-f and -), but no duplicate exists
        # so it returns the list endpoint with empty results
        self.assertEqual(response.status_code, status.HTTP_200_OK)

    def test_concurrent_resolve_same_duplicate(self):
        """Test handling multiple resolution attempts.
        
        The API allows re-resolving a duplicate with the same or different photo.
        This is useful if the user changes their mind about which photo to keep.
        """
        dup = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=self.photos[:3],
        )
        # First resolve - keep photos[0], trash others
        payload1 = {"keep_photo_hash": self.photos[0].image_hash}
        response1 = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            data=payload1,
            format="json",
        )
        self.assertEqual(response1.status_code, status.HTTP_200_OK)

        # Verify photos[1] is now trashed
        self.photos[1].refresh_from_db()
        self.assertTrue(self.photos[1].in_trashcan)

        # Re-resolve with same photo (idempotent operation)
        payload2 = {"keep_photo_hash": self.photos[0].image_hash}
        response2 = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            data=payload2,
            format="json",
        )
        # Re-resolving is allowed
        self.assertEqual(response2.status_code, status.HTTP_200_OK)


class BKTreeTest(TestCase):
    """Tests for BK-Tree algorithm used in visual duplicate detection."""

    def test_bk_tree_basic_operations(self):
        """Test BK-Tree add and search operations."""
        from api.duplicate_detection import BKTree
        from api.perceptual_hash import hamming_distance

        tree = BKTree(hamming_distance)
        tree.add("photo1", "0000000000000000")
        tree.add("photo2", "0000000000000001")  # 1 bit different
        tree.add("photo3", "1111111111111111")  # Very different

        # Search with threshold 1
        results = tree.search("0000000000000000", 1)
        result_ids = [r[0] for r in results]
        self.assertIn("photo1", result_ids)
        self.assertIn("photo2", result_ids)
        self.assertNotIn("photo3", result_ids)

    def test_bk_tree_empty_search(self):
        """Test BK-Tree search on empty tree."""
        from api.duplicate_detection import BKTree
        from api.perceptual_hash import hamming_distance

        tree = BKTree(hamming_distance)
        results = tree.search("0000000000000000", 5)
        self.assertEqual(results, [])


class UnionFindTest(TestCase):
    """Tests for Union-Find data structure used in duplicate grouping."""

    def test_union_find_basic(self):
        """Test Union-Find basic operations."""
        from api.duplicate_detection import UnionFind

        uf = UnionFind()
        uf.union("a", "b")
        uf.union("b", "c")

        # a, b, c should be in same group
        self.assertEqual(uf.find("a"), uf.find("b"))
        self.assertEqual(uf.find("b"), uf.find("c"))

    def test_union_find_get_groups(self):
        """Test Union-Find get_groups returns correct groups."""
        from api.duplicate_detection import UnionFind

        uf = UnionFind()
        uf.union("a", "b")
        uf.union("c", "d")
        uf.union("e", "f")

        groups = uf.get_groups()
        self.assertEqual(len(groups), 3)
        # Each group should have 2 elements
        for group in groups:
            self.assertEqual(len(group), 2)

    def test_union_find_single_elements_not_returned(self):
        """Test Union-Find doesn't return single-element groups."""
        from api.duplicate_detection import UnionFind

        uf = UnionFind()
        uf.find("a")  # Creates single element
        uf.union("b", "c")

        groups = uf.get_groups()
        # Only the b-c group should be returned
        self.assertEqual(len(groups), 1)
        self.assertEqual(len(groups[0]), 2)


================================================
FILE: api/tests/test_duplicate_detection_logic.py
================================================
"""
Comprehensive tests for Duplicate Detection Logic.

Tests cover:
- BKTree: Burkhard-Keller Tree for efficient Hamming distance queries
- UnionFind: Union-Find data structure for grouping
- detect_exact_copies: Exact copy detection via MD5 hash
- detect_visual_duplicates: Visual similarity detection via perceptual hash
- batch_detect_duplicates: Batch detection orchestration
- Edge cases and error handling
"""

import uuid
from unittest.mock import patch

from django.test import TestCase

from api.models.duplicate import Duplicate
from api.models.file import File
from api.models.long_running_job import LongRunningJob
from api.duplicate_detection import (
    BKTree,
    UnionFind,
    detect_exact_copies,
    detect_visual_duplicates,
    batch_detect_duplicates,
)
from api.tests.utils import create_test_photo, create_test_user


class BKTreeTestCase(TestCase):
    """Tests for BKTree data structure."""

    def setUp(self):
        # Simple Hamming distance for testing
        def hamming(a, b):
            return sum(c1 != c2 for c1, c2 in zip(a, b))
        self.tree = BKTree(hamming)

    def test_empty_tree_search_returns_empty(self):
        """Test searching empty tree returns empty list."""
        results = self.tree.search("abc", 1)
        self.assertEqual(results, [])

    def test_add_single_item(self):
        """Test adding single item to tree."""
        self.tree.add("id1", "abc")
        
        self.assertEqual(self.tree.size, 1)
        self.assertIsNotNone(self.tree.root)
        self.assertEqual(self.tree.root["id"], "id1")
        self.assertEqual(self.tree.root["hash"], "abc")

    def test_add_multiple_items(self):
        """Test adding multiple items to tree."""
        self.tree.add("id1", "abc")
        self.tree.add("id2", "abd")
        self.tree.add("id3", "xyz")
        
        self.assertEqual(self.tree.size, 3)

    def test_search_exact_match(self):
        """Test searching for exact match (distance 0)."""
        self.tree.add("id1", "abc")
        self.tree.add("id2", "xyz")
        
        results = self.tree.search("abc", 0)
        
        self.assertEqual(len(results), 1)
        self.assertEqual(results[0][0], "id1")
        self.assertEqual(results[0][1], 0)  # distance

    def test_search_within_threshold(self):
        """Test searching within Hamming threshold."""
        self.tree.add("id1", "abc")
        self.tree.add("id2", "abd")  # distance 1 from "abc"
        self.tree.add("id3", "xyz")  # distance 3 from "abc"
        
        results = self.tree.search("abc", 1)
        
        self.assertEqual(len(results), 2)
        result_ids = [r[0] for r in results]
        self.assertIn("id1", result_ids)
        self.assertIn("id2", result_ids)
        self.assertNotIn("id3", result_ids)

    def test_search_threshold_excludes_distant(self):
        """Test threshold correctly excludes distant items."""
        self.tree.add("id1", "aaaa")
        self.tree.add("id2", "zzzz")  # distance 4 from "aaaa"
        
        results = self.tree.search("aaaa", 3)
        
        self.assertEqual(len(results), 1)
        self.assertEqual(results[0][0], "id1")

    def test_search_returns_correct_distances(self):
        """Test search returns correct Hamming distances."""
        self.tree.add("id1", "abc")
        self.tree.add("id2", "aXc")  # distance 1
        self.tree.add("id3", "XXc")  # distance 2
        
        results = self.tree.search("abc", 2)
        
        results_dict = {r[0]: r[1] for r in results}
        self.assertEqual(results_dict["id1"], 0)
        self.assertEqual(results_dict["id2"], 1)
        self.assertEqual(results_dict["id3"], 2)

    def test_add_duplicate_hash(self):
        """Test adding items with same hash."""
        self.tree.add("id1", "abc")
        self.tree.add("id2", "abc")  # Same hash, different id
        
        self.assertEqual(self.tree.size, 2)
        
        results = self.tree.search("abc", 0)
        result_ids = [r[0] for r in results]
        self.assertIn("id1", result_ids)
        self.assertIn("id2", result_ids)

    def test_large_tree_performance(self):
        """Test tree performs well with many items."""
        # Add 1000 items
        for i in range(1000):
            hash_val = f"{i:04d}"
            self.tree.add(f"id{i}", hash_val)
        
        self.assertEqual(self.tree.size, 1000)
        
        # Search should complete quickly
        results = self.tree.search("0500", 1)
        self.assertGreater(len(results), 0)


class UnionFindTestCase(TestCase):
    """Tests for UnionFind data structure."""

    def test_initial_find_creates_entry(self):
        """Test find creates new entry if not exists."""
        uf = UnionFind()
        
        root = uf.find("a")
        
        self.assertEqual(root, "a")
        self.assertIn("a", uf.parent)

    def test_find_same_element_returns_itself(self):
        """Test find on single element returns itself."""
        uf = UnionFind()
        
        uf.find("a")
        root = uf.find("a")
        
        self.assertEqual(root, "a")

    def test_union_links_elements(self):
        """Test union links two elements."""
        uf = UnionFind()
        
        uf.union("a", "b")
        
        self.assertEqual(uf.find("a"), uf.find("b"))

    def test_union_multiple_elements(self):
        """Test union of multiple elements."""
        uf = UnionFind()
        
        uf.union("a", "b")
        uf.union("b", "c")
        uf.union("c", "d")
        
        # All should have same root
        root_a = uf.find("a")
        self.assertEqual(uf.find("b"), root_a)
        self.assertEqual(uf.find("c"), root_a)
        self.assertEqual(uf.find("d"), root_a)

    def test_union_separate_groups(self):
        """Test union keeps separate groups separate."""
        uf = UnionFind()
        
        uf.union("a", "b")
        uf.union("c", "d")
        
        self.assertEqual(uf.find("a"), uf.find("b"))
        self.assertEqual(uf.find("c"), uf.find("d"))
        self.assertNotEqual(uf.find("a"), uf.find("c"))

    def test_get_groups_returns_groups(self):
        """Test get_groups returns correct groups."""
        uf = UnionFind()
        
        uf.union("a", "b")
        uf.union("c", "d")
        uf.union("d", "e")
        
        groups = uf.get_groups()
        
        self.assertEqual(len(groups), 2)
        
        # Check group contents
        group_sets = [set(g) for g in groups]
        self.assertIn({"a", "b"}, group_sets)
        self.assertIn({"c", "d", "e"}, group_sets)

    def test_get_groups_excludes_singletons(self):
        """Test get_groups excludes single-element groups."""
        uf = UnionFind()
        
        uf.find("a")  # Single element
        uf.union("b", "c")  # Pair
        
        groups = uf.get_groups()
        
        self.assertEqual(len(groups), 1)
        self.assertEqual(set(groups[0]), {"b", "c"})

    def test_path_compression(self):
        """Test path compression works (parent points directly to root)."""
        uf = UnionFind()
        
        # Create long chain
        uf.union("a", "b")
        uf.union("b", "c")
        uf.union("c", "d")
        
        # After find, path should be compressed
        root = uf.find("a")
        self.assertEqual(uf.parent["a"], root)


class DetectExactCopiesTestCase(TestCase):
    """Tests for detect_exact_copies function."""

    def setUp(self):
        self.user = create_test_user()

    def _create_photo_with_hash(self, image_hash, file_hash=None, **kwargs):
        """Helper to create Photo with specific hashes."""
        photo = create_test_photo(owner=self.user, **kwargs)
        photo.image_hash = image_hash
        
        if file_hash:
            file = File.objects.create(
                hash=file_hash,
                path=f"/photos/test_{uuid.uuid4()}.jpg",
                type=File.IMAGE,
            )
            photo.files.add(file)
            photo.main_file = file
        
        photo.save()
        return photo

    def test_no_duplicates_returns_zero(self):
        """Test no duplicates when all hashes unique."""
        self._create_photo_with_hash("hash1")
        self._create_photo_with_hash("hash2")
        self._create_photo_with_hash("hash3")
        
        count = detect_exact_copies(self.user)
        
        self.assertEqual(count, 0)

    def test_detects_duplicate_image_hash(self):
        """Test detects photos with same image_hash."""
        self._create_photo_with_hash("same_hash")
        self._create_photo_with_hash("same_hash")
        
        count = detect_exact_copies(self.user)
        
        self.assertEqual(count, 1)
        
        # Check duplicate was created
        duplicates = Duplicate.objects.filter(owner=self.user)
        self.assertEqual(duplicates.count(), 1)
        self.assertEqual(duplicates.first().photos.count(), 2)
        self.assertEqual(duplicates.first().duplicate_type, Duplicate.DuplicateType.EXACT_COPY)

    def test_detects_duplicate_file_hash(self):
        """Test detects photos with same file hash (MD5 part)."""
        # Same MD5 content hash (first 32 chars)
        file_hash1 = "a" * 32 + "user1"
        file_hash2 = "a" * 32 + "user2"  # Same MD5, different suffix
        
        self._create_photo_with_hash("unique1", file_hash1)
        self._create_photo_with_hash("unique2", file_hash2)
        
        count = detect_exact_copies(self.user)
        
        self.assertEqual(count, 1)

    def test_skips_hidden_photos(self):
        """Test hidden photos are excluded."""
        self._create_photo_with_hash("same_hash", hidden=True)
        self._create_photo_with_hash("same_hash")
        
        count = detect_exact_copies(self.user)
        
        # Only 1 visible photo with this hash, so no duplicate
        self.assertEqual(count, 0)

    def test_skips_trashed_photos(self):
        """Test trashed photos are excluded."""
        self._create_photo_with_hash("same_hash", in_trashcan=True)
        self._create_photo_with_hash("same_hash")
        
        count = detect_exact_copies(self.user)
        
        self.assertEqual(count, 0)

    def test_multiple_duplicate_groups(self):
        """Test detects multiple separate duplicate groups."""
        # Group 1
        self._create_photo_with_hash("hash_a")
        self._create_photo_with_hash("hash_a")
        
        # Group 2
        self._create_photo_with_hash("hash_b")
        self._create_photo_with_hash("hash_b")
        self._create_photo_with_hash("hash_b")
        
        count = detect_exact_copies(self.user)
        
        self.assertEqual(count, 2)

    def test_progress_callback_called(self):
        """Test progress callback is called during detection."""
        self._create_photo_with_hash("same_hash")
        self._create_photo_with_hash("same_hash")
        
        callback_calls = []
        
        def progress_callback(current, total, found):
            callback_calls.append((current, total, found))
        
        detect_exact_copies(self.user, progress_callback=progress_callback)
        
        # Callback may or may not be called depending on group count


class DetectVisualDuplicatesTestCase(TestCase):
    """Tests for detect_visual_duplicates function."""

    def setUp(self):
        self.user = create_test_user()

    def _create_photo_with_phash(self, perceptual_hash, **kwargs):
        """Helper to create Photo with perceptual hash."""
        photo = create_test_photo(owner=self.user, **kwargs)
        photo.perceptual_hash = perceptual_hash
        photo.save()
        return photo

    def test_no_photos_returns_zero(self):
        """Test returns 0 when no photos."""
        count = detect_visual_duplicates(self.user)
        
        self.assertEqual(count, 0)

    def test_single_photo_returns_zero(self):
        """Test returns 0 with only one photo."""
        self._create_photo_with_phash("abcd1234")
        
        count = detect_visual_duplicates(self.user)
        
        self.assertEqual(count, 0)

    def test_detects_identical_phash(self):
        """Test detects photos with identical perceptual hash."""
        self._create_photo_with_phash("a" * 16)
        self._create_photo_with_phash("a" * 16)
        
        count = detect_visual_duplicates(self.user, threshold=0)
        
        self.assertEqual(count, 1)

    def test_detects_similar_phash_within_threshold(self):
        """Test detects photos with similar perceptual hash."""
        # These hashes differ by 2 characters
        self._create_photo_with_phash("aaaaaaaaaaaaaaaa")
        self._create_photo_with_phash("aaaaaaaaaaaaaabb")  # 2 chars different
        
        count = detect_visual_duplicates(self.user, threshold=5)
        
        self.assertEqual(count, 1)

    def test_threshold_excludes_dissimilar(self):
        """Test threshold excludes dissimilar photos."""
        self._create_photo_with_phash("aaaaaaaaaaaaaaaa")
        self._create_photo_with_phash("zzzzzzzzzzzzzzzz")  # Very different
        
        count = detect_visual_duplicates(self.user, threshold=5)
        
        self.assertEqual(count, 0)

    def test_skips_photos_without_phash(self):
        """Test photos without perceptual hash are skipped."""
        self._create_photo_with_phash("aaaaaaaaaaaaaaaa")
        photo_no_hash = create_test_photo(owner=self.user)
        photo_no_hash.perceptual_hash = None
        photo_no_hash.save()
        
        count = detect_visual_duplicates(self.user)
        
        self.assertEqual(count, 0)

    def test_skips_hidden_photos(self):
        """Test hidden photos are excluded."""
        self._create_photo_with_phash("aaaaaaaaaaaaaaaa", hidden=True)
        self._create_photo_with_phash("aaaaaaaaaaaaaaaa")
        
        count = detect_visual_duplicates(self.user, threshold=0)
        
        self.assertEqual(count, 0)

    def test_creates_visual_duplicate_type(self):
        """Test creates duplicate with VISUAL_DUPLICATE type."""
        self._create_photo_with_phash("a" * 16)
        self._create_photo_with_phash("a" * 16)
        
        detect_visual_duplicates(self.user, threshold=0)
        
        duplicate = Duplicate.objects.filter(owner=self.user).first()
        self.assertEqual(duplicate.duplicate_type, Duplicate.DuplicateType.VISUAL_DUPLICATE)


class BatchDetectDuplicatesTestCase(TestCase):
    """Tests for batch_detect_duplicates orchestration."""

    def setUp(self):
        self.user = create_test_user()

    @patch('api.duplicate_detection.detect_exact_copies')
    @patch('api.duplicate_detection.detect_visual_duplicates')
    def test_calls_both_detectors_by_default(self, mock_visual, mock_exact):
        """Test both detectors called with default options."""
        mock_exact.return_value = 5
        mock_visual.return_value = 3
        
        batch_detect_duplicates(self.user)
        
        mock_exact.assert_called_once()
        mock_visual.assert_called_once()

    @patch('api.duplicate_detection.detect_exact_copies')
    @patch('api.duplicate_detection.detect_visual_duplicates')
    def test_respects_options(self, mock_visual, mock_exact):
        """Test options control which detectors run."""
        mock_exact.return_value = 0
        mock_visual.return_value = 0
        
        batch_detect_duplicates(self.user, options={
            'detect_exact_copies': False,
            'detect_visual_duplicates': True,
        })
        
        mock_exact.assert_not_called()
        mock_visual.assert_called_once()

    @patch('api.duplicate_detection.detect_exact_copies')
    @patch('api.duplicate_detection.detect_visual_duplicates')
    def test_passes_visual_threshold(self, mock_visual, mock_exact):
        """Test visual threshold passed to detector."""
        mock_exact.return_value = 0
        mock_visual.return_value = 0
        
        batch_detect_duplicates(self.user, options={
            'visual_threshold': 15,
        })
        
        mock_visual.assert_called_once()
        args, kwargs = mock_visual.call_args
        self.assertEqual(args[1], 15)  # threshold argument

    @patch('api.duplicate_detection.detect_exact_copies')
    @patch('api.duplicate_detection.detect_visual_duplicates')
    def test_creates_job(self, mock_visual, mock_exact):
        """Test LongRunningJob created for tracking."""
        mock_exact.return_value = 0
        mock_visual.return_value = 0
        
        batch_detect_duplicates(self.user)
        
        job = LongRunningJob.objects.filter(
            started_by=self.user,
            job_type=LongRunningJob.JOB_DETECT_DUPLICATES,
        ).first()
        self.assertIsNotNone(job)

    @patch('api.duplicate_detection.detect_exact_copies')
    @patch('api.duplicate_detection.detect_visual_duplicates')
    def test_clear_pending_option(self, mock_visual, mock_exact):
        """Test clear_pending option clears pending duplicates."""
        mock_exact.return_value = 0
        mock_visual.return_value = 0
        
        # Create pending duplicate
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        duplicate.photos.add(photo1, photo2)
        
        batch_detect_duplicates(self.user, options={'clear_pending': True})
        
        # Pending duplicate should be cleared
        self.assertFalse(Duplicate.objects.filter(pk=duplicate.pk).exists())

    @patch('api.duplicate_detection.detect_exact_copies')
    def test_handles_exception(self, mock_exact):
        """Test exception handling during detection."""
        mock_exact.side_effect = Exception("Detection failed")
        
        with self.assertRaises(Exception):
            batch_detect_duplicates(self.user)
        
        # Job should be marked as failed
        job = LongRunningJob.objects.filter(started_by=self.user).first()
        self.assertIsNotNone(job)


class EdgeCasesTestCase(TestCase):
    """Edge case tests for duplicate detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_empty_photo_library(self):
        """Test detection on empty library."""
        count_exact = detect_exact_copies(self.user)
        count_visual = detect_visual_duplicates(self.user)
        
        self.assertEqual(count_exact, 0)
        self.assertEqual(count_visual, 0)

    def test_photo_without_files(self):
        """Test photos without files are handled gracefully."""
        photo = create_test_photo(owner=self.user)
        photo.image_hash = "unique_hash"
        photo.save()
        # No files attached
        
        count = detect_exact_copies(self.user)
        self.assertEqual(count, 0)

    def test_photo_with_short_file_hash(self):
        """Test files with hash shorter than 32 chars."""
        photo = create_test_photo(owner=self.user)
        file = File.objects.create(
            hash="short",  # Less than 32 chars
            path="/photos/test.jpg",
            type=File.IMAGE,
        )
        photo.files.add(file)
        photo.save()
        
        # Should not raise
        count = detect_exact_copies(self.user)
        self.assertEqual(count, 0)

    def test_different_users_isolated(self):
        """Test duplicates are isolated per user."""
        other_user = create_test_user()
        
        # Create "duplicate" across users
        photo1 = create_test_photo(owner=self.user)
        photo1.image_hash = "same_hash"
        photo1.save()
        
        photo2 = create_test_photo(owner=other_user)
        photo2.image_hash = "same_hash"
        photo2.save()
        
        count = detect_exact_copies(self.user)
        
        # Should not find cross-user duplicates
        self.assertEqual(count, 0)

    def test_metadata_files_excluded(self):
        """Test metadata files excluded from duplicate detection."""
        photo = create_test_photo(owner=self.user)
        
        # Add metadata file
        metadata_file = File.objects.create(
            hash="a" * 32 + "suffix",
            path="/photos/test.xmp",
            type=File.METADATA_FILE,
        )
        photo.files.add(metadata_file)
        photo.save()
        
        # Should not count metadata file for duplicate detection
        count = detect_exact_copies(self.user)
        self.assertEqual(count, 0)

    def test_bktree_with_empty_hash(self):
        """Test BKTree handles empty/None hash gracefully."""
        def hamming(a, b):
            if not a or not b:
                return float('inf')
            return sum(c1 != c2 for c1, c2 in zip(a, b))
        
        tree = BKTree(hamming)
        tree.add("id1", "abc")
        
        # Search with valid hash should work
        results = tree.search("abc", 1)
        self.assertEqual(len(results), 1)

    def test_union_find_with_same_element_union(self):
        """Test UnionFind handles self-union."""
        uf = UnionFind()
        
        uf.union("a", "a")  # Self-union
        
        self.assertEqual(uf.find("a"), "a")
        groups = uf.get_groups()
        self.assertEqual(len(groups), 0)  # Single element not in groups

    def test_three_way_duplicate(self):
        """Test detection with 3+ copies of same file."""
        for _ in range(5):
            photo = create_test_photo(owner=self.user)
            photo.image_hash = "five_way_duplicate"
            photo.save()
        
        count = detect_exact_copies(self.user)
        
        self.assertEqual(count, 1)
        
        # Check all 5 photos in same group
        duplicate = Duplicate.objects.filter(owner=self.user).first()
        self.assertEqual(duplicate.photos.count(), 5)

    def test_transitive_duplicates_merged(self):
        """Test transitive duplicates are merged into one group."""
        # Photo A matches Photo B (same image_hash)
        # Photo B matches Photo C (same image_hash)
        # All three should be in same duplicate group
        
        photo_a = create_test_photo(owner=self.user)
        photo_a.image_hash = "hash_abc"
        file_a = File.objects.create(hash="x" * 32, path="/a.jpg", type=File.IMAGE)
        photo_a.files.add(file_a)
        photo_a.save()
        
        photo_b = create_test_photo(owner=self.user)
        photo_b.image_hash = "hash_abc"  # Same as A
        file_b = File.objects.create(hash="y" * 32, path="/b.jpg", type=File.IMAGE)
        photo_b.files.add(file_b)
        photo_b.save()
        
        photo_c = create_test_photo(owner=self.user)
        photo_c.image_hash = "hash_abc"  # Same as A and B
        file_c = File.objects.create(hash="z" * 32, path="/c.jpg", type=File.IMAGE)
        photo_c.files.add(file_c)
        photo_c.save()
        
        count = detect_exact_copies(self.user)
        
        # All 3 have same image_hash => all in one group
        self.assertEqual(count, 1)
        
        duplicate = Duplicate.objects.filter(owner=self.user).first()
        self.assertEqual(duplicate.photos.count(), 3)


================================================
FILE: api/tests/test_duplicate_filtering.py
================================================
"""
Tests for Duplicate API filtering and detection edge cases.

Tests cover:
- Filter by duplicate type (exact_copy, visual_duplicate)
- Filter by status (pending, resolved, dismissed)
- Photos without perceptual hash
- Visual threshold sensitivity
- Detection job handling
"""

from django.test import TestCase
from rest_framework.test import APIClient

from api.models.duplicate import Duplicate
from api.tests.utils import create_test_photo, create_test_user


class DuplicateFilterByTypeTestCase(TestCase):
    """Tests for filtering duplicates by type."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        
        # Create photos for duplicates
        self.photos = [create_test_photo(owner=self.user) for _ in range(6)]
        
        # Create exact copy duplicate
        self.exact_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.exact_dup.photos.add(self.photos[0], self.photos[1])
        
        # Create visual duplicate
        self.visual_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            similarity_score=0.95,
        )
        self.visual_dup.photos.add(self.photos[2], self.photos[3])
        
        # Create another exact copy
        self.exact_dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.exact_dup2.photos.add(self.photos[4], self.photos[5])

    def test_filter_exact_copies(self):
        """Test filtering for exact copies only."""
        response = self.client.get(
            f"/api/duplicates?duplicate_type={Duplicate.DuplicateType.EXACT_COPY}"
        )
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 2)
        for dup in response.data["results"]:
            self.assertEqual(dup["duplicate_type"], Duplicate.DuplicateType.EXACT_COPY)

    def test_filter_visual_duplicates(self):
        """Test filtering for visual duplicates only."""
        response = self.client.get(
            f"/api/duplicates?duplicate_type={Duplicate.DuplicateType.VISUAL_DUPLICATE}"
        )
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)
        self.assertEqual(
            response.data["results"][0]["duplicate_type"],
            Duplicate.DuplicateType.VISUAL_DUPLICATE
        )

    def test_filter_invalid_type(self):
        """Test filtering with invalid type returns empty or all."""
        response = self.client.get("/api/duplicates?duplicate_type=invalid_type")
        
        self.assertEqual(response.status_code, 200)
        # Should return all or empty depending on implementation
        self.assertIn(response.data["count"], [0, 3])

    def test_no_filter_returns_all(self):
        """Test that no filter returns all duplicates."""
        response = self.client.get("/api/duplicates")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 3)


class DuplicateFilterByStatusTestCase(TestCase):
    """Tests for filtering duplicates by status."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        
        # Create photos for duplicates
        self.photos = [create_test_photo(owner=self.user) for _ in range(6)]
        
        # Create pending duplicate
        self.pending = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        self.pending.photos.add(self.photos[0], self.photos[1])
        
        # Create resolved duplicate
        self.resolved = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
        )
        self.resolved.photos.add(self.photos[2], self.photos[3])
        
        # Create dismissed duplicate
        self.dismissed = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            review_status=Duplicate.ReviewStatus.DISMISSED,
        )
        self.dismissed.photos.add(self.photos[4], self.photos[5])

    def test_filter_pending(self):
        """Test filtering for pending duplicates."""
        response = self.client.get(
            f"/api/duplicates?status={Duplicate.ReviewStatus.PENDING}"
        )
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)
        self.assertEqual(
            response.data["results"][0]["review_status"],
            Duplicate.ReviewStatus.PENDING
        )

    def test_filter_resolved(self):
        """Test filtering for resolved duplicates."""
        response = self.client.get(
            f"/api/duplicates?status={Duplicate.ReviewStatus.RESOLVED}"
        )
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)

    def test_filter_dismissed(self):
        """Test filtering for dismissed duplicates."""
        response = self.client.get(
            f"/api/duplicates?status={Duplicate.ReviewStatus.DISMISSED}"
        )
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)

    def test_combined_type_and_status_filter(self):
        """Test combining type and status filters."""
        response = self.client.get(
            f"/api/duplicates?duplicate_type={Duplicate.DuplicateType.EXACT_COPY}&status={Duplicate.ReviewStatus.PENDING}"
        )
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)


class PhotosWithoutPerceptualHashTestCase(TestCase):
    """Tests for handling photos without perceptual hash during detection."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_detection_handles_null_perceptual_hash(self):
        """Test that detection handles photos with null perceptual hash."""
        # Create photos, some without perceptual hash
        photo1 = create_test_photo(owner=self.user)
        _photo2 = create_test_photo(owner=self.user)
        
        # Set null perceptual hash
        photo1.image_phash = None
        photo1.save()
        
        # Detection should not crash - just trigger the endpoint
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_exact_copies": True, "detect_visual_duplicates": True},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])

    def test_visual_duplicate_detection_endpoint(self):
        """Test visual duplicate detection API endpoint."""
        # Create photos
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Set phash values
        photo1.image_phash = "abcd1234"
        photo1.save()
        photo2.image_phash = "abcd1234"  # Same as photo1
        photo2.save()
        
        # Detection should work
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_visual_duplicates": True, "visual_threshold": 5},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])


class DuplicateDetectionJobTestCase(TestCase):
    """Tests for duplicate detection job handling."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_detect_with_all_options(self):
        """Test detection with all options enabled."""
        response = self.client.post(
            "/api/duplicates/detect",
            {
                "detect_exact_copies": True,
                "detect_visual_duplicates": True,
                "visual_threshold": 10,
                "clear_pending": False,
            },
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])

    def test_detect_exact_only(self):
        """Test detection with only exact copies."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_exact_copies": True, "detect_visual_duplicates": False},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])

    def test_detect_visual_only(self):
        """Test detection with only visual duplicates."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_exact_copies": False, "detect_visual_duplicates": True},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])

    def test_detect_nothing_returns_error(self):
        """Test detection with both options false."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_exact_copies": False, "detect_visual_duplicates": False},
            format='json',
        )
        
        # Should return 400 or just skip detection
        self.assertIn(response.status_code, [200, 202, 400])

    def test_detect_with_clear_pending(self):
        """Test detection with clear_pending option."""
        # Create a pending duplicate first
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        dup.photos.add(photo1, photo2)
        
        # Detection API queues a background job
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_exact_copies": True, "clear_pending": True},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])


class VisualThresholdTestCase(TestCase):
    """Tests for visual duplicate threshold sensitivity."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_strict_threshold(self):
        """Test visual detection with strict threshold (low value)."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_visual_duplicates": True, "visual_threshold": 3},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])

    def test_loose_threshold(self):
        """Test visual detection with loose threshold (high value)."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_visual_duplicates": True, "visual_threshold": 20},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])

    def test_zero_threshold(self):
        """Test visual detection with zero threshold (exact match only)."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_visual_duplicates": True, "visual_threshold": 0},
            format='json',
        )
        
        self.assertIn(response.status_code, [200, 202])

    def test_negative_threshold_handled(self):
        """Test that negative threshold is handled gracefully."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"detect_visual_duplicates": True, "visual_threshold": -5},
            format='json',
        )
        
        # Should handle gracefully - either 400 or clamp to 0
        self.assertIn(response.status_code, [200, 202, 400])


class DuplicateListSortingTestCase(TestCase):
    """Tests for duplicate list sorting."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        
        # Create multiple duplicates
        self.photos = [create_test_photo(owner=self.user) for _ in range(4)]
        
        self.dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.dup1.photos.add(self.photos[0], self.photos[1])
        
        self.dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            similarity_score=0.95,
        )
        self.dup2.photos.add(self.photos[2], self.photos[3])

    def test_default_sorting(self):
        """Test default sorting order."""
        response = self.client.get("/api/duplicates")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 2)

    def test_sort_by_created_at(self):
        """Test sorting by created_at."""
        response = self.client.get("/api/duplicates?ordering=-created_at")
        
        self.assertEqual(response.status_code, 200)


class DuplicateBulkActionsTestCase(TestCase):
    """Tests for bulk actions on duplicates."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_bulk_dismiss(self):
        """Test bulk dismissing duplicates."""
        photos = [create_test_photo(owner=self.user) for _ in range(4)]
        
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup1.photos.add(photos[0], photos[1])
        
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup2.photos.add(photos[2], photos[3])
        
        # Dismiss first one
        response = self.client.post(f"/api/duplicates/{dup1.id}/dismiss")
        self.assertEqual(response.status_code, 200)
        
        dup1.refresh_from_db()
        self.assertEqual(dup1.review_status, Duplicate.ReviewStatus.DISMISSED)


class EmptyDuplicateGroupTestCase(TestCase):
    """Tests for handling empty or invalid duplicate groups."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_duplicate_with_no_photos(self):
        """Test handling duplicate group with no photos."""
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        # Don't add any photos
        
        response = self.client.get(f"/api/duplicates/{dup.id}")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["photo_count"], 0)

    def test_duplicate_with_one_photo(self):
        """Test handling duplicate group with only one photo."""
        photo = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo)
        
        response = self.client.get(f"/api/duplicates/{dup.id}")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["photo_count"], 1)

    def test_resolve_single_photo_duplicate(self):
        """Test resolving duplicate with only one photo."""
        photo = create_test_photo(owner=self.user)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(photo)
        
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            {"keep_photo_hash": photo.image_hash},
            format='json',
        )
        
        # Should succeed but with no photos to trash
        self.assertIn(response.status_code, [200, 400])


================================================
FILE: api/tests/test_edge_cases_integration.py
================================================
"""
Tests for edge cases and error handling.

Tests:
- Photos with no EXIF data
- Missing/corrupted files
- Concurrent detection jobs
- Empty/invalid data handling
"""


from django.test import TestCase, TransactionTestCase
from rest_framework.test import APIClient, APITestCase

from api.models.duplicate import Duplicate
from api.models.photo_stack import PhotoStack
from api.models.photo_metadata import PhotoMetadata
from api.tests.utils import create_test_photo, create_test_user


class PhotoNoExifDataTestCase(TestCase):
    """Test handling of photos with no EXIF data."""

    def setUp(self):
        self.user = create_test_user()

    def test_photo_without_exif_timestamp(self):
        """Test handling photo with no EXIF timestamp."""
        photo = create_test_photo(owner=self.user)
        photo.exif_timestamp = None
        photo.save()
        
        # Should still be usable
        self.assertIsNotNone(photo.pk)
        self.assertIsNone(photo.exif_timestamp)

    def test_photo_without_gps_data(self):
        """Test handling photo with no GPS data."""
        photo = create_test_photo(owner=self.user)
        photo.exif_gps_lat = None
        photo.exif_gps_lon = None
        photo.save()
        
        # Should still be usable
        self.assertIsNotNone(photo.pk)

    def test_photo_without_perceptual_hash(self):
        """Test handling photo with no perceptual hash."""
        photo = create_test_photo(owner=self.user)
        photo.image_phash = None
        photo.save()
        
        # Should still be usable but not in visual duplicate detection
        self.assertIsNotNone(photo.pk)
        self.assertIsNone(photo.image_phash)

    def test_stack_with_no_exif_photos(self):
        """Test creating stack with photos that have no EXIF."""
        photos = []
        for _ in range(3):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = None
            photo.save()
            photos.append(photo)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        # auto_select_primary should still work
        _result = stack.auto_select_primary()
        # May or may not select one depending on implementation
        # The important thing is it doesn't crash

    def test_duplicate_with_no_metadata_photos(self):
        """Test duplicate group with photos lacking metadata."""
        photos = []
        for _ in range(2):
            photo = create_test_photo(owner=self.user)
            # Don't create metadata
            PhotoMetadata.objects.filter(photo=photo).delete()
            photos.append(photo)
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup.photos.add(*photos)
        
        # auto_select_best_photo should handle gracefully
        _result = dup.auto_select_best_photo()
        # Should return something (or None) without crashing

    def test_burst_detection_no_timestamps(self):
        """Test burst detection with photos lacking timestamps."""
        photos = []
        for _ in range(5):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = None
            photo.save()
            photos.append(photo)
        
        # Should not create burst stacks for photos without timestamps
        # (timestamps are required for burst proximity detection)


class MissingFileTestCase(TestCase):
    """Test handling of photos with missing files."""

    def setUp(self):
        self.user = create_test_user()

    def test_photo_with_null_main_file(self):
        """Test handling photo with null main_file reference."""
        photo = create_test_photo(owner=self.user)
        
        # This might not be allowed by the model, but test graceful handling
        # Note: Can't actually set main_file to None due to NOT NULL constraint
        # So we test that the photo with a valid file still works
        self.assertIsNotNone(photo.main_file)

    def test_stack_photos_with_missing_metadata(self):
        """Test stack with photos that have no PhotoMetadata records."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        
        # Delete metadata records
        PhotoMetadata.objects.filter(photo__in=photos).delete()
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        # Stack should still function
        self.assertEqual(stack.photos.count(), 3)


class ConcurrentDetectionTestCase(TransactionTestCase):
    """Test concurrent detection job handling."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_concurrent_duplicate_detection_requests(self):
        """Test handling multiple simultaneous detection requests."""
        # Create photos
        for _ in range(5):
            create_test_photo(owner=self.user)
        
        results = []
        errors = []
        
        def trigger_detection():
            try:
                response = self.client.post("/api/duplicates/detect")
                results.append(response.status_code)
            except Exception as e:
                errors.append(str(e))
        
        # Trigger multiple detections (simulated - they run sequentially in test)
        for _ in range(3):
            trigger_detection()
        
        # All requests should succeed (or be queued)
        for status in results:
            self.assertIn(status, [200, 202, 409])  # 409 = conflict if already running
        
        # No errors should occur
        self.assertEqual(len(errors), 0)

    def test_concurrent_stack_detection_requests(self):
        """Test handling multiple simultaneous stack detection requests."""
        # Create photos
        for _ in range(5):
            create_test_photo(owner=self.user)
        
        results = []
        
        for _ in range(3):
            response = self.client.post("/api/stacks/detect")
            results.append(response.status_code)
        
        # All requests should succeed or be handled gracefully
        for status in results:
            self.assertIn(status, [200, 202, 409])


class EmptyDataTestCase(APITestCase):
    """Test handling of empty or minimal data."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_duplicate_list_empty(self):
        """Test duplicate list with no duplicates."""
        response = self.client.get("/api/duplicates")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data.get("results", [])), 0)

    def test_stack_list_empty(self):
        """Test stack list with no stacks."""
        response = self.client.get("/api/stacks")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data.get("results", [])), 0)

    def test_duplicate_stats_empty(self):
        """Test duplicate stats with no data."""
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)

    def test_stack_stats_empty(self):
        """Test stack stats with no data."""
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)

    def test_detection_with_no_photos(self):
        """Test detection when user has no photos."""
        response = self.client.post("/api/duplicates/detect")
        # Should succeed but find nothing
        self.assertIn(response.status_code, [200, 202])

    def test_stack_detection_with_no_photos(self):
        """Test stack detection when user has no photos."""
        response = self.client.post("/api/stacks/detect")
        # Should succeed but find nothing
        self.assertIn(response.status_code, [200, 202])


class InvalidDataTestCase(APITestCase):
    """Test handling of invalid data inputs."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_resolve_with_invalid_photo_id(self):
        """Test resolve with invalid photo ID."""
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            {"kept_photo_id": "not-a-valid-uuid"},
            format="json"
        )
        self.assertIn(response.status_code, [400, 404])

    def test_add_to_stack_with_invalid_photo_ids(self):
        """Test adding invalid photo IDs to stack."""
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/add",
            {"photo_ids": ["invalid-id-1", "invalid-id-2"]},
            format="json"
        )
        # Should handle gracefully
        self.assertIn(response.status_code, [200, 400, 404])

    def test_set_primary_with_invalid_photo_id(self):
        """Test setting primary with invalid photo ID."""
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            {"photo_id": "not-a-uuid"},
            format="json"
        )
        self.assertIn(response.status_code, [400, 404])

    def test_detection_with_invalid_options(self):
        """Test detection with invalid options."""
        response = self.client.post(
            "/api/duplicates/detect",
            {"invalid_option": "value"},
            format="json"
        )
        # Should ignore invalid options and proceed
        self.assertIn(response.status_code, [200, 202, 400])


class SinglePhotoGroupTestCase(TestCase):
    """Test handling of single-photo groups."""

    def setUp(self):
        self.user = create_test_user()

    def test_duplicate_with_single_photo_deleted(self):
        """Test duplicate group cleanup when reduced to single photo."""
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        # Remove one photo
        dup.photos.remove(photos[0])
        
        # Group should still exist but may be cleaned up depending on implementation
        # The important thing is no crash occurs

    def test_stack_with_single_photo(self):
        """Test stack behavior with single photo."""
        photo = create_test_photo(owner=self.user)
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo)
        
        # Single photo stack is valid for manual stacks
        self.assertEqual(stack.photos.count(), 1)

    def test_auto_select_with_single_photo(self):
        """Test auto_select_primary with single photo."""
        photo = create_test_photo(owner=self.user)
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo)
        
        _result = stack.auto_select_primary()
        stack.refresh_from_db()
        
        # Should select the only photo
        self.assertEqual(stack.primary_photo, photo)


class PhotoDeletionEdgeCasesTestCase(TestCase):
    """Test edge cases around photo deletion."""

    def setUp(self):
        self.user = create_test_user()

    def test_delete_photo_in_multiple_stacks(self):
        """Test deleting a photo that's in multiple stacks."""
        photo = create_test_photo(owner=self.user)
        other_photos1 = [create_test_photo(owner=self.user) for _ in range(2)]
        other_photos2 = [create_test_photo(owner=self.user) for _ in range(2)]
        
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack1.photos.add(photo, *other_photos1)
        
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2.photos.add(photo, *other_photos2)
        
        # Delete the shared photo
        photo.manual_delete()
        
        # Both stacks should still exist with remaining photos
        stack1.refresh_from_db()
        stack2.refresh_from_db()
        self.assertEqual(stack1.photos.count(), 2)
        self.assertEqual(stack2.photos.count(), 2)

    def test_delete_photo_in_multiple_duplicate_groups(self):
        """Test deleting a photo that's in multiple duplicate groups."""
        photo = create_test_photo(owner=self.user)
        other_photos1 = [create_test_photo(owner=self.user)]
        other_photos2 = [create_test_photo(owner=self.user)]
        
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup1.photos.add(photo, *other_photos1)
        
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        dup2.photos.add(photo, *other_photos2)
        
        # Delete the shared photo
        photo.manual_delete()
        
        # Both groups should be cleaned up (single photo remaining)
        # Depending on implementation, they may be deleted or left with 1 photo

    def test_delete_primary_photo_from_stack(self):
        """Test deleting the primary photo from a stack."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photos[0],
        )
        stack.photos.add(*photos)
        
        # Delete the primary photo
        photos[0].manual_delete()
        
        stack.refresh_from_db()
        
        # Stack should still exist
        self.assertEqual(stack.photos.count(), 2)
        # Primary may be cleared or set to another photo depending on implementation


class MetadataEdgeCasesTestCase(TestCase):
    """Test edge cases for metadata handling."""

    def setUp(self):
        self.user = create_test_user()

    def test_photo_with_extreme_dimensions(self):
        """Test handling photos with extreme dimensions."""
        photo = create_test_photo(owner=self.user)
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=photo)
        
        # Very large dimensions
        metadata.width = 50000
        metadata.height = 50000
        metadata.save()
        
        # Should not crash on resolution calculation
        self.assertIsNotNone(metadata.resolution)

    def test_photo_with_zero_dimensions(self):
        """Test handling photos with zero dimensions."""
        photo = create_test_photo(owner=self.user)
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=photo)
        
        metadata.width = 0
        metadata.height = 0
        metadata.save()
        
        # Should handle gracefully
        self.assertEqual(metadata.width, 0)

    def test_duplicate_savings_with_zero_size(self):
        """Test potential savings calculation with zero-size photos."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        for photo in photos:
            photo.size = 0
            photo.save()
        
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        savings = dup.calculate_potential_savings()
        self.assertEqual(savings, 0)


================================================
FILE: api/tests/test_edit_photo_details.py
================================================
from unittest.mock import patch

from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photo, create_test_user


class EditPhotoDetailsTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    @patch("api.models.Photo._extract_date_time_from_exif", autospec=True)
    def test_should_update_timestamp(self, extract_date_time_from_exif_mock):
        photo = create_test_photo(owner=self.user1)

        payload = {"exif_timestamp": "1970-01-01T00:00:00.001Z"}
        headers = {"Content-Type": "application/json"}
        response = self.client.patch(
            f"/api/photos/edit/{photo.image_hash}/",
            format="json",
            data=payload,
            headers=headers,
        )
        data = response.json()

        self.assertEqual(200, response.status_code)
        self.assertEqual("1970-01-01T00:00:00.001000Z", data["timestamp"])
        self.assertEqual(photo.image_hash, data["image_hash"])
        self.assertIsNone(data["exif_timestamp"])
        self.assertEqual(0, data["rating"])
        self.assertFalse(data["hidden"])
        self.assertFalse(data["in_trashcan"])
        self.assertFalse(data["video"])
        extract_date_time_from_exif_mock.assert_called()

    @patch("api.models.Photo._extract_date_time_from_exif", autospec=True)
    def test_should_not_update_other_properties(self, extract_date_time_from_exif_mock):
        photo = create_test_photo(owner=self.user1)

        payload = {
            "timestamp": "1970-01-01T00:00:00.001Z",
            "image_hash": "BLAH-BLAH-BLAH-BLAH",
            "rating": 100,
            "deleted": True,
            "hidden": True,
            "in_trashcan": True,
            "video": True,
        }
        headers = {"Content-Type": "application/json"}
        response = self.client.patch(
            f"/api/photos/edit/{photo.image_hash}/",
            format="json",
            data=payload,
            headers=headers,
        )
        data = response.json()

        self.assertEqual(200, response.status_code)
        self.assertNotEqual(payload["timestamp"], data["timestamp"])
        self.assertNotEqual(payload["image_hash"], data["image_hash"])
        self.assertNotEqual(payload["rating"], data["rating"])
        self.assertNotEqual(payload["hidden"], data["hidden"])
        self.assertNotEqual(payload["in_trashcan"], data["in_trashcan"])
        self.assertNotEqual(payload["video"], data["video"])
        extract_date_time_from_exif_mock.assert_not_called()


================================================
FILE: api/tests/test_face_extractor.py
================================================
"""Tests for face_extractor module."""

from unittest.mock import MagicMock, patch

from django.test import TestCase

from api import face_extractor


class FaceExtractorTest(TestCase):
    """Test face extraction functionality."""

    @patch("api.face_extractor.get_face_locations")
    def test_extract_from_dlib_handles_exception(self, mock_get_face_locations):
        """Test that extract_from_dlib returns empty list when exception occurs."""
        # Setup: make get_face_locations raise an exception
        mock_get_face_locations.side_effect = Exception("Test exception")

        # Create a mock owner with face_recognition_model
        mock_owner = MagicMock()
        mock_owner.face_recognition_model = "hog"

        # Call the function
        result = face_extractor.extract_from_dlib(
            image_path="/path/to/image.jpg",
            big_thumbnail_path="/path/to/thumbnail.jpg",
            owner=mock_owner,
        )

        # Verify that it returns an empty list instead of raising UnboundLocalError
        self.assertEqual(result, [])

    @patch("api.face_extractor.get_face_locations")
    def test_extract_from_dlib_success(self, mock_get_face_locations):
        """Test that extract_from_dlib works correctly on success."""
        # Setup: make get_face_locations return some face locations
        mock_face_locations = [(10, 20, 30, 40), (50, 60, 70, 80)]
        mock_get_face_locations.return_value = mock_face_locations

        # Create a mock owner with face_recognition_model
        mock_owner = MagicMock()
        mock_owner.face_recognition_model = "hog"

        # Call the function
        result = face_extractor.extract_from_dlib(
            image_path="/path/to/image.jpg",
            big_thumbnail_path="/path/to/thumbnail.jpg",
            owner=mock_owner,
        )

        # Verify that it returns face locations with None appended
        expected = [(10, 20, 30, 40, None), (50, 60, 70, 80, None)]
        self.assertEqual(result, expected)

    @patch("api.face_extractor.extract_from_exif")
    @patch("api.face_extractor.extract_from_dlib")
    def test_extract_prefers_exif(self, mock_dlib, mock_exif):
        """Test that extract function prefers EXIF data over dlib."""
        # Setup: make extract_from_exif return some data
        mock_exif_data = [(10, 20, 30, 40, "John Doe")]
        mock_exif.return_value = mock_exif_data

        mock_owner = MagicMock()

        # Call the function
        result = face_extractor.extract(
            image_path="/path/to/image.jpg",
            big_thumbnail_path="/path/to/thumbnail.jpg",
            owner=mock_owner,
        )

        # Verify that it returns EXIF data and doesn't call dlib
        self.assertEqual(result, mock_exif_data)
        mock_dlib.assert_not_called()

    @patch("api.face_extractor.extract_from_exif")
    @patch("api.face_extractor.extract_from_dlib")
    def test_extract_fallback_to_dlib(self, mock_dlib, mock_exif):
        """Test that extract function falls back to dlib when no EXIF data."""
        # Setup: make extract_from_exif return None
        mock_exif.return_value = None
        mock_dlib_data = [(10, 20, 30, 40, None)]
        mock_dlib.return_value = mock_dlib_data

        mock_owner = MagicMock()

        # Call the function
        result = face_extractor.extract(
            image_path="/path/to/image.jpg",
            big_thumbnail_path="/path/to/thumbnail.jpg",
            owner=mock_owner,
        )

        # Verify that it returns dlib data
        self.assertEqual(result, mock_dlib_data)
        mock_dlib.assert_called_once()


================================================
FILE: api/tests/test_face_writeback.py
================================================
from unittest.mock import MagicMock, patch

from django.test import TestCase

from api.metadata.face_regions import (
    build_face_region_exiftool_args,
    get_face_region_tags,
    reverse_orientation_transform,
    thumbnail_coords_to_normalized,
)
from api.models.person import Person
from api.tests.utils import (
    create_test_face,
    create_test_person,
    create_test_photo,
    create_test_user,
)


class TestThumbnailCoordsToNormalized(TestCase):
    def test_basic_conversion(self):
        """Known pixel coords should produce expected normalized values."""
        # Face at center of a 1000x800 thumbnail
        # top=300, right=600, bottom=500, left=400
        x, y, w, h = thumbnail_coords_to_normalized(
            top=300,
            right=600,
            bottom=500,
            left=400,
            thumb_width=1000,
            thumb_height=800,
        )
        self.assertAlmostEqual(x, 0.5)  # center_x = (400+600)/2/1000
        self.assertAlmostEqual(y, 0.5)  # center_y = (300+500)/2/800
        self.assertAlmostEqual(w, 0.2)  # w = (600-400)/1000
        self.assertAlmostEqual(h, 0.25)  # h = (500-300)/800

    def test_corner_face(self):
        """Face in top-left corner."""
        x, y, w, h = thumbnail_coords_to_normalized(
            top=0,
            right=100,
            bottom=100,
            left=0,
            thumb_width=1000,
            thumb_height=1000,
        )
        self.assertAlmostEqual(x, 0.05)
        self.assertAlmostEqual(y, 0.05)
        self.assertAlmostEqual(w, 0.1)
        self.assertAlmostEqual(h, 0.1)


class TestReverseOrientationTransform(TestCase):
    def test_identity_for_normal_orientation(self):
        """Normal orientation should be a no-op."""
        x, y, w, h = reverse_orientation_transform(
            0.5, 0.3, 0.2, 0.1, "Horizontal (normal)"
        )
        self.assertAlmostEqual(x, 0.5)
        self.assertAlmostEqual(y, 0.3)
        self.assertAlmostEqual(w, 0.2)
        self.assertAlmostEqual(h, 0.1)

    def test_identity_for_none_orientation(self):
        """None orientation should be a no-op."""
        x, y, w, h = reverse_orientation_transform(0.5, 0.3, 0.2, 0.1, None)
        self.assertAlmostEqual(x, 0.5)
        self.assertAlmostEqual(y, 0.3)
        self.assertAlmostEqual(w, 0.2)
        self.assertAlmostEqual(h, 0.1)

    def test_round_trip_rotate_90_cw(self):
        """Forward then reverse for Rotate 90 CW should return original coords."""
        self._test_round_trip("Rotate 90 CW")

    def test_round_trip_mirror_horizontal(self):
        self._test_round_trip("Mirror horizontal")

    def test_round_trip_rotate_180(self):
        self._test_round_trip("Rotate 180")

    def test_round_trip_mirror_vertical(self):
        self._test_round_trip("Mirror vertical")

    def test_round_trip_rotate_270_cw(self):
        self._test_round_trip("Rotate 270 CW")

    def test_round_trip_mirror_horizontal_rotate_90_cw(self):
        self._test_round_trip("Mirror horizontal and rotate 90 CW")

    def _test_round_trip(self, orientation):
        """Apply forward transform (from face_extractor) then reverse, verify identity."""
        orig_x, orig_y, orig_w, orig_h = 0.4, 0.3, 0.2, 0.15

        # Apply forward transform (same logic as face_extractor.py lines 54-80)
        correct_x, correct_y = orig_x, orig_y
        correct_w, correct_h = orig_w, orig_h
        if orientation == "Rotate 90 CW":
            temp_x = correct_x
            correct_x = 1 - correct_y
            correct_y = temp_x
            correct_w, correct_h = correct_h, correct_w
        elif orientation == "Mirror horizontal":
            correct_x = 1 - correct_x
        elif orientation == "Rotate 180":
            correct_x = 1 - correct_x
            correct_y = 1 - correct_y
        elif orientation == "Mirror vertical":
            correct_y = 1 - correct_y
        elif orientation == "Mirror horizontal and rotate 270 CW":
            temp_x = correct_x
            correct_x = 1 - correct_y
            correct_y = temp_x
            correct_w, correct_h = correct_h, correct_w
        elif orientation == "Mirror horizontal and rotate 90 CW":
            temp_x = correct_x
            correct_x = correct_y
            correct_y = 1 - temp_x
            correct_w, correct_h = correct_h, correct_w
        elif orientation == "Rotate 270 CW":
            temp_x = correct_x
            correct_x = correct_y
            correct_y = 1 - temp_x
            correct_w, correct_h = correct_h, correct_w

        # Now reverse
        rx, ry, rw, rh = reverse_orientation_transform(
            correct_x, correct_y, correct_w, correct_h, orientation
        )
        self.assertAlmostEqual(
            rx, orig_x, places=10, msg=f"x mismatch for {orientation}"
        )
        self.assertAlmostEqual(
            ry, orig_y, places=10, msg=f"y mismatch for {orientation}"
        )
        self.assertAlmostEqual(
            rw, orig_w, places=10, msg=f"w mismatch for {orientation}"
        )
        self.assertAlmostEqual(
            rh, orig_h, places=10, msg=f"h mismatch for {orientation}"
        )


class TestBuildFaceRegionExiftoolArgs(TestCase):
    def test_single_face(self):
        """Single face region should produce correct structured tag."""
        regions = [{"name": "Alice", "x": 0.5, "y": 0.3, "w": 0.2, "h": 0.15}]
        result = build_face_region_exiftool_args(regions)
        self.assertIn("XMP-mwg-rs:RegionInfo", result)
        value = result["XMP-mwg-rs:RegionInfo"]
        self.assertIn("Alice", value)
        self.assertIn("Type=Face", value)
        self.assertIn("Unit=normalized", value)
        self.assertIn("RegionList=", value)

    def test_multiple_faces(self):
        """Multiple face regions should all appear in RegionList."""
        regions = [
            {"name": "Alice", "x": 0.3, "y": 0.3, "w": 0.1, "h": 0.1},
            {"name": "Bob", "x": 0.7, "y": 0.5, "w": 0.15, "h": 0.2},
            {"name": "Charlie", "x": 0.5, "y": 0.8, "w": 0.12, "h": 0.1},
        ]
        result = build_face_region_exiftool_args(regions)
        value = result["XMP-mwg-rs:RegionInfo"]
        self.assertIn("Alice", value)
        self.assertIn("Bob", value)
        self.assertIn("Charlie", value)

    def test_special_characters_in_name(self):
        """Person names with commas, braces, equals should be escaped."""
        regions = [{"name": "O'Brien, Jr.", "x": 0.5, "y": 0.5, "w": 0.1, "h": 0.1}]
        result = build_face_region_exiftool_args(regions)
        value = result["XMP-mwg-rs:RegionInfo"]
        # Comma should be escaped
        self.assertIn("O'Brien\\, Jr.", value)

    def test_escape_braces_and_equals(self):
        """Braces and equals in names should be escaped."""
        regions = [{"name": "Test{=}", "x": 0.5, "y": 0.5, "w": 0.1, "h": 0.1}]
        result = build_face_region_exiftool_args(regions)
        value = result["XMP-mwg-rs:RegionInfo"]
        self.assertIn("Test\\{\\=\\}", value)

    def test_applied_to_dimensions(self):
        """AppliedToDimensions should be included when image dimensions are provided."""
        regions = [{"name": "Alice", "x": 0.5, "y": 0.3, "w": 0.2, "h": 0.15}]
        result = build_face_region_exiftool_args(regions, image_width=4000, image_height=3000)
        value = result["XMP-mwg-rs:RegionInfo"]
        self.assertIn("AppliedToDimensions={W=4000,H=3000,Unit=pixel}", value)

    def test_no_applied_to_dimensions_when_missing(self):
        """AppliedToDimensions should be omitted when image dimensions are not available."""
        regions = [{"name": "Alice", "x": 0.5, "y": 0.3, "w": 0.2, "h": 0.15}]
        result = build_face_region_exiftool_args(regions)
        value = result["XMP-mwg-rs:RegionInfo"]
        self.assertNotIn("AppliedToDimensions", value)

    def test_subject_keywords_for_named_faces(self):
        """Named faces should be added as XMP:Subject keywords."""
        regions = [
            {"name": "Alice", "x": 0.3, "y": 0.3, "w": 0.1, "h": 0.1},
            {"name": "Bob", "x": 0.7, "y": 0.5, "w": 0.15, "h": 0.2},
            {"name": "", "x": 0.5, "y": 0.8, "w": 0.12, "h": 0.1},
        ]
        result = build_face_region_exiftool_args(regions)
        self.assertIn("XMP:Subject", result)
        self.assertEqual(result["XMP:Subject"], ["Alice", "Bob"])

    def test_no_subject_keywords_when_all_unnamed(self):
        """No XMP:Subject should be set when all faces are unnamed."""
        regions = [
            {"name": "", "x": 0.3, "y": 0.3, "w": 0.1, "h": 0.1},
        ]
        result = build_face_region_exiftool_args(regions)
        self.assertNotIn("XMP:Subject", result)


class TestRoundTripCoordinates(TestCase):
    def test_round_trip_no_orientation(self):
        """Pixel coords -> normalize -> (simulate XMP read-back) -> verify ~= original."""
        thumb_width = 1000
        thumb_height = 800
        orig_top, orig_right, orig_bottom, orig_left = 200, 600, 400, 400

        # Step 1: Convert pixel -> normalized (writeback path)
        x, y, w, h = thumbnail_coords_to_normalized(
            orig_top,
            orig_right,
            orig_bottom,
            orig_left,
            thumb_width,
            thumb_height,
        )

        # Step 2: Simulate read-back (face_extractor.py lines 82-90)
        half_width = (w * thumb_width) / 2
        half_height = (h * thumb_height) / 2
        read_top = int((y * thumb_height) - half_height)
        read_right = int((x * thumb_width) + half_width)
        read_bottom = int((y * thumb_height) + half_height)
        read_left = int((x * thumb_width) - half_width)

        # Verify within 1px tolerance (int rounding)
        self.assertAlmostEqual(read_top, orig_top, delta=1)
        self.assertAlmostEqual(read_right, orig_right, delta=1)
        self.assertAlmostEqual(read_bottom, orig_bottom, delta=1)
        self.assertAlmostEqual(read_left, orig_left, delta=1)


class TestGetFaceRegionTags(TestCase):
    def setUp(self):
        self.user = create_test_user()

    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_returns_tags_for_labeled_faces(self, mock_pil_open, mock_get_metadata):
        """get_face_region_tags should return a dict with RegionInfo for labeled faces."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        person = create_test_person(
            name="Alice", kind=Person.KIND_USER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=person,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        tags = get_face_region_tags(photo)

        self.assertIn("XMP-mwg-rs:RegionInfo", tags)
        self.assertIn("Alice", tags["XMP-mwg-rs:RegionInfo"])
        # AppliedToDimensions should be present
        self.assertIn(
            "AppliedToDimensions={W=4000,H=3000,Unit=pixel}",
            tags["XMP-mwg-rs:RegionInfo"],
        )
        # XMP:Subject should contain the person name
        self.assertIn("XMP:Subject", tags)
        self.assertEqual(tags["XMP:Subject"], ["Alice"])

    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_returns_all_faces(self, mock_pil_open, mock_get_metadata):
        """Photo with 3 labeled faces should have all 3 in the returned tags."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        for name in ["Alice", "Bob", "Charlie"]:
            person = create_test_person(
                name=name, kind=Person.KIND_USER, cluster_owner=self.user
            )
            create_test_face(
                photo=photo,
                person=person,
                location_top=100,
                location_right=300,
                location_bottom=300,
                location_left=100,
            )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        tags = get_face_region_tags(photo)

        value = tags["XMP-mwg-rs:RegionInfo"]
        self.assertIn("Alice", value)
        self.assertIn("Bob", value)
        self.assertIn("Charlie", value)

    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_unlabeled_faces_written_with_empty_name(
        self, mock_pil_open, mock_get_metadata
    ):
        """Faces without a KIND_USER person should be written with an empty name."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        cluster_person = create_test_person(
            name="cluster_0001", kind=Person.KIND_CLUSTER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=cluster_person,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        tags = get_face_region_tags(photo)

        self.assertIn("XMP-mwg-rs:RegionInfo", tags)
        value = tags["XMP-mwg-rs:RegionInfo"]
        # Should have the face region but with empty name
        self.assertIn("Name=,Type=Face", value)
        self.assertNotIn("cluster_0001", value)

    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_faces_with_no_person_written_with_empty_name(
        self, mock_pil_open, mock_get_metadata
    ):
        """Faces with person=None should be written with an empty name."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        create_test_face(
            photo=photo,
            person=None,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        tags = get_face_region_tags(photo)

        self.assertIn("XMP-mwg-rs:RegionInfo", tags)
        value = tags["XMP-mwg-rs:RegionInfo"]
        self.assertIn("Name=,Type=Face", value)

    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_mixed_labeled_and_unlabeled_faces(
        self, mock_pil_open, mock_get_metadata
    ):
        """Photo with both labeled and unlabeled faces should include all."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        labeled_person = create_test_person(
            name="Alice", kind=Person.KIND_USER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=labeled_person,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )
        cluster_person = create_test_person(
            name="cluster_0001", kind=Person.KIND_CLUSTER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=cluster_person,
            location_top=400,
            location_right=600,
            location_bottom=600,
            location_left=400,
        )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        tags = get_face_region_tags(photo)

        value = tags["XMP-mwg-rs:RegionInfo"]
        self.assertIn("Alice", value)
        self.assertNotIn("cluster_0001", value)
        # Should have 2 face regions
        self.assertEqual(value.count("Type=Face"), 2)

    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_skips_deleted_faces(self, mock_pil_open, mock_get_metadata):
        """Deleted faces should not be included in the tags."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        person = create_test_person(
            name="Active", kind=Person.KIND_USER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=person,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )
        deleted_person = create_test_person(
            name="Deleted", kind=Person.KIND_USER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=deleted_person,
            deleted=True,
            location_top=400,
            location_right=600,
            location_bottom=600,
            location_left=400,
        )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        tags = get_face_region_tags(photo)

        value = tags["XMP-mwg-rs:RegionInfo"]
        self.assertIn("Active", value)
        self.assertNotIn("Deleted", value)


class TestSaveMetadataIntegration(TestCase):
    def setUp(self):
        self.user = create_test_user()

    @patch("api.models.photo.write_metadata")
    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_save_metadata_with_face_tags(
        self, mock_pil_open, mock_get_metadata, mock_write_metadata
    ):
        """_save_metadata(metadata_types=["face_tags"]) should write face regions."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        person = create_test_person(
            name="Test Person", kind=Person.KIND_USER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=person,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        photo._save_metadata(use_sidecar=True, metadata_types=["face_tags"])

        mock_write_metadata.assert_called_once()
        tags = mock_write_metadata.call_args[0][1]
        self.assertIn("XMP-mwg-rs:RegionInfo", tags)
        self.assertIn("Test Person", tags["XMP-mwg-rs:RegionInfo"])

    @patch("api.models.photo.write_metadata")
    def test_save_metadata_default_does_not_write_face_tags(self, mock_write_metadata):
        """_save_metadata() with default args should NOT write face tags."""
        photo = create_test_photo(owner=self.user)
        person = create_test_person(
            name="Test Person", kind=Person.KIND_USER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=person,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )

        # Default call (no metadata_types) — should only consider ratings
        photo._save_metadata()

        # Rating is 0 by default and there are no modified_fields=None,
        # so it will write the rating tag
        if mock_write_metadata.called:
            tags = mock_write_metadata.call_args[0][1]
            self.assertNotIn("XMP-mwg-rs:RegionInfo", tags)

    @patch("api.models.photo.write_metadata")
    @patch("api.metadata.face_regions.get_metadata")
    @patch("api.metadata.face_regions.PIL.Image.open")
    def test_save_metadata_combined_types(
        self, mock_pil_open, mock_get_metadata, mock_write_metadata
    ):
        """_save_metadata with both types should write ratings AND face tags together."""
        photo = create_test_photo(
            owner=self.user, thumbnail_big="thumbnails_big/test.jpg"
        )
        photo.rating = 5
        person = create_test_person(
            name="Alice", kind=Person.KIND_USER, cluster_owner=self.user
        )
        create_test_face(
            photo=photo,
            person=person,
            location_top=100,
            location_right=300,
            location_bottom=300,
            location_left=100,
        )

        mock_img = MagicMock()
        mock_img.size = (1000, 800)
        mock_pil_open.return_value = mock_img
        mock_get_metadata.return_value = (None, 4000, 3000)

        photo._save_metadata(use_sidecar=True, metadata_types=["ratings", "face_tags"])

        mock_write_metadata.assert_called_once()
        tags = mock_write_metadata.call_args[0][1]
        self.assertIn("Rating", tags)
        self.assertEqual(tags["Rating"], 5)
        self.assertIn("XMP-mwg-rs:RegionInfo", tags)
        self.assertIn("Alice", tags["XMP-mwg-rs:RegionInfo"])


================================================
FILE: api/tests/test_favorite_photos.py
================================================
from unittest.mock import patch

from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photos, create_test_user


class FavoritePhotosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user(favorite_min_rating=1)
        self.user2 = create_test_user(favorite_min_rating=1)
        self.client.force_authenticate(user=self.user1)

    def test_tag_my_photos_as_favorite(self):
        photos = create_test_photos(number_of_photos=3, owner=self.user1)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "favorite": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/favorite/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(3, len(data["results"]))
        self.assertEqual(3, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))

    def test_untag_my_photos_as_favorite(self):
        photos1 = create_test_photos(
            number_of_photos=1, owner=self.user1, rating=self.user1.favorite_min_rating
        )
        photos2 = create_test_photos(number_of_photos=2, owner=self.user1)
        image_hashes = [p.image_hash for p in photos1 + photos2]

        payload = {"image_hashes": image_hashes, "favorite": False}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/favorite/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(1, len(data["results"]))
        self.assertEqual(1, len(data["updated"]))
        self.assertEqual(2, len(data["not_updated"]))

    def test_tag_photos_of_other_user_as_favorite(self):
        photos = create_test_photos(number_of_photos=2, owner=self.user2)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "favorite": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/favorite/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        # Photos not owned by user are treated as "missing" for security (no info leak)
        self.assertEqual(0, len(data["not_updated"]))

    @patch("api.views.photos.logger.warning", autospec=True)
    def test_tag_nonexistent_photo_as_favorite(self, logger):
        payload = {"image_hashes": ["nonexistent_photo"], "favorite": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/favorite/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))
        logger.assert_called_with(
            "Could not set photo nonexistent_photo to favorite. It does not exist or is not owned by user."
        )


================================================
FILE: api/tests/test_file_model.py
================================================
import importlib.machinery
import importlib.util
import sys
import types
import unittest
from unittest.mock import patch


def _ensure_stub_modules():
    if "django" not in sys.modules:
        django_module = types.ModuleType("django")
        django_db_module = types.ModuleType("django.db")
        django_db_models_module = types.ModuleType("django.db.models")

        class DummyModel:
            pass

        def dummy_field(*args, **kwargs):
            return None

        django_db_models_module.Model = DummyModel
        django_db_models_module.CharField = dummy_field
        django_db_models_module.TextField = dummy_field
        django_db_models_module.PositiveIntegerField = dummy_field
        django_db_models_module.BooleanField = dummy_field
        django_db_models_module.ManyToManyField = dummy_field

        django_module.db = django_db_module
        django_db_module.models = django_db_models_module
        django_module.__path__ = []
        django_db_module.__path__ = []
        django_module.__spec__ = importlib.machinery.ModuleSpec(
            "django", loader=None, is_package=True
        )
        django_db_module.__spec__ = importlib.machinery.ModuleSpec(
            "django.db", loader=None, is_package=True
        )
        django_db_models_module.__spec__ = importlib.machinery.ModuleSpec(
            "django.db.models", loader=None
        )

        sys.modules["django"] = django_module
        sys.modules["django.db"] = django_db_module
        sys.modules["django.db.models"] = django_db_models_module

    if "magic" not in sys.modules:
        magic_module = types.ModuleType("magic")

        class Magic:
            def __init__(self, *args, **kwargs):
                pass

            def from_file(self, path):
                return "application/octet-stream"

        magic_module.Magic = Magic
        magic_module.__spec__ = importlib.machinery.ModuleSpec("magic", loader=None)
        sys.modules["magic"] = magic_module

    if "pyvips" not in sys.modules:
        pyvips_module = types.ModuleType("pyvips")

        class Image:
            @staticmethod
            def thumbnail(*args, **kwargs):
                raise NotImplementedError

        class Enums:
            class Size:
                DOWN = "down"

        pyvips_module.Image = Image
        pyvips_module.enums = Enums
        pyvips_module.__spec__ = importlib.machinery.ModuleSpec(
            "pyvips", loader=None
        )
        sys.modules["pyvips"] = pyvips_module

    if "api" not in sys.modules:
        api_module = types.ModuleType("api")
        api_module.__path__ = []
        api_module.__spec__ = importlib.machinery.ModuleSpec(
            "api", loader=None, is_package=True
        )

        util_module = types.ModuleType("api.util")

        class Logger:
            def error(self, *args, **kwargs):
                pass

        util_module.logger = Logger()
        util_module.__spec__ = importlib.machinery.ModuleSpec("api.util", loader=None)
        util_module.__file__ = "<stub>"

        models_module = types.ModuleType("api.models")
        models_module.__path__ = []
        models_module.__spec__ = importlib.machinery.ModuleSpec(
            "api.models", loader=None, is_package=True
        )

        api_module.util = util_module
        api_module.models = models_module

        sys.modules["api"] = api_module
        sys.modules["api.util"] = util_module
        sys.modules["api.models"] = models_module

    if "exiftool" not in sys.modules:
        exiftool_module = types.ModuleType("exiftool")
        exiftool_module.__spec__ = importlib.machinery.ModuleSpec(
            "exiftool", loader=None
        )
        sys.modules["exiftool"] = exiftool_module

    if "requests" not in sys.modules:
        requests_module = types.ModuleType("requests")
        requests_module.__spec__ = importlib.machinery.ModuleSpec(
            "requests", loader=None
        )
        sys.modules["requests"] = requests_module

    if "django.conf" not in sys.modules:
        django_conf_module = types.ModuleType("django.conf")
        django_conf_module.settings = types.SimpleNamespace(LOGS_ROOT="/tmp")
        django_conf_module.__spec__ = importlib.machinery.ModuleSpec(
            "django.conf", loader=None, is_package=True
        )
        sys.modules["django.conf"] = django_conf_module


def _load_file_module():
    _ensure_stub_modules()
    # Use a unique module name to avoid conflicting with Django's registry
    module_name = "api.models.file._test_stub"
    if module_name in sys.modules:
        return sys.modules[module_name]
    spec = importlib.util.spec_from_file_location(
        module_name, "api/models/file.py"
    )
    module = importlib.util.module_from_spec(spec)
    sys.modules[module_name] = module
    spec.loader.exec_module(module)
    return module


class TestIsVideo(unittest.TestCase):
    @classmethod
    def setUpClass(cls):
        # Only load the module when this specific test class runs
        # Skip if Django models are already loaded to avoid double registration
        if "api.models.file" in sys.modules:
            cls._file_module = sys.modules["api.models.file"]
        else:
            cls._file_module = _load_file_module()

    def test_is_video_returns_false_when_magic_raises(self):
        class FailingMagic:
            def from_file(self, path):
                raise RuntimeError("magic failure")

        with patch.object(
            self._file_module.magic, "Magic", return_value=FailingMagic()
        ):
            self.assertFalse(self._file_module.is_video("/tmp/test.mp4"))


================================================
FILE: api/tests/test_file_path_uniqueness.py
================================================
"""
Tests for File path uniqueness enforcement.

Tests verify:
- Database unique constraint on File.path
- File.create() get_or_create pattern
- Migration deduplication logic
- Concurrent scan handling
"""

import os
import tempfile
import threading

from django.db import IntegrityError, transaction
from django.test import TestCase, TransactionTestCase

from api.models.file import File
from api.tests.utils import create_test_photo, create_test_user


class FilePathUniqueConstraintTestCase(TestCase):
    """Tests for the unique constraint on File.path."""

    def setUp(self):
        self.user = create_test_user()

    def test_unique_constraint_prevents_duplicate_paths(self):
        """Test that the database prevents creating two Files with the same path."""
        path = "/photos/test_image.jpg"
        
        # Create first file
        _file1 = File.objects.create(
            hash="hash1" + "a" * 28,
            path=path,
            type=File.IMAGE,
        )
        
        # Attempting to create second file with same path should fail
        with self.assertRaises(IntegrityError):
            with transaction.atomic():
                File.objects.create(
                    hash="hash2" + "b" * 28,
                    path=path,
                    type=File.IMAGE,
                )

    def test_unique_constraint_allows_different_paths(self):
        """Test that different paths are allowed."""
        file1 = File.objects.create(
            hash="hash1" + "a" * 28,
            path="/photos/image1.jpg",
            type=File.IMAGE,
        )
        file2 = File.objects.create(
            hash="hash2" + "b" * 28,
            path="/photos/image2.jpg",
            type=File.IMAGE,
        )
        
        self.assertEqual(File.objects.count(), 2)
        self.assertNotEqual(file1.path, file2.path)

    def test_empty_paths_are_unique(self):
        """Test that empty paths are subject to unique constraint."""
        # First empty path file
        _file1 = File.objects.create(
            hash="hash1" + "a" * 28,
            path="",
            type=File.IMAGE,
        )
        
        # Second empty path should fail
        with self.assertRaises(IntegrityError):
            with transaction.atomic():
                File.objects.create(
                    hash="hash2" + "b" * 28,
                    path="",
                    type=File.IMAGE,
                )


class FileCreateMethodTestCase(TestCase):
    """Tests for File.create() get_or_create pattern."""

    def setUp(self):
        self.user = create_test_user()
        # Create a temp directory for test files
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        # Clean up temp files
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def _create_test_file(self, filename, content=b"test content"):
        """Helper to create a test file on disk."""
        path = os.path.join(self.temp_dir, filename)
        with open(path, "wb") as f:
            f.write(content)
        return path

    def test_create_returns_existing_file_for_same_path(self):
        """Test that File.create() returns existing File for same path."""
        path = self._create_test_file("test.jpg")
        
        # Create first file
        file1 = File.create(path, self.user)
        
        # Create second file with same path - should return existing
        file2 = File.create(path, self.user)
        
        # Should be the same file
        self.assertEqual(file1.hash, file2.hash)
        self.assertEqual(file1.path, file2.path)
        
        # Should only have one File in database
        self.assertEqual(File.objects.filter(path=path).count(), 1)

    def test_create_creates_new_file_for_different_path(self):
        """Test that File.create() creates new File for different path."""
        path1 = self._create_test_file("test1.jpg", b"content1")
        path2 = self._create_test_file("test2.jpg", b"content2")
        
        file1 = File.create(path1, self.user)
        file2 = File.create(path2, self.user)
        
        self.assertNotEqual(file1.hash, file2.hash)
        self.assertNotEqual(file1.path, file2.path)
        self.assertEqual(File.objects.count(), 2)

    def test_create_returns_existing_even_if_content_changed(self):
        """Test that File.create() returns existing File even if content changed."""
        path = self._create_test_file("test.jpg", b"original content")
        
        # Create first file
        file1 = File.create(path, self.user)
        original_hash = file1.hash
        
        # Modify file content
        with open(path, "wb") as f:
            f.write(b"modified content")
        
        # Create again - should return existing File (not recalculate hash)
        file2 = File.create(path, self.user)
        
        # Should return existing file (hash stays the same)
        self.assertEqual(file1.hash, file2.hash)
        self.assertEqual(file2.hash, original_hash)

    def test_create_determines_correct_file_type(self):
        """Test that File.create() correctly determines file type."""
        # Create image file
        img_path = self._create_test_file("photo.jpg")
        img_file = File.create(img_path, self.user)
        self.assertEqual(img_file.type, File.IMAGE)
        
        # Create RAW file
        raw_path = self._create_test_file("photo.CR2")
        raw_file = File.create(raw_path, self.user)
        self.assertEqual(raw_file.type, File.RAW_FILE)
        
        # Create metadata file
        xmp_path = self._create_test_file("photo.xmp")
        xmp_file = File.create(xmp_path, self.user)
        self.assertEqual(xmp_file.type, File.METADATA_FILE)


class MigrationDeduplicationTestCase(TestCase):
    """Tests for the migration deduplication logic."""

    def setUp(self):
        self.user = create_test_user()

    def test_deduplication_prefers_non_missing_file(self):
        """Test that deduplication logic prefers non-missing files.
        
        This tests the scoring logic that the migration uses.
        """
        # Create two files to simulate pre-migration state
        file_missing = File.objects.create(
            hash="hash_missing" + "a" * 21,
            path="/photos/missing_file.jpg",
            type=File.IMAGE,
            missing=True,
        )
        file_ok = File.objects.create(
            hash="hash_ok" + "a" * 25,
            path="/photos/ok_file.jpg",
            type=File.IMAGE,
            missing=False,
        )
        
        # Scoring logic: non-missing files get +100
        def score_file(f):
            score = 0
            if not f.missing:
                score += 100
            return score
        
        # Non-missing file should have higher score
        self.assertGreater(score_file(file_ok), score_file(file_missing))

    def test_deduplication_keeps_file_with_more_photos(self):
        """Test that deduplication prefers files linked to more photos."""
        _path = "/photos/popular.jpg"
        
        # Create two files
        file_popular = File.objects.create(
            hash="hash_popular" + "a" * 20,
            path="/photos/popular1.jpg",
            type=File.IMAGE,
        )
        file_lonely = File.objects.create(
            hash="hash_lonely" + "a" * 21,
            path="/photos/lonely1.jpg",
            type=File.IMAGE,
        )
        
        # Link popular file to multiple photos
        for i in range(3):
            photo = create_test_photo(owner=self.user)
            photo.files.add(file_popular)
            photo.save()
        
        # Link lonely file to one photo
        photo = create_test_photo(owner=self.user)
        photo.files.add(file_lonely)
        photo.save()
        
        # Verify photo counts
        self.assertEqual(file_popular.photo_set.count(), 3)
        self.assertEqual(file_lonely.photo_set.count(), 1)


class ConcurrentScanTestCase(TransactionTestCase):
    """Tests for concurrent scan handling with unique constraint."""

    def setUp(self):
        self.user = create_test_user()
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def _create_test_file(self, filename, content=b"test content"):
        """Helper to create a test file on disk."""
        path = os.path.join(self.temp_dir, filename)
        with open(path, "wb") as f:
            f.write(content)
        return path

    def test_concurrent_create_same_path_no_duplicates(self):
        """Test that concurrent File.create() calls don't create duplicates."""
        path = self._create_test_file("concurrent_test.jpg")
        results = []
        errors = []
        
        def create_file():
            try:
                file = File.create(path, self.user)
                results.append(file.hash)
            except Exception as e:
                errors.append(str(e))
        
        # Run multiple threads trying to create the same file
        threads = []
        for _ in range(5):
            t = threading.Thread(target=create_file)
            threads.append(t)
        
        for t in threads:
            t.start()
        
        for t in threads:
            t.join()
        
        # All should succeed (due to get_or_create pattern)
        self.assertEqual(len(errors), 0, f"Errors occurred: {errors}")
        
        # All should return the same file
        self.assertTrue(len(set(results)) <= 1, 
            f"Expected same hash for all, got: {results}")
        
        # Should only have one File in database
        self.assertEqual(File.objects.filter(path=path).count(), 1)

    def test_concurrent_create_different_paths_succeeds(self):
        """Test that concurrent creates of different paths all succeed."""
        paths = [
            self._create_test_file(f"concurrent_test_{i}.jpg", f"content{i}".encode())
            for i in range(5)
        ]
        results = []
        
        def create_file(path):
            file = File.create(path, self.user)
            results.append(file.hash)
        
        threads = []
        for path in paths:
            t = threading.Thread(target=create_file, args=(path,))
            threads.append(t)
        
        for t in threads:
            t.start()
        
        for t in threads:
            t.join()
        
        # All 5 files should be created
        self.assertEqual(len(results), 5)
        self.assertEqual(File.objects.count(), 5)


class FilePathLookupTestCase(TestCase):
    """Tests for path-based lookups."""

    def setUp(self):
        self.user = create_test_user()

    def test_filter_by_path_is_exact(self):
        """Test that filtering by path is exact match."""
        file1 = File.objects.create(
            hash="hash1" + "a" * 28,
            path="/photos/image.jpg",
            type=File.IMAGE,
        )
        _file2 = File.objects.create(
            hash="hash2" + "b" * 28,
            path="/photos/image2.jpg",
            type=File.IMAGE,
        )
        
        # Exact match should find only one
        result = File.objects.filter(path="/photos/image.jpg")
        self.assertEqual(result.count(), 1)
        self.assertEqual(result.first().hash, file1.hash)

    def test_photo_files_path_lookup(self):
        """Test that Photo.files.filter(path=...) works correctly."""
        file1 = File.objects.create(
            hash="hash1" + "a" * 28,
            path="/photos/image1.jpg",
            type=File.IMAGE,
        )
        file2 = File.objects.create(
            hash="hash2" + "b" * 28,
            path="/photos/image2.jpg",
            type=File.IMAGE,
        )
        
        photo = create_test_photo(owner=self.user)
        photo.files.add(file1, file2)
        
        # Should find exact path
        self.assertTrue(photo.files.filter(path="/photos/image1.jpg").exists())
        self.assertFalse(photo.files.filter(path="/photos/image3.jpg").exists())


class PhotoFileAssociationTestCase(TestCase):
    """Tests for Photo-File associations with unique path constraint."""

    def setUp(self):
        self.user = create_test_user()

    def test_multiple_photos_can_share_same_file(self):
        """Test that multiple Photos can reference the same File."""
        file = File.objects.create(
            hash="shared_hash" + "a" * 23,
            path="/photos/shared_image.jpg",
            type=File.IMAGE,
        )
        
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        photo1.files.add(file)
        photo1.main_file = file
        photo1.save()
        
        photo2.files.add(file)
        photo2.main_file = file
        photo2.save()
        
        # Both photos should reference the same file
        self.assertEqual(photo1.main_file.hash, photo2.main_file.hash)
        self.assertEqual(file.photo_set.count(), 2)

    def test_photo_with_multiple_file_variants(self):
        """Test Photo with multiple file variants (JPEG + RAW)."""
        jpeg_file = File.objects.create(
            hash="jpeg_hash" + "a" * 24,
            path="/photos/image.jpg",
            type=File.IMAGE,
        )
        raw_file = File.objects.create(
            hash="raw_hash" + "a" * 25,
            path="/photos/image.CR2",
            type=File.RAW_FILE,
        )

        photo = create_test_photo(owner=self.user)
        photo.files.add(jpeg_file, raw_file)
        photo.main_file = jpeg_file
        photo.save()

        # Photo should have both explicitly added files
        # Note: create_test_photo sets main_file but doesn't add it to photo.files
        self.assertEqual(photo.files.count(), 2)
        self.assertTrue(photo.files.filter(path="/photos/image.jpg").exists())
        self.assertTrue(photo.files.filter(path="/photos/image.CR2").exists())


================================================
FILE: api/tests/test_geocode.py
================================================
from unittest.mock import patch

from constance.test import override_config
from django.test import TestCase

from api.geocode.geocode import reverse_geocode
from api.geocode.parsers.mapbox import parse as parse_mapbox
from api.geocode.parsers.nominatim import parse as parse_nominatim
from api.geocode.parsers.opencage import parse as parse_opencage
from api.geocode.parsers.tomtom import parse as parse_tomtom
from api.tests.fixtures.geocode.expectations.mapbox import (
    expectations as mapbox_expectations,
)
from api.tests.fixtures.geocode.expectations.nominatim import (
    expectations as nominatim_expectations,
)
from api.tests.fixtures.geocode.expectations.opencage import (
    expectations as opencage_expectations,
)
from api.tests.fixtures.geocode.expectations.tomtom import (
    expectations as tomtom_expectations,
)
from api.tests.fixtures.geocode.responses.mapbox import responses as mapbox_responses
from api.tests.fixtures.geocode.responses.nominatim import (
    responses as nominatim_responses,
)
from api.tests.fixtures.geocode.responses.opencage import (
    responses as opencage_responses,
)
from api.tests.fixtures.geocode.responses.tomtom import responses as tomtom_responses


class MapboxLocation:
    def __init__(self, raw):
        self.raw = raw
        self.address = raw["place_name"]


class TomTomLocation:
    def __init__(self, raw):
        self.raw = raw
        self.address = raw["address"]["freeformAddress"]


class NominatimLocation:
    def __init__(self, raw):
        self.raw = raw
        self.address = raw["display_name"]


class OpenCageLocation:
    def __init__(self, raw):
        self.raw = raw
        self.address = raw["formatted"]


class TestGeocodeParsers(TestCase):
    def test_mapbox_parser(self):
        for index, raw in enumerate(mapbox_responses):
            self.assertEqual(
                parse_mapbox(MapboxLocation(raw)), mapbox_expectations[index]
            )

    def test_tomtom_parser(self):
        for index, raw in enumerate(tomtom_responses):
            self.assertEqual(
                parse_tomtom(TomTomLocation(raw)), tomtom_expectations[index]
            )

    def test_nominatim_parser(self):
        for index, raw in enumerate(nominatim_responses):
            self.assertEqual(
                parse_nominatim(NominatimLocation(raw)), nominatim_expectations[index]
            )

    def test_opencage_parser(self):
        for index, raw in enumerate(opencage_responses):
            self.assertEqual(
                parse_opencage(OpenCageLocation(raw)), opencage_expectations[index]
            )


class FakeLocation:
    raw = None
    address = None

    def __init__(self, location):
        self.raw = location
        self.address = location["place_name"]


class FakeProvider:
    def __init__(self, response):
        self.response = response

    def reverse(self, _):
        return FakeLocation(self.response)


def fake_geocoder(response):
    return lambda **_: FakeProvider(response)


class TestGeocoder(TestCase):
    @override_config(MAP_API_PROVIDER="mapbox")
    @patch("geopy.get_geocoder_for_service", autospec=True)
    def test_reverse_geocode(self, get_geocoder_for_service_mock):
        get_geocoder_for_service_mock.return_value = fake_geocoder(mapbox_responses[1])
        result = reverse_geocode(0, 0)
        self.assertEqual(result, mapbox_expectations[1])

    @override_config(MAP_API_PROVIDER="mapbox")
    @override_config(MAP_API_KEY="")
    def test_reverse_geocode_no_api_key(self):
        result = reverse_geocode(0, 0)
        self.assertEqual(result, {})


================================================
FILE: api/tests/test_get_faces.py
================================================
from django.test import TestCase
from django.urls import reverse
from rest_framework.test import APIClient

from api.tests.utils import (
    create_test_face,
    create_test_person,
    create_test_photo,
    create_test_user,
)


class IncompleteFacesTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_if_classification_person_is_ignored_if_below_threshold(self):
        """Test if unknown faces with classification are returned. Only classification_probability and min_confidence should be looked into."""
        person = create_test_person(cluster_owner=self.user)
        create_test_face(
            photo=self.photo,
            classification_person=person,
            classification_probability=0.4,
        )

        response = self.client.get(
            reverse("incomplete_faces-list"),
            {
                "inferred": "true",
                "analysis_method": "classification",
                "min_confidence": "0.5",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data), 1)
        self.assertIn(
            "Unknown - Other", response.data[0]["name"]
        )  # Ensure unknown face is returned

    def test_if_min_confidence_and_prob_are_compared_correctly(
        self,
    ):
        """Test that incomplete faces with classification analysis method are returned properly."""
        create_test_face(
            photo=self.photo,
            classification_probability=0.3,
        )
        create_test_face(
            photo=self.photo,
            classification_probability=0.4,
        )
        create_test_face(
            photo=self.photo,
            classification_probability=0.6,
        )

        response = self.client.get(
            reverse("incomplete_faces-list"),
            {
                "inferred": "true",
                "analysis_method": "classification",
                "min_confidence": "0.5",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertIn(
            "Unknown - Other", response.data[0]["name"]
        )  # Ensure unknown face is returned
        # face count should be number of faces with classification probability less than 0.5
        self.assertEqual(response.data[0]["face_count"], 2)

    def test_incomplete_faces_with_clustering(self):
        """Test that incomplete faces with clustering analysis method are returned properly."""
        create_test_face(
            photo=self.photo,
            classification_person=None,
            classification_probability=0.5,
            cluster_person=None,
            cluster_probability=0.8,
        )
        create_test_face(
            photo=self.photo,
            classification_person=None,
            classification_probability=0.5,
            cluster_person=None,
            cluster_probability=0.4,
        )

        response = self.client.get(
            reverse("incomplete_faces-list"),
            {
                "inferred": "true",
                "analysis_method": "clustering",
                "min_confidence": "0.5",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertIn("Unknown - Other", response.data[0]["name"])
        # face count should be number of faces with clustering person = None
        self.assertEqual(response.data[0]["face_count"], 2)

    def test_no_inferred_faces(self):
        """Test when there are no inferred faces and only user-labeled faces should appear."""
        person = create_test_person(name="John Doe", cluster_owner=self.user)
        create_test_face(photo=self.photo, person=person)

        response = self.client.get(
            reverse("incomplete_faces-list"), {"inferred": "false"}
        )

        self.assertEqual(response.status_code, 200)
        self.assertIn(
            "John Doe", response.data[0]["name"]
        )  # Ensure user-labeled face is returned


class FaceListViewTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_min_confidence_when_classification(self):
        """Test that faces with classification are returned properly."""
        person = create_test_person(cluster_owner=self.user)
        create_test_face(
            photo=self.photo,
            classification_person=person,
            classification_probability=0.6,
        )
        create_test_face(
            photo=self.photo,
            classification_person=person,
            classification_probability=0.4,
        )

        response = self.client.get(
            reverse("faces-list"),
            {
                "person": person.id,
                "analysis_method": "classification",
                "min_confidence": "0.5",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data["results"]), 1)

    def test_min_confidence_but_for_unknown_other(self):
        """Test that unknown faces with classification are returned properly."""
        person = create_test_person(cluster_owner=self.user)
        create_test_face(
            photo=self.photo,
            classification_person=person,
            classification_probability=0.4,
        )

        response = self.client.get(
            reverse("faces-list"),
            {
                "person": "0",
                "analysis_method": "classification",
                "min_confidence": "0.5",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data["results"]), 1)
        self.assertEqual(0.4, response.data["results"][0]["person_label_probability"])

    def test_min_confidence_when_clustering(self):
        """Test that faces with clustering are returned properly."""
        person = create_test_person(cluster_owner=self.user)
        create_test_face(
            photo=self.photo, cluster_person=person, cluster_probability=0.6
        )
        create_test_face(
            photo=self.photo, cluster_person=person, cluster_probability=0.4
        )

        response = self.client.get(
            reverse("faces-list"),
            {
                "person": person.id,
                "analysis_method": "clustering",
                "min_confidence": "0.5",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data["results"]), 1)

    def test_min_confidence_when_clustering_and_unknown(self):
        """Test that unknown faces with clustering are returned properly."""
        person = create_test_person(cluster_owner=self.user)
        create_test_face(
            photo=self.photo, cluster_person=person, cluster_probability=0.4
        )

        response = self.client.get(
            reverse("faces-list"),
            {
                "person": "0",
                "analysis_method": "clustering",
                "min_confidence": "0.5",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data["results"]), 1)
        self.assertEqual(0.4, response.data["results"][0]["person_label_probability"])

    def test_face_list_classification_order_by_probability(self):
        """Test that faces with classification are ordered by classification probability."""
        person = create_test_person(cluster_owner=self.user)
        create_test_face(
            photo=self.photo,
            classification_person=person,
            classification_probability=0.7,
        )
        create_test_face(
            photo=self.photo,
            classification_person=person,
            classification_probability=0.9,
        )

        response = self.client.get(
            reverse("faces-list"),
            {
                "person": person.id,
                "analysis_method": "classification",
                "order_by": "probability",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertGreater(
            response.data["results"][0]["person_label_probability"],
            response.data["results"][1]["person_label_probability"],
        )

    def test_face_list_clustering_order_by_probability(self):
        """Test that faces with clustering are ordered by clustering probability."""
        person = create_test_person(cluster_owner=self.user)
        create_test_face(
            photo=self.photo, cluster_person=person, cluster_probability=0.6
        )
        create_test_face(
            photo=self.photo, cluster_person=person, cluster_probability=0.9
        )

        response = self.client.get(
            reverse("faces-list"),
            {
                "person": person.id,
                "analysis_method": "clustering",
                "order_by": "probability",
            },
        )

        self.assertEqual(response.status_code, 200)
        self.assertGreater(
            response.data["results"][0]["person_label_probability"],
            response.data["results"][1]["person_label_probability"],
        )

    def test_face_list_order_by_date(self):
        """Test that faces can be ordered by the photo's timestamp when 'order_by' is set to 'date'."""
        person = create_test_person(cluster_owner=self.user)
        photo = create_test_photo(
            owner=self.user, exif_timestamp="2021-01-01T00:00:00Z"
        )
        photo2 = create_test_photo(
            owner=self.user, exif_timestamp="2021-01-02T00:00:00Z"
        )
        create_test_face(photo=photo, person=person)
        create_test_face(photo=photo2, person=person)
        response = self.client.get(
            reverse("faces-list"),
            {"person": person.id, "inferred": False, "order_by": "date"},
        )

        self.assertEqual(response.status_code, 200)
        self.assertLess(
            response.data["results"][0]["timestamp"],
            response.data["results"][1]["timestamp"],
        )


================================================
FILE: api/tests/test_hide_photos.py
================================================
from unittest.mock import patch

from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photos, create_test_user


class FavoritePhotosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_hide_my_photos(self):
        photos = create_test_photos(number_of_photos=3, owner=self.user1)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "hidden": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/hide/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(3, len(data["results"]))
        self.assertEqual(3, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))

    def test_untag_my_photos_as_favorite(self):
        photos1 = create_test_photos(number_of_photos=1, owner=self.user1, hidden=True)
        photos2 = create_test_photos(number_of_photos=2, owner=self.user1)
        image_hashes = [p.image_hash for p in photos1 + photos2]

        payload = {"image_hashes": image_hashes, "hidden": False}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/hide/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(1, len(data["results"]))
        self.assertEqual(1, len(data["updated"]))
        self.assertEqual(2, len(data["not_updated"]))

    def test_tag_photos_of_other_user_as_favorite(self):
        photos = create_test_photos(number_of_photos=2, owner=self.user2)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "hidden": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/hide/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        # Photos not owned by user are treated as "missing" for security (no info leak)
        self.assertEqual(0, len(data["not_updated"]))

    @patch("api.views.photos.logger.warning", autospec=True)
    def test_tag_nonexistent_photo_as_favorite(self, logger):
        payload = {"image_hashes": ["nonexistent_photo"], "hidden": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/hide/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))
        logger.assert_called_with(
            "Could not set photo nonexistent_photo to hidden. It does not exist or is not owned by user."
        )


================================================
FILE: api/tests/test_im2txt.py
================================================
import json
import os
import statistics
import threading
import time
from unittest import skip

import psutil
import torch
from django.test import TestCase
from rest_framework.test import APIClient

from api.image_captioning import generate_caption, unload_model
from api.tests.utils import create_test_user
from api.util import logger


def test_coco(testcase, device="cpu", model="im2txt"):
    from pycocoevalcap.eval import COCOEvalCap
    from pycocotools.coco import COCO

    logger.info(f"{device} {model}")
    blip = model == "blip"

    # Path to the annotations file
    annotation_file = (
        os.path.dirname(os.path.abspath(__file__))
        + "/fixtures/coco/captions_val2017.json"
    )

    # Initialize COCO API for annotations
    coco_caps = COCO(annotation_file)

    # Get a list of all image IDs in the dataset
    all_image_ids = coco_caps.getImgIds()

    # Load all images using the COCO API
    all_images = coco_caps.loadImgs(all_image_ids)

    # Save the generated captions together with the image IDs
    generated_captions = []
    counter = 0
    # Iterate through the valdation images
    for image_info in all_images:
        image = (
            os.path.dirname(os.path.abspath(__file__))
            + "/fixtures/coco/val2017/"
            + image_info["file_name"]
        )
        caption = generate_caption(blip=blip, image_path=image)
        # The LSTM adds a <start> and <end> token to the generated caption
        caption = caption.replace("<start>", "").replace("<end>", "").strip().lower()
        generated_captions.append({"image_id": image_info["id"], "caption": caption})
        counter += 1
        if counter > 100000:
            break

    testcase.end_time = time.time()

    # Define the path to the output JSON file
    output_json_file = (
        os.path.dirname(os.path.abspath(__file__))
        + "/fixtures/coco/"
        + "generated_captions.json"
    )

    # Write the generated_captions to the JSON file
    with open(output_json_file, "w") as json_file:
        json.dump(generated_captions, json_file)

    # create coco object and coco_result object
    coco = COCO(annotation_file)
    coco_result = coco.loadRes(output_json_file)

    # create coco_eval object by taking coco and coco_result
    coco_eval = COCOEvalCap(coco, coco_result)

    # evaluate on a subset of images by setting
    coco_eval.params["image_id"] = coco_result.getImgIds()

    # evaluate results
    # SPICE will take a few minutes the first time, but speeds up due to caching
    coco_eval.evaluate()

    # print output evaluation scores
    for metric, score in coco_eval.eval.items():
        logger.info(f"{metric}: {score:.3f}")


class Im2TxtBenchmark(TestCase):
    gpu_available = torch.cuda.is_available()
    # Start monitoring RAM usage
    process = psutil.Process(os.getpid())
    start_ram_usage = process.memory_info().rss
    # Start measuring timepycocoevalcap
    start_time = time.time()
    ram_usages = []  # List to store RAM usage samples
    ram_monitor_thread = None
    end_time = None

    def setUp(self) -> None:
        # Check if the required files exist in the fixtures directory
        self.coco_fixture_path = os.path.join(self.fixtures_dir, "coco")
        self.val2017_fixture_path = os.path.join(self.fixtures_dir, "coco", "val2017")
        self.val2017captions_fixture_path = os.path.join(
            self.fixtures_dir, "coco", "captions_val2017.json"
        )

        if not os.path.exists(self.coco_fixture_path):
            logger.warning(
                f"Skipping tests. Directory not found: {self.coco_fixture_path}. Please add a coco folder to the fixtures directory."
            )
            self.skipTest("Directory not found")

        if not os.path.exists(self.val2017_fixture_path):
            logger.warning(
                f"Skipping tests. Directory not found: {self.val2017_fixture_path}. Validation images are required for the COCO benchmark. Please download the COCO validation images and place them in the fixtures/coco/val2017 directory."
            )
            self.skipTest("Directory not found")
        if not os.path.exists(self.val2017captions_fixture_path):
            logger.warning(
                f"Skipping tests. Directory not found: {self.val2017captions_fixture_path}. Captions of Validation images are required for the COCO benchmark. Please download the COCO validation images and place them in the fixtures/coco/ directory."
            )
            self.skipTest("Directory not found")
        unload_model()
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        self.gpu_available = torch.cuda.is_available()
        self.process = psutil.Process(os.getpid())
        self.start_ram_usage = self.process.memory_info().rss
        self.start_time = time.time()
        self.ram_usages = []  # List to store RAM usage samples
        self.ram_monitor_thread = threading.Thread(
            target=self.monitor_ram_usage, args=(self.process, self.ram_usages, 5)
        )  # Monitor RAM for 5 seconds
        self.ram_monitor_thread.start()

    def tearDown(self) -> None:
        if self.end_time is None:
            execution_time = time.time() - self.start_time
        else:
            execution_time = self.end_time - self.start_time
            self.end_time = None
        self.ram_monitor_thread.join()
        # Calculate RAM usage statistics
        mean_ram_usage_mb = statistics.mean(self.ram_usages) / (
            1024 * 1024
        )  # Convert bytes to MB
        median_ram_usage_mb = statistics.median(self.ram_usages) / (
            1024 * 1024
        )  # Convert bytes to MB

        # Log the results using the logger function
        logger.info("Test Result:")
        logger.info(f"GPU Used: {'Yes' if self.gpu_available else 'No'}")
        logger.info(f"Mean RAM Usage: {mean_ram_usage_mb:.2f} MB")
        logger.info(f"Median RAM Usage: {median_ram_usage_mb:.2f} MB")
        logger.info(f"Execution Time: {execution_time:.2f} seconds")

    def monitor_ram_usage(self, process, ram_usages, duration):
        # Monitor RAM usage for the specified duration
        start_time = time.time()
        while time.time() - start_time < duration:
            ram_usage = process.memory_info().rss
            ram_usages.append(ram_usage)
            time.sleep(0.1)  # Poll every 1 second

    @skip
    def test_im2txt_cpu(self):
        file = os.path.dirname(os.path.abspath(__file__)) + "/fixtures/niaz.jpg"
        self.gpu_available = "False"
        caption = generate_caption(device=torch.device("cpu"), image_path=file)

        self.assertEqual(
            "<start> a man with a beard is holding a remote control . <end>", caption
        )

        logger.info(f"Caption: {caption}")

    @skip
    def test_im2txt_gpu(self):
        file = os.path.dirname(os.path.abspath(__file__)) + "/fixtures/niaz.jpg"
        caption = generate_caption(device=torch.device("cuda"), image_path=file)

        self.assertEqual(
            "<start> a man with a beard is holding a remote control . <end>", caption
        )

        logger.info(f"Caption: {caption}")

    @skip
    def test_im2txt_cpu_100(self):
        file = os.path.dirname(os.path.abspath(__file__)) + "/fixtures/niaz.jpg"
        self.gpu_available = "False"

        for i in range(100):
            caption = generate_caption(device=torch.device("cpu"), image_path=file)
            self.assertEqual(
                "<start> a man with a beard is holding a remote control . <end>",
                caption,
            )

    @skip
    def test_im2txt_gpu_100(self):
        file = os.path.dirname(os.path.abspath(__file__)) + "/fixtures/niaz.jpg"

        for i in range(100):
            caption = generate_caption(device=torch.device("cuda"), image_path=file)
            self.assertEqual(
                "<start> a man with a beard is holding a remote control . <end>",
                caption,
            )

    @skip
    def test_im2txt_coco_cpu(self):
        test_coco(testcase=self, device="cpu", model="im2txt")

    @skip
    def test_im2txt_coco_gpu(self):
        test_coco(testcase=self, device="cuda", model="im2txt")

    @skip
    def test_blip_coco_cpu(self):
        test_coco(self, "cpu", "blip")

    @skip
    def test_blip_coco_gpu(self):
        test_coco(self, "cuda", "blip")


================================================
FILE: api/tests/test_live_photo.py
================================================
"""
Comprehensive tests for api/stacks/live_photo.py

Tests the Live Photo detection and stacking logic:
- Google Pixel Motion Photo detection (embedded MP4 after JPEG EOI)
- Samsung Motion Photo detection (MotionPhoto_Data marker)
- Apple Live Photo detection (paired .mov file)
- Stack creation for detected live photos
- Batch processing
"""

import os
import tempfile
from pathlib import Path
from unittest.mock import MagicMock, Mock, patch

from django.test import TestCase, override_settings

from api.models.file import File
from api.models.photo import Photo
from api.models.photo_stack import PhotoStack
from api.models.user import User
from api.stacks.live_photo import (
    APPLE_LIVE_PHOTO_EXTENSIONS,
    GOOGLE_PIXEL_MP4_SIGNATURES,
    JPEG_EOI_MARKER,
    SAMSUNG_MOTION_MARKER,
    _create_apple_live_photo_stack,
    _create_embedded_live_photo_stack,
    _locate_google_embedded_video,
    _locate_samsung_embedded_video,
    detect_live_photo,
    extract_embedded_motion_video,
    find_apple_live_photo_video,
    has_embedded_motion_video,
    process_live_photos_batch,
)


class LocateGoogleEmbeddedVideoTestCase(TestCase):
    """Tests for the _locate_google_embedded_video function."""

    def test_finds_ftypmp42_signature(self):
        """Should find MP4 with ftypmp42 signature."""
        # Build data: JPEG content + 4 padding bytes + ftyp signature
        data = b"JPEG_CONTENT\xff\xd9" + b"\x00\x00\x00\x00" + b"ftypmp42" + b"more_video_data"
        position = _locate_google_embedded_video(data)
        expected = data.find(b"ftypmp42") - 4
        self.assertEqual(position, expected)

    def test_finds_ftypisom_signature(self):
        """Should find MP4 with ftypisom signature."""
        data = b"JPEG_CONTENT\xff\xd9" + b"\x00\x00\x00\x20" + b"ftypisom"
        position = _locate_google_embedded_video(data)
        expected = data.find(b"ftypisom") - 4
        self.assertEqual(position, expected)

    def test_finds_ftypiso2_signature(self):
        """Should find MP4 with ftypiso2 signature."""
        data = b"JPEG_CONTENT\xff\xd9" + b"\x00\x00\x00\x20" + b"ftypiso2"
        position = _locate_google_embedded_video(data)
        expected = data.find(b"ftypiso2") - 4
        self.assertEqual(position, expected)

    def test_returns_minus_one_when_not_found(self):
        """Should return -1 if no signature found."""
        data = b"JPEG_CONTENT\xff\xd9_no_video_here"
        position = _locate_google_embedded_video(data)
        self.assertEqual(position, -1)

    def test_empty_data(self):
        """Should return -1 for empty data."""
        position = _locate_google_embedded_video(b"")
        self.assertEqual(position, -1)

    def test_finds_first_signature_if_multiple(self):
        """Should find the first signature if multiple exist."""
        data = b"JPEG" + b"\x00\x00\x00\x00" + b"ftypmp42" + b"MIDDLE" + b"ftypisom"
        position = _locate_google_embedded_video(data)
        # Should find ftypmp42 first
        self.assertEqual(position, 4)  # 4 bytes for "JPEG"


class LocateSamsungEmbeddedVideoTestCase(TestCase):
    """Tests for the _locate_samsung_embedded_video function."""

    def test_finds_samsung_marker(self):
        """Should find Samsung motion photo marker."""
        data = b"JPEG_CONTENT\xff\xd9" + SAMSUNG_MOTION_MARKER + b"video_data"
        position = _locate_samsung_embedded_video(data)
        expected = data.find(SAMSUNG_MOTION_MARKER) + len(SAMSUNG_MOTION_MARKER)
        self.assertEqual(position, expected)

    def test_returns_minus_one_when_not_found(self):
        """Should return -1 if no marker found."""
        data = b"JPEG_CONTENT\xff\xd9_no_motion_marker"
        position = _locate_samsung_embedded_video(data)
        self.assertEqual(position, -1)

    def test_empty_data(self):
        """Should return -1 for empty data."""
        position = _locate_samsung_embedded_video(b"")
        self.assertEqual(position, -1)


class HasEmbeddedMotionVideoTestCase(TestCase):
    """Tests for the has_embedded_motion_video function."""

    def setUp(self):
        """Create temporary directory for test files."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up temporary files."""
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    @patch("api.stacks.live_photo.magic.Magic")
    def test_returns_false_for_non_jpeg(self, mock_magic_class):
        """Should return False for non-JPEG files."""
        mock_magic = MagicMock()
        mock_magic.from_file.return_value = "image/png"
        mock_magic_class.return_value = mock_magic

        result = has_embedded_motion_video("/some/path.png")
        self.assertFalse(result)

    @patch("api.stacks.live_photo.magic.Magic")
    @patch("builtins.open")
    @patch("api.stacks.live_photo.mmap")
    def test_returns_true_for_google_motion_photo(self, mock_mmap, mock_open, mock_magic_class):
        """Should return True for Google Motion Photo."""
        mock_magic = MagicMock()
        mock_magic.from_file.return_value = "image/jpeg"
        mock_magic_class.return_value = mock_magic

        # Mock file data with Google MP4 signature
        mock_data = b"JPEG" + b"\x00\x00\x00\x00" + b"ftypmp42"
        mock_mm = MagicMock()
        mock_mm.__enter__ = Mock(return_value=mock_data)
        mock_mm.__exit__ = Mock(return_value=False)
        mock_mmap.return_value = mock_mm

        mock_file = MagicMock()
        mock_file.__enter__ = Mock(return_value=mock_file)
        mock_file.__exit__ = Mock(return_value=False)
        mock_open.return_value = mock_file

        with patch("api.stacks.live_photo._locate_google_embedded_video", return_value=4):
            result = has_embedded_motion_video("/some/path.jpg")
            self.assertTrue(result)

    @patch("api.stacks.live_photo.magic.Magic")
    def test_returns_false_on_exception(self, mock_magic_class):
        """Should return False and log warning on exception."""
        mock_magic_class.side_effect = Exception("File not found")

        with patch("api.stacks.live_photo.logger") as mock_logger:
            result = has_embedded_motion_video("/nonexistent/path.jpg")
            self.assertFalse(result)
            mock_logger.warning.assert_called()


class FindAppleLivePhotoVideoTestCase(TestCase):
    """Tests for the find_apple_live_photo_video function."""

    def setUp(self):
        """Create temporary directory for test files."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up temporary files."""
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_finds_lowercase_mov_companion(self):
        """Should find .mov companion file."""
        # Create test files
        image_path = os.path.join(self.temp_dir, "IMG_001.jpg")
        video_path = os.path.join(self.temp_dir, "IMG_001.mov")
        Path(image_path).touch()
        Path(video_path).touch()

        result = find_apple_live_photo_video(image_path)
        self.assertEqual(result, video_path)

    def test_finds_uppercase_mov_companion(self):
        """Should find .MOV companion file (uppercase)."""
        image_path = os.path.join(self.temp_dir, "IMG_002.HEIC")
        video_path = os.path.join(self.temp_dir, "IMG_002.MOV")
        Path(image_path).touch()
        Path(video_path).touch()

        result = find_apple_live_photo_video(image_path)
        self.assertEqual(result, video_path)

    def test_returns_none_when_no_companion(self):
        """Should return None if no companion video exists."""
        image_path = os.path.join(self.temp_dir, "IMG_003.jpg")
        Path(image_path).touch()

        result = find_apple_live_photo_video(image_path)
        self.assertIsNone(result)

    def test_prefers_lowercase_mov(self):
        """Should prefer .mov over .MOV if both exist."""
        image_path = os.path.join(self.temp_dir, "IMG_004.jpg")
        video_lowercase = os.path.join(self.temp_dir, "IMG_004.mov")
        video_uppercase = os.path.join(self.temp_dir, "IMG_004.MOV")
        Path(image_path).touch()
        Path(video_lowercase).touch()
        Path(video_uppercase).touch()

        result = find_apple_live_photo_video(image_path)
        # Should find .mov first (lowercase is first in APPLE_LIVE_PHOTO_EXTENSIONS)
        self.assertEqual(result, video_lowercase)

    def test_handles_different_image_extensions(self):
        """Should work with various image extensions."""
        for ext in [".jpg", ".JPG", ".heic", ".HEIC", ".jpeg"]:
            image_path = os.path.join(self.temp_dir, f"test{ext}")
            video_path = os.path.join(self.temp_dir, "test.mov")
            Path(image_path).touch()
            Path(video_path).touch()

            result = find_apple_live_photo_video(image_path)
            self.assertEqual(result, video_path)

            # Cleanup for next iteration
            Path(image_path).unlink()
            Path(video_path).unlink()


class ExtractEmbeddedMotionVideoTestCase(TestCase):
    """Tests for the extract_embedded_motion_video function."""

    def setUp(self):
        """Create temporary directory for test files."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up temporary files."""
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    @override_settings(MEDIA_ROOT=None)
    def test_extracts_google_motion_video(self):
        """Should extract embedded MP4 from Google Motion Photo."""
        # Use temp_dir as MEDIA_ROOT
        with self.settings(MEDIA_ROOT=self.temp_dir):
            # Create a fake motion photo file
            fake_video_data = b"fake_mp4_video_content"
            file_content = (
                b"JPEG_IMAGE_DATA\xff\xd9" +  # JPEG with EOI marker
                b"\x00\x00\x00\x00" +  # 4 padding bytes
                b"ftypmp42" +  # ftyp signature
                fake_video_data
            )

            input_path = os.path.join(self.temp_dir, "motion_photo.jpg")
            with open(input_path, "wb") as f:
                f.write(file_content)

            result = extract_embedded_motion_video(input_path, "test_hash_123")

            self.assertIsNotNone(result)
            self.assertIn("test_hash_123_motion.mp4", result)
            self.assertTrue(os.path.exists(result))

            # Verify extracted content starts from ftyp
            with open(result, "rb") as f:
                extracted = f.read()
                self.assertTrue(extracted.startswith(b"\x00\x00\x00\x00ftypmp42"))

    def test_returns_none_for_no_embedded_video(self):
        """Should return None if no embedded video found."""
        with self.settings(MEDIA_ROOT=self.temp_dir):
            # Create a regular JPEG without embedded video
            input_path = os.path.join(self.temp_dir, "regular.jpg")
            with open(input_path, "wb") as f:
                f.write(b"JPEG_DATA\xff\xd9")

            result = extract_embedded_motion_video(input_path, "hash123")
            self.assertIsNone(result)

    def test_returns_none_on_file_error(self):
        """Should return None and log error if file access fails."""
        with patch("api.stacks.live_photo.logger") as mock_logger:
            result = extract_embedded_motion_video("/nonexistent/file.jpg", "hash")
            self.assertIsNone(result)
            mock_logger.error.assert_called()


class DetectLivePhotoTestCase(TestCase):
    """Tests for the detect_live_photo function."""

    def setUp(self):
        """Create test user and temporary files."""
        self.temp_dir = tempfile.mkdtemp()
        self.user = User.objects.create(username="livetest")

    def tearDown(self):
        """Clean up."""
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_returns_none_for_photo_without_main_file(self):
        """Should return None if photo has no main_file."""
        photo = MagicMock()
        photo.main_file = None

        result = detect_live_photo(photo, self.user)
        self.assertIsNone(result)

    @patch("api.stacks.live_photo.has_embedded_motion_video")
    @patch("api.stacks.live_photo._create_embedded_live_photo_stack")
    def test_detects_embedded_motion_video(self, mock_create, mock_has_embedded):
        """Should detect and create stack for embedded motion video."""
        mock_has_embedded.return_value = True
        mock_stack = MagicMock()
        mock_create.return_value = mock_stack

        photo = MagicMock()
        photo.main_file.path = "/path/to/image.jpg"

        result = detect_live_photo(photo, self.user)

        mock_create.assert_called_once_with(photo, self.user)
        self.assertEqual(result, mock_stack)

    @patch("api.stacks.live_photo.has_embedded_motion_video")
    @patch("api.stacks.live_photo.find_apple_live_photo_video")
    @patch("api.stacks.live_photo._create_apple_live_photo_stack")
    def test_detects_apple_live_photo(self, mock_create, mock_find, mock_has_embedded):
        """Should detect and create stack for Apple Live Photo."""
        mock_has_embedded.return_value = False
        mock_find.return_value = "/path/to/video.mov"
        mock_stack = MagicMock()
        mock_create.return_value = mock_stack

        photo = MagicMock()
        photo.main_file.path = "/path/to/image.jpg"

        result = detect_live_photo(photo, self.user)

        mock_create.assert_called_once_with(photo, "/path/to/video.mov", self.user)
        self.assertEqual(result, mock_stack)

    @patch("api.stacks.live_photo.has_embedded_motion_video")
    @patch("api.stacks.live_photo.find_apple_live_photo_video")
    def test_returns_none_for_regular_photo(self, mock_find, mock_has_embedded):
        """Should return None for regular photos without motion."""
        mock_has_embedded.return_value = False
        mock_find.return_value = None

        photo = MagicMock()
        photo.main_file.path = "/path/to/regular.jpg"

        result = detect_live_photo(photo, self.user)
        self.assertIsNone(result)


class CreateEmbeddedLivePhotoStackTestCase(TestCase):
    """Tests for _create_embedded_live_photo_stack function."""

    def setUp(self):
        """Create test user."""
        self.user = User.objects.create(username="embedtest")
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up."""
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    @override_settings(FEATURE_PROCESS_EMBEDDED_MEDIA=False)
    def test_returns_none_if_feature_disabled(self):
        """Should return None if embedded media processing is disabled."""
        photo = MagicMock()

        with patch("api.stacks.live_photo.logger") as mock_logger:
            result = _create_embedded_live_photo_stack(photo, self.user)
            self.assertIsNone(result)
            mock_logger.debug.assert_called()

    @override_settings(FEATURE_PROCESS_EMBEDDED_MEDIA=True)
    @patch("api.stacks.live_photo.extract_embedded_motion_video")
    def test_returns_none_if_extraction_fails(self, mock_extract):
        """Should return None if video extraction fails."""
        mock_extract.return_value = None

        photo = MagicMock()
        photo.main_file.path = "/path/to/image.jpg"
        photo.main_file.hash = "abc123"

        result = _create_embedded_live_photo_stack(photo, self.user)
        self.assertIsNone(result)

    @override_settings(FEATURE_PROCESS_EMBEDDED_MEDIA=True)
    @patch("api.stacks.live_photo.extract_embedded_motion_video")
    @patch("api.stacks.live_photo.File.create")
    def test_returns_existing_stack_if_present(self, mock_file_create, mock_extract):
        """Should return existing stack if photo already has one."""
        mock_extract.return_value = "/path/to/video.mp4"
        mock_video_file = MagicMock()
        mock_file_create.return_value = mock_video_file

        # Create a mock photo with existing stack
        existing_stack = MagicMock()
        photo = MagicMock()
        photo.main_file.path = "/path/to/image.jpg"
        photo.main_file.hash = "abc123"
        photo.main_file.embedded_media = MagicMock()
        photo.stacks.filter.return_value.first.return_value = existing_stack

        result = _create_embedded_live_photo_stack(photo, self.user)
        self.assertEqual(result, existing_stack)


class CreateAppleLivePhotoStackTestCase(TestCase):
    """Tests for _create_apple_live_photo_stack function."""

    def setUp(self):
        """Create test user and file."""
        from django.utils import timezone

        self.user = User.objects.create(username="appletest")
        self.temp_dir = tempfile.mkdtemp()

        # Create a test file
        self.file_hash = "a" * 32
        self.file_path = os.path.join(self.temp_dir, "test.jpg")
        Path(self.file_path).touch()

        self.file = File.objects.create(
            hash=self.file_hash,
            path=self.file_path,
            type=File.IMAGE,
        )

        # Create a test photo with required fields
        self.photo = Photo.objects.create(
            owner=self.user,
            main_file=self.file,
            image_hash="b" * 32,
            added_on=timezone.now(),
        )

    def tearDown(self):
        """Clean up."""
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_creates_new_stack_for_apple_live_photo(self):
        """Should create new Live Photo stack."""
        video_path = os.path.join(self.temp_dir, "test.mov")
        Path(video_path).touch()

        # Create a real video file to avoid foreign key issues
        video_file = File.objects.create(
            hash="c" * 32,
            path=video_path,
            type=File.VIDEO,
        )

        with patch("api.stacks.live_photo.File.create", return_value=video_file):
            with patch("api.stacks.live_photo.File.objects.filter") as mock_filter:
                # Simulate video file not existing yet
                mock_filter.return_value.first.return_value = None

                result = _create_apple_live_photo_stack(self.photo, video_path, self.user)

                self.assertIsNotNone(result)
                self.assertEqual(result.stack_type, PhotoStack.StackType.LIVE_PHOTO)
                self.assertEqual(result.primary_photo, self.photo)
                self.assertEqual(result.owner, self.user)

    def test_returns_existing_stack_if_present(self):
        """Should return existing stack if photo already has one."""
        # Create existing stack
        existing_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.LIVE_PHOTO,
            primary_photo=self.photo,
        )
        self.photo.stacks.add(existing_stack)

        video_path = os.path.join(self.temp_dir, "test.mov")
        Path(video_path).touch()

        # Create a real video file
        video_file = File.objects.create(
            hash="d" * 32,
            path=video_path,
            type=File.VIDEO,
        )

        with patch("api.stacks.live_photo.File.create", return_value=video_file):
            with patch("api.stacks.live_photo.File.objects.filter") as mock_filter:
                mock_filter.return_value.first.return_value = None

                result = _create_apple_live_photo_stack(self.photo, video_path, self.user)

                self.assertEqual(result, existing_stack)


class ProcessLivePhotosBatchTestCase(TestCase):
    """Tests for the process_live_photos_batch function."""

    def setUp(self):
        """Create test user."""
        self.user = User.objects.create(username="batchtest")

    @patch("api.stacks.live_photo.detect_live_photo")
    def test_processes_all_photos(self, mock_detect):
        """Should process all photos in the list."""
        mock_detect.return_value = None

        photos = [MagicMock() for _ in range(5)]
        result = process_live_photos_batch(self.user, photos)

        self.assertEqual(mock_detect.call_count, 5)
        self.assertEqual(result["detected"], 0)
        self.assertEqual(result["stacks_created"], 0)

    @patch("api.stacks.live_photo.detect_live_photo")
    def test_counts_detected_live_photos(self, mock_detect):
        """Should count detected live photos."""
        mock_stack = MagicMock()
        mock_stack.photo_count = 2  # Existing stack with photos
        mock_detect.side_effect = [mock_stack, None, mock_stack, None]

        photos = [MagicMock() for _ in range(4)]
        result = process_live_photos_batch(self.user, photos)

        self.assertEqual(result["detected"], 2)

    @patch("api.stacks.live_photo.detect_live_photo")
    def test_counts_new_stacks_created(self, mock_detect):
        """Should count newly created stacks."""
        new_stack = MagicMock()
        new_stack.photo_count = 1  # New stack (just the photo)
        mock_detect.return_value = new_stack

        photos = [MagicMock() for _ in range(3)]
        result = process_live_photos_batch(self.user, photos)

        self.assertEqual(result["detected"], 3)
        self.assertEqual(result["stacks_created"], 3)

    @patch("api.stacks.live_photo.detect_live_photo")
    def test_handles_exceptions_gracefully(self, mock_detect):
        """Should continue processing after exceptions."""
        mock_detect.side_effect = [Exception("Error"), MagicMock(photo_count=2)]

        photos = [MagicMock(), MagicMock()]
        photos[0].id = "photo1"
        photos[1].id = "photo2"

        with patch("api.stacks.live_photo.logger") as mock_logger:
            result = process_live_photos_batch(self.user, photos)
            mock_logger.error.assert_called()
            self.assertEqual(result["detected"], 1)

    def test_empty_list_returns_zero_counts(self):
        """Should return zero counts for empty list."""
        result = process_live_photos_batch(self.user, [])
        self.assertEqual(result["detected"], 0)
        self.assertEqual(result["stacks_created"], 0)


class ConstantsTestCase(TestCase):
    """Tests for module constants."""

    def test_jpeg_eoi_marker(self):
        """JPEG EOI marker should be correct."""
        self.assertEqual(JPEG_EOI_MARKER, b"\xff\xd9")

    def test_google_signatures_list(self):
        """Google MP4 signatures should be defined."""
        self.assertIn(b"ftypmp42", GOOGLE_PIXEL_MP4_SIGNATURES)
        self.assertIn(b"ftypisom", GOOGLE_PIXEL_MP4_SIGNATURES)
        self.assertIn(b"ftypiso2", GOOGLE_PIXEL_MP4_SIGNATURES)

    def test_samsung_marker(self):
        """Samsung motion marker should be correct."""
        self.assertEqual(SAMSUNG_MOTION_MARKER, b"MotionPhoto_Data")

    def test_apple_extensions(self):
        """Apple Live Photo extensions should include .mov variants."""
        self.assertIn(".mov", APPLE_LIVE_PHOTO_EXTENSIONS)
        self.assertIn(".MOV", APPLE_LIVE_PHOTO_EXTENSIONS)


class EdgeCasesTestCase(TestCase):
    """Edge case tests for live photo detection."""

    def setUp(self):
        """Create temporary directory."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up."""
        import shutil
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_unicode_filename_apple_live_photo(self):
        """Should handle unicode characters in filenames."""
        image_path = os.path.join(self.temp_dir, "照片_日本_🌸.jpg")
        video_path = os.path.join(self.temp_dir, "照片_日本_🌸.mov")
        Path(image_path).touch()
        Path(video_path).touch()

        result = find_apple_live_photo_video(image_path)
        self.assertEqual(result, video_path)

    def test_special_characters_in_path(self):
        """Should handle special characters in file path."""
        image_path = os.path.join(self.temp_dir, "test photo (1).jpg")
        video_path = os.path.join(self.temp_dir, "test photo (1).mov")
        Path(image_path).touch()
        Path(video_path).touch()

        result = find_apple_live_photo_video(image_path)
        self.assertEqual(result, video_path)

    def test_locate_video_at_start_of_data(self):
        """Should handle video marker at very start of data."""
        data = b"ftypmp42rest_of_video"
        position = _locate_google_embedded_video(data)
        self.assertEqual(position, -4)  # Would be negative, which is fine

    def test_multiple_samsung_markers(self):
        """Should find first Samsung marker if multiple present."""
        data = (
            SAMSUNG_MOTION_MARKER + b"first_video" +
            SAMSUNG_MOTION_MARKER + b"second_video"
        )
        position = _locate_samsung_embedded_video(data)
        self.assertEqual(position, len(SAMSUNG_MOTION_MARKER))

    def test_partial_signature_not_matched(self):
        """Should not match partial signatures."""
        # ftypm instead of ftypmp42
        data = b"JPEG\xff\xd9\x00\x00\x00\x00ftypm"
        position = _locate_google_embedded_video(data)
        self.assertEqual(position, -1)

    def test_very_large_file_simulation(self):
        """Should handle large data efficiently."""
        # Create 10MB of fake data with marker near end
        large_data = b"A" * (10 * 1024 * 1024)
        large_data += b"\x00\x00\x00\x00ftypmp42"

        position = _locate_google_embedded_video(large_data)
        self.assertGreater(position, 0)

    def test_binary_data_with_nulls(self):
        """Should handle binary data with null bytes."""
        data = b"\x00" * 100 + b"\x00\x00\x00\x00ftypmp42" + b"\x00" * 50
        position = _locate_google_embedded_video(data)
        self.assertEqual(position, 100)


================================================
FILE: api/tests/test_location_timeline.py
================================================
import csv
import os

from django.test import TestCase
from rest_framework.test import APIClient

from api.stats import get_location_timeline, get_photo_month_counts
from api.models import Photo
from api.tests.utils import create_test_photo, create_test_user


def prepare_database(user):
    data = (
        os.path.dirname(os.path.abspath(__file__))
        + "/fixtures/location_timeline_test_data.csv"
    )
    with open(data) as f:
        reader = csv.reader(f)
        for row in reader:
            if row[0].startswith("#"):
                continue
            country = row[0]
            exif_timestamp = row[1]
            geolocation_json = {"places": [country], "features": [{"text": country}]}
            create_test_photo(
                owner=user,
                exif_timestamp=exif_timestamp,
                geolocation_json=geolocation_json,
            )


expected_location_timeline = [
    {
        "data": [22208418.0],
        "color": "#a6cee3",
        "loc": "Germany",
        "start": 1576286343.0,
        "end": 1598494761.0,
    },
    {
        "data": [9413609.0],
        "color": "#1f78b4",
        "loc": "Canada",
        "start": 1598494761.0,
        "end": 1607908370.0,
    },
    {
        "data": [20648022.0],
        "color": "#b2df8a",
        "loc": "France",
        "start": 1607908370.0,
        "end": 1628556392.0,
    },
    {
        "data": [6132785.0],
        "color": "#33a02c",
        "loc": "Canada",
        "start": 1628556392.0,
        "end": 1634689177.0,
    },
    {
        "data": [79828.0],
        "color": "#fb9a99",
        "loc": "France",
        "start": 1634689177.0,
        "end": 1634769005.0,
    },
]

expected_photo_month_counts = [
    {"month": "2019-12", "count": 4},
    {"month": "2020-1", "count": 0},
    {"month": "2020-2", "count": 0},
    {"month": "2020-3", "count": 0},
    {"month": "2020-4", "count": 0},
    {"month": "2020-5", "count": 0},
    {"month": "2020-6", "count": 0},
    {"month": "2020-7", "count": 0},
    {"month": "2020-8", "count": 4},
    {"month": "2020-9", "count": 0},
    {"month": "2020-10", "count": 0},
    {"month": "2020-11", "count": 0},
    {"month": "2020-12", "count": 4},
    {"month": "2021-1", "count": 0},
    {"month": "2021-2", "count": 0},
    {"month": "2021-3", "count": 0},
    {"month": "2021-4", "count": 0},
    {"month": "2021-5", "count": 0},
    {"month": "2021-6", "count": 0},
    {"month": "2021-7", "count": 0},
    {"month": "2021-8", "count": 4},
    {"month": "2021-9", "count": 0},
    {"month": "2021-10", "count": 4},
]


class LocationTimelineTest(TestCase):
    def setUp(self) -> None:
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        Photo.objects.all().delete()
        prepare_database(self.user)

    def test_location_timeline_endpoint(self):
        response = self.client.get("/api/locationtimeline/")
        result = response.json()
        self.assertEqual(result, expected_location_timeline)

    def test_get_location_timeline(self):
        result = get_location_timeline(self.user)
        self.assertEqual(result, expected_location_timeline)

    def test_get_photo_month_counts_endpoint(self):
        response = self.client.get("/api/photomonthcounts/")
        result = response.json()
        self.assertEqual(result, expected_photo_month_counts)

    def test_get_photo_month_count(self):
        result = get_photo_month_counts(self.user)
        self.assertEqual(result, expected_photo_month_counts)


================================================
FILE: api/tests/test_metadata_ordering_sentinel.py
================================================
import os
import random
import tempfile
import uuid
from unittest.mock import patch

from django.test import TestCase, override_settings

from api.models import Photo
from api.tests.utils import create_test_user


def create_unique_png(seed=0):
    """
    Generate a minimal valid PNG with unique content based on seed.
    Each different seed produces a different hash.
    """
    import struct

    def png_chunk(chunk_type, data):
        chunk_data = chunk_type + data
        crc = 0xFFFFFFFF
        for byte in chunk_data:
            crc ^= byte
            for _ in range(8):
                crc = (crc >> 1) ^ 0xEDB88320 if crc & 1 else crc >> 1
        crc ^= 0xFFFFFFFF
        return struct.pack(">I", len(data)) + chunk_data + struct.pack(">I", crc)

    # PNG signature
    png_sig = b"\x89PNG\r\n\x1a\n"

    # IHDR: 1x1 image, 8-bit RGB
    ihdr = struct.pack(">IIBBBBB", 1, 1, 8, 2, 0, 0, 0)

    # IDAT: compressed image data with seed-based variation
    idat_data = bytes([seed % 256]) + b"\x00\x00\x00\x00\x00"
    import zlib

    idat_compressed = zlib.compress(idat_data)

    # IEND: end of PNG
    iend = b""

    return (
        png_sig
        + png_chunk(b"IHDR", ihdr)
        + png_chunk(b"IDAT", idat_compressed)
        + png_chunk(b"IEND", iend)
    )


class DummyAsyncTask:
    """Synchronous replacement for django_q.tasks.AsyncTask.

    - Immediately executes the callable.
    - Tracks completion counts per group id when used for image tasks.
    """

    GROUP_COMPLETIONS: dict[str, int] = {}

    def __init__(self, func, *args, **kwargs):
        self.func = func
        self.args = args
        # Extract 'group' from kwargs before passing to func (func doesn't accept it)
        self.group_id = kwargs.pop("group", None)
        self.kwargs = kwargs

    def run(self):
        # Execute the callable synchronously (without 'group' in kwargs)
        result = self.func(*self.args, **self.kwargs)

        # If this was an image/video task scheduled with a group,
        # increment the completion counter for that group
        func_name = getattr(self.func, "__name__", "")
        if self.group_id and func_name == "handle_new_image":
            DummyAsyncTask.GROUP_COMPLETIONS[self.group_id] = (
                DummyAsyncTask.GROUP_COMPLETIONS.get(self.group_id, 0) + 1
            )
        return result


class DummyChain:
    def __init__(self, *args, **kwargs):
        self.appended = []

    def append(self, *args, **kwargs):
        self.appended.append((args, kwargs))
        return self

    def run(self):
        return None


class MetadataOrderingSentinelTest(TestCase):
    def test_random_order_images_and_xmp_are_consistently_linked(self):
        user = create_test_user()
        with tempfile.TemporaryDirectory() as tmpdir:
            user.scan_directory = tmpdir
            user.save(update_fields=["scan_directory"])

            # Create N image files and corresponding XMP sidecars
            N = 4
            image_paths = []
            xmp_paths = []
            for i in range(N):
                base = f"img_{i}"
                img_path = os.path.join(tmpdir, f"{base}.jpg")
                xmp_path = os.path.join(tmpdir, f"{base}.xmp")
                with open(img_path, "wb") as f:
                    f.write(create_unique_png(i))  # Each image has unique hash
                with open(xmp_path, "wb") as f:
                    f.write(b"<x:xmpmeta>test</x:xmpmeta>")
                image_paths.append(img_path)
                xmp_paths.append(xmp_path)

            # Randomize processing order explicitly via scan_files
            all_files = image_paths + xmp_paths
            random.shuffle(all_files)

            # Patch environment to make processing synchronous and lightweight
            with override_settings(MEDIA_ROOT=tmpdir):
                with (
                    patch("api.directory_watcher.scan_jobs.AsyncTask", DummyAsyncTask),
                    patch("api.directory_watcher.scan_jobs.Chain", DummyChain),
                    patch(
                        "django_q.tasks.count_group",
                        side_effect=lambda gid: DummyAsyncTask.GROUP_COMPLETIONS.get(
                            gid, 0
                        ),
                    ),
                    patch(
                        "api.directory_watcher.scan_jobs.db.connections.close_all"
                    ) as _close_all,
                    patch(
                        "api.directory_watcher.scan_jobs.update_scan_counter"
                    ) as _update_counter,
                    patch("api.directory_watcher.scan_jobs.util.logger") as _logger,
                    patch("pyvips.Image.thumbnail") as _thumb,
                    patch(
                        "api.models.thumbnail.Thumbnail._generate_thumbnail"
                    ) as _gen_thumb,
                    patch(
                        "api.models.thumbnail.Thumbnail._calculate_aspect_ratio"
                    ) as _calc_ar,
                    patch(
                        "api.models.thumbnail.Thumbnail._get_dominant_color"
                    ) as _dom_color,
                    patch(
                        "api.models.photo_metadata.PhotoMetadata.extract_exif_data"
                    ) as _exif,
                    patch(
                        "api.models.photo.Photo._extract_date_time_from_exif"
                    ) as _exif_dt,
                ):
                    # No-op patches
                    _thumb.return_value = None
                    _close_all.return_value = None
                    _update_counter.side_effect = lambda *_args, **_kwargs: None
                    _logger.info.side_effect = lambda *_a, **_k: None
                    _logger.warning.side_effect = lambda *_a, **_k: None
                    _logger.exception.side_effect = lambda *_a, **_k: None
                    _gen_thumb.return_value = None
                    _calc_ar.return_value = None
                    _dom_color.return_value = None
                    _exif.return_value = None
                    _exif_dt.return_value = None

                    job_id = str(uuid.uuid4())
                    # Emulate the core of scan_photos sequencing explicitly:
                    # 1) Enqueue all images/videos in a group and run them synchronously
                    # 2) Run the sentinel to process metadata after the group completes
                    from api.directory_watcher import (
                        handle_new_image,
                        wait_for_group_and_process_metadata,
                    )

                    image_group_id = str(uuid.uuid4())
                    for img in image_paths:
                        DummyAsyncTask(
                            handle_new_image, user, img, job_id, group=image_group_id
                        ).run()

                    DummyAsyncTask(
                        wait_for_group_and_process_metadata,
                        image_group_id,
                        xmp_paths,
                        user.id,
                        False,
                        job_id,
                        len(image_paths),
                    ).run()

            # Validate: image tasks ran and each image must have its XMP associated to the same Photo
            total_completions = sum(DummyAsyncTask.GROUP_COMPLETIONS.values())
            self.assertEqual(
                total_completions,
                N,
                msg=f"Expected {N} image task completions, got {total_completions}",
            )

            photos = list(Photo.objects.all())
            self.assertEqual(
                len(photos), N, msg="All images should produce Photo objects"
            )

            # Build a map from image base name to whether an XMP is linked
            linked = {}
            for p in photos:
                # main_file.path is the image path
                main_path = p.main_file.path if p.main_file else ""
                base = os.path.splitext(os.path.basename(main_path))[0]
                xmp_list = list(
                    p.files.filter(path__endswith=".xmp").values_list("path", flat=True)
                )
                linked[base] = len(xmp_list) >= 1

            # All should be True
            self.assertTrue(
                all(linked.values()), msg=f"Some photos missing XMP: {linked}"
            )


================================================
FILE: api/tests/test_migration_0099.py
================================================
"""
Tests for migration 0099_photo_uuid_primary_key.

Verifies the UUID primary key migration works correctly on both
PostgreSQL (raw SQL) and SQLite (table recreation pattern).

Strategy:
- Migration 0099 is irreversible, so we cannot use the standard
  "roll back → seed → migrate forward" pattern.
- Instead we build a standalone in-memory SQLite database with the
  pre-migration schema, seed data, run the migration function
  directly, and verify the result (TestSQLiteMigration0099).
- We also verify the post-migration schema on the live Django test DB
  (which already had 0099 applied during test-database creation)
  in TestPostMigrationSchema.
- Helper functions are tested in isolation in TestSQLiteHelpers.
"""

import sqlite3
import uuid
from importlib import import_module
from unittest.mock import MagicMock, patch

from django.db import connection
from django.test import TestCase, TransactionTestCase

# Import the migration module (name starts with a digit, use importlib)
_mod = import_module("api.migrations.0099_photo_uuid_primary_key")


# ============================================================================
# Helpers
# ============================================================================

def _sqlite_table_exists(cursor, table_name):
    cursor.execute(
        "SELECT COUNT(*) FROM sqlite_master WHERE type='table' AND name=?",
        [table_name],
    )
    return cursor.fetchone()[0] > 0


def _sqlite_column_names(cursor, table_name):
    cursor.execute(f'PRAGMA table_info("{table_name}")')
    return {row[1] for row in cursor.fetchall()}


def _sqlite_pk_columns(cursor, table_name):
    cursor.execute(f'PRAGMA table_info("{table_name}")')
    return [row[1] for row in cursor.fetchall() if row[5]]


def _sqlite_index_exists(cursor, index_name):
    cursor.execute(
        "SELECT COUNT(*) FROM sqlite_master WHERE type='index' AND name=?",
        [index_name],
    )
    return cursor.fetchone()[0] > 0


# ============================================================================
# Pre-migration schema builder  (mimics the tables that exist at 0098)
# ============================================================================

_PRE_MIGRATION_DDL = """
CREATE TABLE api_photo (
    image_hash VARCHAR(64) NOT NULL PRIMARY KEY,
    hidden     INTEGER NOT NULL DEFAULT 0,
    rating     INTEGER NOT NULL DEFAULT 0,
    deleted    INTEGER NOT NULL DEFAULT 0,
    video      INTEGER NOT NULL DEFAULT 0
);

CREATE TABLE api_face (
    id                           INTEGER PRIMARY KEY AUTOINCREMENT,
    photo_id                     VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash),
    location_top                 INTEGER NOT NULL DEFAULT 0,
    location_bottom              INTEGER NOT NULL DEFAULT 0,
    location_left                INTEGER NOT NULL DEFAULT 0,
    location_right               INTEGER NOT NULL DEFAULT 0,
    deleted                      INTEGER NOT NULL DEFAULT 0,
    classification_probability   REAL NOT NULL DEFAULT 0.0,
    cluster_probability          REAL NOT NULL DEFAULT 0.0
);

CREATE TABLE api_thumbnail (
    photo_id     VARCHAR(64) NOT NULL PRIMARY KEY REFERENCES api_photo(image_hash),
    aspect_ratio REAL
);

CREATE TABLE api_photo_caption (
    photo_id VARCHAR(64) NOT NULL PRIMARY KEY REFERENCES api_photo(image_hash)
);

CREATE TABLE api_photo_search (
    photo_id VARCHAR(64) NOT NULL PRIMARY KEY REFERENCES api_photo(image_hash)
);

CREATE TABLE api_person (
    id             INTEGER PRIMARY KEY AUTOINCREMENT,
    name           TEXT NOT NULL,
    kind           TEXT NOT NULL DEFAULT 'USER',
    cover_photo_id VARCHAR(64) REFERENCES api_photo(image_hash),
    face_count     INTEGER NOT NULL DEFAULT 0
);

CREATE TABLE api_albumuser (
    id             INTEGER PRIMARY KEY AUTOINCREMENT,
    title          TEXT,
    cover_photo_id VARCHAR(64) REFERENCES api_photo(image_hash)
);

CREATE TABLE api_photo_shared_to (
    id       INTEGER PRIMARY KEY AUTOINCREMENT,
    photo_id VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash),
    user_id  INTEGER NOT NULL
);

CREATE TABLE api_photo_files (
    id       INTEGER PRIMARY KEY AUTOINCREMENT,
    photo_id VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash),
    file_id  INTEGER NOT NULL
);

CREATE TABLE api_albumuser_photos (
    id             INTEGER PRIMARY KEY AUTOINCREMENT,
    albumuser_id   INTEGER NOT NULL,
    photo_id       VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash)
);

CREATE TABLE api_albumthing_photos (
    id              INTEGER PRIMARY KEY AUTOINCREMENT,
    albumthing_id   INTEGER NOT NULL,
    photo_id        VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash)
);

CREATE TABLE api_albumplace_photos (
    id              INTEGER PRIMARY KEY AUTOINCREMENT,
    albumplace_id   INTEGER NOT NULL,
    photo_id        VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash)
);

CREATE TABLE api_albumdate_photos (
    id             INTEGER PRIMARY KEY AUTOINCREMENT,
    albumdate_id   INTEGER NOT NULL,
    photo_id       VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash)
);

CREATE TABLE api_albumauto_photos (
    id             INTEGER PRIMARY KEY AUTOINCREMENT,
    albumauto_id   INTEGER NOT NULL,
    photo_id       VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash)
);

CREATE TABLE api_albumthing_cover_photos (
    id              INTEGER PRIMARY KEY AUTOINCREMENT,
    albumthing_id   INTEGER NOT NULL,
    photo_id        VARCHAR(64) NOT NULL REFERENCES api_photo(image_hash)
);

CREATE TABLE api_photostack (
    id               TEXT PRIMARY KEY,
    primary_photo_id VARCHAR(64) REFERENCES api_photo(image_hash)
);

CREATE INDEX api_face_photo_id_old ON api_face(photo_id);
"""


def _build_test_db():
    """Create an in-memory SQLite DB with the pre-migration schema and seed data.

    Returns (connection, hashes) where hashes is a list of image_hash values.
    """
    conn = sqlite3.connect(":memory:")
    cur = conn.cursor()
    cur.executescript(_PRE_MIGRATION_DDL)

    hashes = [f"hash_{i:032d}" for i in range(1, 4)]
    for h in hashes:
        cur.execute(
            "INSERT INTO api_photo (image_hash) VALUES (?)", [h]
        )

    # face referencing photo 0
    cur.execute(
        "INSERT INTO api_face (photo_id, location_top, location_bottom, "
        "location_left, location_right, deleted, classification_probability, "
        "cluster_probability) VALUES (?, 0, 100, 0, 100, 0, 0.5, 0.5)",
        [hashes[0]],
    )
    # second face referencing photo 1
    cur.execute(
        "INSERT INTO api_face (photo_id, location_top, location_bottom, "
        "location_left, location_right, deleted, classification_probability, "
        "cluster_probability) VALUES (?, 10, 200, 10, 200, 0, 0.8, 0.3)",
        [hashes[1]],
    )
    # thumbnail for photo 0
    cur.execute("INSERT INTO api_thumbnail (photo_id, aspect_ratio) VALUES (?, 1.5)", [hashes[0]])
    # caption for photo 1
    cur.execute("INSERT INTO api_photo_caption (photo_id) VALUES (?)", [hashes[1]])
    # search for photo 2
    cur.execute("INSERT INTO api_photo_search (photo_id) VALUES (?)", [hashes[2]])
    # person with cover_photo
    cur.execute("INSERT INTO api_person (name, cover_photo_id) VALUES (?, ?)", ["Alice", hashes[0]])
    # album user with cover_photo
    cur.execute("INSERT INTO api_albumuser (title, cover_photo_id) VALUES (?, ?)", ["My Album", hashes[1]])
    # M2M entries
    cur.execute("INSERT INTO api_photo_shared_to (photo_id, user_id) VALUES (?, 1)", [hashes[0]])
    cur.execute("INSERT INTO api_albumuser_photos (albumuser_id, photo_id) VALUES (1, ?)", [hashes[0]])
    cur.execute("INSERT INTO api_albumthing_photos (albumthing_id, photo_id) VALUES (1, ?)", [hashes[1]])
    cur.execute("INSERT INTO api_albumplace_photos (albumplace_id, photo_id) VALUES (1, ?)", [hashes[2]])
    cur.execute("INSERT INTO api_albumdate_photos (albumdate_id, photo_id) VALUES (1, ?)", [hashes[0]])
    cur.execute("INSERT INTO api_albumauto_photos (albumauto_id, photo_id) VALUES (1, ?)", [hashes[1]])
    cur.execute("INSERT INTO api_albumthing_cover_photos (albumthing_id, photo_id) VALUES (1, ?)", [hashes[2]])
    cur.execute("INSERT INTO api_photostack (id, primary_photo_id) VALUES (?, ?)", ["stack-1", hashes[0]])

    conn.commit()
    return conn, hashes


def _run_migration_on(sqlite_conn):
    """Run the SQLite migration path on the given raw sqlite3 connection."""
    # _migrate_sqlite expects a Django-like schema_editor with
    # .connection.cursor() returning something with .execute/.fetchall.
    # We wrap the raw sqlite3 connection to match.
    class _CursorWrapper:
        """Thin adapter so _migrate_sqlite can call cursor.execute(sql, params)."""
        def __init__(self, raw_cursor):
            self._cur = raw_cursor
        def execute(self, sql, params=None):
            if params is None:
                return self._cur.execute(sql)
            return self._cur.execute(sql, params)
        def fetchall(self):
            return self._cur.fetchall()
        def fetchone(self):
            return self._cur.fetchone()

    class _ConnWrapper:
        def __init__(self, raw_conn):
            self._conn = raw_conn
            self.vendor = "sqlite"
        def cursor(self):
            return _CursorWrapper(self._conn.cursor())

    class _SchemaEditor:
        def __init__(self, raw_conn):
            self.connection = _ConnWrapper(raw_conn)

    _mod._migrate_sqlite(_SchemaEditor(sqlite_conn))
    sqlite_conn.commit()


# ============================================================================
# Test: Full end-to-end SQLite migration
# ============================================================================

class TestSQLiteMigration0099(TestCase):
    """
    End-to-end test of the SQLite migration path.

    Creates a standalone in-memory SQLite database with the pre-0099 schema,
    seeds test data, runs `_migrate_sqlite`, and verifies all changes.
    """

    @classmethod
    def setUpClass(cls):
        super().setUpClass()
        cls.conn, cls.hashes = _build_test_db()
        _run_migration_on(cls.conn)

    @classmethod
    def tearDownClass(cls):
        cls.conn.close()
        super().tearDownClass()

    def _cursor(self):
        return self.conn.cursor()

    # -- schema assertions -------------------------------------------------

    def test_photo_has_id_column(self):
        cur = self._cursor()
        cols = _sqlite_column_names(cur, "api_photo")
        self.assertIn("id", cols)

    def test_photo_has_image_hash_column(self):
        cur = self._cursor()
        cols = _sqlite_column_names(cur, "api_photo")
        self.assertIn("image_hash", cols)

    def test_photo_pk_is_id(self):
        cur = self._cursor()
        pk = _sqlite_pk_columns(cur, "api_photo")
        self.assertEqual(pk, ["id"])

    def test_image_hash_unique_index(self):
        cur = self._cursor()
        self.assertTrue(_sqlite_index_exists(cur, "api_photo_image_hash_unique"))

    def test_performance_indexes(self):
        expected = [
            "api_face_photo_id_idx",
            "api_photo_shared_to_photo_id_idx",
            "api_photo_files_photo_id_idx",
            "api_person_cover_photo_id_idx",
            "api_albumuser_cover_photo_id_idx",
            "api_photostack_primary_photo_id_idx",
        ]
        cur = self._cursor()
        for idx in expected:
            self.assertTrue(
                _sqlite_index_exists(cur, idx),
                f"Missing index: {idx}",
            )

    # -- data assertions ---------------------------------------------------

    def test_all_photos_have_valid_uuids(self):
        cur = self._cursor()
        cur.execute('SELECT "id" FROM api_photo')
        rows = cur.fetchall()
        self.assertEqual(len(rows), 3)
        for (photo_id,) in rows:
            uuid.UUID(photo_id)  # will raise if invalid

    def test_image_hashes_preserved(self):
        cur = self._cursor()
        cur.execute('SELECT "image_hash" FROM api_photo ORDER BY image_hash')
        actual = [r[0] for r in cur.fetchall()]
        self.assertEqual(actual, sorted(self.hashes))

    def test_each_photo_has_distinct_uuid(self):
        cur = self._cursor()
        cur.execute('SELECT "id" FROM api_photo')
        ids = [r[0] for r in cur.fetchall()]
        self.assertEqual(len(ids), len(set(ids)))

    def test_face_fk_translated(self):
        """Faces should join to photos via the new UUID id."""
        cur = self._cursor()
        cur.execute(
            'SELECT f.photo_id, p.id FROM api_face f '
            'JOIN api_photo p ON f.photo_id = p.id'
        )
        rows = cur.fetchall()
        self.assertEqual(len(rows), 2)
        for fk, pk in rows:
            self.assertEqual(fk, pk)
            uuid.UUID(fk)

    def test_no_orphan_faces(self):
        cur = self._cursor()
        cur.execute(
            'SELECT COUNT(*) FROM api_face f '
            'LEFT JOIN api_photo p ON f.photo_id = p.id '
            'WHERE p.id IS NULL'
        )
        self.assertEqual(cur.fetchone()[0], 0)

    def test_thumbnail_fk_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT t.photo_id, p.id FROM api_thumbnail t '
            'JOIN api_photo p ON t.photo_id = p.id'
        )
        rows = cur.fetchall()
        self.assertEqual(len(rows), 1)
        self.assertEqual(rows[0][0], rows[0][1])

    def test_photo_caption_fk_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT c.photo_id, p.id FROM api_photo_caption c '
            'JOIN api_photo p ON c.photo_id = p.id'
        )
        rows = cur.fetchall()
        self.assertEqual(len(rows), 1)

    def test_photo_search_fk_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT s.photo_id, p.id FROM api_photo_search s '
            'JOIN api_photo p ON s.photo_id = p.id'
        )
        rows = cur.fetchall()
        self.assertEqual(len(rows), 1)

    def test_person_cover_photo_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT per.cover_photo_id, p.id FROM api_person per '
            'JOIN api_photo p ON per.cover_photo_id = p.id'
        )
        rows = cur.fetchall()
        self.assertEqual(len(rows), 1)
        uuid.UUID(rows[0][0])

    def test_albumuser_cover_photo_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT a.cover_photo_id, p.id FROM api_albumuser a '
            'JOIN api_photo p ON a.cover_photo_id = p.id'
        )
        rows = cur.fetchall()
        self.assertEqual(len(rows), 1)

    def test_m2m_shared_to_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT s.photo_id, p.id FROM api_photo_shared_to s '
            'JOIN api_photo p ON s.photo_id = p.id'
        )
        self.assertEqual(len(cur.fetchall()), 1)

    def test_m2m_albumuser_photos_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT a.photo_id, p.id FROM api_albumuser_photos a '
            'JOIN api_photo p ON a.photo_id = p.id'
        )
        self.assertEqual(len(cur.fetchall()), 1)

    def test_m2m_albumthing_photos_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT a.photo_id, p.id FROM api_albumthing_photos a '
            'JOIN api_photo p ON a.photo_id = p.id'
        )
        self.assertEqual(len(cur.fetchall()), 1)

    def test_m2m_albumplace_photos_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT a.photo_id, p.id FROM api_albumplace_photos a '
            'JOIN api_photo p ON a.photo_id = p.id'
        )
        self.assertEqual(len(cur.fetchall()), 1)

    def test_m2m_albumdate_photos_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT a.photo_id, p.id FROM api_albumdate_photos a '
            'JOIN api_photo p ON a.photo_id = p.id'
        )
        self.assertEqual(len(cur.fetchall()), 1)

    def test_m2m_albumauto_photos_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT a.photo_id, p.id FROM api_albumauto_photos a '
            'JOIN api_photo p ON a.photo_id = p.id'
        )
        self.assertEqual(len(cur.fetchall()), 1)

    def test_albumthing_cover_photos_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT a.photo_id, p.id FROM api_albumthing_cover_photos a '
            'JOIN api_photo p ON a.photo_id = p.id'
        )
        self.assertEqual(len(cur.fetchall()), 1)

    def test_photostack_primary_photo_translated(self):
        cur = self._cursor()
        cur.execute(
            'SELECT s.primary_photo_id, p.id FROM api_photostack s '
            'JOIN api_photo p ON s.primary_photo_id = p.id'
        )
        rows = cur.fetchall()
        self.assertEqual(len(rows), 1)
        uuid.UUID(rows[0][0])


# ============================================================================
# Test: Post-migration schema on the live Django test database
# ============================================================================

class TestPostMigrationSchema(TestCase):
    """
    Verify the Django test DB (where migration 0099 already ran during
    test database creation) has the expected post-migration schema.

    This validates that the migration ran successfully on whatever backend
    the test suite is configured with (SQLite via test_sqlite settings).
    """

    def test_photo_table_has_id_and_image_hash(self):
        with connection.cursor() as cursor:
            if connection.vendor == "sqlite":
                cursor.execute('PRAGMA table_info("api_photo")')
                cols = {row[1] for row in cursor.fetchall()}
            else:
                cursor.execute(
                    "SELECT column_name FROM information_schema.columns "
                    "WHERE table_name = 'api_photo'"
                )
                cols = {row[0] for row in cursor.fetchall()}
        self.assertIn("id", cols)
        self.assertIn("image_hash", cols)

    def test_photo_pk_is_uuid_field(self):
        """Verify Django's ORM sees the PK as a UUID field named 'id'."""
        from api.models import Photo
        pk_field = Photo._meta.pk
        self.assertEqual(pk_field.name, "id")
        self.assertIsInstance(pk_field, __import__("django").db.models.UUIDField)


# ============================================================================
# Test: Dispatch and reverse logic
# ============================================================================

class TestMigrationDispatch(TestCase):
    """Test migrate_forward dispatch and migrate_reverse error."""

    def test_dispatches_to_sqlite(self):
        mock_editor = MagicMock()
        mock_editor.connection.vendor = "sqlite"
        with patch.object(_mod, "_migrate_sqlite") as mock_fn:
            _mod.migrate_forward(MagicMock(), mock_editor)
            mock_fn.assert_called_once_with(mock_editor)

    def test_dispatches_to_postgresql(self):
        mock_editor = MagicMock()
        mock_editor.connection.vendor = "postgresql"
        with patch.object(_mod, "_migrate_postgresql") as mock_fn:
            _mod.migrate_forward(MagicMock(), mock_editor)
            mock_fn.assert_called_once_with(mock_editor)

    def test_rejects_unknown_backend(self):
        mock_editor = MagicMock()
        mock_editor.connection.vendor = "oracle"
        with self.assertRaises(ValueError):
            _mod.migrate_forward(MagicMock(), mock_editor)

    def test_reverse_raises_runtime_error(self):
        with self.assertRaises(RuntimeError):
            _mod.migrate_reverse(MagicMock(), MagicMock())


# ============================================================================
# Test: SQLite helper functions in isolation
# ============================================================================

class TestSQLiteHelpers(TestCase):
    """Unit tests for the individual SQLite helper functions."""

    def test_column_info(self):
        if connection.vendor != "sqlite":
            self.skipTest("SQLite-specific")
        with connection.cursor() as cur:
            cur.execute(
                "CREATE TABLE IF NOT EXISTS _t_col "
                "(pk INTEGER PRIMARY KEY, name TEXT NOT NULL, val REAL)"
            )
            cols = _mod._sqlite_column_info(cur, "_t_col")
            cur.execute("DROP TABLE IF EXISTS _t_col")
        self.assertEqual({c[1] for c in cols}, {"pk", "name", "val"})

    def test_index_info(self):
        if connection.vendor != "sqlite":
            self.skipTest("SQLite-specific")
        with connection.cursor() as cur:
            cur.execute("CREATE TABLE IF NOT EXISTS _t_idx (a TEXT, b TEXT)")
            cur.execute("CREATE INDEX IF NOT EXISTS _t_idx_a ON _t_idx(a)")
            idxs = _mod._sqlite_index_info(cur, "_t_idx")
            cur.execute("DROP TABLE IF EXISTS _t_idx")
        self.assertIn("_t_idx_a", [i[0] for i in idxs])

    def test_recreate_table_changes_pk(self):
        if connection.vendor != "sqlite":
            self.skipTest("SQLite-specific")
        with connection.cursor() as cur:
            cur.execute(
                "CREATE TABLE _t_rec (old_pk TEXT PRIMARY KEY, new_pk TEXT, data TEXT)"
            )
            cur.execute("INSERT INTO _t_rec VALUES ('h1', 'u1', 'a')")
            cur.execute("INSERT INTO _t_rec VALUES ('h2', 'u2', 'b')")

            _mod._sqlite_recreate_table(
                cur, "_t_rec", pk_column="new_pk",
                column_overrides={
                    "new_pk": '"new_pk" TEXT NOT NULL',
                    "old_pk": '"old_pk" TEXT NOT NULL UNIQUE',
                },
            )
            pk = _sqlite_pk_columns(cur, "_t_rec")
            self.assertEqual(pk, ["new_pk"])
            cur.execute("SELECT old_pk, new_pk, data FROM _t_rec ORDER BY old_pk")
            self.assertEqual(cur.fetchall(), [("h1", "u1", "a"), ("h2", "u2", "b")])
            cur.execute("DROP TABLE _t_rec")

    def test_update_fk_table_translates_values(self):
        if connection.vendor != "sqlite":
            self.skipTest("SQLite-specific")
        with connection.cursor() as cur:
            cur.execute("CREATE TABLE _t_parent (id TEXT PRIMARY KEY)")
            cur.execute("INSERT INTO _t_parent VALUES ('uuid-a')")
            cur.execute(
                "CREATE TABLE _t_child (id INTEGER PRIMARY KEY, fk TEXT, info TEXT)"
            )
            cur.execute("INSERT INTO _t_child (fk, info) VALUES ('old', 'r1')")
            cur.execute("INSERT INTO _t_child (fk, info) VALUES ('old', 'r2')")

            _mod._sqlite_update_fk_table(cur, "_t_child", "fk", {"old": "uuid-a"})

            cur.execute("SELECT fk FROM _t_child")
            self.assertTrue(all(r[0] == "uuid-a" for r in cur.fetchall()))
            cur.execute("DROP TABLE _t_child")
            cur.execute("DROP TABLE _t_parent")

    def test_update_fk_table_skips_missing_table(self):
        if connection.vendor != "sqlite":
            self.skipTest("SQLite-specific")
        with connection.cursor() as cur:
            # Should not raise
            _mod._sqlite_update_fk_table(cur, "_no_such_table_999", "col", {"a": "b"})


================================================
FILE: api/tests/test_migration_0101.py
================================================
"""
Test for migration 0101_populate_photo_metadata to ensure it works correctly.

This test verifies:
1. The fix for the PostgreSQL error: "operator does not exist: uuid = character varying"
2. The fix for the SQLite issue: cursor-during-writes conflict with iterator() + writes
"""
from importlib import import_module

from django.db import models
from django.db.models import Exists, OuterRef, Subquery
from django.test import TestCase

from api.models import Photo
from api.models.photo_caption import PhotoCaption
from api.models.photo_metadata import PhotoMetadata
from api.tests.utils import create_test_photo, create_test_user

_migration = import_module("api.migrations.0101_populate_photo_metadata")
BATCH_SIZE = _migration.BATCH_SIZE


class Migration0101TestCase(TestCase):
    """Test the migration logic for populating PhotoMetadata."""

    def setUp(self):
        """Set up test data."""
        self.user = create_test_user()

    def test_subquery_with_uuid_primary_key(self):
        """
        Test that the subquery correctly references the UUID primary key.
        
        This test ensures the fix for the PostgreSQL error where
        photo_id (UUID) was incorrectly compared with image_hash (VARCHAR).
        """
        # Create a photo with caption
        photo = create_test_photo(
            owner=self.user,
            captions_json={"user_caption": "Test caption", "keywords": ["test"]},
        )

        # Verify the caption was created
        self.assertTrue(PhotoCaption.objects.filter(photo=photo).exists())

        # Test the subquery pattern from the migration (FIXED version)
        caption_subquery = PhotoCaption.objects.filter(
            photo_id=OuterRef('pk')  # Using 'pk' (UUID) instead of 'image_hash' (VARCHAR)
        ).values('captions_json')[:1]

        # Query photos with the subquery annotation
        photos = Photo.objects.annotate(
            captions_data=Subquery(caption_subquery)
        ).filter(pk=photo.pk)

        # Verify the query works without PostgreSQL type errors
        self.assertEqual(photos.count(), 1)
        photo_with_caption = photos.first()
        self.assertIsNotNone(photo_with_caption.captions_data)
        self.assertEqual(
            photo_with_caption.captions_data.get("user_caption"),
            "Test caption"
        )

    def test_migration_logic_creates_metadata(self):
        """
        Test the full migration logic to ensure PhotoMetadata is populated.
        """
        # Create photos without metadata
        photo1 = create_test_photo(
            owner=self.user,
            captions_json={"user_caption": "First photo"},
        )
        photo2 = create_test_photo(
            owner=self.user,
            captions_json={"user_caption": "Second photo", "keywords": ["tag1", "tag2"]},
        )

        # Manually delete any metadata that might have been auto-created
        PhotoMetadata.objects.filter(photo__in=[photo1, photo2]).delete()

        # Verify no metadata exists
        self.assertFalse(PhotoMetadata.objects.filter(photo=photo1).exists())
        self.assertFalse(PhotoMetadata.objects.filter(photo=photo2).exists())

        # Simulate the migration logic
        caption_subquery = PhotoCaption.objects.filter(
            photo_id=OuterRef('pk')
        ).values('captions_json')[:1]

        existing_metadata = PhotoMetadata.objects.filter(photo_id=OuterRef('pk'))

        photos = Photo.objects.filter(
            ~models.Exists(existing_metadata)
        ).annotate(
            captions_data=Subquery(caption_subquery)
        )

        # Create PhotoMetadata for each photo
        for photo in photos:
            captions_json = photo.captions_data
            PhotoMetadata.objects.create(
                photo=photo,
                caption=captions_json.get("user_caption") if captions_json else None,
                keywords=list(captions_json.get("keywords", [])) if captions_json else [],
                source="embedded",
                version=1,
            )

        # Verify metadata was created
        self.assertTrue(PhotoMetadata.objects.filter(photo=photo1).exists())
        self.assertTrue(PhotoMetadata.objects.filter(photo=photo2).exists())

        # Verify caption data was correctly populated
        metadata1 = PhotoMetadata.objects.get(photo=photo1)
        self.assertEqual(metadata1.caption, "First photo")

        metadata2 = PhotoMetadata.objects.get(photo=photo2)
        self.assertEqual(metadata2.caption, "Second photo")
        self.assertEqual(metadata2.keywords, ["tag1", "tag2"])

    def test_batch_processing_without_iterator(self):
        """
        Test the fixed migration approach: fetch IDs upfront, process in batches.

        This tests the SQLite-compatible pattern where:
        - All photo IDs are collected first (no open cursor during writes)
        - Caption data is loaded per-batch
        - No iterator() is used alongside writes
        - Photos with pre-existing metadata are correctly excluded
        """
        photo1 = create_test_photo(
            owner=self.user,
            captions_json={"user_caption": "Batch photo 1", "keywords": ["a"]},
        )
        photo2 = create_test_photo(
            owner=self.user,
            captions_json={"user_caption": "Batch photo 2", "keywords": ["b", "c"]},
        )
        photo3 = create_test_photo(owner=self.user)  # no caption

        # photo_already_done has pre-existing metadata — should be excluded
        photo_already_done = create_test_photo(owner=self.user)
        PhotoMetadata.objects.filter(photo=photo_already_done).delete()
        existing_meta = PhotoMetadata.objects.create(
            photo=photo_already_done,
            caption="pre-existing",
            source="embedded",
            version=1,
        )

        PhotoMetadata.objects.filter(photo__in=[photo1, photo2, photo3]).delete()

        # --- Simulate the fixed migration approach ---
        existing_metadata = PhotoMetadata.objects.filter(photo_id=OuterRef('pk'))
        photo_ids = list(
            Photo.objects
            .filter(~Exists(existing_metadata))
            .values_list('pk', flat=True)
        )

        all_batch = []
        for chunk_start in range(0, len(photo_ids), BATCH_SIZE):
            chunk_ids = photo_ids[chunk_start:chunk_start + BATCH_SIZE]
            captions = {
                c.photo_id: c.captions_json
                for c in PhotoCaption.objects.filter(photo_id__in=chunk_ids)
            }
            batch = []
            for photo in Photo.objects.filter(pk__in=chunk_ids):
                captions_json = captions.get(photo.pk)
                batch.append(PhotoMetadata(
                    photo=photo,
                    caption=captions_json.get("user_caption") if captions_json else None,
                    keywords=list(captions_json.get("keywords", [])) if captions_json else [],
                    source="embedded",
                    version=1,
                ))
            PhotoMetadata.objects.bulk_create(batch, ignore_conflicts=True)
            all_batch.extend(batch)

        # All three photos must have metadata
        self.assertTrue(PhotoMetadata.objects.filter(photo=photo1).exists())
        self.assertTrue(PhotoMetadata.objects.filter(photo=photo2).exists())
        self.assertTrue(PhotoMetadata.objects.filter(photo=photo3).exists())

        m1 = PhotoMetadata.objects.get(photo=photo1)
        self.assertEqual(m1.caption, "Batch photo 1")
        self.assertEqual(m1.keywords, ["a"])

        m2 = PhotoMetadata.objects.get(photo=photo2)
        self.assertEqual(m2.caption, "Batch photo 2")
        self.assertEqual(m2.keywords, ["b", "c"])

        m3 = PhotoMetadata.objects.get(photo=photo3)
        self.assertIsNone(m3.caption)
        self.assertEqual(m3.keywords, [])

        # photo_already_done must NOT have been re-processed — exactly one record,
        # the pre-existing one, and its caption must still be the original value.
        self.assertEqual(PhotoMetadata.objects.filter(photo=photo_already_done).count(), 1)
        existing_meta.refresh_from_db()
        self.assertEqual(existing_meta.caption, "pre-existing")

    def test_batch_processing_is_idempotent(self):
        """
        Running the batch-based migration approach twice should not duplicate records.
        """
        photo = create_test_photo(
            owner=self.user,
            captions_json={"user_caption": "Idempotent test"},
        )
        PhotoMetadata.objects.filter(photo=photo).delete()

        def run_migration_logic():
            existing_metadata = PhotoMetadata.objects.filter(photo_id=OuterRef('pk'))
            photo_ids = list(
                Photo.objects
                .filter(~Exists(existing_metadata))
                .values_list('pk', flat=True)
            )
            captions = {
                c.photo_id: c.captions_json
                for c in PhotoCaption.objects.filter(photo_id__in=photo_ids)
            }
            batch = []
            for p in Photo.objects.filter(pk__in=photo_ids):
                captions_json = captions.get(p.pk)
                batch.append(PhotoMetadata(
                    photo=p,
                    caption=captions_json.get("user_caption") if captions_json else None,
                    keywords=list(captions_json.get("keywords", [])) if captions_json else [],
                    source="embedded",
                    version=1,
                ))
            PhotoMetadata.objects.bulk_create(batch, ignore_conflicts=True)

        run_migration_logic()
        self.assertEqual(PhotoMetadata.objects.filter(photo=photo).count(), 1)

        # Second run: the photo already has metadata, so it should be skipped
        run_migration_logic()
        self.assertEqual(PhotoMetadata.objects.filter(photo=photo).count(), 1)

    def test_bulk_create_ignore_conflicts_on_duplicate(self):
        """
        Verify that bulk_create(ignore_conflicts=True) silently skips duplicate records.

        This tests the safety net used in each batch: if for any reason a
        PhotoMetadata record already exists for a photo in the batch (e.g. a
        partially-applied migration is retried), the insert is ignored rather
        than raising an IntegrityError.
        """
        photo = create_test_photo(owner=self.user)
        PhotoMetadata.objects.filter(photo=photo).delete()

        first = PhotoMetadata(photo=photo, source="embedded", version=1)
        PhotoMetadata.objects.bulk_create([first], ignore_conflicts=True)
        self.assertEqual(PhotoMetadata.objects.filter(photo=photo).count(), 1)

        # Attempt to insert the same photo again — must not raise
        duplicate = PhotoMetadata(photo=photo, source="embedded", version=1)
        PhotoMetadata.objects.bulk_create([duplicate], ignore_conflicts=True)
        self.assertEqual(PhotoMetadata.objects.filter(photo=photo).count(), 1)


================================================
FILE: api/tests/test_multi_user_isolation.py
================================================
"""
Tests for multi-user isolation and security.

Ensures that:
- Users can only see/modify their own duplicates and stacks
- Shared photos don't leak into other users' detection
- Admin access is properly scoped
- Cross-user operations are blocked
"""

from django.test import TestCase
from rest_framework.test import APIClient, APITestCase

from api.models.duplicate import Duplicate
from api.models.photo_stack import PhotoStack
from api.tests.utils import create_test_photo, create_test_user


class DuplicateUserIsolationTestCase(APITestCase):
    """Test that duplicates are properly scoped to users."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.admin = create_test_user()
        self.admin.is_staff = True
        self.admin.save()
        
        self.client = APIClient()

    def test_user_cannot_see_other_user_duplicates(self):
        """Test that users can only see their own duplicates."""
        # Create duplicate for user2
        photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user2,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        # Login as user1
        self.client.force_authenticate(user=self.user1)
        
        # Try to access duplicate list
        response = self.client.get("/api/duplicates")
        self.assertEqual(response.status_code, 200)
        
        # Should not see user2's duplicate
        dup_ids = [d["id"] for d in response.data.get("results", [])]
        self.assertNotIn(str(dup.id), dup_ids)

    def test_user_cannot_access_other_user_duplicate_detail(self):
        """Test that users cannot access other users' duplicate details."""
        photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user2,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        self.client.force_authenticate(user=self.user1)
        
        response = self.client.get(f"/api/duplicates/{dup.id}")
        self.assertIn(response.status_code, [403, 404])

    def test_user_cannot_resolve_other_user_duplicate(self):
        """Test that users cannot resolve other users' duplicates."""
        photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user2,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        self.client.force_authenticate(user=self.user1)
        
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            {"kept_photo_id": str(photos[0].pk)},
            format="json"
        )
        self.assertIn(response.status_code, [403, 404])

    def test_user_cannot_delete_other_user_duplicate(self):
        """Test that users cannot delete other users' duplicates."""
        photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user2,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        self.client.force_authenticate(user=self.user1)
        
        response = self.client.delete(f"/api/duplicates/{dup.id}/delete")
        self.assertIn(response.status_code, [403, 404])
        
        # Duplicate should still exist
        self.assertTrue(Duplicate.objects.filter(pk=dup.pk).exists())

    def test_admin_can_see_duplicate_stats(self):
        """Test that admin can see global stats."""
        # Create duplicates for different users
        for user in [self.user1, self.user2]:
            photos = [create_test_photo(owner=user) for _ in range(2)]
            dup = Duplicate.objects.create(
                owner=user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            )
            dup.photos.add(*photos)
        
        self.client.force_authenticate(user=self.admin)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)


class StackUserIsolationTestCase(APITestCase):
    """Test that stacks are properly scoped to users."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client = APIClient()

    def test_user_cannot_see_other_user_stacks(self):
        """Test that users can only see their own stacks."""
        # Create stack for user2
        photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        stack = PhotoStack.objects.create(
            owner=self.user2,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(*photos)
        
        self.client.force_authenticate(user=self.user1)
        
        response = self.client.get("/api/stacks")
        self.assertEqual(response.status_code, 200)
        
        stack_ids = [s["id"] for s in response.data.get("results", [])]
        self.assertNotIn(str(stack.id), stack_ids)

    def test_user_cannot_access_other_user_stack_detail(self):
        """Test that users cannot access other users' stack details."""
        photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        stack = PhotoStack.objects.create(
            owner=self.user2,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(*photos)
        
        self.client.force_authenticate(user=self.user1)
        
        response = self.client.get(f"/api/stacks/{stack.id}")
        self.assertIn(response.status_code, [403, 404])

    def test_user_cannot_modify_other_user_stack(self):
        """Test that users cannot modify other users' stacks."""
        photos = [create_test_photo(owner=self.user2) for _ in range(3)]
        stack = PhotoStack.objects.create(
            owner=self.user2,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos[:2])
        
        self.client.force_authenticate(user=self.user1)
        
        # Try to add a photo
        response = self.client.post(
            f"/api/stacks/{stack.id}/add",
            {"photo_ids": [str(photos[2].pk)]},
            format="json"
        )
        self.assertIn(response.status_code, [403, 404])

    def test_user_cannot_delete_other_user_stack(self):
        """Test that users cannot delete other users' stacks."""
        photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        stack = PhotoStack.objects.create(
            owner=self.user2,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        self.client.force_authenticate(user=self.user1)
        
        response = self.client.delete(f"/api/stacks/{stack.id}/delete")
        self.assertIn(response.status_code, [403, 404])
        
        # Stack should still exist
        self.assertTrue(PhotoStack.objects.filter(pk=stack.pk).exists())

    def test_user_cannot_create_stack_with_other_user_photos(self):
        """Test that users cannot create stacks with other users' photos."""
        other_photos = [create_test_photo(owner=self.user2) for _ in range(2)]
        
        self.client.force_authenticate(user=self.user1)
        
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_ids": [str(p.pk) for p in other_photos]},
            format="json"
        )
        # Should either fail or create empty stack
        if response.status_code == 201:
            # If created, should have no photos
            stack_id = response.data.get("id")
            if stack_id:
                stack = PhotoStack.objects.get(pk=stack_id)
                self.assertEqual(stack.photos.count(), 0)
        else:
            self.assertIn(response.status_code, [400, 403, 404])


class SharedPhotoIsolationTestCase(TestCase):
    """Test that shared photos don't affect personal stacks/duplicates."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()

    def test_shared_photo_not_in_receiver_stacks(self):
        """Test that photos shared TO a user don't appear in their stack detection."""
        # Create photo for user1
        photo1 = create_test_photo(owner=self.user1)
        
        # Share with user2
        photo1.shared_to.add(self.user2)
        
        # Create a stack for user1
        photo2 = create_test_photo(owner=self.user1)
        stack = PhotoStack.objects.create(
            owner=self.user1,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        # User2 should not see this stack
        user2_stacks = PhotoStack.objects.filter(owner=self.user2)
        self.assertEqual(user2_stacks.count(), 0)

    def test_shared_photo_not_in_receiver_duplicates(self):
        """Test that shared photos don't appear in receiver's duplicate detection."""
        # Create photos for user1
        photos = [create_test_photo(owner=self.user1) for _ in range(2)]
        
        # Create duplicate group for user1
        dup = Duplicate.objects.create(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        # Share one photo with user2
        photos[0].shared_to.add(self.user2)
        
        # User2 should not see this duplicate
        user2_dups = Duplicate.objects.filter(owner=self.user2)
        self.assertEqual(user2_dups.count(), 0)

    def test_user_stack_unaffected_by_shared_photos(self):
        """Test that user's own stacks aren't affected by sharing."""
        # Create stack for user1
        photos = [create_test_photo(owner=self.user1) for _ in range(3)]
        stack = PhotoStack.objects.create(
            owner=self.user1,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(*photos)
        
        # Share one photo
        photos[0].shared_to.add(self.user2)
        
        # Stack should still have all 3 photos
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 3)


class DetectionUserIsolationTestCase(APITestCase):
    """Test that detection operations are properly isolated."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client = APIClient()

    def test_duplicate_detection_only_affects_own_photos(self):
        """Test that duplicate detection only processes user's own photos."""
        # Create photos for both users with same hash (simulating duplicates)
        photo1_u1 = create_test_photo(owner=self.user1)
        photo2_u1 = create_test_photo(owner=self.user1)
        photo1_u2 = create_test_photo(owner=self.user2)
        photo2_u2 = create_test_photo(owner=self.user2)
        
        # Set same perceptual hash to simulate visual duplicates
        same_hash = "0" * 16
        for photo in [photo1_u1, photo2_u1, photo1_u2, photo2_u2]:
            photo.image_phash = same_hash
            photo.save()
        
        self.client.force_authenticate(user=self.user1)
        
        # Trigger detection for user1
        response = self.client.post("/api/duplicates/detect")
        self.assertIn(response.status_code, [200, 202])
        
        # User2's photos should not be in user1's duplicates
        user1_dups = Duplicate.objects.filter(owner=self.user1)
        for dup in user1_dups:
            for photo in dup.photos.all():
                self.assertEqual(photo.owner, self.user1)

    def test_stack_detection_only_affects_own_photos(self):
        """Test that stack detection only processes user's own photos."""
        # Create photos for both users
        for _ in range(3):
            create_test_photo(owner=self.user1)
            create_test_photo(owner=self.user2)
        
        self.client.force_authenticate(user=self.user1)
        
        # Trigger stack detection for user1
        response = self.client.post("/api/stacks/detect")
        self.assertIn(response.status_code, [200, 202])
        
        # User2 should have no stacks created
        user2_stacks = PhotoStack.objects.filter(owner=self.user2)
        self.assertEqual(user2_stacks.count(), 0)


class CrossUserOperationTestCase(APITestCase):
    """Test that cross-user operations are properly blocked."""

    def setUp(self):
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client = APIClient()

    def test_cannot_add_other_user_photo_to_own_stack(self):
        """Test that users cannot add other users' photos to their stacks."""
        own_photos = [create_test_photo(owner=self.user1) for _ in range(2)]
        other_photo = create_test_photo(owner=self.user2)
        
        stack = PhotoStack.objects.create(
            owner=self.user1,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*own_photos)
        
        self.client.force_authenticate(user=self.user1)
        
        _response = self.client.post(
            f"/api/stacks/{stack.id}/add",
            {"photo_ids": [str(other_photo.pk)]},
            format="json"
        )
        
        # Should either fail or not add the photo
        stack.refresh_from_db()
        self.assertNotIn(other_photo, stack.photos.all())

    def test_cannot_resolve_duplicate_with_other_user_photo(self):
        """Test that users cannot resolve duplicates by keeping other user's photo."""
        photos = [create_test_photo(owner=self.user1) for _ in range(2)]
        other_photo = create_test_photo(owner=self.user2)
        
        dup = Duplicate.objects.create(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        self.client.force_authenticate(user=self.user1)
        
        # Try to resolve keeping other user's photo
        response = self.client.post(
            f"/api/duplicates/{dup.id}/resolve",
            {"kept_photo_id": str(other_photo.pk)},
            format="json"
        )
        
        # Should fail
        self.assertIn(response.status_code, [400, 403, 404])

    def test_cannot_set_other_user_photo_as_stack_primary(self):
        """Test that users cannot set other user's photo as stack primary."""
        own_photos = [create_test_photo(owner=self.user1) for _ in range(2)]
        other_photo = create_test_photo(owner=self.user2)
        
        stack = PhotoStack.objects.create(
            owner=self.user1,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*own_photos)
        
        self.client.force_authenticate(user=self.user1)
        
        _response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            {"photo_id": str(other_photo.pk)},
            format="json"
        )
        
        # Should fail or not set the photo
        stack.refresh_from_db()
        self.assertNotEqual(stack.primary_photo, other_photo)


class AdminAccessTestCase(APITestCase):
    """Test admin access and capabilities."""

    def setUp(self):
        self.user = create_test_user()
        self.admin = create_test_user()
        self.admin.is_staff = True
        self.admin.save()
        self.client = APIClient()

    def test_admin_can_view_stats_for_all_users(self):
        """Test that admin can view aggregate stats."""
        # Create data for regular user
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        self.client.force_authenticate(user=self.admin)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)

    def test_regular_user_sees_only_own_stats(self):
        """Test that regular users only see their own stats."""
        # Create data for admin
        admin_photos = [create_test_photo(owner=self.admin) for _ in range(2)]
        admin_dup = Duplicate.objects.create(
            owner=self.admin,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        admin_dup.photos.add(*admin_photos)
        
        # Create data for user
        user_photos = [create_test_photo(owner=self.user) for _ in range(2)]
        user_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        user_dup.photos.add(*user_photos)
        
        self.client.force_authenticate(user=self.user)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        
        # Stats should reflect only user's data
        # The exact assertion depends on the stats endpoint response format


================================================
FILE: api/tests/test_only_photos_or_only_videos.py
================================================
from django.test import TestCase
from django.utils import timezone
from rest_framework.test import APIClient

from api.models.album_date import AlbumDate
from api.tests.utils import create_test_photo, create_test_user


class OnlyPhotosOrOnlyVideosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)

    def test_only_photos(self):
        now = timezone.now()
        photo = create_test_photo(owner=self.user, added_on=now, public=True)

        album = AlbumDate(owner=self.user)
        album.id = 1
        album.photos.add(photo)
        album.save()

        response = self.client.get("/api/albums/date/list?photo=true").url
        response = self.client.get(response)

        data = response.json()
        self.assertEqual(1, len(data["results"]))


================================================
FILE: api/tests/test_perceptual_hash.py
================================================
"""
Comprehensive tests for api/perceptual_hash.py

Tests the perceptual hashing algorithm used for visual duplicate detection:
- calculate_perceptual_hash: Calculates pHash from image files
- calculate_hash_from_thumbnail: Wrapper for thumbnail hashing
- hamming_distance: Calculates bit difference between hashes
- are_duplicates: Determines if two images are duplicates based on hash similarity
- find_similar_hashes: Finds all similar hashes in a list
"""

import os
import tempfile
from unittest.mock import patch

from django.test import TestCase
from PIL import Image

from api.perceptual_hash import (
    DEFAULT_HAMMING_THRESHOLD,
    are_duplicates,
    calculate_hash_from_thumbnail,
    calculate_perceptual_hash,
    find_similar_hashes,
    hamming_distance,
)


class HammingDistanceTestCase(TestCase):
    """Tests for the hamming_distance function."""

    def test_identical_hashes_return_zero(self):
        """Identical hashes should have distance 0."""
        hash1 = "a" * 16  # 64-bit hash as 16 hex chars
        self.assertEqual(hamming_distance(hash1, hash1), 0)

    def test_completely_different_hashes(self):
        """Completely different hashes should have maximum distance (64 for 64-bit hash)."""
        # 0000...0000 vs FFFF...FFFF
        hash1 = "0" * 16
        hash2 = "f" * 16
        distance = hamming_distance(hash1, hash2)
        self.assertEqual(distance, 64)  # All 64 bits different

    def test_one_bit_difference(self):
        """Hashes differing by one bit should have distance 1."""
        # 0x0 = 0000 in binary, 0x1 = 0001 in binary - 1 bit different
        hash1 = "0" * 16
        hash2 = "0" * 15 + "1"
        distance = hamming_distance(hash1, hash2)
        self.assertEqual(distance, 1)

    def test_half_bits_different(self):
        """Test hashes with approximately half the bits different."""
        # 0 = 0000, a = 1010 - 2 bits different per hex char
        hash1 = "0" * 16
        hash2 = "a" * 16  # 2 bits per char * 16 chars = 32 bits
        distance = hamming_distance(hash1, hash2)
        self.assertEqual(distance, 32)

    def test_invalid_hash_returns_max_distance(self):
        """Invalid hash strings should return maximum distance (64)."""
        distance = hamming_distance("invalid", "hash")
        self.assertEqual(distance, 64)

    def test_empty_strings_return_max_distance(self):
        """Empty strings should return maximum distance."""
        distance = hamming_distance("", "")
        self.assertEqual(distance, 64)

    def test_mixed_valid_invalid_returns_max_distance(self):
        """Mix of valid and invalid should return max distance."""
        valid_hash = "a" * 16
        distance = hamming_distance(valid_hash, "not_hex_xyz")
        self.assertEqual(distance, 64)

    def test_different_length_hashes(self):
        """Different length hashes should return max distance or handle gracefully."""
        hash1 = "a" * 16
        hash2 = "a" * 8  # Shorter hash
        distance = hamming_distance(hash1, hash2)
        # imagehash may handle this differently - should not crash
        self.assertIsInstance(distance, int)

    def test_real_phash_values(self):
        """Test with realistic pHash values."""
        # These are example pHash values that might be generated
        hash1 = "8f94b5a16363c3c3"
        hash2 = "8f94b5a16363c3c7"  # 2 bits different (c3 vs c7)
        distance = hamming_distance(hash1, hash2)
        self.assertLessEqual(distance, 5)  # Should be small

    def test_case_insensitive_hashes(self):
        """Hash comparison should be case-insensitive (hex)."""
        hash1 = "ABCDEF0123456789"
        hash2 = "abcdef0123456789"
        distance = hamming_distance(hash1, hash2)
        self.assertEqual(distance, 0)


class AreDuplicatesTestCase(TestCase):
    """Tests for the are_duplicates function."""

    def test_identical_hashes_are_duplicates(self):
        """Identical hashes should always be considered duplicates."""
        hash1 = "a" * 16
        self.assertTrue(are_duplicates(hash1, hash1))

    def test_distance_under_threshold_is_duplicate(self):
        """Hashes with distance under threshold are duplicates."""
        # Using 1 bit difference which is well under default threshold of 10
        hash1 = "0" * 16
        hash2 = "0" * 15 + "1"
        self.assertTrue(are_duplicates(hash1, hash2))

    def test_distance_at_threshold_is_duplicate(self):
        """Hashes with distance exactly at threshold are duplicates."""
        with patch("api.perceptual_hash.hamming_distance", return_value=10):
            self.assertTrue(are_duplicates("a" * 16, "b" * 16, threshold=10))

    def test_distance_over_threshold_not_duplicate(self):
        """Hashes with distance over threshold are not duplicates."""
        with patch("api.perceptual_hash.hamming_distance", return_value=11):
            self.assertFalse(are_duplicates("a" * 16, "b" * 16, threshold=10))

    def test_empty_hash1_not_duplicate(self):
        """Empty first hash should not be considered duplicate."""
        self.assertFalse(are_duplicates("", "a" * 16))

    def test_empty_hash2_not_duplicate(self):
        """Empty second hash should not be considered duplicate."""
        self.assertFalse(are_duplicates("a" * 16, ""))

    def test_none_hash1_not_duplicate(self):
        """None first hash should not be considered duplicate."""
        self.assertFalse(are_duplicates(None, "a" * 16))

    def test_none_hash2_not_duplicate(self):
        """None second hash should not be considered duplicate."""
        self.assertFalse(are_duplicates("a" * 16, None))

    def test_both_none_not_duplicate(self):
        """Both None should not be considered duplicate."""
        self.assertFalse(are_duplicates(None, None))

    def test_both_empty_not_duplicate(self):
        """Both empty should not be considered duplicate."""
        self.assertFalse(are_duplicates("", ""))

    def test_custom_threshold_strict(self):
        """Strict threshold (lower) should reject more."""
        with patch("api.perceptual_hash.hamming_distance", return_value=5):
            self.assertTrue(are_duplicates("a" * 16, "b" * 16, threshold=5))
            self.assertFalse(are_duplicates("a" * 16, "b" * 16, threshold=4))

    def test_custom_threshold_loose(self):
        """Loose threshold (higher) should accept more."""
        with patch("api.perceptual_hash.hamming_distance", return_value=15):
            self.assertTrue(are_duplicates("a" * 16, "b" * 16, threshold=15))
            self.assertTrue(are_duplicates("a" * 16, "b" * 16, threshold=20))

    def test_default_threshold_value(self):
        """Default threshold should be 10."""
        self.assertEqual(DEFAULT_HAMMING_THRESHOLD, 10)


class FindSimilarHashesTestCase(TestCase):
    """Tests for the find_similar_hashes function."""

    def test_empty_target_hash_returns_empty(self):
        """Empty target hash should return empty list."""
        hash_list = [("img1", "a" * 16), ("img2", "b" * 16)]
        result = find_similar_hashes("", hash_list)
        self.assertEqual(result, [])

    def test_none_target_hash_returns_empty(self):
        """None target hash should return empty list."""
        hash_list = [("img1", "a" * 16), ("img2", "b" * 16)]
        result = find_similar_hashes(None, hash_list)
        self.assertEqual(result, [])

    def test_empty_hash_list_returns_empty(self):
        """Empty hash list should return empty list."""
        result = find_similar_hashes("a" * 16, [])
        self.assertEqual(result, [])

    def test_finds_similar_hashes(self):
        """Should find hashes within threshold."""
        target = "0" * 16
        # 1 bit different - should be found
        similar = "0" * 15 + "1"
        hash_list = [("img1", similar)]
        result = find_similar_hashes(target, hash_list)
        self.assertEqual(len(result), 1)
        self.assertEqual(result[0][0], "img1")
        self.assertEqual(result[0][1], 1)  # distance of 1

    def test_excludes_distant_hashes(self):
        """Should exclude hashes beyond threshold."""
        target = "0" * 16
        distant = "f" * 16  # 64 bits different
        hash_list = [("img1", distant)]
        result = find_similar_hashes(target, hash_list)
        self.assertEqual(result, [])

    def test_skips_identical_hash(self):
        """Should skip exact same hash (self-comparison)."""
        target = "a" * 16
        hash_list = [("img1", target)]  # Same hash
        result = find_similar_hashes(target, hash_list)
        self.assertEqual(result, [])

    def test_skips_none_hash_in_list(self):
        """Should skip None hashes in the list."""
        target = "a" * 16
        similar = "a" * 15 + "0"  # 1 bit different
        hash_list = [("img1", None), ("img2", similar)]
        result = find_similar_hashes(target, hash_list)
        self.assertEqual(len(result), 1)
        self.assertEqual(result[0][0], "img2")

    def test_skips_empty_hash_in_list(self):
        """Should skip empty hashes in the list."""
        target = "a" * 16
        similar = "a" * 15 + "0"
        hash_list = [("img1", ""), ("img2", similar)]
        result = find_similar_hashes(target, hash_list)
        self.assertEqual(len(result), 1)
        self.assertEqual(result[0][0], "img2")

    def test_sorted_by_distance(self):
        """Results should be sorted by distance (closest first)."""
        target = "0" * 16
        # Create hashes with known distances
        with patch("api.perceptual_hash.hamming_distance") as mock_dist:
            mock_dist.side_effect = [8, 3, 5]  # Distances for 3 hashes
            hash_list = [("img1", "h1"), ("img2", "h2"), ("img3", "h3")]
            result = find_similar_hashes(target, hash_list, threshold=10)
            # Should be sorted: img2 (3), img3 (5), img1 (8)
            self.assertEqual(result[0][0], "img2")
            self.assertEqual(result[1][0], "img3")
            self.assertEqual(result[2][0], "img1")

    def test_custom_threshold(self):
        """Should respect custom threshold."""
        target = "0" * 16
        with patch("api.perceptual_hash.hamming_distance") as mock_dist:
            mock_dist.return_value = 5
            hash_list = [("img1", "h1")]
            # Threshold 4 - should exclude distance 5
            result = find_similar_hashes(target, hash_list, threshold=4)
            self.assertEqual(result, [])
            # Threshold 5 - should include distance 5
            result = find_similar_hashes(target, hash_list, threshold=5)
            self.assertEqual(len(result), 1)

    def test_returns_correct_tuple_format(self):
        """Results should be (image_id, distance) tuples."""
        target = "0" * 16
        with patch("api.perceptual_hash.hamming_distance", return_value=2):
            hash_list = [("my_image_id", "some_hash")]
            result = find_similar_hashes(target, hash_list)
            self.assertEqual(len(result), 1)
            image_id, distance = result[0]
            self.assertEqual(image_id, "my_image_id")
            self.assertEqual(distance, 2)

    def test_multiple_similar_all_returned(self):
        """All similar hashes should be returned."""
        target = "0" * 16
        with patch("api.perceptual_hash.hamming_distance", return_value=5):
            hash_list = [("img1", "h1"), ("img2", "h2"), ("img3", "h3")]
            result = find_similar_hashes(target, hash_list, threshold=10)
            self.assertEqual(len(result), 3)


class CalculatePerceptualHashTestCase(TestCase):
    """Tests for the calculate_perceptual_hash function."""

    def setUp(self):
        """Create temporary directory for test images."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up temporary files."""
        import shutil

        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def _create_test_image(self, filename, size=(100, 100), mode="RGB", color=(255, 0, 0)):
        """Helper to create a test image file."""
        path = os.path.join(self.temp_dir, filename)
        img = Image.new(mode, size, color)
        img.save(path)
        return path

    def test_valid_rgb_image(self):
        """Should calculate hash for valid RGB image."""
        path = self._create_test_image("test.jpg", mode="RGB")
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)
        self.assertIsInstance(result, str)
        self.assertEqual(len(result), 16)  # 64-bit hash = 16 hex chars

    def test_valid_rgba_image_converted(self):
        """Should handle RGBA images by converting to RGB."""
        path = self._create_test_image("test.png", mode="RGBA", color=(255, 0, 0, 128))
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)
        self.assertEqual(len(result), 16)

    def test_valid_grayscale_image(self):
        """Should handle grayscale (L mode) images."""
        path = self._create_test_image("test_gray.jpg", mode="L", color=128)
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)
        self.assertEqual(len(result), 16)

    def test_valid_palette_image_converted(self):
        """Should handle palette (P mode) images by converting to RGB."""
        path = os.path.join(self.temp_dir, "test_palette.png")
        img = Image.new("P", (100, 100))
        img.save(path)
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_nonexistent_file_returns_none(self):
        """Should return None for nonexistent file."""
        result = calculate_perceptual_hash("/nonexistent/path/image.jpg")
        self.assertIsNone(result)

    def test_corrupted_file_returns_none(self):
        """Should return None for corrupted/invalid image file."""
        path = os.path.join(self.temp_dir, "corrupted.jpg")
        with open(path, "w") as f:
            f.write("not an image file content")
        result = calculate_perceptual_hash(path)
        self.assertIsNone(result)

    def test_empty_file_returns_none(self):
        """Should return None for empty file."""
        path = os.path.join(self.temp_dir, "empty.jpg")
        with open(path, "w") as _f:
            pass  # Create empty file
        result = calculate_perceptual_hash(path)
        self.assertIsNone(result)

    def test_directory_instead_of_file_returns_none(self):
        """Should return None if path is a directory."""
        result = calculate_perceptual_hash(self.temp_dir)
        self.assertIsNone(result)

    def test_custom_hash_size(self):
        """Should support custom hash sizes."""
        path = self._create_test_image("test.jpg")
        # hash_size=16 produces 256-bit hash = 64 hex chars
        result = calculate_perceptual_hash(path, hash_size=16)
        self.assertIsNotNone(result)
        self.assertEqual(len(result), 64)

    def test_small_hash_size(self):
        """Should support smaller hash sizes."""
        path = self._create_test_image("test.jpg")
        # hash_size=4 produces 16-bit hash = 4 hex chars
        result = calculate_perceptual_hash(path, hash_size=4)
        self.assertIsNotNone(result)
        self.assertEqual(len(result), 4)

    def test_similar_images_similar_hashes(self):
        """Similar images should produce similar hashes."""
        # Create two similar images (same color, slight size difference)
        path1 = self._create_test_image("img1.jpg", size=(100, 100), color=(255, 0, 0))
        path2 = self._create_test_image("img2.jpg", size=(110, 110), color=(255, 0, 0))
        hash1 = calculate_perceptual_hash(path1)
        hash2 = calculate_perceptual_hash(path2)
        self.assertIsNotNone(hash1)
        self.assertIsNotNone(hash2)
        # Similar solid color images should have low distance
        distance = hamming_distance(hash1, hash2)
        self.assertLessEqual(distance, 10)

    def test_different_images_different_hashes(self):
        """Very different images should produce different hashes."""
        # Create two very different images with patterns (not solid colors)
        # Solid colors produce similar hashes because pHash uses DCT
        path1 = os.path.join(self.temp_dir, "pattern1.jpg")
        path2 = os.path.join(self.temp_dir, "pattern2.jpg")

        # Create a horizontal gradient pattern
        img1 = Image.new("RGB", (100, 100))
        for x in range(100):
            for y in range(100):
                img1.putpixel((x, y), (x * 2, 0, 0))
        img1.save(path1)

        # Create a vertical gradient pattern (different structure)
        img2 = Image.new("RGB", (100, 100))
        for x in range(100):
            for y in range(100):
                img2.putpixel((x, y), (0, 0, y * 2))
        img2.save(path2)

        hash1 = calculate_perceptual_hash(path1)
        hash2 = calculate_perceptual_hash(path2)
        self.assertIsNotNone(hash1)
        self.assertIsNotNone(hash2)
        # Different patterns should have noticeable distance
        distance = hamming_distance(hash1, hash2)
        self.assertGreater(distance, 0)

    def test_deterministic_hash(self):
        """Same image should always produce same hash."""
        path = self._create_test_image("test.jpg")
        hash1 = calculate_perceptual_hash(path)
        hash2 = calculate_perceptual_hash(path)
        self.assertEqual(hash1, hash2)

    def test_very_small_image(self):
        """Should handle very small images (1x1 pixel)."""
        path = self._create_test_image("tiny.jpg", size=(1, 1))
        _result = calculate_perceptual_hash(path)
        # Should not crash - may return hash or None depending on implementation
        # The key is it doesn't raise an exception

    def test_very_large_image(self):
        """Should handle large images (though may be slow)."""
        path = self._create_test_image("large.jpg", size=(1000, 1000))
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)
        self.assertEqual(len(result), 16)

    def test_jpeg_vs_png_same_content(self):
        """Same image content in different formats should have similar hash."""
        # Create same color image in different formats
        jpg_path = self._create_test_image("test.jpg", color=(100, 150, 200))
        png_path = self._create_test_image("test.png", color=(100, 150, 200))
        hash_jpg = calculate_perceptual_hash(jpg_path)
        hash_png = calculate_perceptual_hash(png_path)
        self.assertIsNotNone(hash_jpg)
        self.assertIsNotNone(hash_png)
        distance = hamming_distance(hash_jpg, hash_png)
        # Same content should have identical or very similar hashes
        self.assertLessEqual(distance, 5)


class CalculateHashFromThumbnailTestCase(TestCase):
    """Tests for the calculate_hash_from_thumbnail function."""

    def setUp(self):
        """Create temporary directory for test images."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up temporary files."""
        import shutil

        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_delegates_to_calculate_perceptual_hash(self):
        """Should delegate to calculate_perceptual_hash."""
        with patch("api.perceptual_hash.calculate_perceptual_hash") as mock:
            mock.return_value = "abc123"
            result = calculate_hash_from_thumbnail("/some/path")
            mock.assert_called_once_with("/some/path")
            self.assertEqual(result, "abc123")

    def test_returns_none_on_failure(self):
        """Should return None if underlying function fails."""
        result = calculate_hash_from_thumbnail("/nonexistent/path")
        self.assertIsNone(result)


class EdgeCasesTestCase(TestCase):
    """Edge case tests for the perceptual hash module."""

    def setUp(self):
        """Create temporary directory for test images."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up temporary files."""
        import shutil

        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_unicode_filename(self):
        """Should handle unicode characters in filename."""
        path = os.path.join(self.temp_dir, "图片_照片_🖼️.jpg")
        img = Image.new("RGB", (50, 50), (255, 255, 0))
        img.save(path)
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_special_characters_in_path(self):
        """Should handle special characters in file path."""
        path = os.path.join(self.temp_dir, "test with spaces & special (1).jpg")
        img = Image.new("RGB", (50, 50), (255, 255, 0))
        img.save(path)
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_hash_only_contains_hex_chars(self):
        """Generated hash should only contain valid hex characters."""
        path = os.path.join(self.temp_dir, "test.jpg")
        img = Image.new("RGB", (50, 50), (123, 45, 67))
        img.save(path)
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)
        # Check all characters are hex
        valid_hex = set("0123456789abcdef")
        self.assertTrue(all(c in valid_hex for c in result.lower()))

    def test_webp_format(self):
        """Should handle WebP format images."""
        path = os.path.join(self.temp_dir, "test.webp")
        img = Image.new("RGB", (50, 50), (100, 100, 100))
        img.save(path, "WEBP")
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_gif_format(self):
        """Should handle GIF format images."""
        path = os.path.join(self.temp_dir, "test.gif")
        img = Image.new("RGB", (50, 50), (50, 100, 150))
        img.save(path, "GIF")
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_bmp_format(self):
        """Should handle BMP format images."""
        path = os.path.join(self.temp_dir, "test.bmp")
        img = Image.new("RGB", (50, 50), (200, 100, 50))
        img.save(path, "BMP")
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_hamming_distance_with_newlines_in_hash(self):
        """Should handle hashes that might have whitespace (edge case)."""
        # This tests robustness - real hashes shouldn't have whitespace
        # imagehash's hex_to_hash is resilient and strips/ignores trailing chars
        distance = hamming_distance("a" * 16 + "\n", "a" * 16)
        # The library handles this gracefully - doesn't crash
        self.assertIsInstance(distance, int)

    def test_find_similar_with_large_list(self):
        """Should handle large hash lists efficiently."""
        target = "0" * 16
        # Create a large list of hashes
        hash_list = [(f"img_{i}", f"{i:016x}") for i in range(1000)]
        # Should not crash or hang
        result = find_similar_hashes(target, hash_list, threshold=10)
        self.assertIsInstance(result, list)

    def test_are_duplicates_with_whitespace_only_hash(self):
        """Should handle whitespace-only hash gracefully."""
        self.assertFalse(are_duplicates("   ", "a" * 16))
        self.assertFalse(are_duplicates("a" * 16, "   "))

    def test_cmyk_image_converted(self):
        """Should handle CMYK images by converting to RGB."""
        path = os.path.join(self.temp_dir, "test_cmyk.jpg")
        # Create a CMYK image
        img = Image.new("CMYK", (50, 50), (0, 100, 100, 0))  # Red in CMYK
        img.save(path)
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_1bit_image(self):
        """Should handle 1-bit (black and white) images."""
        path = os.path.join(self.temp_dir, "test_1bit.png")
        img = Image.new("1", (50, 50), 1)  # White
        img.save(path)
        result = calculate_perceptual_hash(path)
        self.assertIsNotNone(result)

    def test_concurrent_hash_calculation(self):
        """Hash calculation should be thread-safe (no shared mutable state)."""
        import concurrent.futures

        # Create multiple test images with distinct patterns (not just solid colors)
        paths = []
        for i in range(5):
            path = os.path.join(self.temp_dir, f"concurrent_{i}.jpg")
            img = Image.new("RGB", (50, 50))
            # Create distinct patterns for each image
            for x in range(50):
                for y in range(50):
                    # Each image has a unique pattern based on i
                    if i == 0:
                        img.putpixel((x, y), (x * 5, 0, 0))  # Horizontal red gradient
                    elif i == 1:
                        img.putpixel((x, y), (0, y * 5, 0))  # Vertical green gradient
                    elif i == 2:
                        img.putpixel((x, y), (0, 0, (x + y) * 2))  # Diagonal blue
                    elif i == 3:
                        img.putpixel((x, y), ((x * y) % 256, 0, 0))  # Multiplicative pattern
                    else:
                        img.putpixel((x, y), (255 if x > 25 else 0, 255 if y > 25 else 0, 0))  # Quadrants
            img.save(path)
            paths.append(path)

        # Calculate hashes concurrently
        with concurrent.futures.ThreadPoolExecutor(max_workers=5) as executor:
            futures = [executor.submit(calculate_perceptual_hash, p) for p in paths]
            results = [f.result() for f in futures]

        # All should succeed
        self.assertTrue(all(r is not None for r in results))
        # Most should be unique (distinct patterns) - allow some similarity
        unique_count = len(set(results))
        self.assertGreaterEqual(unique_count, 3)  # At least 3 unique hashes from 5 distinct patterns


class PerformanceTestCase(TestCase):
    """Performance-related tests for the perceptual hash module."""

    def setUp(self):
        """Create temporary directory for test images."""
        self.temp_dir = tempfile.mkdtemp()

    def tearDown(self):
        """Clean up temporary files."""
        import shutil

        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_hamming_distance_performance(self):
        """Hamming distance should be fast for many comparisons."""
        import time

        hash1 = "a" * 16
        hash2 = "b" * 16

        start = time.time()
        for _ in range(10000):
            hamming_distance(hash1, hash2)
        elapsed = time.time() - start

        # 10000 comparisons should complete in under 1 second
        self.assertLess(elapsed, 1.0)

    def test_find_similar_performance(self):
        """find_similar_hashes should be reasonably fast for medium-sized lists."""
        import time

        target = "0" * 16
        # Create a list of 100 hashes
        hash_list = [(f"img_{i}", f"{i:016x}") for i in range(100)]

        start = time.time()
        for _ in range(100):
            find_similar_hashes(target, hash_list, threshold=10)
        elapsed = time.time() - start

        # 100 searches over 100 hashes should complete quickly
        self.assertLess(elapsed, 2.0)


================================================
FILE: api/tests/test_photo_caption_model.py
================================================
from django.test import TestCase

from api.models import PhotoCaption
from api.tests.utils import create_test_user, create_test_photo


class PhotoCaptionModelTest(TestCase):
    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_create_photo_caption(self):
        """Test creating a PhotoCaption instance"""
        caption = PhotoCaption.objects.create(
            photo=self.photo, captions_json={"user_caption": "Test caption"}
        )

        self.assertEqual(caption.photo, self.photo)
        self.assertEqual(caption.captions_json["user_caption"], "Test caption")

    def test_photo_caption_one_to_one_relationship(self):
        """Test that PhotoCaption has a one-to-one relationship with Photo"""
        PhotoCaption.objects.create(
            photo=self.photo, captions_json={"user_caption": "First caption"}
        )

        # Trying to create another caption for the same photo should fail
        with self.assertRaises(Exception):
            PhotoCaption.objects.create(
                photo=self.photo, captions_json={"user_caption": "Second caption"}
            )

    def test_generate_captions_im2txt(self):
        """Test generating im2txt captions"""
        caption = PhotoCaption.objects.create(photo=self.photo)

        # This method requires thumbnail access which isn't available in tests
        # We'll test that it returns False when no thumbnail is available
        result = caption.generate_captions_im2txt(commit=False)
        self.assertFalse(result)

    def test_save_user_caption(self):
        """Test saving user captions"""
        caption = PhotoCaption.objects.create(photo=self.photo)

        # This method requires thumbnail access which isn't available in tests
        # We'll test that it returns False when no thumbnail is available
        result = caption.save_user_caption("My beautiful photo", commit=True)
        self.assertFalse(result)

    def test_generate_tag_captions_skips_existing(self):
        """Test that generate_tag_captions skips if active model tags already exist"""
        caption = PhotoCaption.objects.create(photo=self.photo)

        # Pre-populate places365 data (the default tagging model)
        caption.captions_json = {
            "places365": {
                "categories": ["outdoor", "landscape"],
                "attributes": ["natural", "sunny"],
                "environment": "outdoor",
            }
        }
        caption.save()

        # Should return early since places365 tags already exist
        caption.generate_tag_captions(commit=True)
        caption.refresh_from_db()

        self.assertIn("places365", caption.captions_json)

    def test_recreate_search_captions_delegates_to_photo_search(self):
        """Test that recreate_search_captions delegates to PhotoSearch"""
        caption = PhotoCaption.objects.create(
            photo=self.photo, captions_json={"user_caption": "Test caption"}
        )

        # This should create a PhotoSearch instance and update search captions
        caption.recreate_search_captions()

        # Verify PhotoSearch was created and has search captions
        self.assertTrue(hasattr(self.photo, "search_instance"))
        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        self.assertIsNotNone(search_instance.search_captions)

    def test_captions_json_default_empty_dict(self):
        """Test that captions_json defaults to None (nullable field)"""
        caption = PhotoCaption.objects.create(photo=self.photo)

        self.assertIsNone(caption.captions_json)

    def test_str_representation(self):
        """Test string representation of PhotoCaption"""
        caption = PhotoCaption.objects.create(
            photo=self.photo, captions_json={"user_caption": "Test"}
        )

        str_repr = str(caption)
        self.assertIn(self.photo.image_hash, str_repr)

    def test_cascade_delete_with_photo(self):
        """Test that PhotoCaption is deleted when Photo is deleted"""
        PhotoCaption.objects.create(photo=self.photo)
        photo_id = self.photo.image_hash

        self.photo.delete()

        with self.assertRaises(PhotoCaption.DoesNotExist):
            PhotoCaption.objects.get(photo_id=photo_id)

    def test_multiple_caption_types(self):
        """Test storing multiple types of captions"""
        caption = PhotoCaption.objects.create(
            photo=self.photo,
            captions_json={
                "user_caption": "My photo",
                "im2txt": "a photo of a landscape",
                "places365": {
                    "categories": ["outdoor"],
                    "attributes": ["natural"],
                    "environment": "outdoor",
                },
            },
        )

        self.assertEqual(caption.captions_json["user_caption"], "My photo")
        self.assertEqual(caption.captions_json["im2txt"], "a photo of a landscape")
        self.assertIn("categories", caption.captions_json["places365"])

    def test_update_existing_captions(self):
        """Test updating existing captions"""
        caption = PhotoCaption.objects.create(
            photo=self.photo, captions_json={"user_caption": "Original caption"}
        )

        # Update the caption directly (since save_user_caption requires thumbnails)
        caption.captions_json["user_caption"] = "Updated caption"
        caption.save()
        caption.refresh_from_db()

        self.assertEqual(caption.captions_json["user_caption"], "Updated caption")

    def test_empty_captions_json_handling(self):
        """Test handling of empty or None captions_json"""
        caption = PhotoCaption.objects.create(photo=self.photo)

        # Should handle empty dict gracefully
        caption.recreate_search_captions()

        # Test direct assignment since save_user_caption requires thumbnails
        caption.captions_json = {"user_caption": ""}
        caption.save()
        self.assertEqual(caption.captions_json["user_caption"], "")


================================================
FILE: api/tests/test_photo_captions.py
================================================
from unittest.mock import patch

from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photo, create_test_user


class PhotoCaptionsTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    @patch(
        "api.models.photo_caption.PhotoCaption.generate_captions_im2txt", autospec=True
    )
    def test_generate_captions_for_my_photo(self, generate_caption_mock):
        generate_caption_mock.return_value = True
        photo = create_test_photo(owner=self.user1)

        payload = {"image_hash": photo.image_hash}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/generateim2txt/",
            format="json",
            data=payload,
            headers=headers,
        )
        data = response.json()

        self.assertTrue(data["status"])

    @patch(
        "api.models.photo_caption.PhotoCaption.generate_captions_im2txt", autospec=True
    )
    def test_fail_to_generate_captions_for_my_photo(self, generate_caption_mock):
        generate_caption_mock.return_value = False
        photo = create_test_photo(owner=self.user1)

        payload = {"image_hash": photo.image_hash}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/generateim2txt/",
            format="json",
            data=payload,
            headers=headers,
        )
        data = response.json()

        self.assertFalse(data["status"])

    def test_generate_captions_for_my_photo_of_another_user(self):
        photo = create_test_photo(owner=self.user2)

        payload = {"image_hash": photo.image_hash}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/generateim2txt/",
            format="json",
            data=payload,
            headers=headers,
        )
        data = response.json()

        # Returns 404 to avoid leaking existence of other users' photos
        self.assertEqual(404, response.status_code)
        self.assertFalse(data["status"])
        self.assertEqual("photo not found", data["message"])


================================================
FILE: api/tests/test_photo_lifecycle.py
================================================
"""
Tests for Photo Lifecycle - deletion, trashing, restoration.

Tests verify proper cleanup of:
- Stack memberships (ManyToMany)
- Duplicate group memberships (ManyToMany)
- Empty groups after photo removal
- Restoration behavior
"""

from django.test import TestCase

from api.models.file import File
from api.models.photo_stack import PhotoStack
from api.models.duplicate import Duplicate
from api.tests.utils import create_test_photo, create_test_user


class PhotoDeletionStackCleanupTestCase(TestCase):
    """Tests for photo deletion and stack cleanup."""

    def setUp(self):
        self.user = create_test_user()

    def test_manual_delete_clears_stack_membership(self):
        """Test that manual_delete removes photo from stacks."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(photo1, photo2, photo3)
        
        self.assertEqual(stack.photos.count(), 3)
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # photo1 should be removed from stack
        photo1.refresh_from_db()
        self.assertEqual(photo1.stacks.count(), 0)
        
        # Stack should still have 2 photos
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 2)

    def test_manual_delete_deletes_stack_with_one_remaining(self):
        """Test that deleting a photo leaves stack with only 1 photo, stack is deleted."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(photo1, photo2)
        stack_id = stack.id
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Stack should be deleted (only 1 photo remaining)
        self.assertFalse(PhotoStack.objects.filter(id=stack_id).exists())
        
        # photo2 should have no stacks
        photo2.refresh_from_db()
        self.assertEqual(photo2.stacks.count(), 0)

    def test_manual_delete_deletes_empty_stack(self):
        """Test that deleting all photos in stack deletes the stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(photo1, photo2)
        stack_id = stack.id
        
        # Delete both photos
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        photo2.in_trashcan = True
        photo2.save()
        photo2.manual_delete()
        
        # Stack should be deleted
        self.assertFalse(PhotoStack.objects.filter(id=stack_id).exists())


class PhotoDeletionDuplicateCleanupTestCase(TestCase):
    """Tests for photo deletion and duplicate group cleanup."""

    def setUp(self):
        self.user = create_test_user()

    def test_manual_delete_clears_duplicate_membership(self):
        """Test that manual_delete removes photo from duplicate groups.
        
        BUG #12: This test will FAIL if duplicates are not cleared!
        """
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2, photo3)
        
        self.assertEqual(duplicate.photos.count(), 3)
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # photo1 should be removed from duplicate group
        photo1.refresh_from_db()
        self.assertEqual(photo1.duplicates.count(), 0,
            "Bug #12: manual_delete should clear duplicates")
        
        # Duplicate group should still have 2 photos
        duplicate.refresh_from_db()
        self.assertEqual(duplicate.photos.count(), 2)

    def test_manual_delete_deletes_duplicate_with_one_remaining(self):
        """Test that deleting a photo leaves duplicate with only 1 photo, group is deleted.
        
        BUG #12: This test will FAIL if duplicate groups are not cleaned up!
        """
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        duplicate_id = duplicate.id
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Duplicate group should be deleted (only 1 photo remaining)
        self.assertFalse(Duplicate.objects.filter(id=duplicate_id).exists(),
            "Bug #12: Duplicate group with 1 photo should be deleted")
        
        # photo2 should have no duplicate groups
        photo2.refresh_from_db()
        self.assertEqual(photo2.duplicates.count(), 0)

    def test_manual_delete_deletes_empty_duplicate_group(self):
        """Test that deleting all photos in duplicate group deletes the group."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        duplicate_id = duplicate.id
        
        # Delete both photos
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        photo2.in_trashcan = True
        photo2.save()
        photo2.manual_delete()
        
        # Duplicate group should be deleted
        self.assertFalse(Duplicate.objects.filter(id=duplicate_id).exists(),
            "Bug #12: Empty duplicate group should be deleted")


class PhotoTrashRestoreTestCase(TestCase):
    """Tests for trashing and restoring photos."""

    def setUp(self):
        self.user = create_test_user()

    def test_trashed_photo_preserves_stack_membership(self):
        """Test that trashing a photo does NOT remove it from stacks."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(photo1, photo2)
        
        # Trash photo1 (not permanent delete)
        photo1.in_trashcan = True
        photo1.save()
        
        # photo1 should still be in stack (just trashed)
        photo1.refresh_from_db()
        self.assertEqual(photo1.stacks.count(), 1)
        
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 2)

    def test_trashed_photo_preserves_duplicate_membership(self):
        """Test that trashing a photo does NOT remove it from duplicates."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2)
        
        # Trash photo1 (not permanent delete)
        photo1.in_trashcan = True
        photo1.save()
        
        # photo1 should still be in duplicate group (just trashed)
        photo1.refresh_from_db()
        self.assertEqual(photo1.duplicates.count(), 1)
        
        duplicate.refresh_from_db()
        self.assertEqual(duplicate.photos.count(), 2)

    def test_restore_photo_from_trash(self):
        """Test that restoring a photo from trash works correctly."""
        photo1 = create_test_photo(owner=self.user, in_trashcan=True)
        
        # Restore
        photo1.in_trashcan = False
        photo1.save()
        
        photo1.refresh_from_db()
        self.assertFalse(photo1.in_trashcan)


class PhotoInMultipleGroupsTestCase(TestCase):
    """Tests for photos that are in multiple stacks and/or duplicate groups."""

    def setUp(self):
        self.user = create_test_user()

    def test_photo_in_both_stack_and_duplicate(self):
        """Test deleting photo that's in both a stack and duplicate group."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        # Photo1 is in a burst stack with photo2
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(photo1, photo2)
        
        # Photo1 is also in a duplicate group with photo3
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo3)
        
        stack_id = stack.id
        duplicate_id = duplicate.id
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        photo1.refresh_from_db()
        
        # Both relationships should be cleared
        self.assertEqual(photo1.stacks.count(), 0)
        self.assertEqual(photo1.duplicates.count(), 0,
            "Bug #12: Duplicates should be cleared on delete")
        
        # Both groups should be deleted (only 1 photo remaining in each)
        self.assertFalse(PhotoStack.objects.filter(id=stack_id).exists())
        self.assertFalse(Duplicate.objects.filter(id=duplicate_id).exists(),
            "Bug #12: Duplicate group should be deleted")

    def test_photo_in_multiple_stacks(self):
        """Test photo that's in multiple stacks (different types)."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        # Stack 1: Burst with photo1 and photo2
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack1.photos.add(photo1, photo2)
        
        # Stack 2: Manual with photo1 and photo3
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2.photos.add(photo1, photo3)
        
        stack1_id = stack1.id
        stack2_id = stack2.id
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Both stacks should be deleted (only 1 photo remaining in each)
        self.assertFalse(PhotoStack.objects.filter(id=stack1_id).exists())
        self.assertFalse(PhotoStack.objects.filter(id=stack2_id).exists())


class DuplicateResolutionCleanupTestCase(TestCase):
    """Tests for duplicate resolution affecting photo lifecycle."""

    def setUp(self):
        self.user = create_test_user()

    def test_resolve_duplicate_trashes_non_kept_photos(self):
        """Test that resolving a duplicate trashes other photos."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        duplicate.photos.add(photo1, photo2, photo3)
        
        # Resolve keeping photo1
        duplicate.resolve(kept_photo=photo1)
        
        # photo2 and photo3 should be trashed
        photo2.refresh_from_db()
        photo3.refresh_from_db()
        self.assertTrue(photo2.in_trashcan)
        self.assertTrue(photo3.in_trashcan)
        
        # photo1 should not be trashed
        photo1.refresh_from_db()
        self.assertFalse(photo1.in_trashcan)

    def test_resolve_duplicate_updates_status(self):
        """Test that resolving updates duplicate status."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        duplicate.photos.add(photo1, photo2)
        
        duplicate.resolve(kept_photo=photo1)
        
        duplicate.refresh_from_db()
        self.assertEqual(duplicate.review_status, Duplicate.ReviewStatus.RESOLVED)


class EdgeCasesTestCase(TestCase):
    """Edge cases for photo lifecycle."""

    def setUp(self):
        self.user = create_test_user()

    def test_delete_photo_not_in_any_group(self):
        """Test deleting a photo that's not in any stack or duplicate group."""
        photo = create_test_photo(owner=self.user)
        
        photo.in_trashcan = True
        photo.save()
        photo.manual_delete()
        
        photo.refresh_from_db()
        self.assertTrue(photo.removed)

    def test_delete_photo_with_no_main_file(self):
        """Test deleting a photo without a main_file."""
        photo = create_test_photo(owner=self.user)
        photo.main_file = None
        photo.save()
        
        photo.in_trashcan = True
        photo.save()
        
        # Should not crash
        photo.manual_delete()
        
        photo.refresh_from_db()
        self.assertTrue(photo.removed)

    def test_stack_primary_photo_deleted(self):
        """Test what happens when the primary photo of a stack is deleted."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2, photo3)
        
        # Delete the primary photo
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Stack should still exist with 2 photos
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 2)
        
        # Primary photo reference might be stale - check it
        # (This tests if there's a bug in primary_photo handling)
        # The primary_photo should ideally be updated or cleared

    def test_duplicate_kept_photo_deleted(self):
        """Test what happens when the kept_photo of a resolved duplicate is deleted."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
            kept_photo=photo1,
        )
        duplicate.photos.add(photo1, photo2)
        duplicate_id = duplicate.id
        
        # Now delete the kept photo
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Duplicate group should be deleted (only 1 photo remaining)
        self.assertFalse(Duplicate.objects.filter(id=duplicate_id).exists(),
            "Duplicate group with 1 photo should be deleted after kept_photo deletion")


class SharedFileTestCase(TestCase):
    """Tests for photos sharing the same File."""

    def setUp(self):
        self.user = create_test_user()

    def test_delete_photo_preserves_shared_file(self):
        """Test that deleting a photo does not delete a file shared with another photo."""
        # Create a shared file
        shared_file = File.objects.create(
            hash="shared_file_hash" + "a" * 17,
            path="/photos/shared_image.jpg",
            type=File.IMAGE,
        )
        
        # Create two photos that share the same file
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        photo1.files.add(shared_file)
        photo1.main_file = shared_file
        photo1.save()
        
        photo2.files.add(shared_file)
        photo2.main_file = shared_file
        photo2.save()
        
        # Verify both photos reference the same file
        self.assertEqual(photo1.main_file.hash, photo2.main_file.hash)
        self.assertEqual(shared_file.photo_set.count(), 2)
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # File should still exist (used by photo2)
        self.assertTrue(File.objects.filter(hash=shared_file.hash).exists(),
            "File should not be deleted when another photo still uses it")
        
        # photo2 should still have its main_file
        photo2.refresh_from_db()
        self.assertIsNotNone(photo2.main_file)
        self.assertEqual(photo2.main_file.hash, shared_file.hash)
        
        # photo2's files should still include the shared file
        self.assertTrue(photo2.files.filter(hash=shared_file.hash).exists())

    def test_delete_photo_removes_unshared_file(self):
        """Test that deleting a photo removes a file only used by that photo."""
        import tempfile
        import os
        
        # Create a temp file to simulate a real file
        with tempfile.NamedTemporaryFile(delete=False, suffix='.jpg') as tmp:
            tmp.write(b'test image data')
            temp_path = tmp.name
        
        try:
            # Create a file that's only used by one photo
            unique_file = File.objects.create(
                hash="unique_file_hash" + "a" * 18,
                path=temp_path,
                type=File.IMAGE,
            )
            
            photo = create_test_photo(owner=self.user)
            photo.files.add(unique_file)
            photo.main_file = unique_file
            photo.save()
            
            # Verify only one photo uses this file
            self.assertEqual(unique_file.photo_set.count(), 1)
            
            # Delete the photo
            photo.in_trashcan = True
            photo.save()
            photo.manual_delete()
            
            # File should be deleted from database
            self.assertFalse(File.objects.filter(hash=unique_file.hash).exists(),
                "File should be deleted when no other photos use it")
            
            # Physical file should be deleted
            self.assertFalse(os.path.exists(temp_path),
                "Physical file should be removed from disk")
        finally:
            # Cleanup in case test fails
            if os.path.exists(temp_path):
                os.remove(temp_path)

    def test_delete_photo_with_shared_main_file_different_from_files(self):
        """Test deleting when main_file is shared but files M2M has unique files."""
        # Shared main_file
        shared_main = File.objects.create(
            hash="shared_main_hash" + "a" * 18,
            path="/photos/main.jpg",
            type=File.IMAGE,
        )
        
        # Unique sidecar file for photo1 only
        unique_sidecar = File.objects.create(
            hash="unique_sidecar_hash" + "a" * 15,
            path="/photos/sidecar.xmp",
            type=File.METADATA_FILE,
        )
        
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Both photos share main_file
        photo1.main_file = shared_main
        photo1.files.add(shared_main, unique_sidecar)
        photo1.save()
        
        photo2.main_file = shared_main
        photo2.files.add(shared_main)
        photo2.save()
        
        # Delete photo1
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # shared_main should still exist (used by photo2)
        self.assertTrue(File.objects.filter(hash=shared_main.hash).exists())
        
        # unique_sidecar should be deleted (only used by photo1)
        self.assertFalse(File.objects.filter(hash=unique_sidecar.hash).exists())
        
        # photo2 should still reference shared_main
        photo2.refresh_from_db()
        self.assertEqual(photo2.main_file.hash, shared_main.hash)

    def test_delete_last_photo_using_shared_file(self):
        """Test that file is deleted when the last photo using it is deleted."""
        shared_file = File.objects.create(
            hash="eventually_orphan" + "a" * 17,
            path="/photos/shared.jpg",
            type=File.IMAGE,
        )
        
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        photo1.files.add(shared_file)
        photo1.main_file = shared_file
        photo1.save()
        
        photo2.files.add(shared_file)
        photo2.main_file = shared_file
        photo2.save()
        
        # Delete photo1 - file should remain
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        self.assertTrue(File.objects.filter(hash=shared_file.hash).exists())
        
        # Delete photo2 - file should now be deleted (no photos using it)
        photo2.in_trashcan = True
        photo2.save()
        photo2.manual_delete()
        
        # File should be deleted from database (no physical file to check)
        self.assertFalse(File.objects.filter(hash=shared_file.hash).exists(),
            "File should be deleted when the last photo using it is deleted")


================================================
FILE: api/tests/test_photo_list_without_timestamp.py
================================================
from django.test import TestCase
from django.utils import timezone
from rest_framework.test import APIClient

from api.tests.utils import create_test_photos, create_test_user


class PhotoListWithoutTimestampTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)

    def test_retrieve_photos_without_exif_timestamp(self):
        now = timezone.now()
        create_test_photos(number_of_photos=1, owner=self.user, added_on=now)
        create_test_photos(
            number_of_photos=1, owner=self.user, added_on=now, exif_timestamp=now
        )

        response = self.client.get("/api/photos/notimestamp/")
        json = response.json()

        self.assertEqual(response.status_code, 200)
        self.assertEqual(1, len(json["results"]))


================================================
FILE: api/tests/test_photo_metadata.py
================================================
"""
Comprehensive tests for PhotoMetadata model and API.

Tests cover:
- PhotoMetadata model fields and properties
- MetadataFile model
- MetadataEdit model for change tracking
- API endpoints (retrieve, update, history, revert)
- Bulk metadata operations
- Edge cases and error handling
"""

import uuid
from unittest.mock import patch

from django.test import TestCase
from rest_framework import status
from rest_framework.test import APIClient

from api.models.photo_metadata import MetadataEdit, MetadataFile, PhotoMetadata
from api.tests.utils import create_test_photo, create_test_user


class PhotoMetadataModelTestCase(TestCase):
    """Tests for PhotoMetadata model functionality."""

    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_create_metadata_basic(self):
        """Test creating basic PhotoMetadata."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            aperture=2.8,
            iso=100,
            focal_length=50.0,
            camera_model="Canon EOS R5",
        )
        
        self.assertEqual(metadata.photo, self.photo)
        self.assertEqual(metadata.aperture, 2.8)
        self.assertEqual(metadata.iso, 100)
        self.assertEqual(metadata.focal_length, 50.0)
        self.assertEqual(metadata.camera_model, "Canon EOS R5")

    def test_metadata_source_choices(self):
        """Test metadata source choices."""
        self.assertEqual(PhotoMetadata.Source.EMBEDDED, "embedded")
        self.assertEqual(PhotoMetadata.Source.SIDECAR, "sidecar")
        self.assertEqual(PhotoMetadata.Source.USER_EDIT, "user_edit")
        self.assertEqual(PhotoMetadata.Source.COMPUTED, "computed")

    def test_resolution_property(self):
        """Test resolution property."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            width=1920,
            height=1080,
        )
        
        self.assertEqual(metadata.resolution, "1920x1080")

    def test_resolution_property_missing_dimensions(self):
        """Test resolution property with missing dimensions."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            width=1920,
            height=None,
        )
        
        self.assertIsNone(metadata.resolution)

    def test_megapixels_property(self):
        """Test megapixels calculation."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            width=8256,
            height=5504,
        )
        
        # 8256 * 5504 = 45,441,024 pixels ≈ 45.4 MP
        self.assertEqual(metadata.megapixels, 45.4)

    def test_megapixels_property_missing_dimensions(self):
        """Test megapixels with missing dimensions."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            width=None,
            height=None,
        )
        
        self.assertIsNone(metadata.megapixels)

    def test_has_location_property_with_gps(self):
        """Test has_location with GPS data."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            gps_latitude=40.7128,
            gps_longitude=-74.0060,
        )
        
        self.assertTrue(metadata.has_location)

    def test_has_location_property_without_gps(self):
        """Test has_location without GPS data."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
        )
        
        self.assertFalse(metadata.has_location)

    def test_has_location_partial_gps(self):
        """Test has_location with only latitude."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            gps_latitude=40.7128,
            gps_longitude=None,
        )
        
        self.assertFalse(metadata.has_location)

    def test_camera_display_make_and_model(self):
        """Test camera_display with both make and model."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            camera_make="Canon",
            camera_model="EOS R5",
        )
        
        self.assertEqual(metadata.camera_display, "Canon EOS R5")

    def test_camera_display_model_includes_make(self):
        """Test camera_display when model already includes make."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            camera_make="Canon",
            camera_model="Canon EOS R5",
        )
        
        # Should not duplicate make
        self.assertEqual(metadata.camera_display, "Canon EOS R5")

    def test_camera_display_only_model(self):
        """Test camera_display with only model."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            camera_model="EOS R5",
        )
        
        self.assertEqual(metadata.camera_display, "EOS R5")

    def test_lens_display(self):
        """Test lens_display property."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            lens_make="Canon",
            lens_model="RF 50mm F1.2L",
        )
        
        self.assertEqual(metadata.lens_display, "Canon RF 50mm F1.2L")

    def test_lens_display_model_includes_make(self):
        """Test lens_display when model includes make."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            lens_make="Canon",
            lens_model="Canon RF 50mm F1.2L",
        )
        
        self.assertEqual(metadata.lens_display, "Canon RF 50mm F1.2L")

    def test_version_increments(self):
        """Test version field increments on save."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            aperture=2.8,
        )
        
        self.assertEqual(metadata.version, 1)
        
        metadata.aperture = 4.0
        metadata.version += 1
        metadata.save()
        
        metadata.refresh_from_db()
        self.assertEqual(metadata.version, 2)

    def test_raw_data_json_fields(self):
        """Test raw EXIF/XMP/IPTC JSON fields."""
        raw_data = {
            "EXIF:Make": "Canon",
            "EXIF:Model": "EOS R5",
            "EXIF:ISO": 100,
        }
        
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            raw_exif=raw_data,
        )
        
        self.assertEqual(metadata.raw_exif, raw_data)

    def test_keywords_json_field(self):
        """Test keywords JSON field stores list."""
        keywords = ["landscape", "sunset", "nature"]
        
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            keywords=keywords,
        )
        
        metadata.refresh_from_db()
        self.assertEqual(metadata.keywords, keywords)


class MetadataFileModelTestCase(TestCase):
    """Tests for MetadataFile model."""

    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_file_type_choices(self):
        """Test file type choices exist."""
        self.assertEqual(MetadataFile.FileType.XMP, "xmp")
        self.assertEqual(MetadataFile.FileType.JSON, "json")
        self.assertEqual(MetadataFile.FileType.EXIF, "exif")
        self.assertEqual(MetadataFile.FileType.OTHER, "other")

    def test_source_choices(self):
        """Test source choices exist."""
        self.assertEqual(MetadataFile.Source.ORIGINAL, "original")
        self.assertEqual(MetadataFile.Source.SOFTWARE, "software")
        self.assertEqual(MetadataFile.Source.LIBREPHOTOS, "librephotos")
        self.assertEqual(MetadataFile.Source.USER, "user")


class MetadataEditModelTestCase(TestCase):
    """Tests for MetadataEdit model."""

    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_create_edit_record(self):
        """Test creating a metadata edit record."""
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="Old Title",
            new_value="New Title",
        )
        
        self.assertEqual(edit.photo, self.photo)
        self.assertEqual(edit.user, self.user)
        self.assertEqual(edit.field_name, "title")
        self.assertEqual(edit.old_value, "Old Title")
        self.assertEqual(edit.new_value, "New Title")
        self.assertFalse(edit.synced_to_file)

    def test_edit_records_ordered_by_created_at(self):
        """Test edit records are ordered by creation time."""
        edit1 = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value=None,
            new_value="First",
        )
        edit2 = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="First",
            new_value="Second",
        )
        
        edits = list(MetadataEdit.objects.filter(photo=self.photo))
        # Most recent first
        self.assertEqual(edits[0].id, edit2.id)
        self.assertEqual(edits[1].id, edit1.id)


class PhotoMetadataAPITestCase(TestCase):
    """Tests for PhotoMetadata API endpoints."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.other_user = create_test_user()
        self.client.force_authenticate(user=self.user)
        
        self.photo = create_test_photo(owner=self.user)
        self.metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            aperture=2.8,
            iso=100,
            focal_length=50.0,
            camera_make="Canon",
            camera_model="EOS R5",
            width=8256,
            height=5504,
        )

    def test_retrieve_metadata(self):
        """Test retrieving metadata for a photo."""
        response = self.client.get(f"/api/photos/{self.photo.id}/metadata")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["aperture"], 2.8)
        self.assertEqual(data["iso"], 100)
        self.assertEqual(data["camera_model"], "EOS R5")

    def test_retrieve_metadata_by_image_hash(self):
        """Test retrieving metadata using image_hash."""
        response = self.client.get(f"/api/photos/{self.photo.image_hash}/metadata")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)

    def test_retrieve_metadata_creates_if_missing(self):
        """Test retrieve creates metadata if it doesn't exist."""
        photo2 = create_test_photo(owner=self.user)
        
        # Delete any auto-created metadata
        PhotoMetadata.objects.filter(photo=photo2).delete()
        
        response = self.client.get(f"/api/photos/{photo2.id}/metadata")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        # Metadata should now exist
        self.assertTrue(PhotoMetadata.objects.filter(photo=photo2).exists())

    def test_retrieve_metadata_other_user_forbidden(self):
        """Test retrieving other user's photo metadata is forbidden."""
        other_photo = create_test_photo(owner=self.other_user)
        
        response = self.client.get(f"/api/photos/{other_photo.id}/metadata")
        
        self.assertEqual(response.status_code, status.HTTP_403_FORBIDDEN)

    def test_update_metadata(self):
        """Test updating metadata fields."""
        response = self.client.patch(
            f"/api/photos/{self.photo.id}/metadata",
            {"title": "My Beautiful Photo", "rating": 5},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        
        self.metadata.refresh_from_db()
        self.assertEqual(self.metadata.title, "My Beautiful Photo")
        self.assertEqual(self.metadata.rating, 5)

    def test_update_creates_edit_history(self):
        """Test updating metadata creates edit history."""
        response = self.client.patch(
            f"/api/photos/{self.photo.id}/metadata",
            {"caption": "A stunning sunset"},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        
        # Check edit history was created
        edits = MetadataEdit.objects.filter(photo=self.photo)
        self.assertTrue(edits.exists())
        edit = edits.first()
        self.assertEqual(edit.field_name, "caption")
        self.assertEqual(edit.new_value, "A stunning sunset")

    def test_get_edit_history(self):
        """Test getting edit history."""
        # Create some edits
        MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value=None,
            new_value="First",
        )
        MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="First",
            new_value="Second",
        )
        
        response = self.client.get(f"/api/photos/{self.photo.id}/metadata/history")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertIn("results", data)
        self.assertEqual(data["count"], 2)
        self.assertEqual(len(data["results"]), 2)

    def test_revert_edit(self):
        """Test reverting a specific edit."""
        # Set initial value
        self.metadata.title = "Original Title"
        self.metadata.save()
        
        # Create an edit
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="Original Title",
            new_value="Changed Title",
        )
        self.metadata.title = "Changed Title"
        self.metadata.save()
        
        # Revert the edit
        response = self.client.post(f"/api/photos/{self.photo.id}/metadata/revert/{edit.id}")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        
        self.metadata.refresh_from_db()
        self.assertEqual(self.metadata.title, "Original Title")

    def test_revert_creates_new_edit_record(self):
        """Test reverting creates a new edit record."""
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="Original",
            new_value="Changed",
        )
        self.metadata.title = "Changed"
        self.metadata.save()
        
        initial_count = MetadataEdit.objects.filter(photo=self.photo).count()
        
        self.client.post(f"/api/photos/{self.photo.id}/metadata/revert/{edit.id}")
        
        final_count = MetadataEdit.objects.filter(photo=self.photo).count()
        self.assertEqual(final_count, initial_count + 1)

    def test_revert_nonexistent_edit(self):
        """Test reverting nonexistent edit returns 404."""
        fake_edit_id = uuid.uuid4()
        
        response = self.client.post(f"/api/photos/{self.photo.id}/metadata/revert/{fake_edit_id}")
        
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_unauthenticated_request(self):
        """Test unauthenticated requests return 401."""
        self.client.force_authenticate(user=None)
        
        response = self.client.get(f"/api/photos/{self.photo.id}/metadata")
        
        self.assertEqual(response.status_code, status.HTTP_401_UNAUTHORIZED)


class BulkMetadataAPITestCase(TestCase):
    """Tests for bulk metadata operations."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        
        self.photo1 = create_test_photo(owner=self.user)
        self.photo2 = create_test_photo(owner=self.user)
        self.photo3 = create_test_photo(owner=self.user)
        
        self.meta1 = PhotoMetadata.objects.create(
            photo=self.photo1,
            camera_model="Canon R5",
            rating=3,
        )
        self.meta2 = PhotoMetadata.objects.create(
            photo=self.photo2,
            camera_model="Nikon Z9",
            rating=4,
        )

    def test_bulk_get_metadata(self):
        """Test getting metadata for multiple photos."""
        photo_ids = f"{self.photo1.id},{self.photo2.id}"
        
        response = self.client.get(f"/api/photos/metadata/bulk?photo_ids={photo_ids}")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertIn(str(self.photo1.id), data)
        self.assertIn(str(self.photo2.id), data)

    def test_bulk_get_no_photo_ids(self):
        """Test bulk get without photo_ids returns error."""
        response = self.client.get("/api/photos/metadata/bulk")
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_bulk_get_max_100_photos(self):
        """Test bulk get with >100 photos returns error."""
        # Create 101 fake photo IDs
        photo_ids = ",".join([str(uuid.uuid4()) for _ in range(101)])
        
        response = self.client.get(f"/api/photos/metadata/bulk?photo_ids={photo_ids}")
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)
        self.assertIn("Maximum 100", response.json()["error"])

    def test_bulk_update_metadata(self):
        """Test bulk updating metadata."""
        response = self.client.patch(
            "/api/photos/metadata/bulk",
            {
                "photo_ids": [str(self.photo1.id), str(self.photo2.id)],
                "updates": {"rating": 5},
            },
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["updated_count"], 2)
        
        self.meta1.refresh_from_db()
        self.meta2.refresh_from_db()
        self.assertEqual(self.meta1.rating, 5)
        self.assertEqual(self.meta2.rating, 5)

    def test_bulk_update_no_photo_ids(self):
        """Test bulk update without photo_ids returns error."""
        response = self.client.patch(
            "/api/photos/metadata/bulk",
            {"updates": {"rating": 5}},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_bulk_update_no_updates(self):
        """Test bulk update without updates returns error."""
        response = self.client.patch(
            "/api/photos/metadata/bulk",
            {"photo_ids": [str(self.photo1.id)]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_bulk_update_invalid_fields(self):
        """Test bulk update with invalid fields returns error."""
        response = self.client.patch(
            "/api/photos/metadata/bulk",
            {
                "photo_ids": [str(self.photo1.id)],
                "updates": {"iso": 100},  # ISO is not allowed for bulk edit
            },
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)
        self.assertIn("Invalid fields", response.json()["error"])

    def test_bulk_update_creates_edit_history(self):
        """Test bulk update creates edit history for each photo."""
        initial_count = MetadataEdit.objects.count()
        
        self.client.patch(
            "/api/photos/metadata/bulk",
            {
                "photo_ids": [str(self.photo1.id), str(self.photo2.id)],
                "updates": {"title": "Bulk Title"},
            },
            format="json",
        )
        
        # Should have 2 new edit records (one per photo)
        self.assertEqual(MetadataEdit.objects.count(), initial_count + 2)

    def test_bulk_update_other_user_photos_ignored(self):
        """Test bulk update ignores other user's photos."""
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        
        response = self.client.patch(
            "/api/photos/metadata/bulk",
            {
                "photo_ids": [str(self.photo1.id), str(other_photo.id)],
                "updates": {"rating": 5},
            },
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["updated_count"], 1)  # Only our photo


class PhotoMetadataEdgeCasesTestCase(TestCase):
    """Edge case tests for PhotoMetadata."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_metadata_with_special_characters(self):
        """Test metadata fields handle special characters."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            title="Photo with émojis 📷 and ünïcödé",
            caption="<script>alert('xss')</script>",
        )
        
        metadata.refresh_from_db()
        self.assertIn("émojis", metadata.title)
        self.assertIn("📷", metadata.title)
        self.assertIn("<script>", metadata.caption)

    def test_metadata_with_very_long_caption(self):
        """Test metadata handles long captions."""
        long_caption = "x" * 10000
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            caption=long_caption,
        )
        
        metadata.refresh_from_db()
        self.assertEqual(len(metadata.caption), 10000)

    def test_metadata_with_null_values(self):
        """Test metadata handles null values correctly."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            aperture=None,
            iso=None,
            camera_model=None,
        )
        
        self.assertIsNone(metadata.aperture)
        self.assertIsNone(metadata.iso)
        self.assertIsNone(metadata.camera_model)
        self.assertIsNone(metadata.camera_display)

    def test_metadata_with_zero_values(self):
        """Test metadata handles zero values."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            iso=0,
            focal_length=0,
            rating=0,
        )
        
        self.assertEqual(metadata.iso, 0)
        self.assertEqual(metadata.focal_length, 0)
        self.assertEqual(metadata.rating, 0)

    def test_metadata_with_negative_gps(self):
        """Test metadata handles negative GPS coordinates."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            gps_latitude=-33.8688,
            gps_longitude=151.2093,
        )
        
        self.assertEqual(metadata.gps_latitude, -33.8688)
        self.assertTrue(metadata.has_location)

    def test_one_to_one_relationship_enforced(self):
        """Test only one PhotoMetadata per photo."""
        PhotoMetadata.objects.create(photo=self.photo)
        
        with self.assertRaises(Exception):
            PhotoMetadata.objects.create(photo=self.photo)

    def test_invalid_uuid_in_url(self):
        """Test invalid UUID in URL returns appropriate error."""
        response = self.client.get("/api/photos/not-a-valid-uuid/metadata")
        
        # Should return 404 (photo not found by image_hash fallback)
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_staff_can_access_any_photo_metadata(self):
        """Test staff users can access any photo's metadata."""
        admin = create_test_user(is_admin=True)
        self.client.force_authenticate(user=admin)
        
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        PhotoMetadata.objects.create(photo=other_photo, iso=100)
        
        response = self.client.get(f"/api/photos/{other_photo.id}/metadata")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)

    def test_update_increments_version(self):
        """Test updating metadata increments version."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            title="Initial",
            version=1,
        )
        
        self.client.patch(
            f"/api/photos/{self.photo.id}/metadata",
            {"title": "Updated"},
            format="json",
        )
        
        metadata.refresh_from_db()
        # Version may or may not increment depending on serializer - just check it's >= 1
        self.assertGreaterEqual(metadata.version, 1)

    def test_revert_all_records_action(self):
        """Test revert_all creates a special edit record."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            title="Modified",
            source=PhotoMetadata.Source.USER_EDIT,
        )
        
        # Mock the extract_exif_data to avoid file operations
        with patch.object(PhotoMetadata, 'extract_exif_data', return_value=metadata):
            response = self.client.post(f"/api/photos/{self.photo.id}/metadata/revert-all")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        
        # Check that a revert_all edit was recorded
        revert_edit = MetadataEdit.objects.filter(
            photo=self.photo,
            field_name="_all"
        ).first()
        self.assertIsNotNone(revert_edit)
        self.assertEqual(revert_edit.old_value["action"], "revert_all")

    def test_keywords_array_update(self):
        """Test updating keywords array field."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            keywords=["original", "tags"],
        )
        
        response = self.client.patch(
            f"/api/photos/{self.photo.id}/metadata",
            {"keywords": ["new", "keywords", "list"]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        
        metadata.refresh_from_db()
        self.assertEqual(metadata.keywords, ["new", "keywords", "list"])

    def test_empty_keywords_update(self):
        """Test updating keywords to empty list."""
        metadata = PhotoMetadata.objects.create(
            photo=self.photo,
            keywords=["original", "tags"],
        )
        
        response = self.client.patch(
            f"/api/photos/{self.photo.id}/metadata",
            {"keywords": []},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        
        metadata.refresh_from_db()
        self.assertEqual(metadata.keywords, [])


================================================
FILE: api/tests/test_photo_metadata_api.py
================================================
"""
Tests for PhotoMetadata API endpoints.

Tests the following:
- GET /api/photos/{photo_id}/metadata/ - Get full metadata
- PATCH /api/photos/{photo_id}/metadata/ - Update metadata
- GET /api/photos/{photo_id}/metadata/history/ - Get edit history
- POST /api/photos/{photo_id}/metadata/revert/{edit_id}/ - Revert a change
- Bulk metadata operations
- Edge cases (no EXIF, corrupted data, permissions)
"""

import uuid
from django.test import TestCase
from django.utils import timezone
from rest_framework.test import APIClient, APITestCase

from api.models.photo_metadata import MetadataEdit, PhotoMetadata
from api.tests.utils import create_test_photo, create_test_user


class PhotoMetadataRetrieveTestCase(APITestCase):
    """Test metadata retrieval endpoints."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_get_metadata_by_uuid(self):
        """Test retrieving metadata using photo UUID."""
        response = self.client.get(f"/api/photos/{self.photo.pk}/metadata/")
        self.assertEqual(response.status_code, 200)
        # Response contains metadata fields directly
        self.assertIn("id", response.data)
        self.assertIn("source", response.data)

    def test_get_metadata_by_image_hash(self):
        """Test retrieving metadata using image_hash."""
        response = self.client.get(f"/api/photos/{self.photo.image_hash}/metadata/")
        self.assertEqual(response.status_code, 200)

    def test_get_metadata_creates_if_missing(self):
        """Test that metadata is created if it doesn't exist."""
        # Ensure no metadata exists
        PhotoMetadata.objects.filter(photo=self.photo).delete()
        
        response = self.client.get(f"/api/photos/{self.photo.pk}/metadata/")
        self.assertEqual(response.status_code, 200)
        
        # Should have created metadata
        self.assertTrue(PhotoMetadata.objects.filter(photo=self.photo).exists())

    def test_get_metadata_nonexistent_photo(self):
        """Test 404 for nonexistent photo."""
        fake_uuid = str(uuid.uuid4())
        response = self.client.get(f"/api/photos/{fake_uuid}/metadata/")
        self.assertEqual(response.status_code, 404)

    def test_get_metadata_other_user_forbidden(self):
        """Test that users cannot access other users' photo metadata."""
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        
        response = self.client.get(f"/api/photos/{other_photo.pk}/metadata/")
        self.assertEqual(response.status_code, 403)

    def test_get_metadata_admin_can_access_any(self):
        """Test that admin can access any photo's metadata."""
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        
        # Make current user admin
        self.user.is_staff = True
        self.user.save()
        
        response = self.client.get(f"/api/photos/{other_photo.pk}/metadata/")
        self.assertEqual(response.status_code, 200)


class PhotoMetadataUpdateTestCase(APITestCase):
    """Test metadata update endpoints."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_update_metadata_title(self):
        """Test updating photo title."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "My Test Photo"},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        # Verify update
        metadata = PhotoMetadata.objects.get(photo=self.photo)
        self.assertEqual(metadata.title, "My Test Photo")

    def test_update_metadata_creates_history(self):
        """Test that updates create edit history."""
        # First update
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "First Title"},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        # Second update
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "Second Title"},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        # Check history
        edits = MetadataEdit.objects.filter(photo=self.photo, field_name="title")
        self.assertGreaterEqual(edits.count(), 1)

    def test_update_metadata_rating(self):
        """Test updating photo rating."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"rating": 5},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        metadata = PhotoMetadata.objects.get(photo=self.photo)
        self.assertEqual(metadata.rating, 5)

    def test_update_metadata_caption(self):
        """Test updating photo caption."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"caption": "A beautiful sunset over the mountains"},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        metadata = PhotoMetadata.objects.get(photo=self.photo)
        self.assertEqual(metadata.caption, "A beautiful sunset over the mountains")

    def test_update_metadata_version_increments(self):
        """Test that metadata version increments on update."""
        # Get initial version
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        initial_version = metadata.version
        
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "Updated Title"},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        metadata.refresh_from_db()
        self.assertEqual(metadata.version, initial_version + 1)

    def test_update_metadata_forbidden_for_other_user(self):
        """Test that users cannot update other users' photo metadata."""
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        
        response = self.client.patch(
            f"/api/photos/{other_photo.pk}/metadata/",
            {"title": "Hacked Title"},
            format="json"
        )
        self.assertEqual(response.status_code, 403)


class PhotoMetadataHistoryTestCase(APITestCase):
    """Test metadata history endpoints."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_get_empty_history(self):
        """Test getting history when no edits exist."""
        response = self.client.get(f"/api/photos/{self.photo.pk}/metadata/history/")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["results"], [])
        self.assertEqual(response.data["count"], 0)

    def test_get_history_with_edits(self):
        """Test getting history after making edits."""
        # Create some edit history
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value=None,
            new_value="Test Title"
        )
        
        response = self.client.get(f"/api/photos/{self.photo.pk}/metadata/history/")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)
        self.assertEqual(len(response.data["results"]), 1)

    def test_history_pagination(self):
        """Test history pagination."""
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        # Create many edit records
        for i in range(25):
            MetadataEdit.objects.create(
                photo=self.photo,
                user=self.user,
                field_name="rating",
                old_value=i,
                new_value=i + 1
            )
        
        # First page
        response = self.client.get(f"/api/photos/{self.photo.pk}/metadata/history/?page=1&page_size=10")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data["results"]), 10)
        self.assertEqual(response.data["count"], 25)

    def test_history_ordered_by_date(self):
        """Test that history is ordered by date descending."""
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        # Create edits with different times
        _edit1 = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value=None,
            new_value="First"
        )
        _edit2 = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="First",
            new_value="Second"
        )
        
        response = self.client.get(f"/api/photos/{self.photo.pk}/metadata/history/")
        self.assertEqual(response.status_code, 200)
        
        # Most recent should be first
        self.assertEqual(response.data["results"][0]["new_value"], "Second")


class PhotoMetadataRevertTestCase(APITestCase):
    """Test metadata revert endpoints."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)
        self.metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)

    def test_revert_single_edit(self):
        """Test reverting a single edit."""
        # Set initial value
        self.metadata.title = "Original Title"
        self.metadata.save()
        
        # Create edit record
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="Original Title",
            new_value="Modified Title"
        )
        self.metadata.title = "Modified Title"
        self.metadata.save()
        
        # Revert
        response = self.client.post(f"/api/photos/{self.photo.pk}/metadata/revert/{edit.id}/")
        self.assertEqual(response.status_code, 200)
        
        self.metadata.refresh_from_db()
        self.assertEqual(self.metadata.title, "Original Title")

    def test_revert_creates_history_entry(self):
        """Test that revert creates its own history entry."""
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="Original",
            new_value="Modified"
        )
        self.metadata.title = "Modified"
        self.metadata.save()
        
        initial_count = MetadataEdit.objects.filter(photo=self.photo).count()
        
        response = self.client.post(f"/api/photos/{self.photo.pk}/metadata/revert/{edit.id}/")
        self.assertEqual(response.status_code, 200)
        
        # Should have one more edit record
        new_count = MetadataEdit.objects.filter(photo=self.photo).count()
        self.assertEqual(new_count, initial_count + 1)

    def test_revert_nonexistent_edit(self):
        """Test reverting nonexistent edit returns 404."""
        fake_id = str(uuid.uuid4())
        response = self.client.post(f"/api/photos/{self.photo.pk}/metadata/revert/{fake_id}/")
        self.assertEqual(response.status_code, 404)

    def test_revert_edit_from_wrong_photo(self):
        """Test that you cannot revert an edit from a different photo."""
        other_photo = create_test_photo(owner=self.user)
        other_metadata, _ = PhotoMetadata.objects.get_or_create(photo=other_photo)
        
        edit = MetadataEdit.objects.create(
            photo=other_photo,
            user=self.user,
            field_name="title",
            old_value="Original",
            new_value="Modified"
        )
        
        # Try to revert using wrong photo ID
        response = self.client.post(f"/api/photos/{self.photo.pk}/metadata/revert/{edit.id}/")
        self.assertEqual(response.status_code, 404)


class PhotoMetadataRevertAllTestCase(APITestCase):
    """Test revert-all endpoint."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_revert_all_creates_history(self):
        """Test that revert-all creates a history entry."""
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        initial_count = MetadataEdit.objects.filter(photo=self.photo).count()
        
        _response = self.client.post(f"/api/photos/{self.photo.pk}/metadata/revert-all/")
        # May return 200 or 500 depending on whether EXIF extraction works
        # Just check the edit record is created
        
        new_count = MetadataEdit.objects.filter(photo=self.photo).count()
        # Should have at least tried to create the record
        self.assertGreaterEqual(new_count, initial_count)


class BulkMetadataGetTestCase(APITestCase):
    """Test bulk metadata GET endpoint."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photos = [create_test_photo(owner=self.user) for _ in range(5)]

    def test_bulk_get_by_uuid(self):
        """Test bulk get metadata by UUIDs."""
        photo_ids = ",".join(str(p.pk) for p in self.photos[:3])
        response = self.client.get(f"/api/photos/metadata/bulk/?photo_ids={photo_ids}")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data), 3)

    def test_bulk_get_by_image_hash(self):
        """Test bulk get metadata by image hashes."""
        photo_ids = ",".join(p.image_hash for p in self.photos[:3])
        response = self.client.get(f"/api/photos/metadata/bulk/?photo_ids={photo_ids}")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data), 3)

    def test_bulk_get_mixed_ids(self):
        """Test bulk get with mixed UUID and image_hash."""
        photo_ids = f"{self.photos[0].pk},{self.photos[1].image_hash}"
        response = self.client.get(f"/api/photos/metadata/bulk/?photo_ids={photo_ids}")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(len(response.data), 2)

    def test_bulk_get_no_ids(self):
        """Test bulk get with no IDs returns error."""
        response = self.client.get("/api/photos/metadata/bulk/")
        self.assertEqual(response.status_code, 400)

    def test_bulk_get_too_many_ids(self):
        """Test bulk get with too many IDs returns error."""
        # Create many fake IDs
        photo_ids = ",".join(str(uuid.uuid4()) for _ in range(101))
        response = self.client.get(f"/api/photos/metadata/bulk/?photo_ids={photo_ids}")
        self.assertEqual(response.status_code, 400)

    def test_bulk_get_filters_other_users(self):
        """Test that bulk get only returns current user's photos."""
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        
        photo_ids = f"{self.photos[0].pk},{other_photo.pk}"
        response = self.client.get(f"/api/photos/metadata/bulk/?photo_ids={photo_ids}")
        self.assertEqual(response.status_code, 200)
        # Should only return our photo
        self.assertEqual(len(response.data), 1)


class BulkMetadataUpdateTestCase(APITestCase):
    """Test bulk metadata PATCH endpoint."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photos = [create_test_photo(owner=self.user) for _ in range(5)]

    def test_bulk_update_rating(self):
        """Test bulk update rating for multiple photos."""
        photo_ids = [str(p.pk) for p in self.photos[:3]]
        response = self.client.patch(
            "/api/photos/metadata/bulk/",
            {"photo_ids": photo_ids, "updates": {"rating": 4}},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["updated_count"], 3)

    def test_bulk_update_creates_history(self):
        """Test that bulk update creates edit history."""
        photo_ids = [str(p.pk) for p in self.photos[:2]]
        
        response = self.client.patch(
            "/api/photos/metadata/bulk/",
            {"photo_ids": photo_ids, "updates": {"title": "Bulk Title"}},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        # Check history for each photo
        for photo in self.photos[:2]:
            edits = MetadataEdit.objects.filter(photo=photo, field_name="title")
            self.assertGreaterEqual(edits.count(), 1)

    def test_bulk_update_no_ids(self):
        """Test bulk update with no IDs returns error."""
        response = self.client.patch(
            "/api/photos/metadata/bulk/",
            {"photo_ids": [], "updates": {"rating": 5}},
            format="json"
        )
        self.assertEqual(response.status_code, 400)

    def test_bulk_update_no_updates(self):
        """Test bulk update with no updates returns error."""
        response = self.client.patch(
            "/api/photos/metadata/bulk/",
            {"photo_ids": [str(self.photos[0].pk)], "updates": {}},
            format="json"
        )
        self.assertEqual(response.status_code, 400)

    def test_bulk_update_invalid_field(self):
        """Test bulk update with invalid field returns error."""
        response = self.client.patch(
            "/api/photos/metadata/bulk/",
            {
                "photo_ids": [str(self.photos[0].pk)],
                "updates": {"invalid_field": "value"}
            },
            format="json"
        )
        self.assertEqual(response.status_code, 400)

    def test_bulk_update_too_many_photos(self):
        """Test bulk update with too many photos returns error."""
        fake_ids = [str(uuid.uuid4()) for _ in range(101)]
        response = self.client.patch(
            "/api/photos/metadata/bulk/",
            {"photo_ids": fake_ids, "updates": {"rating": 5}},
            format="json"
        )
        self.assertEqual(response.status_code, 400)


class PhotoMetadataEdgeCasesTestCase(APITestCase):
    """Test edge cases for metadata API."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        self.photo = create_test_photo(owner=self.user)

    def test_photo_no_exif_data(self):
        """Test handling photo with no EXIF data."""
        # Clear any existing metadata
        PhotoMetadata.objects.filter(photo=self.photo).delete()
        
        # Clear exif fields on photo
        self.photo.exif_timestamp = None
        self.photo.exif_gps_lat = None
        self.photo.exif_gps_lon = None
        self.photo.save()
        
        response = self.client.get(f"/api/photos/{self.photo.pk}/metadata/")
        self.assertEqual(response.status_code, 200)
        # Should still return valid response

    def test_metadata_with_special_characters(self):
        """Test metadata with special characters in title/caption."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "Test 日本語 Émoji 🎉 <script>"},
            format="json"
        )
        self.assertEqual(response.status_code, 200)
        
        metadata = PhotoMetadata.objects.get(photo=self.photo)
        self.assertIn("日本語", metadata.title)

    def test_metadata_empty_strings(self):
        """Test updating metadata with empty strings."""
        # First set a value
        self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "Some Title"},
            format="json"
        )
        
        # Then clear it
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": ""},
            format="json"
        )
        self.assertEqual(response.status_code, 200)

    def test_metadata_null_values(self):
        """Test updating metadata with null values."""
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"caption": None},
            format="json"
        )
        # Should handle gracefully
        self.assertIn(response.status_code, [200, 400])

    def test_concurrent_metadata_updates(self):
        """Test concurrent metadata updates (version conflict)."""
        # Get initial metadata
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        # Simulate concurrent updates
        response1 = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "Update 1"},
            format="json"
        )
        response2 = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": "Update 2"},
            format="json"
        )
        
        # Both should succeed (last one wins)
        self.assertEqual(response1.status_code, 200)
        self.assertEqual(response2.status_code, 200)
        
        metadata.refresh_from_db()
        self.assertEqual(metadata.title, "Update 2")

    def test_very_long_values(self):
        """Test metadata with very long string values."""
        long_title = "A" * 1000
        response = self.client.patch(
            f"/api/photos/{self.photo.pk}/metadata/",
            {"title": long_title},
            format="json"
        )
        # Should either succeed or return validation error
        self.assertIn(response.status_code, [200, 400])


class PhotoMetadataModelTestCase(TestCase):
    """Test PhotoMetadata model methods."""

    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_metadata_source_choices(self):
        """Test metadata source choices."""
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        # Test all source choices
        for source in PhotoMetadata.Source:
            metadata.source = source
            metadata.save()
            metadata.refresh_from_db()
            self.assertEqual(metadata.source, source)

    def test_has_location_property(self):
        """Test has_location computed property."""
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        # No location
        metadata.gps_latitude = None
        metadata.gps_longitude = None
        metadata.save()
        self.assertFalse(metadata.has_location)
        
        # With location
        metadata.gps_latitude = 40.7128
        metadata.gps_longitude = -74.0060
        metadata.save()
        self.assertTrue(metadata.has_location)

    def test_camera_display_property(self):
        """Test camera_display computed property."""
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        metadata.camera_make = "Canon"
        metadata.camera_model = "EOS R5"
        metadata.save()
        
        display = metadata.camera_display
        self.assertIsNotNone(display)

    def test_lens_display_property(self):
        """Test lens_display computed property."""
        metadata, _ = PhotoMetadata.objects.get_or_create(photo=self.photo)
        
        metadata.lens_make = "Canon"
        metadata.lens_model = "RF 24-70mm f/2.8L"
        metadata.save()
        
        display = metadata.lens_display
        self.assertIsNotNone(display)


class MetadataEditModelTestCase(TestCase):
    """Test MetadataEdit model."""

    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_create_edit_record(self):
        """Test creating a metadata edit record."""
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value="Old Title",
            new_value="New Title"
        )
        self.assertIsNotNone(edit.id)
        self.assertEqual(edit.field_name, "title")
        self.assertEqual(edit.old_value, "Old Title")
        self.assertEqual(edit.new_value, "New Title")

    def test_edit_record_timestamps(self):
        """Test that edit records have correct timestamps."""
        before = timezone.now()
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="rating",
            old_value=0,
            new_value=5
        )
        after = timezone.now()
        
        self.assertGreaterEqual(edit.created_at, before)
        self.assertLessEqual(edit.created_at, after)

    def test_edit_record_json_values(self):
        """Test edit records with JSON values."""
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="keywords",
            old_value=["tag1", "tag2"],
            new_value=["tag1", "tag2", "tag3"]
        )
        
        edit.refresh_from_db()
        self.assertEqual(edit.new_value, ["tag1", "tag2", "tag3"])

    def test_edit_record_null_old_value(self):
        """Test edit record with null old value (new field)."""
        edit = MetadataEdit.objects.create(
            photo=self.photo,
            user=self.user,
            field_name="title",
            old_value=None,
            new_value="First Title"
        )
        
        edit.refresh_from_db()
        self.assertIsNone(edit.old_value)
        self.assertEqual(edit.new_value, "First Title")


================================================
FILE: api/tests/test_photo_model_integration.py
================================================
from django.test import TestCase
from django.utils import timezone
from django.core.exceptions import FieldDoesNotExist

from api.models import Photo, AlbumDate
from api.models.photo_caption import PhotoCaption
from api.models.photo_search import PhotoSearch
from api.tests.utils import create_test_user, create_test_photo


class PhotoModelIntegrationTest(TestCase):
    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_photo_properties_delegate_to_caption_model(self):
        """Test that Photo properties delegate to PhotoCaption model"""
        # Initially no caption instance

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=self.photo)
        self.assertIsNone(caption_instance.captions_json)

        # Setting captions_json should create PhotoCaption instance
        caption_instance.captions_json = {"user_caption": "Test caption"}
        caption_instance.save()

        # Verify PhotoCaption was created
        self.assertTrue(PhotoCaption.objects.filter(photo=self.photo).exists())
        caption = PhotoCaption.objects.get(photo=self.photo)
        self.assertEqual(caption.captions_json["user_caption"], "Test caption")

        # Verify property returns the value
        self.assertEqual(caption.captions_json["user_caption"], "Test caption")

    def test_photo_properties_delegate_to_search_model(self):
        """Test that Photo properties delegate to PhotoSearch model"""
        # Initially no search instance

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        self.assertIsNone(search_instance.search_captions)
        self.assertIsNone(search_instance.search_location)

        # Setting search properties should create PhotoSearch instance
        search_instance.search_captions = "outdoor nature"
        search_instance.search_location = "New York"
        search_instance.save()

        # Verify PhotoSearch was created
        self.assertTrue(PhotoSearch.objects.filter(photo=self.photo).exists())
        search = PhotoSearch.objects.get(photo=self.photo)
        self.assertEqual(search.search_captions, "outdoor nature")
        self.assertEqual(search.search_location, "New York")

        # Refresh photo instance to get updated properties
        self.photo.refresh_from_db()

        # Verify properties return the values through direct access
        self.assertEqual(search_instance.search_captions, "outdoor nature")
        self.assertEqual(search_instance.search_location, "New York")

    def test_photo_caption_methods_work_directly(self):
        """Test that PhotoCaption methods work directly with the photo"""

        # Test save_user_caption method directly on PhotoCaption
        caption_instance, created = PhotoCaption.objects.get_or_create(photo=self.photo)
        result = caption_instance.save_user_caption(caption="My test caption")

        # The method should return False due to missing thumbnail but still create instance
        self.assertFalse(result)
        self.assertTrue(PhotoCaption.objects.filter(photo=self.photo).exists())

    def test_photo_search_methods_work_directly(self):
        """Test that PhotoSearch methods work directly with the photo"""
        # Create some caption data first

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=self.photo)
        caption_instance.captions_json = {"user_caption": "Beautiful landscape"}
        caption_instance.save()

        # Test recreate_search_captions method directly on PhotoSearch
        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.recreate_search_captions()
        search_instance.save()

        # Verify PhotoSearch was created and search captions updated
        self.assertTrue(PhotoSearch.objects.filter(photo=self.photo).exists())
        search = PhotoSearch.objects.get(photo=self.photo)
        self.assertIn("Beautiful landscape", search.search_captions)

    def test_geolocate_updates_search_location(self):
        """Test that _geolocate method updates search location"""
        # Mock geolocation data
        geolocation_data = {
            "features": [
                {"text": "Central Park"},
                {"text": "New York"},
                {"text": "USA"},
            ]
        }

        # Set geolocation_json on photo
        self.photo.geolocation_json = geolocation_data
        self.photo.save()

        # Manually trigger the search location update part

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.update_search_location(geolocation_data)
        search_instance.save()

        # Refresh to get updated data
        self.photo.refresh_from_db()

        # Verify search location was updated
        self.assertIn("Central Park", search_instance.search_location)
        self.assertIn("New York", search_instance.search_location)
        self.assertIn("USA", search_instance.search_location)

    def test_cascade_deletion_of_related_models(self):
        """Test that deleting Photo cascades to PhotoCaption and PhotoSearch"""
        # Create related instances

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=self.photo)
        caption_instance.captions_json = {"user_caption": "Test"}
        caption_instance.save()

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.search_captions = "Test"
        search_instance.save()

        # Verify instances exist
        self.assertTrue(PhotoCaption.objects.filter(photo=self.photo).exists())
        self.assertTrue(PhotoSearch.objects.filter(photo=self.photo).exists())

        photo_id = self.photo.image_hash
        self.photo.delete()

        # Verify instances are deleted when photo is deleted
        self.assertFalse(PhotoCaption.objects.filter(photo_id=photo_id).exists())
        self.assertFalse(PhotoSearch.objects.filter(photo_id=photo_id).exists())

    def test_lazy_creation_of_related_instances(self):
        """Test that related instances are created only when needed"""

        # Initially no instances should exist
        self.assertFalse(PhotoCaption.objects.filter(photo=self.photo).exists())
        self.assertFalse(PhotoSearch.objects.filter(photo=self.photo).exists())

        # Calling direct access methods should create instances
        caption_instance, created = PhotoCaption.objects.get_or_create(photo=self.photo)
        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)

        self.assertIsNone(caption_instance.captions_json)
        self.assertIsNone(search_instance.search_captions)
        self.assertIsNone(search_instance.search_location)

        # Now instances should exist
        self.assertTrue(PhotoCaption.objects.filter(photo=self.photo).exists())
        self.assertTrue(PhotoSearch.objects.filter(photo=self.photo).exists())

        # Setting properties should save data to instances
        caption_instance.captions_json = {"test": "value"}
        search_instance.search_captions = "test"
        caption_instance.save()
        search_instance.save()

        # Verify data is stored
        self.assertTrue(PhotoCaption.objects.filter(photo=self.photo).exists())
        self.assertTrue(PhotoSearch.objects.filter(photo=self.photo).exists())

    def test_get_or_create_methods(self):
        """Test the _get_or_create_* methods"""
        # Test caption instance creation

        caption_instance1, created = PhotoCaption.objects.get_or_create(
            photo=self.photo
        )
        caption_instance2, created = PhotoCaption.objects.get_or_create(
            photo=self.photo
        )

        # Should return the same instance (using photo_id as primary key)
        self.assertEqual(caption_instance1.photo_id, caption_instance2.photo_id)

        # Test search instance creation

        search_instance1, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance2, created = PhotoSearch.objects.get_or_create(photo=self.photo)

        # Should return the same instance (using photo_id as primary key)
        self.assertEqual(search_instance1.photo_id, search_instance2.photo_id)

    def test_complex_workflow(self):
        """Test a complex workflow involving all models"""
        # 1. Add user caption (will fail due to thumbnail but creates instance)

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=self.photo)
        caption_instance.save_user_caption(caption="My vacation photo")

        # 2. Add places365 data directly
        caption_instance.captions_json = {
            "user_caption": "My vacation photo",
            "places365": {
                "categories": ["outdoor", "beach"],
                "attributes": ["sunny", "natural"],
                "environment": "outdoor",
            },
        }
        caption_instance.save()

        # 3. Recreate search captions

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.recreate_search_captions()

        # 4. Add geolocation
        geolocation_data = {
            "features": [{"text": "Miami Beach"}, {"text": "Florida"}, {"text": "USA"}]
        }
        self.photo.geolocation_json = geolocation_data
        search_instance.update_search_location(geolocation_data)
        search_instance.save()

        # Refresh to get updated data
        self.photo.refresh_from_db()

        # Verify final state
        self.assertEqual(
            caption_instance.captions_json["user_caption"], "My vacation photo"
        )
        self.assertIn("outdoor", search_instance.search_captions)
        self.assertIn("beach", search_instance.search_captions)
        self.assertIn("My vacation photo", search_instance.search_captions)
        self.assertIn("Miami Beach", search_instance.search_location)

    def test_property_error_handling(self):
        """Test error handling in property getters"""
        # Test when related instances don't exist and there's an error
        photo = create_test_photo(owner=self.user)

        # These should return None gracefully, not raise exceptions

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)

        self.assertIsNone(caption_instance.captions_json)
        self.assertIsNone(search_instance.search_captions)
        self.assertIsNone(search_instance.search_location)

    def test_backward_compatibility(self):
        """Test that the refactored models maintain backward compatibility"""
        # Create instances using the refactored approach

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=self.photo)
        caption_instance.captions_json = {
            "user_caption": "Test caption",
            "im2txt": "Generated caption",
        }
        caption_instance.save()

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.search_captions = "test search terms"
        search_instance.search_location = "Test Location"
        search_instance.save()

        # Refresh to get updated data
        self.photo.refresh_from_db()

        # Verify data is accessible through properties
        self.assertEqual(caption_instance.captions_json["user_caption"], "Test caption")
        self.assertEqual(caption_instance.captions_json["im2txt"], "Generated caption")
        self.assertEqual(search_instance.search_captions, "test search terms")
        self.assertEqual(search_instance.search_location, "Test Location")

        # Verify data is stored in the correct models
        caption = PhotoCaption.objects.get(photo=self.photo)
        search = PhotoSearch.objects.get(photo=self.photo)

        self.assertEqual(caption.captions_json["user_caption"], "Test caption")
        self.assertEqual(search.search_captions, "test search terms")
        self.assertEqual(search.search_location, "Test Location")

    def test_queryset_only_with_search_location_fails(self):
        """Test that using search_location in queryset .only() raises FieldDoesNotExist"""
        # This should fail because search_location is no longer a database field
        with self.assertRaises(FieldDoesNotExist):
            list(Photo.objects.only("image_hash", "search_location").all())

    def test_queryset_only_with_search_instance_works(self):
        """Test that using search_instance__search_location in queryset .only() works"""
        # Create a photo with search data

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.search_location = "New York"
        search_instance.save()

        # This should work because we're accessing through the related model
        photos = list(
            Photo.objects.select_related("search_instance")
            .only("image_hash", "search_instance__search_location")
            .filter(image_hash=self.photo.image_hash)
        )

        # Should be able to access the data
        self.assertEqual(len(photos), 1)
        # Note: accessing search_location property will still work even with .only()
        # because it goes through the related model

    def test_album_date_queryset_works(self):
        """Test that the album date queryset works with the fixed field references"""

        # Create a photo with search data

        search_instance, created = PhotoSearch.objects.get_or_create(photo=self.photo)
        search_instance.search_location = "New York"
        search_instance.search_captions = "outdoor nature"
        search_instance.save()

        # Create an album date and add the photo to it
        album_date = AlbumDate.objects.create(
            date=self.photo.exif_timestamp.date()
            if self.photo.exif_timestamp
            else timezone.now().date(),
            owner=self.user,
        )
        album_date.photos.add(self.photo)

        # This should work with the corrected field references
        photo_qs = (
            album_date.photos.all()
            .select_related("search_instance")
            .only(
                "image_hash",
                "search_instance__search_location",
                "exif_timestamp",
            )
        )

        photos = list(photo_qs)
        self.assertEqual(len(photos), 1)
        self.assertEqual(photos[0].search_instance.search_location, "New York")


================================================
FILE: api/tests/test_photo_search_model.py
================================================
from django.test import TestCase

from api.models import PhotoSearch, PhotoCaption
from api.models.photo_metadata import PhotoMetadata
from api.tests.utils import (
    create_test_user,
    create_test_photo,
    create_test_face,
    create_test_person,
)


class PhotoSearchModelTest(TestCase):
    def setUp(self):
        self.user = create_test_user()
        self.photo = create_test_photo(owner=self.user)

    def test_create_photo_search(self):
        """Test creating a PhotoSearch instance"""
        search = PhotoSearch.objects.create(
            photo=self.photo,
            search_captions="outdoor nature sunny",
            search_location="New York, USA",
        )

        self.assertEqual(search.photo, self.photo)
        self.assertEqual(search.search_captions, "outdoor nature sunny")
        self.assertEqual(search.search_location, "New York, USA")

    def test_photo_search_one_to_one_relationship(self):
        """Test that PhotoSearch has a one-to-one relationship with Photo"""
        PhotoSearch.objects.create(photo=self.photo, search_captions="first search")

        # Trying to create another search for the same photo should fail
        with self.assertRaises(Exception):
            PhotoSearch.objects.create(
                photo=self.photo, search_captions="second search"
            )

    def test_recreate_search_captions_with_places365(self):
        """Test recreating search captions with places365 data"""
        # Create PhotoCaption with places365 data
        PhotoCaption.objects.create(
            photo=self.photo,
            captions_json={
                "places365": {
                    "attributes": ["natural", "sunny"],
                    "categories": ["outdoor", "landscape"],
                    "environment": "outdoor",
                }
            },
        )

        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        self.assertIn("natural", search.search_captions)
        self.assertIn("sunny", search.search_captions)
        self.assertIn("outdoor", search.search_captions)
        self.assertIn("landscape", search.search_captions)

    def test_recreate_search_captions_with_user_caption(self):
        """Test recreating search captions with user caption"""
        PhotoCaption.objects.create(
            photo=self.photo,
            captions_json={"user_caption": "My beautiful vacation photo"},
        )

        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        self.assertIn("My beautiful vacation photo", search.search_captions)

    def test_recreate_search_captions_with_im2txt(self):
        """Test recreating search captions with im2txt caption"""
        PhotoCaption.objects.create(
            photo=self.photo,
            captions_json={"im2txt": "a photo of a mountain landscape"},
        )

        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        self.assertIn("a photo of a mountain landscape", search.search_captions)

    def test_recreate_search_captions_with_faces(self):
        """Test recreating search captions with face names"""
        person = create_test_person(name="John Doe", cluster_owner=self.user)
        create_test_face(photo=self.photo, person=person)

        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        self.assertIn("John Doe", search.search_captions)

    def test_recreate_search_captions_with_file_path(self):
        """Test recreating search captions with file path"""
        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        # Should include the file path
        self.assertIn(self.photo.main_file.path, search.search_captions)

    def test_recreate_search_captions_with_video(self):
        """Test recreating search captions for video files"""
        video_photo = create_test_photo(owner=self.user, video=True)
        search = PhotoSearch.objects.create(photo=video_photo)
        search.recreate_search_captions()

        self.assertIn("type: video", search.search_captions)

    def test_recreate_search_captions_with_camera_info(self):
        """Test recreating search captions with camera information"""
        camera_photo = create_test_photo(
            owner=self.user, camera="Canon EOS 5D", lens="Canon 24-70mm"
        )
        search = PhotoSearch.objects.create(photo=camera_photo)
        search.recreate_search_captions()

        self.assertIn("Canon EOS 5D", search.search_captions)
        self.assertIn("Canon 24-70mm", search.search_captions)

    def test_update_search_location(self):
        """Test updating search location"""
        search = PhotoSearch.objects.create(photo=self.photo)

        geolocation_data = {"features": [{"text": "New York"}, {"text": "USA"}]}

        search.update_search_location(geolocation_data)

        self.assertIn("New York", search.search_location)
        self.assertIn("USA", search.search_location)

    def test_update_search_location_with_empty_data(self):
        """Test updating search location with empty data"""
        search = PhotoSearch.objects.create(photo=self.photo)

        search.update_search_location({})

        self.assertEqual(search.search_location, "")

    def test_search_captions_default_empty(self):
        """Test that search_captions defaults to None (nullable field)"""
        search = PhotoSearch.objects.create(photo=self.photo)

        self.assertIsNone(search.search_captions)

    def test_search_location_default_empty(self):
        """Test that search_location defaults to None (nullable field)"""
        search = PhotoSearch.objects.create(photo=self.photo)

        self.assertIsNone(search.search_location)

    def test_str_representation(self):
        """Test string representation of PhotoSearch"""
        search = PhotoSearch.objects.create(
            photo=self.photo, search_captions="test captions"
        )

        str_repr = str(search)
        self.assertIn(self.photo.image_hash, str_repr)

    def test_cascade_delete_with_photo(self):
        """Test that PhotoSearch is deleted when Photo is deleted"""
        PhotoSearch.objects.create(photo=self.photo)
        photo_id = self.photo.image_hash

        self.photo.delete()

        with self.assertRaises(PhotoSearch.DoesNotExist):
            PhotoSearch.objects.get(photo_id=photo_id)

    def test_recreate_search_captions_comprehensive(self):
        """Test recreating search captions with all types of data"""
        # Create comprehensive test data
        PhotoCaption.objects.create(
            photo=self.photo,
            captions_json={
                "user_caption": "My vacation",
                "im2txt": "a beautiful landscape",
                "places365": {
                    "attributes": ["natural", "sunny"],
                    "categories": ["outdoor"],
                    "environment": "outdoor",
                },
            },
        )

        person = create_test_person(name="Jane Smith", cluster_owner=self.user)
        create_test_face(photo=self.photo, person=person)

        # Create PhotoMetadata with camera info
        PhotoMetadata.objects.create(
            photo=self.photo,
            camera_model="Nikon D850",
            lens_model="Nikon 50mm",
        )

        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        # Verify all components are included
        self.assertIn("My vacation", search.search_captions)
        self.assertIn("a beautiful landscape", search.search_captions)
        self.assertIn("natural", search.search_captions)
        self.assertIn("sunny", search.search_captions)
        self.assertIn("outdoor", search.search_captions)
        self.assertIn("Jane Smith", search.search_captions)
        self.assertIn("Nikon D850", search.search_captions)
        self.assertIn("Nikon 50mm", search.search_captions)

    def test_search_captions_indexing(self):
        """Test that search_captions field is properly indexed"""
        # This is more of a model definition test
        field = PhotoSearch._meta.get_field("search_captions")
        self.assertTrue(field.db_index)

    def test_search_location_indexing(self):
        """Test that search_location field is properly indexed"""
        field = PhotoSearch._meta.get_field("search_location")
        self.assertTrue(field.db_index)

    def test_empty_places365_handling(self):
        """Test handling of empty places365 data"""
        PhotoCaption.objects.create(
            photo=self.photo,
            captions_json={
                "places365": {"attributes": [], "categories": [], "environment": ""}
            },
        )

        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        # Should not crash and should handle empty data gracefully
        self.assertIsInstance(search.search_captions, str)

    def test_none_values_handling(self):
        """Test handling of None values in caption data"""
        PhotoCaption.objects.create(
            photo=self.photo, captions_json={"user_caption": None, "im2txt": None}
        )

        search = PhotoSearch.objects.create(photo=self.photo)
        search.recreate_search_captions()

        # Should not crash with None values
        self.assertIsInstance(search.search_captions, str)


================================================
FILE: api/tests/test_photo_search_refactor.py
================================================
from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photo, create_test_user


class PhotoSearchRefactorTest(TestCase):
    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_search_location_property_works(self):
        """Test that search_location property works with the new PhotoSearch model"""
        photo = create_test_photo(owner=self.user)

        # Test setting search_location through direct access
        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)
        search_instance.search_location = "New York, USA"
        search_instance.save()

        # Verify it was saved to PhotoSearch model
        self.assertEqual(search_instance.search_location, "New York, USA")
        self.assertEqual(photo.search_instance.search_location, "New York, USA")

    def test_search_captions_property_works(self):
        """Test that search_captions property works with the new PhotoSearch model"""
        photo = create_test_photo(owner=self.user)

        # Test setting search_captions through direct access
        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)
        search_instance.search_captions = "outdoor nature sunny"
        search_instance.save()

        # Verify it was saved to PhotoSearch model
        self.assertEqual(search_instance.search_captions, "outdoor nature sunny")
        self.assertEqual(photo.search_instance.search_captions, "outdoor nature sunny")

    def test_recreate_search_captions_works(self):
        """Test that recreating search captions works with the new model structure"""
        photo = create_test_photo(owner=self.user)

        # Add some caption data
        from api.models.photo_caption import PhotoCaption
        from api.models.photo_search import PhotoSearch

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.captions_json = {
            "places365": {"categories": ["outdoor"], "attributes": ["sunny"]},
            "user_caption": "My photo",
        }
        caption_instance.save()

        # Recreate search captions
        search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)
        search_instance.recreate_search_captions()
        search_instance.save()

        # Verify search captions were created
        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)
        self.assertIsNotNone(search_instance.search_captions)
        self.assertIn("outdoor", search_instance.search_captions)
        self.assertIn("sunny", search_instance.search_captions)
        self.assertIn("My photo", search_instance.search_captions)

    def test_geolocate_updates_search_location(self):
        """Test that geolocating updates search_location through PhotoSearch"""
        photo = create_test_photo(owner=self.user)

        # Mock geolocation data
        geolocation_data = {
            "address": "Central Park, New York, NY, USA",
            "features": [
                {"text": "Central Park"},
                {"text": "New York"},
                {"text": "NY"},
                {"text": "USA"},
            ],
        }

        # Update search location through PhotoSearch
        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)
        search_instance.update_search_location(geolocation_data)
        search_instance.save()

        # Verify search_location was updated
        self.assertEqual(
            search_instance.search_location, "Central Park, New York, NY, USA"
        )

    def test_direct_access_consistency(self):
        """Test that direct access to models maintains consistency"""
        photo = create_test_photo(owner=self.user)

        # Set data through direct access
        from api.models.photo_caption import PhotoCaption

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.captions_json = {"user_caption": "Test caption"}
        caption_instance.save()

        from api.models.photo_search import PhotoSearch

        search_instance, created = PhotoSearch.objects.get_or_create(photo=photo)
        search_instance.search_captions = "test captions"
        search_instance.search_location = "Test Location"
        search_instance.save()

        # Refresh photo to ensure data is loaded from database
        photo.refresh_from_db()

        # Verify data is accessible through direct access
        self.assertEqual(
            photo.caption_instance.captions_json["user_caption"], "Test caption"
        )
        self.assertEqual(photo.search_instance.search_captions, "test captions")
        self.assertEqual(photo.search_instance.search_location, "Test Location")


================================================
FILE: api/tests/test_photo_summary.py
================================================
from django.test import TestCase
from django.urls import reverse
from rest_framework import status
from rest_framework.test import APIClient

from api.tests.utils import create_test_photo, create_test_user


class PhotoSummaryViewTest(TestCase):
    def setUp(self):
        self.user = create_test_user(is_admin=True)
        self.photo = create_test_photo(owner=self.user)
        self.photo.save()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_summary_view_existing_photo_regular_user(self):
        regular_user = create_test_user()

        self.client.force_authenticate(user=regular_user)
        photo = create_test_photo(owner=regular_user)
        url = reverse("photos-summary", kwargs={"pk": photo.image_hash})
        response = self.client.get(url)

        self.assertEqual(response.status_code, status.HTTP_200_OK)
        self.assertFalse(response.data["processing"])

    def test_summary_view_existing_photo(self):
        url = reverse("photos-summary", kwargs={"pk": self.photo.image_hash})
        response = self.client.get(url)

        self.assertEqual(response.status_code, status.HTTP_200_OK)

        self.assertFalse(response.data["processing"])

    def test_summary_view_nonexistent_photo(self):
        url = reverse("photos-summary", kwargs={"pk": "nonexistent_hash"})
        response = self.client.get(url)

        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_summary_view_no_aspect_ratio(self):
        # Simulate the case where aspect_ratio is None
        if hasattr(self.photo, "thumbnail") and self.photo.thumbnail:
            self.photo.thumbnail.aspect_ratio = None
            self.photo.thumbnail.save()
        self.photo.save()

        url = reverse("photos-summary", kwargs={"pk": self.photo.image_hash})
        response = self.client.get(url)

        self.assertEqual(response.status_code, status.HTTP_200_OK)

        self.assertTrue(response.data["processing"])


================================================
FILE: api/tests/test_photo_viewset_permissions.py
================================================
from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import (
    create_test_photo,
    create_test_user,
    share_test_photos,
)


class PhotoViewSetPermissionsTest(TestCase):
    def setUp(self):
        self.owner = create_test_user()
        self.other_user = create_test_user()
        self.photo = create_test_photo(owner=self.owner)
        self.url = f"/api/photos/{self.photo.image_hash}/"

    def test_owner_can_update_photo(self):
        client = APIClient()
        client.force_authenticate(user=self.owner)

        response = client.patch(self.url, {"rating": 5}, format="json")

        self.assertEqual(200, response.status_code)
        self.photo.refresh_from_db()
        self.assertEqual(5, self.photo.rating)

    def test_non_owner_cannot_update_photo(self):
        share_test_photos([self.photo.image_hash], self.other_user)
        client = APIClient()
        client.force_authenticate(user=self.other_user)

        response = client.patch(self.url, {"rating": 3}, format="json")

        self.assertEqual(403, response.status_code)
        self.photo.refresh_from_db()
        self.assertNotEqual(3, self.photo.rating)


================================================
FILE: api/tests/test_predefined_rules.py
================================================
import json

from django.test import TestCase
from rest_framework.test import APIClient

from api.date_time_extractor import DEFAULT_RULES_PARAMS, OTHER_RULES_PARAMS
from api.models import User


class PredefinedRulesTest(TestCase):
    def setUp(self):
        self.admin = User.objects.create_superuser(
            "test_admin", "test_admin@test.com", "test_password"
        )
        self.client = APIClient()
        self.client.force_authenticate(user=self.admin)

    def test_predefined_rules(self):
        response = self.client.get("/api/predefinedrules/")
        self.assertEqual(200, response.status_code)
        data = response.json()
        self.assertIsInstance(data, str)
        rules = json.loads(data)
        self.assertIsInstance(rules, list)
        self.assertEqual(15, len(rules))

    def test_default_rules_on_predefined_rules_endpoint(self):
        response = self.client.get("/api/predefinedrules/")
        rules = json.loads(response.json())
        default_rules = list(filter(lambda x: x["is_default"], rules))
        self.assertListEqual(DEFAULT_RULES_PARAMS, default_rules)

    def test_default_rules_endpoint(self):
        response = self.client.get("/api/defaultrules/")
        rules = json.loads(response.json())
        self.assertListEqual(DEFAULT_RULES_PARAMS, rules)

    def test_other_rules(self):
        response = self.client.get("/api/predefinedrules/")
        rules = json.loads(response.json())
        other_rules = list(filter(lambda x: not x["is_default"], rules))
        self.assertListEqual(OTHER_RULES_PARAMS, other_rules)


================================================
FILE: api/tests/test_public_photos.py
================================================
import logging
import unittest.mock
from unittest.mock import patch

from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photos, create_test_user

logger = logging.getLogger(__name__)


class PublicPhotosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_set_my_photos_as_public(self):
        photos = create_test_photos(number_of_photos=3, owner=self.user1)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "val_public": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(3, len(data["results"]))
        self.assertEqual(3, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))

    def test_set_my_photos_as_private(self):
        photos = create_test_photos(number_of_photos=2, owner=self.user1, public=True)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "val_public": False}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(2, len(data["results"]))
        self.assertEqual(2, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))

    def test_set_photos_of_other_user_as_public(self):
        photos = create_test_photos(number_of_photos=2, owner=self.user2)
        image_hashes = [p.image_hash for p in photos]

        payload = {"image_hashes": image_hashes, "val_public": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        # Photos not owned by user are treated as "missing" for security (no info leak)
        self.assertEqual(0, len(data["not_updated"]))

    @patch("api.views.photos.logger.warning", autospec=True)
    def test_tag_nonexistent_photo_as_favorite(self, logger_ext: unittest.mock.Mock):
        payload = {"image_hashes": ["nonexistent_photo"], "val_public": True}
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/makepublic/", format="json", data=payload, headers=headers
        )
        data = response.json()
        logger.debug(data)

        self.assertTrue(data["status"])
        self.assertEqual(0, len(data["results"]))
        self.assertEqual(0, len(data["updated"]))
        self.assertEqual(0, len(data["not_updated"]))
        logger_ext.assert_called_with(
            "Could not set photo nonexistent_photo to public. It does not exist or is not owned by user."
        )


================================================
FILE: api/tests/test_reading_exif.py
================================================
import os

from django.test import TestCase
from django.utils import timezone
from faker import Faker
from rest_framework.test import APIClient

from api.models import File, Person, Photo
from api.tests.utils import create_test_user


class ReadFacesFromPhotosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user(favorite_min_rating=1)
        self.client.force_authenticate(user=self.user1)

    def test_reading_from_photo(self):
        file = os.path.dirname(os.path.abspath(__file__)) + "/fixtures/niaz.jpg"

        exif_file = os.path.dirname(os.path.abspath(__file__)) + "/fixtures/niaz.xmp"

        fake = Faker()
        pk = fake.md5()
        os.system("cp " + file + " " + "/tmp/" + str(pk) + ".jpg")
        # copy exif file to photo and rename it to have the same name as the photo but with .xmp extension
        os.system("cp " + exif_file + " " + "/tmp/" + str(pk) + ".xmp")
        # we need a thumbnail in the thumbnails_big folder
        os.system(
            "cp " + file + " " + "/protected_media/thumbnails_big/" + str(pk) + ".jpg"
        )

        photo = Photo(pk=pk, image_hash=pk, owner=self.user1)
        fileObject = File.create("/tmp/" + str(photo.pk) + ".jpg", self.user1)
        photo.main_file = fileObject
        photo.added_on = timezone.now()
        photo.save()

        # Create thumbnail for the photo
        from api.models.thumbnail import Thumbnail

        Thumbnail.objects.create(
            photo=photo,
            thumbnail_big="/protected_media/thumbnails_big/" + str(photo.pk) + ".jpg",
            aspect_ratio=1.0,
        )

        photo._extract_faces()

        # To Debug Face Extraction: Look at the actual produced thumbnail
        # Thumbnail is wrong at the moment, need to create a correct face tag first, where I know the face is correct
        # output_file = (
        #        os.path.dirname(os.path.abspath(__file__))
        #        + "/fixtures/niaz_face.jpg"
        # )
        # os.system("cp " + "/protected_media/faces/" + str(photo.pk) + "_0.jpg" + " " + output_file)

        self.assertEqual(1, len(photo.faces.all()))
        # One Niaz Faridani-Rad
        self.assertEqual(1, len(Person.objects.all()))
        # There has to be a face encoding
        self.assertIsNotNone(photo.faces.all()[0].encoding)
        self.assertEqual(
            "Niaz Faridani-Rad",
            Person.objects.filter(name="Niaz Faridani-Rad").first().name,
        )


================================================
FILE: api/tests/test_recently_added_photos.py
================================================
from datetime import timedelta
from django.test import TestCase
from django.utils import timezone
from rest_framework.test import APIClient

from api.tests.utils import create_test_photos, create_test_user


class RecentlyAddedPhotosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_retrieve_recently_added_photos(self):
        today = timezone.now()
        before_today = timezone.now() - timedelta(days=1)
        create_test_photos(number_of_photos=3, owner=self.user1, added_on=today)
        create_test_photos(number_of_photos=4, owner=self.user1, added_on=before_today)
        create_test_photos(number_of_photos=5, owner=self.user2, added_on=today)

        response = self.client.get("/api/photos/recentlyadded/")
        json = response.json()

        self.assertEqual(response.status_code, 200)
        self.assertEqual(3, len(json["results"]))

    def test_retrieve_empty_result_when_no_photos(self):
        create_test_photos(number_of_photos=2, owner=self.user2)
        response = self.client.get("/api/photos/recentlyadded/")
        json = response.json()

        self.assertEqual(response.status_code, 200)
        self.assertEqual([], json["results"])
        self.assertIsNone(json["date"])


================================================
FILE: api/tests/test_redetection_idempotency.py
================================================
"""
Tests for re-detection idempotency.

Ensures that running detection multiple times:
- Does not create duplicate stacks
- Does not create duplicate duplicate-groups
- Handles already-processed photos correctly
- Merges with existing groups properly

NOTE: RAW+JPEG pairs and Live Photos are now handled as file variants
during the initial scan (Photo.files ManyToMany field), not as stacks.
This module tests idempotency for:
- Duplicate detection (exact copies, visual duplicates)
- Burst sequence detection
"""

import uuid

from django.test import TestCase
from django.utils import timezone
from rest_framework.test import APIClient, APITestCase

from api.models.duplicate import Duplicate
from api.models.photo_stack import PhotoStack
from api.models.file import File
from api.tests.utils import create_test_photo, create_test_user
from api.duplicate_detection import detect_exact_copies, detect_visual_duplicates
from api.stack_detection import detect_burst_sequences


class DuplicateRedetectionTestCase(TestCase):
    """Test that duplicate detection is idempotent."""

    def setUp(self):
        self.user = create_test_user()

    def test_exact_copy_redetection_no_duplicates(self):
        """Test that running exact copy detection twice doesn't create duplicate groups."""
        # Create photos with same hash (simulating exact copies)
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Set same image_hash to simulate exact copies
        same_hash = "abcdef1234567890abcdef1234567890"
        photo1.image_hash = same_hash
        photo1.save()
        photo2.image_hash = same_hash
        photo2.save()
        
        # First detection
        detect_exact_copies(self.user)
        initial_count = Duplicate.objects.filter(owner=self.user).count()
        
        # Second detection
        detect_exact_copies(self.user)
        final_count = Duplicate.objects.filter(owner=self.user).count()
        
        # Should have same number of groups
        self.assertEqual(initial_count, final_count)

    def test_visual_duplicate_redetection_no_duplicates(self):
        """Test that running visual duplicate detection twice doesn't create duplicate groups."""
        # Create photos with similar perceptual hash
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Set similar perceptual hashes
        photo1.image_phash = "0000000000000000"
        photo1.save()
        photo2.image_phash = "0000000000000001"  # Very similar
        photo2.save()
        
        # First detection
        detect_visual_duplicates(self.user, threshold=10)
        initial_count = Duplicate.objects.filter(owner=self.user).count()
        initial_photo_count = sum(
            d.photos.count() for d in Duplicate.objects.filter(owner=self.user)
        )
        
        # Second detection
        detect_visual_duplicates(self.user, threshold=10)
        final_count = Duplicate.objects.filter(owner=self.user).count()
        final_photo_count = sum(
            d.photos.count() for d in Duplicate.objects.filter(owner=self.user)
        )
        
        # Should have same number of groups and photos
        self.assertEqual(initial_count, final_count)
        self.assertEqual(initial_photo_count, final_photo_count)

    def test_redetection_adds_new_photos_to_existing_group(self):
        """Test that new duplicates are added to existing groups, not new ones."""
        # Create initial duplicate pair
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        same_hash = "abcdef1234567890abcdef1234567890"
        photo1.image_hash = same_hash
        photo1.save()
        photo2.image_hash = same_hash
        photo2.save()
        
        # First detection creates a group
        detect_exact_copies(self.user)
        initial_groups = list(Duplicate.objects.filter(owner=self.user))
        self.assertEqual(len(initial_groups), 1)
        
        # Add a third photo with same hash
        photo3 = create_test_photo(owner=self.user)
        photo3.image_hash = same_hash
        photo3.save()
        
        # Second detection should add to existing group
        detect_exact_copies(self.user)
        final_groups = list(Duplicate.objects.filter(owner=self.user))
        
        # Should still have only one group
        self.assertEqual(len(final_groups), 1)
        # Group should now have 3 photos
        self.assertEqual(final_groups[0].photos.count(), 3)

    def test_redetection_with_resolved_duplicates(self):
        """Test that resolved duplicates are not re-detected."""
        # Create duplicate pair
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        same_hash = "abcdef1234567890abcdef1234567890"
        photo1.image_hash = same_hash
        photo1.save()
        photo2.image_hash = same_hash
        photo2.save()
        
        # First detection
        detect_exact_copies(self.user)
        dup = Duplicate.objects.filter(owner=self.user).first()
        
        # Resolve the duplicate
        dup.resolve(kept_photo=photo1)
        
        # Re-detection
        detect_exact_copies(self.user)
        
        # Should not create a new pending group for resolved duplicates
        _pending_groups = Duplicate.objects.filter(
            owner=self.user,
            review_status=Duplicate.ReviewStatus.PENDING
        ).count()
        
        # Depending on implementation, either 0 new pending groups or existing resolved stays resolved
        resolved_groups = Duplicate.objects.filter(
            owner=self.user,
            review_status=Duplicate.ReviewStatus.RESOLVED
        ).count()
        self.assertGreaterEqual(resolved_groups, 1)


class BurstRedetectionTestCase(TestCase):
    """Test that burst stack detection is idempotent."""

    def setUp(self):
        self.user = create_test_user()

    def test_burst_redetection_no_duplicate_stacks(self):
        """Test that running burst detection twice doesn't create duplicate stacks."""
        # Create photos that look like a burst
        base_time = timezone.now()
        photos = []
        for i in range(3):
            photo = create_test_photo(owner=self.user)
            photo.exif_timestamp = base_time + timezone.timedelta(milliseconds=100 * i)
            photo.main_file.path = f"/photos/IMG_001_{i}.JPG"
            photo.main_file.save()
            photo.save()
            photos.append(photo)
        
        # First detection
        detect_burst_sequences(self.user)
        initial_stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        ).count()
        
        # Second detection
        detect_burst_sequences(self.user)
        final_stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        ).count()
        
        # Should have same number of stacks
        self.assertEqual(initial_stacks, final_stacks)

    def test_redetection_adds_new_photos_to_existing_stack(self):
        """Test that new photos are added to existing stacks."""
        # Create initial burst pair
        base_time = timezone.now()
        
        photo1 = create_test_photo(owner=self.user)
        photo1.exif_timestamp = base_time
        photo1.main_file.path = "/photos/burst_001.jpg"
        photo1.main_file.save()
        photo1.save()
        
        photo2 = create_test_photo(owner=self.user)
        photo2.exif_timestamp = base_time + timezone.timedelta(milliseconds=100)
        photo2.main_file.path = "/photos/burst_002.jpg"
        photo2.main_file.save()
        photo2.save()
        
        # First detection
        detect_burst_sequences(self.user)
        _initial_stacks = list(PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        ))
        
        # Add a third photo to the burst
        photo3 = create_test_photo(owner=self.user)
        photo3.exif_timestamp = base_time + timezone.timedelta(milliseconds=200)
        photo3.main_file.path = "/photos/burst_003.jpg"
        photo3.main_file.save()
        photo3.save()
        
        # Second detection should add to existing stack
        detect_burst_sequences(self.user)
        _final_stacks = list(PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE
        ))
        
        # Stack count may vary based on implementation
        # The key is no duplicate photos in stacks


class APIRedetectionTestCase(APITestCase):
    """Test re-detection through API endpoints."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        
        # Create some test photos
        for _ in range(5):
            create_test_photo(owner=self.user)

    def test_duplicate_detect_api_idempotent(self):
        """Test that calling /api/duplicates/detect multiple times is safe."""
        # First detection
        response1 = self.client.post("/api/duplicates/detect")
        self.assertIn(response1.status_code, [200, 202])
        
        # Second detection
        response2 = self.client.post("/api/duplicates/detect")
        self.assertIn(response2.status_code, [200, 202])
        
        # Third detection
        response3 = self.client.post("/api/duplicates/detect")
        self.assertIn(response3.status_code, [200, 202])

    def test_stack_detect_api_idempotent(self):
        """Test that calling /api/stacks/detect multiple times is safe."""
        # First detection
        response1 = self.client.post("/api/stacks/detect")
        self.assertIn(response1.status_code, [200, 202])
        
        # Second detection
        response2 = self.client.post("/api/stacks/detect")
        self.assertIn(response2.status_code, [200, 202])
        
        # Third detection
        response3 = self.client.post("/api/stacks/detect")
        self.assertIn(response3.status_code, [200, 202])

    def test_duplicate_detect_with_clear_pending(self):
        """Test detection with clear_pending option."""
        # Create a duplicate
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo1.image_hash = photo2.image_hash = "samehash123456789012345678901234"
        photo1.save()
        photo2.save()
        
        # First detection
        response1 = self.client.post(
            "/api/duplicates/detect",
            {"clear_pending": False},
            format="json"
        )
        self.assertIn(response1.status_code, [200, 202])
        
        # Detection with clear_pending
        response2 = self.client.post(
            "/api/duplicates/detect",
            {"clear_pending": True},
            format="json"
        )
        self.assertIn(response2.status_code, [200, 202])


class PhotoInMultipleGroupsRedetectionTestCase(TestCase):
    """Test re-detection when photos are in multiple groups."""

    def setUp(self):
        self.user = create_test_user()

    def test_photo_already_in_stack_not_duplicated(self):
        """Test that a photo already in a stack isn't added again."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        
        # Create a manual stack
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        initial_photo_count = stack.photos.count()
        
        # Try to add the same photos through create_or_merge
        PhotoStack.create_or_merge(
            photos=photos,
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        
        # Should not have duplicated photos in the stack
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), initial_photo_count)

    def test_duplicate_group_photos_not_duplicated(self):
        """Test that photos already in a duplicate group aren't added again."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        
        # Create a duplicate group
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup.photos.add(*photos)
        
        initial_photo_count = dup.photos.count()
        
        # Try to add the same photos through create_or_merge
        Duplicate.create_or_merge(
            photos=photos,
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        # Should have merged, not duplicated
        final_groups = Duplicate.objects.filter(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        total_photos = sum(g.photos.count() for g in final_groups)
        self.assertEqual(total_photos, initial_photo_count)


class ClearExistingGroupsTestCase(TestCase):
    """Test clearing existing groups before re-detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_clear_pending_duplicates(self):
        """Test that clear_pending removes pending duplicates."""
        # Create a pending duplicate
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        dup.photos.add(*photos)
        
        # There should be one pending
        self.assertEqual(
            Duplicate.objects.filter(
                owner=self.user,
                review_status=Duplicate.ReviewStatus.PENDING
            ).count(),
            1
        )
        
        # Clear pending duplicates
        Duplicate.objects.filter(
            owner=self.user,
            review_status=Duplicate.ReviewStatus.PENDING
        ).delete()
        
        # Now there should be none
        self.assertEqual(
            Duplicate.objects.filter(
                owner=self.user,
                review_status=Duplicate.ReviewStatus.PENDING
            ).count(),
            0
        )

    def test_clear_pending_preserves_resolved(self):
        """Test that clearing pending doesn't affect resolved duplicates."""
        photos1 = [create_test_photo(owner=self.user) for _ in range(2)]
        photos2 = [create_test_photo(owner=self.user) for _ in range(2)]
        
        # Create pending and resolved duplicates
        pending_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
        )
        pending_dup.photos.add(*photos1)
        
        resolved_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
        )
        resolved_dup.photos.add(*photos2)
        
        # Clear only pending
        Duplicate.objects.filter(
            owner=self.user,
            review_status=Duplicate.ReviewStatus.PENDING
        ).delete()
        
        # Resolved should still exist
        self.assertTrue(
            Duplicate.objects.filter(pk=resolved_dup.pk).exists()
        )
        
        # Pending should be gone
        self.assertFalse(
            Duplicate.objects.filter(pk=pending_dup.pk).exists()
        )


class MergeOnRedetectionTestCase(TestCase):
    """Test that overlapping groups are merged on re-detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_overlapping_stacks_merged(self):
        """Test that overlapping stacks are merged."""
        photos = [create_test_photo(owner=self.user) for _ in range(4)]
        
        # Create two overlapping stacks
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack1.photos.add(photos[0], photos[1], photos[2])  # 0, 1, 2
        
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2.photos.add(photos[1], photos[2], photos[3])  # 1, 2, 3 (overlaps)
        
        # Using create_or_merge should merge these
        merged = PhotoStack.create_or_merge(
            photos=[photos[0], photos[1], photos[2], photos[3]],
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        
        # Should have merged into one stack with all photos
        self.assertIsNotNone(merged)

    def test_overlapping_duplicates_merged(self):
        """Test that overlapping duplicate groups are merged."""
        photos = [create_test_photo(owner=self.user) for _ in range(4)]
        
        # Create two overlapping duplicate groups
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup1.photos.add(photos[0], photos[1], photos[2])
        
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup2.photos.add(photos[1], photos[2], photos[3])
        
        # Using create_or_merge should merge these
        merged = Duplicate.create_or_merge(
            photos=[photos[0], photos[1], photos[2], photos[3]],
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        
        # Should have merged
        self.assertIsNotNone(merged)


class FileVariantsIdempotencyTestCase(TestCase):
    """
    Test that file variants (RAW+JPEG, Live Photos) are handled idempotently.
    
    File variants are now stored via Photo.files ManyToMany field, not as stacks.
    This is handled during the scan process in directory_watcher.py.
    """

    def setUp(self):
        self.user = create_test_user()

    def test_photo_with_multiple_file_variants(self):
        """Test that a photo can have multiple file variants."""

        # Create a photo (create_test_photo adds its own file)
        photo = create_test_photo(owner=self.user)

        # Clear any existing files and set up fresh
        photo.files.clear()

        # Use unique hashes to avoid any collision with other tests
        unique_suffix = str(uuid.uuid4())[:8]

        # Create a JPEG file
        jpeg_file = File.objects.create(
            hash=f"jpeg_{unique_suffix}" + "a" * 20,
            path=f"/photos/IMG_001_{unique_suffix}.jpg",
            type=File.IMAGE,
        )
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)
        photo.save()

        # Add a RAW file variant
        raw_file = File.objects.create(
            hash=f"raw_{unique_suffix}" + "b" * 21,
            path=f"/photos/IMG_001_{unique_suffix}.CR2",
            type=File.RAW_FILE,
        )
        photo.files.add(raw_file)

        # Photo should have 2 file variants
        self.assertEqual(photo.files.count(), 2)

        # Verify both files are present
        file_paths = set(photo.files.values_list('path', flat=True))
        self.assertIn(f"/photos/IMG_001_{unique_suffix}.jpg", file_paths)
        self.assertIn(f"/photos/IMG_001_{unique_suffix}.CR2", file_paths)

    def test_file_variant_types(self):
        """Test that we can identify file variant types."""
        photo = create_test_photo(owner=self.user)
        
        # Clear existing files
        photo.files.clear()
        
        # Add JPEG
        jpeg_file = File.objects.create(
            hash="jpeg" + "a" * 28,
            path="/photos/IMG_001.jpg",
            type=File.IMAGE,
        )
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)
        
        # Add RAW
        raw_file = File.objects.create(
            hash="raw" + "b" * 29,
            path="/photos/IMG_001.CR2",
            type=File.RAW_FILE,
        )
        photo.files.add(raw_file)
        
        # Add video for Live Photo
        video_file = File.objects.create(
            hash="video" + "c" * 27,
            path="/photos/IMG_001.mov",
            type=File.VIDEO,
        )
        photo.files.add(video_file)
        photo.save()
        
        # Check file types
        file_types = set(photo.files.values_list('type', flat=True))
        self.assertIn(File.IMAGE, file_types)
        self.assertIn(File.RAW_FILE, file_types)
        self.assertIn(File.VIDEO, file_types)

    def test_has_raw_variant(self):
        """Test detecting if a photo has a RAW file variant."""
        photo = create_test_photo(owner=self.user)
        
        # Clear existing files
        photo.files.clear()
        
        # Add JPEG
        jpeg_file = File.objects.create(
            hash="jpeg" + "a" * 28,
            path="/photos/IMG_001.jpg",
            type=File.IMAGE,
        )
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)
        
        # Initially no RAW
        has_raw = photo.files.filter(type=File.RAW_FILE).exists()
        self.assertFalse(has_raw)
        
        # Add RAW
        raw_file = File.objects.create(
            hash="raw" + "b" * 29,
            path="/photos/IMG_001.CR2",
            type=File.RAW_FILE,
        )
        photo.files.add(raw_file)
        
        # Now has RAW
        has_raw = photo.files.filter(type=File.RAW_FILE).exists()
        self.assertTrue(has_raw)

    def test_has_video_variant_live_photo(self):
        """Test detecting if a photo has a video variant (Live Photo)."""
        photo = create_test_photo(owner=self.user)
        
        # Clear existing files
        photo.files.clear()
        
        # Add image
        image_file = File.objects.create(
            hash="image" + "a" * 27,
            path="/photos/IMG_001.heic",
            type=File.IMAGE,
        )
        photo.main_file = image_file
        photo.files.add(image_file)
        
        # Initially no video
        has_video = photo.files.filter(type=File.VIDEO).exists()
        self.assertFalse(has_video)
        
        # Add video for Live Photo
        video_file = File.objects.create(
            hash="video" + "b" * 27,
            path="/photos/IMG_001.mov",
            type=File.VIDEO,
        )
        photo.files.add(video_file)
        
        # Now has video
        has_video = photo.files.filter(type=File.VIDEO).exists()
        self.assertTrue(has_video)


================================================
FILE: api/tests/test_regenerate_titles.py
================================================
from datetime import datetime

import pytz
from django.test import TestCase

from api.models import AlbumAuto, User


class RegenerateTitlesTestCase(TestCase):
    def test_regenerate_titles(self):
        admin = User.objects.create_superuser(
            "test_admin", "test_admin@test.com", "test_password"
        )
        album_auto = AlbumAuto.objects.create(
            timestamp=datetime.strptime("2022-01-02", "%Y-%m-%d").replace(
                tzinfo=pytz.utc
            ),
            created_on=datetime.strptime("2022-01-02", "%Y-%m-%d").replace(
                tzinfo=pytz.utc
            ),
            owner=admin,
        )
        album_auto._generate_title()
        self.assertEqual(album_auto.title, "Sunday")


================================================
FILE: api/tests/test_retrieve_photo.py
================================================
from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photo, create_test_user


class RetrievePhotoTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.admin = create_test_user(is_admin=True)
        self.user = create_test_user()

    def test_should_retrieve_my_photo(self):
        self.client.force_authenticate(user=self.user)
        photo = create_test_photo(owner=self.user)

        headers = {"Content-Type": "application/json"}
        response = self.client.get(
            f"/api/photos/{photo.image_hash}/",
            format="json",
            headers=headers,
        )

        self.assertEqual(200, response.status_code)

    def test_should_not_retrieve_other_user_photo(self):
        self.client.force_authenticate(user=self.user)
        photo = create_test_photo(owner=self.admin)

        headers = {"Content-Type": "application/json"}
        response = self.client.get(
            f"/api/photos/{photo.image_hash}/",
            format="json",
            headers=headers,
        )

        # Returns 404 instead of 403 to avoid leaking existence of other users' photos
        self.assertEqual(404, response.status_code)

    def test_anonymous_user_should_retrieve_public_photo(self):
        self.client.force_authenticate(None)
        photo = create_test_photo(owner=self.user, public=True)

        headers = {"Content-Type": "application/json"}
        response = self.client.get(
            f"/api/photos/{photo.image_hash}/",
            format="json",
            headers=headers,
        )

        self.assertEqual(200, response.status_code)

    def test_anonymous_user_should_not_retrieve_private_photo(self):
        self.client.force_authenticate(None)
        photo = create_test_photo(owner=self.user, public=False)

        headers = {"Content-Type": "application/json"}
        response = self.client.get(
            f"/api/photos/{photo.image_hash}/",
            format="json",
            headers=headers,
        )

        self.assertEqual(404, response.status_code)


================================================
FILE: api/tests/test_scan_percentage_bug.py
================================================
import os
import tempfile
import uuid
from unittest.mock import MagicMock, patch

from django.test import TestCase  # type: ignore

from api.directory_watcher import handle_new_image, scan_photos
from api.models import LongRunningJob, User


class ScanPercentageProgressTestCase(TestCase):
    def setUp(self):
        self.user = User.objects.create_user(
            username="testuser",
            password="testpass",
        )
        self.user.skip_raw_files = True
        self.user.save()
        self.job_id = uuid.uuid4()

    def _scan_file_list(self):
        return (
            [f"photo{i}.jpg" for i in range(10)]
            + [f"photo{i}.raw" for i in range(7)]
            + [f"photo{i}.xmp" for i in range(10)]
            + [f"document{i}.pdf" for i in range(10)]
        )

    def _simulate_pre_fix_progress(self, files):
        images_and_videos: list[str] = []
        metadata_paths: list[str] = []
        for path in files:
            if path.endswith(".xmp"):
                metadata_paths.append(path)
            else:
                images_and_videos.append(path)

        processed = 0
        for path in images_and_videos:
            ext = os.path.splitext(path)[1].lower()
            if ext == ".raw" and self.user.skip_raw_files:
                continue
            if ext == ".pdf":
                continue
            if ext == ".jpg":
                processed += 1
        processed += len(metadata_paths)
        return processed

    def test_scan_progress_counts_every_discovered_file(self):
        """Ensure the scan job reaches 100% even when files are skipped or metadata."""

        files = self._scan_file_list()
        pre_fix_processed = self._simulate_pre_fix_progress(files)
        pre_fix_percentage = (pre_fix_processed / len(files)) * 100
        _pre_fix_summary = (
            f"Pre-fix simulated progress: {pre_fix_processed}/{len(files)} "
            f"({pre_fix_percentage:.1f}%) -> stuck"
        )
        discovered_by_ext: dict[str, int] = {}
        for path in files:
            ext = os.path.splitext(path)[1].lower()
            discovered_by_ext[ext] = discovered_by_ext.get(ext, 0) + 1
        lrj = LongRunningJob.objects.create(
            started_by=self.user,
            job_id=self.job_id,
            job_type=LongRunningJob.JOB_SCAN_PHOTOS,
            progress_current=0,
            progress_target=len(files),
        )

        photos_created_by_ext: dict[str, int] = {}

        def mock_create_new_image(user, path):
            ext = os.path.splitext(path)[1].lower()
            if ext == ".jpg":
                photos_created_by_ext[ext] = photos_created_by_ext.get(ext, 0) + 1
                return MagicMock()
            photos_created_by_ext[ext] = photos_created_by_ext.get(ext, 0)
            return None

        thumbnail_mock = MagicMock()
        thumbnail_mock._generate_thumbnail.return_value = None
        thumbnail_mock._calculate_aspect_ratio.return_value = None
        thumbnail_mock._get_dominant_color.return_value = None
        search_instance_mock = MagicMock()

        with (
            patch(
                "api.directory_watcher.create_new_image",
                side_effect=mock_create_new_image,
            ),
            patch(
                "api.models.Thumbnail.objects.get_or_create",
                return_value=(thumbnail_mock, True),
            ),
            patch(
                "api.models.PhotoSearch.objects.get_or_create",
                return_value=(search_instance_mock, True),
            ),
        ):
            for path in files:
                handle_new_image(self.user, path, self.job_id)

        lrj.refresh_from_db()
        percentage = (
            (lrj.progress_current / lrj.progress_target) * 100
            if lrj.progress_target
            else 0
        )
        file_breakdown = ["File breakdown:"]
        for ext, total in sorted(discovered_by_ext.items()):
            created = photos_created_by_ext.get(ext, 0)
            behavior = "creates Photo" if created else "skipped"
            file_breakdown.append(
                f" - {ext}: discovered={total}, create_new_image={behavior}"
            )
        breakdown_summary = "\n".join(file_breakdown)
        progress_summary = (
            f"Scan job progress: {lrj.progress_current}/{lrj.progress_target} "
            f"({percentage:.1f}%) finished={lrj.finished}"
        )

        self.assertLess(
            pre_fix_processed,
            len(files),
            "Pre-fix simulation should demonstrate the bug (progress < total).",
        )
        self.assertEqual(lrj.progress_target, len(files), progress_summary)
        self.assertEqual(
            lrj.progress_current,
            len(files),
            f"{breakdown_summary}\n{progress_summary} -> Every discovered file should advance the counter.",
        )
        self.assertTrue(
            lrj.finished,
            f"{breakdown_summary}\n{progress_summary} -> Scan job must finish when current equals target.",
        )


class EmptyDirectoryScanTestCase(TestCase):
    """Test that scanning an empty directory completes correctly."""

    def setUp(self):
        self.user = User.objects.create_user(
            username="empty_scan_testuser",
            password="testpass",
        )
        # Create a temporary empty directory for testing
        self.temp_dir = tempfile.mkdtemp()
        self.user.scan_directory = self.temp_dir
        self.user.save()
        self.job_id = uuid.uuid4()

    def tearDown(self):
        # Clean up temp directory
        import shutil

        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_empty_directory_scan_completes_successfully(self):
        """Ensure scanning an empty directory finishes with 0/0 progress."""
        # Verify directory is empty
        self.assertEqual(
            len(os.listdir(self.temp_dir)),
            0,
            "Test directory should be empty",
        )

        # Mock db.connections.close_all() to prevent closing test DB connection
        # Mock AsyncTask to prevent background task issues in tests
        with (
            patch("api.directory_watcher.scan_jobs.db.connections.close_all"),
            patch("api.directory_watcher.scan_jobs.AsyncTask"),
            patch("api.directory_watcher.scan_jobs.Chain"),
        ):
            # Run the scan
            scan_photos(
                self.user,
                full_scan=True,
                job_id=self.job_id,
                scan_directory=self.temp_dir,
            )

        # Check job status
        job = LongRunningJob.objects.get(job_id=self.job_id)

        self.assertEqual(
            job.progress_target,
            0,
            "Empty directory should have progress_target=0",
        )
        self.assertEqual(
            job.progress_current,
            0,
            "Empty directory should have progress_current=0",
        )
        self.assertTrue(
            job.finished,
            "Empty directory scan should be marked as finished",
        )
        self.assertFalse(
            job.failed,
            "Empty directory scan should not be marked as failed",
        )


================================================
FILE: api/tests/test_scan_photos.py
================================================
import os
from unittest import skip

from django.test import TestCase
from pyfakefs.fake_filesystem_unittest import Patcher
from rest_framework.test import APIClient

from api.tests.utils import create_test_user

# get path to test images
test_images_path = os.path.join(os.path.dirname(__file__), "test_images")


@skip
class ScanPhotosTestCase(TestCase):
    def setUp(self):
        with Patcher() as patcher:
            samplephotos_dir = "/data/samplephotos"
            # add dependencies
            patcher.fs.add_real_directory("/usr/local/lib/python3.11/dist-packages/")
            patcher.fs.add_real_directory(
                test_images_path, target_path=samplephotos_dir
            )
            self.client_admin = APIClient()
            self.admin = create_test_user(is_admin=True)
            self.client_admin.force_authenticate(self.admin)

            response = self.client_admin.patch(
                f"/api/manage/user/{self.admin.id}/",
                {"scan_directory": samplephotos_dir},
            )

            self.assertEqual(response.status_code, 200)
            self.assertEqual(response.json()["scan_directory"], samplephotos_dir)

            # scan photos
            scan_photos_res = self.client_admin.get("/api/scanphotos/")
            self.assertEqual(scan_photos_res.status_code, 200)

            # make sure photos are imported
            get_photos_res = self.client_admin.get("/api/photos/")
            self.assertEqual(get_photos_res.status_code, 200)
            self.assertGreater(len(get_photos_res.json()["results"]), 0)

            # try scanning again and make sure there are no duplicate imports
            num_photos = len(get_photos_res.json()["results"])
            scan_photos_res = self.client_admin.get("/api/scanphotos/")
            self.assertEqual(scan_photos_res.status_code, 200)

            get_photos_res = self.client_admin.get("/api/photos/")
            self.assertEqual(get_photos_res.status_code, 200)
            self.assertEqual(len(get_photos_res.json()["results"]), num_photos)

    def test_setup(self):
        """Make sure setup works"""
        pass

    @skip
    def test_auto_albums(self):
        """Make sure user can make auto albums, list and retrieve them"""
        # make auto albums
        auto_album_gen_res = self.client_admin.get("/api/autoalbumgen/")
        self.assertEqual(auto_album_gen_res.status_code, 200)

        # make sure auto albums are there
        auto_album_list_res = self.client_admin.get("/api/albums/auto/list/")
        self.assertEqual(auto_album_list_res.status_code, 200)

        # make sure user can retrieve each auto album
        for album in auto_album_list_res.json()["results"]:
            auto_album_retrieve_res = self.client_admin.get(
                "/api/albums/auto/%d/" % album["id"]
            )
            self.assertEqual(auto_album_retrieve_res.status_code, 200)
            self.assertGreater(len(auto_album_retrieve_res.json()["photos"]), 0)

        # try making auto albums again and make sure there are no duplicates
        num_auto_albums = len(auto_album_list_res.json()["results"])

        auto_album_gen_res = self.client_admin.get("/api/autoalbumgen/")
        self.assertEqual(auto_album_gen_res.status_code, 200)

        auto_album_list_res = self.client_admin.get("/api/albums/auto/list/")
        self.assertEqual(len(auto_album_list_res.json()["results"]), num_auto_albums)

    @skip
    def test_place_albums(self):
        """Make sure user can list and retrieve place albums"""
        place_album_list_res = self.client_admin.get("/api/albums/place/list/")
        self.assertEqual(place_album_list_res.status_code, 200)

        for album in place_album_list_res.json()["results"]:
            place_album_retrieve_res = self.client_admin.get(
                "/api/albums/place/%d/" % album["id"]
            )
            self.assertEqual(place_album_retrieve_res.status_code, 200)

    @skip
    def test_thing_albums(self):
        """Make sure user can list and retrieve thing albums"""
        thing_album_list_res = self.client_admin.get("/api/albums/thing/list/")
        self.assertEqual(thing_album_list_res.status_code, 200)

        for album in thing_album_list_res.json()["results"]:
            thing_album_retrieve_res = self.client_admin.get(
                "/api/albums/thing/%d/" % album["id"]
            )
            self.assertEqual(thing_album_retrieve_res.status_code, 200)


================================================
FILE: api/tests/test_scan_photos_directories.py
================================================
import os
import tempfile
import uuid
from unittest.mock import patch

from django.test import TestCase, override_settings

from api.directory_watcher import scan_photos
from api.tests.utils import create_test_user


class DummyAsyncTask:
    def __init__(self, *args, **kwargs):
        pass

    def run(self):
        return None


class DummyChain:
    def __init__(self, *args, **kwargs):
        self.appended = []

    def append(self, *args, **kwargs):
        self.appended.append((args, kwargs))
        return self

    def run(self):
        return None


class ScanPhotosDirectoryCreationTest(TestCase):
    def test_existing_thumbnail_directory_does_not_raise(self):
        user = create_test_user()
        with tempfile.TemporaryDirectory() as media_root:
            preexisting_dir = os.path.join(media_root, "square_thumbnails_small")
            os.makedirs(preexisting_dir, exist_ok=True)

            user.scan_directory = media_root
            user.save(update_fields=["scan_directory"])

            with override_settings(MEDIA_ROOT=media_root):
                with (
                    patch("api.directory_watcher.scan_jobs.walk_directory"),
                    patch("api.directory_watcher.scan_jobs.walk_files"),
                    patch("api.directory_watcher.scan_jobs.photo_scanner"),
                    patch("api.directory_watcher.scan_jobs.AsyncTask", DummyAsyncTask),
                    patch("api.directory_watcher.scan_jobs.Chain", DummyChain),
                    patch("api.directory_watcher.scan_jobs.db.connections.close_all"),
                ):
                    scan_photos(user, full_scan=False, job_id=str(uuid.uuid4()))

            expected_directories = [
                "square_thumbnails_small",
                "square_thumbnails",
                "thumbnails_big",
            ]
            for directory_name in expected_directories:
                directory_path = os.path.join(media_root, directory_name)
                self.assertTrue(
                    os.path.isdir(directory_path),
                    msg=f"Expected directory {directory_path} to exist",
                )


================================================
FILE: api/tests/test_search_term_examples.py
================================================
from django.test import TestCase
from rest_framework.test import APIClient

from api.api_util import get_search_term_examples
from api.tests.utils import create_test_photo, create_test_user


class SearchTermExamplesTest(TestCase):
    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_get_search_term_examples_with_captions(self):
        """Test that get_search_term_examples works after caption refactoring"""
        # Create a photo with captions and geolocation
        photo = create_test_photo(owner=self.user)

        # Add geolocation data to avoid the NoneType error
        photo.geolocation_json = {
            "features": [
                {"text": "New York"},
                {"text": "USA"},
                {"text": "North America"},
            ]
        }
        photo.save()

        # Add some caption data through the new PhotoCaption model
        from api.models.photo_caption import PhotoCaption

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.captions_json = {
            "places365": {
                "categories": ["outdoor", "nature"],
                "attributes": ["sunny", "green"],
            },
            "im2txt": "A beautiful landscape",
            "user_caption": "My vacation photo",
        }
        caption_instance.save()

        # This should not raise a FieldError
        search_terms = get_search_term_examples(self.user)

        # Should return some search terms
        self.assertIsInstance(search_terms, list)

    def test_get_search_term_examples_with_empty_captions(self):
        """Test that get_search_term_examples works with empty captions"""
        # Create a photo without captions
        photo = create_test_photo(owner=self.user)

        # Add geolocation data
        photo.geolocation_json = {
            "features": [
                {"text": "Miami"},
                {"text": "Florida"},
                {"text": "USA"},
            ]
        }
        photo.save()

        # Add empty caption data
        from api.models.photo_caption import PhotoCaption

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.captions_json = {
            "places365": {
                "categories": [],
                "attributes": [],
            },
            "im2txt": "",
            "user_caption": "",
        }
        caption_instance.save()

        # This should not raise a FieldError
        search_terms = get_search_term_examples(self.user)

        # Should return some search terms (may be empty)
        self.assertIsInstance(search_terms, list)

    def test_search_term_examples_api_endpoint(self):
        """Test the API endpoint that calls get_search_term_examples"""
        # Create a photo with captions and geolocation
        photo = create_test_photo(owner=self.user)

        # Add geolocation data
        photo.geolocation_json = {"features": [{"text": "Paris"}, {"text": "France"}]}
        photo.save()

        # Add some caption data
        from api.models.photo_caption import PhotoCaption

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        caption_instance.captions_json = {
            "places365": {"categories": ["outdoor"], "attributes": ["sunny"]}
        }
        caption_instance.save()

        # Test the API endpoint
        response = self.client.get("/api/searchtermexamples/")

        # Should not return 500 error
        self.assertEqual(response.status_code, 200)
        # The API returns a dict with 'results' key containing the list
        self.assertIn("results", response.data)
        self.assertIsInstance(response.data["results"], list)


================================================
FILE: api/tests/test_search_terms.py
================================================
import random

from django.test import TestCase

from api.api_util import get_search_term_examples
from api.models import Photo
from api.tests.fixtures.api_util.captions_json import captions_json
from api.tests.fixtures.geocode.expectations.mapbox import expectations
from api.tests.utils import (
    create_test_photos,
    create_test_photos_with_faces,
    create_test_user,
)


class GetSearchTermExamples(TestCase):
    def setUp(self) -> None:
        self.admin = create_test_user(is_admin=True)
        self.photos = (
            create_test_photos(
                90,
                owner=self.admin,
                geolocation_json=expectations[0],
                captions_json=captions_json,
                exif_timestamp="2017-08-18 15:08:09.000000 +00:00",
            )
            + create_test_photos(
                5,
                owner=self.admin,
                geolocation_json={},
                captions_json={"places365": None},
            )
            + create_test_photos_with_faces(
                5,
                owner=self.admin,
                geolocation_json=expectations[0],
                captions_json={"places365": None},
            )
        )
        self._original__random_random = random.random
        self._original__random_choices = random.choices
        self._original__random_choice = random.choice
        self._original__random_shuffle = random.shuffle
        random.choices = lambda x, **kw: x
        random.choice = lambda x: x[0]
        random.shuffle = lambda x: x

    def tearDown(self) -> None:
        random.random = self._original__random_random
        random.choices = self._original__random_choices
        random.choice = self._original__random_choice
        random.shuffle = self._original__random_shuffle

    def test_get_search_term_examples_0(self):
        random.random = lambda: 0
        array = get_search_term_examples(self.admin)
        self.assertEqual(len(array), 3)
        self.assertEqual(set(array), {"phone booth", "2017", "Beach Road"})

    def test_get_search_term_examples_2(self):
        random.random = lambda: 0.5
        array = get_search_term_examples(self.admin)
        self.assertEqual(len(array), 4)
        self.assertEqual(
            set(array),
            {
                "2017",
                "Beach Road 2017",
                "Beach Road",
                "phone booth",
            },
        )

    def test_get_search_term_examples_3(self):
        random.random = lambda: 1
        array = get_search_term_examples(self.admin)
        self.assertEqual(len(array), 7)
        self.assertEqual(
            set(array),
            {
                "2017 phone booth",
                "2017",
                "Beach Road  2017 phone booth",
                "Beach Road 2017",
                "Beach Road phone booth",
                "Beach Road",
                "phone booth",
            },
        )

    def test_get_search_term_examples_without_photos(self):
        Photo.objects.all().delete()
        array = get_search_term_examples(self.admin)
        self.assertEqual(len(array), 5)
        self.assertEqual(
            set(array),
            {
                "for time",
                "for places",
                "for people",
                "for file path or file name",
                "for things",
            },
        )


================================================
FILE: api/tests/test_services.py
================================================
"""Tests for CPU architecture detection and service compatibility checks"""
import unittest
from unittest.mock import patch

from api.services import check_cpu_features, has_required_cpu_features, _is_arm_architecture


class TestServiceCPUCompatibility(unittest.TestCase):
    """Test CPU feature detection and compatibility checks"""

    # Constants for testing
    ARM_ARCHITECTURES = ['aarch64', 'arm64', 'armv7l', 'armv8']
    X86_ARCHITECTURES = ['x86_64', 'i686', 'i386', 'AMD64']

    @patch('api.services.platform.machine')
    def test_is_arm_architecture_detection(self, mock_machine):
        """Test that _is_arm_architecture helper correctly identifies ARM architectures"""
        # Test lowercase ARM architectures
        for arch in self.ARM_ARCHITECTURES:
            mock_machine.return_value = arch
            self.assertTrue(_is_arm_architecture(), f"Should detect {arch} as ARM")
        
        # Test case-insensitive detection
        for arch in ['AARCH64', 'ARM64', 'AArch64']:
            mock_machine.return_value = arch
            self.assertTrue(_is_arm_architecture(), f"Should detect {arch} as ARM (case-insensitive)")
        
        # Test x86 architectures are not detected as ARM
        for arch in self.X86_ARCHITECTURES:
            mock_machine.return_value = arch
            self.assertFalse(_is_arm_architecture(), f"Should not detect {arch} as ARM")

    @patch('api.services.platform.machine')
    def test_check_cpu_features_on_arm(self, mock_machine):
        """Test that ARM architectures skip x86 CPU feature checks"""
        for arch in self.ARM_ARCHITECTURES:
            mock_machine.return_value = arch
            features = check_cpu_features()
            # On ARM, should return empty list as x86 features don't apply
            self.assertEqual(features, [], f"Expected empty list for {arch}")

    @patch('api.services.platform.machine')
    def test_check_cpu_features_on_x86(self, mock_machine):
        """Test that x86 architectures attempt to check CPU features"""
        for arch in self.X86_ARCHITECTURES:
            mock_machine.return_value = arch
            # Should not return early, will try to import cpuinfo
            # We can't easily test the cpuinfo part without mocking more
            features = check_cpu_features()
            # Should be a list (may be empty if cpuinfo not available)
            self.assertIsInstance(features, list, f"Expected list for {arch}")

    @patch('api.services.platform.machine')
    def test_has_required_cpu_features_on_arm(self, mock_machine):
        """Test that ARM architectures bypass x86-specific CPU checks"""
        mock_machine.return_value = 'aarch64'
        
        # LLM service has CPU requirements, but should be allowed on ARM
        result = has_required_cpu_features('llm')
        self.assertTrue(result, "LLM service should be compatible on ARM")

    @patch('api.services.platform.machine')
    def test_has_required_cpu_features_no_requirements(self, mock_machine):
        """Test services without CPU requirements are always compatible"""
        mock_machine.return_value = 'x86_64'
        
        # Service without requirements should always return True
        result = has_required_cpu_features('thumbnail')
        self.assertTrue(result, "Services without requirements should be compatible")

    @patch('api.services.platform.machine')
    @patch('api.services.check_cpu_features')
    def test_has_required_cpu_features_on_x86_with_features(self, mock_features, mock_machine):
        """Test x86 with required features present"""
        mock_machine.return_value = 'x86_64'
        mock_features.return_value = ['avx', 'avx2', 'sse4_2', 'fma', 'f16c']
        
        result = has_required_cpu_features('llm')
        self.assertTrue(result, "Should be compatible when all features present")

    @patch('api.services.platform.machine')
    @patch('api.services.check_cpu_features')
    def test_has_required_cpu_features_on_x86_missing_required(self, mock_features, mock_machine):
        """Test x86 missing required features"""
        mock_machine.return_value = 'x86_64'
        mock_features.return_value = []  # No features available
        
        result = has_required_cpu_features('llm')
        self.assertFalse(result, "Should be incompatible when required features missing")

    @patch('api.services.platform.machine')
    @patch('api.services.check_cpu_features')
    def test_has_required_cpu_features_on_x86_missing_recommended(self, mock_features, mock_machine):
        """Test x86 with required features but missing recommended ones"""
        mock_machine.return_value = 'x86_64'
        # Has required but not recommended
        mock_features.return_value = ['avx', 'sse4_2']
        
        result = has_required_cpu_features('llm')
        self.assertTrue(result, "Should be compatible with required features even if missing recommended")


================================================
FILE: api/tests/test_setup_directory.py
================================================
from django.test import TestCase
from rest_framework.test import APIClient

from api.models import User
from api.tests.utils import create_password


class SetupDirectoryTestCase(TestCase):
    userid = 0

    def setUp(self):
        self.client = APIClient()
        self.admin = User.objects.create_superuser(
            "test_admin", "test_admin@test.com", create_password()
        )

    def test_setup_directory(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.patch(
            f"/api/manage/user/{self.admin.id}/",
            {"scan_directory": "/data"},
        )
        self.assertEqual(response.status_code, 200)

    def test_setup_not_existing_directory(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.patch(
            f"/api/manage/user/{self.admin.id}/",
            {"scan_directory": "/non-existent-directory"},
        )
        self.assertEqual(response.status_code, 400)
        # Check for the error message in the new format
        data = response.json()
        self.assertIn("errors", data)
        self.assertGreater(len(data["errors"]), 0)
        self.assertEqual(
            data["errors"][0]["message"], "Scan directory must be inside the data root."
        )


================================================
FILE: api/tests/test_share_photos.py
================================================
import logging
from unittest import skip

from django.test import TestCase
from rest_framework.test import APIClient

from api.models import Photo
from api.tests.utils import create_test_photos, create_test_user, share_test_photos

logger = logging.getLogger(__name__)


class SharePhotosTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user1 = create_test_user()
        self.user2 = create_test_user()
        self.client.force_authenticate(user=self.user1)

    def test_share_photos(self):
        photos = create_test_photos(number_of_photos=3, owner=self.user1)
        image_hashes = [p.image_hash for p in photos]
        photo_ids = [p.id for p in photos]

        payload = {
            "image_hashes": image_hashes,
            "val_shared": True,
            "target_user_id": self.user2.id,
        }
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/share/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(3, data["count"])
        # Query by photo UUID (pk), not image_hash
        shared_photos = list(
            Photo.shared_to.through.objects.filter(
                user_id=self.user2.id, photo_id__in=photo_ids
            )
        )
        self.assertEqual(3, len(shared_photos))

    def test_unshare_photos(self):
        photos = create_test_photos(number_of_photos=3, owner=self.user1)
        image_hashes = [p.image_hash for p in photos]
        photo_ids = [p.id for p in photos]
        share_test_photos(image_hashes, self.user2)

        payload = {
            "image_hashes": image_hashes,
            "val_shared": False,
            "target_user_id": self.user2.id,
        }
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/share/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(3, data["count"])
        # Query by photo UUID (pk), not image_hash
        shared_photos = list(
            Photo.shared_to.through.objects.filter(
                user_id=self.user2.id, photo_id__in=photo_ids
            )
        )
        self.assertEqual(0, len(shared_photos))

    @skip("BUG!!! scenario not implemented")
    def test_share_other_user_photos(self):
        photos = create_test_photos(number_of_photos=2, owner=self.user2)
        image_hashes = [p.image_hash for p in photos]

        payload = {
            "image_hashes": image_hashes,
            "val_shared": True,
            "target_user_id": self.user1.id,
        }
        headers = {"Content-Type": "application/json"}
        response = self.client.post(
            "/api/photosedit/share/", format="json", data=payload, headers=headers
        )
        data = response.json()

        self.assertTrue(data["status"])
        self.assertEqual(0, data["count"])
        shared_photos = list(
            Photo.shared_to.through.objects.filter(
                user_id=self.user1.id, photo_id__in=image_hashes
            )
        )
        self.assertEqual(0, len(shared_photos))


================================================
FILE: api/tests/test_skip_raw_files.py
================================================
"""
Test to verify the behavior of the stack_raw_jpeg feature during scans.
Note: skip_raw_files is deprecated - RAW files are always imported, but can be stacked or not.
"""
from unittest.mock import patch

from django.test import TestCase

from api.models import Photo, User
from api.models.file import is_valid_media


class StackRawJpegTestCase(TestCase):
    """Test to verify that RAW files are always imported and can be stacked"""

    def setUp(self):
        """Set up the test environment"""
        self.user = User.objects.create_user(
            username="testuser",
            email="test@example.com",
            password="testpass123",
        )
        self.user.scan_directory = "/tmp/test_photos"
        self.user.save()

    def tearDown(self):
        """Clean up after tests"""
        Photo.objects.filter(owner=self.user).delete()
        self.user.delete()

    def test_raw_files_always_valid(self):
        """
        Test: RAW files are always considered valid (no longer skipped)
        """
        # Verify that is_valid_media returns True for RAW files regardless of stack_raw_jpeg
        with patch("api.models.file.is_raw") as mock_is_raw:
            mock_is_raw.return_value = True
            # With stack_raw_jpeg=True
            self.user.stack_raw_jpeg = True
            self.user.save()
            result = is_valid_media("/new/raw/file.NEF", self.user)
            self.assertTrue(
                result,
                "RAW files should always be considered valid",
            )

            # With stack_raw_jpeg=False
            self.user.stack_raw_jpeg = False
            self.user.save()
            result = is_valid_media("/new/raw/file.NEF", self.user)
            self.assertTrue(
                result,
                "RAW files should always be considered valid even with stack_raw_jpeg=False",
            )


================================================
FILE: api/tests/test_social_graph.py
================================================
"""
Tests for social graph functionality.
"""

from django.test import TestCase
from django.utils import timezone

from api.models import Face, Person, Photo, User
from api.social_graph import build_social_graph


class SocialGraphTestCase(TestCase):
    def setUp(self):
        """Set up test data."""
        self.user = User.objects.create_user(username="testuser", password="testpass")

    def test_build_social_graph_no_data(self):
        """Test building social graph with no faces/photos."""
        result = build_social_graph(self.user)
        self.assertEqual(result, {"nodes": [], "links": []})

    def test_build_social_graph_single_person(self):
        """Test building social graph with single person (no connections)."""
        # Create a photo
        photo = Photo.objects.create(
            owner=self.user,
            image_hash="testhash1",
            added_on=timezone.now(),
        )

        # Create a person
        person = Person.objects.create(name="John Doe", owner=self.user)

        # Create a face
        Face.objects.create(
            photo=photo,
            person=person,
            location_top=0,
            location_bottom=100,
            location_left=0,
            location_right=100,
            encoding="0" * 256,  # Dummy encoding
        )

        # Should return empty since we need at least 2 people in same photo for connections
        result = build_social_graph(self.user)
        self.assertEqual(result, {"nodes": [], "links": []})

    def test_build_social_graph_two_people_same_photo(self):
        """Test building social graph with two people in same photo."""
        # Create a photo
        photo = Photo.objects.create(
            owner=self.user,
            image_hash="testhash2",
            added_on=timezone.now(),
        )

        # Create two people
        person1 = Person.objects.create(name="Alice", owner=self.user)
        person2 = Person.objects.create(name="Bob", owner=self.user)

        # Create faces for both people in the same photo
        Face.objects.create(
            photo=photo,
            person=person1,
            location_top=0,
            location_bottom=100,
            location_left=0,
            location_right=100,
            encoding="0" * 256,
        )
        Face.objects.create(
            photo=photo,
            person=person2,
            location_top=0,
            location_bottom=100,
            location_left=100,
            location_right=200,
            encoding="1" * 256,
        )

        result = build_social_graph(self.user)

        # Should have 2 nodes and 1 link
        self.assertEqual(len(result["nodes"]), 2)
        self.assertEqual(len(result["links"]), 1)

        # Check node names
        node_ids = {node["id"] for node in result["nodes"]}
        self.assertEqual(node_ids, {"Alice", "Bob"})

        # Check link
        link = result["links"][0]
        self.assertIn(link["source"], {"Alice", "Bob"})
        self.assertIn(link["target"], {"Alice", "Bob"})
        self.assertNotEqual(link["source"], link["target"])


================================================
FILE: api/tests/test_stack_api_edge_cases.py
================================================
"""
Edge case tests for Stack API endpoints.

Tests cover:
- Manual stack creation edge cases
- Add/remove photos from stacks
- Set primary photo
- Merge stacks
- Stack statistics
- Detection triggers
"""

import uuid
from django.test import TestCase
from rest_framework.test import APIClient

from api.models.photo_stack import PhotoStack
from api.tests.utils import create_test_photo, create_test_user


class ManualStackCreationAPITestCase(TestCase):
    """Tests for manual stack creation API."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_create_manual_stack_success(self):
        """Test creating a manual stack with valid photos."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [photo1.image_hash, photo2.image_hash]},
            format='json',
        )
        
        self.assertEqual(response.status_code, 201)
        self.assertIn("stack_id", response.data)
        
        # Verify stack was created
        stack = PhotoStack.objects.get(id=response.data["stack_id"])
        self.assertEqual(stack.stack_type, PhotoStack.StackType.MANUAL)
        self.assertEqual(stack.photos.count(), 2)

    def test_create_manual_stack_minimum_photos(self):
        """Test that manual stack requires at least 2 photos."""
        photo1 = create_test_photo(owner=self.user)
        
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [photo1.image_hash]},
            format='json',
        )
        
        # Should fail - need at least 2 photos
        self.assertEqual(response.status_code, 400)

    def test_create_manual_stack_empty_photos(self):
        """Test creating manual stack with empty photo list."""
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": []},
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)

    def test_create_manual_stack_nonexistent_photos(self):
        """Test creating manual stack with nonexistent photo hashes."""
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": ["nonexistent1", "nonexistent2"]},
            format='json',
        )
        
        # Should fail - photos don't exist
        self.assertEqual(response.status_code, 400)

    def test_create_manual_stack_other_users_photos(self):
        """Test creating manual stack with other user's photos."""
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        my_photo = create_test_photo(owner=self.user)
        
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [my_photo.image_hash, other_photo.image_hash]},
            format='json',
        )
        
        # Should fail - only 1 photo found (other user's photo not found)
        self.assertEqual(response.status_code, 400)

    def test_create_manual_stack_duplicate_hashes(self):
        """Test creating manual stack with duplicate photo hashes.
        
        Bug #15 Fixed: Duplicate hashes are now de-duplicated before validation.
        If there's only 1 unique photo, the error message correctly states
        "At least 2 unique photos required".
        """
        photo = create_test_photo(owner=self.user)
        
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [photo.image_hash, photo.image_hash]},
            format='json',
        )
        
        # After fix: Duplicates are de-duplicated first, then we check if we have >= 2
        # Since there's only 1 unique photo, it fails with a clear message
        self.assertEqual(response.status_code, 400)
        self.assertEqual(response.data["error"], "At least 2 unique photos required to create a stack")


class AddRemovePhotosAPITestCase(TestCase):
    """Tests for adding/removing photos from stacks."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_add_photo_to_stack(self):
        """Test adding a photo to an existing stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/add",
            {"photo_hashes": [photo3.image_hash]},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 3)

    def test_add_already_in_stack_photo(self):
        """Test adding a photo that's already in the stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/add",
            {"photo_hashes": [photo1.image_hash]},
            format='json',
        )
        
        # Should succeed (idempotent) but count stays same
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 2)

    def test_remove_photo_from_stack(self):
        """Test removing a photo from a stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2, photo3)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            {"photo_hashes": [photo3.image_hash]},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 2)

    def test_remove_to_one_photo_deletes_stack(self):
        """Test that removing photos until 1 left deletes the stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        stack_id = stack.id
        
        response = self.client.post(
            f"/api/stacks/{stack_id}/remove",
            {"photo_hashes": [photo2.image_hash]},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        # Stack should be deleted (only 1 photo left)
        self.assertFalse(PhotoStack.objects.filter(id=stack_id).exists())

    def test_remove_photo_not_in_stack(self):
        """Test removing a photo that's not in the stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            {"photo_hashes": [photo3.image_hash]},
            format='json',
        )
        
        # Should succeed (no-op) or return 400
        self.assertIn(response.status_code, [200, 400])


class SetPrimaryPhotoAPITestCase(TestCase):
    """Tests for setting primary/cover photo."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_set_primary_photo(self):
        """Test setting a primary photo for a stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            {"photo_hash": photo2.image_hash},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        self.assertEqual(stack.primary_photo, photo2)

    def test_set_primary_photo_not_in_stack(self):
        """Test setting primary photo that's not in the stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            {"photo_hash": photo3.image_hash},
            format='json',
        )
        
        # Should fail - photo not in stack
        self.assertEqual(response.status_code, 400)

    def test_set_primary_nonexistent_photo(self):
        """Test setting primary with nonexistent photo hash."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            {"photo_hash": "nonexistent"},
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)


class MergeStacksAPITestCase(TestCase):
    """Tests for merging stacks."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_merge_two_stacks(self):
        """Test merging two manual stacks."""
        photos1 = [create_test_photo(owner=self.user) for _ in range(2)]
        photos2 = [create_test_photo(owner=self.user) for _ in range(2)]
        
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack1.photos.add(*photos1)
        
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2.photos.add(*photos2)
        
        # Get all photo hashes from both stacks
        all_hashes = [p.image_hash for p in photos1 + photos2]
        
        response = self.client.post(
            "/api/stacks/merge",
            {"photo_hashes": all_hashes},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        
        # Should have 1 stack with all 4 photos
        stacks = PhotoStack.objects.filter(owner=self.user, stack_type=PhotoStack.StackType.MANUAL)
        self.assertEqual(stacks.count(), 1)
        self.assertEqual(stacks.first().photos.count(), 4)

    def test_merge_nonexistent_stacks(self):
        """Test merging with photos not in any stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        response = self.client.post(
            "/api/stacks/merge",
            {"photo_hashes": [photo1.image_hash, photo2.image_hash]},
            format='json',
        )
        
        # Should create a new stack or return error
        self.assertIn(response.status_code, [200, 201, 400])


class StackStatsAPITestCase(TestCase):
    """Tests for stack statistics endpoint."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_stats_with_no_stacks(self):
        """Test stats endpoint with no stacks."""
        response = self.client.get("/api/stacks/stats")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_stacks"], 0)

    def test_stats_counts_by_type(self):
        """Test stats counts by stack type."""
        photos = [create_test_photo(owner=self.user) for _ in range(6)]
        
        # Create different stack types
        burst_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        burst_stack.photos.add(photos[0], photos[1])
        
        raw_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
        )
        raw_stack.photos.add(photos[2], photos[3])
        
        manual_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        manual_stack.photos.add(photos[4], photos[5])
        
        response = self.client.get("/api/stacks/stats")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_stacks"], 3)
        self.assertEqual(response.data["by_type"][PhotoStack.StackType.BURST_SEQUENCE], 1)
        self.assertEqual(response.data["by_type"][PhotoStack.StackType.RAW_JPEG_PAIR], 1)
        self.assertEqual(response.data["by_type"][PhotoStack.StackType.MANUAL], 1)

    def test_stats_photos_in_stacks(self):
        """Test stats counts photos in stacks correctly."""
        photos = [create_test_photo(owner=self.user) for _ in range(5)]
        
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack1.photos.add(photos[0], photos[1], photos[2])
        
        # Create another stack with overlapping photo
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack2.photos.add(photos[2], photos[3])  # photos[2] in both
        
        response = self.client.get("/api/stacks/stats")
        
        self.assertEqual(response.status_code, 200)
        # 4 unique photos (0,1,2,3)
        self.assertEqual(response.data["photos_in_stacks"], 4)

    def test_stats_other_users_not_included(self):
        """Test stats don't include other user's stacks."""
        other_user = create_test_user()
        
        # Create stack for other user
        other_photo1 = create_test_photo(owner=other_user)
        other_photo2 = create_test_photo(owner=other_user)
        stack = PhotoStack.objects.create(
            owner=other_user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(other_photo1, other_photo2)
        
        response = self.client.get("/api/stacks/stats")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_stacks"], 0)


class StackDeleteAPITestCase(TestCase):
    """Tests for stack deletion."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_delete_stack(self):
        """Test deleting a stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        stack_id = stack.id
        
        response = self.client.delete(f"/api/stacks/{stack_id}/delete")
        
        self.assertEqual(response.status_code, 200)
        self.assertFalse(PhotoStack.objects.filter(id=stack_id).exists())
        
        # Photos should still exist
        photo1.refresh_from_db()
        photo2.refresh_from_db()
        self.assertFalse(photo1.removed)

    def test_delete_nonexistent_stack(self):
        """Test deleting a nonexistent stack."""
        response = self.client.delete(f"/api/stacks/{uuid.uuid4()}/delete")
        self.assertEqual(response.status_code, 404)

    def test_delete_other_users_stack(self):
        """Test deleting another user's stack."""
        other_user = create_test_user()
        photo1 = create_test_photo(owner=other_user)
        photo2 = create_test_photo(owner=other_user)
        
        stack = PhotoStack.objects.create(
            owner=other_user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.delete(f"/api/stacks/{stack.id}/delete")
        
        # Should return 404 (not found for this user)
        self.assertEqual(response.status_code, 404)


class StackDetailAPITestCase(TestCase):
    """Tests for stack detail view."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_get_stack_detail(self):
        """Test getting stack details."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.get(f"/api/stacks/{stack.id}")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["stack_type"], PhotoStack.StackType.MANUAL)
        self.assertEqual(len(response.data["photos"]), 2)

    def test_get_stack_with_deleted_primary(self):
        """Test getting stack when primary photo was deleted."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2, photo3)
        
        # Delete primary photo
        photo1.in_trashcan = True
        photo1.save()
        photo1.manual_delete()
        
        # Stack should still exist with 2 photos
        stack.refresh_from_db()
        
        response = self.client.get(f"/api/stacks/{stack.id}")
        
        self.assertEqual(response.status_code, 200)


class StackListAPITestCase(TestCase):
    """Tests for stack list view."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_list_stacks(self):
        """Test listing all stacks."""
        photos = [create_test_photo(owner=self.user) for _ in range(4)]
        
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack1.photos.add(photos[0], photos[1])
        
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack2.photos.add(photos[2], photos[3])
        
        response = self.client.get("/api/stacks")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 2)

    def test_list_stacks_filter_by_type(self):
        """Test filtering stacks by type."""
        photos = [create_test_photo(owner=self.user) for _ in range(4)]
        
        manual_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        manual_stack.photos.add(photos[0], photos[1])
        
        burst_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        burst_stack.photos.add(photos[2], photos[3])
        
        response = self.client.get(f"/api/stacks?stack_type={PhotoStack.StackType.MANUAL}")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)

    def test_list_excludes_single_photo_stacks(self):
        """Test that list excludes stacks with only 1 photo."""
        photo = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo)
        
        response = self.client.get("/api/stacks")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 0)


class DetectionTriggerAPITestCase(TestCase):
    """Tests for detection trigger endpoints."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_trigger_detection(self):
        """Test triggering stack detection."""
        response = self.client.post(
            "/api/stacks/detect",
            {
                "detect_raw_jpeg": True,
                "detect_bursts": False,
                "detect_live_photos": False,
            },
            format='json',
        )
        
        # Should return 202 Accepted (queued)
        self.assertEqual(response.status_code, 202)

    def test_trigger_detection_empty_body(self):
        """Test triggering detection with empty body (defaults)."""
        response = self.client.post("/api/stacks/detect", {}, format='json')
        
        # Should succeed with defaults
        self.assertEqual(response.status_code, 202)


================================================
FILE: api/tests/test_stack_detection.py
================================================
"""
Comprehensive tests for PhotoStack Detection and API.

Tests cover:
- PhotoStack model functionality
- Stack API endpoints (list, detail, delete, set-primary, add, remove)
- Manual stack creation and merging
- Stack detection triggering
- Edge cases and error handling
"""

import uuid
from unittest.mock import patch

from django.test import TestCase
from rest_framework import status
from rest_framework.test import APIClient

from api.models import Photo
from api.models.photo_stack import PhotoStack
from api.tests.utils import create_test_photo, create_test_user


class PhotoStackModelTestCase(TestCase):
    """Tests for PhotoStack model functionality."""

    def setUp(self):
        self.user = create_test_user()
        self.photo1 = create_test_photo(owner=self.user)
        self.photo2 = create_test_photo(owner=self.user)
        self.photo3 = create_test_photo(owner=self.user)

    def test_create_stack_basic(self):
        """Test basic stack creation."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(stack)
        self.photo2.stacks.add(stack)

        self.assertEqual(stack.photo_count, 2)
        self.assertEqual(stack.owner, self.user)
        self.assertEqual(stack.stack_type, PhotoStack.StackType.MANUAL)

    def test_stack_types(self):
        """Test all stack types can be created."""
        for stack_type, display_name in PhotoStack.StackType.choices:
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=stack_type,
            )
            self.assertEqual(stack.stack_type, stack_type)
            self.assertIn(display_name, str(stack.get_stack_type_display()))

    def test_auto_select_primary_for_manual_stack(self):
        """Test auto-selecting primary for manual stack picks highest resolution."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(stack)
        self.photo2.stacks.add(stack)
        
        stack.auto_select_primary()
        
        # Primary should be set
        self.assertIsNotNone(stack.primary_photo)
        self.assertIn(stack.primary_photo, [self.photo1, self.photo2])

    def test_auto_select_primary_empty_stack(self):
        """Test auto_select_primary returns None for empty stack."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        
        result = stack.auto_select_primary()
        
        self.assertIsNone(result)
        self.assertIsNone(stack.primary_photo)

    def test_merge_with_another_stack(self):
        """Test merging two stacks."""
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        
        self.photo1.stacks.add(stack1)
        self.photo2.stacks.add(stack2)
        self.photo3.stacks.add(stack2)
        
        stack2_id = stack2.pk
        stack1.merge_with(stack2)
        
        # All photos should be in stack1
        self.assertEqual(stack1.photos.count(), 3)
        self.assertIn(self.photo1, stack1.photos.all())
        self.assertIn(self.photo2, stack1.photos.all())
        self.assertIn(self.photo3, stack1.photos.all())
        
        # stack2 should be deleted
        self.assertFalse(PhotoStack.objects.filter(pk=stack2_id).exists())

    def test_merge_with_self_does_nothing(self):
        """Test merging a stack with itself is a no-op."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(stack)
        
        stack.merge_with(stack)
        
        # Stack should still exist and have same photo
        self.assertTrue(PhotoStack.objects.filter(pk=stack.pk).exists())
        self.assertEqual(stack.photos.count(), 1)

    def test_create_or_merge_new_stack(self):
        """Test create_or_merge creates a new stack when no overlap."""
        photos = [self.photo1, self.photo2]
        
        stack = PhotoStack.create_or_merge(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            photos=photos,
        )
        
        self.assertIsNotNone(stack)
        self.assertEqual(stack.photos.count(), 2)
        self.assertIsNotNone(stack.primary_photo)

    def test_create_or_merge_returns_none_for_single_photo(self):
        """Test create_or_merge returns None when given <2 photos."""
        stack = PhotoStack.create_or_merge(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            photos=[self.photo1],
        )
        
        self.assertIsNone(stack)

    def test_create_or_merge_merges_existing_stacks(self):
        """Test create_or_merge merges when photos already in stack."""
        # Create existing stack with photo1
        existing_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(existing_stack)
        
        # Now create_or_merge with photo1 and photo2
        result = PhotoStack.create_or_merge(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            photos=[self.photo1, self.photo2],
        )
        
        # Should return the existing stack with both photos
        self.assertEqual(result.pk, existing_stack.pk)
        self.assertEqual(result.photos.count(), 2)
        self.assertIn(self.photo2, result.photos.all())

    def test_photo_can_be_in_multiple_stacks_of_different_types(self):
        """Test a photo can be in stacks of different types."""
        raw_jpeg_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
        )
        manual_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        
        self.photo1.stacks.add(raw_jpeg_stack)
        self.photo1.stacks.add(manual_stack)
        
        self.assertEqual(self.photo1.stacks.count(), 2)


class PhotoStackAPITestCase(TestCase):
    """Tests for PhotoStack API endpoints."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.other_user = create_test_user()
        self.client.force_authenticate(user=self.user)
        
        # Create photos for testing
        self.photo1 = create_test_photo(owner=self.user)
        self.photo2 = create_test_photo(owner=self.user)
        self.photo3 = create_test_photo(owner=self.user)
        
        # Create a test stack
        self.stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(self.stack)
        self.photo2.stacks.add(self.stack)
        self.stack.auto_select_primary()

    def test_list_stacks_returns_user_stacks(self):
        """Test listing stacks returns only user's stacks."""
        response = self.client.get("/api/stacks")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertIn("results", data)
        self.assertIn("count", data)
        self.assertEqual(data["count"], 1)
        self.assertEqual(len(data["results"]), 1)
        self.assertEqual(data["results"][0]["id"], str(self.stack.id))

    def test_list_stacks_excludes_other_user_stacks(self):
        """Test listing stacks doesn't include other user's stacks."""
        # Create stack for other user
        other_photo = create_test_photo(owner=self.other_user)
        other_photo2 = create_test_photo(owner=self.other_user)
        other_stack = PhotoStack.objects.create(
            owner=self.other_user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        other_photo.stacks.add(other_stack)
        other_photo2.stacks.add(other_stack)
        
        response = self.client.get("/api/stacks")
        
        data = response.json()
        self.assertEqual(data["count"], 1)  # Only our stack
        self.assertNotEqual(data["results"][0]["id"], str(other_stack.id))

    def test_list_stacks_excludes_stacks_with_less_than_2_photos(self):
        """Test listing excludes stacks with <2 photos."""
        # Create stack with only 1 photo
        single_photo_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo3.stacks.add(single_photo_stack)
        
        response = self.client.get("/api/stacks")
        
        data = response.json()
        self.assertEqual(data["count"], 1)  # Only the stack with 2 photos

    def test_list_stacks_filter_by_type(self):
        """Test filtering stacks by type."""
        # Create burst stack
        burst_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        self.photo3.stacks.add(burst_stack)
        photo4 = create_test_photo(owner=self.user)
        photo4.stacks.add(burst_stack)
        
        response = self.client.get("/api/stacks?stack_type=burst")
        
        data = response.json()
        self.assertEqual(data["count"], 1)
        self.assertEqual(data["results"][0]["stack_type"], "burst")

    def test_list_stacks_pagination(self):
        """Test pagination works correctly."""
        response = self.client.get("/api/stacks?page=1&page_size=10")
        
        data = response.json()
        self.assertIn("page", data)
        self.assertIn("page_size", data)
        self.assertIn("has_next", data)
        self.assertIn("has_previous", data)
        self.assertEqual(data["page"], 1)
        self.assertEqual(data["page_size"], 10)

    def test_get_stack_detail(self):
        """Test getting stack detail."""
        response = self.client.get(f"/api/stacks/{self.stack.id}")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["id"], str(self.stack.id))
        self.assertEqual(data["stack_type"], "manual")
        self.assertEqual(data["photo_count"], 2)
        self.assertIn("photos", data)
        self.assertEqual(len(data["photos"]), 2)

    def test_get_stack_detail_not_found(self):
        """Test getting non-existent stack returns 404."""
        fake_id = uuid.uuid4()
        response = self.client.get(f"/api/stacks/{fake_id}")
        
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_get_stack_detail_other_user_returns_404(self):
        """Test getting other user's stack returns 404."""
        other_photo = create_test_photo(owner=self.other_user)
        other_photo2 = create_test_photo(owner=self.other_user)
        other_stack = PhotoStack.objects.create(
            owner=self.other_user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        other_photo.stacks.add(other_stack)
        other_photo2.stacks.add(other_stack)
        
        response = self.client.get(f"/api/stacks/{other_stack.id}")
        
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_delete_stack(self):
        """Test deleting a stack unlinks photos but doesn't delete them."""
        stack_id = self.stack.id
        photo1_pk = self.photo1.pk
        photo2_pk = self.photo2.pk
        
        response = self.client.delete(f"/api/stacks/{stack_id}/delete")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "deleted")
        self.assertEqual(data["unlinked_count"], 2)
        
        # Stack should be deleted
        self.assertFalse(PhotoStack.objects.filter(pk=stack_id).exists())
        
        # Photos should still exist
        self.assertTrue(Photo.objects.filter(pk=photo1_pk).exists())
        self.assertTrue(Photo.objects.filter(pk=photo2_pk).exists())

    def test_delete_stack_not_found(self):
        """Test deleting non-existent stack returns 404."""
        fake_id = uuid.uuid4()
        response = self.client.delete(f"/api/stacks/{fake_id}/delete")
        
        self.assertEqual(response.status_code, status.HTTP_404_NOT_FOUND)

    def test_set_primary_photo(self):
        """Test setting a photo as primary."""
        response = self.client.post(
            f"/api/stacks/{self.stack.id}/primary",
            {"photo_hash": self.photo2.image_hash},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "updated")
        self.assertEqual(data["primary_photo_hash"], self.photo2.image_hash)
        
        # Verify in database
        self.stack.refresh_from_db()
        self.assertEqual(self.stack.primary_photo.image_hash, self.photo2.image_hash)

    def test_set_primary_photo_not_in_stack(self):
        """Test setting photo not in stack as primary returns 400."""
        response = self.client.post(
            f"/api/stacks/{self.stack.id}/primary",
            {"photo_hash": self.photo3.image_hash},  # photo3 not in stack
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)
        self.assertIn("error", response.json())

    def test_set_primary_missing_photo_hash(self):
        """Test setting primary without photo_hash returns 400."""
        response = self.client.post(
            f"/api/stacks/{self.stack.id}/primary",
            {},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_add_photos_to_stack(self):
        """Test adding photos to an existing stack."""
        response = self.client.post(
            f"/api/stacks/{self.stack.id}/add",
            {"photo_hashes": [self.photo3.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "updated")
        self.assertEqual(data["added_count"], 1)
        self.assertEqual(data["total_count"], 3)
        
        # Verify in database
        self.assertIn(self.photo3, self.stack.photos.all())

    def test_add_photos_already_in_stack(self):
        """Test adding photo already in stack doesn't duplicate."""
        response = self.client.post(
            f"/api/stacks/{self.stack.id}/add",
            {"photo_hashes": [self.photo1.image_hash]},  # Already in stack
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["added_count"], 0)  # Not added again
        self.assertEqual(data["total_count"], 2)

    def test_remove_photos_from_stack(self):
        """Test removing photos from a stack."""
        # First add photo3 so we have 3 photos
        self.photo3.stacks.add(self.stack)
        
        response = self.client.post(
            f"/api/stacks/{self.stack.id}/remove",
            {"photo_hashes": [self.photo3.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "updated")
        self.assertEqual(data["removed_count"], 1)
        self.assertEqual(data["total_count"], 2)

    def test_remove_photos_deletes_stack_if_less_than_2_remain(self):
        """Test removing photos deletes stack if <2 photos remain."""
        stack_id = self.stack.id
        
        response = self.client.post(
            f"/api/stacks/{self.stack.id}/remove",
            {"photo_hashes": [self.photo1.image_hash, self.photo2.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "deleted")
        
        # Stack should be deleted
        self.assertFalse(PhotoStack.objects.filter(pk=stack_id).exists())

    def test_unauthenticated_request_returns_401(self):
        """Test unauthenticated requests return 401."""
        self.client.force_authenticate(user=None)
        
        response = self.client.get("/api/stacks")
        
        self.assertEqual(response.status_code, status.HTTP_401_UNAUTHORIZED)


class ManualStackCreationTestCase(TestCase):
    """Tests for manual stack creation."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        
        self.photo1 = create_test_photo(owner=self.user)
        self.photo2 = create_test_photo(owner=self.user)
        self.photo3 = create_test_photo(owner=self.user)

    def test_create_manual_stack(self):
        """Test creating a manual stack."""
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [self.photo1.image_hash, self.photo2.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_201_CREATED)
        data = response.json()
        self.assertEqual(data["status"], "created")
        self.assertIn("stack_id", data)
        self.assertEqual(data["photo_count"], 2)
        
        # Verify stack was created
        stack = PhotoStack.objects.get(pk=data["stack_id"])
        self.assertEqual(stack.stack_type, PhotoStack.StackType.MANUAL)
        self.assertEqual(stack.photos.count(), 2)

    def test_create_manual_stack_requires_at_least_2_photos(self):
        """Test creating stack with <2 photos returns error."""
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [self.photo1.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_create_manual_stack_invalid_photo_hash(self):
        """Test creating stack with invalid photo hash returns error."""
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [self.photo1.image_hash, "invalid_hash"]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)
        self.assertIn("error", response.json())

    def test_create_manual_stack_other_user_photo(self):
        """Test creating stack with other user's photo returns error."""
        other_user = create_test_user()
        other_photo = create_test_photo(owner=other_user)
        
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [self.photo1.image_hash, other_photo.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_create_manual_stack_adds_to_existing_if_already_stacked(self):
        """Test creating stack adds to existing stack if photo already in manual stack."""
        # Create existing manual stack
        existing_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(existing_stack)
        self.photo2.stacks.add(existing_stack)
        
        # Try to create new stack with photo1 and photo3
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [self.photo1.image_hash, self.photo3.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_201_CREATED)
        data = response.json()
        self.assertEqual(data["stack_id"], str(existing_stack.id))
        
        # Verify photo3 was added to existing stack
        self.assertIn(self.photo3, existing_stack.photos.all())


class MergeStacksTestCase(TestCase):
    """Tests for stack merging."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        
        self.photo1 = create_test_photo(owner=self.user)
        self.photo2 = create_test_photo(owner=self.user)
        self.photo3 = create_test_photo(owner=self.user)
        self.photo4 = create_test_photo(owner=self.user)

    def test_merge_stacks(self):
        """Test merging multiple stacks."""
        # Create two separate stacks
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(stack1)
        self.photo2.stacks.add(stack1)
        
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo3.stacks.add(stack2)
        self.photo4.stacks.add(stack2)
        
        stack1_id = stack1.id
        stack2_id = stack2.id
        
        # Merge stacks using photos from both
        response = self.client.post(
            "/api/stacks/merge",
            {"photo_hashes": [self.photo1.image_hash, self.photo3.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        
        self.assertEqual(data["status"], "merged")
        self.assertEqual(data["merged_count"], 1)
        self.assertEqual(data["photo_count"], 4)
        
        # The non-target stack should be deleted
        # The target stack is the one returned in the response
        returned_stack_id = data.get("stack_id")
        if str(stack1_id) == returned_stack_id:
            # stack1 was target, stack2 should be deleted
            self.assertFalse(
                PhotoStack.objects.filter(pk=stack2_id).exists(),
                "stack2 should be deleted but still exists"
            )
        else:
            # stack2 was target, stack1 should be deleted
            self.assertFalse(
                PhotoStack.objects.filter(pk=stack1_id).exists(),
                "stack1 should be deleted but still exists"
            )

    def test_merge_single_stack_no_merge_needed(self):
        """Test merging when only one stack found returns no_merge_needed."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(stack)
        self.photo2.stacks.add(stack)
        
        response = self.client.post(
            "/api/stacks/merge",
            {"photo_hashes": [self.photo1.image_hash, self.photo2.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["status"], "no_merge_needed")

    def test_merge_no_stacks_returns_error(self):
        """Test merging photos not in any stack returns error."""
        response = self.client.post(
            "/api/stacks/merge",
            {"photo_hashes": [self.photo1.image_hash, self.photo2.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_merge_missing_photo_hashes(self):
        """Test merge without photo_hashes returns error."""
        response = self.client.post(
            "/api/stacks/merge",
            {},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)


class StackDetectionTestCase(TestCase):
    """Tests for stack detection trigger."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)

    @patch("api.views.stacks.async_task")
    def test_detect_stacks_queues_background_job(self, mock_async_task):
        """Test detect stacks queues a background job."""
        response = self.client.post("/api/stacks/detect")
        
        self.assertEqual(response.status_code, status.HTTP_202_ACCEPTED)
        data = response.json()
        self.assertEqual(data["status"], "queued")
        self.assertIn("options", data)
        
        # Verify async_task was called
        mock_async_task.assert_called_once()

    @patch("api.views.stacks.async_task")
    def test_detect_stacks_with_options(self, mock_async_task):
        """Test detect stacks with custom options.
        
        NOTE: detect_raw_jpeg and detect_live_photos options were removed.
        RAW+JPEG and Live Photos are now handled via file variants during scan.
        Only detect_bursts is available.
        """
        response = self.client.post(
            "/api/stacks/detect",
            {
                "detect_bursts": False,
            },
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_202_ACCEPTED)
        data = response.json()
        self.assertEqual(data["options"]["detect_bursts"], False)


class StackStatsTestCase(TestCase):
    """Tests for stack statistics."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        
        self.photo1 = create_test_photo(owner=self.user)
        self.photo2 = create_test_photo(owner=self.user)
        self.photo3 = create_test_photo(owner=self.user)
        self.photo4 = create_test_photo(owner=self.user)

    def test_get_stack_stats(self):
        """Test getting stack statistics."""
        # Create some stacks
        manual_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(manual_stack)
        self.photo2.stacks.add(manual_stack)
        
        burst_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        self.photo3.stacks.add(burst_stack)
        self.photo4.stacks.add(burst_stack)
        
        response = self.client.get("/api/stacks/stats")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["total_stacks"], 2)
        self.assertIn("by_type", data)
        self.assertEqual(data["by_type"]["manual"], 1)
        self.assertEqual(data["by_type"]["burst"], 1)
        self.assertEqual(data["photos_in_stacks"], 4)


class StackEdgeCasesTestCase(TestCase):
    """Edge case tests for stacks."""

    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)
        
        self.photo1 = create_test_photo(owner=self.user)
        self.photo2 = create_test_photo(owner=self.user)

    def test_invalid_uuid_format_in_url(self):
        """Test invalid UUID format in URL is handled gracefully."""
        response = self.client.get("/api/stacks/not-a-valid-uuid")
        
        # The URL pattern [0-9a-f-]+ is permissive and partial matches fall through
        # to the list endpoint which returns 200. This is acceptable behavior -
        # the important thing is we don't get a 500 error.
        self.assertIn(response.status_code, [
            status.HTTP_200_OK,  # Falls through to list endpoint
            status.HTTP_400_BAD_REQUEST,
            status.HTTP_404_NOT_FOUND
        ])

    def test_stack_with_deleted_photo_handles_gracefully(self):
        """Test stack behavior when a photo is deleted."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(stack)
        self.photo2.stacks.add(stack)
        stack.primary_photo = self.photo1
        stack.save()
        
        # Delete photo1
        self.photo1.delete()
        
        # Stack detail should still work
        response = self.client.get(f"/api/stacks/{stack.id}")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        # primary_photo should be None or the remaining photo
        self.assertEqual(len(data["photos"]), 1)

    def test_empty_photo_hashes_array(self):
        """Test empty photo_hashes array returns error."""
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": []},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_duplicate_photo_hashes_in_request(self):
        """Test duplicate photo hashes in request are handled."""
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [self.photo1.image_hash, self.photo1.image_hash]},
            format="json",
        )
        
        # Should fail since we need 2 unique photos
        self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST)

    def test_remove_primary_photo_auto_selects_new_primary(self):
        """Test removing primary photo auto-selects a new primary."""
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photo1.stacks.add(stack)
        self.photo2.stacks.add(stack)
        photo3.stacks.add(stack)
        stack.primary_photo = self.photo1
        stack.save()
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            {"photo_hashes": [self.photo1.image_hash]},
            format="json",
        )
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        
        # Refresh and check primary was auto-selected
        stack.refresh_from_db()
        self.assertIsNotNone(stack.primary_photo)
        self.assertNotEqual(stack.primary_photo.image_hash, self.photo1.image_hash)

    def test_stack_list_page_size_max_100(self):
        """Test page_size is capped at 100."""
        response = self.client.get("/api/stacks?page_size=500")
        
        self.assertEqual(response.status_code, status.HTTP_200_OK)
        data = response.json()
        self.assertEqual(data["page_size"], 100)  # Capped at 100


================================================
FILE: api/tests/test_stack_detection_edge_cases.py
================================================
"""
Edge case tests for Stack Detection to find bugs.

NOTE: RAW+JPEG pairs and Live Photos are now handled as file variants
during scan (Photo.files ManyToMany field), not as stacks.

These tests specifically target:
1. create_or_merge queryset ordering issues (potential Bug #11)
2. Edge cases in hard criteria burst detection
3. Edge cases in soft criteria burst detection
4. File variant handling edge cases
5. Memory/performance edge cases
"""

import json
import uuid
from datetime import datetime, timedelta
from unittest.mock import patch

from django.test import TestCase

from api.models.file import File
from api.models.photo_stack import PhotoStack
from api.models.duplicate import Duplicate
from api.models.long_running_job import LongRunningJob
from api.stack_detection import (
    clear_stacks_of_type,
    detect_burst_sequences,
    batch_detect_stacks,
    _create_burst_stack,
)
from api.tests.utils import create_test_photo, create_test_user


class CreateOrMergeQuerysetOrderingTestCase(TestCase):
    """
    Test for Bug #11: create_or_merge uses two separate queries without ordering.

    The code does:
        existing_stacks = cls.objects.filter(...).distinct()
        target_stack = existing_stacks.first()      # Query 1
        for stack in existing_stacks[1:]:           # Query 2

    Without explicit ordering, these two queries could return stacks in different
    orders, causing the merge to not work correctly.
    """

    def setUp(self):
        self.user = create_test_user()

    def test_create_or_merge_with_multiple_existing_stacks(self):
        """Test that create_or_merge properly merges when photos are in multiple stacks."""
        # Create 4 photos
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        photo4 = create_test_photo(owner=self.user)

        # Create two separate stacks
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack1.photos.add(photo1, photo2)

        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack2.photos.add(photo3, photo4)

        # Now try to create a stack with photos from both existing stacks
        # This should trigger the merge logic
        result_stack = PhotoStack.create_or_merge(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            photos=[photo1, photo3],  # One from each stack
        )

        # Should have merged into one stack
        self.assertIsNotNone(result_stack)

        # Count remaining stacks of this type
        remaining_stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )

        # Should only have 1 stack after merge
        self.assertEqual(
            remaining_stacks.count(),
            1,
            "Multiple existing stacks should be merged into one",
        )

        # The merged stack should contain all 4 photos
        merged_stack = remaining_stacks.first()
        self.assertEqual(
            merged_stack.photos.count(),
            4,
            "Merged stack should contain all photos from both original stacks",
        )

    def test_create_or_merge_with_three_existing_stacks(self):
        """Test merging with 3 existing stacks - tests iterative merge."""
        photos = [create_test_photo(owner=self.user) for _ in range(6)]

        # Create three separate stacks with 2 photos each
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack1.photos.add(photos[0], photos[1])

        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack2.photos.add(photos[2], photos[3])

        stack3 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack3.photos.add(photos[4], photos[5])

        # Create stack with one photo from each existing stack
        _result_stack = PhotoStack.create_or_merge(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            photos=[photos[0], photos[2], photos[4]],
        )

        # Should merge all into one
        remaining_stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )

        self.assertEqual(
            remaining_stacks.count(), 1, "All 3 stacks should be merged into one"
        )
        self.assertEqual(
            remaining_stacks.first().photos.count(),
            6,
            "Merged stack should have all 6 photos",
        )


class DuplicateCreateOrMergeOrderingTestCase(TestCase):
    """Test the same ordering issue in Duplicate.create_or_merge."""

    def setUp(self):
        self.user = create_test_user()

    def test_duplicate_create_or_merge_with_multiple_groups(self):
        """Test that Duplicate.create_or_merge properly merges multiple groups."""
        photos = [create_test_photo(owner=self.user) for _ in range(4)]

        # Create two duplicate groups
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup1.photos.add(photos[0], photos[1])

        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup2.photos.add(photos[2], photos[3])

        # Merge by adding photos from both groups
        _result = Duplicate.create_or_merge(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            photos=[photos[0], photos[2]],
        )

        remaining = Duplicate.objects.filter(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )

        self.assertEqual(
            remaining.count(), 1, "Multiple duplicate groups should be merged"
        )
        self.assertEqual(
            remaining.first().photos.count(), 4, "Merged group should have all photos"
        )


class HardCriteriaBurstDetectionEdgeCasesTestCase(TestCase):
    """Edge cases for hard criteria burst detection."""

    def setUp(self):
        self.user = create_test_user()
        # Set up hard rule that uses EXIF burst mode
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "EXIF Burst Mode",
                    "rule_type": "exif_burst_mode",
                    "category": "hard",
                    "enabled": True,
                }
            ]
        )
        self.user.save()

    def _create_file(self, path, file_type=File.IMAGE):
        """Helper to create a File object."""
        return File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path=path,
            type=file_type,
        )

    def _create_photo_with_file(self, path, **kwargs):
        """Helper to create Photo with associated File."""
        file = self._create_file(path, File.IMAGE)
        photo = create_test_photo(owner=self.user, **kwargs)
        photo.main_file = file
        photo.save()
        return photo

    def test_all_photos_without_main_file(self):
        """Test detection when all photos have no main_file."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo1.main_file = None
        photo2.main_file = None
        photo1.save()
        photo2.save()

        # Should handle gracefully
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)

    @patch("api.metadata.reader.get_metadata")
    def test_get_metadata_raises_exception_for_all(self, mock_get_metadata):
        """Test when get_metadata raises exceptions for every photo."""
        _photo1 = self._create_photo_with_file("/photos/IMG_001.jpg")
        _photo2 = self._create_photo_with_file("/photos/IMG_002.jpg")

        mock_get_metadata.side_effect = Exception("EXIF read failed")

        # Should handle gracefully without crashing
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)

    @patch("api.metadata.reader.get_metadata")
    def test_get_metadata_returns_empty_for_some(self, mock_get_metadata):
        """Test when get_metadata returns empty for some photos."""
        _photo1 = self._create_photo_with_file("/photos/IMG_001.jpg")
        _photo2 = self._create_photo_with_file("/photos/IMG_002.jpg")

        # Return empty values
        mock_get_metadata.return_value = [None, None]

        count = detect_burst_sequences(self.user)
        # No bursts found because EXIF data is empty
        self.assertEqual(count, 0)


class SoftCriteriaBurstDetectionEdgeCasesTestCase(TestCase):
    """Edge cases for soft criteria burst detection."""

    def setUp(self):
        self.user = create_test_user()

    def _create_file(self, path, file_type=File.IMAGE):
        """Helper to create a File object."""
        return File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path=path,
            type=file_type,
        )

    def _create_photo_with_timestamp(self, timestamp, perceptual_hash=None, **kwargs):
        """Helper to create Photo with specific timestamp and optional hash."""
        photo = create_test_photo(owner=self.user, **kwargs)
        photo.exif_timestamp = timestamp
        if perceptual_hash:
            photo.perceptual_hash = perceptual_hash
        file = self._create_file(f"/photos/IMG_{photo.pk}.jpg")
        photo.main_file = file
        photo.save()
        return photo

    def test_visual_similarity_with_null_perceptual_hash(self):
        """Test visual similarity detection when photos have no perceptual hash."""
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "Visual Similarity",
                    "rule_type": "visual_similarity",
                    "category": "soft",
                    "enabled": True,
                    "similarity_threshold": 15,
                }
            ]
        )
        self.user.save()

        base_time = datetime(2024, 1, 1, 12, 0, 0)
        # Create photos with no perceptual hash
        _photo1 = self._create_photo_with_timestamp(base_time, perceptual_hash=None)
        _photo2 = self._create_photo_with_timestamp(
            base_time + timedelta(seconds=1), perceptual_hash=None
        )

        # Should handle gracefully
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)

    def test_timestamp_proximity_with_same_timestamp(self):
        """Test timestamp proximity when multiple photos have exact same timestamp."""
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "Timestamp Proximity",
                    "rule_type": "timestamp_proximity",
                    "category": "soft",
                    "enabled": True,
                    "interval_ms": 2000,
                }
            ]
        )
        self.user.save()

        exact_time = datetime(2024, 1, 1, 12, 0, 0)
        # Create 5 photos with exact same timestamp
        photos = []
        for i in range(5):
            photos.append(self._create_photo_with_timestamp(exact_time))

        count = detect_burst_sequences(self.user)

        # Should create one burst stack with all 5 photos
        self.assertEqual(count, 1)

        stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        self.assertEqual(stacks.count(), 1)
        self.assertEqual(stacks.first().photos.count(), 5)

    def test_timestamp_proximity_boundary_condition(self):
        """Test timestamp proximity at exact boundary (2000ms)."""
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "Timestamp Proximity",
                    "rule_type": "timestamp_proximity",
                    "category": "soft",
                    "enabled": True,
                    "interval_ms": 2000,
                    "require_same_camera": False,
                }
            ]
        )
        self.user.save()

        base_time = datetime(2024, 1, 1, 12, 0, 0)
        # Photo 2 is exactly 2000ms after photo 1
        _photo1 = self._create_photo_with_timestamp(base_time)
        _photo2 = self._create_photo_with_timestamp(
            base_time + timedelta(milliseconds=2000)
        )
        # Photo 3 is 2001ms after photo 1 (just outside boundary)
        _photo3 = self._create_photo_with_timestamp(
            base_time + timedelta(milliseconds=2001)
        )

        count = detect_burst_sequences(self.user)

        # Depending on implementation, photo1+photo2 might be grouped, photo3 separate
        # This tests the boundary condition behavior
        _stacks = PhotoStack.objects.filter(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        # At minimum, should not crash
        self.assertGreaterEqual(count, 0)

    def test_all_photos_already_in_burst_stacks(self):
        """Test soft criteria when all photos are already in burst stacks."""
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "Timestamp Proximity",
                    "rule_type": "timestamp_proximity",
                    "category": "soft",
                    "enabled": True,
                    "interval_ms": 5000,
                }
            ]
        )
        self.user.save()

        base_time = datetime(2024, 1, 1, 12, 0, 0)
        photo1 = self._create_photo_with_timestamp(base_time)
        photo2 = self._create_photo_with_timestamp(base_time + timedelta(seconds=1))

        # Pre-create a burst stack with both photos
        existing_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        existing_stack.photos.add(photo1, photo2)

        # Run detection - burst stacks are cleared at start, so this will re-detect
        count = detect_burst_sequences(self.user)

        # Should re-detect the burst
        self.assertEqual(count, 1)


class FileVariantEdgeCasesTestCase(TestCase):
    """
    Edge cases for file variant handling.

    File variants (RAW+JPEG, Live Photos) are now stored via Photo.files
    ManyToMany field, not as stacks.
    """

    def setUp(self):
        self.user = create_test_user()

    def _create_file(self, path, file_type=File.IMAGE):
        """Helper to create a File object."""
        return File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path=path,
            type=file_type,
        )

    def test_multiple_raw_files_same_photo(self):
        """Test when multiple RAW files are attached to same photo."""
        photo = create_test_photo(owner=self.user)

        # Add JPEG as main file
        jpeg_file = self._create_file("/photos/IMG_001.jpg", File.IMAGE)
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)

        # Add multiple RAW files (e.g., camera shot both CR2 and NEF)
        raw_cr2 = self._create_file("/photos/IMG_001.CR2", File.RAW_FILE)
        raw_nef = self._create_file("/photos/IMG_001.NEF", File.RAW_FILE)
        photo.files.add(raw_cr2, raw_nef)
        photo.save()

        # Photo should have 3 file variants
        self.assertEqual(photo.files.count(), 3)
        self.assertEqual(photo.files.filter(type=File.RAW_FILE).count(), 2)

    def test_video_and_raw_same_photo(self):
        """Test Live Photo with RAW (image + video + RAW)."""
        photo = create_test_photo(owner=self.user)

        # Add HEIC as main file
        heic_file = self._create_file("/photos/IMG_001.heic", File.IMAGE)
        photo.main_file = heic_file
        photo.files.add(heic_file)

        # Add RAW
        raw_file = self._create_file("/photos/IMG_001.DNG", File.RAW_FILE)
        photo.files.add(raw_file)

        # Add video for Live Photo
        video_file = self._create_file("/photos/IMG_001.mov", File.VIDEO)
        photo.files.add(video_file)
        photo.save()

        # Photo should have all three
        self.assertEqual(photo.files.count(), 3)
        self.assertTrue(photo.files.filter(type=File.IMAGE).exists())
        self.assertTrue(photo.files.filter(type=File.RAW_FILE).exists())
        self.assertTrue(photo.files.filter(type=File.VIDEO).exists())

    def test_dot_in_basename(self):
        """Test files with dots in basename."""
        photo = create_test_photo(owner=self.user)

        # File with dots in name
        jpeg_file = self._create_file("/photos/IMG.2024.01.01.001.jpg", File.IMAGE)
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)

        raw_file = self._create_file("/photos/IMG.2024.01.01.001.CR2", File.RAW_FILE)
        photo.files.add(raw_file)
        photo.save()

        self.assertEqual(photo.files.count(), 2)

    def test_very_long_filename(self):
        """Test files with very long filenames."""
        photo = create_test_photo(owner=self.user)

        long_name = "IMG_" + "a" * 200
        jpeg_file = self._create_file(f"/photos/{long_name}.jpg", File.IMAGE)
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)

        raw_file = self._create_file(f"/photos/{long_name}.CR2", File.RAW_FILE)
        photo.files.add(raw_file)
        photo.save()

        self.assertEqual(photo.files.count(), 2)

    def test_whitespace_in_path(self):
        """Test files with whitespace in path."""
        photo = create_test_photo(owner=self.user)

        jpeg_file = self._create_file("/photos/My Photos/IMG 001.jpg", File.IMAGE)
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)

        raw_file = self._create_file("/photos/My Photos/IMG 001.CR2", File.RAW_FILE)
        photo.files.add(raw_file)
        photo.save()

        self.assertEqual(photo.files.count(), 2)

    def test_deeply_nested_path(self):
        """Test files in deeply nested directories."""
        photo = create_test_photo(owner=self.user)

        deep_path = "/photos" + "/subdir" * 50
        jpeg_file = self._create_file(f"{deep_path}/IMG_001.jpg", File.IMAGE)
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)

        raw_file = self._create_file(f"{deep_path}/IMG_001.CR2", File.RAW_FILE)
        photo.files.add(raw_file)
        photo.save()

        self.assertEqual(photo.files.count(), 2)


class MalformedRulesEdgeCasesTestCase(TestCase):
    """Edge cases for malformed burst detection rules."""

    def setUp(self):
        self.user = create_test_user()

    def test_invalid_json_string_rules(self):
        """Test detection with invalid JSON in burst_detection_rules."""
        self.user.burst_detection_rules = "not valid json {"
        self.user.save()

        # Should handle gracefully (json.loads will fail)
        with self.assertRaises(json.JSONDecodeError):
            detect_burst_sequences(self.user)

    def test_rules_as_dict_instead_of_list(self):
        """Test detection when rules are stored as dict instead of list."""
        self.user.burst_detection_rules = json.dumps({"rule1": {"enabled": True}})
        self.user.save()

        # as_rules expects a list, dict should cause issues
        # This tests if the code handles this gracefully
        try:
            count = detect_burst_sequences(self.user)
            # If it doesn't crash, it should return 0 (no valid rules)
            self.assertEqual(count, 0)
        except (TypeError, AttributeError):
            # This is expected if the code doesn't handle dict input
            pass

    def test_rules_with_missing_required_fields(self):
        """Test detection with rules missing required fields."""
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    # Missing: name, rule_type, category, enabled
                }
            ]
        )
        self.user.save()

        # Should handle gracefully
        try:
            count = detect_burst_sequences(self.user)
            self.assertEqual(count, 0)
        except (KeyError, AttributeError):
            # Expected if code doesn't validate input
            pass

    def test_rules_with_unknown_rule_type(self):
        """Test detection with unknown rule_type."""
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "Unknown Rule",
                    "rule_type": "unknown_nonexistent_type",
                    "category": "hard",
                    "enabled": True,
                }
            ]
        )
        self.user.save()

        # Should handle gracefully - unknown rule types should be skipped
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)


class BatchDetectionEdgeCasesTestCase(TestCase):
    """Edge cases for batch_detect_stacks."""

    def setUp(self):
        self.user = create_test_user()
        self.user.burst_detection_rules = json.dumps([])
        self.user.save()

    def test_partial_options(self):
        """Test batch detection with partial options dict."""
        # Only specify some options
        options = {"detect_bursts": False}

        with patch("api.stack_detection.detect_burst_sequences") as mock_burst:
            mock_burst.return_value = 0

            batch_detect_stacks(self.user, options=options)

            # Burst should not be called (explicitly disabled)
            mock_burst.assert_not_called()

    def test_empty_options_dict(self):
        """Test batch detection with empty options dict."""
        with patch("api.stack_detection.detect_burst_sequences") as mock_burst:
            mock_burst.return_value = 0

            batch_detect_stacks(self.user, options={})

            # Burst should be called with defaults (True)
            mock_burst.assert_called_once()

    @patch("api.stack_detection.detect_burst_sequences")
    def test_exception_in_detector(self, mock_burst):
        """Test that exception in detector fails job properly."""
        mock_burst.side_effect = Exception("Burst detection crashed")

        with self.assertRaises(Exception):
            batch_detect_stacks(self.user)

        # Job should exist and be marked as failed
        jobs = LongRunningJob.objects.filter(started_by=self.user)
        self.assertEqual(jobs.count(), 1)


class ClearStacksEdgeCasesTestCase(TestCase):
    """Edge cases for clear_stacks_of_type."""

    def setUp(self):
        self.user = create_test_user()

    def test_clear_with_photo_in_multiple_stacks(self):
        """Test clearing when a photo is in multiple stacks of different types."""
        photo = create_test_photo(owner=self.user)

        # Add photo to burst stack
        burst_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        burst_stack.photos.add(photo)

        # Add same photo to manual stack
        manual_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        manual_stack.photos.add(photo)

        # Clear only burst stacks
        clear_stacks_of_type(self.user, PhotoStack.StackType.BURST_SEQUENCE)

        # Photo should still be in manual stack
        photo.refresh_from_db()
        self.assertEqual(photo.stacks.count(), 1)
        self.assertEqual(photo.stacks.first().stack_type, PhotoStack.StackType.MANUAL)

    def test_clear_with_many_stacks(self):
        """Test clearing a large number of stacks."""
        # Create 100 stacks
        for i in range(100):
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            )
            photo1 = create_test_photo(owner=self.user)
            photo2 = create_test_photo(owner=self.user)
            stack.photos.add(photo1, photo2)

        count = clear_stacks_of_type(self.user, PhotoStack.StackType.BURST_SEQUENCE)

        self.assertEqual(count, 100)
        self.assertEqual(
            PhotoStack.objects.filter(
                owner=self.user,
                stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            ).count(),
            0,
        )


class SequenceTimestampEdgeCasesTestCase(TestCase):
    """Edge cases for sequence_start/sequence_end handling in burst stacks."""

    def setUp(self):
        self.user = create_test_user()

    def test_burst_stack_with_none_timestamps(self):
        """Test burst stack creation when photos have None exif_timestamp."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo1.exif_timestamp = None
        photo2.exif_timestamp = None
        photo1.save()
        photo2.save()

        # Create burst stack with None timestamps
        stack = _create_burst_stack(self.user, [photo1, photo2])

        # Should still create stack, sequence timestamps will be None
        self.assertIsNotNone(stack)
        self.assertIsNone(stack.sequence_start)
        self.assertIsNone(stack.sequence_end)

    def test_create_or_merge_updates_sequence_timestamps(self):
        """Test that create_or_merge properly extends sequence timestamps."""
        from django.utils import timezone

        base_time = timezone.now()

        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo1.exif_timestamp = base_time
        photo2.exif_timestamp = base_time + timedelta(seconds=1)
        photo1.save()
        photo2.save()

        # Create initial stack
        stack = PhotoStack.create_or_merge(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            photos=[photo1, photo2],
            sequence_start=base_time,
            sequence_end=base_time + timedelta(seconds=1),
        )

        # Create third photo with earlier timestamp
        photo3 = create_test_photo(owner=self.user)
        photo3.exif_timestamp = base_time - timedelta(seconds=1)
        photo3.save()

        # Merge with earlier timestamp
        stack = PhotoStack.create_or_merge(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            photos=[photo1, photo3],  # photo1 already in stack
            sequence_start=base_time - timedelta(seconds=1),
            sequence_end=base_time,
        )

        stack.refresh_from_db()
        # sequence_start should be updated to earlier time
        self.assertEqual(stack.sequence_start, base_time - timedelta(seconds=1))


class FilenamePatternEdgeCasesTestCase(TestCase):
    """Edge cases for filename pattern matching in detection."""

    def setUp(self):
        self.user = create_test_user()
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "Filename Pattern",
                    "rule_type": "filename_pattern",
                    "category": "hard",
                    "enabled": True,
                    "pattern": r"^IMG_(\d+)_BURST(\d+)\.jpg$",
                    "group_by": "burst_id",
                }
            ]
        )
        self.user.save()

    def _create_file(self, path, file_type=File.IMAGE):
        """Helper to create a File object."""
        return File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path=path,
            type=file_type,
        )

    def _create_photo_with_file(self, path, **kwargs):
        """Helper to create Photo with associated File."""
        file = self._create_file(path, File.IMAGE)
        photo = create_test_photo(owner=self.user, **kwargs)
        photo.main_file = file
        photo.save()
        return photo

    def test_regex_pattern_special_chars(self):
        """Test filename pattern with special regex characters."""
        self.user.burst_detection_rules = json.dumps(
            [
                {
                    "id": 1,
                    "name": "Pattern with brackets",
                    "rule_type": "filename_pattern",
                    "category": "hard",
                    "enabled": True,
                    "pattern": r"^IMG_\[(\d+)\]\.jpg$",
                    "group_by": "photo_id",
                }
            ]
        )
        self.user.save()

        # Create two photos with different paths that both match the bracket pattern
        _photo1 = self._create_photo_with_file("/photos/IMG_[001].jpg")
        _photo2 = self._create_photo_with_file(
            "/photos/IMG_[002].jpg"
        )  # Different path, same pattern

        # Should not crash on regex special characters
        count = detect_burst_sequences(self.user)
        self.assertGreaterEqual(count, 0)

    def test_empty_filename(self):
        """Test handling of empty filename (edge case)."""
        # Create photo with empty filename component
        file = File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path="/photos/",  # Just directory, no filename
            type=File.IMAGE,
        )
        photo = create_test_photo(owner=self.user)
        photo.main_file = file
        photo.save()

        # Should handle gracefully
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)


================================================
FILE: api/tests/test_stack_detection_logic.py
================================================
"""
Comprehensive tests for Stack Detection Logic.

NOTE: RAW+JPEG pairs and Live Photos are now handled as file variants
during scan (Photo.files ManyToMany field), not as stacks.
See test_file_variants.py for file variant tests.

Tests cover:
- clear_stacks_of_type: Clearing stacks before re-detection
- detect_burst_sequences: Burst sequence detection with rules
- batch_detect_stacks: Batch detection orchestration
- Edge cases and error handling
"""

import json
import uuid
from datetime import datetime, timedelta
from unittest.mock import patch

from django.test import TestCase

from api.models.file import File
from api.models.photo_stack import PhotoStack
from api.models.long_running_job import LongRunningJob
from api.stack_detection import (
    clear_stacks_of_type,
    detect_burst_sequences,
    batch_detect_stacks,
    _create_burst_stack,
)
from api.directory_watcher import JPEG_EXTENSIONS
from api.tests.utils import create_test_photo, create_test_user


class ClearStacksTestCase(TestCase):
    """Tests for clear_stacks_of_type function."""

    def setUp(self):
        self.user = create_test_user()
        self.other_user = create_test_user()

    def test_clear_stacks_removes_all_of_type(self):
        """Test clearing removes all stacks of specific type."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        photo4 = create_test_photo(owner=self.user)
        
        # Create stacks of different types
        burst_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        burst_stack.photos.add(photo1, photo2)
        
        manual_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        manual_stack.photos.add(photo3, photo4)
        
        # Clear only burst stacks
        count = clear_stacks_of_type(self.user, PhotoStack.StackType.BURST_SEQUENCE)
        
        self.assertEqual(count, 1)
        self.assertFalse(PhotoStack.objects.filter(
            owner=self.user, stack_type=PhotoStack.StackType.BURST_SEQUENCE
        ).exists())
        # Manual stack should still exist
        self.assertTrue(PhotoStack.objects.filter(
            owner=self.user, stack_type=PhotoStack.StackType.MANUAL
        ).exists())

    def test_clear_stacks_unlinks_photos(self):
        """Test clearing unlinks photos from stacks."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(photo1, photo2)
        
        self.assertEqual(photo1.stacks.count(), 1)
        
        clear_stacks_of_type(self.user, PhotoStack.StackType.BURST_SEQUENCE)
        
        photo1.refresh_from_db()
        self.assertEqual(photo1.stacks.count(), 0)

    def test_clear_stacks_only_affects_user(self):
        """Test clearing only affects specified user's stacks."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        other_photo1 = create_test_photo(owner=self.other_user)
        other_photo2 = create_test_photo(owner=self.other_user)
        
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack1.photos.add(photo1, photo2)
        
        stack2 = PhotoStack.objects.create(
            owner=self.other_user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack2.photos.add(other_photo1, other_photo2)
        
        clear_stacks_of_type(self.user, PhotoStack.StackType.BURST_SEQUENCE)
        
        # User's stack deleted
        self.assertFalse(PhotoStack.objects.filter(pk=stack1.pk).exists())
        # Other user's stack remains
        self.assertTrue(PhotoStack.objects.filter(pk=stack2.pk).exists())

    def test_clear_stacks_returns_zero_if_none(self):
        """Test clearing returns 0 if no stacks of type exist."""
        count = clear_stacks_of_type(self.user, PhotoStack.StackType.BURST_SEQUENCE)
        self.assertEqual(count, 0)


class BurstDetectionTestCase(TestCase):
    """Tests for burst sequence detection."""

    def setUp(self):
        self.user = create_test_user()
        # Set up default burst rules using correct format
        self.user.burst_detection_rules = json.dumps([
            {
                "id": 1,
                "name": "Test EXIF Burst",
                "rule_type": "exif_burst_mode",
                "category": "hard",
                "enabled": True,
            },
            {
                "id": 2,
                "name": "Test Timestamp",
                "rule_type": "timestamp_proximity",
                "category": "soft",
                "enabled": True,
                "interval_ms": 2000
            }
        ])
        self.user.save()

    def _create_file(self, path, file_type=File.IMAGE):
        """Helper to create a File object."""
        return File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path=path,
            type=file_type,
        )

    def _create_photo_with_timestamp(self, timestamp, **kwargs):
        """Helper to create Photo with specific timestamp."""
        photo = create_test_photo(owner=self.user, **kwargs)
        photo.exif_timestamp = timestamp
        file = self._create_file(f"/photos/IMG_{photo.pk}.jpg")
        photo.main_file = file
        photo.save()
        return photo

    def test_no_rules_returns_zero(self):
        """Test no burst detection when rules are empty."""
        self.user.burst_detection_rules = json.dumps([])
        self.user.save()
        
        _photo1 = self._create_photo_with_timestamp(datetime(2024, 1, 1, 12, 0, 0))
        _photo2 = self._create_photo_with_timestamp(datetime(2024, 1, 1, 12, 0, 1))
        
        count = detect_burst_sequences(self.user)
        
        self.assertEqual(count, 0)

    def test_disabled_rules_ignored(self):
        """Test disabled rules are not used."""
        self.user.burst_detection_rules = json.dumps([
            {
                "id": 1,
                "name": "Disabled rule",
                "rule_type": "timestamp_proximity",
                "category": "soft",
                "enabled": False,
                "interval_ms": 5000
            }
        ])
        self.user.save()
        
        _photo1 = self._create_photo_with_timestamp(datetime(2024, 1, 1, 12, 0, 0))
        _photo2 = self._create_photo_with_timestamp(datetime(2024, 1, 1, 12, 0, 1))
        
        count = detect_burst_sequences(self.user)
        
        self.assertEqual(count, 0)

    def test_clears_existing_burst_stacks(self):
        """Test existing burst stacks are cleared before re-detection."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        old_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        old_stack.photos.add(photo1, photo2)
        
        detect_burst_sequences(self.user)
        
        self.assertFalse(PhotoStack.objects.filter(pk=old_stack.pk).exists())

    def test_skip_hidden_photos(self):
        """Test hidden photos are excluded from burst detection."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        _photo1 = self._create_photo_with_timestamp(base_time, hidden=True)
        _photo2 = self._create_photo_with_timestamp(base_time + timedelta(seconds=1))
        
        count = detect_burst_sequences(self.user)
        
        self.assertEqual(count, 0)

    def test_skip_trashed_photos(self):
        """Test trashed photos are excluded from burst detection."""
        base_time = datetime(2024, 1, 1, 12, 0, 0)
        _photo1 = self._create_photo_with_timestamp(base_time, in_trashcan=True)
        _photo2 = self._create_photo_with_timestamp(base_time + timedelta(seconds=1))
        
        count = detect_burst_sequences(self.user)
        
        self.assertEqual(count, 0)


class CreateBurstStackTestCase(TestCase):
    """Tests for _create_burst_stack helper."""

    def setUp(self):
        self.user = create_test_user()

    def test_requires_minimum_two_photos(self):
        """Test stack not created with less than 2 photos."""
        photo = create_test_photo(owner=self.user)
        
        stack = _create_burst_stack(self.user, [photo])
        
        self.assertIsNone(stack)

    def test_creates_stack_with_two_photos(self):
        """Test stack created with exactly 2 photos."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo1.exif_timestamp = datetime(2024, 1, 1, 12, 0, 0)
        photo2.exif_timestamp = datetime(2024, 1, 1, 12, 0, 1)
        photo1.save()
        photo2.save()
        
        stack = _create_burst_stack(self.user, [photo1, photo2])
        
        self.assertIsNotNone(stack)
        self.assertEqual(stack.stack_type, PhotoStack.StackType.BURST_SEQUENCE)
        self.assertEqual(stack.photos.count(), 2)

    def test_skips_already_stacked_photos(self):
        """Test photos already in burst stack are skipped."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        # Add photo1 to existing burst stack
        existing_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        existing_stack.photos.add(photo1, photo2)
        
        # Try to create new stack with photo1 and photo3
        stack = _create_burst_stack(self.user, [photo1, photo3])
        
        # photo1 is filtered out, photo3 remains = 1 photo < 2, no stack created
        self.assertIsNone(stack)


class BatchDetectStacksTestCase(TestCase):
    """Tests for batch_detect_stacks orchestration."""

    def setUp(self):
        self.user = create_test_user()
        self.user.burst_detection_rules = json.dumps([])
        self.user.save()

    @patch('api.stack_detection.detect_burst_sequences')
    def test_calls_burst_detector_by_default(self, mock_burst):
        """Test burst detector called with default options."""
        mock_burst.return_value = 3
        
        batch_detect_stacks(self.user)
        
        mock_burst.assert_called_once()

    @patch('api.stack_detection.detect_burst_sequences')
    def test_respects_options(self, mock_burst):
        """Test options control which detectors run."""
        mock_burst.return_value = 0
        
        batch_detect_stacks(self.user, options={
            'detect_bursts': False,
        })
        
        mock_burst.assert_not_called()

    @patch('api.stack_detection.detect_burst_sequences')
    def test_creates_job(self, mock_burst):
        """Test LongRunningJob created for tracking."""
        mock_burst.return_value = 0
        
        batch_detect_stacks(self.user)
        
        job = LongRunningJob.objects.filter(
            started_by=self.user,
            job_type=LongRunningJob.JOB_SCAN_PHOTOS,
        ).first()
        self.assertIsNotNone(job)

    @patch('api.stack_detection.detect_burst_sequences')
    def test_handles_exception(self, mock_burst):
        """Test exception handling during detection."""
        mock_burst.side_effect = Exception("Detection failed")
        
        with self.assertRaises(Exception):
            batch_detect_stacks(self.user)
        
        # Job should be marked as failed
        job = LongRunningJob.objects.filter(
            started_by=self.user,
        ).first()
        self.assertIsNotNone(job)


class FileExtensionsTestCase(TestCase):
    """Tests for file extension handling in directory_watcher."""

    def test_jpeg_extensions_included(self):
        """Test JPEG and HEIC extensions are included."""
        expected = ['.jpg', '.jpeg', '.heic', '.heif']
        for ext in expected:
            self.assertIn(ext, JPEG_EXTENSIONS, f"{ext} should be in JPEG_EXTENSIONS")

    def test_extensions_are_lowercase(self):
        """Test all JPEG extensions are lowercase."""
        for ext in JPEG_EXTENSIONS:
            self.assertEqual(ext, ext.lower(), f"{ext} should be lowercase")


class EdgeCasesTestCase(TestCase):
    """Edge case tests for stack detection."""

    def setUp(self):
        self.user = create_test_user()

    def test_photo_without_main_file(self):
        """Test photos without main_file are handled gracefully."""
        photo = create_test_photo(owner=self.user)
        photo.main_file = None
        photo.save()
        
        # Set up rules to trigger detection
        self.user.burst_detection_rules = json.dumps([
            {
                "id": 1,
                "name": "Test Timestamp",
                "rule_type": "timestamp_proximity",
                "category": "soft",
                "enabled": True,
                "interval_ms": 2000
            }
        ])
        self.user.save()
        
        # Should not raise
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)

    def test_empty_photo_library(self):
        """Test detection on empty library."""
        self.user.burst_detection_rules = json.dumps([
            {
                "id": 1,
                "name": "Test Timestamp",
                "rule_type": "timestamp_proximity",
                "category": "soft",
                "enabled": True,
                "interval_ms": 2000
            }
        ])
        self.user.save()
        
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)

    def test_burst_rules_as_string(self):
        """Test burst_detection_rules stored as JSON string."""
        self.user.burst_detection_rules = '[]'  # Empty JSON string
        self.user.save()
        
        count = detect_burst_sequences(self.user)
        self.assertEqual(count, 0)


class FileVariantTestCase(TestCase):
    """
    Tests for file variant handling (RAW+JPEG, Live Photos).
    
    File variants are now stored via Photo.files ManyToMany field,
    not as stacks. These tests verify the data model works correctly.
    """

    def setUp(self):
        self.user = create_test_user()

    def _create_file(self, path, file_type=File.IMAGE):
        """Helper to create a File object."""
        return File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path=path,
            type=file_type,
        )

    def test_photo_with_raw_variant(self):
        """Test a photo can have a RAW file variant."""
        photo = create_test_photo(owner=self.user)
        
        # Add JPEG as main file
        jpeg_file = self._create_file("/photos/IMG_001.jpg", File.IMAGE)
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file)
        
        # Add RAW variant
        raw_file = self._create_file("/photos/IMG_001.CR2", File.RAW_FILE)
        photo.files.add(raw_file)
        photo.save()
        
        # Verify
        self.assertEqual(photo.files.count(), 2)
        self.assertTrue(photo.files.filter(type=File.RAW_FILE).exists())
        self.assertTrue(photo.files.filter(type=File.IMAGE).exists())

    def test_photo_with_live_photo_video(self):
        """Test a photo can have a video variant (Live Photo)."""
        photo = create_test_photo(owner=self.user)
        
        # Add HEIC as main file
        heic_file = self._create_file("/photos/IMG_001.heic", File.IMAGE)
        photo.main_file = heic_file
        photo.files.add(heic_file)
        
        # Add video variant
        video_file = self._create_file("/photos/IMG_001.mov", File.VIDEO)
        photo.files.add(video_file)
        photo.save()
        
        # Verify
        self.assertEqual(photo.files.count(), 2)
        self.assertTrue(photo.files.filter(type=File.VIDEO).exists())
        self.assertTrue(photo.files.filter(type=File.IMAGE).exists())

    def test_photo_with_all_variant_types(self):
        """Test a photo can have image, RAW, and video variants."""
        photo = create_test_photo(owner=self.user)
        
        # Add all variant types
        jpeg_file = self._create_file("/photos/IMG_001.jpg", File.IMAGE)
        raw_file = self._create_file("/photos/IMG_001.CR2", File.RAW_FILE)
        video_file = self._create_file("/photos/IMG_001.mov", File.VIDEO)
        
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file, raw_file, video_file)
        photo.save()
        
        # Verify
        self.assertEqual(photo.files.count(), 3)
        file_types = set(photo.files.values_list('type', flat=True))
        self.assertEqual(file_types, {File.IMAGE, File.RAW_FILE, File.VIDEO})

    def test_file_variant_vs_stack(self):
        """Test that file variants are separate from stacks."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Add file variant to photo1
        jpeg_file = self._create_file("/photos/IMG_001.jpg", File.IMAGE)
        raw_file = self._create_file("/photos/IMG_001.CR2", File.RAW_FILE)
        photo1.main_file = jpeg_file
        photo1.files.add(jpeg_file, raw_file)
        photo1.save()
        
        # Add photo1 and photo2 to a burst stack
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(photo1, photo2)
        
        # Photo1 has 2 file variants AND is in a stack
        self.assertEqual(photo1.files.count(), 2)
        self.assertEqual(photo1.stacks.count(), 1)
        
        # These are independent concepts
        self.assertNotEqual(photo1.files.count(), photo1.stacks.count())

    def test_special_characters_in_filename(self):
        """Test files with special characters in names."""
        photo = create_test_photo(owner=self.user)
        
        jpeg_file = self._create_file("/photos/IMG (1) - Copy.jpg", File.IMAGE)
        raw_file = self._create_file("/photos/IMG (1) - Copy.CR2", File.RAW_FILE)
        
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file, raw_file)
        photo.save()
        
        self.assertEqual(photo.files.count(), 2)

    def test_unicode_in_filename(self):
        """Test files with unicode characters in names."""
        photo = create_test_photo(owner=self.user)
        
        jpeg_file = self._create_file("/photos/фото_001.jpg", File.IMAGE)
        raw_file = self._create_file("/photos/фото_001.CR2", File.RAW_FILE)
        
        photo.main_file = jpeg_file
        photo.files.add(jpeg_file, raw_file)
        photo.save()
        
        self.assertEqual(photo.files.count(), 2)

    def test_progress_callback_called(self):
        """Test progress callback is called during burst detection."""
        self.user.burst_detection_rules = json.dumps([
            {
                "id": 1,
                "name": "Test Timestamp",
                "rule_type": "timestamp_proximity",
                "category": "soft",
                "enabled": True,
                "interval_ms": 2000
            }
        ])
        self.user.save()
        
        file = File.objects.create(
            hash=str(uuid.uuid4())[:32],
            path="/photos/IMG_001.jpg",
            type=File.IMAGE,
        )
        photo = create_test_photo(owner=self.user)
        photo.main_file = file
        photo.exif_timestamp = datetime(2024, 1, 1, 12, 0, 0)
        photo.save()
        
        callback_calls = []
        
        def progress_callback(current, total, found):
            callback_calls.append((current, total, found))
        
        detect_burst_sequences(self.user, progress_callback=progress_callback)
        
        # Callback should be called at least once (for index 0) or not at all if no hard rules
        self.assertGreaterEqual(len(callback_calls), 0)


================================================
FILE: api/tests/test_stack_duplicate_integration.py
================================================
"""
Integration tests for interactions between Stacks and Duplicates.

Tests edge cases where photos belong to both stacks and duplicate groups:
- Photo in stack is also part of duplicate group
- Resolving duplicate trashes stack's primary photo
- Deleting stack affects duplicate group
- Concurrent operations on same photos
- Multi-user isolation
"""


from django.test import TestCase
from django.utils import timezone

from api.models.duplicate import Duplicate
from api.models.file import File
from api.models.photo import Photo
from api.models.photo_stack import PhotoStack
from api.models.user import User


class PhotoInBothStackAndDuplicateTestCase(TestCase):
    """Tests for photos that are in both a stack and a duplicate group."""

    def setUp(self):
        """Create test user and photos."""
        self.user = User.objects.create(username="integrationtest")
        self.photos = self._create_photos(4)

    def _create_photos(self, count):
        """Helper to create multiple photos."""
        photos = []
        for i in range(count):
            file = File.objects.create(
                hash=f"integ{i}" + "a" * 27,
                path=f"/photos/integration_{i}.jpg",
                type=File.IMAGE,
            )
            photo = Photo.objects.create(
                owner=self.user,
                main_file=file,
                image_hash=f"integ{i}" + "b" * 27,
                added_on=timezone.now(),
                in_trashcan=False,
            )
            photos.append(photo)
        return photos

    def test_photo_can_be_in_stack_and_duplicate_simultaneously(self):
        """Photo should be able to belong to both a stack and duplicate group."""
        # Create stack with first two photos
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        self.photos[0].stacks.add(stack)
        self.photos[1].stacks.add(stack)

        # Create duplicate group with first and third photos
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        self.photos[0].duplicates.add(duplicate)
        self.photos[2].duplicates.add(duplicate)

        # Verify photo 0 is in both
        self.assertEqual(self.photos[0].stacks.count(), 1)
        self.assertEqual(self.photos[0].duplicates.count(), 1)

        # Verify stack and duplicate are independent
        self.assertEqual(stack.photos.count(), 2)
        self.assertEqual(duplicate.photos.count(), 2)

    def test_resolving_duplicate_trashes_stacked_photo(self):
        """Resolving duplicate should trash photo even if it's in a stack."""
        # Photo 0 and 1 are in a stack
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            primary_photo=self.photos[0],
        )
        self.photos[0].stacks.add(stack)
        self.photos[1].stacks.add(stack)

        # Photo 0 and 2 are duplicates
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.photos[0].duplicates.add(duplicate)
        self.photos[2].duplicates.add(duplicate)

        # Resolve duplicate, keeping photo 2 (trash photo 0)
        duplicate.resolve(self.photos[2], trash_others=True)

        # Photo 0 should be trashed
        self.photos[0].refresh_from_db()
        self.assertTrue(self.photos[0].in_trashcan)

        # Photo 0 should still be in stack (not removed)
        self.assertEqual(self.photos[0].stacks.count(), 1)

        # Stack should still have both photos (ManyToMany not affected by trash)
        self.assertEqual(stack.photos.count(), 2)

    def test_resolving_duplicate_trashes_stack_primary(self):
        """What happens when duplicate resolution trashes the stack's primary photo."""
        # Photo 0 is stack primary
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            primary_photo=self.photos[0],
        )
        self.photos[0].stacks.add(stack)
        self.photos[1].stacks.add(stack)

        # Photo 0 and 2 are duplicates
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.photos[0].duplicates.add(duplicate)
        self.photos[2].duplicates.add(duplicate)

        # Resolve keeping photo 2, trashing photo 0 (the stack primary)
        duplicate.resolve(self.photos[2], trash_others=True)

        # Stack's primary is now trashed - this is a potential issue
        stack.refresh_from_db()
        self.assertTrue(stack.primary_photo.in_trashcan)

        # Note: The system allows this - the UI should handle showing appropriate warning

    def test_deleting_stack_does_not_affect_duplicate(self):
        """Deleting a stack should not affect duplicate group membership."""
        # Photo in both stack and duplicate
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photos[0].stacks.add(stack)

        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        self.photos[0].duplicates.add(duplicate)
        self.photos[1].duplicates.add(duplicate)

        # Delete the stack
        stack.delete()

        # Photo should still be in duplicate group
        self.photos[0].refresh_from_db()
        self.assertEqual(self.photos[0].duplicates.count(), 1)
        self.assertEqual(duplicate.photos.count(), 2)

    def test_dismissing_duplicate_does_not_affect_stack(self):
        """Dismissing duplicate group should not affect stack membership."""
        # Photo in both
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        self.photos[0].stacks.add(stack)
        self.photos[1].stacks.add(stack)

        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        self.photos[0].duplicates.add(duplicate)
        self.photos[2].duplicates.add(duplicate)

        # Dismiss the duplicate
        duplicate.dismiss()

        # Photo should still be in stack
        self.photos[0].refresh_from_db()
        self.assertEqual(self.photos[0].stacks.count(), 1)
        self.assertEqual(stack.photos.count(), 2)


class PhotoDeletionCascadeTestCase(TestCase):
    """Tests for photo deletion effects on stacks and duplicates."""

    def setUp(self):
        """Create test user and photos."""
        self.user = User.objects.create(username="deletiontest")

    def _create_photo(self, suffix):
        """Create a single photo."""
        file = File.objects.create(
            hash=f"del{suffix}" + "a" * 28,
            path=f"/photos/delete_{suffix}.jpg",
            type=File.IMAGE,
        )
        return Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash=f"del{suffix}" + "b" * 28,
            added_on=timezone.now(),
        )

    def test_deleting_photo_removes_from_stack(self):
        """Deleting photo should remove it from associated stacks."""
        photo1 = self._create_photo("1")
        photo2 = self._create_photo("2")

        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo1.stacks.add(stack)
        photo2.stacks.add(stack)

        self.assertEqual(stack.photos.count(), 2)

        # Delete photo1
        photo1.delete()

        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 1)
        self.assertEqual(stack.photos.first(), photo2)

    def test_deleting_photo_removes_from_duplicate(self):
        """Deleting photo should remove it from associated duplicate groups."""
        photo1 = self._create_photo("3")
        photo2 = self._create_photo("4")

        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        photo1.duplicates.add(duplicate)
        photo2.duplicates.add(duplicate)

        self.assertEqual(duplicate.photos.count(), 2)

        # Delete photo1
        photo1.delete()

        duplicate.refresh_from_db()
        self.assertEqual(duplicate.photos.count(), 1)

    def test_deleting_stack_primary_sets_to_null(self):
        """Deleting stack's primary photo should set primary_photo to NULL."""
        photo1 = self._create_photo("5")
        photo2 = self._create_photo("6")

        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        photo1.stacks.add(stack)
        photo2.stacks.add(stack)

        # Delete the primary photo
        photo1.delete()

        stack.refresh_from_db()
        self.assertIsNone(stack.primary_photo)
        self.assertEqual(stack.photos.count(), 1)

    def test_deleting_kept_photo_sets_to_null(self):
        """Deleting duplicate's kept_photo should set kept_photo to NULL."""
        photo1 = self._create_photo("7")
        photo2 = self._create_photo("8")

        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            kept_photo=photo1,
        )
        photo1.duplicates.add(duplicate)
        photo2.duplicates.add(duplicate)

        # Delete the kept photo
        photo1.delete()

        duplicate.refresh_from_db()
        self.assertIsNone(duplicate.kept_photo)


class MultiUserIsolationTestCase(TestCase):
    """Tests for proper isolation between users."""

    def setUp(self):
        """Create two test users."""
        self.user1 = User.objects.create(username="user1")
        self.user2 = User.objects.create(username="user2")

    def _create_photo_for_user(self, user, suffix):
        """Create a photo for a specific user."""
        file = File.objects.create(
            hash=f"usr{suffix}" + "a" * 28,
            path=f"/photos/user_{suffix}.jpg",
            type=File.IMAGE,
        )
        return Photo.objects.create(
            owner=user,
            main_file=file,
            image_hash=f"usr{suffix}" + "b" * 28,
            added_on=timezone.now(),
        )

    def test_users_cannot_share_stacks(self):
        """Users should not be able to add photos to another user's stack."""
        photo1 = self._create_photo_for_user(self.user1, "1")
        photo2 = self._create_photo_for_user(self.user2, "2")

        stack = PhotoStack.objects.create(
            owner=self.user1,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo1.stacks.add(stack)

        # Attempt to add user2's photo to user1's stack
        # The ManyToMany doesn't enforce this at DB level, but API should
        photo2.stacks.add(stack)  # This succeeds at DB level

        # Stack contains both photos (no DB-level enforcement)
        self.assertEqual(stack.photos.count(), 2)

        # Note: This is a potential issue - API layer should validate owner

    def test_duplicate_detection_scoped_to_user(self):
        """Duplicate groups should be scoped to owner."""
        photo1 = self._create_photo_for_user(self.user1, "3")
        
        dup1 = Duplicate.objects.create(
            owner=self.user1,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        photo1.duplicates.add(dup1)

        # User2's duplicates should be separate
        photo2 = self._create_photo_for_user(self.user2, "4")
        dup2 = Duplicate.objects.create(
            owner=self.user2,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        photo2.duplicates.add(dup2)

        # Each user should have their own duplicate
        self.assertEqual(Duplicate.objects.filter(owner=self.user1).count(), 1)
        self.assertEqual(Duplicate.objects.filter(owner=self.user2).count(), 1)


class StackMergeWithDuplicatesTestCase(TestCase):
    """Tests for stack merging when photos are also in duplicates."""

    def setUp(self):
        """Create test user and photos."""
        self.user = User.objects.create(username="mergetest")
        self.photos = []
        for i in range(4):
            file = File.objects.create(
                hash=f"mrg{i}" + "a" * 28,
                path=f"/photos/merge_{i}.jpg",
                type=File.IMAGE,
            )
            photo = Photo.objects.create(
                owner=self.user,
                main_file=file,
                image_hash=f"mrg{i}" + "b" * 28,
                added_on=timezone.now(),
            )
            self.photos.append(photo)

    def test_merging_stacks_preserves_duplicate_membership(self):
        """Merging stacks should not affect duplicate group membership."""
        # Stack 1 with photo 0, 1
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photos[0].stacks.add(stack1)
        self.photos[1].stacks.add(stack1)

        # Stack 2 with photo 2, 3
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        self.photos[2].stacks.add(stack2)
        self.photos[3].stacks.add(stack2)

        # Photo 1 and 2 are duplicates
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        self.photos[1].duplicates.add(duplicate)
        self.photos[2].duplicates.add(duplicate)

        # Merge stack2 into stack1
        stack1.merge_with(stack2)

        # All photos should be in stack1
        self.assertEqual(stack1.photos.count(), 4)

        # Duplicate membership should be preserved
        self.assertEqual(self.photos[1].duplicates.count(), 1)
        self.assertEqual(self.photos[2].duplicates.count(), 1)
        self.assertEqual(duplicate.photos.count(), 2)


class PhotoInMultipleStacksTestCase(TestCase):
    """Tests for photos that are in multiple stacks."""

    def setUp(self):
        """Create test user and photos."""
        self.user = User.objects.create(username="multistacktest")

    def _create_photo(self, suffix):
        """Create a single photo."""
        file = File.objects.create(
            hash=f"multi{suffix}" + "a" * 26,
            path=f"/photos/multi_{suffix}.jpg",
            type=File.IMAGE,
        )
        return Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash=f"multi{suffix}" + "b" * 26,
            added_on=timezone.now(),
        )

    def test_photo_can_be_in_multiple_stacks(self):
        """Photo should be able to belong to multiple stacks."""
        photo = self._create_photo("1")

        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
        )
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )

        photo.stacks.add(stack1)
        photo.stacks.add(stack2)

        self.assertEqual(photo.stacks.count(), 2)

    def test_photo_can_be_primary_in_multiple_stacks(self):
        """Photo can be primary photo for multiple stacks."""
        photo = self._create_photo("2")

        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
            primary_photo=photo,
        )
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            primary_photo=photo,
        )

        photo.stacks.add(stack1)
        photo.stacks.add(stack2)

        self.assertEqual(stack1.primary_photo, photo)
        self.assertEqual(stack2.primary_photo, photo)

    def test_removing_photo_from_one_stack_preserves_others(self):
        """Removing from one stack should not affect other stacks."""
        photo = self._create_photo("3")

        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )

        photo.stacks.add(stack1)
        photo.stacks.add(stack2)

        # Remove from stack1
        photo.stacks.remove(stack1)

        # Should still be in stack2
        self.assertEqual(photo.stacks.count(), 1)
        self.assertIn(stack2, photo.stacks.all())


class DuplicateMergeWithStacksTestCase(TestCase):
    """Tests for duplicate merging when photos are also in stacks."""

    def setUp(self):
        """Create test user and photos."""
        self.user = User.objects.create(username="dupmergetest")
        self.photos = []
        for i in range(4):
            file = File.objects.create(
                hash=f"dpm{i}" + "a" * 28,
                path=f"/photos/dupmerge_{i}.jpg",
                type=File.IMAGE,
            )
            photo = Photo.objects.create(
                owner=self.user,
                main_file=file,
                image_hash=f"dpm{i}" + "b" * 28,
                added_on=timezone.now(),
            )
            self.photos.append(photo)

    def test_merging_duplicates_preserves_stack_membership(self):
        """Merging duplicate groups should not affect stack membership."""
        # Photo 0, 1 are in a stack
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        self.photos[0].stacks.add(stack)
        self.photos[1].stacks.add(stack)

        # Dup1: photo 0, 2
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.photos[0].duplicates.add(dup1)
        self.photos[2].duplicates.add(dup1)

        # Dup2: photo 1, 3
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        self.photos[1].duplicates.add(dup2)
        self.photos[3].duplicates.add(dup2)

        # Merge dup2 into dup1
        dup1.merge_with(dup2)

        # Stack membership should be preserved
        self.assertEqual(stack.photos.count(), 2)
        self.assertEqual(self.photos[0].stacks.count(), 1)
        self.assertEqual(self.photos[1].stacks.count(), 1)


class EdgeCasesTestCase(TestCase):
    """Edge case tests for stack/duplicate integration."""

    def setUp(self):
        """Create test user."""
        self.user = User.objects.create(username="edgecasetest")

    def _create_photo(self, suffix):
        """Create a single photo."""
        file = File.objects.create(
            hash=f"edge{suffix}" + "a" * 26,
            path=f"/photos/edge_{suffix}.jpg",
            type=File.IMAGE,
        )
        return Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash=f"edge{suffix}" + "b" * 26,
            added_on=timezone.now(),
        )

    def test_empty_stack_and_duplicate(self):
        """Empty stack and duplicate should exist without photos."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )

        self.assertEqual(stack.photos.count(), 0)
        self.assertEqual(duplicate.photos.count(), 0)

    def test_single_photo_in_both(self):
        """Single photo can be only member of both stack and duplicate."""
        photo = self._create_photo("1")

        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo.stacks.add(stack)

        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        photo.duplicates.add(duplicate)

        self.assertEqual(stack.photos.count(), 1)
        self.assertEqual(duplicate.photos.count(), 1)

    def test_trashing_all_photos_in_stack(self):
        """Trashing all photos in stack should not delete the stack."""
        photo1 = self._create_photo("2")
        photo2 = self._create_photo("3")

        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo1.stacks.add(stack)
        photo2.stacks.add(stack)

        # Trash all photos
        photo1.in_trashcan = True
        photo1.save()
        photo2.in_trashcan = True
        photo2.save()

        # Stack should still exist
        self.assertTrue(PhotoStack.objects.filter(id=stack.id).exists())
        self.assertEqual(stack.photos.count(), 2)

    def test_photo_in_multiple_duplicate_groups(self):
        """Photo can be in multiple duplicate groups."""
        photo = self._create_photo("4")

        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )

        photo.duplicates.add(dup1)
        photo.duplicates.add(dup2)

        self.assertEqual(photo.duplicates.count(), 2)

    def test_resolving_duplicate_does_not_affect_other_duplicates(self):
        """Resolving one duplicate should not affect photo's other duplicates."""
        photo1 = self._create_photo("5")
        photo2 = self._create_photo("6")
        photo3 = self._create_photo("7")

        # photo1 is in two duplicate groups
        dup1 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        photo1.duplicates.add(dup1)
        photo2.duplicates.add(dup1)

        dup2 = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
        )
        photo1.duplicates.add(dup2)
        photo3.duplicates.add(dup2)

        # Resolve dup1, keeping photo1
        dup1.resolve(photo1, trash_others=True)

        # photo1 should still be in dup2
        photo1.refresh_from_db()
        self.assertEqual(photo1.duplicates.count(), 2)
        self.assertIn(dup2, photo1.duplicates.all())

    def test_cascade_effects_are_contained(self):
        """Operations on one group should not cascade unexpectedly."""
        photo1 = self._create_photo("8")
        photo2 = self._create_photo("9")

        # Create complex relationship
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            primary_photo=photo1,
        )
        photo1.stacks.add(stack)
        photo2.stacks.add(stack)

        duplicate = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            kept_photo=photo1,
        )
        photo1.duplicates.add(duplicate)
        photo2.duplicates.add(duplicate)

        # Delete the stack
        _stack_id = stack.id
        stack.delete()

        # Duplicate should be unaffected
        self.assertTrue(Duplicate.objects.filter(id=duplicate.id).exists())
        self.assertEqual(duplicate.photos.count(), 2)
        
        # Photos should still be in duplicate
        photo1.refresh_from_db()
        photo2.refresh_from_db()
        self.assertEqual(photo1.duplicates.count(), 1)
        self.assertEqual(photo2.duplicates.count(), 1)


================================================
FILE: api/tests/test_stack_review.py
================================================
"""
Comprehensive tests for api/models/stack_review.py

Tests the StackReview model for tracking user review decisions on stacks:
- Model creation and field validation
- Decision choices (PENDING, RESOLVED, DISMISSED)
- Resolve workflow (keep photo, trash others)
- Dismiss workflow (unlink photos)
- Revert workflow (restore trashed photos)
- Reviewable stack types logic

NOTE: With the new file variants architecture, no stack types are
reviewable because:
- exact_copy and visual_duplicate are handled by Duplicate model
- BURST_SEQUENCE, EXPOSURE_BRACKET, MANUAL are informational
- RAW_JPEG_PAIR and LIVE_PHOTO are deprecated (use Photo.files)
"""

import uuid

from django.test import TestCase
from django.utils import timezone

from api.models.file import File
from api.models.photo import Photo
from api.models.photo_stack import PhotoStack
from api.models.stack_review import StackReview
from api.models.user import User


class StackReviewModelTestCase(TestCase):
    """Tests for the StackReview model creation and fields."""

    def setUp(self):
        """Create test user and stack."""
        self.user = User.objects.create(username="reviewtest")
        self.stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )

    def test_create_stack_review(self):
        """Should create a StackReview with default values."""
        review = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
        )
        self.assertIsNotNone(review.id)
        self.assertEqual(review.decision, StackReview.Decision.PENDING)
        self.assertIsNone(review.kept_photo)
        self.assertEqual(review.trashed_count, 0)
        self.assertIsNone(review.reviewed_at)

    def test_uuid_primary_key(self):
        """Review ID should be a valid UUID."""
        review = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
        )
        self.assertIsInstance(review.id, uuid.UUID)

    def test_one_to_one_with_stack(self):
        """Stack should have at most one review."""
        StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
        )
        # Creating second review for same stack should raise error
        from django.db import IntegrityError
        with self.assertRaises(IntegrityError):
            StackReview.objects.create(
                stack=self.stack,
                reviewer=self.user,
            )

    def test_str_representation(self):
        """String representation should include stack ID and decision."""
        review = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
            decision=StackReview.Decision.PENDING,
        )
        result = str(review)
        self.assertIn(str(self.stack.id), result)
        self.assertIn("pending", result)

    def test_decision_choices(self):
        """All decision choices should be valid."""
        for decision, label in StackReview.Decision.choices:
            review = StackReview.objects.create(
                stack=PhotoStack.objects.create(
                    owner=self.user,
                    stack_type=PhotoStack.StackType.MANUAL,
                ),
                reviewer=self.user,
                decision=decision,
            )
            self.assertEqual(review.decision, decision)

    def test_optional_note_field(self):
        """Note field should be optional."""
        review = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
            note="User's reason for this decision",
        )
        self.assertEqual(review.note, "User's reason for this decision")

    def test_ordering_by_created_at_descending(self):
        """Reviews should be ordered by created_at descending."""
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        review1 = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
        )
        review2 = StackReview.objects.create(
            stack=stack2,
            reviewer=self.user,
        )
        reviews = list(StackReview.objects.all())
        # review2 was created later, should come first
        self.assertEqual(reviews[0], review2)
        self.assertEqual(reviews[1], review1)


class DecisionChoicesTestCase(TestCase):
    """Tests for the Decision text choices."""

    def test_pending_choice(self):
        """PENDING decision should exist."""
        self.assertEqual(StackReview.Decision.PENDING, "pending")

    def test_resolved_choice(self):
        """RESOLVED decision should exist."""
        self.assertEqual(StackReview.Decision.RESOLVED, "resolved")

    def test_dismissed_choice(self):
        """DISMISSED decision should exist."""
        self.assertEqual(StackReview.Decision.DISMISSED, "dismissed")

    def test_all_choices_have_labels(self):
        """All choices should have human-readable labels."""
        labels = dict(StackReview.Decision.choices)
        self.assertEqual(labels["pending"], "Pending Review")
        self.assertEqual(labels["resolved"], "Resolved")
        self.assertEqual(labels["dismissed"], "Dismissed")


class IsReviewableTypeTestCase(TestCase):
    """Tests for the is_reviewable_type classmethod."""

    def test_no_stack_types_are_reviewable(self):
        """No current stack types should be reviewable.
        
        This is because:
        - Duplicates are now handled by the separate Duplicate model
        - Other stack types are informational only
        - RAW_JPEG_PAIR and LIVE_PHOTO are deprecated (use Photo.files)
        """
        for stack_type in PhotoStack.StackType.values:
            self.assertFalse(
                StackReview.is_reviewable_type(stack_type),
                f"{stack_type} should not be reviewable"
            )

    def test_manual_not_reviewable(self):
        """MANUAL stacks should not be reviewable."""
        self.assertFalse(StackReview.is_reviewable_type(PhotoStack.StackType.MANUAL))

    def test_burst_not_reviewable(self):
        """BURST_SEQUENCE stacks should not be reviewable."""
        self.assertFalse(StackReview.is_reviewable_type(PhotoStack.StackType.BURST_SEQUENCE))


class CreateForStackTestCase(TestCase):
    """Tests for the create_for_stack classmethod."""

    def setUp(self):
        """Create test user."""
        self.user = User.objects.create(username="createtest")

    def test_returns_none_for_all_stack_types(self):
        """Should return None for all stack types (none are reviewable)."""
        for stack_type in PhotoStack.StackType.values:
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=stack_type,
            )
            review = StackReview.create_for_stack(stack)
            self.assertIsNone(
                review,
                f"create_for_stack should return None for {stack_type}"
            )

    def test_returns_none_for_manual_stack(self):
        """Should return None for manual stacks."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        review = StackReview.create_for_stack(stack)
        self.assertIsNone(review)

    def test_returns_none_for_burst_stack(self):
        """Should return None for burst stacks."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        review = StackReview.create_for_stack(stack)
        self.assertIsNone(review)


class ResolveTestCase(TestCase):
    """Tests for the resolve method."""

    def setUp(self):
        """Create test user, photos, and stack."""
        self.user = User.objects.create(username="resolvetest")
        
        # Create photos with files
        self.photos = []
        for i in range(3):
            file = File.objects.create(
                hash=f"resolve{i}" + "a" * 25,
                path=f"/photos/img_{i}.jpg",
                type=File.IMAGE,
            )
            photo = Photo.objects.create(
                owner=self.user,
                main_file=file,
                image_hash=f"resolve{i}" + "b" * 25,
                added_on=timezone.now(),
                in_trashcan=False,
            )
            self.photos.append(photo)
        
        # Create stack with photos
        self.stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        for photo in self.photos:
            photo.stacks.add(self.stack)
        
        # Create review directly (since create_for_stack returns None)
        self.review = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
        )

    def test_resolve_sets_kept_photo(self):
        """Should set the kept_photo field."""
        kept = self.photos[0]
        self.review.resolve(kept)
        
        self.review.refresh_from_db()
        self.assertEqual(self.review.kept_photo, kept)

    def test_resolve_sets_decision_to_resolved(self):
        """Should change decision to RESOLVED."""
        self.review.resolve(self.photos[0])
        
        self.review.refresh_from_db()
        self.assertEqual(self.review.decision, StackReview.Decision.RESOLVED)

    def test_resolve_sets_reviewed_at(self):
        """Should set reviewed_at timestamp."""
        self.assertIsNone(self.review.reviewed_at)
        
        self.review.resolve(self.photos[0])
        
        self.review.refresh_from_db()
        self.assertIsNotNone(self.review.reviewed_at)

    def test_resolve_sets_stack_primary_photo(self):
        """Should update stack's primary_photo."""
        kept = self.photos[0]
        self.review.resolve(kept)
        
        self.stack.refresh_from_db()
        self.assertEqual(self.stack.primary_photo, kept)

    def test_resolve_trashes_other_photos(self):
        """Should move non-kept photos to trashcan."""
        kept = self.photos[0]
        self.review.resolve(kept, trash_others=True)
        
        for photo in self.photos:
            photo.refresh_from_db()
        
        self.assertFalse(self.photos[0].in_trashcan)
        self.assertTrue(self.photos[1].in_trashcan)
        self.assertTrue(self.photos[2].in_trashcan)

    def test_resolve_sets_trashed_count(self):
        """Should count trashed photos."""
        self.review.resolve(self.photos[0], trash_others=True)
        
        self.review.refresh_from_db()
        self.assertEqual(self.review.trashed_count, 2)

    def test_resolve_without_trashing(self):
        """Should not trash photos when trash_others=False."""
        self.review.resolve(self.photos[0], trash_others=False)
        
        for photo in self.photos:
            photo.refresh_from_db()
            self.assertFalse(photo.in_trashcan)

    def test_resolve_returns_self(self):
        """Should return the review instance."""
        result = self.review.resolve(self.photos[0])
        self.assertEqual(result, self.review)


class DismissTestCase(TestCase):
    """Tests for the dismiss method."""

    def setUp(self):
        """Create test user, photos, and stack."""
        self.user = User.objects.create(username="dismisstest")
        
        # Create photos
        self.photos = []
        for i in range(2):
            file = File.objects.create(
                hash=f"dismiss{i}" + "a" * 26,
                path=f"/photos/dismiss_{i}.jpg",
                type=File.IMAGE,
            )
            photo = Photo.objects.create(
                owner=self.user,
                main_file=file,
                image_hash=f"dismiss{i}" + "b" * 26,
                added_on=timezone.now(),
            )
            self.photos.append(photo)
        
        # Create stack
        self.stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        for photo in self.photos:
            photo.stacks.add(self.stack)
        
        # Create review directly
        self.review = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
        )

    def test_dismiss_sets_decision_to_dismissed(self):
        """Should change decision to DISMISSED."""
        self.review.dismiss()
        
        self.review.refresh_from_db()
        self.assertEqual(self.review.decision, StackReview.Decision.DISMISSED)

    def test_dismiss_sets_reviewed_at(self):
        """Should set reviewed_at timestamp."""
        self.review.dismiss()
        
        self.review.refresh_from_db()
        self.assertIsNotNone(self.review.reviewed_at)

    def test_dismiss_unlinks_photos_from_stack(self):
        """Should remove photos from the stack."""
        # Verify photos are in stack
        self.assertEqual(self.stack.photos.count(), 2)
        
        self.review.dismiss()
        
        # Verify photos are unlinked
        self.stack.refresh_from_db()
        self.assertEqual(self.stack.photos.count(), 0)

    def test_dismiss_returns_self(self):
        """Should return the review instance."""
        result = self.review.dismiss()
        self.assertEqual(result, self.review)

    def test_dismiss_photos_still_exist(self):
        """Photos should not be deleted, just unlinked."""
        photo_ids = [p.id for p in self.photos]
        
        self.review.dismiss()
        
        for pid in photo_ids:
            self.assertTrue(Photo.objects.filter(id=pid).exists())


class RevertTestCase(TestCase):
    """Tests for the revert method."""

    def setUp(self):
        """Create test user, photos, and resolved review."""
        self.user = User.objects.create(username="reverttest")
        
        # Create photos
        self.photos = []
        for i in range(3):
            file = File.objects.create(
                hash=f"revert{i}" + "a" * 26,
                path=f"/photos/revert_{i}.jpg",
                type=File.IMAGE,
            )
            photo = Photo.objects.create(
                owner=self.user,
                main_file=file,
                image_hash=f"revert{i}" + "b" * 26,
                added_on=timezone.now(),
                in_trashcan=False,
            )
            self.photos.append(photo)
        
        # Create stack
        self.stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        for photo in self.photos:
            photo.stacks.add(self.stack)
        
        # Create and resolve review
        self.review = StackReview.objects.create(
            stack=self.stack,
            reviewer=self.user,
        )
        self.review.resolve(self.photos[0], trash_others=True)

    def test_revert_restores_trashed_photos(self):
        """Should restore photos from trashcan."""
        # Verify photos are trashed
        self.photos[1].refresh_from_db()
        self.photos[2].refresh_from_db()
        self.assertTrue(self.photos[1].in_trashcan)
        self.assertTrue(self.photos[2].in_trashcan)
        
        self.review.revert()
        
        # Verify photos are restored
        self.photos[1].refresh_from_db()
        self.photos[2].refresh_from_db()
        self.assertFalse(self.photos[1].in_trashcan)
        self.assertFalse(self.photos[2].in_trashcan)

    def test_revert_resets_decision_to_pending(self):
        """Should change decision back to PENDING."""
        self.review.revert()
        
        self.review.refresh_from_db()
        self.assertEqual(self.review.decision, StackReview.Decision.PENDING)

    def test_revert_clears_kept_photo(self):
        """Should clear the kept_photo field."""
        self.review.revert()
        
        self.review.refresh_from_db()
        self.assertIsNone(self.review.kept_photo)

    def test_revert_clears_trashed_count(self):
        """Should reset trashed_count to 0."""
        self.review.revert()
        
        self.review.refresh_from_db()
        self.assertEqual(self.review.trashed_count, 0)

    def test_revert_clears_reviewed_at(self):
        """Should clear reviewed_at timestamp."""
        self.review.revert()
        
        self.review.refresh_from_db()
        self.assertIsNone(self.review.reviewed_at)

    def test_revert_clears_stack_primary_photo(self):
        """Should clear stack's primary_photo."""
        self.review.revert()
        
        self.stack.refresh_from_db()
        self.assertIsNone(self.stack.primary_photo)

    def test_revert_returns_restored_count(self):
        """Should return number of restored photos."""
        count = self.review.revert()
        self.assertEqual(count, 2)

    def test_revert_does_nothing_if_not_resolved(self):
        """Should do nothing if decision is not RESOLVED."""
        # Create pending review
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        review2 = StackReview.objects.create(
            stack=stack2,
            reviewer=self.user,
            decision=StackReview.Decision.PENDING,
        )
        
        result = review2.revert()
        
        review2.refresh_from_db()
        self.assertEqual(result, review2)  # Returns self, not count
        self.assertEqual(review2.decision, StackReview.Decision.PENDING)

    def test_revert_does_nothing_if_dismissed(self):
        """Should do nothing if decision is DISMISSED."""
        self.review.decision = StackReview.Decision.DISMISSED
        self.review.save()
        
        result = self.review.revert()
        
        self.review.refresh_from_db()
        self.assertEqual(result, self.review)  # Returns self
        self.assertEqual(self.review.decision, StackReview.Decision.DISMISSED)


class EdgeCasesTestCase(TestCase):
    """Edge case tests for StackReview."""

    def setUp(self):
        """Create test user."""
        self.user = User.objects.create(username="edgetest")

    def test_resolve_with_single_photo_stack(self):
        """Should handle stack with only one photo."""
        file = File.objects.create(
            hash="single" + "a" * 26,
            path="/photos/single.jpg",
            type=File.IMAGE,
        )
        photo = Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash="single" + "b" * 26,
            added_on=timezone.now(),
        )
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo.stacks.add(stack)
        
        review = StackReview.objects.create(
            stack=stack,
            reviewer=self.user,
        )
        review.resolve(photo)
        
        review.refresh_from_db()
        self.assertEqual(review.trashed_count, 0)
        self.assertEqual(review.kept_photo, photo)

    def test_dismiss_empty_stack(self):
        """Should handle stack with no photos."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        review = StackReview.objects.create(
            stack=stack,
            reviewer=self.user,
        )
        
        # Should not raise error
        review.dismiss()
        
        review.refresh_from_db()
        self.assertEqual(review.decision, StackReview.Decision.DISMISSED)

    def test_revert_when_photos_already_restored(self):
        """Should handle reverting when photos are already not in trash."""
        file = File.objects.create(
            hash="restored" + "a" * 24,
            path="/photos/restored.jpg",
            type=File.IMAGE,
        )
        photo = Photo.objects.create(
            owner=self.user,
            main_file=file,
            image_hash="restored" + "b" * 24,
            added_on=timezone.now(),
            in_trashcan=False,
        )
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        photo.stacks.add(stack)
        
        review = StackReview.objects.create(
            stack=stack,
            reviewer=self.user,
            decision=StackReview.Decision.RESOLVED,
            kept_photo=photo,
            trashed_count=0,
        )
        
        # Should not raise error, returns 0 restored
        count = review.revert()
        self.assertEqual(count, 0)

    def test_stack_cascade_delete(self):
        """Review should be deleted when stack is deleted."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        review = StackReview.objects.create(
            stack=stack,
            reviewer=self.user,
        )
        review_id = review.id
        
        stack.delete()
        
        self.assertFalse(StackReview.objects.filter(id=review_id).exists())

    def test_user_set_to_deleted_on_reviewer_delete(self):
        """Reviewer should be set to deleted user when user is deleted."""
        temp_user = User.objects.create(username="temp_reviewer")
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        review = StackReview.objects.create(
            stack=stack,
            reviewer=temp_user,
        )
        
        temp_user.delete()
        
        review.refresh_from_db()
        self.assertEqual(review.reviewer.username, "deleted")

    def test_review_with_note(self):
        """Should store user's note."""
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        review = StackReview.objects.create(
            stack=stack,
            reviewer=self.user,
            note="These are from different events, not duplicates",
        )
        
        review.refresh_from_db()
        self.assertEqual(review.note, "These are from different events, not duplicates")

    def test_review_index_on_reviewer_decision(self):
        """Index on reviewer+decision should exist for efficient queries."""
        # Create multiple reviews with different decisions
        for decision in StackReview.Decision.values:
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=PhotoStack.StackType.MANUAL,
            )
            StackReview.objects.create(
                stack=stack,
                reviewer=self.user,
                decision=decision,
            )
        
        # Query should be efficient (index used)
        pending = StackReview.objects.filter(
            reviewer=self.user,
            decision=StackReview.Decision.PENDING,
        )
        self.assertEqual(pending.count(), 1)


================================================
FILE: api/tests/test_stack_validation_edge_cases.py
================================================
"""
Edge case tests for Stack API input validation.

Tests cover:
- Duplicate photo hashes handling
- Input validation edge cases
- Error message accuracy
"""

from django.test import TestCase
from rest_framework.test import APIClient

from api.models.photo_stack import PhotoStack
from api.tests.utils import create_test_photo, create_test_user


class DuplicatePhotoHashesTestCase(TestCase):
    """Tests for handling duplicate photo hashes in input."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_create_manual_stack_with_duplicate_valid_hashes(self):
        """
        Test creating manual stack when two valid photos are provided
        but one hash is duplicated.
        
        Fixed Bug #15: If photo_hashes = [hash1, hash2, hash1], the input
        is de-duplicated before validation. Since there are 2 unique valid
        photos, the stack creation should succeed.
        """
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        # Send duplicate hash1
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [photo1.image_hash, photo2.image_hash, photo1.image_hash]},
            format='json',
        )
        
        # After fix: Duplicates are de-duplicated, so 2 unique photos are found
        # Stack creation should succeed
        self.assertEqual(response.status_code, 201)
        self.assertIn("stack_id", response.data)
        
        # Verify stack was created with 2 photos
        stack = PhotoStack.objects.get(id=response.data["stack_id"])
        self.assertEqual(stack.photos.count(), 2)

    def test_create_manual_stack_triple_duplicate_same_hash(self):
        """Test with all three hashes being the same."""
        photo = create_test_photo(owner=self.user)
        
        response = self.client.post(
            "/api/stacks/manual",
            {"photo_hashes": [photo.image_hash, photo.image_hash, photo.image_hash]},
            format='json',
        )
        
        # Expected: Only 1 unique photo, should fail (need >= 2)
        self.assertEqual(response.status_code, 400)

    def test_add_photos_with_duplicate_hashes(self):
        """Test adding photos with duplicate hashes to existing stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        # Add photo3 with duplicate hash
        response = self.client.post(
            f"/api/stacks/{stack.id}/add",
            {"photo_hashes": [photo3.image_hash, photo3.image_hash]},
            format='json',
        )
        
        # Should work - duplicates should be ignored
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 3)

    def test_remove_photos_with_duplicate_hashes(self):
        """Test removing photos with duplicate hashes."""
        photos = [create_test_photo(owner=self.user) for _ in range(4)]
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        # Remove with duplicate hash
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            {"photo_hashes": [photos[0].image_hash, photos[0].image_hash]},
            format='json',
        )
        
        # Should work - removes only once
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        self.assertEqual(stack.photos.count(), 3)


class MergeStacksDuplicateHashesTestCase(TestCase):
    """Tests for merge stacks with duplicate hashes."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_merge_with_duplicate_hashes(self):
        """Test merge endpoint with duplicate photo hashes.
        
        Fixed Bug #15: Duplicate hashes are now de-duplicated before validation.
        """
        photos1 = [create_test_photo(owner=self.user) for _ in range(2)]
        photos2 = [create_test_photo(owner=self.user) for _ in range(2)]
        
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack1.photos.add(*photos1)
        
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2.photos.add(*photos2)
        
        # Include duplicate hashes
        hashes = [photos1[0].image_hash, photos2[0].image_hash, photos1[0].image_hash]
        
        response = self.client.post(
            "/api/stacks/merge",
            {"photo_hashes": hashes},
            format='json',
        )
        
        # After fix: Duplicates are de-duplicated, merge should succeed
        self.assertEqual(response.status_code, 200)
        self.assertIn("stack_id", response.data)
        
        # Should have merged into one stack with all 4 photos
        stacks = PhotoStack.objects.filter(owner=self.user, stack_type=PhotoStack.StackType.MANUAL)
        self.assertEqual(stacks.count(), 1)
        self.assertEqual(stacks.first().photos.count(), 4)


class ListStacksWithNullThumbnailTestCase(TestCase):
    """Tests for stack list with photos that have no thumbnails."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_list_stacks_without_thumbnails(self):
        """Test listing stacks when photos have thumbnails (created by helper)."""
        # Note: create_test_photo creates thumbnails, so we test that listing works
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2)
        
        # List should work
        response = self.client.get("/api/stacks")
        
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["count"], 1)
        
        # thumbnail_url should be present (create_test_photo creates thumbnails)
        result = response.data["results"][0]
        # Primary photo thumbnail should exist since create_test_photo creates them
        if result.get("primary_photo"):
            # Just verify the structure is valid - may or may not have thumbnail
            self.assertIn("thumbnail_url", result["primary_photo"])

    def test_detail_stack_without_thumbnails(self):
        """Test getting stack detail when photos don't have thumbnails."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.get(f"/api/stacks/{stack.id}")
        
        self.assertEqual(response.status_code, 200)
        # Should have photos even without thumbnails
        self.assertEqual(len(response.data["photos"]), 2)


class RemoveFromStackPrimaryPhotoTestCase(TestCase):
    """Tests for removing the primary photo from a stack."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_remove_primary_updates_primary(self):
        """Test that removing the primary photo selects a new primary."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2, photo3)
        
        # Remove the primary photo
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            {"photo_hashes": [photo1.image_hash]},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        
        # Primary should have changed
        self.assertIsNotNone(stack.primary_photo)
        self.assertNotEqual(stack.primary_photo.image_hash, photo1.image_hash)

    def test_remove_non_primary_keeps_primary(self):
        """Test that removing a non-primary photo keeps the current primary."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        photo3 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
            primary_photo=photo1,
        )
        stack.photos.add(photo1, photo2, photo3)
        
        # Remove a non-primary photo
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            {"photo_hashes": [photo2.image_hash]},
            format='json',
        )
        
        self.assertEqual(response.status_code, 200)
        stack.refresh_from_db()
        
        # Primary should stay the same
        self.assertEqual(stack.primary_photo.image_hash, photo1.image_hash)


class EmptyInputTestCase(TestCase):
    """Tests for empty or null input handling."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_set_primary_no_hash(self):
        """Test setting primary with no photo_hash provided."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            {},  # No photo_hash
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)
        self.assertEqual(response.data["error"], "photo_hash is required")

    def test_set_primary_empty_hash(self):
        """Test setting primary with empty photo_hash."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/primary",
            {"photo_hash": ""},  # Empty hash
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)

    def test_add_empty_photo_list(self):
        """Test adding empty photo list to stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/add",
            {"photo_hashes": []},
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)

    def test_remove_empty_photo_list(self):
        """Test removing empty photo list from stack."""
        photo1 = create_test_photo(owner=self.user)
        photo2 = create_test_photo(owner=self.user)
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo1, photo2)
        
        response = self.client.post(
            f"/api/stacks/{stack.id}/remove",
            {"photo_hashes": []},
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)

    def test_merge_empty_photo_list(self):
        """Test merge with empty photo list."""
        response = self.client.post(
            "/api/stacks/merge",
            {"photo_hashes": []},
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)

    def test_create_manual_missing_photo_hashes_key(self):
        """Test creating manual stack without photo_hashes key."""
        response = self.client.post(
            "/api/stacks/manual",
            {},  # No photo_hashes key
            format='json',
        )
        
        self.assertEqual(response.status_code, 400)


class StackListPaginationEdgeCasesTestCase(TestCase):
    """Tests for pagination edge cases in stack list."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)
        
        # Create 5 stacks
        for i in range(5):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=PhotoStack.StackType.MANUAL,
            )
            stack.photos.add(*photos)

    def test_page_beyond_results(self):
        """Test requesting a page beyond available results."""
        response = self.client.get("/api/stacks?page=100")
        
        self.assertEqual(response.status_code, 200)
        # Django's Paginator.get_page() returns last page for out-of-range pages
        # So we may get results (last page) rather than empty
        self.assertGreaterEqual(len(response.data["results"]), 0)
        # has_next should be False since we're at/past the last page
        self.assertFalse(response.data["has_next"])

    def test_page_zero(self):
        """Test requesting page 0 (should default to 1)."""
        response = self.client.get("/api/stacks?page=0")
        
        self.assertEqual(response.status_code, 200)
        # Should get results (treated as page 1)
        self.assertGreater(len(response.data["results"]), 0)

    def test_negative_page(self):
        """Test requesting negative page number."""
        response = self.client.get("/api/stacks?page=-1")
        
        self.assertEqual(response.status_code, 200)
        # Should get results (negative treated as 1)
        self.assertGreater(len(response.data["results"]), 0)

    def test_non_numeric_page(self):
        """Test requesting non-numeric page."""
        response = self.client.get("/api/stacks?page=abc")
        
        # After Bug #16 fix: Non-numeric page defaults to 1
        self.assertEqual(response.status_code, 200)
        self.assertGreater(len(response.data["results"]), 0)

    def test_page_size_zero(self):
        """Test requesting page_size of 0."""
        response = self.client.get("/api/stacks?page_size=0")
        
        self.assertEqual(response.status_code, 200)
        # page_size=0 should be treated as page_size=1 (min)
        self.assertGreater(len(response.data["results"]), 0)

    def test_page_size_negative(self):
        """Test requesting negative page_size."""
        response = self.client.get("/api/stacks?page_size=-5")
        
        # Should handle gracefully (Bug #10 fix)
        self.assertEqual(response.status_code, 200)

    def test_page_size_exceeds_max(self):
        """Test requesting page_size exceeding maximum."""
        response = self.client.get("/api/stacks?page_size=1000")
        
        self.assertEqual(response.status_code, 200)
        # page_size should be capped at 100
        self.assertLessEqual(response.data["page_size"], 100)

    def test_non_numeric_page_size(self):
        """Test requesting non-numeric page_size."""
        response = self.client.get("/api/stacks?page_size=abc")
        
        # After Bug #16 fix: Non-numeric page_size defaults to 20
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["page_size"], 20)


================================================
FILE: api/tests/test_stats_accuracy.py
================================================
"""
Tests for stats accuracy and edge cases.

Ensures that:
- Duplicate stats are calculated correctly
- Stack stats are calculated correctly
- Edge cases (empty, single items, etc.) are handled
- Stats are properly scoped to user
- Potential savings calculations are accurate
"""

from django.test import TestCase
from rest_framework.test import APIClient, APITestCase

from api.models import Photo
from api.models.duplicate import Duplicate
from api.models.photo_stack import PhotoStack
from api.tests.utils import create_test_photo, create_test_user
from api.stats import get_count_stats, calc_megabytes, median_value


class DuplicateStatsAccuracyTestCase(APITestCase):
    """Test duplicate stats calculations."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_empty_stats(self):
        """Test stats when no duplicates exist."""
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_duplicates"], 0)
        self.assertEqual(response.data["pending_duplicates"], 0)
        self.assertEqual(response.data["resolved_duplicates"], 0)
        self.assertEqual(response.data["dismissed_duplicates"], 0)

    def test_stats_by_type(self):
        """Test stats count by duplicate type."""
        # Create exact copies
        for _ in range(3):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            dup = Duplicate.objects.create(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            )
            dup.photos.add(*photos)
        
        # Create visual duplicates
        for _ in range(2):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            dup = Duplicate.objects.create(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.VISUAL_DUPLICATE,
            )
            dup.photos.add(*photos)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["by_type"]["exact_copy"], 3)
        self.assertEqual(response.data["by_type"]["visual_duplicate"], 2)

    def test_stats_by_status(self):
        """Test stats count by review status."""
        # Create pending
        for _ in range(4):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            dup = Duplicate.objects.create(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
                review_status=Duplicate.ReviewStatus.PENDING,
            )
            dup.photos.add(*photos)
        
        # Create resolved
        for _ in range(2):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            dup = Duplicate.objects.create(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
                review_status=Duplicate.ReviewStatus.RESOLVED,
            )
            dup.photos.add(*photos)
        
        # Create dismissed
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.DISMISSED,
        )
        dup.photos.add(*photos)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["pending_duplicates"], 4)
        self.assertEqual(response.data["resolved_duplicates"], 2)
        self.assertEqual(response.data["dismissed_duplicates"], 1)

    def test_photos_in_duplicates_count(self):
        """Test count of photos involved in duplicates."""
        # Create 3 duplicate groups, each with 2 photos = 6 photos total
        for _ in range(3):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            dup = Duplicate.objects.create(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            )
            dup.photos.add(*photos)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["photos_in_duplicates"], 6)

    def test_potential_savings_calculation(self):
        """Test that potential savings is calculated from pending duplicates only."""
        # Create pending duplicate with known savings
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        pending_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.PENDING,
            potential_savings=1000000,  # 1MB
        )
        pending_dup.photos.add(*photos)
        
        # Create resolved duplicate - should not count
        photos2 = [create_test_photo(owner=self.user) for _ in range(2)]
        resolved_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            review_status=Duplicate.ReviewStatus.RESOLVED,
            potential_savings=5000000,  # 5MB - should be ignored
        )
        resolved_dup.photos.add(*photos2)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        # Only pending savings should be counted
        self.assertEqual(response.data["potential_savings_bytes"], 1000000)

    def test_stats_user_scoped(self):
        """Test that stats only include current user's duplicates."""
        other_user = create_test_user()
        
        # Create duplicate for other user
        other_photos = [create_test_photo(owner=other_user) for _ in range(2)]
        other_dup = Duplicate.objects.create(
            owner=other_user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        other_dup.photos.add(*other_photos)
        
        # Create duplicate for current user
        my_photos = [create_test_photo(owner=self.user) for _ in range(2)]
        my_dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        my_dup.photos.add(*my_photos)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        # Should only see our duplicate
        self.assertEqual(response.data["total_duplicates"], 1)


class StackStatsAccuracyTestCase(APITestCase):
    """Test stack stats calculations."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_empty_stats(self):
        """Test stats when no stacks exist."""
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_stacks"], 0)
        self.assertEqual(response.data["photos_in_stacks"], 0)

    def test_stats_by_type(self):
        """Test stats count by stack type."""
        # Create RAW+JPEG pairs
        for _ in range(2):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
            )
            stack.photos.add(*photos)
        
        # Create burst sequences
        for _ in range(3):
            photos = [create_test_photo(owner=self.user) for _ in range(3)]
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=PhotoStack.StackType.BURST_SEQUENCE,
            )
            stack.photos.add(*photos)
        
        # Create manual stack
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["by_type"]["raw_jpeg"], 2)
        self.assertEqual(response.data["by_type"]["burst"], 3)
        self.assertEqual(response.data["by_type"]["manual"], 1)

    def test_photos_in_stacks_count(self):
        """Test count of photos involved in stacks."""
        # 2 RAW+JPEG pairs (2 photos each) = 4 photos
        for _ in range(2):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            stack = PhotoStack.objects.create(
                owner=self.user,
                stack_type=PhotoStack.StackType.RAW_JPEG_PAIR,
            )
            stack.photos.add(*photos)
        
        # 1 burst (3 photos)
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.BURST_SEQUENCE,
        )
        stack.photos.add(*photos)
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        # Total: 4 + 3 = 7 photos
        self.assertEqual(response.data["photos_in_stacks"], 7)

    def test_photo_in_multiple_stacks_counted_once(self):
        """Test that a photo in multiple stacks is counted only once."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        
        # Add first two photos to one stack
        stack1 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack1.photos.add(photos[0], photos[1])
        
        # Add last two photos to another stack (photos[1] is in both)
        stack2 = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack2.photos.add(photos[1], photos[2])
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        # Should be 3 distinct photos, not 4
        self.assertEqual(response.data["photos_in_stacks"], 3)

    def test_stats_user_scoped(self):
        """Test that stats only include current user's stacks."""
        other_user = create_test_user()
        
        # Create stack for other user
        other_photos = [create_test_photo(owner=other_user) for _ in range(2)]
        other_stack = PhotoStack.objects.create(
            owner=other_user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        other_stack.photos.add(*other_photos)
        
        # Create stack for current user
        my_photos = [create_test_photo(owner=self.user) for _ in range(2)]
        my_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        my_stack.photos.add(*my_photos)
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        # Should only see our stack
        self.assertEqual(response.data["total_stacks"], 1)

    def test_excludes_duplicate_type_stacks(self):
        """Test that old duplicate-type stacks are excluded from stats."""
        # Create a valid stack
        photos = [create_test_photo(owner=self.user) for _ in range(2)]
        valid_stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        valid_stack.photos.add(*photos)
        
        # Create an old duplicate-type stack (should be excluded)
        # Note: These types may not exist anymore, but test the filtering
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_stacks"], 1)


class UtilityFunctionsTestCase(TestCase):
    """Test utility functions in stats module."""

    def test_calc_megabytes_zero(self):
        """Test megabyte calculation with zero bytes."""
        self.assertEqual(calc_megabytes(0), 0)

    def test_calc_megabytes_none(self):
        """Test megabyte calculation with None."""
        self.assertEqual(calc_megabytes(None), 0)

    def test_calc_megabytes_small(self):
        """Test megabyte calculation with small values."""
        # 1 MB = 1048576 bytes
        self.assertEqual(calc_megabytes(1048576), 1)

    def test_calc_megabytes_large(self):
        """Test megabyte calculation with large values."""
        # 100 MB
        self.assertEqual(calc_megabytes(104857600), 100)

    def test_median_value_empty_queryset(self):
        """Test median with empty queryset."""
        qs = Photo.objects.none()
        result = median_value(qs, "size")
        self.assertIsNone(result)


class CountStatsTestCase(TestCase):
    """Test get_count_stats function."""

    def setUp(self):
        self.user = create_test_user()

    def test_count_stats_no_photos(self):
        """Test count stats when user has no photos."""
        stats = get_count_stats(self.user)
        self.assertEqual(stats["num_photos"], 0)

    def test_count_stats_with_photos(self):
        """Test count stats with photos."""
        # Create some photos
        for _ in range(5):
            create_test_photo(owner=self.user)
        
        stats = get_count_stats(self.user)
        self.assertEqual(stats["num_photos"], 5)

    def test_count_stats_excludes_hidden(self):
        """Test that hidden photos are excluded from count."""
        # Create visible photos
        for _ in range(3):
            create_test_photo(owner=self.user)
        
        # Create hidden photo
        hidden = create_test_photo(owner=self.user)
        hidden.hidden = True
        hidden.save()
        
        _stats = get_count_stats(self.user)
        # Depending on implementation, hidden may or may not be counted
        # The important thing is no crash

    def test_count_stats_user_scoped(self):
        """Test that count stats are user-scoped."""
        other_user = create_test_user()
        
        # Create photos for other user
        for _ in range(10):
            create_test_photo(owner=other_user)
        
        # Create photos for current user
        for _ in range(3):
            create_test_photo(owner=self.user)
        
        stats = get_count_stats(self.user)
        self.assertEqual(stats["num_photos"], 3)


class StatsEdgeCasesTestCase(APITestCase):
    """Test edge cases for stats calculations."""

    def setUp(self):
        self.user = create_test_user()
        self.client = APIClient()
        self.client.force_authenticate(user=self.user)

    def test_duplicate_with_zero_photos(self):
        """Test stats with duplicate group that has no photos."""
        # Create empty duplicate group
        _dup = Duplicate.objects.create(
            owner=self.user,
            duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
        )
        # Don't add any photos
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        # Should handle gracefully

    def test_stack_with_single_photo(self):
        """Test stats with stack that has only one photo."""
        photo = create_test_photo(owner=self.user)
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(photo)
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_stacks"], 1)
        self.assertEqual(response.data["photos_in_stacks"], 1)

    def test_deleted_photo_in_group(self):
        """Test stats when photo has been deleted from group."""
        photos = [create_test_photo(owner=self.user) for _ in range(3)]
        
        stack = PhotoStack.objects.create(
            owner=self.user,
            stack_type=PhotoStack.StackType.MANUAL,
        )
        stack.photos.add(*photos)
        
        # Delete one photo from stack
        stack.photos.remove(photos[0])
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["photos_in_stacks"], 2)

    def test_trashed_photos_excluded(self):
        """Test that trashed photos are excluded from total count."""
        # Create normal photos
        for _ in range(3):
            create_test_photo(owner=self.user)
        
        # Create trashed photo
        trashed = create_test_photo(owner=self.user)
        trashed.in_trashcan = True
        trashed.save()
        
        response = self.client.get("/api/stacks/stats")
        self.assertEqual(response.status_code, 200)
        # total_photos should not include trashed
        self.assertEqual(response.data["total_photos"], 3)

    def test_large_number_of_groups(self):
        """Test stats with many groups."""
        # Create 50 duplicate groups
        for _ in range(50):
            photos = [create_test_photo(owner=self.user) for _ in range(2)]
            dup = Duplicate.objects.create(
                owner=self.user,
                duplicate_type=Duplicate.DuplicateType.EXACT_COPY,
            )
            dup.photos.add(*photos)
        
        response = self.client.get("/api/duplicates/stats")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response.data["total_duplicates"], 50)
        self.assertEqual(response.data["photos_in_duplicates"], 100)


================================================
FILE: api/tests/test_thumbnail_migration.py
================================================
"""
Tests for the thumbnail migration (0120_rename_thumbnails_uuid_to_hash)
"""

import os
import tempfile
from unittest.mock import patch
from django.test import TestCase
from django.conf import settings

from api.models import Photo, Thumbnail
from api.tests.utils import create_test_user, create_test_photo


class ThumbnailMigrationTest(TestCase):
    """Test the thumbnail UUID to hash migration"""

    def setUp(self):
        self.user = create_test_user()
        # Create a temporary directory for test thumbnails
        self.test_media_root = tempfile.mkdtemp()

    def tearDown(self):
        # Clean up temporary files
        import shutil

        if os.path.exists(self.test_media_root):
            shutil.rmtree(self.test_media_root)

    def test_batch_processing_logic(self):
        """Test that batch processing correctly handles multiple photos"""
        # Create test photos with thumbnails
        photos = []
        for i in range(5):
            photo = create_test_photo(owner=self.user)
            photos.append(photo)

        # Verify all photos have thumbnails
        self.assertEqual(Thumbnail.objects.count(), 5)

        # Verify thumbnails use image_hash in their paths
        for photo in photos:
            thumbnail = photo.thumbnail
            self.assertIn(photo.image_hash, thumbnail.thumbnail_big.name)
            self.assertIn(photo.image_hash, thumbnail.square_thumbnail.name)
            self.assertIn(photo.image_hash, thumbnail.square_thumbnail_small.name)

    @patch("django.conf.settings.MEDIA_ROOT")
    def test_file_renaming_with_mocked_filesystem(self, mock_media_root):
        """Test that the migration logic handles file renaming correctly"""
        # Set the mock to return our test directory
        test_dir = self.test_media_root
        mock_media_root.return_value = test_dir
        mock_media_root.__str__ = lambda _: test_dir

        # Create test photo
        photo = create_test_photo(owner=self.user)
        photo_uuid = str(photo.id)
        photo_hash = photo.image_hash

        # Create dummy thumbnail directories
        for thumb_dir in [
            "thumbnails_big",
            "square_thumbnails",
            "square_thumbnails_small",
        ]:
            os.makedirs(os.path.join(self.test_media_root, thumb_dir), exist_ok=True)

        # Create dummy "old" thumbnail files with UUID names
        old_files = []
        for thumb_dir in [
            "thumbnails_big",
            "square_thumbnails",
            "square_thumbnails_small",
        ]:
            old_file = os.path.join(
                self.test_media_root, thumb_dir, f"{photo_uuid}.webp"
            )
            with open(old_file, "w") as f:
                f.write("dummy thumbnail")
            old_files.append(old_file)
            self.assertTrue(os.path.exists(old_file))

        # Simulate the migration logic (simplified version)
        for thumb_dir in [
            "thumbnails_big",
            "square_thumbnails",
            "square_thumbnails_small",
        ]:
            old_path = os.path.join(
                self.test_media_root, thumb_dir, f"{photo_uuid}.webp"
            )
            new_path = os.path.join(
                self.test_media_root, thumb_dir, f"{photo_hash}.webp"
            )

            if os.path.exists(old_path) and not os.path.exists(new_path):
                os.rename(old_path, new_path)

        # Verify files were renamed
        for thumb_dir in [
            "thumbnails_big",
            "square_thumbnails",
            "square_thumbnails_small",
        ]:
            old_path = os.path.join(
                self.test_media_root, thumb_dir, f"{photo_uuid}.webp"
            )
            new_path = os.path.join(
                self.test_media_root, thumb_dir, f"{photo_hash}.webp"
            )

            self.assertFalse(
                os.path.exists(old_path), f"Old file should not exist: {old_path}"
            )
            self.assertTrue(
                os.path.exists(new_path), f"New file should exist: {new_path}"
            )

    def test_bulk_update_performance(self):
        """Test that bulk_update is more efficient than individual saves"""
        # This test verifies the concept - actual migration uses bulk_update
        photos = []
        thumbnails = []

        for i in range(10):
            photo = create_test_photo(owner=self.user)
            photos.append(photo)
            thumbnails.append(photo.thumbnail)

        # Update thumbnails in bulk
        for thumbnail in thumbnails:
            thumbnail.thumbnail_big = f"updated_{thumbnail.thumbnail_big}"

        # Use bulk_update (this is what the migration does)
        Thumbnail.objects.bulk_update(thumbnails, ["thumbnail_big"], batch_size=1000)

        # Verify updates were applied
        for i, photo in enumerate(photos):
            photo.thumbnail.refresh_from_db()
            self.assertTrue(photo.thumbnail.thumbnail_big.name.startswith("updated_"))


================================================
FILE: api/tests/test_thumbnail_naming.py
================================================
"""
Tests for thumbnail naming using image_hash instead of UUID.
"""
import os
from unittest import mock
from django.test import TestCase
from django.conf import settings

from api.models import Photo, Thumbnail
from api.tests.utils import create_test_user, create_test_photo


class ThumbnailNamingTest(TestCase):
    """Test that thumbnails are named using image_hash instead of UUID"""

    def setUp(self):
        self.user = create_test_user()

    def test_thumbnail_uses_image_hash_not_uuid(self):
        """Verify that thumbnails use image_hash for file naming"""
        # Create a photo with thumbnail
        photo = create_test_photo(owner=self.user)
        
        # Verify photo has both UUID and image_hash
        self.assertIsNotNone(photo.id)  # UUID
        self.assertIsNotNone(photo.image_hash)  # Content hash
        self.assertNotEqual(str(photo.id), photo.image_hash)  # They should be different
        
        # Check that thumbnail exists
        self.assertTrue(hasattr(photo, 'thumbnail'))
        thumbnail = photo.thumbnail
        
        # Verify thumbnail paths use image_hash, not UUID
        self.assertIn(photo.image_hash, thumbnail.thumbnail_big.name)
        self.assertIn(photo.image_hash, thumbnail.square_thumbnail.name)
        self.assertIn(photo.image_hash, thumbnail.square_thumbnail_small.name)
        
        # Verify UUID is NOT in the thumbnail paths
        self.assertNotIn(str(photo.id), thumbnail.thumbnail_big.name)
        self.assertNotIn(str(photo.id), thumbnail.square_thumbnail.name)
        self.assertNotIn(str(photo.id), thumbnail.square_thumbnail_small.name)

    @mock.patch('api.models.thumbnail.create_thumbnail')
    @mock.patch('api.models.thumbnail.does_static_thumbnail_exist')
    def test_generate_thumbnail_uses_image_hash(self, mock_exists, mock_create):
        """Verify that _generate_thumbnail method uses image_hash"""
        # Mock to indicate thumbnails don't exist yet
        mock_exists.return_value = False
        mock_create.return_value = '/tmp/test.webp'
        
        # Create a photo
        photo = create_test_photo(owner=self.user)
        thumbnail = photo.thumbnail
        
        # Call _generate_thumbnail
        thumbnail._generate_thumbnail()
        
        # Verify create_thumbnail was called with image_hash, not UUID
        calls = mock_create.call_args_list
        for call in calls:
            kwargs = call[1]
            if 'hash' in kwargs:
                # The hash parameter should be the image_hash
                self.assertEqual(kwargs['hash'], photo.image_hash)
                # Should NOT be the UUID
                self.assertNotEqual(kwargs['hash'], str(photo.id))

    def test_thumbnail_file_naming_convention(self):
        """Test that thumbnail file names follow the correct pattern"""
        photo = create_test_photo(owner=self.user)
        thumbnail = photo.thumbnail
        
        # Check naming patterns
        expected_big = f"thumbnails_big/{photo.image_hash}.webp"
        expected_square = f"square_thumbnails/{photo.image_hash}.webp"
        expected_square_small = f"square_thumbnails_small/{photo.image_hash}.webp"
        
        self.assertEqual(thumbnail.thumbnail_big.name.strip(), expected_big)
        self.assertEqual(thumbnail.square_thumbnail.name.strip(), expected_square)
        self.assertEqual(thumbnail.square_thumbnail_small.name.strip(), expected_square_small)

    def test_video_thumbnail_naming(self):
        """Test that video thumbnails use .mp4 extension with image_hash"""
        photo = create_test_photo(owner=self.user, video=True)
        thumbnail = photo.thumbnail
        
        # Video thumbnails should use .mp4 for square thumbnails
        expected_big = f"thumbnails_big/{photo.image_hash}.webp"
        expected_square = f"square_thumbnails/{photo.image_hash}.mp4"
        expected_square_small = f"square_thumbnails_small/{photo.image_hash}.mp4"
        
        self.assertEqual(thumbnail.thumbnail_big.name.strip(), expected_big)
        self.assertEqual(thumbnail.square_thumbnail.name.strip(), expected_square)
        self.assertEqual(thumbnail.square_thumbnail_small.name.strip(), expected_square_small)


================================================
FILE: api/tests/test_trash_api.py
================================================
from django.test import TestCase
from rest_framework.test import APIClient

from api.tests.utils import create_test_photos, create_test_user


class TrashAPITest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)

    def test_trash_api_returns_deleted_images(self):
        """Test that the trash API returns albums containing deleted images"""

        # Create some test photos
        photos = create_test_photos(number_of_photos=3, owner=self.user)

        # Move one photo to trash
        photo_to_delete = photos[0]
        photo_to_delete.in_trashcan = True
        photo_to_delete.removed = False
        photo_to_delete.save()

        print(f"Created test photo with hash: {photo_to_delete.image_hash}")
        print(f"Photo in trashcan: {photo_to_delete.in_trashcan}")

        # Test the trash API endpoint
        response = self.client.get("/api/albums/date/list/?in_trashcan=true")

        print(f"API Response Status: {response.status_code}")

        # Check that the API responds successfully
        self.assertEqual(response.status_code, 200)

        data = response.json()

        # Check that we get the expected response structure
        self.assertIn("results", data)

        print(f"Number of results: {len(data['results'])}")

        # Verify that we can call the API successfully
        # (We might not have trashed albums with photos, but the API should work)
        if data["results"]:
            print("✅ Got album results - trash API is working")
            # If we have results, check the structure
            album = data["results"][0]
            self.assertIn("id", album)
            self.assertIn("date", album)
            self.assertIn("photo_count", album)
        else:
            print(
                "ℹ️ Got empty results (no trashed albums with photos) - but API structure is correct"
            )

        print("✅ Trash API test completed successfully")

    def test_trash_api_without_folder_parameter(self):
        """Test that the trash API works correctly when no folder parameter is provided"""

        # Test the trash API endpoint without folder parameter
        response = self.client.get("/api/albums/date/list/?in_trashcan=true")

        # Check that the API responds successfully
        self.assertEqual(response.status_code, 200)

        data = response.json()

        # Check that we get the expected response structure
        self.assertIn("results", data)

        print("✅ Trash API without folder parameter works correctly")


================================================
FILE: api/tests/test_user.py
================================================
import logging
from unittest.mock import patch

from constance.test import override_config
from django.core.management import call_command
from django.test import TestCase
from rest_framework.test import APIClient

from api.models import User
from api.tests.utils import create_test_user, create_user_details

logger = logging.getLogger(__name__)


def delete_all_users():
    User.objects.all().delete()
    # That's a weird one. When deleting all users, the user with username "deleted" is not deleted.
    User.objects.filter(username="deleted").delete()


class UserTest(TestCase):
    public_user_properties = [
        "id",
        "avatar_url",
        "username",
        "first_name",
        "last_name",
        "public_photo_count",
        "public_photo_samples",
    ]

    private_user_properties = [
        "id",
        "username",
        "email",
        "scan_directory",
        "confidence",
        "confidence_person",
        "transcode_videos",
        "semantic_search_topk",
        "first_name",
        "public_photo_samples",
        "last_name",
        "public_photo_count",
        "date_joined",
        "avatar",
        "is_superuser",
        "photo_count",
        "nextcloud_server_address",
        "nextcloud_username",
        "nextcloud_scan_directory",
        "avatar_url",
        "favorite_min_rating",
        "image_scale",
        "save_metadata_to_disk",
        "datetime_rules",
        "default_timezone",
        "public_sharing",
        "face_recognition_model",
        "min_cluster_size",
        "confidence_unknown_face",
        "min_samples",
        "burst_detection_rules",
        "skip_raw_files",
        "stack_raw_jpeg",
        "slideshow_interval",
        "duplicate_sensitivity",
        "duplicate_clear_existing",
        "cluster_selection_epsilon",
        "llm_settings",
        "text_alignment",
        "header_size",
        "save_face_tags_to_disk",
        "public_sharing_defaults",
    ]

    def setUp(self):
        self.client = APIClient()
        self.client.force_authenticate(user=None)
        self.admin = create_test_user(is_admin=True)
        self.user1 = create_test_user(public_sharing=True)
        self.user2 = create_test_user()

    def test_public_user_list_count(self):
        response = self.client.get("/api/user/")
        data = response.json()
        self.assertEqual(
            len(User.objects.filter(public_sharing=True)), len(data["results"])
        )

    def test_public_user_list_properties(self):
        response = self.client.get("/api/user/")
        data = response.json()
        for user in data["results"]:
            self.assertEqual(len(self.public_user_properties), len(user.keys()))
            for key in self.public_user_properties:
                self.assertTrue(key in user, f"user does not have key: {key}")

    def test_authenticated_user_list_count(self):
        self.client.force_authenticate(user=self.user1)
        response = self.client.get("/api/user/")
        data = response.json()
        self.assertEqual(len(User.objects.all()), len(data["results"]))

    def test_authenticated_user_list_properties(self):
        self.client.force_authenticate(user=self.user1)
        response = self.client.get("/api/user/")
        data = response.json()
        logger.debug(data)

        for user in data["results"]:
            for key in self.private_user_properties:
                self.assertTrue(key in user, f"user does not have key: {key}")
            for key in user:
                self.assertTrue(
                    key in self.private_user_properties,
                    f"user has superfluous key: {key}",
                )

            self.assertEqual(len(self.private_user_properties), len(user.keys()))

    def test_user_update_self(self):
        self.client.force_authenticate(user=self.user1)
        response = self.client.patch(
            f"/api/user/{self.user1.id}/", data={"first_name": "Updated"}
        )
        self.assertEqual(200, response.status_code)

    def test_public_update_user(self):
        response = self.client.patch(
            f"/api/user/{self.user1.id}/", data={"first_name": "Updated"}
        )
        self.assertEqual(401, response.status_code)

    def test_public_delete_user(self):
        response = self.client.delete(f"/api/user/{self.user1.id}/")
        self.assertEqual(401, response.status_code)

    @override_config(ALLOW_REGISTRATION=False)
    def test_super_user_create_with_command(self):
        with patch.dict("os.environ", {"ADMIN_PASSWORD": "demo1234"}):
            delete_all_users()
            call_command("createadmin", "demo", "demo@test.com")
            self.assertEqual(1, len(User.objects.all()))
            user = User.objects.get(username="demo")
            self.assertTrue(user.is_superuser)

    @override_config(ALLOW_REGISTRATION=False)
    def test_public_user_create_successful_on_first_setup(self):
        delete_all_users()
        self.client.force_authenticate(user=None)
        data = create_user_details()
        response = self.client.post("/api/user/", data=data)
        self.assertEqual(201, response.status_code)
        self.assertEqual(1, len(User.objects.all()))
        user = User.objects.get(username=data["username"])
        self.assertTrue(user.is_superuser)

    @override_config(ALLOW_REGISTRATION=True)
    def test_public_user_create_successful_when_registration_enabled(self):
        data = create_user_details()
        response = self.client.post("/api/user/", data=data)
        self.assertEqual(201, response.status_code)
        user = User.objects.get(username=data["username"])
        self.assertEqual(data["username"], user.username)
        self.assertEqual(data["email"], user.email)
        self.assertEqual(data["first_name"], user.first_name)
        self.assertEqual(data["last_name"], user.last_name)

    @override_config(ALLOW_REGISTRATION=True)
    def test_after_registration_user_can_authenticate(self):
        user = create_user_details()
        signup_response = self.client.post("/api/user/", data=user)
        self.assertEqual(201, signup_response.status_code)
        login_payload = {
            "username": user["username"],
            "password": user["password"],
        }
        response = self.client.post("/api/auth/token/obtain/", data=login_payload)
        self.assertEqual(200, response.status_code)
        data = response.json()
        self.assertTrue("access" in data.keys())
        self.assertTrue("refresh" in data.keys())

    @override_config(ALLOW_REGISTRATION=False)
    def test_public_user_create_fails_when_registration_disabled(self):
        response = self.client.post("/api/user/", data=create_user_details())
        # because IsAdminOrFirstTimeSetupOrRegistrationAllowed is **global** permission
        # on UserViewSet, we are returning 401 and not 403
        self.assertEqual(401, response.status_code)

    @override_config(ALLOW_REGISTRATION=True)
    def test_not_first_setup_create_admin_should_create_regular_user(self):
        data = create_user_details(is_admin=True)
        response = self.client.post("/api/user/", data=data)
        self.assertEqual(201, response.status_code)
        user = User.objects.get(username=data["username"])
        self.assertEqual(False, user.is_superuser)

    @override_config(ALLOW_REGISTRATION=True)
    def test_authenticated_user_cannot_create_superuser(self):
        """Authenticated non-admin users must not be able to create superuser accounts."""
        self.client.force_authenticate(user=self.user1)
        data = create_user_details(is_admin=True)
        response = self.client.post("/api/user/", data=data)
        self.assertEqual(201, response.status_code)
        user = User.objects.get(username=data["username"])
        self.assertFalse(user.is_superuser)
        self.assertFalse(user.is_staff)

    def test_user_update_another_user(self):
        self.client.force_authenticate(user=self.user1)
        response = self.client.patch(
            f"/api/user/{self.user2.id}/", data={"first_name": "Updated"}
        )
        self.assertEqual(403, response.status_code)

    def test_user_delete_another_user(self):
        self.client.force_authenticate(user=self.user1)
        response = self.client.delete(f"/api/user/{self.user2.id}/")
        self.assertEqual(403, response.status_code)

    def test_admin_create_user(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.post("/api/user/", data=create_user_details())
        self.assertEqual(201, response.status_code)

    def test_admin_partial_update_user(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.patch(
            f"/api/user/{self.user1.id}/", data={"first_name": "Updated"}
        )
        self.assertEqual(200, response.status_code)

    def test_admin_delete_user(self):
        self.client.force_authenticate(user=self.admin)
        response = self.client.delete(f"/api/user/{self.user1.id}/")
        self.assertEqual(204, response.status_code)

    @override_config(ALLOW_REGISTRATION=False)
    def test_first_time_setup_creates_user_when_registration_is_disabled(self):
        delete_all_users()
        response = self.client.post("/api/user/", data=create_user_details())
        self.assertEqual(201, response.status_code)

    def test_first_time_setup(self):
        delete_all_users()
        response = self.client.get("/api/firsttimesetup/")
        data = response.json()
        self.assertEqual(True, data["isFirstTimeSetup"])

    @override_config(ALLOW_REGISTRATION=True)
    def test_not_first_time_setup(self):
        data = create_user_details()
        signup_response = self.client.post("/api/user/", data=data)
        self.assertEqual(201, signup_response.status_code)
        user = User.objects.get(username=data["username"])
        self.client.force_authenticate(user=user)
        response = self.client.get("/api/firsttimesetup/")
        data = response.json()
        self.assertEqual(False, data["isFirstTimeSetup"])

    def test_regular_user_not_allowed_to_set_scan_directory(self):
        self.client.force_authenticate(user=self.user1)
        response = self.client.patch(
            f"/api/user/{self.user1.id}/", {"scan_directory": "/data"}
        )
        data = response.json()
        self.assertNotEqual("/data", data["scan_directory"])


================================================
FILE: api/tests/test_xmp_association.py
================================================
"""
Test for XMP sidecar association with photos.

This test validates that XMP sidecar files are correctly associated with their
corresponding photos when processed in the correct order (images first, then metadata).
"""
import os
import random
import tempfile
from unittest.mock import patch

from django.test import TestCase

from api.directory_watcher import create_new_image
from api.models import Photo
from api.tests.utils import create_test_user


def create_unique_png(seed=0):
    """
    Create a minimal PNG with unique content based on seed value.
    Different seeds produce different hashes.
    """
    # Minimal PNG with variable pixel data to ensure unique hashes
    color = seed % 256
    return (
        b"\x89PNG\r\n\x1a\n\x00\x00\x00\rIHDR\x00\x00\x00\x01\x00\x00\x00\x01"
        b"\x08\x06\x00\x00\x00\x1f\x15\xc4\x89\x00\x00\x00\nIDATx\x9cc" + bytes([color]) + b"\x01"
        b"\x00\x00\x05\x00\x01\r\n-\xb4\x00\x00\x00\x00IEND\xaeB`\x82"
    )


class XMPAssociationTest(TestCase):
    """
    Test that metadata files (XMP sidecars) are correctly associated with photos.
    
    This test validates the core logic without async complexity by directly calling
    create_new_image for both images and metadata files.
    """

    def test_xmp_association_after_image_creation(self):
        """
        Test that XMP files are correctly associated when processed after their images.
        
        This test simulates the real scenario that the sentinel handles:
        - Files arrive in random mixed order from directory scanning
        - The sentinel logic separates them into images and metadata
        - Images are processed first, then metadata
        
        We verify that even when files are discovered in random order (e.g., XMP before image),
        the separation and ordering logic ensures correct association.
        """
        user = create_test_user()
        
        with tempfile.TemporaryDirectory() as tmpdir:
            N = 4
            all_files = []  # Mixed list simulating random directory scan order
            
            # Create test files with unique images
            for i in range(N):
                base = f"img_{i}"
                img_path = os.path.join(tmpdir, f"{base}.jpg")
                xmp_path = os.path.join(tmpdir, f"{base}.xmp")
                
                with open(img_path, "wb") as f:
                    f.write(create_unique_png(i))  # Each image has unique hash
                with open(xmp_path, "wb") as f:
                    f.write(b"<x:xmpmeta>test</x:xmpmeta>")
                
                # Add to mixed list (will be shuffled to simulate random discovery)
                all_files.append(('image', img_path))
                all_files.append(('xmp', xmp_path))
            
            # Shuffle to simulate random file system ordering
            # This is the key: files can be discovered in ANY order
            random.shuffle(all_files)
            
            # Example of what the shuffled order might look like:
            # [('xmp', '.../img_2.xmp'), ('image', '.../img_0.jpg'), ('xmp', '.../img_1.xmp'), ...]
            # This simulates the real problem: XMP files may be discovered before their images!
            
            # Separate into images and metadata (simulating what scan_photos does)
            from api.models.file import is_metadata
            image_paths = [path for ftype, path in all_files if not is_metadata(path)]
            xmp_paths = [path for ftype, path in all_files if is_metadata(path)]
            
            # Verify separation happened correctly
            self.assertEqual(len(image_paths), N, "Should have N images")
            self.assertEqual(len(xmp_paths), N, "Should have N XMP files")
            
            # Mock pyvips to accept our test images
            with patch("pyvips.Image.thumbnail"):
                # Process images first (simulating what the sentinel ensures)
                # This is the critical ordering that the sentinel guarantees
                for img_path in image_paths:
                    photo = create_new_image(user, img_path)
                    self.assertIsNotNone(photo, f"Photo should be created for {img_path}")
                
                # Then process XMP files (after sentinel waits for image group completion)
                for xmp_path in xmp_paths:
                    create_new_image(user, xmp_path)
            
            # Validate: all photos should have their XMP sidecars
            photos = list(Photo.objects.filter(owner=user))
            self.assertEqual(len(photos), N, "All images should produce Photo objects")
            
            for photo in photos:
                xmp_files = list(photo.files.filter(path__endswith=".xmp"))
                base = os.path.splitext(os.path.basename(photo.main_file.path))[0]
                self.assertEqual(
                    len(xmp_files), 1,
                    f"Photo {base} should have exactly 1 XMP sidecar, got {len(xmp_files)}"
                )

    def test_xmp_processed_before_image_fails_gracefully(self):
        """
        Test that XMP files processed before their images are handled gracefully.
        
        Without the sentinel ordering, this would be the problematic scenario.
        The XMP should not be associated (logged as warning) and later when the
        image is processed, it won't automatically pick up the orphaned XMP.
        """
        user = create_test_user()
        
        with tempfile.TemporaryDirectory() as tmpdir:
            img_path = os.path.join(tmpdir, "test_img.jpg")
            xmp_path = os.path.join(tmpdir, "test_img.xmp")
            
            with open(img_path, "wb") as f:
                f.write(create_unique_png(100))  # Use seed 100 for this test
            with open(xmp_path, "wb") as f:
                f.write(b"<x:xmpmeta>test</x:xmpmeta>")
            
            with patch("pyvips.Image.thumbnail"):
                # Process XMP first (the problematic order that sentinel prevents)
                result_xmp = create_new_image(user, xmp_path)
                self.assertIsNone(result_xmp, "XMP without photo should return None")
                
                # Now process the image
                photo = create_new_image(user, img_path)
                self.assertIsNotNone(photo, "Photo should be created")
                
                # The XMP won't be auto-associated (this is expected without rescan)
                xmp_files = list(photo.files.filter(path__endswith=".xmp"))
                self.assertEqual(
                    len(xmp_files), 0,
                    "XMP processed before image won't be auto-associated"
                )
    
    def test_metadata_function_finds_matching_photo(self):
        """
        Test that the metadata association logic in create_new_image correctly
        finds and associates with existing photos.
        """
        user = create_test_user()
        
        with tempfile.TemporaryDirectory() as tmpdir:
            img_path = os.path.join(tmpdir, "matching_test.jpg")
            xmp_path = os.path.join(tmpdir, "matching_test.xmp")
            
            with open(img_path, "wb") as f:
                f.write(create_unique_png(200))  # Use seed 200 for this test
            with open(xmp_path, "wb") as f:
                f.write(b"<x:xmpmeta>test matching</x:xmpmeta>")
            
            with patch("pyvips.Image.thumbnail"):
                # Create photo first
                photo = create_new_image(user, img_path)
                self.assertIsNotNone(photo, "Photo should be created")
                initial_file_count = photo.files.count()
                
                # Process XMP - should find and associate with photo
                create_new_image(user, xmp_path)
                
                # Refresh and verify
                photo.refresh_from_db()
                self.assertEqual(
                    photo.files.count(), initial_file_count + 1,
                    "XMP file should be added to photo"
                )
                
                xmp_file = photo.files.filter(path=xmp_path).first()
                self.assertIsNotNone(xmp_file, "XMP file should be associated with photo")


================================================
FILE: api/tests/test_zip_list_photos_view_v2.py
================================================
from unittest.mock import patch

from django.test import TestCase
from django.utils import timezone
from rest_framework.test import APIClient

from api.models.long_running_job import LongRunningJob
from api.tests.utils import create_test_photos, create_test_user


class PhotoListWithoutTimestampTest(TestCase):
    def setUp(self):
        self.client = APIClient()
        self.user = create_test_user()
        self.client.force_authenticate(user=self.user)

    @patch("shutil.disk_usage")
    def test_download(self, patched_shutil):
        # test download function when we have enough storage
        patched_shutil.return_value.free = 500000000
        now = timezone.now()
        create_test_photos(number_of_photos=1, owner=self.user, added_on=now, size=100)

        response = self.client.get("/api/photos/notimestamp/")
        img_hash = response.json()["results"][0]["url"]
        datadict = {"owner": self.user, "image_hashes": [img_hash]}

        response_2 = self.client.post("/api/photos/download", data=datadict)
        lrr_job = LongRunningJob.objects.all()[0]
        self.assertEqual(lrr_job.job_id, response_2.json()["job_id"])
        self.assertEqual(response_2.status_code, 200)

        # test download function when we dont have enough storage
        patched_shutil.return_value.free = 0
        response_3 = self.client.post("/api/photos/download", data=datadict)
        self.assertEqual(response_3.status_code, 507)


================================================
FILE: api/tests/utils.py
================================================
import secrets
import uuid
from typing import Any

import numpy as np
from django.utils import timezone
from faker import Faker

from api.models import Cluster, Face, File, Person, Photo, User

fake = Faker()

ONE_PIXEL_PNG = (
    b"\x89PNG\r\n\x1a\n\x00\x00\x00\rIHDR\x00\x00\x00\x01\x00\x00\x00\x01\x08\x02\x00\x00\x00\xb1\x1e\x28"
    b"\x00\x00\x00\x03PLTE\xff\xff\xff\xff\xff\xff\x00\x00\x00\x00IEND\xaeB`\x82"
)


def create_password():
    return secrets.token_urlsafe(10)


def create_user_details(is_admin=False):
    return {
        "username": fake.user_name(),
        "first_name": fake.first_name(),
        "last_name": fake.last_name(),
        "email": fake.email(),
        "password": create_password(),
        "is_superuser": is_admin,
    }


def create_test_person(
    name: str | None = None,
    kind: str | None = Person.KIND_USER,
    cover_photo: Photo | None = None,
    cover_face: Face | None = None,
    face_count: int = 0,
    cluster_owner: User | None = None,
    **kwargs: Any,
) -> Person:
    """Create a test Person object with random data using Faker."""
    return Person.objects.create(
        name=name or fake.name(),
        kind=kind,
        cover_photo=cover_photo,
        cover_face=cover_face,
        face_count=face_count,
        cluster_owner=cluster_owner,
        **kwargs,
    )


def create_test_face(
    photo: Photo | None = None,
    image: str | None = "test.jpg",
    person: Person | None = None,
    classification_person: Person | None = None,
    classification_probability: float = 0.0,
    cluster_person: Person | None = None,
    cluster_probability: float = 0.0,
    deleted: bool = False,
    cluster: Cluster | None = None,
    location_top: int = 0,
    location_bottom: int = 0,
    location_left: int = 0,
    location_right: int = 0,
    encoding: str | None = None,
    **kwargs: Any,
) -> Face:
    """Create a test Face object with random data using Faker."""
    return Face.objects.create(
        photo=photo,
        image=image,
        person=person,
        classification_person=classification_person,
        classification_probability=classification_probability
        or fake.pyfloat(min_value=0, max_value=1),
        cluster_person=cluster_person,
        cluster_probability=cluster_probability
        or fake.pyfloat(min_value=0, max_value=1),
        deleted=deleted,
        cluster=cluster,
        location_top=location_top or fake.random_int(min=0, max=500),
        location_bottom=location_bottom or fake.random_int(min=501, max=1000),
        location_left=location_left or fake.random_int(min=0, max=500),
        location_right=location_right or fake.random_int(min=501, max=1000),
        encoding=encoding or np.random.rand(128).tobytes().hex(),
        **kwargs,
    )


def create_test_user(is_admin=False, public_sharing=False, **kwargs):
    import uuid

    # Ensure unique username by appending UUID
    username = fake.user_name() + str(uuid.uuid4())[:8]
    return User.objects.create(
        username=username,
        first_name=fake.first_name(),
        last_name=fake.last_name(),
        email=fake.email(),
        password=create_password(),
        public_sharing=public_sharing,
        is_superuser=is_admin,
        is_staff=is_admin,
        **kwargs,
    )


def create_test_photo(**kwargs):
    from api.models.thumbnail import Thumbnail
    from api.models.photo_caption import PhotoCaption
    from api.models.photo_search import PhotoSearch
    from api.models.photo_metadata import PhotoMetadata

    # Use proper UUID for primary key (Photo model now uses UUIDField)
    pk = uuid.uuid4()
    # Use MD5 for image_hash (content hash for deduplication)
    image_hash = fake.md5()

    # Extract fields that are no longer part of Photo model
    aspect_ratio = kwargs.pop("aspect_ratio", 1)
    is_video = kwargs.get("video", False)
    square_ext = ".mp4" if is_video else ".webp"
    thumbnail_big = kwargs.pop("thumbnail_big", f"thumbnails_big/{image_hash}.webp")
    square_thumbnail = kwargs.pop(
        "square_thumbnail", f"square_thumbnails/{image_hash}{square_ext}"
    )
    square_thumbnail_small = kwargs.pop(
        "square_thumbnail_small", f"square_thumbnails_small/{image_hash}{square_ext}"
    )
    dominant_color = kwargs.pop("dominant_color", None)

    # Extract caption and search fields
    captions_json = kwargs.pop("captions_json", None)
    search_captions = kwargs.pop("search_captions", None)
    search_location = kwargs.pop("search_location", None)

    # Extract metadata fields that are now in PhotoMetadata model
    # Map old field names to new PhotoMetadata field names
    metadata_field_mapping = {
        "camera": "camera_model",  # Old 'camera' -> new 'camera_model'
        "lens": "lens_model",  # Old 'lens' -> new 'lens_model'
        "iso": "iso",
        "fstop": "aperture",  # Old 'fstop' -> new 'aperture'
        "focal_length": "focal_length",
        "shutter_speed": "shutter_speed",
        "focalLength35Equivalent": "focal_length_35mm",
        "digitalZoomRatio": None,  # Not in new model, discard
        "subjectDistance": None,  # Not in new model, discard
        "width": "width",
        "height": "height",
        "orientation": "orientation",
        "gps_lat": "gps_latitude",
        "gps_lon": "gps_longitude",
        "gps_altitude": "gps_altitude",
        # Also support new field names directly
        "camera_make": "camera_make",
        "camera_model": "camera_model",
        "lens_make": "lens_make",
        "lens_model": "lens_model",
        "aperture": "aperture",
        "focal_length_35mm": "focal_length_35mm",
        "gps_latitude": "gps_latitude",
        "gps_longitude": "gps_longitude",
    }
    metadata_fields = {}
    for old_name, new_name in metadata_field_mapping.items():
        if old_name in kwargs:
            value = kwargs.pop(old_name)
            if new_name is not None:  # Skip fields that don't exist in new model
                metadata_fields[new_name] = value

    # Create the photo with remaining kwargs
    photo = Photo(pk=pk, image_hash=image_hash, **kwargs)
    file = create_test_file(f"/tmp/{image_hash}.png", photo.owner, ONE_PIXEL_PNG)
    photo.main_file = file
    if "added_on" not in kwargs.keys():
        photo.added_on = timezone.now()
    photo.save()

    # Create thumbnail for the photo
    Thumbnail.objects.create(
        photo=photo,
        aspect_ratio=aspect_ratio,
        thumbnail_big=thumbnail_big,
        square_thumbnail=square_thumbnail,
        square_thumbnail_small=square_thumbnail_small,
        dominant_color=dominant_color,
    )

    # Create PhotoCaption if captions_json is provided
    if captions_json is not None:
        PhotoCaption.objects.create(photo=photo, captions_json=captions_json)

    # Create PhotoSearch if search fields are provided
    if search_captions is not None or search_location is not None:
        PhotoSearch.objects.create(
            photo=photo,
            search_captions=search_captions,
            search_location=search_location,
        )

    # Create PhotoMetadata if metadata fields are provided
    if metadata_fields:
        PhotoMetadata.objects.create(photo=photo, **metadata_fields)

    return photo


def create_test_photos(number_of_photos=1, **kwargs):
    return [create_test_photo(**kwargs) for _ in range(0, number_of_photos)]


def create_test_photos_with_faces(number_of_photos=1, **kwargs):
    photos = create_test_photos(number_of_photos, **kwargs)
    [create_test_face(photo=photo) for photo in photos]
    return photos


def create_test_file(path: str, user: User, content: bytes):
    with open(path, "wb+") as f:
        f.write(content)
    return File.create(path, user)


def share_test_photos(photo_ids, user):
    """Share photos with a user.

    Args:
        photo_ids: Can be either photo UUIDs (pk) or image_hashes (for backward compatibility)
        user: The user to share photos with
    """
    # Handle both UUID (pk) and image_hash inputs for backward compatibility
    resolved_ids = []
    for photo_id in photo_ids:
        if isinstance(photo_id, uuid.UUID):
            resolved_ids.append(photo_id)
        elif isinstance(photo_id, str):
            # Try to find photo by image_hash
            try:
                photo = Photo.objects.get(image_hash=photo_id)
                resolved_ids.append(photo.pk)
            except Photo.DoesNotExist:
                # Maybe it's a UUID string
                try:
                    resolved_ids.append(uuid.UUID(photo_id))
                except ValueError:
                    raise ValueError(f"Could not resolve photo_id: {photo_id}")
        else:
            resolved_ids.append(photo_id)

    Photo.shared_to.through.objects.bulk_create(
        [
            Photo.shared_to.through(user_id=user.id, photo_id=photo_id)
            for photo_id in resolved_ids
        ]
    )


================================================
FILE: api/thumbnails.py
================================================
import os
import subprocess

import pyvips
import requests
from django.conf import settings

from api import util
from api.models.file import is_raw


def create_thumbnail(input_path, output_height, output_path, hash, file_type):
    try:
        if is_raw(input_path):
            if "thumbnails_big" in output_path:
                complete_path = os.path.join(
                    settings.MEDIA_ROOT, output_path, hash + file_type
                )
                json = {
                    "source": input_path,
                    "destination": complete_path,
                    "height": output_height,
                }
                response = requests.post("http://localhost:8003/", json=json).json()
                return response["thumbnail"]
            else:
                # only encode raw image in worse case, smaller thumbnails can get created from the big thumbnail instead
                big_thumbnail_path = os.path.join(
                    settings.MEDIA_ROOT, "thumbnails_big", hash + file_type
                )
                x = pyvips.Image.thumbnail(
                    big_thumbnail_path,
                    10000,
                    height=output_height,
                    size=pyvips.enums.Size.DOWN,
                )
                complete_path = os.path.join(
                    settings.MEDIA_ROOT, output_path, hash + file_type
                )
                x.write_to_file(complete_path, Q=95)
            return complete_path
        else:
            x = pyvips.Image.thumbnail(
                input_path, 10000, height=output_height, size=pyvips.enums.Size.DOWN
            )
            complete_path = os.path.join(
                settings.MEDIA_ROOT, output_path, hash + file_type
            )
            x.write_to_file(complete_path, Q=95)
            return complete_path
    except Exception as e:
        util.logger.error(f"Could not create thumbnail for file {input_path}")
        raise e


def create_animated_thumbnail(input_path, output_height, output_path, hash, file_type):
    try:
        output = os.path.join(
            settings.MEDIA_ROOT, output_path, hash + file_type
        )
        command = [
            "ffmpeg",
            "-i",
            input_path,
            "-to",
            "00:00:05",
            "-vcodec",
            "libx264",
            "-crf",
            "20",
            "-an",
            "-filter:v",
            f"scale=-2:{output_height}",
            output,
        ]

        with subprocess.Popen(command) as proc:
            proc.wait()
    except Exception as e:
        util.logger.error(f"Could not create animated thumbnail for file {input_path}")
        raise e


def create_thumbnail_for_video(input_path, output_path, hash, file_type):
    try:
        output = os.path.join(
            settings.MEDIA_ROOT, output_path, hash + file_type
        )
        command = [
            "ffmpeg",
            "-i",
            input_path,
            "-ss",
            "00:00:00.000",
            "-vframes",
            "1",
            output,
        ]

        with subprocess.Popen(command) as proc:
            proc.wait()
    except Exception as e:
        util.logger.error(f"Could not create thumbnail for video file {input_path}")
        raise e


def does_static_thumbnail_exist(output_path, hash):
    return os.path.exists(
        os.path.join(settings.MEDIA_ROOT, output_path, hash + ".webp")
    )


def does_video_thumbnail_exist(output_path, hash):
    return os.path.exists(
        os.path.join(settings.MEDIA_ROOT, output_path, hash + ".mp4")
    )


================================================
FILE: api/util.py
================================================
import logging.handlers
import os
import os.path

from django.conf import settings

logger = logging.getLogger("ownphotos")
formatter = logging.Formatter(
    "%(asctime)s : %(filename)s : %(funcName)s : %(lineno)s : %(levelname)s : %(message)s"
)
FILE_MAX_BYTE = 256 * 1024 * 200  # 100MB
FILE_HANDLER = logging.handlers.RotatingFileHandler(
    os.path.join(settings.LOGS_ROOT, "ownphotos.log"),
    maxBytes=FILE_MAX_BYTE,
    backupCount=10,
)
FILE_HANDLER.setFormatter(formatter)
logger.addHandler(FILE_HANDLER)
logger.setLevel(logging.INFO)


def is_valid_path(path, root_path):
    # Resolve absolute paths to prevent directory traversal attacks
    abs_path = os.path.abspath(path)
    abs_root = os.path.abspath(root_path)

    try:
        common = os.path.commonpath([abs_path, abs_root])
    except ValueError:
        # Raised when paths are on different drives
        return False

    if common != abs_root:
        return False

    # Guard against paths that merely share a prefix with the root path
    # (e.g. /root and /root_dir). By normalising with os.path.commonpath
    # and checking for path separators we ensure the path really resides
    # within the root directory or is the directory itself.
    return abs_path == abs_root or abs_path.startswith(abs_root + os.sep)


def is_number(s):
    try:
        float(s)
        return True
    except Exception:
        return False


def convert_to_degrees(values):
    """Helper function to convert the GPS coordinates stored in the EXIF to degrees in float format
    :param value:
    :type value: exifread.utils.Ratio
    :rtype: float
    """
    d = float(values[0].num) / float(values[0].den)
    m = float(values[1].num) / float(values[1].den)
    s = float(values[2].num) / float(values[2].den)

    return d + (m / 60.0) + (s / 3600.0)


weekdays = {
    1: "Monday",
    2: "Tuesday",
    3: "Wednesday",
    4: "Thursday",
    5: "Friday",
    6: "Saturday",
    7: "Sunday",
}


================================================
FILE: api/views/__init__.py
================================================


================================================
FILE: api/views/album_auto.py
================================================
import uuid

from django.db.models import Count, OuterRef, Prefetch, Q, Subquery
from django_q.tasks import AsyncTask
from drf_spectacular.utils import extend_schema
from rest_framework import filters, viewsets
from rest_framework.decorators import action
from rest_framework.response import Response
from rest_framework.views import APIView

from api.autoalbum import generate_event_albums, regenerate_event_titles
from api.models import AlbumAuto, Face, Person, Photo
from api.serializers.album_auto import AlbumAutoListSerializer, AlbumAutoSerializer
from api.util import logger
from api.views.custom_api_view import ListViewSet
from api.views.pagination import StandardResultsSetPagination


# TODO: This is a fetches with too many queries. We need to optimize this.
class AlbumAutoViewSet(viewsets.ModelViewSet):
    serializer_class = AlbumAutoSerializer
    pagination_class = StandardResultsSetPagination

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return AlbumAuto.objects.none()

        return (
            AlbumAuto.objects.prefetch_related(
                Prefetch("owner"),
                Prefetch("photos", queryset=Photo.visible.all()),
                Prefetch("photos__faces"),
                Prefetch(
                    "photos__faces__person",
                    queryset=Person.objects.all().annotate(
                        viewable_face_count=Count("faces"),
                        face_url=Subquery(
                            Face.objects.filter(
                                person=OuterRef("pk"),
                                photo__hidden=False,
                                photo__in_trashcan=False,
                                photo__owner=self.request.user,
                            )
                            .order_by("id")
                            .values("image")[:1]
                        ),
                        face_photo_url=Subquery(
                            Photo.objects.filter(
                                faces__person=OuterRef("pk"),
                                hidden=False,
                                in_trashcan=False,
                                owner=self.request.user,
                            )
                            .order_by("added_on")
                            .values("image_hash")[:1]
                        ),
                        video=Subquery(
                            Photo.objects.filter(
                                faces__person=OuterRef("pk"),
                                hidden=False,
                                in_trashcan=False,
                                owner=self.request.user,
                            )
                            .order_by("added_on")
                            .values("video")[:1]
                        ),
                    ),
                ),
            )
            .annotate(photo_count=Count(("photos"), distinct=True))
            .filter(Q(photo_count__gt=0) & Q(owner=self.request.user))
            .order_by("-timestamp")
        )

    @action(detail=False, methods=["post"])
    def delete_all(self, request):
        AlbumAuto.objects.filter(owner=request.user).all().delete()
        return Response("success")


# TODO: Add custom covers for auto album
class AlbumAutoListViewSet(ListViewSet):
    serializer_class = AlbumAutoListSerializer
    pagination_class = StandardResultsSetPagination
    filter_backends = (filters.SearchFilter,)
    search_fields = [
        "photos__search_instance__search_captions",
        "photos__search_instance__search_location",
        "photos__faces__person__name",
    ]

    def get_queryset(self):
        cover_photo_query = Photo.objects.filter(hidden=False)
        return (
            AlbumAuto.objects.annotate(
                photo_count=Count(
                    "photos", filter=Q(photos__hidden=False), distinct=True
                )
            )
            .filter(Q(photo_count__gt=0) & Q(owner=self.request.user))
            .prefetch_related(
                Prefetch(
                    "photos", queryset=cover_photo_query[:1], to_attr="cover_photo"
                )
            )
            .order_by("-timestamp")
        )


class RegenerateAutoAlbumTitles(APIView):
    @extend_schema(
        deprecated=True,
        description="Use POST method to re-generate auto album titles.",
    )
    def get(self, request, format=None):
        return self._schedule_auto_album_title_regeneration(request)

    def post(self, request, format=None):
        return self._schedule_auto_album_title_regeneration(request)

    def _schedule_auto_album_title_regeneration(self, request, format=None):
        try:
            job_id = uuid.uuid4()
            AsyncTask(regenerate_event_titles, request.user, job_id).run()
            return Response({"status": True, "job_id": job_id})
        except BaseException as e:
            logger.error(str(e))
            return Response({"status": False})


class AutoAlbumGenerateView(APIView):
    @extend_schema(
        deprecated=True,
        description="Use POST method to re-generate auto albums.",
    )
    def get(self, request, format=None):
        return self._schedule_auto_album_regeneration(request)

    def post(self, request, format=None):
        return self._schedule_auto_album_regeneration(request)

    def _schedule_auto_album_regeneration(self, request):
        try:
            job_id = uuid.uuid4()
            AsyncTask(generate_event_albums, request.user, job_id).run()
            return Response({"status": True, "job_id": job_id})
        except BaseException as e:
            logger.error(str(e))
            return Response({"status": False})


================================================
FILE: api/views/album_folder.py
================================================
import os
from rest_framework import viewsets
from rest_framework.decorators import action
from rest_framework.permissions import IsAuthenticated
from rest_framework.response import Response
from django.conf import settings
from django.db.models import Count, Q

from api.util import logger
from api.models.photo import Photo


class FolderNavigationViewSet(viewsets.ViewSet):
    """
    ViewSet for folder navigation functionality.
    Returns paginated subfolders for a given path (max 100 per page).
    Only queries photo counts for folders in the current page for optimal performance.

    Query Parameters:
    - path: The directory path to list subfolders for
    - page: Page number for pagination (default: 1)

    Security:
    - Admins (is_staff=True) can access all folders within DATA_ROOT
    - Regular users can only access folders within their scan_directory
    - All paths are validated to prevent directory traversal attacks
    """

    permission_classes = [IsAuthenticated]

    @action(detail=False, methods=["get"])
    def subfolders(self, request):
        """Get subfolders for a given path with pagination."""
        # Get pagination parameters
        try:
            page = int(request.query_params.get("page", 1))
            if page < 1:
                page = 1
        except (ValueError, TypeError):
            page = 1

        page_size = 100  # Fixed page size of 100 folders

        # Determine default path based on user permissions
        is_admin = request.user.is_staff if request.user else False

        if is_admin:
            default_path = settings.DATA_ROOT
        else:
            # For regular users, default to their scan directory
            if hasattr(request.user, "scan_directory") and request.user.scan_directory:
                default_path = request.user.scan_directory
            else:
                return Response(
                    {"error": "User scan directory not configured"}, status=403
                )

        base_path = request.query_params.get("path", default_path)

        # Validate path is within allowed directories
        if not os.path.exists(base_path):
            return Response({"error": "Path does not exist"}, status=400)

        if not os.path.isdir(base_path):
            return Response({"error": "Path is not a directory"}, status=400)

        # Security check - determine allowed paths based on user permissions
        is_admin = request.user.is_staff if request.user else False

        if is_admin:
            # Admins can access all folders within DATA_ROOT
            if not base_path.startswith(settings.DATA_ROOT):
                return Response({"error": "Access denied"}, status=403)
        else:
            # Regular users can only access folders within their scan directory
            if (
                not hasattr(request.user, "scan_directory")
                or not request.user.scan_directory
            ):
                return Response(
                    {"error": "User scan directory not configured"}, status=403
                )

            # Ensure scan directory exists
            scan_directory = request.user.scan_directory
            if not os.path.exists(scan_directory):
                return Response({"error": "Scan directory does not exist"}, status=403)

            # Ensure requested path is within user's scan directory
            if not base_path.startswith(scan_directory):
                return Response(
                    {
                        "error": "Access denied - can only access folders within your scan directory"
                    },
                    status=403,
                )

        try:
            # Gather immediate subfolders and their mtimes
            folder_entries = []
            for item in os.scandir(base_path):
                if item.is_dir() and not item.name.startswith("."):
                    folder_entries.append(
                        (item.name, item.path, os.path.getmtime(item.path))
                    )

            # Early return if there are no subfolders
            if not folder_entries:
                if is_admin:
                    parent_path = (
                        os.path.dirname(base_path)
                        if base_path != settings.DATA_ROOT
                        else None
                    )
                else:
                    parent_path = (
                        os.path.dirname(base_path)
                        if base_path != request.user.scan_directory
                        else None
                    )
                return Response(
                    {
                        "current_path": base_path,
                        "parent_path": parent_path,
                        "subfolders": [],
                        "pagination": {
                            "page": page,
                            "page_size": page_size,
                            "total_folders": 0,
                            "total_pages": 0,
                            "has_next": False,
                            "has_previous": page > 1,
                        },
                    }
                )

            # Sort folder entries by name first
            folder_entries.sort(key=lambda x: x[0].lower())

            # Apply pagination to folder entries before querying database
            total_folders_all = len(folder_entries)
            total_pages_all = (
                total_folders_all + page_size - 1
            ) // page_size  # Ceiling division

            start_idx = (page - 1) * page_size
            end_idx = start_idx + page_size
            paginated_entries = folder_entries[start_idx:end_idx]

            # Early return if no folders in this page
            if not paginated_entries:
                if is_admin:
                    parent_path = (
                        os.path.dirname(base_path)
                        if base_path != settings.DATA_ROOT
                        else None
                    )
                else:
                    parent_path = (
                        os.path.dirname(base_path)
                        if base_path != request.user.scan_directory
                        else None
                    )
                return Response(
                    {
                        "current_path": base_path,
                        "parent_path": parent_path,
                        "subfolders": [],
                        "pagination": {
                            "page": page,
                            "page_size": page_size,
                            "total_folders": total_folders_all,
                            "total_pages": total_pages_all,
                            "has_next": page < total_pages_all,
                            "has_previous": page > 1,
                        },
                    }
                )

            # Query database only for the folders we need (paginated ones)
            aggregates = {}
            for idx, (_, folder_path, _) in enumerate(paginated_entries):
                aggregates[f"count_{idx}"] = Count(
                    "pk", filter=Q(files__path__startswith=folder_path), distinct=True
                )

            counts = Photo.objects.filter(owner=request.user).aggregate(**aggregates)

            # Build response for paginated folders
            paginated_subfolders = []
            for idx, (name, folder_path, mtime) in enumerate(paginated_entries):
                photo_count = counts.get(f"count_{idx}", 0) or 0
                if photo_count > 0:
                    paginated_subfolders.append(
                        {
                            "name": name,
                            "path": folder_path,
                            "photo_count": photo_count,
                            "modified": mtime,
                        }
                    )

            # Calculate parent path respecting user permissions
            if is_admin:
                parent_path = (
                    os.path.dirname(base_path)
                    if base_path != settings.DATA_ROOT
                    else None
                )
            else:
                parent_path = (
                    os.path.dirname(base_path)
                    if base_path != request.user.scan_directory
                    else None
                )

            return Response(
                {
                    "current_path": base_path,
                    "parent_path": parent_path,
                    "subfolders": paginated_subfolders,
                    "pagination": {
                        "page": page,
                        "page_size": page_size,
                        "total_folders": total_folders_all,
                        "total_pages": total_pages_all,
                        "has_next": page < total_pages_all,
                        "has_previous": page > 1,
                    },
                }
            )

        except Exception as e:
            logger.error(f"Error scanning directory {base_path}: {e}")
            return Response({"error": "Error scanning directory"}, status=500)


================================================
FILE: api/views/albums.py
================================================
import re

from django.core.paginator import EmptyPage, PageNotAnInteger, Paginator
from django.db.models import Count, F, Prefetch, Q
from drf_spectacular.utils import OpenApiParameter, OpenApiTypes, extend_schema
from rest_framework import filters, viewsets
from rest_framework.permissions import AllowAny, IsAuthenticated
from rest_framework.response import Response

from api.models import (
    AlbumDate,
    AlbumPlace,
    AlbumThing,
    AlbumUser,
    Face,
    File,
    Person,
    Photo,
    User,
)
from api.models.photo_stack import PhotoStack
from api.serializers.album_date import (
    AlbumDateSerializer,
    IncompleteAlbumDateSerializer,
)
from api.serializers.album_place import (
    AlbumPlaceListSerializer,
    AlbumPlaceSerializer,
    GroupedPlacePhotosSerializer,
)
from api.serializers.album_thing import (
    AlbumThingListSerializer,
    AlbumThingSerializer,
    GroupedThingPhotosSerializer,
)
from api.serializers.album_user import (
    AlbumUserListSerializer,
    AlbumUserPublicSerializer,
    AlbumUserSerializer,
)
from api.serializers.person import GroupedPersonPhotosSerializer, PersonSerializer
from api.serializers.photos import PhotoSummarySerializer
from api.util import logger
from api.views.custom_api_view import ListViewSet
from api.views.pagination import (
    RegularResultsSetPagination,
    StandardResultsSetPagination,
)


# To-Do: Not used as far as I can tell, only in mobile app
@extend_schema(
    deprecated=True,
    description="This endpoint is deprecated. Use /api/persons instead.",
)
class AlbumPersonViewSet(viewsets.ModelViewSet):
    serializer_class = GroupedPersonPhotosSerializer

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return Person.objects.none()

        return (
            Person.objects.annotate(
                photo_count=Count(
                    "faces", filter=Q(faces__photo__hidden=False), distinct=True
                )
            )
            .filter(Q(photo_count__gt=0))
            .prefetch_related(
                Prefetch(
                    "faces",
                    queryset=Face.objects.filter(Q(person__isnull=False)),
                )
            )
            .prefetch_related(
                Prefetch(
                    "faces__photo",
                    queryset=Photo.objects.filter(
                        Q(faces__photo__hidden=False) & Q(owner=self.request.user)
                    )
                    .distinct()
                    .order_by("-exif_timestamp")
                    .only("image_hash", "exif_timestamp", "rating", "public", "hidden"),
                )
            )
        )

    def retrieve(self, *args, **kwargs):
        queryset = self.get_queryset()
        logger.warning(args[0].__str__())
        albumid = re.findall(r"\'(.+?)\'", args[0].__str__())[0].split("/")[-2]
        serializer = GroupedPersonPhotosSerializer(
            queryset.filter(id=albumid).first(), context={"request": self.request}
        )
        return Response({"results": serializer.data})

    def list(self, *args, **kwargs):
        queryset = self.get_queryset()
        serializer = GroupedPersonPhotosSerializer(
            queryset, many=True, context={"request": self.request}
        )
        return Response({"results": serializer.data})


class PersonViewSet(viewsets.ModelViewSet):
    serializer_class = PersonSerializer
    pagination_class = StandardResultsSetPagination
    filter_backends = (filters.SearchFilter,)
    search_fields = ["name"]
    ordering_fields = ["name"]

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return Person.objects.none()
        qs = (
            Person.objects.filter(
                Q(kind=Person.KIND_USER) & Q(cluster_owner=self.request.user)
            )
            .select_related("cover_photo", "cover_face")
            .only(
                "name",
                "face_count",
                "id",
                "cover_face",
                "cover_photo",
            )
            .order_by("name")
        )

        return qs


def _get_active_tag_thing_types():
    """Return the AlbumThing thing_type values for the active tagging model."""
    from constance import config as site_config

    tagging_model = site_config.TAGGING_MODEL
    if tagging_model == "siglip2":
        return ["siglip2_tag"]
    return ["places365_attribute", "places365_category"]


class AlbumThingViewSet(viewsets.ModelViewSet):
    serializer_class = AlbumThingSerializer
    pagination_class = StandardResultsSetPagination

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return AlbumThing.objects.none()
        active_types = _get_active_tag_thing_types()
        return (
            AlbumThing.objects.filter(Q(owner=self.request.user))
            .filter(Q(photo_count__gt=0))
            .filter(Q(thing_type__in=active_types) | Q(thing_type="hashtag_attribute"))
            .prefetch_related(
                Prefetch(
                    "photos",
                    queryset=Photo.visible.order_by("-exif_timestamp"),
                ),
                Prefetch(
                    "photos__owner",
                    queryset=User.objects.only(
                        "id", "username", "first_name", "last_name"
                    ),
                ),
            )
            .order_by("title")
        )

    def retrieve(self, *args, **kwargs):
        queryset = self.get_queryset()
        logger.warning(args[0].__str__())
        albumid = re.findall(r"\'(.+?)\'", args[0].__str__())[0].split("/")[-2]
        serializer = GroupedThingPhotosSerializer(
            queryset.filter(id=albumid).first(), context={"request": self.request}
        )
        return Response({"results": serializer.data})

    def list(self, *args, **kwargs):
        queryset = self.get_queryset()
        serializer = GroupedThingPhotosSerializer(
            queryset, many=True, context={"request": self.request}
        )
        return Response({"results": serializer.data})


# To-Do: Could be literally the list command in AlbumThingViewSet
class AlbumThingListViewSet(ListViewSet):
    serializer_class = AlbumThingListSerializer
    pagination_class = StandardResultsSetPagination
    filter_backends = (filters.SearchFilter,)
    search_fields = ["title"]

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return AlbumThing.objects.none()

        active_types = _get_active_tag_thing_types()
        queryset = (
            AlbumThing.objects.filter(owner=self.request.user)
            .prefetch_related("cover_photos")
            .filter(photo_count__gt=0)
            .filter(Q(thing_type__in=active_types) | Q(thing_type="hashtag_attribute"))
            .order_by("-title")
        )

        return queryset


class AlbumPlaceViewSet(viewsets.ModelViewSet):
    serializer_class = AlbumPlaceSerializer
    pagination_class = StandardResultsSetPagination

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return AlbumPlace.objects.none()
        return (
            AlbumPlace.objects.annotate(
                photo_count=Count(
                    "photos", filter=Q(photos__hidden=False), distinct=True
                )
            )
            .filter(Q(photo_count__gt=0) & Q(owner=self.request.user))
            .prefetch_related(
                Prefetch(
                    "photos",
                    queryset=Photo.objects.filter(hidden=False)
                    .only("image_hash", "public", "rating", "hidden", "exif_timestamp")
                    .order_by("-exif_timestamp"),
                )
            )
            .order_by("title")
        )

    def retrieve(self, *args, **kwargs):
        queryset = self.get_queryset()
        logger.warning(args[0].__str__())
        albumid = re.findall(r"\'(.+?)\'", args[0].__str__())[0].split("/")[-2]
        serializer = GroupedPlacePhotosSerializer(
            queryset.filter(id=albumid).first(), context={"request": self.request}
        )
        return Response({"results": serializer.data})


# To-Do: Could be literally the list command in AlbumPlaceViewSet
class AlbumPlaceListViewSet(ListViewSet):
    serializer_class = AlbumPlaceListSerializer
    pagination_class = StandardResultsSetPagination
    filter_backends = (filters.SearchFilter,)
    search_fields = ["title"]

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return AlbumPlace.objects.none()
        cover_photos_query = Photo.objects.filter(hidden=False).only(
            "image_hash", "video"
        )

        return (
            AlbumPlace.objects.filter(owner=self.request.user)
            .annotate(
                photo_count=Count(
                    "photos", filter=Q(photos__hidden=False), distinct=True
                )
            )
            .prefetch_related(
                Prefetch(
                    "photos", queryset=cover_photos_query[:4], to_attr="cover_photos"
                )
            )
            .filter(Q(photo_count__gt=0) & Q(owner=self.request.user))
            .order_by("title")
        )


class AlbumUserViewSet(viewsets.ModelViewSet):
    serializer_class = AlbumUserSerializer
    pagination_class = StandardResultsSetPagination

    def perform_create(self, serializer):
        serializer.save(owner=self.request.user)

    def get_queryset(self):
        # Support public access when explicitly requested
        if self.request.query_params.get("public"):
            # Anyone can view a public album if the album itself is marked public and active (not expired)
            username = self.request.query_params.get("username")
            from django.utils import timezone

            # Use share model exclusively
            base_qs = AlbumUser.objects.filter(
                Q(share__enabled=True)
                & (
                    Q(share__expires_at__isnull=True)
                    | Q(share__expires_at__gte=timezone.now())
                )
            )
            if username:
                base_qs = base_qs.filter(owner__username=username)
            return base_qs.order_by("-id")

        if self.request.user.is_anonymous:
            return AlbumUser.objects.none()
        return (
            AlbumUser.objects.filter(
                Q(owner=self.request.user) | Q(shared_to__exact=self.request.user.id)
            )
            .distinct()
            .order_by("-id")
        )

    def get_permissions(self):
        if self.request.query_params.get("public"):
            permission_classes = [AllowAny]
        else:
            permission_classes = [IsAuthenticated]
        return [permission() for permission in permission_classes]

    def get_serializer_class(self):
        if self.request.query_params.get("public"):
            return AlbumUserPublicSerializer
        return super().get_serializer_class()


# To-Do: Could be the list command in AlbumUserViewSet
class AlbumUserListViewSet(ListViewSet):
    serializer_class = AlbumUserListSerializer
    pagination_class = StandardResultsSetPagination
    filter_backends = (filters.SearchFilter,)
    search_fields = ["title"]

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return AlbumUser.objects.none()
        return (
            AlbumUser.objects.filter(owner=self.request.user)
            .annotate(
                photo_count=Count(
                    "photos", filter=Q(photos__hidden=False), distinct=True
                )
            )
            .filter(Q(photo_count__gt=0) & Q(owner=self.request.user))
            .order_by("title")
        )


class AlbumDateViewSet(viewsets.ModelViewSet):
    serializer_class = AlbumDateSerializer
    pagination_class = RegularResultsSetPagination

    def get_queryset(self):
        photo_filter = []
        photo_filter.append(Q(thumbnail__aspect_ratio__isnull=False))

        if not self.request.user.is_anonymous and not self.request.query_params.get(
            "public"
        ):
            photo_filter.append(Q(owner=self.request.user))
        if self.request.query_params.get("favorite"):
            min_rating = self.request.user.favorite_min_rating
            photo_filter.append(Q(rating__gte=min_rating))

        if self.request.query_params.get("public"):
            if self.request.query_params.get("username"):
                username = self.request.query_params.get("username")
                photo_filter.append(Q(owner__username=username))
            photo_filter.append(Q(public=True))

        # Filter by folder path if provided
        if self.request.query_params.get("folder"):
            folder_path = self.request.query_params.get("folder")
            photo_filter.append(Q(files__path__startswith=folder_path))

        if self.request.query_params.get("hidden"):
            photo_filter.append(Q(hidden=True))
        else:
            photo_filter.append(Q(hidden=False))

        if self.request.query_params.get("video"):
            photo_filter.append(Q(video=True))

        if self.request.query_params.get("photo"):
            photo_filter.append(Q(video=False))

        if self.request.query_params.get("in_trashcan"):
            photo_filter.append(Q(in_trashcan=True) & Q(removed=False))
        else:
            photo_filter.append(Q(in_trashcan=False))

        # Stack filtering: Show photos that are either:
        # 1. Not in any stack, OR
        # 2. The primary photo of their stack
        # Stacks are for organizational purposes (RAW+JPEG pairs, bursts, brackets, live photos, manual)
        # Non-primary photos are hidden in the timeline but accessible via stack expansion
        # NOTE: Duplicates are handled separately via the Duplicate model and are not filtered here
        if not self.request.query_params.get("show_all_stack_photos"):
            photo_filter.append(
                Q(stacks__isnull=True) |
                Q(primary_in_stack__isnull=False)
            )

        if self.request.query_params.get("person"):
            photo_filter.append(
                Q(faces__person__id=self.request.query_params.get("person"))
            )
        if self.request.query_params.get("last_modified"):
            photo_filter = []
            photo_filter.append(Q(owner=self.request.user))
            photo_filter.append(
                Q(exif_timestamp__gte=self.request.query_params.get("last_modified"))
            )

        album_date = AlbumDate.objects.filter(id=self.kwargs["pk"]).first()

        # Build a prefetch for stacks that filters to valid types and annotates
        # photo_count, avoiding N+1 queries in the serializer
        valid_stack_types = PhotoStack.VALID_STACK_TYPES + [
            PhotoStack.StackType.RAW_JPEG_PAIR,
            PhotoStack.StackType.LIVE_PHOTO,
        ]
        stacks_prefetch = Prefetch(
            "stacks",
            queryset=PhotoStack.objects.filter(
                stack_type__in=valid_stack_types
            ).annotate(photo_count_annotation=Count("photos")),
        )

        photo_qs = (
            album_date.photos.filter(*photo_filter)
            .prefetch_related(
                Prefetch(
                    "owner",
                    queryset=User.objects.only(
                        "id", "username", "first_name", "last_name"
                    ),
                ),
                Prefetch(
                    "main_file__embedded_media",
                    queryset=File.objects.only("hash"),
                ),
                stacks_prefetch,
                "files",  # Prefetch files for get_has_raw_variant()
            )
            .select_related("thumbnail", "search_instance", "main_file")
            .distinct()  # Remove duplicates that can occur when filtering through reverse ForeignKey relationships (e.g., faces__person__id)
            .order_by("-exif_timestamp")
            .only(
                "image_hash",
                "thumbnail__aspect_ratio",
                "thumbnail__dominant_color",
                "video",
                "main_file",
                "search_instance__search_location",
                "public",
                "rating",
                "hidden",
                "exif_timestamp",
                "owner",
                "video_length",
                "exif_gps_lat",
                "exif_gps_lon",
                "removed",
                "in_trashcan",
            )
        )

        # Paginate photo queryset
        page_size = self.request.query_params.get("size") or 100
        paginator = Paginator(photo_qs, page_size)
        page = self.request.query_params.get("page")

        try:
            photos = paginator.page(page)
        except PageNotAnInteger:
            photos = paginator.page(1)
        except EmptyPage:
            photos = paginator.page(paginator.num_pages)

        return album_date, photos, paginator.count

    def get_permissions(self):
        if self.request.query_params.get("public"):
            permission_classes = [AllowAny]
        else:
            permission_classes = [IsAuthenticated]
        return [permission() for permission in permission_classes]

    @extend_schema(
        parameters=[
            OpenApiParameter("favorite", OpenApiTypes.BOOL),
            OpenApiParameter("public", OpenApiTypes.BOOL),
            OpenApiParameter("in_trashcan", OpenApiTypes.BOOL),
            OpenApiParameter("hidden", OpenApiTypes.BOOL),
            OpenApiParameter("video", OpenApiTypes.BOOL),
            OpenApiParameter("username", OpenApiTypes.STR),
            OpenApiParameter("person", OpenApiTypes.INT),
            OpenApiParameter("last_modified", OpenApiTypes.DATE),
        ],
        description="Returns the actual images, for a given day in chunks of 100 images.",
    )
    def retrieve(self, *args, **kwargs):
        album_date, photos, count = self.get_queryset()
        serializer = AlbumDateSerializer(album_date, context={"request": self.request})
        serializer_data = serializer.data
        serializer_data["items"] = PhotoSummarySerializer(
            photos, many=True
        ).data  # Assuming you have a PhotoSerializer
        serializer_data["numberOfItems"] = count
        return Response({"results": serializer_data})


# To-Do: Could be the summary command in AlbumDateViewSet
class AlbumDateListViewSet(ListViewSet):
    serializer_class = IncompleteAlbumDateSerializer
    pagination_class = None
    filter_backends = (filters.SearchFilter,)
    search_fields = [
        "photos__search_instance__search_captions",
        "photos__search_instance__search_location",
        "photos__faces__person__name",
    ]

    def get_queryset(self):
        filter = []
        filter.append(Q(photos__thumbnail__aspect_ratio__isnull=False))

        if self.request.query_params.get("hidden"):
            filter.append(Q(photos__hidden=True))
        else:
            filter.append(Q(photos__hidden=False))

        if self.request.query_params.get("in_trashcan"):
            filter.append(Q(photos__in_trashcan=True) & Q(photos__removed=False))
        else:
            filter.append(Q(photos__in_trashcan=False))

        # Stack filtering: Only count photos that are either:
        # 1. Not in any stack, OR
        # 2. The primary photo of their stack
        # Stacks are for organizational purposes (RAW+JPEG pairs, bursts, brackets, live photos, manual)
        # Non-primary photos are hidden in the timeline but accessible via stack expansion
        # NOTE: Duplicates are handled separately via the Duplicate model and are not filtered here
        if not self.request.query_params.get("show_all_stack_photos"):
            filter.append(
                Q(photos__stacks__isnull=True) |
                Q(photos__primary_in_stack__isnull=False)
            )

        # Filter by folder path if provided
        if self.request.query_params.get("folder"):
            folder_path = self.request.query_params.get("folder")
            filter.append(Q(photos__files__path__startswith=folder_path))

        if not self.request.user.is_anonymous and not self.request.query_params.get(
            "public"
        ):
            filter.append(Q(owner=self.request.user))
            filter.append(Q(photos__owner=self.request.user))

        if self.request.query_params.get("favorite"):
            min_rating = self.request.user.favorite_min_rating
            filter.append(Q(photos__rating__gte=min_rating))

        if self.request.query_params.get("public"):
            username = self.request.query_params.get("username")
            filter.append(Q(owner__username=username))
            filter.append(Q(photos__public=True))

        if self.request.query_params.get("video"):
            filter.append(Q(photos__video=True))

        if self.request.query_params.get("photo"):
            filter.append(Q(photos__video=False))

        if self.request.query_params.get("person"):
            filter.append(
                Q(photos__faces__person__id=self.request.query_params.get("person"))
            )
        if self.request.query_params.get("last_modified"):
            filter = []
            filter.append(Q(owner=self.request.user))
            filter.append(Q(photos__owner=self.request.user))
            filter.append(
                Q(
                    photos__last_modified__gte=self.request.query_params.get(
                        "last_modified"
                    )
                )
            )

        qs = (
            AlbumDate.objects.filter(*filter)
            .annotate(photo_count=Count("photos", distinct=True))
            .filter(Q(photo_count__gt=0))
            .order_by(F("date").desc(nulls_last=True))
        )

        return qs

    def get_permissions(self):
        if self.request.query_params.get("public"):
            permission_classes = [AllowAny]
        else:
            permission_classes = [IsAuthenticated]
        return [permission() for permission in permission_classes]

    @extend_schema(
        parameters=[
            OpenApiParameter("favorite", OpenApiTypes.BOOL),
            OpenApiParameter("public", OpenApiTypes.BOOL),
            OpenApiParameter("in_trashcan", OpenApiTypes.BOOL),
            OpenApiParameter("hidden", OpenApiTypes.BOOL),
            OpenApiParameter("video", OpenApiTypes.BOOL),
            OpenApiParameter("username", OpenApiTypes.STR),
            OpenApiParameter("person", OpenApiTypes.INT),
            OpenApiParameter("last_modified", OpenApiTypes.DATE),
        ],
        description="Gives you a list of days with the number of elements. This is not paginated and can be large.",
    )
    def list(self, *args, **kwargs):
        serializer = IncompleteAlbumDateSerializer(self.get_queryset(), many=True)
        return Response({"results": serializer.data})


================================================
FILE: api/views/custom_api_view.py
================================================
from rest_framework import mixins, viewsets


class ListViewSet(mixins.ListModelMixin, viewsets.GenericViewSet):
    """A viewset that provides `list` actions.

    To use it, override the class and set the `.queryset` and
    `.serializer_class` attributes.
    """

    pass


================================================
FILE: api/views/dataviz.py
================================================
import os

from django.http import FileResponse, HttpResponseForbidden
from drf_spectacular.utils import extend_schema
from rest_framework.response import Response
from rest_framework.views import APIView

from api.stats import (
    get_count_stats,
    get_photo_month_counts,
    get_searchterms_wordcloud,
    get_server_stats,
    get_location_clusters,
    get_location_sunburst,
    get_location_timeline,
)

from api.face_classify import cluster_faces
from api.social_graph import build_social_graph
from api.util import logger


class ClusterFaceView(APIView):
    @extend_schema(
        deprecated=True,
        description="Use POST method",
    )
    def get(self, request, format=None):
        return self._cluster_faces(request.user)

    def post(self, request, format=None):
        return self._cluster_faces(request.user)

    def _cluster_faces(self, user):
        res = cluster_faces(user)
        return Response(res)


class SocialGraphView(APIView):
    def get(self, request, format=None):
        try:
            res = build_social_graph(request.user)
            return Response(res)
        except Exception:
            logger.exception(f"Error in SocialGraphView for user {request.user.id}")
            return Response({"error": "Failed to build social graph"}, status=500)


class ServerLogsView(APIView):
    def get(self, request, format=None):
        if not (request.user and request.user.is_staff):
            return HttpResponseForbidden()

        BASE_LOGS = os.environ.get("BASE_LOGS", "/logs/")
        log_file = os.path.join(BASE_LOGS, "ownphotos.log")

        if os.path.exists(log_file):
            return FileResponse(
                open(log_file, "rb"), as_attachment=True, filename="ownphotos.log"
            )
        else:
            return Response({"error": "Log file not found"}, status=404)


class ServerStatsView(APIView):
    def get(self, request, format=None):
        if not (request.user and request.user.is_staff):
            return HttpResponseForbidden()
        res = get_server_stats()
        return Response(res)


class StatsView(APIView):
    def get(self, request, format=None):
        res = get_count_stats(user=request.user)
        return Response(res)


class LocationClustersView(APIView):
    def get(self, request, format=None):
        res = get_location_clusters(request.user)
        return Response(res)


class LocationSunburst(APIView):
    def get(self, request, format=None):
        res = get_location_sunburst(request.user)
        return Response(res)


class LocationTimeline(APIView):
    def get(self, request, format=None):
        res = get_location_timeline(request.user)
        return Response(res)


class PhotoMonthCountsView(APIView):
    def get(self, request, format=None):
        res = get_photo_month_counts(request.user)
        return Response(res)


class SearchTermWordCloudView(APIView):
    def get(self, request, format=None):
        res = get_searchterms_wordcloud(request.user)
        return Response(res)


================================================
FILE: api/views/duplicates.py
================================================
"""
API views for Duplicate management - finding and cleaning up duplicate photos.

Handles duplicate types:
- EXACT_COPY: Byte-for-byte identical files (same MD5 hash, different paths)
- VISUAL_DUPLICATE: Visually similar photos (similar perceptual hash)

Duplicates are separate from Stacks because they have different purposes:
- Duplicates: Storage cleanup (review and delete redundant copies)
- Stacks: Photo organization (browse related photos like RAW+JPEG, bursts)
"""

from django.core.paginator import Paginator
from django.db.models import Count, Sum
from django_q.tasks import async_task
from drf_spectacular.utils import OpenApiParameter, extend_schema
from rest_framework import status
from rest_framework.permissions import IsAuthenticated
from rest_framework.response import Response
from rest_framework.views import APIView

from api.models import Photo
from api.models.duplicate import Duplicate
from api.util import logger


class DuplicateListView(APIView):
    """List all duplicate groups for the current user with pagination and filters."""

    permission_classes = [IsAuthenticated]

    @extend_schema(
        parameters=[
            OpenApiParameter(
                "duplicate_type",
                str,
                description="Filter by duplicate type: exact_copy, visual_duplicate",
            ),
            OpenApiParameter(
                "status",
                str,
                description="Filter by review status: pending, resolved, dismissed",
            ),
            OpenApiParameter(
                "page",
                int,
                description="Page number (default: 1)",
            ),
            OpenApiParameter(
                "page_size",
                int,
                description="Number of items per page (default: 20, max: 100)",
            ),
        ],
    )
    def get(self, request):
        duplicate_type_filter = request.query_params.get("duplicate_type", None)
        status_filter = request.query_params.get("status", None)
        page = max(1, int(request.query_params.get("page", 1)))
        page_size = max(1, min(int(request.query_params.get("page_size", 20)), 100))

        duplicates = (
            Duplicate.objects.filter(owner=request.user)
            .prefetch_related("photos__thumbnail", "kept_photo__thumbnail")
            .annotate(photos_count=Count("photos"))
            .order_by("-created_at")
        )

        if duplicate_type_filter:
            duplicates = duplicates.filter(duplicate_type=duplicate_type_filter)

        if status_filter:
            duplicates = duplicates.filter(review_status=status_filter)

        # Only return duplicates with at least 2 photos
        duplicates = duplicates.filter(photos_count__gte=2)

        # Paginate results
        paginator = Paginator(duplicates, page_size)
        page_obj = paginator.get_page(page)

        # Serialize manually to include nested photo data
        results = []
        for duplicate in page_obj.object_list:
            photos = duplicate.photos.all()[:4]  # Preview first 4 photos
            results.append(
                {
                    "id": str(duplicate.id),
                    "duplicate_type": duplicate.duplicate_type,
                    "duplicate_type_display": duplicate.get_duplicate_type_display(),
                    "review_status": duplicate.review_status,
                    "review_status_display": duplicate.get_review_status_display(),
                    "photo_count": duplicate.photos_count,
                    "potential_savings": duplicate.potential_savings,
                    "similarity_score": duplicate.similarity_score,
                    "created_at": duplicate.created_at,
                    "kept_photo": {
                        "image_hash": duplicate.kept_photo.image_hash,
                        "thumbnail_url": f"/media/square_thumbnails_small/{duplicate.kept_photo.image_hash}"
                        if hasattr(duplicate.kept_photo, "thumbnail")
                        and duplicate.kept_photo.thumbnail.square_thumbnail_small
                        else None,
                    }
                    if duplicate.kept_photo
                    else None,
                    "preview_photos": [
                        {
                            "image_hash": p.image_hash,
                            "thumbnail_url": f"/media/square_thumbnails_small/{p.image_hash}"
                            if hasattr(p, "thumbnail")
                            and p.thumbnail.square_thumbnail_small
                            else None,
                        }
                        for p in photos
                    ],
                }
            )

        return Response(
            {
                "results": results,
                "count": paginator.count,
                "num_pages": paginator.num_pages,
                "page": page,
                "page_size": page_size,
                "has_next": page_obj.has_next(),
                "has_previous": page_obj.has_previous(),
            }
        )


class DuplicateDetailView(APIView):
    """Get details of a specific duplicate group with all photos."""

    permission_classes = [IsAuthenticated]

    def get(self, request, duplicate_id):
        try:
            duplicate = Duplicate.objects.annotate(photos_count=Count("photos")).get(
                id=duplicate_id, owner=request.user
            )
        except Duplicate.DoesNotExist:
            return Response(
                {"error": "Duplicate group not found"}, status=status.HTTP_404_NOT_FOUND
            )

        photos = duplicate.photos.select_related(
            "thumbnail", "main_file", "metadata"
        ).all()

        photo_data = []
        for p in photos:
            # Width, height, and camera are on the metadata model
            width = None
            height = None
            camera = None
            if hasattr(p, "metadata") and p.metadata:
                width = p.metadata.width
                height = p.metadata.height
                camera = p.metadata.camera_model

            data = {
                "id": str(p.id),
                "image_hash": p.image_hash,
                "width": width,
                "height": height,
                "size": p.size,
                "camera": camera,
                "exif_timestamp": p.exif_timestamp,
                "is_kept": duplicate.kept_photo
                and p.image_hash == duplicate.kept_photo.image_hash,
                "file_path": p.main_file.path if p.main_file else None,
                "file_type": p.main_file.get_type_display() if p.main_file else None,
                "thumbnail_url": f"/media/square_thumbnails_small/{p.image_hash}"
                if hasattr(p, "thumbnail") and p.thumbnail.square_thumbnail_small
                else None,
                "thumbnail_big_url": f"/media/thumbnails_big/{p.image_hash}"
                if hasattr(p, "thumbnail") and p.thumbnail.thumbnail_big
                else None,
            }
            photo_data.append(data)

        # Get suggested best photo
        suggested_photo = duplicate.auto_select_best_photo()

        return Response(
            {
                "id": str(duplicate.id),
                "duplicate_type": duplicate.duplicate_type,
                "duplicate_type_display": duplicate.get_duplicate_type_display(),
                "review_status": duplicate.review_status,
                "review_status_display": duplicate.get_review_status_display(),
                "photo_count": duplicate.photos_count,
                "potential_savings": duplicate.potential_savings,
                "similarity_score": duplicate.similarity_score,
                "created_at": duplicate.created_at,
                "updated_at": duplicate.updated_at,
                "kept_photo_hash": duplicate.kept_photo.image_hash
                if duplicate.kept_photo
                else None,
                "suggested_photo_hash": suggested_photo.image_hash
                if suggested_photo
                else None,
                "photos": photo_data,
            }
        )


class DuplicateResolveView(APIView):
    """Resolve a duplicate group by selecting a photo to keep and optionally trashing others."""

    permission_classes = [IsAuthenticated]

    def post(self, request, duplicate_id):
        try:
            duplicate = Duplicate.objects.get(id=duplicate_id, owner=request.user)
        except Duplicate.DoesNotExist:
            return Response(
                {"error": "Duplicate group not found"}, status=status.HTTP_404_NOT_FOUND
            )

        keep_photo_hash = request.data.get("keep_photo_hash")
        trash_others = request.data.get("trash_others", True)

        if not keep_photo_hash:
            return Response(
                {"error": "keep_photo_hash is required"},
                status=status.HTTP_400_BAD_REQUEST,
            )

        # Verify photo exists in duplicate group
        try:
            keep_photo = duplicate.photos.get(image_hash=keep_photo_hash)
        except Photo.DoesNotExist:
            return Response(
                {"error": "Photo not found in this duplicate group"},
                status=status.HTTP_400_BAD_REQUEST,
            )

        # Resolve the duplicate
        duplicate.resolve(keep_photo, trash_others)

        logger.info(
            f"Resolved duplicate {duplicate.id}: kept {keep_photo_hash}, trashed {duplicate.trashed_count}"
        )
        return Response(
            {
                "status": "resolved",
                "kept_photo": keep_photo_hash,
                "trashed_count": duplicate.trashed_count,
            }
        )


class DuplicateDismissView(APIView):
    """Dismiss a duplicate group (mark photos as not actually duplicates)."""

    permission_classes = [IsAuthenticated]

    def post(self, request, duplicate_id):
        try:
            duplicate = Duplicate.objects.get(id=duplicate_id, owner=request.user)
        except Duplicate.DoesNotExist:
            return Response(
                {"error": "Duplicate group not found"}, status=status.HTTP_404_NOT_FOUND
            )

        duplicate.dismiss()

        logger.info(f"Dismissed duplicate {duplicate.id}")
        return Response({"status": "dismissed"})


class DuplicateRevertView(APIView):
    """Revert a resolved duplicate (restore trashed photos, reset to pending)."""

    permission_classes = [IsAuthenticated]

    def post(self, request, duplicate_id):
        try:
            duplicate = Duplicate.objects.get(id=duplicate_id, owner=request.user)
        except Duplicate.DoesNotExist:
            return Response(
                {"error": "Duplicate group not found"}, status=status.HTTP_404_NOT_FOUND
            )

        if duplicate.review_status != Duplicate.ReviewStatus.RESOLVED:
            return Response(
                {"error": "Can only revert resolved duplicates"},
                status=status.HTTP_400_BAD_REQUEST,
            )

        restored_count = duplicate.revert()

        logger.info(
            f"Reverted duplicate {duplicate.id}: restored {restored_count} photos"
        )
        return Response({"status": "reverted", "restored_count": restored_count})


class DuplicateDeleteView(APIView):
    """Delete a duplicate group (unlinks photos but doesn't delete them)."""

    permission_classes = [IsAuthenticated]

    def delete(self, request, duplicate_id):
        try:
            duplicate = Duplicate.objects.get(id=duplicate_id, owner=request.user)
        except Duplicate.DoesNotExist:
            return Response(
                {"error": "Duplicate group not found"}, status=status.HTTP_404_NOT_FOUND
            )

        # Unlink photos from this duplicate group (ManyToMany)
        photo_count = duplicate.photos.count()
        for photo in duplicate.photos.all():
            photo.duplicates.remove(duplicate)

        # Delete duplicate group
        duplicate_id_str = str(duplicate.id)
        duplicate.delete()

        logger.info(
            f"Deleted duplicate group {duplicate_id_str}: unlinked {photo_count} photos"
        )
        return Response({"status": "deleted", "unlinked_count": photo_count})


class DetectDuplicatesView(APIView):
    """Trigger duplicate detection for the current user."""

    permission_classes = [IsAuthenticated]

    @extend_schema(
        parameters=[
            OpenApiParameter(
                "detect_exact_copies",
                bool,
                description="Detect exact file copies (default: true)",
            ),
            OpenApiParameter(
                "detect_visual_duplicates",
                bool,
                description="Detect visually similar photos (default: true)",
            ),
            OpenApiParameter(
                "visual_threshold",
                int,
                description="Hamming distance threshold for visual duplicates (default: 10)",
            ),
            OpenApiParameter(
                "clear_pending",
                bool,
                description="Clear existing pending duplicates before detection (default: false)",
            ),
            OpenApiParameter(
                "batch_size",
                int,
                description="Number of photos to process per batch for visual detection (default: 10000, min: 100, max: 50000)",
            ),
        ],
    )
    def post(self, request):
        from api.duplicate_detection import batch_detect_duplicates

        # Validate and clamp batch_size to reasonable range
        batch_size = int(request.data.get("batch_size", 10000))
        if batch_size < 100:
            batch_size = 100  # Minimum to avoid too many batches
        elif batch_size > 50000:
            batch_size = 50000  # Maximum to prevent memory issues

        options = {
            "detect_exact_copies": request.data.get("detect_exact_copies", True),
            "detect_visual_duplicates": request.data.get(
                "detect_visual_duplicates", True
            ),
            "visual_threshold": int(request.data.get("visual_threshold", 10)),
            "clear_pending": request.data.get("clear_pending", False),
            "batch_size": batch_size,
        }

        # Queue background job
        async_task(batch_detect_duplicates, request.user, options)

        logger.info(
            f"Duplicate detection queued for user {request.user.username} with options: {options}"
        )
        return Response(
            {
                "status": "queued",
                "message": "Duplicate detection started",
                "options": options,
            },
            status=status.HTTP_202_ACCEPTED,
        )


class DuplicateStatsView(APIView):
    """Get duplicate statistics for the current user."""

    permission_classes = [IsAuthenticated]

    def get(self, request):
        duplicates = Duplicate.objects.filter(owner=request.user)

        # Count by type
        by_type = {}
        for dup_type in Duplicate.DuplicateType.values:
            by_type[dup_type] = duplicates.filter(duplicate_type=dup_type).count()

        # Count by review status
        pending_count = duplicates.filter(
            review_status=Duplicate.ReviewStatus.PENDING
        ).count()
        resolved_count = duplicates.filter(
            review_status=Duplicate.ReviewStatus.RESOLVED
        ).count()
        dismissed_count = duplicates.filter(
            review_status=Duplicate.ReviewStatus.DISMISSED
        ).count()

        # Calculate potential savings (from pending duplicates)
        total_savings = (
            duplicates.filter(review_status=Duplicate.ReviewStatus.PENDING).aggregate(
                total=Sum("potential_savings")
            )["total"]
            or 0
        )

        # Count photos in duplicate groups
        photos_in_duplicates = (
            Photo.objects.filter(owner=request.user, duplicates__isnull=False)
            .distinct()
            .count()
        )

        total_photos = Photo.objects.filter(
            owner=request.user, hidden=False, in_trashcan=False
        ).count()

        return Response(
            {
                "total_duplicates": duplicates.count(),
                "pending_duplicates": pending_count,
                "resolved_duplicates": resolved_count,
                "dismissed_duplicates": dismissed_count,
                "by_type": by_type,
                "photos_in_duplicates": photos_in_duplicates,
                "total_photos": total_photos,
                "potential_savings_bytes": total_savings,
                "potential_savings_mb": round(total_savings / (1024 * 1024), 2)
                if total_savings
                else 0,
            }
        )


================================================
FILE: api/views/faces.py
================================================
import uuid

from django.db.models import Case, CharField, Count, IntegerField, Q, Value, When
from django_q.tasks import Chain
from drf_spectacular.types import OpenApiTypes
from drf_spectacular.utils import OpenApiParameter, extend_schema
from rest_framework import status
from rest_framework.response import Response
from rest_framework.views import APIView

from api.directory_watcher import generate_face_embeddings, scan_faces
from api.face_classify import cluster_all_faces
from api.ml_models import do_all_models_exist, download_models
from api.models import Face, User
from api.models.person import Person, get_or_create_person
from api.models.photo_search import PhotoSearch
from api.serializers.face import (
    FaceListSerializer,
    IncompletePersonFaceListSerializer,
    PersonFaceListSerializer,
)
from api.util import logger
from api.views.custom_api_view import ListViewSet
from api.views.pagination import RegularResultsSetPagination


class ScanFacesView(APIView):
    @extend_schema(
        deprecated=True,
        description="Use POST method",
    )
    def get(self, request, format=None):
        return self._scan_faces(request)

    def post(self, request, format=None):
        return self._scan_faces(request)

    def _scan_faces(self, request, format=None):
        chain = Chain()
        if not do_all_models_exist():
            chain.append(download_models, request.user)
        try:
            job_id = uuid.uuid4()
            chain.append(scan_faces, request.user, job_id, True)
            chain.run()
            return Response({"status": True, "job_id": job_id})
        except BaseException:
            logger.exception("An Error occurred")
            return Response({"status": False})


class TrainFaceView(APIView):
    @staticmethod
    def _train_faces(request):
        chain = Chain()
        if not do_all_models_exist():
            chain.append(download_models, request.user)
        try:
            job_id = uuid.uuid4()
            chain.append(generate_face_embeddings, request.user, uuid.uuid4())
            chain.append(cluster_all_faces, request.user, job_id)
            chain.run()
            return Response({"status": True, "job_id": job_id})
        except BaseException:
            logger.exception()
            return Response({"status": False})

    def post(self, request, format=None):
        return self._train_faces(request)


class FaceListView(ListViewSet):
    serializer_class = PersonFaceListSerializer
    pagination_class = RegularResultsSetPagination

    def get_queryset(self):
        personid = self.request.query_params.get("person", "0")

        if personid == "0":
            personid = None

        analysis_method = self.request.query_params.get("analysis_method", "clustering")
        min_confidence = float(self.request.query_params.get("min_confidence", 0))

        if (
            self.request.query_params.get("inferred", "").lower() == "false"
            and personid
        ):
            analysis_method = None
        if analysis_method == "classification":
            conditional_filter = Q(person=None)
            if not personid:
                conditional_filter = conditional_filter & Q(
                    classification_probability__lte=min_confidence
                )
            else:
                conditional_filter = (
                    conditional_filter
                    & Q(classification_person=personid)
                    & Q(classification_probability__gte=min_confidence)
                )
            order_by = ["-classification_probability", "id"]
        if analysis_method == "clustering":
            if not personid:
                conditional_filter = Q(person=None) & (
                    Q(cluster_person=None) | Q(cluster_probability__lte=min_confidence)
                )
            else:
                conditional_filter = (
                    Q(cluster_person=personid)
                    & Q(person=None)
                    & Q(cluster_probability__gte=min_confidence)
                )
            order_by = ["-cluster_probability", "id"]
        if not analysis_method:
            conditional_filter = Q(person=personid)
            order_by = ["-id"]
        if self.request.query_params.get("order_by", "").lower() == "date":
            order_by = ["photo__exif_timestamp", *order_by]
        return (
            Face.objects.filter(
                Q(photo__owner=self.request.user),
                Q(deleted=False),
                conditional_filter,
            )
            .annotate(analysis_method=Value(analysis_method, output_field=CharField()))
            .prefetch_related("photo")
            .order_by(*order_by)
        )

    @extend_schema(
        parameters=[
            OpenApiParameter("person", OpenApiTypes.STR),
            OpenApiParameter("inferred", OpenApiTypes.BOOL),
            OpenApiParameter("order_by", OpenApiTypes.STR),
        ],
    )
    def list(self, *args, **kwargs):
        return super().list(*args, **kwargs)


class FaceIncompleteListViewSet(ListViewSet):
    serializer_class = IncompletePersonFaceListSerializer
    pagination_class = None

    def get_queryset(self):
        inferred = self.request.query_params.get("inferred", "").lower() == "true"
        analysis_method = self.request.query_params.get("analysis_method", "clustering")
        min_confidence = float(self.request.query_params.get("min_confidence", 0))

        queryset = Person.objects.filter(cluster_owner=self.request.user)
        if inferred:
            if analysis_method == "classification":
                conditional_count = Count(
                    Case(
                        When(
                            Q(classification_faces__deleted=False)
                            & Q(classification_faces__person=None)
                            & Q(
                                classification_faces__classification_probability__gte=min_confidence
                            ),
                            then=1,
                        ),
                        output_field=IntegerField(),
                    )
                )
            if analysis_method == "clustering":
                conditional_count = Count(
                    Case(
                        When(
                            Q(cluster_faces__deleted=False)
                            & Q(cluster_faces__person=None)
                            & Q(cluster_faces__cluster_probability__gte=min_confidence),
                            then=1,
                        ),
                        output_field=IntegerField(),
                    )
                )
        else:
            queryset = queryset.filter(kind=Person.KIND_USER)
            conditional_count = Count(
                Case(
                    When(
                        Q(faces__deleted=False),
                        then=1,
                    ),
                    output_field=IntegerField(),
                )
            )

        queryset = (
            queryset.annotate(viewable_face_count=conditional_count)
            .filter(viewable_face_count__gt=0)
            .order_by("name")
        )

        return queryset

    @extend_schema(
        parameters=[
            OpenApiParameter("inferred", OpenApiTypes.BOOL),
        ],
    )
    def list(self, *args, **kwargs):
        queryset = self.get_queryset()

        serializer = self.get_serializer(queryset, many=True)
        real_persons = serializer.data

        min_confidence = float(self.request.query_params.get("min_confidence", 0))

        if self.request.query_params.get("inferred", "").lower() == "true":
            if (
                self.request.query_params.get("analysis_method", "clustering")
                == "classification"
            ):
                unknown_faces_count = Face.objects.filter(
                    Q(deleted=False)
                    & Q(person=None)
                    & Q(photo__owner=self.request.user)
                    & Q(classification_probability__lte=min_confidence),
                ).count()
            else:
                unknown_faces_count = Face.objects.filter(
                    (
                        Q(cluster_person=None)
                        | Q(cluster_probability__lte=min_confidence)
                    )
                    & Q(deleted=False)
                    & Q(person=None)
                    & Q(photo__owner=self.request.user),
                ).count()
        else:
            unknown_faces_count = Face.objects.filter(
                person=None, deleted=False, photo__owner=self.request.user
            ).count()

        if unknown_faces_count > 0:
            unknown_person = {
                "id": 0,
                "name": "Unknown - Other",
                "face_count": unknown_faces_count,
                "kind": Person.UNKNOWN_PERSON_NAME,
            }
            real_persons.append(unknown_person)

        return Response(real_persons, status=status.HTTP_200_OK)


class SetFacePersonLabel(APIView):
    def post(self, request, format=None):
        data = dict(request.data)
        person = None
        cluster_person = None
        classification_person = None
        if data["person_name"] != Person.UNKNOWN_PERSON_NAME:
            person = get_or_create_person(
                name=data["person_name"], owner=self.request.user, kind=Person.KIND_USER
            )

        faces = Face.objects.in_bulk(data["face_ids"])

        updated = []
        not_updated = []
        for face in faces.values():
            if face.photo.owner == request.user:
                face.person = person
                if not person:
                    face.cluster_person = cluster_person
                    face.classification_person = classification_person
                face.save()
                updated.append(FaceListSerializer(face).data)
            else:
                not_updated.append(FaceListSerializer(face).data)
        if person:
            person._calculate_face_count()
            person._set_default_cover_photo()
        search_instance, created = PhotoSearch.objects.get_or_create(photo=face.photo)
        search_instance.recreate_search_captions()
        search_instance.save()

        # Write face regions to image files if user preference is enabled
        if request.user.save_face_tags_to_disk:
            use_sidecar = (
                request.user.save_metadata_to_disk == User.SaveMetadata.SIDECAR_FILE
            )
            updated_photos = {
                f.photo for f in faces.values() if f.photo.owner == request.user
            }
            for photo in updated_photos:
                try:
                    photo._save_metadata(
                        use_sidecar=use_sidecar,
                        metadata_types=["face_tags"],
                    )
                except Exception:
                    logger.exception(
                        f"Failed to write face tags for photo {photo.image_hash}"
                    )

        return Response(
            {
                "status": True,
                "results": updated,
                "updated": updated,
                "not_updated": not_updated,
            }
        )


class DeleteFaces(APIView):
    def post(self, request, format=None):
        data = dict(request.data)
        faces = Face.objects.in_bulk(data["face_ids"])

        deleted = []
        not_deleted = []
        for face in faces.values():
            if face.photo.owner == request.user:
                deleted.append(face.image.url)
                face.deleted = True
                face.save()
            else:
                not_deleted.append(face.image.url)

        return Response(
            {
                "status": True,
                "results": deleted,
                "not_deleted": not_deleted,
                "deleted": deleted,
            }
        )


================================================
FILE: api/views/geocode.py
================================================
from rest_framework.response import Response
from rest_framework.views import APIView

from api.geocode.geocode import search_location


class GeocodeSearchView(APIView):
    """Search for locations by name/address."""

    def get(self, request, format=None):
        query = request.query_params.get("q", "").strip()
        if not query:
            return Response([])
        limit = int(request.query_params.get("limit", 5))
        results = search_location(query, limit=limit)
        return Response(results)


================================================
FILE: api/views/jobs.py
================================================
from django.db.models import Prefetch
from rest_framework import viewsets
from rest_framework.response import Response
from rest_framework.views import APIView

from api.models import LongRunningJob, User
from api.serializers.job import LongRunningJobSerializer
from api.views.pagination import TinyResultsSetPagination


class LongRunningJobViewSet(viewsets.ModelViewSet):
    queryset = (
        LongRunningJob.objects.prefetch_related(
            Prefetch(
                "started_by",
                queryset=User.objects.only("id", "username", "first_name", "last_name"),
            ),
        )
        .all()
        .order_by("-started_at")
    )
    serializer_class = LongRunningJobSerializer
    pagination_class = TinyResultsSetPagination


class QueueAvailabilityView(APIView):
    def get(self, request, format=None):
        job_detail = None

        running_job = (
            LongRunningJob.objects.filter(finished=False).order_by("-started_at").last()
        )
        if running_job:
            job_detail = LongRunningJobSerializer(running_job).data

        return Response(
            {
                "status": True,
                "queue_can_accept_job": job_detail is None,
                "job_detail": job_detail,
            }
        )


================================================
FILE: api/views/pagination.py
================================================
from rest_framework.pagination import PageNumberPagination


class HugeResultsSetPagination(PageNumberPagination):
    page_size = 2500
    page_size_query_param = "page_size"
    max_page_size = 5000


class StandardResultsSetPagination(PageNumberPagination):
    page_size = 1000
    page_size_query_param = "page_size"
    max_page_size = 2000


class RegularResultsSetPagination(PageNumberPagination):
    page_size = 100
    page_size_query_param = "page_size"
    max_page_size = 200


class TinyResultsSetPagination(PageNumberPagination):
    page_size = 20
    page_size_query_param = "page_size"
    max_page_size = 50


================================================
FILE: api/views/photo_filters.py
================================================
"""
Photo filtering utilities for bulk operations.

This module provides reusable functions to build photo querysets from filter parameters,
enabling server-side "Select All" operations without sending individual photo IDs.
"""

from django.db.models import Q

from api.models import Photo


def build_photo_queryset(user, params: dict):
    """Build a Photo queryset from filter parameters.

    This function reuses the same filtering logic as AlbumDateListViewSet to ensure
    consistency between what users see in the UI and what bulk operations affect.

    Args:
        user: The authenticated user making the request
        params: Dictionary of filter parameters:
            - favorite: bool - Filter by favorite status (rating >= user.favorite_min_rating)
            - public: bool - Filter by public photos only
            - hidden: bool - Filter by hidden photos
            - in_trashcan: bool - Filter by trashed photos
            - video: bool - Filter by videos only
            - photo: bool - Filter by photos only (non-videos)
            - person: int - Filter by person ID (faces)
            - folder: str - Filter by folder path prefix
            - username: str - Filter by owner username (for public photos)
            - show_all_stack_photos: bool - If True, show all photos in stacks (default: False)

    Returns:
        QuerySet[Photo]: Filtered photo queryset
    """
    filters = [Q(thumbnail__aspect_ratio__isnull=False)]

    # Owner filter - default to current user unless viewing public photos
    if not params.get("public"):
        filters.append(Q(owner=user))

    # Favorite filter
    if params.get("favorite"):
        min_rating = user.favorite_min_rating
        filters.append(Q(rating__gte=min_rating))

    # Public photos filter
    if params.get("public"):
        if params.get("username"):
            filters.append(Q(owner__username=params["username"]))
        filters.append(Q(public=True))

    # Hidden filter
    if params.get("hidden"):
        filters.append(Q(hidden=True))
    else:
        filters.append(Q(hidden=False))

    # Video/photo type filter
    if params.get("video"):
        filters.append(Q(video=True))
    elif params.get("photo"):
        filters.append(Q(video=False))

    # Trashcan filter
    if params.get("in_trashcan"):
        filters.append(Q(in_trashcan=True) & Q(removed=False))
    else:
        filters.append(Q(in_trashcan=False))

    # Person/face filter
    if params.get("person"):
        filters.append(Q(faces__person__id=params["person"]))

    # Folder path filter
    if params.get("folder"):
        filters.append(Q(files__path__startswith=params["folder"]))

    # Stack filtering: Show photos that are either:
    # 1. Not in any stack, OR
    # 2. The primary photo of their stack
    # This applies stacking behavior for ALL stack types (manual, burst, etc.)
    # Non-primary photos are hidden in the timeline but accessible via stack expansion
    if not params.get("show_all_stack_photos"):
        filters.append(
            Q(stacks__isnull=True) |
            Q(primary_in_stack__isnull=False)
        )

    return Photo.objects.filter(*filters).distinct()


================================================
FILE: api/views/photo_metadata.py
================================================
"""
API views for PhotoMetadata management.

Provides endpoints for:
- Viewing detailed metadata
- Editing metadata with history tracking
- Reverting metadata changes
- Viewing edit history
"""

from django.shortcuts import get_object_or_404
from drf_spectacular.utils import extend_schema, OpenApiParameter
from rest_framework.decorators import action
from rest_framework.permissions import IsAuthenticated
from rest_framework.response import Response
from rest_framework.views import APIView
from rest_framework.viewsets import ViewSet

from api.models import Photo
from api.models.photo_metadata import MetadataEdit, PhotoMetadata
from api.serializers.photo_metadata import (
    MetadataEditSerializer,
    PhotoMetadataSerializer,
    PhotoMetadataUpdateSerializer,
)


class PhotoMetadataViewSet(ViewSet):
    """
    ViewSet for photo metadata operations.
    
    Provides:
    - GET /api/photos/{photo_id}/metadata/ - Get full metadata
    - PATCH /api/photos/{photo_id}/metadata/ - Update metadata (creates history)
    - GET /api/photos/{photo_id}/metadata/history/ - Get edit history
    - POST /api/photos/{photo_id}/metadata/revert/{edit_id}/ - Revert a change
    """

    permission_classes = [IsAuthenticated]

    def _get_photo(self, request, photo_id: str) -> Photo:
        """Get photo by ID or image_hash, checking permissions."""
        # UUID format is 36 chars with 4 hyphens (xxxxxxxx-xxxx-xxxx-xxxx-xxxxxxxxxxxx)
        # MD5 hashes are 32 hex chars without hyphens
        # Python's uuid.UUID() accepts both, so we need to check format explicitly
        is_uuid_format = len(photo_id) == 36 and photo_id.count("-") == 4
        
        if is_uuid_format:
            photo = get_object_or_404(Photo, pk=photo_id)
        else:
            photo = get_object_or_404(Photo, image_hash=photo_id)
        
        # Check ownership
        if photo.owner != request.user and not request.user.is_staff:
            from rest_framework.exceptions import PermissionDenied
            raise PermissionDenied("You don't have permission to access this photo's metadata.")
        
        return photo

    def _get_or_create_metadata(self, photo: Photo) -> PhotoMetadata:
        """Get or create PhotoMetadata for a photo."""
        metadata, created = PhotoMetadata.objects.get_or_create(
            photo=photo,
            defaults={
                # If creating new, leave fields empty - they'll be populated on next scan
                "date_taken": photo.exif_timestamp,
                "gps_latitude": photo.exif_gps_lat,
                "gps_longitude": photo.exif_gps_lon,
                "rating": photo.rating,
                "source": PhotoMetadata.Source.EMBEDDED,
            }
        )
        return metadata

    @extend_schema(
        description="Get full structured metadata for a photo.",
        responses={200: PhotoMetadataSerializer},
    )
    def retrieve(self, request, photo_id: str):
        """Get full metadata for a photo."""
        photo = self._get_photo(request, photo_id)
        metadata = self._get_or_create_metadata(photo)
        serializer = PhotoMetadataSerializer(metadata)
        return Response(serializer.data)

    @extend_schema(
        description="Update photo metadata. Changes are tracked in edit history.",
        request=PhotoMetadataUpdateSerializer,
        responses={200: PhotoMetadataSerializer},
    )
    def partial_update(self, request, photo_id: str):
        """Update metadata with change tracking."""
        photo = self._get_photo(request, photo_id)
        metadata = self._get_or_create_metadata(photo)
        
        serializer = PhotoMetadataUpdateSerializer(
            metadata,
            data=request.data,
            partial=True,
            context={"request": request}
        )
        serializer.is_valid(raise_exception=True)
        serializer.save()
        
        # Return full metadata
        return Response(PhotoMetadataSerializer(metadata).data)

    @extend_schema(
        description="Get edit history for a photo's metadata.",
        responses={200: MetadataEditSerializer(many=True)},
    )
    @action(detail=True, methods=["get"], url_path="history")
    def history(self, request, photo_id: str):
        """Get edit history for a photo."""
        photo = self._get_photo(request, photo_id)
        edits = MetadataEdit.objects.filter(photo=photo).order_by("-created_at")
        
        # Pagination
        page = int(request.query_params.get("page", 1))
        page_size = int(request.query_params.get("page_size", 20))
        start = (page - 1) * page_size
        end = start + page_size
        
        serializer = MetadataEditSerializer(edits[start:end], many=True)
        return Response({
            "results": serializer.data,
            "count": edits.count(),
            "page": page,
            "page_size": page_size,
        })

    @extend_schema(
        description="Revert a specific metadata edit.",
        responses={200: PhotoMetadataSerializer},
    )
    @action(detail=True, methods=["post"], url_path=r"revert/(?P<edit_id>[^/.]+)")
    def revert(self, request, photo_id: str, edit_id: str):
        """Revert a specific metadata edit."""
        photo = self._get_photo(request, photo_id)
        edit = get_object_or_404(MetadataEdit, pk=edit_id, photo=photo)
        
        # Get or create metadata
        metadata = self._get_or_create_metadata(photo)
        
        # Restore the old value
        field_name = edit.field_name
        old_value = edit.old_value
        current_value = getattr(metadata, field_name, None)
        
        # Create a new edit record for the revert
        MetadataEdit.objects.create(
            photo=photo,
            user=request.user,
            field_name=field_name,
            old_value=current_value,
            new_value=old_value,
        )
        
        # Apply the revert
        setattr(metadata, field_name, old_value)
        metadata.version += 1
        metadata.save()
        
        return Response(PhotoMetadataSerializer(metadata).data)

    @extend_schema(
        description="Revert all edits and restore original embedded metadata.",
        responses={200: PhotoMetadataSerializer},
    )
    @action(detail=True, methods=["post"], url_path="revert-all")
    def revert_all(self, request, photo_id: str):
        """Revert all edits and restore original metadata from file by re-extracting EXIF."""
        photo = self._get_photo(request, photo_id)
        
        try:
            metadata = photo.metadata
            # Record the revert
            MetadataEdit.objects.create(
                photo=photo,
                user=request.user,
                field_name="_all",
                old_value={"action": "revert_all"},
                new_value={"source": "embedded"},
            )
            
            # Re-extract EXIF data from the file to restore original values
            # This will update PhotoMetadata with fresh data from the image file
            PhotoMetadata.extract_exif_data(photo, commit=True)
            
            # Refresh metadata from database
            metadata.refresh_from_db()
            metadata.source = PhotoMetadata.Source.EMBEDDED
            metadata.version += 1
            metadata.save()
            
        except PhotoMetadata.DoesNotExist:
            # If no metadata exists, extract it fresh
            metadata = PhotoMetadata.extract_exif_data(photo, commit=True)
        
        return Response(PhotoMetadataSerializer(metadata).data)


class BulkMetadataView(APIView):
    """
    Bulk metadata operations for multiple photos.
    """

    permission_classes = [IsAuthenticated]

    @extend_schema(
        description="Get metadata summary for multiple photos.",
        parameters=[
            OpenApiParameter("photo_ids", str, description="Comma-separated photo IDs or image hashes"),
        ],
    )
    def get(self, request):
        """Get metadata summary for multiple photos."""
        photo_ids = request.query_params.get("photo_ids", "").split(",")
        photo_ids = [pid.strip() for pid in photo_ids if pid.strip()]
        
        if not photo_ids:
            return Response({"error": "No photo_ids provided"}, status=400)
        
        if len(photo_ids) > 100:
            return Response({"error": "Maximum 100 photos per request"}, status=400)
        
        # Get photos (by UUID or image_hash)
        from django.db.models import Q
        import uuid
        
        uuid_ids = []
        hash_ids = []
        for pid in photo_ids:
            # UUID format: 36 chars with 4 hyphens (xxxxxxxx-xxxx-xxxx-xxxx-xxxxxxxxxxxx)
            # MD5 hashes are 32 hex chars without hyphens
            # Note: uuid.UUID() accepts both formats, so we must check explicitly
            is_uuid_format = len(pid) == 36 and pid.count("-") == 4
            if is_uuid_format:
                try:
                    uuid.UUID(pid)
                    uuid_ids.append(pid)
                except (ValueError, AttributeError):
                    hash_ids.append(pid)
            else:
                hash_ids.append(pid)
        
        photos = Photo.objects.filter(
            Q(pk__in=uuid_ids) | Q(image_hash__in=hash_ids),
            owner=request.user,
        ).select_related("metadata")
        
        results = {}
        for photo in photos:
            try:
                metadata = photo.metadata
                results[str(photo.id)] = {
                    "camera": metadata.camera_display,
                    "lens": metadata.lens_display,
                    "date_taken": metadata.date_taken,
                    "has_location": metadata.has_location,
                    "rating": metadata.rating,
                }
            except PhotoMetadata.DoesNotExist:
                # No metadata exists - return minimal info with None values
                results[str(photo.id)] = {
                    "camera": None,
                    "lens": None,
                    "date_taken": photo.exif_timestamp,
                    "has_location": photo.exif_gps_lat is not None,
                    "rating": photo.rating,
                }
        
        return Response(results)

    @extend_schema(
        description="Update metadata for multiple photos.",
    )
    def patch(self, request):
        """Bulk update metadata for multiple photos."""
        photo_ids = request.data.get("photo_ids", [])
        updates = request.data.get("updates", {})
        
        if not photo_ids:
            return Response({"error": "No photo_ids provided"}, status=400)
        
        if not updates:
            return Response({"error": "No updates provided"}, status=400)
        
        if len(photo_ids) > 100:
            return Response({"error": "Maximum 100 photos per request"}, status=400)
        
        # Validate allowed fields
        allowed_fields = {"title", "caption", "keywords", "rating", "copyright", "creator"}
        invalid_fields = set(updates.keys()) - allowed_fields
        if invalid_fields:
            return Response(
                {"error": f"Invalid fields: {invalid_fields}. Allowed: {allowed_fields}"},
                status=400
            )
        
        # Get photos
        from django.db.models import Q
        import uuid
        
        uuid_ids = []
        hash_ids = []
        for pid in photo_ids:
            pid_str = str(pid)
            # UUID format: 36 chars with 4 hyphens
            is_uuid_format = len(pid_str) == 36 and pid_str.count("-") == 4
            if is_uuid_format:
                try:
                    uuid.UUID(pid_str)
                    uuid_ids.append(pid)
                except (ValueError, AttributeError):
                    hash_ids.append(pid)
            else:
                hash_ids.append(pid)
        
        photos = Photo.objects.filter(
            Q(pk__in=uuid_ids) | Q(image_hash__in=hash_ids),
            owner=request.user,
        )
        
        updated_count = 0
        for photo in photos:
            metadata, _ = PhotoMetadata.objects.get_or_create(photo=photo)
            
            for field_name, new_value in updates.items():
                old_value = getattr(metadata, field_name, None)
                if old_value != new_value:
                    MetadataEdit.objects.create(
                        photo=photo,
                        user=request.user,
                        field_name=field_name,
                        old_value=old_value,
                        new_value=new_value,
                    )
                    setattr(metadata, field_name, new_value)
            
            metadata.source = PhotoMetadata.Source.USER_EDIT
            metadata.version += 1
            metadata.save()
            updated_count += 1
        
        return Response({
            "updated_count": updated_count,
            "message": f"Updated metadata for {updated_count} photos",
        })


================================================
FILE: api/views/photos.py
================================================
from django.db.models import Count, Prefetch, Q
from drf_spectacular.utils import OpenApiParameter, OpenApiTypes, extend_schema
from rest_framework import filters, status, viewsets
from rest_framework.decorators import action
from rest_framework.permissions import IsAdminUser
from rest_framework.response import Response
from rest_framework.views import APIView

from api.models import AlbumUser, File, Photo, User
from api.models.photo_stack import PhotoStack
from api.models.person import Person
from api.models.photo_caption import PhotoCaption
from api.permissions import IsOwnerOrReadOnly, IsPhotoOrAlbumSharedTo
from api.serializers.album_user import AlbumUserListSerializer
from api.serializers.photos import (
    PhotoDetailsSummarySerializer,
    PhotoEditSerializer,
    PhotoSerializer,
    PhotoSummarySerializer,
)
from api.util import logger
from api.views.custom_api_view import ListViewSet
from api.views.pagination import (
    HugeResultsSetPagination,
    RegularResultsSetPagination,
    StandardResultsSetPagination,
)


class RecentlyAddedPhotoListViewSet(ListViewSet):
    serializer_class = PhotoSummarySerializer
    pagination_class = HugeResultsSetPagination

    def get_queryset(self):
        latest_photo = self._get_latest_photo()
        if latest_photo is None:
            return Photo.objects.none()
        latest_date = latest_photo.added_on

        # Prefetch stacks with type filter and annotated photo count
        # to avoid N+1 queries in PhotoSummarySerializer.get_stacks()
        valid_stack_types = PhotoStack.VALID_STACK_TYPES + [
            PhotoStack.StackType.RAW_JPEG_PAIR,
            PhotoStack.StackType.LIVE_PHOTO,
        ]
        stacks_prefetch = Prefetch(
            "stacks",
            queryset=PhotoStack.objects.filter(
                stack_type__in=valid_stack_types
            ).annotate(photo_count_annotation=Count("photos")),
        )

        queryset = (
            Photo.visible.filter(
                Q(owner=self.request.user)
                & Q(thumbnail__aspect_ratio__isnull=False)
                & Q(added_on__date=latest_date.date())
            )
            .select_related("thumbnail", "search_instance", "main_file")
            .prefetch_related(
                Prefetch(
                    "owner",
                    queryset=User.objects.only(
                        "id", "username", "first_name", "last_name"
                    ),
                ),
                Prefetch(
                    "main_file__embedded_media",
                    queryset=File.objects.only("hash"),
                ),
                stacks_prefetch,
                "files",  # For get_has_raw_variant()
            )
            .only(
                "image_hash",
                "thumbnail__aspect_ratio",
                "thumbnail__dominant_color",
                "video",
                "main_file",
                "search_instance__search_location",
                "rating",
                "owner",
                "exif_gps_lat",
                "exif_gps_lon",
                "removed",
                "in_trashcan",
                "exif_timestamp",
                "video_length",
            )
            .order_by("-added_on")
        )
        return queryset

    def list(self, *args, **kwargs):
        queryset = self.get_queryset()
        latest_photo = self._get_latest_photo()
        latest_date = latest_photo.added_on if latest_photo else None
        serializer = PhotoSummarySerializer(queryset, many=True)
        return Response({"date": latest_date, "results": serializer.data})

    def _get_latest_photo(self):
        if not hasattr(self, "_latest_photo"):
            self._latest_photo = (
                Photo.visible.filter(Q(owner=self.request.user))
                .only("added_on")
                .order_by("-added_on")
                .first()
            )
        return self._latest_photo


class NoTimestampPhotoViewSet(ListViewSet):
    serializer_class = PhotoSummarySerializer
    pagination_class = RegularResultsSetPagination
    filter_backends = (filters.SearchFilter,)
    search_fields = [
        "search_instance__search_captions",
        "search_instance__search_location",
        "faces__person__name",
    ]

    def get_queryset(self):
        return (
            Photo.visible.filter(Q(exif_timestamp=None) & Q(owner=self.request.user))
            .select_related("thumbnail", "search_instance", "main_file")
            .prefetch_related(
                Prefetch(
                    "owner",
                    queryset=User.objects.only(
                        "id", "username", "first_name", "last_name"
                    ),
                ),
                Prefetch(
                    "main_file__embedded_media",
                    queryset=File.objects.only("hash"),
                ),
            )
            .only(
                "image_hash",
                "thumbnail__aspect_ratio",
                "thumbnail__dominant_color",
                "video",
                "main_file",
                "search_instance__search_location",
                "rating",
                "owner",
                "exif_gps_lat",
                "exif_gps_lon",
                "removed",
                "in_trashcan",
                "exif_timestamp",
                "video_length",
            )
            .order_by("added_on")
        )

    def list(self, *args, **kwargs):
        return super().list(*args, **kwargs)


class SetPhotosDeleted(APIView):
    def post(self, request, format=None):
        from api.views.photo_filters import build_photo_queryset

        data = dict(request.data)
        val_deleted = data["deleted"]

        # NEW: Support select_all mode for bulk operations
        if data.get("select_all"):
            query_params = data.get("query", {})
            excluded_hashes = data.get("excluded_hashes", [])

            photos_qs = build_photo_queryset(request.user, query_params)
            if excluded_hashes:
                photos_qs = photos_qs.exclude(image_hash__in=excluded_hashes)

            # If restoring from trash, reset stacks to pending for re-evaluation
            if not val_deleted:
                from api.models.stack_review import StackReview
                from api.models.photo_stack import PhotoStack

                # Get stack IDs from photos that have stacks (ManyToMany)
                stack_ids = set(
                    PhotoStack.objects.filter(photos__in=photos_qs).values_list(
                        "id", flat=True
                    )
                )
                if stack_ids:
                    StackReview.objects.filter(
                        stack_id__in=stack_ids, decision=StackReview.Decision.RESOLVED
                    ).update(decision=StackReview.Decision.PENDING)
                    logger.info(
                        f"Reset {len(stack_ids)} photo stacks to pending after restore"
                    )

            count = photos_qs.update(in_trashcan=val_deleted)

            if val_deleted:
                logger.info(
                    f"{count} photos were moved to trash via select_all for user {request.user.id}."
                )
            else:
                logger.info(
                    f"{count} photos were restored from trash via select_all for user {request.user.id}."
                )

            return Response({"status": True, "count": count})

        # Existing logic for individual hashes
        image_hashes = data["image_hashes"]

        # Get all photos with related data in one query to prevent N+1 queries from serializer
        photos = (
            Photo.objects.filter(image_hash__in=image_hashes, owner=request.user)
            .select_related("owner", "thumbnail", "main_file")
            .prefetch_related(
                "files", "faces__person", "shared_to", "main_file__embedded_media"
            )
        )

        # Also prefetch search and caption instances if they exist
        photos = photos.select_related("search_instance", "caption_instance")

        # Group photos by whether they need updating
        photos_to_update = []
        updated_data = []
        not_updated_data = []

        for photo in photos:
            if photo.in_trashcan != val_deleted:
                photos_to_update.append(photo.image_hash)
                photo.in_trashcan = val_deleted
                updated_data.append(PhotoSerializer(photo).data)
            else:
                not_updated_data.append(PhotoSerializer(photo).data)

        # Bulk update in one query
        if photos_to_update:
            Photo.objects.filter(
                image_hash__in=photos_to_update, owner=request.user
            ).update(in_trashcan=val_deleted)

            # If restoring from trash, reset stacks to pending for re-evaluation
            if not val_deleted:
                from api.models.stack_review import StackReview
                from api.models.photo_stack import PhotoStack

                # Get stack IDs from photos that have stacks (ManyToMany)
                stack_ids = set(
                    PhotoStack.objects.filter(
                        photos__image_hash__in=photos_to_update
                    ).values_list("id", flat=True)
                )
                if stack_ids:
                    StackReview.objects.filter(
                        stack_id__in=stack_ids, decision=StackReview.Decision.RESOLVED
                    ).update(decision=StackReview.Decision.PENDING)
                    logger.info(
                        f"Reset {len(stack_ids)} photo stacks to pending after restore"
                    )

        # Handle missing photos
        found_hashes = {photo.image_hash for photo in photos}
        missing_hashes = set(image_hashes) - found_hashes
        for missing_hash in missing_hashes:
            logger.warning(
                f"Could not set photo {missing_hash} to deleted. It does not exist or is not owned by user."
            )

        if val_deleted:
            logger.info(
                f"{len(updated_data)} photos were moved to trash. {len(not_updated_data)} photos were already in trash."
            )
        else:
            logger.info(
                f"{len(updated_data)} photos were restored from trash. {len(not_updated_data)} photos were already restored."
            )
        return Response(
            {
                "status": True,
                "results": updated_data,
                "updated": updated_data,
                "not_updated": not_updated_data,
            }
        )


class SetPhotosFavorite(APIView):
    def post(self, request, format=None):
        from api.views.photo_filters import build_photo_queryset

        data = dict(request.data)
        val_favorite = data["favorite"]
        user = request.user

        # NEW: Support select_all mode for bulk operations
        if data.get("select_all"):
            query_params = data.get("query", {})
            excluded_hashes = data.get("excluded_hashes", [])

            photos_qs = build_photo_queryset(request.user, query_params)
            if excluded_hashes:
                photos_qs = photos_qs.exclude(image_hash__in=excluded_hashes)

            if val_favorite:
                # Only update photos that aren't already favorites
                count = photos_qs.filter(rating__lt=user.favorite_min_rating).update(
                    rating=user.favorite_min_rating
                )
                logger.info(
                    f"{count} photos were added to favorites via select_all for user {user.id}."
                )
            else:
                # Only update photos that are currently favorites
                count = photos_qs.filter(rating__gte=user.favorite_min_rating).update(
                    rating=0
                )
                logger.info(
                    f"{count} photos were removed from favorites via select_all for user {user.id}."
                )

            return Response({"status": True, "count": count})

        # Existing logic for individual hashes
        image_hashes = data["image_hashes"]

        # Get all photos with related data in one query to prevent N+1 queries from serializer
        photos = (
            Photo.objects.filter(image_hash__in=image_hashes, owner=request.user)
            .select_related(
                "owner", "thumbnail", "main_file", "search_instance", "caption_instance"
            )
            .prefetch_related(
                "files", "faces__person", "shared_to", "main_file__embedded_media"
            )
        )

        # Group photos by whether they need updating
        photos_to_favorite = []
        photos_to_unfavorite = []
        updated_data = []
        not_updated_data = []

        for photo in photos:
            if val_favorite and photo.rating < user.favorite_min_rating:
                photos_to_favorite.append(photo.image_hash)
                photo.rating = user.favorite_min_rating
                updated_data.append(PhotoSerializer(photo).data)
            elif not val_favorite and photo.rating >= user.favorite_min_rating:
                photos_to_unfavorite.append(photo.image_hash)
                photo.rating = 0
                updated_data.append(PhotoSerializer(photo).data)
            else:
                not_updated_data.append(PhotoSerializer(photo).data)

        # Bulk update in separate queries for different rating values
        if photos_to_favorite:
            Photo.objects.filter(
                image_hash__in=photos_to_favorite, owner=request.user
            ).update(rating=user.favorite_min_rating)

        if photos_to_unfavorite:
            Photo.objects.filter(
                image_hash__in=photos_to_unfavorite, owner=request.user
            ).update(rating=0)

        # Handle missing photos
        found_hashes = {photo.image_hash for photo in photos}
        missing_hashes = set(image_hashes) - found_hashes
        for missing_hash in missing_hashes:
            logger.warning(
                f"Could not set photo {missing_hash} to favorite. It does not exist or is not owned by user."
            )

        if val_favorite:
            logger.info(
                f"{len(updated_data)} photos were added to favorites. {len(not_updated_data)} photos were already in favorites."
            )
        else:
            logger.info(
                f"{len(updated_data)} photos were removed from favorites. {len(not_updated_data)} photos were already not in favorites."
            )
        return Response(
            {
                "status": True,
                "results": updated_data,
                "updated": updated_data,
                "not_updated": not_updated_data,
            }
        )


class SetPhotosHidden(APIView):
    def post(self, request, format=None):
        from api.views.photo_filters import build_photo_queryset

        data = dict(request.data)
        val_hidden = data["hidden"]

        # NEW: Support select_all mode for bulk operations
        if data.get("select_all"):
            query_params = data.get("query", {})
            excluded_hashes = data.get("excluded_hashes", [])

            photos_qs = build_photo_queryset(request.user, query_params)
            if excluded_hashes:
                photos_qs = photos_qs.exclude(image_hash__in=excluded_hashes)

            count = photos_qs.update(hidden=val_hidden)

            if val_hidden:
                logger.info(
                    f"{count} photos were set hidden via select_all for user {request.user.id}."
                )
            else:
                logger.info(
                    f"{count} photos were set unhidden via select_all for user {request.user.id}."
                )

            return Response({"status": True, "count": count})

        # Existing logic for individual hashes
        image_hashes = data["image_hashes"]

        # Get all photos with related data in one query to prevent N+1 queries from serializer
        photos = (
            Photo.objects.filter(image_hash__in=image_hashes, owner=request.user)
            .select_related(
                "owner", "thumbnail", "main_file", "search_instance", "caption_instance"
            )
            .prefetch_related(
                "files", "faces__person", "shared_to", "main_file__embedded_media"
            )
        )

        # Group photos by whether they need updating
        photos_to_update = []
        updated_data = []
        not_updated_data = []

        for photo in photos:
            if photo.hidden != val_hidden:
                photos_to_update.append(photo.image_hash)
                photo.hidden = val_hidden
                updated_data.append(PhotoSerializer(photo).data)
            else:
                not_updated_data.append(PhotoSerializer(photo).data)

        # Bulk update in one query
        if photos_to_update:
            Photo.objects.filter(
                image_hash__in=photos_to_update, owner=request.user
            ).update(hidden=val_hidden)

        # Handle missing photos
        found_hashes = {photo.image_hash for photo in photos}
        missing_hashes = set(image_hashes) - found_hashes
        for missing_hash in missing_hashes:
            logger.warning(
                f"Could not set photo {missing_hash} to hidden. It does not exist or is not owned by user."
            )

        if val_hidden:
            logger.info(
                f"{len(updated_data)} photos were set hidden. {len(not_updated_data)} photos were already hidden."
            )
        else:
            logger.info(
                f"{len(updated_data)} photos were set unhidden. {len(not_updated_data)} photos were already unhidden."
            )
        return Response(
            {
                "status": True,
                "results": updated_data,
                "updated": updated_data,
                "not_updated": not_updated_data,
            }
        )


class PhotoViewSet(viewsets.ModelViewSet):
    serializer_class = PhotoSerializer
    pagination_class = HugeResultsSetPagination
    filter_backends = (filters.SearchFilter,)
    search_fields = [
        "search_instance__search_captions",
        "search_instance__search_location",
        "faces__person__name",
        "exif_timestamp",
        "main_file__path",
    ]

    def get_object(self):
        """
        Override get_object to support lookup by both UUID (pk) and image_hash.
        This provides backward compatibility with existing URLs using image_hash.
        """
        queryset = self.get_queryset()
        lookup_url_kwarg = self.lookup_url_kwarg or self.lookup_field
        lookup_value = self.kwargs.get(lookup_url_kwarg)

        if lookup_value:
            # Determine if this is a UUID (36 chars with hyphens) or image_hash (32 hex chars)
            # Note: Python's uuid.UUID() accepts 32 hex chars without hyphens, but those
            # are MD5 hashes used for backward compatibility, not actual UUIDs
            is_uuid_format = len(lookup_value) == 36 and lookup_value.count("-") == 4

            if is_uuid_format:
                try:
                    import uuid

                    uuid.UUID(lookup_value)
                    filter_kwargs = {"pk": lookup_value}
                except (ValueError, AttributeError):
                    filter_kwargs = {"image_hash": lookup_value}
            else:
                # 32 hex chars = MD5 image_hash (backward compatibility)
                filter_kwargs = {"image_hash": lookup_value}

            obj = queryset.filter(**filter_kwargs).first()
            if obj is None:
                from rest_framework.exceptions import NotFound

                raise NotFound()

            # May raise a permission denied
            self.check_object_permissions(self.request, obj)
            return obj

        return super().get_object()

    @action(
        detail=True,
        methods=["get"],
        name="summary",
        serializer_class=PhotoDetailsSummarySerializer,
    )
    def summary(self, request, pk):
        # Support both UUID and image_hash lookups
        # Note: 32 hex chars could parse as UUID but are actually MD5 hashes
        # Use Photo.objects instead of get_queryset() to include processing photos
        is_uuid_format = len(pk) == 36 and pk.count("-") == 4

        if is_uuid_format:
            try:
                import uuid

                uuid.UUID(pk)
                queryset = Photo.objects.filter(pk=pk)
            except (ValueError, AttributeError):
                queryset = Photo.objects.filter(image_hash=pk)
        else:
            queryset = Photo.objects.filter(image_hash=pk)

        if not queryset.exists():
            return Response(status=status.HTTP_404_NOT_FOUND)

        photo = queryset.first()
        # Check permissions - owner, shared, or public
        if not (
            photo.owner == request.user
            or photo.shared_to.filter(id=request.user.id).exists()
            or photo.public
        ):
            return Response(status=status.HTTP_404_NOT_FOUND)

        # Serializer expects a queryset (calls .get() internally)
        serializer = PhotoDetailsSummarySerializer(queryset, many=False)
        return Response(serializer.data)

    @action(
        detail=True,
        methods=["get"],
        name="albums",
        serializer_class=AlbumUserListSerializer,
    )
    def albums(self, request, pk):
        """Return user albums that contain this photo."""
        # Support both UUID and image_hash lookups
        try:
            import uuid

            uuid.UUID(pk)
            photo = Photo.objects.filter(pk=pk).first()
        except (ValueError, AttributeError):
            photo = Photo.objects.filter(image_hash=pk).first()

        if not photo:
            return Response(status=status.HTTP_404_NOT_FOUND)
        albums = AlbumUser.objects.filter(
            Q(photos=photo) & (Q(owner=request.user) | Q(shared_to=request.user))
        ).distinct()
        serializer = AlbumUserListSerializer(albums, many=True)
        return Response({"results": serializer.data})

    def get_permissions(self):
        if self.action in ("list", "retrieve", "summary", "albums"):
            permission_classes = [IsPhotoOrAlbumSharedTo]
        else:  # pragma: no cover - unused
            if getattr(self.request, "user", None) and self.request.user.is_staff:
                permission_classes = [IsAdminUser]
            else:
                permission_classes = [IsOwnerOrReadOnly]
        return [permission() for permission in permission_classes]

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return (
                Photo.visible.filter(Q(public=True))
                .prefetch_related("stacks")
                .order_by("-exif_timestamp")
            )
        else:
            # Include photos that are:
            # 1. Owned by the user
            # 2. Shared directly with the user
            # 3. Public (for retrieve access)
            # Note: Photos in shared albums are handled by the permission class
            return (
                Photo.visible.filter(
                    Q(owner=self.request.user)
                    | Q(shared_to=self.request.user)
                    | Q(public=True)
                )
                .prefetch_related("stacks")
                .order_by("-exif_timestamp")
            )

    def retrieve(self, *args, **kwargs):
        return super().retrieve(*args, **kwargs)

    def list(self, *args, **kwargs):  # pragma: no cover - unused
        return super().list(*args, **kwargs)


class PhotoEditViewSet(viewsets.ModelViewSet):
    serializer_class = PhotoEditSerializer
    pagination_class = StandardResultsSetPagination

    def get_queryset(self):
        return Photo.visible.filter(Q(owner=self.request.user))

    def get_object(self):
        """
        Override get_object to support lookup by both UUID (pk) and image_hash.
        """
        queryset = self.get_queryset()
        lookup_url_kwarg = self.lookup_url_kwarg or self.lookup_field
        lookup_value = self.kwargs.get(lookup_url_kwarg)

        if lookup_value:
            # Check if proper UUID format (36 chars with hyphens) vs MD5 hash (32 hex chars)
            is_uuid_format = len(lookup_value) == 36 and lookup_value.count("-") == 4

            if is_uuid_format:
                try:
                    import uuid

                    uuid.UUID(lookup_value)
                    filter_kwargs = {"pk": lookup_value}
                except (ValueError, AttributeError):
                    filter_kwargs = {"image_hash": lookup_value}
            else:
                filter_kwargs = {"image_hash": lookup_value}

            obj = queryset.filter(**filter_kwargs).first()
            if obj is None:
                from rest_framework.exceptions import NotFound

                raise NotFound()

            self.check_object_permissions(self.request, obj)
            return obj

        return super().get_object()

    def retrieve(
        self, *args, **kwargs
    ):  # pragma: no cover TODO(sickelap): remove unused code
        return super().retrieve(*args, **kwargs)

    def list(
        self, *args, **kwargs
    ):  # pragma: no cover TODO(sickelap): remove unused code
        return super().list(*args, **kwargs)


class SetPhotosShared(APIView):
    def post(self, request, format=None):
        from api.views.photo_filters import build_photo_queryset

        data = dict(request.data)
        shared = data["val_shared"]  # bool
        target_user_id = data["target_user_id"]  # user pk, int

        through_model = Photo.shared_to.through

        # NEW: Support select_all mode for bulk operations
        if data.get("select_all"):
            query_params = data.get("query", {})
            excluded_hashes = data.get("excluded_hashes", [])

            photos_qs = build_photo_queryset(request.user, query_params)
            if excluded_hashes:
                photos_qs = photos_qs.exclude(image_hash__in=excluded_hashes)

            image_hashes = list(photos_qs.values_list("image_hash", flat=True))
        else:
            image_hashes = data["image_hashes"]

        """
        From https://stackoverflow.com/questions/6996176/how-to-create-an-object-for-a-django-model-with-a-many-to-many-field/10116452#10116452
        # Access the through model directly
        ThroughModel = Sample.users.through

        users = Users.objects.filter(pk__in=[1,2])

        sample_object = Sample()
        sample_object.save()

        ThroughModel.objects.bulk_create([
            ThroughModel(users_id=users[0].pk, sample_id=sample_object.pk),
            ThroughModel(users_id=users[1].pk, sample_id=sample_object.pk)
        ])
        """

        # Look up photo UUIDs from image_hashes (image_hash is no longer the primary key)
        photos = Photo.objects.filter(image_hash__in=image_hashes).only(
            "id", "image_hash"
        )
        photo_ids = [photo.id for photo in photos]

        if shared:
            already_existing = through_model.objects.filter(
                user_id=target_user_id, photo_id__in=photo_ids
            ).only("photo_id")
            already_existing_photo_ids = set(e.photo_id for e in already_existing)
            res = through_model.objects.bulk_create(
                [
                    through_model(user_id=target_user_id, photo_id=photo_id)
                    for photo_id in photo_ids
                    if photo_id not in already_existing_photo_ids
                ]
            )
            logger.info(
                f"Shared {request.user.id}'s {len(res)} images to user {target_user_id}"
            )
            res_count = len(res)
        else:
            res = through_model.objects.filter(
                user_id=target_user_id, photo_id__in=photo_ids
            ).delete()
            logger.info(
                f"Unshared {request.user.id}'s {len(res)} images to user {target_user_id}"
            )
            res_count = res[0]

        return Response({"status": True, "count": res_count})


class SetPhotosPublic(APIView):
    def post(self, request, format=None):
        from api.views.photo_filters import build_photo_queryset

        data = dict(request.data)
        val_public = data["val_public"]

        # NEW: Support select_all mode for bulk operations
        if data.get("select_all"):
            query_params = data.get("query", {})
            excluded_hashes = data.get("excluded_hashes", [])

            photos_qs = build_photo_queryset(request.user, query_params)
            if excluded_hashes:
                photos_qs = photos_qs.exclude(image_hash__in=excluded_hashes)

            count = photos_qs.update(public=val_public)

            if val_public:
                logger.info(
                    f"{count} photos were set public via select_all for user {request.user.id}."
                )
            else:
                logger.info(
                    f"{count} photos were set private via select_all for user {request.user.id}."
                )

            return Response({"status": True, "count": count})

        # Existing logic for individual hashes
        image_hashes = data["image_hashes"]

        # Get all photos with related data in one query to prevent N+1 queries from serializer
        photos = (
            Photo.objects.filter(image_hash__in=image_hashes, owner=request.user)
            .select_related(
                "owner", "thumbnail", "main_file", "search_instance", "caption_instance"
            )
            .prefetch_related(
                "files", "faces__person", "shared_to", "main_file__embedded_media"
            )
        )

        # Group photos by whether they need updating
        photos_to_update = []
        updated_data = []
        not_updated_data = []

        for photo in photos:
            if photo.public != val_public:
                photos_to_update.append(photo.image_hash)
                photo.public = val_public
                updated_data.append(PhotoSerializer(photo).data)
            else:
                not_updated_data.append(PhotoSerializer(photo).data)

        # Bulk update in one query
        if photos_to_update:
            Photo.objects.filter(
                image_hash__in=photos_to_update, owner=request.user
            ).update(public=val_public)

        # Handle missing photos
        found_hashes = {photo.image_hash for photo in photos}
        missing_hashes = set(image_hashes) - found_hashes
        for missing_hash in missing_hashes:
            logger.warning(
                f"Could not set photo {missing_hash} to public. It does not exist or is not owned by user."
            )

        if val_public:
            logger.info(
                f"{len(updated_data)} photos were set public. {len(not_updated_data)} photos were already public."
            )
        else:
            logger.info(
                f"{len(updated_data)} photos were set private. {len(not_updated_data)} photos were already public."
            )

        return Response(
            {
                "status": True,
                "results": updated_data,
                "updated": updated_data,
                "not_updated": not_updated_data,
            }
        )


class GeneratePhotoCaption(APIView):
    permission_classes = (IsOwnerOrReadOnly,)

    def post(self, request, format=None):
        data = dict(request.data)
        image_hash = data["image_hash"]

        photo = Photo.objects.filter(image_hash=image_hash, owner=request.user).first()
        if photo is None:
            return Response(
                {"status": False, "message": "photo not found"},
                status=404,
            )

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        res = caption_instance.generate_captions_im2txt()

        if res:
            return Response({"status": True})
        else:
            return Response(
                {
                    "status": False,
                    "message": "Failed to generate caption. Check service logs for details.",
                },
                status=500,
            )


class SavePhotoCaption(APIView):
    permission_classes = (IsOwnerOrReadOnly,)

    def post(self, request, format=None):
        data = dict(request.data)
        image_hash = data["image_hash"]
        caption = data["caption"]

        photo = Photo.objects.filter(image_hash=image_hash, owner=request.user).first()
        if photo is None:
            return Response(
                {"status": False, "message": "photo not found"},
                status=404,
            )

        caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
        res = caption_instance.save_user_caption(caption)
        return Response({"status": res})


class DeletePhotos(APIView):
    def delete(self, request):
        from api.views.photo_filters import build_photo_queryset

        data = dict(request.data)

        # NEW: Support select_all mode for bulk operations
        if data.get("select_all"):
            query_params = data.get("query", {})
            excluded_hashes = data.get("excluded_hashes", [])

            # For delete, we need to ensure photos are in trashcan
            # Override query to filter for trashcan photos only
            query_params["in_trashcan"] = True

            photos_qs = build_photo_queryset(request.user, query_params)
            if excluded_hashes:
                photos_qs = photos_qs.exclude(image_hash__in=excluded_hashes)

            # Need to call manual_delete on each photo for proper cleanup
            deleted_count = 0
            for photo in photos_qs:
                if photo.owner == request.user:
                    photo.manual_delete()
                    deleted_count += 1

            logger.info(
                f"{deleted_count} photos were permanently deleted via select_all for user {request.user.id}."
            )

            return Response({"status": True, "count": deleted_count})

        # Existing logic for individual hashes
        # Use filter since image_hash may not be unique after UUID migration
        image_hashes = data["image_hashes"]
        photos = Photo.objects.filter(image_hash__in=image_hashes)
        photos_by_hash = {photo.image_hash: photo for photo in photos}

        deleted = []
        not_deleted = []
        for image_hash in image_hashes:
            photo = photos_by_hash.get(image_hash)
            if photo is None:
                continue  # Photo not found
            if photo.owner == request.user and photo.in_trashcan:
                deleted.append(photo.image_hash)
                photo.manual_delete()
            else:
                not_deleted.append(photo.image_hash)

        return Response(
            {
                "status": True,
                "results": deleted,
                "not_deleted": not_deleted,
                "deleted": deleted,
            }
        )


class FileVariantDownloadView(APIView):
    """
    Download a specific file variant for a photo.

    Supports downloading RAW, JPEG, video (Live Photo), or other variants
    associated with a Photo entity (PhotoPrism-like file variant model).
    """

    @extend_schema(
        parameters=[
            OpenApiParameter(
                "file_hash",
                OpenApiTypes.STR,
                description="Hash of the specific file variant to download",
            ),
        ],
    )
    def get(self, request, image_hash, file_hash):
        """Download a specific file variant by hash."""
        import magic
        import os
        from django.http import FileResponse, HttpResponse

        # Find the photo
        try:
            photo = Photo.objects.get(
                image_hash=image_hash,
                owner=request.user,
            )
        except Photo.DoesNotExist:
            return Response(
                {"error": "Photo not found"}, status=status.HTTP_404_NOT_FOUND
            )
        except Photo.MultipleObjectsReturned:
            # Multiple photos with same hash - get the one owned by user
            photo = Photo.objects.filter(
                image_hash=image_hash,
                owner=request.user,
            ).first()
            if not photo:
                return Response(
                    {"error": "Photo not found"}, status=status.HTTP_404_NOT_FOUND
                )

        # Find the requested file variant
        file_variant = photo.files.filter(hash=file_hash).first()
        if not file_variant:
            return Response(
                {"error": "File variant not found"}, status=status.HTTP_404_NOT_FOUND
            )

        # Check file exists
        if not os.path.exists(file_variant.path):
            return Response(
                {"error": "File not found on disk"}, status=status.HTTP_404_NOT_FOUND
            )

        # Serve the file
        try:
            response = FileResponse(
                open(file_variant.path, "rb"),
                as_attachment=True,
                filename=os.path.basename(file_variant.path),
            )

            # Set content type
            try:
                mime = magic.Magic(mime=True)
                response["Content-Type"] = mime.from_file(file_variant.path)
            except Exception:
                response["Content-Type"] = "application/octet-stream"

            return response

        except (FileNotFoundError, PermissionError) as e:
            logger.error(f"Error serving file {file_variant.path}: {e}")
            return Response(
                {"error": "Could not read file"},
                status=status.HTTP_500_INTERNAL_SERVER_ERROR,
            )


class SetMainFileView(APIView):
    """
    Set the main (primary) file for a photo.

    Changes which file variant is used as the main display file for the photo.
    Useful when a photo has multiple variants (RAW, JPEG, etc.).
    """

    def post(self, request, image_hash):
        """Set the main file for a photo."""
        file_hash = request.data.get("file_hash")

        if not file_hash:
            return Response(
                {"error": "file_hash is required"}, status=status.HTTP_400_BAD_REQUEST
            )

        # Find the photo
        try:
            photo = Photo.objects.get(
                image_hash=image_hash,
                owner=request.user,
            )
        except Photo.DoesNotExist:
            return Response(
                {"error": "Photo not found"}, status=status.HTTP_404_NOT_FOUND
            )
        except Photo.MultipleObjectsReturned:
            photo = Photo.objects.filter(
                image_hash=image_hash,
                owner=request.user,
            ).first()
            if not photo:
                return Response(
                    {"error": "Photo not found"}, status=status.HTTP_404_NOT_FOUND
                )

        # Find the requested file variant
        file_variant = photo.files.filter(hash=file_hash).first()
        if not file_variant:
            return Response(
                {"error": "File variant not found in this photo"},
                status=status.HTTP_404_NOT_FOUND,
            )

        # Update main file
        photo.main_file = file_variant
        photo.save(update_fields=["main_file", "last_modified"])

        logger.info(f"Set main file for photo {image_hash} to {file_hash}")

        return Response(
            {
                "status": "updated",
                "main_file_hash": file_hash,
            }
        )


class SaveMetadataView(APIView):
    def post(self, request, format=None):
        """Bulk-write metadata to image files for the authenticated user's photos.

        Accepts {"types": ["ratings", "face_tags"]} to control what gets written.
        Defaults to ["ratings"] if not specified.
        """
        metadata_types = request.data.get("types", ["ratings"])
        use_sidecar = (
            request.user.save_metadata_to_disk == User.SaveMetadata.SIDECAR_FILE
        )

        photos = Photo.objects.filter(owner=request.user)

        # When writing face tags, only include photos that have labeled faces
        if "face_tags" in metadata_types and metadata_types == ["face_tags"]:
            photos = photos.filter(
                faces__person__kind=Person.KIND_USER,
                faces__deleted=False,
            ).distinct()

        written = 0
        errors = 0
        for photo in photos.iterator():
            try:
                photo._save_metadata(
                    use_sidecar=use_sidecar, metadata_types=metadata_types
                )
                written += 1
            except Exception:
                errors += 1
                logger.exception(
                    f"Failed to save metadata for photo {photo.image_hash}"
                )

        return Response({"status": True, "written": written, "errors": errors})


================================================
FILE: api/views/public_albums.py
================================================
from django.db.models import Q
from django.utils import timezone
from django.utils.dateparse import parse_datetime
from drf_spectacular.utils import OpenApiParameter, OpenApiTypes, extend_schema
from rest_framework.permissions import AllowAny
from rest_framework.response import Response
from rest_framework.views import APIView

from api.models import AlbumUser, Photo
from api.models.album_user_share import AlbumUserShare
from api.serializers.album_user import (
    AlbumUserListSerializer,
    AlbumUserPublicSerializer,
)
from api.serializers.photos import PublicPhotoDetailSerializer


class SetUserAlbumPublic(APIView):
    def post(self, request, format=None):
        data = dict(request.data)
        val_public = data.get("val_public")
        album_id = data.get("album_id")
        slug = data.get("slug")
        expires_at = data.get("expires_at")  # ISO string or None
        
        # Sharing options - None means use user default, True/False overrides
        sharing_options = data.get("sharing_options", {})
        
        if album_id is None or val_public is None:
            return Response(
                {"status": False, "message": "Missing parameters"}, status=400
            )

        try:
            album = AlbumUser.objects.get(id=album_id)
        except AlbumUser.DoesNotExist:
            return Response({"status": False, "message": "No such album"}, status=404)

        if album.owner != request.user:
            return Response(
                {"status": False, "message": "You are not the owner of this album"},
                status=403,
            )

        share, _ = AlbumUserShare.objects.get_or_create(album=album)
        share.enabled = bool(val_public)
        if slug is not None:
            share.slug = slug or None
        if expires_at is not None:
            try:
                dt = parse_datetime(expires_at)
                share.expires_at = dt
            except Exception:
                pass
        
        # Update sharing options if provided
        if sharing_options:
            # Each option can be True, False, or None (use default)
            if "share_location" in sharing_options:
                share.share_location = sharing_options.get("share_location")
            if "share_camera_info" in sharing_options:
                share.share_camera_info = sharing_options.get("share_camera_info")
            if "share_timestamps" in sharing_options:
                share.share_timestamps = sharing_options.get("share_timestamps")
            if "share_captions" in sharing_options:
                share.share_captions = sharing_options.get("share_captions")
            if "share_faces" in sharing_options:
                share.share_faces = sharing_options.get("share_faces")
        
        share.save()

        return Response({"status": True, "album": AlbumUserListSerializer(album).data})


class PublicAlbumBySlug(APIView):
    permission_classes = [AllowAny]

    @extend_schema(
        parameters=[OpenApiParameter("slug", OpenApiTypes.STR)],
        description="Returns a public user album by slug if active",
    )
    def get(self, request, slug):
        album = (
            AlbumUser.objects.filter(Q(share__enabled=True) & Q(share__slug=slug))
            .filter(
                Q(share__expires_at__isnull=True)
                | Q(share__expires_at__gte=timezone.now())
            )
            .select_related("share", "owner")
            .first()
        )
        if not album:
            return Response(status=404)
        
        # Include effective sharing settings in response
        sharing_settings = album.share.get_effective_sharing_settings()
        
        serializer = AlbumUserPublicSerializer(album, context={"request": request})
        return Response({
            "results": serializer.data,
            "sharing_settings": sharing_settings,
        })


class PublicPhotoDetailBySlug(APIView):
    """Get photo details for a photo in a publicly shared album."""
    
    permission_classes = [AllowAny]

    @extend_schema(
        parameters=[
            OpenApiParameter("slug", OpenApiTypes.STR, description="Album share slug"),
            OpenApiParameter("photo_id", OpenApiTypes.STR, description="Photo ID or image hash"),
        ],
        description="Returns photo details for a photo in a public album, filtered by sharing settings",
    )
    def get(self, request, slug, photo_id):
        # Find the public album
        album = (
            AlbumUser.objects.filter(Q(share__enabled=True) & Q(share__slug=slug))
            .filter(
                Q(share__expires_at__isnull=True)
                | Q(share__expires_at__gte=timezone.now())
            )
            .select_related("share", "owner")
            .first()
        )
        if not album:
            return Response({"error": "Album not found or not public"}, status=404)
        
        # Find the photo - support both UUID and image_hash lookups
        # UUID format is 36 chars with hyphens, image_hash is 32 hex chars
        is_uuid_format = len(photo_id) == 36 and photo_id.count("-") == 4
        
        if is_uuid_format:
            photo = album.photos.filter(
                pk=photo_id,
                hidden=False,
                in_trashcan=False,
            ).first()
        else:
            photo = album.photos.filter(
                image_hash=photo_id,
                hidden=False,
                in_trashcan=False,
            ).first()
        
        if not photo:
            return Response({"error": "Photo not found in album"}, status=404)
        
        # Get effective sharing settings
        sharing_settings = album.share.get_effective_sharing_settings()
        
        # Serialize with sharing settings in context
        serializer = PublicPhotoDetailSerializer(
            photo,
            context={"request": request, "sharing_settings": sharing_settings}
        )
        
        return Response({
            "results": serializer.data,
            "sharing_settings": sharing_settings,
        })


================================================
FILE: api/views/search.py
================================================
from django.db.models import Prefetch, Q
from rest_framework.response import Response

from api.filters import SemanticSearchFilter
from api.models import File, Photo, User
from api.serializers.photos import GroupedPhotosSerializer, PhotoSummarySerializer
from api.serializers.PhotosGroupedByDate import get_photos_ordered_by_date
from api.views.custom_api_view import ListViewSet
from api.views.pagination import HugeResultsSetPagination


class SearchListViewSet(ListViewSet):
    serializer_class = GroupedPhotosSerializer
    pagination_class = HugeResultsSetPagination
    filter_backends = (SemanticSearchFilter,)

    search_fields = [
        "search_instance__search_captions",
        "search_instance__search_location",
        "exif_timestamp",
    ]

    def get_queryset(self):
        return Photo.visible.filter(Q(owner=self.request.user)).order_by(
            "-exif_timestamp"
        )

    def list(self, request):
        if request.user.semantic_search_topk == 0:
            queryset = self.filter_queryset(
                Photo.visible.filter(Q(owner=self.request.user))
                .select_related("thumbnail", "search_instance", "main_file")
                .prefetch_related(
                    Prefetch(
                        "owner",
                        queryset=User.objects.only(
                            "id", "username", "first_name", "last_name"
                        ),
                    ),
                    Prefetch(
                        "main_file__embedded_media",
                        queryset=File.objects.only("hash"),
                    ),
                )
                .order_by("-exif_timestamp")
                .only(
                    "image_hash",
                    "thumbnail__aspect_ratio",
                    "thumbnail__dominant_color",
                    "video",
                    "main_file",
                    "search_instance__search_location",
                    "public",
                    "rating",
                    "hidden",
                    "exif_timestamp",
                    "owner",
                    "video_length",
                    "exif_gps_lat",
                    "exif_gps_lon",
                    "removed",
                    "in_trashcan",
                )
            )
            grouped_photos = get_photos_ordered_by_date(queryset)
            serializer = GroupedPhotosSerializer(grouped_photos, many=True)
            return Response({"results": serializer.data})
        else:
            queryset = self.filter_queryset(
                Photo.visible.filter(Q(owner=self.request.user))
                .select_related("thumbnail", "search_instance", "main_file")
                .prefetch_related(
                    Prefetch(
                        "owner",
                        queryset=User.objects.only(
                            "id", "username", "first_name", "last_name"
                        ),
                    ),
                    Prefetch(
                        "main_file__embedded_media",
                        queryset=File.objects.only("hash"),
                    ),
                )
                .only(
                    "image_hash",
                    "thumbnail__aspect_ratio",
                    "thumbnail__dominant_color",
                    "video",
                    "main_file",
                    "search_instance__search_location",
                    "public",
                    "rating",
                    "hidden",
                    "exif_timestamp",
                    "owner",
                    "video_length",
                    "exif_gps_lat",
                    "exif_gps_lon",
                    "removed",
                    "in_trashcan",
                )
            )
            serializer = PhotoSummarySerializer(queryset, many=True)
            return Response({"results": serializer.data})


================================================
FILE: api/views/services.py
================================================
from rest_framework import status, viewsets
from rest_framework.decorators import action
from rest_framework.permissions import IsAdminUser
from rest_framework.response import Response

from api.services import SERVICES, is_healthy, start_service, stop_service


class ServiceViewSet(viewsets.ViewSet):
    permission_classes = [IsAdminUser]

    def list(self, request):
        return Response({"services": SERVICES})

    def retrieve(self, request, pk=None):
        service_name = pk

        if service_name not in SERVICES:
            return Response(
                {"error": f"Service {service_name} not found"},
                status=status.HTTP_404_NOT_FOUND,
            )

        healthy = is_healthy(service_name)
        return Response({"service_name": service_name, "healthy": healthy})

    @action(detail=True, methods=["post"])
    def start(self, request, pk=None):
        service_name = pk

        if service_name not in SERVICES:
            return Response(
                {"error": f"Service {service_name} not found"},
                status=status.HTTP_404_NOT_FOUND,
            )

        start_result = start_service(service_name)
        if start_result:
            return Response(
                {"message": f"Service {service_name} started successfully"},
                status=status.HTTP_200_OK,
            )
        else:
            return Response(
                {"error": f"Failed to start service {service_name}"},
                status=status.HTTP_500_INTERNAL_SERVER_ERROR,
            )

    @action(detail=True, methods=["post"])
    def stop(self, request, pk=None):
        service_name = pk

        if service_name not in SERVICES:
            return Response(
                {"error": f"Service {service_name} not found"},
                status=status.HTTP_404_NOT_FOUND,
            )

        stop_result = stop_service(service_name)
        if stop_result:
            return Response(
                {"message": f"Service {service_name} stopped successfully"},
                status=status.HTTP_200_OK,
            )
        else:
            return Response(
                {"error": f"Failed to stop service {service_name}"},
                status=status.HTTP_500_INTERNAL_SERVER_ERROR,
            )


================================================
FILE: api/views/sharing.py
================================================
from django.db.models import Count, Prefetch, Q

from api.models import AlbumUser, Photo, User
from api.serializers.album_user import AlbumUserListSerializer
from api.serializers.photos import (
    PhotoSummarySerializer,
    SharedFromMePhotoThroughSerializer,
)
from api.views.custom_api_view import ListViewSet
from api.views.pagination import HugeResultsSetPagination


class SharedToMePhotoSuperSimpleListViewSet(ListViewSet):
    serializer_class = PhotoSummarySerializer
    pagination_class = HugeResultsSetPagination

    def get_queryset(self):
        return (
            Photo.visible.filter(Q(shared_to__id__exact=self.request.user.id))
            .only(
                "image_hash",
                "public",
                "rating",
                "owner",
                "hidden",
                "exif_timestamp",
            )
            .prefetch_related("owner")
            .order_by("exif_timestamp")
        )


class SharedFromMePhotoSuperSimpleListViewSet(ListViewSet):
    serializer_class = SharedFromMePhotoThroughSerializer
    pagination_class = HugeResultsSetPagination

    def get_queryset(self):
        ThroughModel = Photo.shared_to.through

        user_photos = Photo.visible.filter(Q(owner=self.request.user.id)).only(
            "image_hash"
        )
        qs = (
            ThroughModel.objects.filter(photo_id__in=user_photos)
            .prefetch_related(
                Prefetch(
                    "user",
                    queryset=User.objects.only(
                        "id", "username", "first_name", "last_name"
                    ),
                )
            )
            .prefetch_related(
                Prefetch(
                    "photo",
                    queryset=Photo.objects.filter(hidden=False).only(
                        "image_hash", "rating", "hidden", "exif_timestamp", "public"
                    ),
                )
            )
            .order_by("photo__exif_timestamp")
        )
        return qs


class SharedToMeAlbumUserListViewSet(ListViewSet):
    serializer_class = AlbumUserListSerializer
    pagination_class = HugeResultsSetPagination

    def get_queryset(self):
        return AlbumUser.objects.filter(shared_to__id__exact=self.request.user.id).order_by("id")


class SharedFromMeAlbumUserListViewSet(ListViewSet):
    serializer_class = AlbumUserListSerializer
    pagination_class = HugeResultsSetPagination

    def get_queryset(self):
        return (
            AlbumUser.objects.annotate(shared_to_count=Count("shared_to"))
            .filter(shared_to_count__gt=0)
            .filter(owner=self.request.user.id)
            .order_by("id")
        )


================================================
FILE: api/views/stacks.py
================================================
"""
API views for PhotoStack management - organizational photo grouping.

Handles organizational stack types: burst sequences, exposure brackets,
and manual stacks.

NOTE: RAW+JPEG pairs and Live Photos are NO LONGER stacks. They use
the Photo.files field for file variants (PhotoPrism-like model).

NOTE: Duplicates (exact copies and visual duplicates) are handled 
separately by the duplicates API in api/views/duplicates.py.
Stacks are for organization, duplicates are for storage cleanup.
"""

from django.core.paginator import Paginator
from django.db.models import Count
from django_q.tasks import async_task
from drf_spectacular.utils import OpenApiParameter, extend_schema
from rest_framework import status
from rest_framework.permissions import IsAuthenticated
from rest_framework.response import Response
from rest_framework.views import APIView

from api.models import Photo
from api.models.photo_stack import PhotoStack
from api.util import logger


class PhotoStackListView(APIView):
    """List all photo stacks for the current user with pagination and filters."""

    permission_classes = [IsAuthenticated]

    @extend_schema(
        parameters=[
            OpenApiParameter(
                "stack_type",
                str,
                description="Filter by stack type: raw_jpeg, burst, bracket, live_photo, manual",
            ),
            OpenApiParameter(
                "page",
                int,
                description="Page number (default: 1)",
            ),
            OpenApiParameter(
                "page_size",
                int,
                description="Number of items per page (default: 20, max: 100)",
            ),
        ],
    )
    def get(self, request):
        stack_type_filter = request.query_params.get("stack_type", None)
        
        # Safely parse pagination parameters with defaults for invalid input
        try:
            page = max(1, int(request.query_params.get("page", 1)))
        except (ValueError, TypeError):
            page = 1
        
        try:
            page_size = max(1, min(int(request.query_params.get("page_size", 20)), 100))
        except (ValueError, TypeError):
            page_size = 20

        # Use model-defined valid stack types (excludes deprecated RAW_JPEG_PAIR, LIVE_PHOTO)
        valid_stack_types = PhotoStack.VALID_STACK_TYPES

        stacks = PhotoStack.objects.filter(
            owner=request.user,
            stack_type__in=valid_stack_types
        ).prefetch_related(
            "photos__thumbnail", "primary_photo__thumbnail"
        ).annotate(
            photos_count=Count("photos")
        ).order_by("-created_at")

        if stack_type_filter:
            # Validate that the filter is a valid organizational stack type
            # valid_stack_types contains TextChoices values which are strings
            if stack_type_filter in [str(st) for st in valid_stack_types]:
                stacks = stacks.filter(stack_type=stack_type_filter)

        # Only return stacks with at least 2 photos
        stacks = stacks.filter(photos_count__gte=2)

        # Paginate results
        paginator = Paginator(stacks, page_size)
        page_obj = paginator.get_page(page)

        # Serialize manually to include nested photo data
        results = []
        for stack in page_obj.object_list:
            photos = stack.photos.all()[:4]  # Preview first 4 photos
            results.append({
                "id": str(stack.id),
                "stack_type": stack.stack_type,
                "stack_type_display": stack.get_stack_type_display(),
                "photo_count": stack.photos_count,
                "sequence_start": stack.sequence_start,
                "sequence_end": stack.sequence_end,
                "created_at": stack.created_at,
                "primary_photo": {
                    "image_hash": stack.primary_photo.image_hash,
                    "thumbnail_url": f"/media/square_thumbnails_small/{stack.primary_photo.image_hash}" if hasattr(stack.primary_photo, 'thumbnail') and stack.primary_photo.thumbnail.square_thumbnail_small else None,
                } if stack.primary_photo else None,
                "preview_photos": [
                    {
                        "image_hash": p.image_hash,
                        "thumbnail_url": f"/media/square_thumbnails_small/{p.image_hash}" if hasattr(p, 'thumbnail') and p.thumbnail.square_thumbnail_small else None,
                    }
                    for p in photos
                ],
            })

        return Response({
            "results": results,
            "count": paginator.count,
            "num_pages": paginator.num_pages,
            "page": page,
            "page_size": page_size,
            "has_next": page_obj.has_next(),
            "has_previous": page_obj.has_previous(),
        })


class PhotoStackDetailView(APIView):
    """Get details of a specific photo stack with all photos."""

    permission_classes = [IsAuthenticated]

    def get(self, request, stack_id):
        # Use model-defined valid stack types (excludes deprecated RAW_JPEG_PAIR, LIVE_PHOTO)
        # Also include deprecated types for viewing existing stacks during migration
        all_stack_types = PhotoStack.VALID_STACK_TYPES + [
            PhotoStack.StackType.RAW_JPEG_PAIR,
            PhotoStack.StackType.LIVE_PHOTO,
        ]
        
        try:
            stack = PhotoStack.objects.annotate(
                photos_count=Count("photos")
            ).get(id=stack_id, owner=request.user, stack_type__in=all_stack_types)
        except PhotoStack.DoesNotExist:
            return Response(
                {"error": "Photo stack not found"}, status=status.HTTP_404_NOT_FOUND
            )

        photos = stack.photos.select_related('thumbnail', 'main_file', 'metadata').prefetch_related('files').all()

        photo_data = []
        for p in photos:
            # Width, height, and camera are on the metadata model
            width = None
            height = None
            camera = None
            if hasattr(p, 'metadata') and p.metadata:
                width = p.metadata.width
                height = p.metadata.height
                camera = p.metadata.camera_model

            # Get all file variants for this photo
            file_variants = []
            for f in p.files.all():
                file_variants.append({
                    "hash": f.hash,
                    "path": f.path,
                    "type": f.get_type_display().lower(),
                    "is_main": p.main_file and f.hash == p.main_file.hash,
                    "filename": f.path.split("/")[-1] if f.path else None,
                })

            data = {
                "id": str(p.id),
                "image_hash": p.image_hash,
                "width": width,
                "height": height,
                "size": p.size,
                "camera": camera,
                "exif_timestamp": p.exif_timestamp,
                "is_primary": stack.primary_photo and p.image_hash == stack.primary_photo.image_hash,
                "file_path": p.main_file.path if p.main_file else None,
                "file_type": p.main_file.get_type_display().lower() if p.main_file else None,
                "file_variants": file_variants if file_variants else None,
                "thumbnail_url": f"/media/square_thumbnails_small/{p.image_hash}" if hasattr(p, 'thumbnail') and p.thumbnail.square_thumbnail_small else None,
                "thumbnail_big_url": f"/media/thumbnails_big/{p.image_hash}" if hasattr(p, 'thumbnail') and p.thumbnail.thumbnail_big else None,
            }
            photo_data.append(data)

        return Response({
            "id": str(stack.id),
            "stack_type": stack.stack_type,
            "stack_type_display": stack.get_stack_type_display(),
            "photo_count": stack.photos_count,
            "sequence_start": stack.sequence_start,
            "sequence_end": stack.sequence_end,
            "created_at": stack.created_at,
            "updated_at": stack.updated_at,
            "primary_photo_hash": stack.primary_photo.image_hash if stack.primary_photo else None,
            "photos": photo_data,
        })

    def delete(self, request, stack_id):
        """Delete a stack (unlinks photos but doesn't delete them)."""
        try:
            stack = PhotoStack.objects.get(id=stack_id, owner=request.user)
        except PhotoStack.DoesNotExist:
            return Response(
                {"error": "Photo stack not found"}, status=status.HTTP_404_NOT_FOUND
            )

        # Unlink photos from this stack (ManyToMany)
        photo_count = stack.photos.count()
        for photo in stack.photos.all():
            photo.stacks.remove(stack)

        # Delete stack
        stack_id_str = str(stack.id)
        stack.delete()

        logger.info(f"Deleted stack {stack_id_str}: unlinked {photo_count} photos")
        return Response({
            "status": "deleted",
            "unlinked_count": photo_count
        })


class PhotoStackDeleteView(APIView):
    """Delete a stack (unlinks photos but doesn't delete them)."""

    permission_classes = [IsAuthenticated]

    def delete(self, request, stack_id):
        try:
            stack = PhotoStack.objects.get(id=stack_id, owner=request.user)
        except PhotoStack.DoesNotExist:
            return Response(
                {"error": "Photo stack not found"}, status=status.HTTP_404_NOT_FOUND
            )

        # Unlink photos from this stack (ManyToMany)
        photo_count = stack.photos.count()
        for photo in stack.photos.all():
            photo.stacks.remove(stack)

        # Delete stack
        stack_id_str = str(stack.id)
        stack.delete()

        logger.info(f"Deleted stack {stack_id_str}: unlinked {photo_count} photos")
        return Response({
            "status": "deleted",
            "unlinked_count": photo_count
        })


class PhotoStackSetPrimaryView(APIView):
    """Set the primary (cover) photo for a stack."""

    permission_classes = [IsAuthenticated]

    def post(self, request, stack_id):
        try:
            stack = PhotoStack.objects.get(id=stack_id, owner=request.user)
        except PhotoStack.DoesNotExist:
            return Response(
                {"error": "Photo stack not found"}, status=status.HTTP_404_NOT_FOUND
            )

        photo_hash = request.data.get("photo_hash")
        if not photo_hash:
            return Response(
                {"error": "photo_hash is required"},
                status=status.HTTP_400_BAD_REQUEST
            )

        try:
            photo = stack.photos.get(image_hash=photo_hash)
        except Photo.DoesNotExist:
            return Response(
                {"error": "Photo not found in this stack"},
                status=status.HTTP_400_BAD_REQUEST
            )

        stack.primary_photo = photo
        stack.save(update_fields=['primary_photo', 'updated_at'])

        logger.info(f"Set primary photo for stack {stack.id} to {photo_hash}")
        return Response({
            "status": "updated",
            "primary_photo_hash": photo_hash
        })


class DetectStacksView(APIView):
    """Trigger stack detection for the current user (bursts, brackets).
    
    NOTE: RAW+JPEG pairs and Live Photos are now handled as file variants
    during scan (PhotoPrism-like model), not as stacks.
    
    Burst detection uses the user's configured burst_detection_rules from their profile.
    """

    permission_classes = [IsAuthenticated]

    @extend_schema(
        parameters=[
            OpenApiParameter(
                "detect_bursts",
                bool,
                description="Detect burst sequences using user's configured rules (default: true)",
            ),
        ],
    )
    def post(self, request):
        from api.stack_detection import batch_detect_stacks
        
        # RAW+JPEG and Live Photos are now file variants, not stacks
        # Only burst/bracket detection is done here
        options = {
            'detect_bursts': request.data.get('detect_bursts', True),
        }

        # Queue background job
        async_task(batch_detect_stacks, request.user, options)
        
        logger.info(f"Stack detection queued for user {request.user.username} with options: {options}")
        return Response(
            {
                "status": "queued",
                "message": "Stack detection started",
                "options": options,
            },
            status=status.HTTP_202_ACCEPTED,
        )


class PhotoStackStatsView(APIView):
    """Get stack statistics for the current user."""

    permission_classes = [IsAuthenticated]

    def get(self, request):
        # Include all stack types for stats (shows deprecated types for migration visibility)
        all_stack_types = PhotoStack.VALID_STACK_TYPES + [
            PhotoStack.StackType.RAW_JPEG_PAIR,
            PhotoStack.StackType.LIVE_PHOTO,
        ]
        
        stacks = PhotoStack.objects.filter(
            owner=request.user,
            stack_type__in=all_stack_types
        )
        
        # Count by type (includes deprecated types so users can see migration progress)
        by_type = {}
        for stack_type in all_stack_types:
            by_type[stack_type] = stacks.filter(stack_type=stack_type).count()
        
        # Count photos in stacks (ManyToMany - photos with at least one valid organizational stack)
        photos_in_stacks = Photo.objects.filter(
            owner=request.user,
            stacks__stack_type__in=all_stack_types
        ).distinct().count()
        
        total_photos = Photo.objects.filter(
            owner=request.user, hidden=False, in_trashcan=False
        ).count()

        return Response({
            "total_stacks": stacks.count(),
            "by_type": by_type,
            "photos_in_stacks": photos_in_stacks,
            "total_photos": total_photos,
        })


class CreateManualStackView(APIView):
    """Create a manual stack from selected photos."""

    permission_classes = [IsAuthenticated]

    def post(self, request):
        photo_hashes = request.data.get("photo_hashes", [])
        
        # De-duplicate the input to handle repeated hashes
        unique_hashes = list(dict.fromkeys(photo_hashes))  # Preserves order
        
        if len(unique_hashes) < 2:
            return Response(
                {"error": "At least 2 unique photos required to create a stack"},
                status=status.HTTP_400_BAD_REQUEST
            )

        # Verify all photos exist and belong to user
        photos = Photo.objects.filter(
            owner=request.user,
            image_hash__in=unique_hashes
        )
        
        if photos.count() != len(unique_hashes):
            return Response(
                {"error": "Some photos not found"},
                status=status.HTTP_400_BAD_REQUEST
            )

        # Check if any photo is already in a manual stack
        existing_stack = None
        for photo in photos:
            manual_stack = photo.stacks.filter(stack_type=PhotoStack.StackType.MANUAL).first()
            if manual_stack:
                existing_stack = manual_stack
                break
        
        if existing_stack:
            # Add to existing stack (ManyToMany)
            stack = existing_stack
            for photo in photos:
                if not photo.stacks.filter(pk=stack.pk).exists():
                    photo.stacks.add(stack)
        else:
            # Create new manual stack
            stack = PhotoStack.objects.create(
                owner=request.user,
                stack_type=PhotoStack.StackType.MANUAL,
            )
            for photo in photos:
                photo.stacks.add(stack)
        
        stack.auto_select_primary()
        
        logger.info(f"Created/updated MANUAL stack {stack.id} with {photos.count()} photos")
        return Response({
            "status": "created",
            "stack_id": str(stack.id),
            "photo_count": photos.count(),
        }, status=status.HTTP_201_CREATED)


class AddToStackView(APIView):
    """Add photos to an existing stack."""

    permission_classes = [IsAuthenticated]

    def post(self, request, stack_id):
        try:
            stack = PhotoStack.objects.get(id=stack_id, owner=request.user)
        except PhotoStack.DoesNotExist:
            return Response(
                {"error": "Photo stack not found"}, status=status.HTTP_404_NOT_FOUND
            )

        photo_hashes = request.data.get("photo_hashes", [])
        if not photo_hashes:
            return Response(
                {"error": "photo_hashes is required"},
                status=status.HTTP_400_BAD_REQUEST
            )

        photos = Photo.objects.filter(
            owner=request.user,
            image_hash__in=photo_hashes
        )
        
        added_count = 0
        for photo in photos:
            if not photo.stacks.filter(pk=stack.pk).exists():
                photo.stacks.add(stack)
                added_count += 1

        logger.info(f"Added {added_count} photos to stack {stack.id}")
        return Response({
            "status": "updated",
            "added_count": added_count,
            "total_count": stack.photos.count(),
        })


class RemoveFromStackView(APIView):
    """Remove photos from a stack."""

    permission_classes = [IsAuthenticated]

    def post(self, request, stack_id):
        try:
            stack = PhotoStack.objects.get(id=stack_id, owner=request.user)
        except PhotoStack.DoesNotExist:
            return Response(
                {"error": "Photo stack not found"}, status=status.HTTP_404_NOT_FOUND
            )

        photo_hashes = request.data.get("photo_hashes", [])
        if not photo_hashes:
            return Response(
                {"error": "photo_hashes is required"},
                status=status.HTTP_400_BAD_REQUEST
            )

        photos = Photo.objects.filter(
            owner=request.user,
            image_hash__in=photo_hashes
        )
        
        removed_count = 0
        for photo in photos:
            if photo.stacks.filter(pk=stack.pk).exists():
                photo.stacks.remove(stack)
                removed_count += 1

        # Delete stack if it now has fewer than 2 photos
        remaining_count = stack.photos.count()
        if remaining_count < 2:
            stack.delete()
            logger.info(f"Deleted stack {stack_id} after removing photos (only {remaining_count} left)")
            return Response({
                "status": "deleted",
                "removed_count": removed_count,
                "message": "Stack deleted because fewer than 2 photos remain",
            })

        # Update primary if it was removed
        if stack.primary_photo and stack.primary_photo.image_hash in photo_hashes:
            stack.auto_select_primary()

        logger.info(f"Removed {removed_count} photos from stack {stack.id}")
        return Response({
            "status": "updated",
            "removed_count": removed_count,
            "total_count": remaining_count,
        })


class MergeStacksView(APIView):
    """Merge all manual stacks containing any of the selected photos into one stack."""

    permission_classes = [IsAuthenticated]

    def post(self, request):
        photo_hashes = request.data.get("photo_hashes", [])
        
        if not photo_hashes:
            return Response(
                {"error": "photo_hashes is required"},
                status=status.HTTP_400_BAD_REQUEST
            )

        # De-duplicate the input to handle repeated hashes
        unique_hashes = list(dict.fromkeys(photo_hashes))  # Preserves order

        # Verify all photos exist and belong to user
        photos = Photo.objects.filter(
            owner=request.user,
            image_hash__in=unique_hashes
        )
        
        if photos.count() != len(unique_hashes):
            return Response(
                {"error": "Some photos not found"},
                status=status.HTTP_400_BAD_REQUEST
            )

        # Find all manual stacks that contain any of the selected photos
        # Convert to list immediately to avoid multiple query evaluations with
        # potentially inconsistent ordering
        manual_stacks = list(PhotoStack.objects.filter(
            owner=request.user,
            stack_type=PhotoStack.StackType.MANUAL,
            photos__in=photos
        ).distinct())

        if not manual_stacks:
            return Response(
                {"error": "No manual stacks found containing selected photos"},
                status=status.HTTP_400_BAD_REQUEST
            )

        if len(manual_stacks) == 1:
            # Only one stack found, nothing to merge
            stack = manual_stacks[0]
            return Response({
                "status": "no_merge_needed",
                "stack_id": str(stack.id),
                "photo_count": stack.photos.count(),
                "message": "Only one stack found, nothing to merge",
            })

        # Merge all stacks into the first one
        target_stack = manual_stacks[0]
        stacks_to_merge = manual_stacks[1:]
        
        for stack in stacks_to_merge:
            target_stack.merge_with(stack)

        # Recalculate primary if needed
        if not target_stack.primary_photo:
            target_stack.auto_select_primary()

        logger.info(f"Merged {len(stacks_to_merge)} manual stacks into {target_stack.id}")
        return Response({
            "status": "merged",
            "stack_id": str(target_stack.id),
            "photo_count": target_stack.photos.count(),
            "merged_count": len(stacks_to_merge),
        }, status=status.HTTP_200_OK)


================================================
FILE: api/views/timezone.py
================================================
from rest_framework.response import Response
from rest_framework.views import APIView

from api import date_time_extractor


class TimeZoneView(APIView):
    def get(self, request, format=None):
        return Response(date_time_extractor.ALL_TIME_ZONES_JSON)


================================================
FILE: api/views/upload.py
================================================
import io
import os

from chunked_upload.constants import http_status
from chunked_upload.exceptions import ChunkedUploadError
from chunked_upload.models import ChunkedUpload
from chunked_upload.views import ChunkedUploadCompleteView, ChunkedUploadView
from constance import config as site_config
from django.core.files.base import ContentFile
from django.shortcuts import get_object_or_404
from django.utils.decorators import method_decorator
from django.utils.text import get_valid_filename
from django.views.decorators.csrf import csrf_exempt
from django_q.tasks import Chain
from rest_framework import viewsets
from rest_framework.response import Response
from rest_framework_simplejwt.exceptions import TokenError
from rest_framework_simplejwt.tokens import AccessToken

from api import util
from api.directory_watcher import create_new_image, handle_new_image, is_valid_media
from api.models import Photo, User
from api.models.file import calculate_hash, calculate_hash_b64
from api.models.photo_caption import PhotoCaption


def generate_captions_wrapper(photo, commit=True):
    """Wrapper function to generate captions for use in chain"""
    caption_instance, created = PhotoCaption.objects.get_or_create(photo=photo)
    caption_instance.generate_tag_captions(commit=commit)


class UploadPhotoExists(viewsets.ViewSet):
    def retrieve(self, request, pk):
        try:
            Photo.objects.get(image_hash=pk)
            return Response({"exists": True})
        except Photo.DoesNotExist:
            return Response({"exists": False})
        except Photo.MultipleObjectsReturned:
            # Multiple photos with same hash - photo exists
            return Response({"exists": True})


@method_decorator(csrf_exempt, name="dispatch")
class UploadPhotosChunked(ChunkedUploadView):
    model = ChunkedUpload

    def check_permissions(self, request):
        if not site_config.ALLOW_UPLOAD:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Uploading is not allowed",
            )
        jwt = request.COOKIES.get("jwt")
        if jwt is not None:
            try:
                token = AccessToken(jwt)
            except TokenError:
                raise ChunkedUploadError(
                    status=http_status.HTTP_403_FORBIDDEN,
                    detail="Authentication credentials were invalid",
                )
        else:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Authentication credentials were not provided",
            )
        # To-Do: Check if file is allowed type
        user = User.objects.filter(id=token["user_id"]).first()
        if not user or not user.is_authenticated:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Authentication credentials were not provided",
            )

    def create_chunked_upload(self, save=False, **attrs):
        """Creates new chunked upload instance. Called if no 'upload_id' is
        found in the POST data.
        """
        chunked_upload = self.model(**attrs)
        # file starts empty
        chunked_upload.file.save(name="tmp", content=ContentFile(""), save=save)
        return chunked_upload


@method_decorator(csrf_exempt, name="dispatch")
class UploadPhotosChunkedComplete(ChunkedUploadCompleteView):
    model = ChunkedUpload

    def check_permissions(self, request):
        if not site_config.ALLOW_UPLOAD:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Uploading is not allowed",
            )
        jwt = request.COOKIES.get("jwt")
        if jwt is not None:
            try:
                token = AccessToken(jwt)
            except TokenError:
                raise ChunkedUploadError(
                    status=http_status.HTTP_403_FORBIDDEN,
                    detail="Authentication credentials were invalid",
                )
        else:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Authentication credentials were not provided",
            )
        user = User.objects.filter(id=token["user_id"]).first()
        if not user or not user.is_authenticated:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Authentication credentials were not provided",
            )

    def on_completion(self, uploaded_file, request):
        jwt = request.COOKIES.get("jwt")
        if jwt is not None:
            try:
                token = AccessToken(jwt)
            except TokenError:
                raise ChunkedUploadError(
                    status=http_status.HTTP_403_FORBIDDEN,
                    detail="Authentication credentials were invalid",
                )
        else:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Authentication credentials were not provided",
            )

        user = User.objects.filter(id=token["user_id"]).first()
        if not user or not user.is_authenticated:
            raise ChunkedUploadError(
                status=http_status.HTTP_403_FORBIDDEN,
                detail="Authentication credentials were not provided",
            )

        # Validate that user has a configured scan directory
        if not user.scan_directory or user.scan_directory.strip() == "":
            raise ChunkedUploadError(
                status=http_status.HTTP_400_BAD_REQUEST,
                detail="Upload failed: No scan directory configured. Please contact your administrator to set up a scan directory for your account.",
            )

        # Validate that the scan directory exists
        if not os.path.exists(user.scan_directory):
            raise ChunkedUploadError(
                status=http_status.HTTP_400_BAD_REQUEST,
                detail=f"Upload failed: Scan directory '{user.scan_directory}' does not exist. Please contact your administrator.",
            )

        if not is_valid_media(uploaded_file.file.path, user):
            chunked_upload = get_object_or_404(
                ChunkedUpload, upload_id=request.POST.get("upload_id")
            )
            chunked_upload.delete(delete_file=True)
            raise ChunkedUploadError(
                status=http_status.HTTP_400_BAD_REQUEST,
                detail="File type not allowed",
            )

        # Sanitize file name
        filename = get_valid_filename(request.POST.get("filename"))

        # To-Do: Get origin device
        device = "web"

        if not os.path.exists(os.path.join(user.scan_directory, "uploads")):
            os.mkdir(os.path.join(user.scan_directory, "uploads"))
        if not os.path.exists(os.path.join(user.scan_directory, "uploads", device)):
            os.mkdir(os.path.join(user.scan_directory, "uploads", device))
        photo = uploaded_file
        image_hash = calculate_hash_b64(user, io.BytesIO(photo.read()))
        photo_path = ""

        if not Photo.objects.filter(image_hash=image_hash).exists():
            if not os.path.exists(
                os.path.join(user.scan_directory, "uploads", device, filename)
            ):
                photo_path = os.path.join(
                    user.scan_directory, "uploads", device, filename
                )
            else:
                existing_photo_hash = calculate_hash(
                    user, os.path.join(user.scan_directory, "uploads", device, filename)
                )

                file_name = os.path.splitext(os.path.basename(filename))[0]
                file_name_extension = os.path.splitext(os.path.basename(filename))[1]

                if existing_photo_hash == image_hash:
                    # File already exist, do not copy it in the upload folder
                    util.logger.info(
                        f"Photo {filename} duplicated with hash {image_hash} "
                    )
                else:
                    photo_path = os.path.join(
                        user.scan_directory,
                        "uploads",
                        device,
                        file_name + "_" + image_hash + file_name_extension,
                    )

        else:
            util.logger.info(f"Photo {filename} duplicated with hash {image_hash} ")

        if photo_path:
            with open(photo_path, "wb") as f:
                photo.seek(0)
                f.write(photo.read())

        chunked_upload = get_object_or_404(
            ChunkedUpload, upload_id=request.POST.get("upload_id")
        )
        chunked_upload.delete(delete_file=True)

        if not photo_path:
            return Response(
                {"detail": "Photo duplicated. No new import performed."},
                status=http_status.HTTP_200_OK,
            )

        chain = Chain()
        photo = create_new_image(user, photo_path)
        chain.append(handle_new_image, user, photo_path, image_hash, photo)
        chain.append(generate_captions_wrapper, photo, True)
        chain.append(photo._geolocate)
        chain.append(photo._add_location_to_album_dates)
        chain.append(photo._extract_faces)
        chain.run()


================================================
FILE: api/views/user.py
================================================
from django.conf import settings
from rest_framework import status, viewsets
from rest_framework.permissions import AllowAny, IsAdminUser
from rest_framework.response import Response
from rest_framework.views import APIView

from api.api_util import path_to_dict
from api.date_time_extractor import DEFAULT_RULES_JSON, PREDEFINED_RULES_JSON
from api.burst_detection_rules import (
    DEFAULT_RULES_JSON as BURST_DEFAULT_RULES_JSON,
    PREDEFINED_RULES_JSON as BURST_PREDEFINED_RULES_JSON,
)
from api.models import User
from api.permissions import IsAdminOrFirstTimeSetupOrRegistrationAllowed, IsAdminOrSelf
from api.serializers.user import (
    DeleteUserSerializer,
    ManageUserSerializer,
    PublicUserSerializer,
    SignupUserSerializer,
    UserSerializer,
)
from api.util import is_valid_path, logger


class DefaultRulesView(APIView):
    def get(self, request, format=None):
        res = DEFAULT_RULES_JSON
        return Response(res)


class PredefinedRulesView(APIView):
    def get(self, request, format=None):
        res = PREDEFINED_RULES_JSON
        return Response(res)


class DefaultBurstRulesView(APIView):
    """Get default burst detection rules."""
    def get(self, request, format=None):
        res = BURST_DEFAULT_RULES_JSON
        return Response(res)


class PredefinedBurstRulesView(APIView):
    """Get all predefined burst detection rules (default + optional)."""
    def get(self, request, format=None):
        res = BURST_PREDEFINED_RULES_JSON
        return Response(res)


class RootPathTreeView(APIView):
    permission_classes = (IsAdminUser,)

    def get(self, request, format=None):
        try:
            path = self.request.query_params.get("path")
            base_path = settings.DATA_ROOT

            # Default to root directory if no path is provided
            if not path:
                path = base_path

            # Validate the requested path
            if not is_valid_path(path, base_path):
                return Response(
                    {
                        "message": "Access denied. Path is outside the allowed directory."
                    },
                    status=403,
                )

            res = [path_to_dict(path)]
            return Response(res)
        except Exception as e:
            logger.exception(str(e))
            return Response({"message": str(e)}, status=500)


class IsFirstTimeSetupView(APIView):
    permission_classes = (AllowAny,)

    def get(self, request):
        return Response(
            {"isFirstTimeSetup": not User.objects.filter(is_superuser=True).exists()}
        )


# To-Do: This executes multiple querys per users
class UserViewSet(viewsets.ModelViewSet):
    def get_queryset(self):
        queryset = (
            User.objects.exclude(is_active=False)
            .only(
                "id",
                "username",
                "email",
                "scan_directory",
                "transcode_videos",
                "confidence",
                "confidence_person",
                "semantic_search_topk",
                "first_name",
                "last_name",
                "date_joined",
                "avatar",
                "nextcloud_server_address",
                "nextcloud_username",
                "nextcloud_scan_directory",
                "favorite_min_rating",
                "image_scale",
                "save_metadata_to_disk",
                "datetime_rules",
                "default_timezone",
                "is_superuser",
                "public_sharing",
            )
            .order_by("id")
        )
        if not self.request.user.is_authenticated:
            return queryset.exclude(public_sharing=False)
        return queryset

    def get_serializer_class(self):
        if self.action == "create":
            if self.request.user.is_authenticated and self.request.user.is_superuser:
                return UserSerializer
            return SignupUserSerializer
        if not self.request.user.is_authenticated:
            return PublicUserSerializer
        return UserSerializer

    def get_permissions(self):
        permission_classes = [IsAdminUser]
        if self.action == "create":
            permission_classes = [IsAdminOrFirstTimeSetupOrRegistrationAllowed]
        elif self.action in ["list", "retrieve"]:
            permission_classes = [AllowAny]
        elif self.action in ["update", "partial_update"]:
            permission_classes = [IsAdminOrSelf]
        return [p() for p in permission_classes]


class DeleteUserViewSet(viewsets.ModelViewSet):
    queryset = User.objects.all().order_by("id")
    serializer_class = DeleteUserSerializer
    permission_classes = (IsAdminUser,)

    def destroy(self, request, *args, **kwargs):
        if not request.user.is_superuser:
            return Response(status=status.HTTP_401_UNAUTHORIZED)
        instance = self.get_object()

        if instance.is_superuser:
            return Response(status=status.HTTP_400_BAD_REQUEST)

        return super().destroy(request, *args, **kwargs)


class ManageUserViewSet(viewsets.ModelViewSet):
    queryset = User.objects.all().order_by("id")
    serializer_class = ManageUserSerializer
    permission_classes = (IsAdminUser,)

    def retrieve(self, *args, **kwargs):
        return super().retrieve(*args, **kwargs)

    def list(self, *args, **kwargs):
        return super().list(*args, **kwargs)


================================================
FILE: api/views/views.py
================================================
import os
import subprocess
import uuid
from urllib.parse import quote

import jsonschema
import magic
from constance import config as site_config
from django.conf import settings
from django.db.models import Q, Sum
from django.http import (
    FileResponse,
    HttpResponse,
    HttpResponseForbidden,
    StreamingHttpResponse,
)
from django.utils.decorators import method_decorator
from django.utils.encoding import iri_to_uri
from django.utils import timezone
from django.views.decorators.cache import cache_page
from django.views.decorators.vary import vary_on_cookie
from django_q.tasks import AsyncTask, Chain
from drf_spectacular.utils import extend_schema
from rest_framework import viewsets
from rest_framework.permissions import AllowAny, IsAdminUser, IsAuthenticated
from rest_framework.response import Response
from rest_framework.views import APIView, exception_handler
from rest_framework_simplejwt.exceptions import TokenError
from rest_framework_simplejwt.tokens import AccessToken

from api.all_tasks import create_download_job, delete_zip_file
from api.api_util import get_search_term_examples
from api.autoalbum import delete_missing_photos
from api.directory_watcher import scan_photos
from api.ml_models import do_all_models_exist, download_models
from api.models import AlbumUser, LongRunningJob, Photo, User
from api.schemas.site_settings import site_settings_schema
from api.serializers.album_user import AlbumUserEditSerializer, AlbumUserListSerializer
from api.util import logger
from api.views.pagination import StandardResultsSetPagination


def custom_exception_handler(exc, context):
    # Call REST framework's default exception handler first,
    # to get the standard error response.
    response = exception_handler(exc, context)

    # Update the structure of the response data and enrich auth errors.
    if response is not None:
        customized_response = {"errors": []}

        if isinstance(response.data, dict):
            for key, value in response.data.items():
                error = {"field": key, "message": "".join(str(value))}
                customized_response["errors"].append(error)
        elif isinstance(response.data, list):
            # Handle ValidationError raised with a string (creates a list)
            for item in response.data:
                error = {"field": "non_field_errors", "message": str(item)}
                customized_response["errors"].append(error)

        # Add actionable guidance for unauthenticated/forbidden responses
        if getattr(response, "status_code", None) in (401, 403) and settings.DEBUG:
            customized_response["errors"].append(
                {
                    "field": "auth",
                    "message": (
                        "Authentication required. Obtain a JWT via POST /api/auth/token/obtain/ "
                        'with JSON {"username":"<user>", "password":"<pass>"}. '
                        "Then call APIs with header Authorization: Bearer <access_token> (or use the 'jwt' cookie set by the obtain/refresh endpoints). "
                        "See /api/help and docs at https://docs.librephotos.com/docs/user-guide/api-authentication."
                    ),
                }
            )

        response.data = customized_response

    return response


class AlbumUserEditViewSet(viewsets.ModelViewSet):
    serializer_class = AlbumUserEditSerializer
    pagination_class = StandardResultsSetPagination

    def retrieve(self, *args, **kwargs):
        return super().retrieve(*args, **kwargs)

    def list(self, *args, **kwargs):
        return super().list(*args, **kwargs)

    def get_queryset(self):
        if self.request.user.is_anonymous:
            return AlbumUser.objects.none()
        return AlbumUser.objects.filter(owner=self.request.user).order_by("title")

    def get_permissions(self):
        if self.action in ["list", "retrieve"]:
            self.permission_classes = (IsAuthenticated,)
        else:
            self.permission_classes = (IsAuthenticated,)

        return super().get_permissions()


# API Views
class SiteSettingsView(APIView):
    def get_permissions(self):
        if self.request.method == "GET":
            self.permission_classes = (AllowAny,)
        else:
            self.permission_classes = (IsAdminUser,)

        return super(SiteSettingsView, self).get_permissions()

    def get(self, request, format=None):
        out = {}
        out["allow_registration"] = site_config.ALLOW_REGISTRATION
        out["allow_upload"] = site_config.ALLOW_UPLOAD
        out["skip_patterns"] = site_config.SKIP_PATTERNS
        out["heavyweight_process"] = 0
        out["map_api_provider"] = site_config.MAP_API_PROVIDER
        out["map_api_key"] = site_config.MAP_API_KEY
        out["captioning_model"] = site_config.CAPTIONING_MODEL
        out["llm_model"] = site_config.LLM_MODEL
        out["tagging_model"] = site_config.TAGGING_MODEL
        return Response(out)

    def post(self, request, format=None):
        jsonschema.validate(request.data, site_settings_schema)
        if "allow_registration" in request.data.keys():
            site_config.ALLOW_REGISTRATION = request.data["allow_registration"]
        if "allow_upload" in request.data.keys():
            site_config.ALLOW_UPLOAD = request.data["allow_upload"]
        if "skip_patterns" in request.data.keys():
            site_config.SKIP_PATTERNS = request.data["skip_patterns"]
        if "map_api_provider" in request.data.keys():
            site_config.MAP_API_PROVIDER = request.data["map_api_provider"]
        if "map_api_key" in request.data.keys():
            site_config.MAP_API_KEY = request.data["map_api_key"]
        if "captioning_model" in request.data.keys():
            site_config.CAPTIONING_MODEL = request.data["captioning_model"]
        if "llm_model" in request.data.keys():
            site_config.LLM_MODEL = request.data["llm_model"]
        if "tagging_model" in request.data.keys():
            site_config.TAGGING_MODEL = request.data["tagging_model"]
        if not do_all_models_exist():
            AsyncTask(download_models, User.objects.get(id=request.user.id)).run()

        return self.get(request, format=format)


class SetUserAlbumShared(APIView):
    def post(self, request, format=None):
        data = dict(request.data)
        shared = data["shared"]  # bool
        target_user_id = data["target_user_id"]  # user pk, int
        user_album_id = data["album_id"]

        try:
            target_user = User.objects.get(id=target_user_id)
        except User.DoesNotExist:
            logger.warning(
                f"Cannot share album to user: target user_id {target_user_id} does not exist"
            )
            return Response(
                {"status": False, "message": "No such user"}, status_code=400
            )

        try:
            user_album_to_share = AlbumUser.objects.get(id=user_album_id)
        except AlbumUser.DoesNotExist:
            logger.warning(
                f"Cannot share album to user: source user_album_id {user_album_id} does not exist"
            )
            return Response(
                {"status": False, "message": "No such album"}, status_code=400
            )

        if user_album_to_share.owner != request.user:
            logger.warning(
                f"Cannot share album to user: source user_album_id {user_album_id} does not belong to user_id {request.user.id}"
            )
            return Response(
                {"status": False, "message": "You cannot share an album you don't own"},
                status_code=400,
            )

        if shared:
            user_album_to_share.shared_to.add(target_user)
            logger.info(
                f"Shared user {request.user.id}'s album {user_album_id} to user {target_user_id}"
            )
        else:
            user_album_to_share.shared_to.remove(target_user)
            logger.info(
                f"Unshared user {request.user.id}'s album {user_album_id} to user {target_user_id}"
            )

        user_album_to_share.save()
        return Response(AlbumUserListSerializer(user_album_to_share).data)


# Utility views


class StorageStatsView(APIView):
    def get(self, request, format=None):
        import shutil

        total_storage, used_storage, free_storage = shutil.disk_usage(
            settings.DATA_ROOT
        )
        return Response(
            {
                "total_storage": total_storage,
                "used_storage": used_storage,
                "free_storage": free_storage,
            }
        )


class ApiHelpView(APIView):
    permission_classes = (AllowAny,)

    def get(self, request, format=None):
        base = ""
        try:
            base = request.build_absolute_uri("/").rstrip("/")
        except Exception:
            base = ""

        data = {
            "about": "LibrePhotos API Help",
            "authentication": {
                "default_authentication_classes": [
                    "rest_framework_simplejwt.authentication.JWTAuthentication",
                    "rest_framework.authentication.BasicAuthentication",
                ],
                "jwt": {
                    "obtain": f"{base}/api/auth/token/obtain/",
                    "refresh": f"{base}/api/auth/token/refresh/",
                    "how_to": "POST username and password as JSON to obtain, then send Authorization: Bearer <access_token> or rely on 'jwt' cookie set by obtain/refresh endpoints.",
                },
                "basic": {
                    "how_to": "Send Authorization: Basic base64(username:password).",
                },
            },
            "useful_endpoints": {
                "api_root": f"{base}/",  # browsable API may be disabled when serving frontend
                "help": f"{base}/api/help",
                "photos": f"{base}/api/photos/",
                "search": f"{base}/api/photos/searchlist/",
            },
            "documentation": {
                "api_authentication": "https://docs.librephotos.com/docs/user-guide/api-authentication",
            },
            "examples": {
                "obtain_token_curl": (
                    "curl -X POST \"{base}/api/auth/token/obtain/\" -H 'Content-Type: application/json' "
                    "-d '{"
                    "username"
                    ": "
                    "myuser"
                    ", "
                    "password"
                    ": "
                    "mypassword"
                    "}'"
                ),
                "call_api_with_bearer": (
                    "curl -H 'Authorization: Bearer <access_token>' \"{base}/api/photos/\""
                ),
                "call_api_with_basic": (
                    'curl -u myuser:mypassword "{base}/api/photos/"'
                ),
            },
        }

        # Add schema links in DEBUG mode if available
        try:
            if settings.DEBUG:
                data.setdefault("useful_endpoints", {}).update(
                    {
                        "openapi_schema": f"{base}/api/schema",
                        "swagger_ui": f"{base}/api/swagger",
                        "redoc": f"{base}/api/redoc",
                    }
                )
        except Exception:
            pass

        return Response(data)


class ImageTagView(APIView):
    @method_decorator(cache_page(60 * 60 * 2))
    def get(self, request, format=None):
        # Add an exception for the directory '/code'
        subprocess.run(
            ["git", "config", "--global", "--add", "safe.directory", "/code"],
            check=False,
        )

        # Get the current commit hash
        git_hash = (
            subprocess.check_output(["git", "rev-parse", "--short", "HEAD"])
            .strip()
            .decode("utf-8")
        )
        return Response(
            {"image_tag": os.environ.get("IMAGE_TAG", ""), "git_hash": git_hash}
        )


class SearchTermExamples(APIView):
    @method_decorator(vary_on_cookie)
    @method_decorator(cache_page(60 * 60 * 2))
    def get(self, request, format=None):
        search_term_examples = get_search_term_examples(request.user)
        return Response({"results": search_term_examples})


# long running jobs
class ScanPhotosView(APIView):
    def post(self, request, format=None):
        return self._scan_photos(request)

    @extend_schema(
        deprecated=True,
        description="Use POST method instead",
    )
    def get(self, request, format=None):
        return self._scan_photos(request)

    def _scan_photos(self, request):
        # Validate that user has a configured scan directory
        if not request.user.scan_directory or request.user.scan_directory.strip() == "":
            return Response(
                {
                    "status": False,
                    "message": "Scan failed: No scan directory configured. Please contact your administrator to set up a scan directory for your account.",
                },
                status=400,
            )

        # Validate that the scan directory exists
        if not os.path.exists(request.user.scan_directory):
            return Response(
                {
                    "status": False,
                    "message": f"Scan failed: Scan directory '{request.user.scan_directory}' does not exist. Please contact your administrator.",
                },
                status=400,
            )

        chain = Chain()
        if not do_all_models_exist():
            chain.append(download_models, request.user)
        try:
            job_id = uuid.uuid4()
            chain.append(
                scan_photos, request.user, False, job_id, request.user.scan_directory
            )
            chain.run()
            return Response({"status": True, "job_id": job_id})
        except BaseException:
            logger.exception("An Error occurred")
            return Response({"status": False})


# To-Do: Allow for custom paths
class SelectiveScanPhotosView(APIView):
    def get(self, request, format=None):
        # Validate that user has a configured scan directory
        if not request.user.scan_directory or request.user.scan_directory.strip() == "":
            return Response(
                {
                    "status": False,
                    "message": "Scan failed: No scan directory configured. Please contact your administrator to set up a scan directory for your account.",
                },
                status=400,
            )

        # Validate that the scan directory exists
        if not os.path.exists(request.user.scan_directory):
            return Response(
                {
                    "status": False,
                    "message": f"Scan failed: Scan directory '{request.user.scan_directory}' does not exist. Please contact your administrator.",
                },
                status=400,
            )

        chain = Chain()
        if not do_all_models_exist():
            chain.append(download_models, request.user)
        # To-Do: Sanatize the scan_directory
        try:
            job_id = uuid.uuid4()
            chain.append(
                scan_photos,
                request.user,
                False,
                job_id,
                os.path.join(request.user.scan_directory, "uploads", "web"),
            )
            chain.run()
            return Response({"status": True, "job_id": job_id})
        except BaseException:
            logger.exception("An Error occurred")
            return Response({"status": False})


class FullScanPhotosView(APIView):
    def post(self, request, format=None):
        return self._scan_photos(request)

    @extend_schema(
        deprecated=True,
        description="Use POST method instead",
    )
    def get(self, request, format=None):
        return self._scan_photos(request)

    def _scan_photos(self, request):
        chain = Chain()
        if not do_all_models_exist():
            chain.append(download_models, request.user)
        try:
            job_id = uuid.uuid4()
            chain.append(
                scan_photos, request.user, True, job_id, request.user.scan_directory
            )
            chain.run()
            return Response({"status": True, "job_id": job_id})
        except BaseException:
            logger.exception("An Error occurred")
            return Response({"status": False})


class DeleteMissingPhotosView(APIView):
    def post(self, request, format=None):
        return self._delete_missing_photos(request, format)

    @extend_schema(
        deprecated=True,
        description="Use POST method instead",
    )
    def get(self, request, format=None):
        return self._delete_missing_photos(request, format)

    def _delete_missing_photos(self, request, format=None):
        try:
            job_id = uuid.uuid4()
            delete_missing_photos(request.user, job_id)
            return Response({"status": True, "job_id": job_id})
        except BaseException:
            logger.exception("An Error occurred")
            return Response({"status": False})


class MediaAccessView(APIView):
    permission_classes = (AllowAny,)

    def _get_protected_media_url(self, path, fname):
        return f"protected_media/{path}/{fname}"

    # @silk_profile(name='media')
    def get(self, request, path, fname, format=None):
        jwt = request.COOKIES.get("jwt")
        image_hash = fname.split(".")[0].split("_")[0]
        try:
            photo = Photo.objects.get(image_hash=image_hash)
        except Photo.DoesNotExist:
            return HttpResponse(status=404)
        except Photo.MultipleObjectsReturned:
            # Multiple photos with same hash - find one that matches permissions
            photos = Photo.objects.filter(image_hash=image_hash)
            photo = None
            # First try to find one that's public or in a public album
            for p in photos:
                if p.public or p.albumuser_set.filter(public=True).exists():
                    photo = p
                    break
            # If none found, we'll check user permissions below
            if photo is None:
                photo = photos.first()

        # grant access if the requested photo is public or part of any public user album
        if photo.public or photo.albumuser_set.filter(public=True).exists():
            response = HttpResponse()
            response["Content-Type"] = "image/jpeg"
            response["X-Accel-Redirect"] = self._get_protected_media_url(path, fname)
            return response

        # forbid access if trouble with jwt
        if jwt is not None:
            try:
                token = AccessToken(jwt)
            except TokenError:
                return HttpResponseForbidden()
        else:
            return HttpResponseForbidden()

        # grant access if the user is owner of the requested photo,
        # the photo is shared with the user, or the photo belongs to a public user album
        image_hash = fname.split(".")[0].split("_")[0]  # janky alert
        user = User.objects.filter(id=token["user_id"]).only("id").first()
        if photo.owner == user or user in photo.shared_to.all():
            response = HttpResponse()
            response["Content-Type"] = "image/jpeg"
            response["X-Accel-Redirect"] = self._get_protected_media_url(path, fname)
            return response
        else:
            for album in photo.albumuser_set.only("shared_to", "public"):
                if album.public or user in album.shared_to.all():
                    response = HttpResponse()
                    response["Content-Type"] = "image/jpeg"
                    response["X-Accel-Redirect"] = self._get_protected_media_url(
                        path, fname
                    )
                    return response
        return HttpResponse(status=404)


class VideoTranscoder:
    process = ""

    def __init__(self, path):
        ffmpeg_command = [
            "ffmpeg",
            "-i",
            path,
            "-vcodec",
            "libx264",
            "-preset",
            "ultrafast",
            "-movflags",
            "frag_keyframe+empty_moov",
            "-filter:v",
            ("scale=-2:" + str(720)),
            "-f",
            "mp4",
            "-",
        ]
        self.process = subprocess.Popen(
            ffmpeg_command,
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE,
        )

    def __del__(self):
        self.process.kill()


def gen(transcoder):
    yield from iter(transcoder.process.stdout.readline, b"")


class UnifiedMediaAccessView(APIView):
    """
    Unified media access endpoint supporting both proxy and no-proxy setups,
    and handling public album media access.
    """

    permission_classes = (AllowAny,)

    def _should_use_proxy(self):
        return not getattr(settings, "SERVE_FRONTEND", False)

    def _protected_media_url(self, path, fname):
        path = path.lstrip("/")
        return f"/protected_media/{path}/{fname}"

    def _serve_file_direct(self, file_path, content_type=None):
        if not os.path.exists(file_path):
            return HttpResponse(status=404)
        try:
            response = FileResponse(open(file_path, "rb"))
            if content_type:
                response["Content-Type"] = content_type
            else:
                try:
                    mime = magic.Magic(mime=True)
                    response["Content-Type"] = mime.from_file(file_path)
                except Exception:
                    response["Content-Type"] = "application/octet-stream"
            return response
        except (FileNotFoundError, PermissionError):
            return HttpResponse(status=404)
        except Exception:
            return HttpResponse(status=500)

    def _generate_response_proxy(self, photo, path, fname, transcode_videos):
        if "thumbnail" in path:
            response = HttpResponse()

            # thumbnails_big is always .webp (static image), even for videos
            if "thumbnails_big" in path:
                response["Content-Type"] = "image/webp"
                response["X-Accel-Redirect"] = self._protected_media_url(
                    path, fname + ".webp"
                )
                return response

            # For square_thumbnails, use the actual extension from the model
            ext = (
                os.path.splitext(getattr(photo.thumbnail, "square_thumbnail").path)[1]
                if hasattr(photo, "thumbnail")
                else ""
            )
            if "jpg" in ext:
                response["Content-Type"] = "image/jpg"
                response["X-Accel-Redirect"] = getattr(
                    photo.thumbnail, "thumbnail_big", photo.thumbnail.square_thumbnail
                ).path
            if "webp" in ext:
                response["Content-Type"] = "image/webp"
                response["X-Accel-Redirect"] = self._protected_media_url(
                    path, fname + ".webp"
                )
            if "mp4" in ext:
                response["Content-Type"] = "video/mp4"
                response["X-Accel-Redirect"] = self._protected_media_url(
                    path, fname + ".mp4"
                )
            return response

        if "faces" in path:
            response = HttpResponse()
            response["Content-Type"] = "image/jpg"
            response["X-Accel-Redirect"] = self._protected_media_url(path, fname)
            return response

        if photo.video:
            mime = magic.Magic(mime=True)
            filename = mime.from_file(photo.main_file.path)
            if transcode_videos:
                response = StreamingHttpResponse(
                    gen(VideoTranscoder(photo.main_file.path)),
                    content_type="video/mp4",
                )
                return response
            response = HttpResponse()
            response["Content-Type"] = filename
            response["X-Accel-Redirect"] = iri_to_uri(
                photo.main_file.path.replace(settings.DATA_ROOT, "/original")
            )
            return response

        response = HttpResponse()
        response["Content-Type"] = "image/jpg"
        response["X-Accel-Redirect"] = self._protected_media_url(path, fname)
        return response

    def _generate_response_direct(self, photo, path, fname, transcode_videos):
        if "thumbnail" in path:
            file_path = os.path.join(settings.MEDIA_ROOT, path, fname)
            if not os.path.exists(file_path):
                if not fname.endswith(".webp"):
                    webp = os.path.join(settings.MEDIA_ROOT, path, fname + ".webp")
                    if os.path.exists(webp):
                        return self._serve_file_direct(webp, "image/webp")
                if not fname.endswith(".mp4"):
                    mp4 = os.path.join(settings.MEDIA_ROOT, path, fname + ".mp4")
                    if os.path.exists(mp4):
                        return self._serve_file_direct(mp4, "video/mp4")
            if hasattr(photo, "thumbnail"):
                ext = os.path.splitext(photo.thumbnail.square_thumbnail.path)[1]
                if "jpg" in ext:
                    return self._serve_file_direct(
                        photo.thumbnail.thumbnail_big.path, "image/jpg"
                    )
            return self._serve_file_direct(file_path)

        if "faces" in path:
            file_path = os.path.join(settings.MEDIA_ROOT, path, fname)
            return self._serve_file_direct(file_path, "image/jpg")

        if photo.video:
            return self._serve_file_direct(photo.main_file.path)

        file_path = os.path.join(settings.MEDIA_ROOT, path, fname)
        return self._serve_file_direct(file_path, "image/jpg")

    def _public_album_active_q(self):
        return Q(share__enabled=True) & (
            Q(share__expires_at__isnull=True) | Q(share__expires_at__gte=timezone.now())
        )

    def get(self, request, path, fname, album_id=None, format=None):
        use_proxy = self._should_use_proxy()

        # ZIP files
        if path.lower() == "zip":
            jwt = request.COOKIES.get("jwt")
            if jwt is not None:
                try:
                    token = AccessToken(jwt)
                except TokenError:
                    return HttpResponseForbidden()
            else:
                return HttpResponseForbidden()
            try:
                filename = fname + str(token["user_id"]) + ".zip"
                if use_proxy:
                    response = HttpResponse()
                    response["Content-Type"] = "application/x-zip-compressed"
                    response["X-Accel-Redirect"] = self._protected_media_url(
                        path, filename
                    )
                    return response
                file_path = os.path.join(settings.MEDIA_ROOT, path, filename)
                return self._serve_file_direct(
                    file_path, "application/x-zip-compressed"
                )
            except Exception:
                return HttpResponseForbidden()

        # Avatars
        if path.lower() == "avatars":
            jwt = request.COOKIES.get("jwt")
            if jwt is not None:
                try:
                    token = AccessToken(jwt)
                except TokenError:
                    return HttpResponseForbidden()
            else:
                return HttpResponseForbidden()
            try:
                _ = User.objects.filter(id=token["user_id"]).only("id").first()
                if use_proxy:
                    response = HttpResponse()
                    response["Content-Type"] = "image/png"
                    response["X-Accel-Redirect"] = self._protected_media_url(
                        path, fname
                    )
                    return response
                file_path = os.path.join(settings.MEDIA_ROOT, path, fname)
                return self._serve_file_direct(file_path, "image/png")
            except Exception:
                return HttpResponse(status=404)

        # Embedded media
        if path.lower() == "embedded_media":
            jwt = request.COOKIES.get("jwt")
            query = Q(public=True)
            if request.user.is_authenticated:
                query = Q(owner=request.user)
            if jwt is not None:  # pragma: no cover
                try:
                    token = AccessToken(jwt)
                    user = User.objects.filter(id=token["user_id"]).only("id").first()
                    query = Q(owner=user)
                except TokenError:
                    pass
            try:
                # Check if fname is UUID format (36 chars with 4 hyphens) or image_hash
                is_uuid_format = len(fname) == 36 and fname.count("-") == 4
                if is_uuid_format:
                    photo = Photo.objects.filter(query, pk=fname).first()
                else:
                    photo = Photo.objects.filter(query, image_hash=fname).first()
                if not photo or photo.main_file.embedded_media.count() < 1:
                    raise Photo.DoesNotExist()
            except Photo.DoesNotExist:
                return HttpResponse(status=404)
            if use_proxy:
                response = HttpResponse()
                response["Content-Type"] = "video/mp4"
                response["X-Accel-Redirect"] = self._protected_media_url(
                    path, fname + "_1.mp4"
                )
                return response
            file_path = os.path.join(settings.MEDIA_ROOT, path, fname + "_1.mp4")
            return self._serve_file_direct(file_path, "video/mp4")

        # Determine photo by hash
        image_hash = fname.split(".")[0].split("_")[0]

        # Public album access
        if album_id is not None:
            album = (
                AlbumUser.objects.filter(id=album_id)
                .filter(self._public_album_active_q())
                .first()
            )
            if album is None:
                return HttpResponse(status=404)
            try:
                photo = album.photos.only(
                    "image_hash", "video", "main_file", "thumbnail"
                ).get(image_hash=image_hash)
            except Photo.DoesNotExist:
                return HttpResponse(status=404)

            if "thumbnail" in path or "thumbnails" in path or "faces" in path:
                if use_proxy:
                    return self._generate_response_proxy(photo, path, fname, False)
                return self._generate_response_direct(photo, path, fname, False)

            if use_proxy:
                response = HttpResponse()
                try:
                    mime = magic.Magic(mime=True)
                    filename = mime.from_file(photo.main_file.path)
                except Exception:
                    filename = "application/octet-stream"
                response["Content-Type"] = filename if photo.video else "image/webp"
                if photo.main_file.path.startswith(settings.PHOTOS):
                    internal_path = (
                        "/original" + photo.main_file.path[len(settings.PHOTOS) :]
                    )
                else:
                    internal_path = photo.main_file.path
                response["X-Accel-Redirect"] = iri_to_uri(internal_path)
                return response
            try:
                mime = magic.Magic(mime=True)
                content_type = mime.from_file(photo.main_file.path)
            except Exception:
                content_type = "application/octet-stream"
            return self._serve_file_direct(
                photo.main_file.path, content_type if photo.video else "image/webp"
            )

        # Non-photos (thumbnails, faces, etc.)
        if path.lower() != "photos":
            # Try UUID lookup first (for new-style requests after migration 0099),
            # then fall back to image_hash lookup (for legacy/backward compatibility)
            is_uuid_format = len(image_hash) == 36 and image_hash.count("-") == 4
            try:
                if is_uuid_format:
                    photo = Photo.objects.get(pk=image_hash)
                else:
                    photo = Photo.objects.get(image_hash=image_hash)
            except Photo.DoesNotExist:
                return HttpResponse(status=404)
            except Photo.MultipleObjectsReturned:
                # Multiple photos with same hash - find one that matches permissions
                photos = Photo.objects.filter(image_hash=image_hash)
                photo = None
                # First try to find one in a public album
                for p in photos:
                    if p.albumuser_set.filter(self._public_album_active_q()).exists():
                        photo = p
                        break
                # If none found, we'll check user permissions below
                if photo is None:
                    photo = photos.first()

            if photo.albumuser_set.filter(self._public_album_active_q()).exists():
                if use_proxy:
                    return self._generate_response_proxy(photo, path, fname, False)
                return self._generate_response_direct(photo, path, fname, False)

            jwt = request.COOKIES.get("jwt")
            if jwt is not None:
                try:
                    token = AccessToken(jwt)
                except TokenError:
                    return HttpResponseForbidden()
            else:
                return HttpResponseForbidden()

            user = (
                User.objects.filter(id=token["user_id"])
                .only("id", "transcode_videos")
                .first()
            )
            if photo.owner == user or user in photo.shared_to.all():
                if use_proxy:
                    return self._generate_response_proxy(
                        photo, path, fname, user.transcode_videos
                    )
                return self._generate_response_direct(
                    photo, path, fname, user.transcode_videos
                )
            else:
                for album in photo.albumuser_set.only("shared_to", "public"):
                    if getattr(album, "public", False) or user in album.shared_to.all():
                        if use_proxy:
                            return self._generate_response_proxy(
                                photo, path, fname, user.transcode_videos
                            )
                        return self._generate_response_direct(
                            photo, path, fname, user.transcode_videos
                        )
            return HttpResponse(status=404)

        # Original photos (path == photos)
        try:
            photo = Photo.objects.get(image_hash=image_hash)
        except Photo.DoesNotExist:
            return HttpResponse(status=404)
        except Photo.MultipleObjectsReturned:
            # Multiple photos with same hash - find one that matches permissions
            photos = Photo.objects.filter(image_hash=image_hash)
            photo = None
            # First try to find one in a public album
            for p in photos:
                if p.albumuser_set.filter(self._public_album_active_q()).exists():
                    photo = p
                    break
            # If none found, we'll check user permissions below
            if photo is None:
                photo = photos.first()

        if photo.albumuser_set.filter(self._public_album_active_q()).exists():
            if use_proxy:
                try:
                    mime = magic.Magic(mime=True)
                    filename = mime.from_file(photo.main_file.path)
                except Exception:
                    filename = "application/octet-stream"
                response = HttpResponse()
                response["Content-Type"] = filename if photo.video else "image/webp"
                if photo.main_file.path.startswith("/nextcloud_media/"):
                    internal_path = "/nextcloud_original" + photo.main_file.path[21:]
                elif photo.main_file.path.startswith(settings.PHOTOS):
                    internal_path = (
                        "/original" + photo.main_file.path[len(settings.PHOTOS) :]
                    )
                else:
                    internal_path = quote(photo.main_file.path)
                response["X-Accel-Redirect"] = iri_to_uri(internal_path)
                return response
            try:
                mime = magic.Magic(mime=True)
                content_type = mime.from_file(photo.main_file.path)
            except Exception:
                content_type = "application/octet-stream"
            return self._serve_file_direct(photo.main_file.path, content_type)

        jwt = request.COOKIES.get("jwt")
        if jwt is not None:
            try:
                token = AccessToken(jwt)
            except TokenError:
                return HttpResponseForbidden()
        else:
            return HttpResponseForbidden()

        user = User.objects.filter(id=token["user_id"]).only("id").first()
        if photo.owner == user or user in photo.shared_to.all():
            if use_proxy:
                response = HttpResponse()
                try:
                    mime = magic.Magic(mime=True)
                    filename = mime.from_file(photo.main_file.path)
                except Exception:
                    filename = "application/octet-stream"
                response["Content-Type"] = filename if photo.video else "image/webp"
                if photo.main_file.path.startswith("/nextcloud_media/"):
                    internal_path = "/nextcloud_original" + photo.main_file.path[21:]
                elif photo.main_file.path.startswith(settings.PHOTOS):
                    internal_path = (
                        "/original" + photo.main_file.path[len(settings.PHOTOS) :]
                    )
                else:
                    internal_path = quote(photo.main_file.path)
                response["Content-Disposition"] = 'inline; filename="{}"'.format(
                    photo.main_file.path.split("/")[-1]
                )
                response["X-Accel-Redirect"] = iri_to_uri(internal_path)
                return response
            return self._serve_file_direct(photo.main_file.path)
        else:
            for album in photo.albumuser_set.only("shared_to", "public"):
                if getattr(album, "public", False) or user in album.shared_to.all():
                    if use_proxy:
                        response = HttpResponse()
                        try:
                            mime = magic.Magic(mime=True)
                            filename = mime.from_file(photo.main_file.path)
                        except Exception:
                            filename = "application/octet-stream"
                        response["Content-Type"] = (
                            filename if photo.video else "image/webp"
                        )
                        if photo.main_file.path.startswith("/nextcloud_media/"):
                            internal_path = (
                                "/nextcloud_original" + photo.main_file.path[21:]
                            )
                        elif photo.main_file.path.startswith(settings.PHOTOS):
                            internal_path = (
                                "/original"
                                + photo.main_file.path[len(settings.PHOTOS) :]
                            )
                        else:
                            internal_path = quote(photo.main_file.path)
                        response["X-Accel-Redirect"] = iri_to_uri(internal_path)
                        return response
                    return self._serve_file_direct(photo.main_file.path)
        return HttpResponse(status=404)


class ZipListPhotosView_V2(APIView):
    def post(self, request):
        import shutil

        free_storage = shutil.disk_usage("/").free
        data = request.data
        image_hashes = data.get("image_hashes")
        if not image_hashes:
            return Response(data={"error": "image_hashes required"}, status=400)

        # DRF may provide list values (QueryDict) or a single string
        if isinstance(image_hashes, str):
            image_hashes = [image_hashes]
        elif isinstance(image_hashes, (list, tuple)):
            # QueryDict -> dict() would produce list values, request.data keeps list too
            pass
        else:
            image_hashes = list(image_hashes)

        include_stacked = data.get("include_stacked_photos", False)
        if isinstance(include_stacked, (list, tuple)):
            include_stacked = include_stacked[0] if include_stacked else False
        if isinstance(include_stacked, str):
            include_stacked = include_stacked.strip().lower() in ("1", "true", "yes", "on")
        include_stacked = bool(include_stacked)

        photo_query = Photo.objects.filter(owner=self.request.user)
        # Filter photos based on image hashes
        photos = photo_query.filter(image_hash__in=image_hashes)
        if not photos.exists():
            return Response(data={"error": "No photos found"}, status=404)

        # Optionally expand to include all photos from the same stacks
        if include_stacked:
            stack_ids = (
                photos.exclude(stacks__isnull=True)
                .values_list("stacks__id", flat=True)
                .distinct()
            )
            if stack_ids:
                stacked_photos = photo_query.filter(stacks__id__in=stack_ids)
                photos = (photos | stacked_photos).distinct()

        # Calculate the total file size using aggregate
        total_file_size = photos.aggregate(Sum("size"))["size__sum"] or 0
        if free_storage < total_file_size:
            return Response(data={"status": "Insufficient Storage"}, status=507)
        file_uuid = uuid.uuid4()
        filename = str(str(file_uuid) + str(self.request.user.id) + ".zip")

        job_id = create_download_job(
            LongRunningJob.JOB_DOWNLOAD_PHOTOS,
            user=self.request.user,
            photos=list(photos),
            filename=filename,
        )
        response = {"job_id": job_id, "url": file_uuid}

        return Response(data=response, status=200)

    def get(self, request):
        job_id = request.GET["job_id"]
        print(job_id)
        if job_id is None:
            return Response(status=404)
        try:
            job = LongRunningJob.objects.get(job_id=job_id)
            if job.finished:
                return Response(data={"status": "SUCCESS"}, status=200)
            elif job.failed:
                return Response(
                    data={"status": "FAILURE", "result": job.result}, status=500
                )
            else:
                return Response(
                    data={"status": "PENDING", "progress": job.result}, status=202
                )
        except BaseException as e:
            logger.error(str(e))
            return Response(status=404)


class DeleteZipView(APIView):
    def delete(self, request, fname):
        jwt = request.COOKIES.get("jwt")
        if jwt is not None:
            try:
                token = AccessToken(jwt)
            except TokenError:
                return HttpResponseForbidden()
        else:
            return HttpResponseForbidden()
        filename = fname + str(token["user_id"]) + ".zip"
        try:
            delete_zip_file(filename)
            return Response(status=200)
        except BaseException as e:
            logger.error(str(e))
            return Response(status=404)


================================================
FILE: image_similarity/__init__.py
================================================


================================================
FILE: image_similarity/main.py
================================================
import json

from flask import Flask, jsonify, request
from flask_restful import Api, Resource
from gevent.pywsgi import WSGIServer
from retrieval_index import RetrievalIndex
from utils import logger

app = Flask(__name__)
api = Api(app)

index = RetrievalIndex()


class BuildIndex(Resource):
    def post(self):
        request_body = json.loads(request.data)

        user_id = request_body["user_id"]
        image_hashes = request_body["image_hashes"]
        image_embeddings = request_body["image_embeddings"]

        index.build_index_for_user(user_id, image_hashes, image_embeddings)

        # Return 0 if no index was created, otherwise return the actual size
        index_size = index.indices[user_id].ntotal if user_id in index.indices else 0
        return jsonify({"status": True, "index_size": index_size})

    def delete(self):
        user_id = json.loads(request.data)["user_id"]
        if user_id not in index.indices:
            return jsonify({"status": True})
        del index.indices[user_id]
        del index.image_hashes[user_id]
        return jsonify({"status": True})


class SearchIndex(Resource):
    def post(self):
        try:
            request_body = json.loads(request.data)

            user_id = request_body["user_id"]
            image_embedding = request_body["image_embedding"]
            if "n" in request_body.keys():
                n = int(request_body["n"])
            else:
                n = 100

            if "threshold" in request_body.keys():
                thres = float(request_body["threshold"])
            else:
                thres = 27.0

            res = index.search_similar(user_id, image_embedding, n, thres)

            return jsonify({"status": True, "result": res})
        except BaseException as e:
            logger.error(str(e))
            return jsonify({"status": False, "result": []}), 500


class Health(Resource):
    def get(self):
        return jsonify({"status": True})


api.add_resource(BuildIndex, "/build/")
api.add_resource(SearchIndex, "/search/")
api.add_resource(Health, "/health/")


def start_server():
    logger.info("Starting server")
    server = WSGIServer(("0.0.0.0", 8002), app)
    server.serve_forever()


if __name__ == "__main__":
    start_server()


================================================
FILE: image_similarity/retrieval_index.py
================================================
import datetime

import faiss
import numpy as np
from utils import logger

embedding_size = 512


class RetrievalIndex:
    def __init__(self):
        self.indices = {}
        self.image_hashes = {}

    def build_index_for_user(self, user_id, image_hashes, image_embeddings):
        logger.info(
            f"building index for user {user_id} - got {len(image_hashes)} photos to process"
        )
        start = datetime.datetime.now()

        # Check if we have any embeddings to process
        if not image_embeddings or len(image_embeddings) == 0:
            logger.warning(f"No embeddings provided for user {user_id}")
            return

        # Initialize or get existing index and hashes
        if not self.indices.get(user_id):
            self.indices[user_id] = faiss.IndexFlatIP(embedding_size)
        if not self.image_hashes.get(user_id):
            self.image_hashes[user_id] = []

        # Convert embeddings to numpy array and ensure correct shape
        # FAISS expects shape (n_vectors, embedding_size)
        embeddings_array = np.array(image_embeddings, dtype=np.float32)

        # Handle empty or invalid arrays
        if embeddings_array.size == 0:
            logger.warning(f"Empty embeddings array for user {user_id}")
            return

        if len(embeddings_array.shape) == 1:
            # If we got a single vector, reshape it to (1, embedding_size)
            embeddings_array = embeddings_array.reshape(1, -1)
        elif len(embeddings_array.shape) == 2:
            # If we got multiple vectors, ensure the second dimension is embedding_size
            if embeddings_array.shape[1] != embedding_size:
                logger.error(
                    f"Expected embedding size {embedding_size}, got {embeddings_array.shape[1]}"
                )
                return
        else:
            logger.error(f"Unexpected embedding shape: {embeddings_array.shape}")
            return

        try:
            self.indices[user_id].add(embeddings_array)
            # Add hashes to the list
            self.image_hashes[user_id].extend(image_hashes)
        except Exception as e:
            logger.error(
                f"Error adding embeddings to index for user {user_id}: {str(e)}"
            )
            return

        elapsed = (datetime.datetime.now() - start).total_seconds()
        logger.info(
            "finished building index for user %d - took %.2f seconds"
            % (user_id, elapsed)
        )

    def search_similar(self, user_id, in_embedding, n=100, thres=27.0):
        start = datetime.datetime.now()
        dist, res_indices = self.indices[user_id].search(
            np.array([in_embedding], dtype=np.float32), n
        )
        res = []
        for distance, idx in sorted(zip(dist[0], res_indices[0]), reverse=True):
            if distance >= thres:
                res.append(self.image_hashes[user_id][idx])
        elapsed = (datetime.datetime.now() - start).total_seconds()
        logger.info(
            "searched for %d images for user %d - took %.2f seconds"
            % (n, user_id, elapsed)
        )
        return res


================================================
FILE: image_similarity/utils.py
================================================
import logging
import logging.handlers
import os
import os.path

BASE_LOGS = os.environ.get("BASE_LOGS", "/logs/")

logger = logging.getLogger("image_similarity")
formatter = logging.Formatter(
    "%(asctime)s : %(filename)s : %(funcName)s : %(lineno)s : %(levelname)s : %(message)s"
)
fileMaxByte = 256 * 1024 * 200  # 100MB

fileHandler = logging.handlers.RotatingFileHandler(
    os.path.join(BASE_LOGS, "image_similarity.log"),
    maxBytes=fileMaxByte,
    backupCount=10,
)

fileHandler.setFormatter(formatter)
logger.addHandler(fileHandler)
logger.setLevel(logging.INFO)


================================================
FILE: librephotos/__init__.py
================================================


================================================
FILE: librephotos/settings/__init__.py
================================================


================================================
FILE: librephotos/settings/development.py
================================================
from .production import *  # noqa

DEBUG = True
MIDDLEWARE += ["silk.middleware.SilkyMiddleware"]  # noqa
INSTALLED_APPS += ["silk"]  # noqa
INSTALLED_APPS += ["drf_spectacular"]
SPECTACULAR_SETTINGS = {
    "TITLE": "LibrePhotos",
    "DESCRIPTION": "Your project description",
    "VERSION": "1.0.0",
}


================================================
FILE: librephotos/settings/production.py
================================================
import datetime
import os

BASE_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
BASE_LOGS = os.environ.get("BASE_LOGS", "/logs/")
BASE_DATA = os.environ.get("BASE_DATA", "/")
PHOTOS = os.environ.get("PHOTOS", os.path.join(BASE_DATA, "data"))
STATIC_URL = "api/static/"
MEDIA_URL = "/media/"
MEDIA_ROOT = os.path.join(BASE_DATA, "protected_media")
STATIC_ROOT = os.path.join(BASE_DIR, "static")
DATA_ROOT = PHOTOS
IM2TXT_ROOT = os.path.join(MEDIA_ROOT, "data_models", "im2txt")

BLIP_ROOT = os.path.join(MEDIA_ROOT, "data_models", "blip")
PLACES365_ROOT = os.path.join(MEDIA_ROOT, "data_models", "places365", "model")
CLIP_ROOT = os.path.join(MEDIA_ROOT, "data_models", "clip-embeddings")
LOGS_ROOT = BASE_LOGS
DEMO_SITE = os.environ.get("DEMO_SITE", "False") != "False"

WSGI_APPLICATION = "librephotos.wsgi.application"
AUTH_USER_MODEL = "api.User"
ROOT_URLCONF = "librephotos.urls"
DEFAULT_AUTO_FIELD = "django.db.models.AutoField"
DEBUG = False

SECRET_KEY_FILENAME = os.path.join(BASE_LOGS, "secret.key")
SECRET_KEY = ""

# analyze files to detect embedded media (e.g. in motion photos)
FEATURE_PROCESS_EMBEDDED_MEDIA = (
    os.getenv("FEATURE_PROCESS_EMBEDDED_MEDIA", "True") == "True"
)

if os.environ.get("SECRET_KEY"):
    SECRET_KEY = os.environ["SECRET_KEY"]
    print("use SECRET_KEY from env")

if not SECRET_KEY and os.path.exists(SECRET_KEY_FILENAME):
    with open(SECRET_KEY_FILENAME) as f:
        SECRET_KEY = f.read().strip()
        print("use SECRET_KEY from file")

if not SECRET_KEY:
    from django.core.management.utils import get_random_secret_key

    with open(SECRET_KEY_FILENAME, "w") as f:
        f.write(get_random_secret_key())
        print("generate SECRET_KEY and save to file")
    with open(SECRET_KEY_FILENAME) as f:
        SECRET_KEY = f.read().strip()
        print("use SECRET_KEY from file")

ALLOWED_HOSTS = ["localhost", os.environ.get("BACKEND_HOST", "backend")]

SIMPLE_JWT = {
    "ACCESS_TOKEN_LIFETIME": datetime.timedelta(minutes=5),
    "REFRESH_TOKEN_LIFETIME": datetime.timedelta(
        days=int(os.environ.get("REFRESH_TOKEN_DAYS", "7"))
    ),
}

INSTALLED_APPS = [
    "django.contrib.admin",
    "django.contrib.auth",
    "django.contrib.contenttypes",
    "django.contrib.sessions",
    "django.contrib.messages",
    "django.contrib.staticfiles",
    "django.contrib.postgres",
    "api",
    "nextcloud",
    "rest_framework",
    "rest_framework_simplejwt.token_blacklist",
    "corsheaders",
    "chunked_upload",
    "django_extensions",
    "constance",
    "constance.backends.database",
    "django_q",
]

Q_CLUSTER = {
    "name": "DjangORM",
    "queue_limit": 50,
    "recycle": 50,
    "timeout": 10000000,
    "retry": 20000000,
    "orm": "default",
    "max_rss": 300000,
    "poll": 1,
}

CONSTANCE_BACKEND = "constance.backends.database.DatabaseBackend"
CONSTANCE_ADDITIONAL_FIELDS = {
    "map_api_provider": [
        "django.forms.fields.ChoiceField",
        {
            "widget": "django.forms.Select",
            "choices": (
                ("mapbox", "Mapbox"),
                ("maptiler", "MapTiler"),
                ("nominatim", "Nominatim (OpenStreetMap)"),
                ("opencage", "OpenCage"),
                ("photon", "Photon"),
                ("tomtom", "TomTom"),
            ),
        },
    ],
    "captioning_model": [
        "django.forms.fields.ChoiceField",
        {
            "widget": "django.forms.Select",
            "choices": (
                ("none", "None"),
                ("im2txt", "im2txt PyTorch Model"),
                ("blip_base_capfilt_large", "BLIP Model"),
                ("moondream", "Moondream Visual LLM"),
            ),
        },
    ],
    "llm_model": [
        "django.forms.fields.ChoiceField",
        {
            "widget": "django.forms.Select",
            "choices": (
                ("none", "None"),
                ("mistral-7b-instruct-v0.2.Q5_K_M", "Mistral 7B Instruct v0.2 Q5 K M"),
                ("moondream", "Moondream Visual LLM"),
            ),
        },
    ],
    "tagging_model": [
        "django.forms.fields.ChoiceField",
        {
            "widget": "django.forms.Select",
            "choices": (
                ("places365", "Places365 Scene Recognition"),
                ("siglip2", "SigLIP 2 (Real-world photo tags)"),
            ),
        },
    ],
}
CONSTANCE_CONFIG = {
    "ALLOW_REGISTRATION": (False, "Publicly allow user registration", bool),
    "ALLOW_UPLOAD": (
        os.environ.get("ALLOW_UPLOAD", "True") not in ("false", "False", "0", "f"),
        "Allow uploading files",
        bool,
    ),
    "SKIP_PATTERNS": (
        os.environ.get("SKIP_PATTERNS", ""),
        "Comma delimited list of patterns to ignore (e.g. '@eaDir,#recycle' for synology devices)",
        str,
    ),
    "MAP_API_PROVIDER": (
        os.environ.get("MAP_API_PROVIDER", "nominatim"),
        "Map Provider",
        "map_api_provider",
    ),
    "MAP_API_KEY": (os.environ.get("MAPBOX_API_KEY", ""), "Map Box API Key", str),
    "IMAGE_DIRS": ("/data", "Image dirs list (serialized json)", str),
    "CAPTIONING_MODEL": ("im2txt", "Captioning model", "captioning_model"),
    "LLM_MODEL": ("None", "Large Language Model", "llm_model"),
    "TAGGING_MODEL": ("places365", "Tagging model", "tagging_model"),
}

INTERNAL_IPS = ("127.0.0.1", "localhost")

CORS_ALLOW_HEADERS = (
    "cache-control",
    "accept",
    "accept-encoding",
    "allow-credentials",
    "withcredentials",
    "authorization",
    "content-type",
    "dnt",
    "origin",
    "user-agent",
    "x-csrftoken",
    "x-requested-with",
)
CORS_ALLOW_ALL_ORIGINS = False
CORS_ALLOW_CREDENTIALS = True
CORS_ALLOWED_ORIGINS = ["http://localhost:3000"]

REST_FRAMEWORK = {
    "DEFAULT_PERMISSION_CLASSES": ("rest_framework.permissions.IsAuthenticated",),
    "DEFAULT_AUTHENTICATION_CLASSES": (
        "rest_framework_simplejwt.authentication.JWTAuthentication",
        "rest_framework.authentication.BasicAuthentication",
    ),
    "DEFAULT_SCHEMA_CLASS": "drf_spectacular.openapi.AutoSchema",
    "DEFAULT_FILTER_BACKENDS": ("django_filters.rest_framework.DjangoFilterBackend",),
    "DEFAULT_PAGINATION_CLASS": "rest_framework.pagination.LimitOffsetPagination",
    "EXCEPTION_HANDLER": "api.views.views.custom_exception_handler",
    "PAGE_SIZE": 20000,
}

MIDDLEWARE = [
    "django.middleware.security.SecurityMiddleware",
    "django.contrib.sessions.middleware.SessionMiddleware",
    "corsheaders.middleware.CorsMiddleware",
    "django.middleware.common.CommonMiddleware",
    "django.middleware.csrf.CsrfViewMiddleware",
    "django.contrib.auth.middleware.AuthenticationMiddleware",
    "django.contrib.messages.middleware.MessageMiddleware",
    "django.middleware.clickjacking.XFrameOptionsMiddleware",
    "api.middleware.FingerPrintMiddleware",
]

TEMPLATES = [
    {
        "BACKEND": "django.template.backends.django.DjangoTemplates",
        "DIRS": [],
        "APP_DIRS": True,
        "OPTIONS": {
            "context_processors": [
                "django.template.context_processors.debug",
                "django.template.context_processors.request",
                "django.contrib.auth.context_processors.auth",
                "django.contrib.messages.context_processors.messages",
            ],
        },
    },
]

DATABASES = {
    "default": {
        "ENGINE": "django.db.backends.postgresql",
        "NAME": os.environ.get("DB_NAME", "db"),
        "USER": os.environ.get("DB_USER", "docker"),
        "PASSWORD": os.environ.get("DB_PASS", "AaAa1234"),
        "HOST": os.environ.get("DB_HOST", "db"),
        "PORT": os.environ.get("DB_PORT", "5432"),
        # Using persistent connections instead of pooling due to Django 5.2 pooling bugs
        # (type conversion issues with COUNT queries - see error with UUID returned as string)
        "CONN_MAX_AGE": 600,
        "CONN_HEALTH_CHECKS": True,
    },
}

AUTH_PASSWORD_VALIDATORS = [
    {
        "NAME": "django.contrib.auth.password_validation.UserAttributeSimilarityValidator",
    },
    {
        "NAME": "django.contrib.auth.password_validation.MinimumLengthValidator",
    },
    {
        "NAME": "django.contrib.auth.password_validation.CommonPasswordValidator",
    },
    {
        "NAME": "django.contrib.auth.password_validation.NumericPasswordValidator",
    },
]

# Password Hashers - Argon2 is faster and more secure than PBKDF2
# Existing passwords will continue to work (PBKDF2 fallback)
# New passwords and password changes will use Argon2
PASSWORD_HASHERS = [
    "django.contrib.auth.hashers.Argon2PasswordHasher",
    "django.contrib.auth.hashers.PBKDF2PasswordHasher",
    "django.contrib.auth.hashers.PBKDF2SHA1PasswordHasher",
]

LANGUAGE_CODE = "en-us"
TIME_ZONE = "UTC"
USE_I18N = True
USE_L10N = True
USE_TZ = True

CSRF_TRUSTED_ORIGINS = [
    "http://localhost:3000",
]
if os.environ.get("CSRF_TRUSTED_ORIGINS"):
    CSRF_TRUSTED_ORIGINS.append(os.environ.get("CSRF_TRUSTED_ORIGINS"))

LOGGING = {
    "version": 1,
    "disable_existing_loggers": False,
    "handlers": {
        "console": {
            "class": "logging.StreamHandler",
        },
    },
    "loggers": {
        "django": {
            "handlers": ["console"],
            "level": "INFO",
        },
    },
}

CHUNKED_UPLOAD_PATH = ""
CHUNKED_UPLOAD_TO = os.path.join("chunked_uploads")

DEFAULT_FAVORITE_MIN_RATING = os.environ.get("DEFAULT_FAVORITE_MIN_RATING", 4)
IMAGE_SIMILARITY_SERVER = "http://localhost:8002"


================================================
FILE: librephotos/settings/test.py
================================================
from .production import *  # noqa

DEBUG = True
LOGGING = {
    "version": 1,
    "disable_existing_loggers": True,
    "handlers": {
        "null": {
            "class": "logging.NullHandler",
        },
    },
    "root": {
        "handlers": ["null"],
        "level": "CRITICAL",
    },
}


================================================
FILE: librephotos/settings/test_sqlite.py
================================================
"""
Test settings that use SQLite instead of PostgreSQL.

Usage:
    DJANGO_SETTINGS_MODULE=librephotos.settings.test_sqlite python manage.py test api.tests.test_migration_0099
"""

from .test import *  # noqa

DATABASES = {
    "default": {
        "ENGINE": "django.db.backends.sqlite3",
        "NAME": ":memory:",
    },
}


================================================
FILE: librephotos/urls.py
================================================
"""librephotos URL Configuration

The `urlpatterns` list routes URLs to views. For more information please see:
    https://docs.djangoproject.com/en/1.11/topics/http/urls/

Examples:
Function views
    1. Add an import:  from my_app import views
    2. Add a URL to urlpatterns:  re_path(r'^$', views.home, name='home')
Class-based views
    1. Add an import:  from other_app.views import Home
    2. Add a URL to urlpatterns:  re_path(r'^$', Home.as_view(), name='home')
Including another URLconf
    1. Import the include() function: from django.conf.urls import url, include
    2. Add a URL to urlpatterns:  re_path(r'^blog/', include('blog.urls'))

"""

from django.conf import settings
from django.conf.urls.static import static
from django.contrib import admin
from django.urls import include, re_path
from django.http import HttpResponse
from django.views.generic import TemplateView
from rest_framework import routers
from rest_framework_simplejwt.serializers import (
    TokenObtainPairSerializer,
    TokenRefreshSerializer,
)
from rest_framework_simplejwt.views import (
    TokenBlacklistView,
    TokenObtainPairView,
    TokenRefreshView,
)

from api.views import (
    album_auto,
    album_folder,
    albums,
    dataviz,
    duplicates,
    faces,
    geocode,
    jobs,
    photo_metadata,
    photos,
    public_albums,
    search,
    services,
    sharing,
    stacks,
    timezone,
    upload,
    user,
    views,
)
from nextcloud import views as nextcloud_views
import os


class CustomTokenObtainPairSerializer(TokenObtainPairSerializer):
    @classmethod
    def get_token(cls, user):
        token = super(TokenObtainPairSerializer, cls).get_token(user)

        token["name"] = user.get_username()
        token["is_admin"] = user.is_superuser
        token["first_name"] = user.first_name
        token["last_name"] = user.last_name
        token["scan_directory"] = user.scan_directory
        token["confidence"] = user.confidence
        token["semantic_search_topk"] = user.semantic_search_topk
        token["nextcloud_server_address"] = user.nextcloud_server_address
        token["nextcloud_username"] = user.nextcloud_username

        return token


class CustomTokenObtainPairView(TokenObtainPairView):
    serializer_class = CustomTokenObtainPairSerializer

    def post(self, request, *args, **kwargs):
        response = super().post(request, *args, **kwargs)
        response.set_cookie("jwt", response.data["access"])
        response["Access-Control-Allow-Credentials"] = "true"
        return response


class CustomTokenRefreshView(TokenRefreshView):
    serializer_class = TokenRefreshSerializer

    def post(self, request, *args, **kwargs):
        response = super().post(request, *args, **kwargs)
        response.set_cookie("jwt", response.data["access"])
        response["Access-Control-Allow-Credentials"] = "true"
        return response


class FrontendView(TemplateView):
    """
    Serves the frontend index.html for all non-API routes (no-proxy compatibility)
    """

    def get(self, request, *args, **kwargs):
        try:
            # The frontend_build is at /code/frontend_build, but BASE_DIR is /code/librephotos
            # So we need to go up one level from BASE_DIR
            frontend_path = os.path.join(
                os.path.dirname(settings.BASE_DIR), "frontend_build", "index.html"
            )
            with open(frontend_path) as f:
                return HttpResponse(f.read(), content_type="text/html")
        except FileNotFoundError:
            return HttpResponse(
                "Frontend build not found. Please build the frontend first.", status=500
            )


router = routers.DefaultRouter()
# In SERVE_FRONTEND mode, disable DRF's API root at '/'
# so the frontend catch-all can serve the SPA instead of the browsable API.
router.include_root_view = not getattr(settings, "SERVE_FRONTEND", False)

router.register(r"api/user", user.UserViewSet, basename="user")
router.register(r"api/manage/user", user.ManageUserViewSet, basename="manage_user")
router.register(r"api/delete/user", user.DeleteUserViewSet, basename="delete_user")

router.register(
    r"api/albums/auto/list", album_auto.AlbumAutoListViewSet, basename="album_auto_list"
)
router.register(
    r"api/albums/date/list", albums.AlbumDateListViewSet, basename="album_date_list"
)
router.register(
    r"api/albums/thing/list", albums.AlbumThingListViewSet, basename="album_thing_list"
)
router.register(
    r"api/albums/place/list", albums.AlbumPlaceListViewSet, basename="album_place_list"
)
router.register(
    r"api/albums/user/list", albums.AlbumUserListViewSet, basename="album_user_list"
)

router.register(
    r"api/albums/user/edit", views.AlbumUserEditViewSet, basename="edit_album_user"
)

router.register(
    r"api/albums/user/shared/tome",
    sharing.SharedToMeAlbumUserListViewSet,
    basename="share_to_me_album_user",
)
router.register(
    r"api/albums/user/shared/fromme",
    sharing.SharedFromMeAlbumUserListViewSet,
    basename="share_from_me_album_user",
)

router.register(r"api/albums/auto", album_auto.AlbumAutoViewSet, basename="album_auto")
router.register(
    r"api/folders", album_folder.FolderNavigationViewSet, basename="folder_navigation"
)
router.register(
    r"api/albums/person", albums.AlbumPersonViewSet, basename="album_person"
)
router.register(r"api/albums/date", albums.AlbumDateViewSet, basename="album_date")
router.register(r"api/albums/thing", albums.AlbumThingViewSet, basename="album_thing")
router.register(r"api/albums/place", albums.AlbumPlaceViewSet, basename="album_place")
router.register(r"api/albums/user", albums.AlbumUserViewSet, basename="album_user")

router.register(r"api/persons", albums.PersonViewSet, basename="persons")

router.register(
    r"api/photos/shared/tome",
    sharing.SharedToMePhotoSuperSimpleListViewSet,
    basename="shared_to_me_photo",
)
router.register(
    r"api/photos/shared/fromme",
    sharing.SharedFromMePhotoSuperSimpleListViewSet,
    basename="shared_from_me_photo",
)

router.register(
    r"api/photos/notimestamp",
    photos.NoTimestampPhotoViewSet,
    basename="photos_no_timestamp",
)

router.register(r"api/photos/edit", photos.PhotoEditViewSet, basename="photo_edit")

router.register(
    r"api/photos/recentlyadded",
    photos.RecentlyAddedPhotoListViewSet,
    basename="recently_added_photo",
)
router.register(
    r"api/photos/searchlist", search.SearchListViewSet, basename="photo_search"
)

router.register(r"api/photos", photos.PhotoViewSet, basename="photos")

router.register(
    r"api/faces/incomplete",
    faces.FaceIncompleteListViewSet,
    basename="incomplete_faces",
)

router.register(r"api/faces", faces.FaceListView, basename="faces")

router.register(r"api/exists", upload.UploadPhotoExists, basename="photo_exists")
router.register(r"api/jobs", jobs.LongRunningJobViewSet, basename="jobs")
router.register(r"api/services", services.ServiceViewSet, basename="service")

urlpatterns = [
    re_path(r"^", include(router.urls)),
    re_path(r"^api/django-admin/", admin.site.urls),
    re_path(r"^api/sitesettings", views.SiteSettingsView.as_view()),
    re_path(r"^api/firsttimesetup", user.IsFirstTimeSetupView.as_view()),
    re_path(r"^api/dirtree", user.RootPathTreeView.as_view()),
    re_path(r"^api/labelfaces", faces.SetFacePersonLabel.as_view()),
    re_path(r"^api/deletefaces", faces.DeleteFaces.as_view()),
    re_path(r"^api/savemetadata", photos.SaveMetadataView.as_view()),
    re_path(r"^api/photosedit/delete", photos.DeletePhotos.as_view()),
    re_path(r"^api/photosedit/setdeleted", photos.SetPhotosDeleted.as_view()),
    re_path(r"^api/photosedit/favorite", photos.SetPhotosFavorite.as_view()),
    re_path(r"^api/photosedit/hide", photos.SetPhotosHidden.as_view()),
    re_path(r"^api/photosedit/makepublic", photos.SetPhotosPublic.as_view()),
    re_path(r"^api/photosedit/share", photos.SetPhotosShared.as_view()),
    re_path(r"^api/photosedit/generateim2txt", photos.GeneratePhotoCaption.as_view()),
    re_path(r"^api/photosedit/savecaption", photos.SavePhotoCaption.as_view()),
    re_path(r"^api/useralbum/share", views.SetUserAlbumShared.as_view()),
    re_path(r"^api/trainfaces", faces.TrainFaceView.as_view()),
    re_path(r"^api/clusterfaces", dataviz.ClusterFaceView.as_view()),
    re_path(r"^api/socialgraph", dataviz.SocialGraphView.as_view()),
    re_path(r"^api/scanphotos", views.ScanPhotosView.as_view()),
    re_path(r"^api/scanuploadedphotos", views.FullScanPhotosView.as_view()),
    re_path(r"^api/fullscanphotos", views.FullScanPhotosView.as_view()),
    re_path(r"^api/scanfaces", faces.ScanFacesView.as_view()),
    re_path(r"^api/deletemissingphotos", views.DeleteMissingPhotosView.as_view()),
    re_path(r"^api/autoalbumgen", album_auto.AutoAlbumGenerateView.as_view()),
    re_path(r"^api/autoalbumtitlegen", album_auto.RegenerateAutoAlbumTitles.as_view()),
    # Photo Stacks - Organizational grouping (bursts, brackets, manual)
    # NOTE: RAW+JPEG pairs and Live Photos now use Photo.files (file variants model)
    re_path(r"^api/stacks/detect/?$", stacks.DetectStacksView.as_view()),
    re_path(r"^api/stacks/stats/?$", stacks.PhotoStackStatsView.as_view()),
    re_path(r"^api/stacks/manual/?$", stacks.CreateManualStackView.as_view()),
    re_path(r"^api/stacks/merge/?$", stacks.MergeStacksView.as_view()),
    re_path(
        r"^api/stacks/(?P<stack_id>[0-9a-f-]+)/add/?$",
        stacks.AddToStackView.as_view(),
    ),
    re_path(
        r"^api/stacks/(?P<stack_id>[0-9a-f-]+)/remove/?$",
        stacks.RemoveFromStackView.as_view(),
    ),
    re_path(
        r"^api/stacks/(?P<stack_id>[0-9a-f-]+)/delete/?$",
        stacks.PhotoStackDeleteView.as_view(),
    ),
    re_path(
        r"^api/stacks/(?P<stack_id>[0-9a-f-]+)/primary/?$",
        stacks.PhotoStackSetPrimaryView.as_view(),
    ),
    re_path(
        r"^api/stacks/(?P<stack_id>[0-9a-f-]+)/?$",
        stacks.PhotoStackDetailView.as_view(),
    ),
    re_path(r"^api/stacks/?$", stacks.PhotoStackListView.as_view()),
    # Duplicates - Storage cleanup (exact copies, visual duplicates)
    re_path(r"^api/duplicates/detect", duplicates.DetectDuplicatesView.as_view()),
    re_path(r"^api/duplicates/stats", duplicates.DuplicateStatsView.as_view()),
    re_path(
        r"^api/duplicates/(?P<duplicate_id>[0-9a-f-]+)/resolve",
        duplicates.DuplicateResolveView.as_view(),
    ),
    re_path(
        r"^api/duplicates/(?P<duplicate_id>[0-9a-f-]+)/dismiss",
        duplicates.DuplicateDismissView.as_view(),
    ),
    re_path(
        r"^api/duplicates/(?P<duplicate_id>[0-9a-f-]+)/revert",
        duplicates.DuplicateRevertView.as_view(),
    ),
    re_path(
        r"^api/duplicates/(?P<duplicate_id>[0-9a-f-]+)/delete",
        duplicates.DuplicateDeleteView.as_view(),
    ),
    re_path(
        r"^api/duplicates/(?P<duplicate_id>[0-9a-f-]+)",
        duplicates.DuplicateDetailView.as_view(),
    ),
    re_path(r"^api/duplicates", duplicates.DuplicateListView.as_view()),
    # Photo Metadata - Structured metadata with edit history
    re_path(
        r"^api/photos/(?P<photo_id>[0-9a-f-]+|[a-f0-9]{64})/metadata/history",
        photo_metadata.PhotoMetadataViewSet.as_view({"get": "history"}),
    ),
    re_path(
        r"^api/photos/(?P<photo_id>[0-9a-f-]+|[a-f0-9]{64})/metadata/revert-all",
        photo_metadata.PhotoMetadataViewSet.as_view({"post": "revert_all"}),
    ),
    re_path(
        r"^api/photos/(?P<photo_id>[0-9a-f-]+|[a-f0-9]{64})/metadata/revert/(?P<edit_id>[0-9a-f-]+)",
        photo_metadata.PhotoMetadataViewSet.as_view({"post": "revert"}),
    ),
    re_path(
        r"^api/photos/(?P<photo_id>[0-9a-f-]+|[a-f0-9]{64})/metadata",
        photo_metadata.PhotoMetadataViewSet.as_view({"get": "retrieve", "patch": "partial_update"}),
    ),
    re_path(r"^api/photos/metadata/bulk", photo_metadata.BulkMetadataView.as_view()),
    # File Variants - Download specific file variants (RAW, JPEG, video, etc.)
    re_path(
        r"^api/photos/(?P<image_hash>[a-f0-9]+)/file/(?P<file_hash>[a-f0-9]+)$",
        photos.FileVariantDownloadView.as_view(),
        name="file_variant_download",
    ),
    # Set main file for a photo (switch between variants)
    re_path(
        r"^api/photos/(?P<image_hash>[a-f0-9]+)/main-file$",
        photos.SetMainFileView.as_view(),
        name="set_main_file",
    ),
    re_path(r"^api/searchtermexamples", views.SearchTermExamples.as_view()),
    re_path(r"^api/locationsunburst", dataviz.LocationSunburst.as_view()),
    re_path(r"^api/locationtimeline", dataviz.LocationTimeline.as_view()),
    re_path(r"^api/defaultrules", user.DefaultRulesView.as_view()),
    re_path(r"^api/predefinedrules", user.PredefinedRulesView.as_view()),
    re_path(r"^api/defaultburstrules", user.DefaultBurstRulesView.as_view()),
    re_path(r"^api/predefinedburstrules", user.PredefinedBurstRulesView.as_view()),
    re_path(r"^api/stats", dataviz.StatsView.as_view()),
    re_path(r"^api/storagestats", views.StorageStatsView.as_view()),
    re_path(r"^api/imagetag", views.ImageTagView.as_view()),
    re_path(r"^api/serverstats", dataviz.ServerStatsView.as_view()),
    re_path(r"^api/serverlogs", dataviz.ServerLogsView.as_view()),
    re_path(r"^api/locclust", dataviz.LocationClustersView.as_view()),
    re_path(r"^api/photomonthcounts", dataviz.PhotoMonthCountsView.as_view()),
    re_path(r"^api/wordcloud", dataviz.SearchTermWordCloudView.as_view()),
    re_path(r"^api/auth/token/obtain/$", CustomTokenObtainPairView.as_view()),
    re_path(r"^api/auth/token/refresh/$", CustomTokenRefreshView.as_view()),
    re_path(r"^api/auth/token/blacklist/", TokenBlacklistView.as_view()),
    re_path(
        r"^media/(?P<path>.*)/(?P<fname>.*)",
        views.UnifiedMediaAccessView.as_view(),
        name="media",
    ),
    re_path(
        r"^api/delete/zip/(?P<fname>.*)",
        views.DeleteZipView.as_view(),
        name="delete-zip",
    ),
    re_path(r"^api/rqavailable/$", jobs.QueueAvailabilityView.as_view()),
    re_path(r"^api/nextcloud/listdir", nextcloud_views.ListDir.as_view()),
    re_path(r"^api/nextcloud/scanphotos", nextcloud_views.ScanPhotosView.as_view()),
    re_path(r"^api/photos/download$", views.ZipListPhotosView_V2.as_view()),
    # Public album by slug
    re_path(
        r"^api/public/albums/s/(?P<slug>[^/]+)/$",
        public_albums.PublicAlbumBySlug.as_view(),
    ),
    # Public photo detail in album
    re_path(
        r"^api/public/albums/s/(?P<slug>[^/]+)/photos/(?P<photo_id>[^/]+)/$",
        public_albums.PublicPhotoDetailBySlug.as_view(),
    ),
    # Toggle album public flag
    re_path(r"^api/useralbum/makepublic", public_albums.SetUserAlbumPublic.as_view()),
    re_path(r"^api/timezones", timezone.TimeZoneView.as_view()),
    re_path(r"^api/geocode/search", geocode.GeocodeSearchView.as_view()),
    re_path(r"api/upload/complete/", upload.UploadPhotosChunkedComplete.as_view()),
    re_path(r"api/upload/", upload.UploadPhotosChunked.as_view()),
]
urlpatterns += static(settings.STATIC_URL, document_root=settings.STATIC_ROOT)

if settings.DEBUG:
    from drf_spectacular.views import (
        SpectacularAPIView,
        SpectacularRedocView,
        SpectacularSwaggerView,
    )

    urlpatterns += [re_path(r"^api/silk/", include("silk.urls", namespace="silk"))]
    urlpatterns += [
        re_path(r"^api/schema", SpectacularAPIView.as_view(), name="schema"),
        re_path(r"^api/swagger", SpectacularSwaggerView.as_view(), name="swagger-ui"),
        re_path(r"^api/redoc", SpectacularRedocView.as_view(), name="redoc"),
        re_path(r"^api/help$", views.ApiHelpView.as_view()),
    ]

# Configure media and frontend serving for no-proxy (SERVE_FRONTEND) mode
if getattr(settings, "SERVE_FRONTEND", False):
    # Serve frontend assets and manifest directly
    from django.views.static import serve as static_serve  # type: ignore

    frontend_build_path = os.path.join(
        os.path.dirname(settings.BASE_DIR), "frontend_build"
    )
    urlpatterns += [
        re_path(
            r"^assets/(?P<path>.*)$",
            static_serve,
            {"document_root": os.path.join(frontend_build_path, "assets")},
        ),
        re_path(
            r"^(?P<path>manifest\.json)$",
            static_serve,
            {"document_root": frontend_build_path},
        ),
        re_path(
            r"^(?P<path>favicon\.ico)$",
            static_serve,
            {"document_root": frontend_build_path},
        ),
        re_path(
            r"^(?P<path>logo-white\.png)$",
            static_serve,
            {"document_root": frontend_build_path},
        ),
        re_path(
            r"^(?P<path>logo\.png)$",
            static_serve,
            {"document_root": frontend_build_path},
        ),
        re_path(
            r"^(?P<path>unknown_user\.jpg)$",
            static_serve,
            {"document_root": frontend_build_path},
        ),
        re_path(
            r"^(?P<path>.*\.(?:png|jpg|jpeg|gif|ico|svg))$",
            static_serve,
            {"document_root": frontend_build_path},
        ),
    ]

    # Catch-all pattern for frontend routes (must be last)
    urlpatterns += [
        re_path(
            r"^(?!api/)(?!media/)(?!static/)(?!assets/)(?!manifest\.json).*$",
            FrontendView.as_view(),
            name="frontend",
        ),
    ]


================================================
FILE: librephotos/wsgi.py
================================================
import os

from django.core.wsgi import get_wsgi_application

environment = "production"
if os.environ.get("DEBUG", "0") == "1":
    environment = "development"

os.environ.setdefault("DJANGO_SETTINGS_MODULE", f"librephotos.settings.{environment}")

application = get_wsgi_application()


================================================
FILE: manage.py
================================================
#!/usr/bin/env python
import os
import sys

if __name__ == "__main__":
    environment = "production"
    if os.environ.get("DEBUG", "0") == "1":
        environment = "development"

    try:
        command = sys.argv[1]
    except IndexError:
        command = "help"

    do_not_collect_coverage = os.environ.get("NO_COVERAGE") is not None
    running_tests = command == "test"
    if running_tests:
        environment = "test"
    if running_tests and not do_not_collect_coverage:
        from coverage import Coverage

        cov = Coverage()
        cov.erase()
        cov.start()

    from django.core.management import execute_from_command_line

    os.environ.setdefault(
        "DJANGO_SETTINGS_MODULE", f"librephotos.settings.{environment}"
    )
    execute_from_command_line(sys.argv)

    if running_tests and not do_not_collect_coverage:
        cov.stop()
        cov.save()
        cov.html_report()
        covered = cov.report()


================================================
FILE: nextcloud/__init__.py
================================================


================================================
FILE: nextcloud/admin.py
================================================


================================================
FILE: nextcloud/apps.py
================================================
from django.apps import AppConfig


class NextcloudConfig(AppConfig):
    name = "nextcloud"


================================================
FILE: nextcloud/directory_watcher.py
================================================
import os
import pathlib

import owncloud as nextcloud
from django.conf import settings

from api import util
from api.directory_watcher import handle_new_image
from api.image_similarity import build_image_similarity_index
from api.models import LongRunningJob


def isValidNCMedia(file_obj):
    file_attr = file_obj.attributes
    filetype = file_attr.get("{DAV:}getcontenttype", "")
    try:
        return (
            "jpeg" in filetype
            or "png" in filetype
            or "bmp" in filetype
            or "gif" in filetype
            or "heic" in filetype
            or "heif" in filetype
        )
    except Exception:
        util.logger.exception("An image thrown an exception")
        return False


def collect_photos(nc, path, photos):
    for x in nc.list(path):
        if not x.is_dir() and isValidNCMedia(x):
            photos.append(x.path)
        elif x.is_dir():
            collect_photos(nc, x.path, photos)


def scan_photos(user, job_id):
    lrj = LongRunningJob.get_or_create_job(
        user=user,
        job_type=LongRunningJob.JOB_SCAN_PHOTOS,
        job_id=job_id,
    )

    nc = nextcloud.Client(user.nextcloud_server_address)
    nc.login(user.nextcloud_username, user.nextcloud_app_password)

    photos = []

    paths = []

    collect_photos(nc, user.nextcloud_scan_directory, photos)

    for photo in photos:
        local_dir = os.path.join(
            settings.DATA_ROOT,
            "nextcloud_media",
            user.username,
            os.path.dirname(photo)[1:],
        )
        local_path = os.path.join(
            settings.DATA_ROOT, "nextcloud_media", user.username, photo[1:]
        )
        paths.append(local_path)

        if not os.path.exists(local_dir):
            pathlib.Path(local_dir).mkdir(parents=True, exist_ok=True)

        if not os.path.exists(local_path):
            nc.get_file(photo, local_path)
        util.logger.info("Downloaded photo from nextcloud to " + local_path)

    try:
        paths.sort()

        added_photo_count = 0
        to_add_count = len(paths)
        for idx, image_path in enumerate(paths):
            util.logger.info("begin handling of photo %d/%d" % (idx + 1, to_add_count))
            handle_new_image(user, image_path, job_id)
            lrj.update_progress(current=idx + 1, target=to_add_count)

        util.logger.info(f"Added {len(paths)} photos")
        build_image_similarity_index(user)

        lrj.complete()
    except Exception as e:
        util.logger.exception(str(e))
        lrj.fail(error=e)
    return {"new_photo_count": added_photo_count, "status": True}


================================================
FILE: nextcloud/models.py
================================================


================================================
FILE: nextcloud/tests.py
================================================
# from django.test import TestCase

# Create your tests here.


================================================
FILE: nextcloud/views.py
================================================
import uuid
from urllib.parse import urlparse

import owncloud as nextcloud
from django_q.tasks import AsyncTask
from drf_spectacular.utils import extend_schema
from rest_framework.response import Response
from rest_framework.views import APIView

from api.util import logger
from nextcloud.directory_watcher import scan_photos


class ListDir(APIView):
    def get(self, request, format=None):
        if not request.query_params.get("fpath"):
            return Response([])
        path = request.query_params["fpath"]

        if not request.user.nextcloud_server_address or not valid_url(
            request.user.nextcloud_server_address
        ):
            return Response([])

        nc = nextcloud.Client(request.user.nextcloud_server_address)
        nc.login(request.user.nextcloud_username, request.user.nextcloud_app_password)
        try:
            return Response(
                [
                    {
                        "absolute_path": p.path,
                        "title": p.path.split("/")[-2],
                        "children": [],
                    }
                    for p in nc.list(path)
                    if p.is_dir()
                ]
            )
        except nextcloud.HTTPResponseError:
            return Response(status=400)


def valid_url(url):
    try:
        urlparse(url)
        return True
    except BaseException:
        return False


class ScanPhotosView(APIView):
    def post(self, request, format=None):
        return self._scan_photos(request)

    @extend_schema(
        deprecated=True,
        description="Use POST method instead",
    )
    def get(self, request, format=None):
        return self._scan_photos(request)

    def _scan_photos(self, request):
        try:
            job_id = uuid.uuid4()
            AsyncTask(scan_photos, request.user, job_id).run()
            return Response({"status": True, "job_id": job_id})
        except BaseException:
            logger.exception("An Error occurred")
            return Response({"status": False})


================================================
FILE: pyproject.toml
================================================
[tool.ruff]
line-length = 88
target-version = "py311"
extend-exclude = ["migrations", "im2txt", "blip", "places365"]

[lint]
select = [
  "E",  # Pyflakes (errors)
  "F",  # Pyflakes
  "W",  # pycodestyle warnings
  "I",  # isort (import sorting)
  "N",  # PEP8 naming
  "UP", # Pyupgrade (modern syntax)
  "DJ", # pylint-django equivalent
  "PL", # pylint rules
]
ignore = ["E501", "E203", "E231"]

[tool.ruff.format]
quote-style = "double"
indent-style = "space"
line-ending = "lf"


================================================
FILE: renovate.json
================================================
{
  "$schema": "https://docs.renovatebot.com/renovate-schema.json",
  "packageRules": [
    {
      "matchUpdateTypes": ["minor", "patch", "pin", "digest"],
      "automerge": true
    }
  ],
  "extends": [
    "config:base"
  ]
}


================================================
FILE: requirements.dev.txt
================================================
ipdb==0.13.13
ipython==9.6.0
ipython-genutils==0.2.0
Pygments==2.19.2
prompt-toolkit==3.0.52
nose==1.3.7
pre-commit==4.3.0
coverage==7.11.0
Faker==37.12.0
setuptools==80.9.0
pyfakefs==5.9.3
pytest==8.4.2
ruff==0.14.8


================================================
FILE: requirements.mlval.txt
================================================
pycocotools==2.0.10
pycocoevalcap==1.2
nltk==3.9.2
matplotlib==3.10.7
onnx==1.19.0
onnxscript

================================================
FILE: requirements.txt
================================================
Django==5.2.11
django-constance==4.3.4
django-cors-headers==4.9.0
git+https://github.com/derneuere/django-chunked-upload@master#egg=django-chunked-upload
django-cryptography-5==2.0.3
django-extensions==4.1
django-filter==25.2
django-bulk-update
django-silk==5.4.3
djangorestframework==3.16.1
djangorestframework-simplejwt==5.5.1
drf-spectacular==0.29.0
face-recognition==1.3.0
faiss-cpu==1.12.0
Flask==3.1.2
Flask-Cors==6.0.1
Flask-RESTful==0.3.10
geopy==2.4.1
gunicorn==23.0.0
hdbscan==0.8.40
networkx==3.4.2
nltk==3.9.2
markupsafe==3.0.3
Pillow==11.3.0
ImageHash==4.3.1
psycopg==3.2.10
https://github.com/owncloud/pyocclient/archive/master.zip
pytz==2025.2
tzdata==2025.2
PyExifTool==0.4.9
pyvips==3.0.0
scikit-learn<1.7.3
seaborn==0.13.2
sentence_transformers==2.7.0
timezonefinder==6.6.3
tqdm==4.67.1
gevent==25.9.1
python-magic==0.4.27
Wand==0.6.13
django-q2==1.9.0
safetensors==0.6.2
py-cpuinfo==9.0.0
psutil==7.2.2

# Dependencies for blip
timm==1.0.19
# Dependencies for Moondream chat handler (llama-cpp-python multimodal)
transformers==4.56.2
# Dependencies for mistral quantized and multimodal models like Moondream
llama-cpp-python==0.3.16
argon2-cffi==23.1.0
# Dependencies for SigLIP 2 ONNX inference
onnxruntime==1.21.1
# SentencePiece tokenizer for SigLIP 2
sentencepiece==0.2.0

================================================
FILE: service/__init__.py
================================================


================================================
FILE: service/clip_embeddings/__init__.py
================================================


================================================
FILE: service/clip_embeddings/main.py
================================================
import time

import gevent
from flask import Flask, request
from gevent.pywsgi import WSGIServer
from semantic_search.semantic_search import SemanticSearch

app = Flask(__name__)


def log(message):
    print(f"clip embeddings: {message}")


semantic_search_instance = None
last_request_time = None


@app.route("/clip-embeddings", methods=["POST"])
def create_clip_embeddings():
    global last_request_time
    # Update last request time
    last_request_time = time.time()

    try:
        data = request.get_json()
        imgs = data["imgs"]
        model = data["model"]
    except Exception as e:
        print(str(e))
        return "", 400

    global semantic_search_instance

    if semantic_search_instance is None:
        semantic_search_instance = SemanticSearch()

    imgs_emb, magnitudes = semantic_search_instance.calculate_clip_embeddings(
        imgs, model
    )
    # Convert NumPy arrays to Python lists
    imgs_emb_list = [enc.tolist() for enc in imgs_emb]
    magnitudes = [float(m) for m in magnitudes]
    return {"imgs_emb": imgs_emb_list, "magnitudes": magnitudes}, 201


@app.route("/query-embeddings", methods=["POST"])
def calculate_query_embeddings():
    global last_request_time
    # Update last request time
    last_request_time = time.time()

    try:
        data = request.get_json()
        query = data["query"]
        model = data["model"]
    except Exception as e:
        print(str(e))
        return "", 400
    global semantic_search_instance

    if semantic_search_instance is None:
        semantic_search_instance = SemanticSearch()

    emb, magnitude = semantic_search_instance.calculate_query_embeddings(query, model)
    return {"emb": emb, "magnitude": magnitude}, 201


@app.route("/health", methods=["GET"])
def health():
    return {"last_request_time": last_request_time}, 200


if __name__ == "__main__":
    log("service starting")
    server = WSGIServer(("0.0.0.0", 8006), app)
    server_thread = gevent.spawn(server.serve_forever)
    gevent.joinall([server_thread])


================================================
FILE: service/clip_embeddings/semantic_search/__init__.py
================================================


================================================
FILE: service/clip_embeddings/semantic_search/semantic_search.py
================================================
import gc

import numpy as np
import PIL
from sentence_transformers import SentenceTransformer


class SemanticSearch:
    model = None
    model_is_loaded = False

    def load(self, model):
        self.load_model(model)
        self.model_is_loaded = True
        pass

    def unload(self):
        del self.model
        self.model = None
        gc.collect()
        self.model_is_loaded = False
        pass

    def load_model(self, model):
        self.model = SentenceTransformer(model)

    def calculate_clip_embeddings(self, img_paths, model):
        import torch

        if not self.model_is_loaded:
            self.load(model)
        imgs = []
        if type(img_paths) is list:
            for path in img_paths:
                try:
                    img = PIL.Image.open(path)
                    imgs.append(img)
                except PIL.UnidentifiedImageError:
                    print(f"Error loading image: {path}")
        else:
            try:
                img = PIL.Image.open(img_paths)
                imgs.append(img)
            except PIL.UnidentifiedImageError:
                print(f"Error loading image: {img_paths}")

        try:
            imgs_emb = self.model.encode(imgs, batch_size=32, convert_to_tensor=True)
            if torch.cuda.is_available():
                if type(img_paths) is list:
                    magnitudes = list(
                        map(lambda x: np.linalg.norm(x.cpu().numpy()), imgs_emb)
                    )

                    return imgs_emb, magnitudes
                else:
                    img_emb = imgs_emb[0].cpu().numpy().tolist()
                    magnitude = np.linalg.norm(img_emb)

                    return img_emb, magnitude
            else:
                if type(img_paths) is list:
                    magnitudes = map(np.linalg.norm, imgs_emb)
                    return imgs_emb, magnitudes
                else:
                    img_emb = imgs_emb[0].tolist()
                    magnitude = np.linalg.norm(img_emb)

                return img_emb, magnitude
        except Exception as e:
            print(f"Error in calculating clip embeddings: {e}")
            raise e

    def calculate_query_embeddings(self, query, model):
        if not self.model_is_loaded:
            self.load(model)

        query_emb = self.model.encode([query], convert_to_tensor=True)[0].tolist()
        magnitude = np.linalg.norm(query_emb)

        return query_emb, magnitude


================================================
FILE: service/exif/__init__.py
================================================


================================================
FILE: service/exif/main.py
================================================
import exiftool
import gevent
from flask import Flask, request
from gevent.pywsgi import WSGIServer

static_et = exiftool.ExifTool()
static_struct_et = exiftool.ExifTool(common_args=["-struct"])

app = Flask(__name__)


def log(message):
    print(f"exif: {message}")


@app.route("/get-tags", methods=["POST"])
def get_tags():
    try:
        data = request.get_json()
        files_by_reverse_priority = data["files_by_reverse_priority"]
        tags = data["tags"]
        struct = data["struct"]
    except Exception:
        return "", 400

    et = None
    if struct:
        et = static_struct_et
    else:
        et = static_et
    if not et.running:
        et.start()

    values = []
    try:
        for tag in tags:
            value = None
            for file in files_by_reverse_priority:
                retrieved_value = et.get_tag(tag, file)
                if retrieved_value is not None:
                    value = retrieved_value
            values.append(value)
    except Exception:
        log("An error occurred")

    return {"values": values}, 201


@app.route("/health", methods=["GET"])
def health():
    return {"status": "OK"}, 200


if __name__ == "__main__":
    log("service starting")
    server = WSGIServer(("0.0.0.0", 8010), app)
    server_thread = gevent.spawn(server.serve_forever)
    gevent.joinall([server_thread])


================================================
FILE: service/face_recognition/__init__.py
================================================


================================================
FILE: service/face_recognition/main.py
================================================
import time

import face_recognition
import gevent
import numpy as np
import PIL
from flask import Flask, request
from gevent.pywsgi import WSGIServer

app = Flask(__name__)

last_request_time = None


def log(message):
    print(f"face_recognition: {message}")


@app.route("/face-encodings", methods=["POST"])
def create_face_encodings():
    global last_request_time
    # Update last request time
    last_request_time = time.time()

    try:
        data = request.get_json()
        source = data["source"]
        face_locations = data["face_locations"]
    except Exception:
        return "", 400

    image = np.array(PIL.Image.open(source))
    face_encodings = face_recognition.face_encodings(
        image,
        known_face_locations=face_locations,
    )
    # Convert NumPy arrays to Python lists
    face_encodings_list = [enc.tolist() for enc in face_encodings]
    # Log number of face encodings
    log(f"created face_encodings={len(face_encodings_list)}")
    return {"encodings": face_encodings_list}, 201


@app.route("/face-locations", methods=["POST"])
def create_face_locations():
    global last_request_time
    # Update last request time
    last_request_time = time.time()

    try:
        data = request.get_json()
        source = data["source"]
        model = data["model"]
    except Exception:
        return "", 400

    image = np.array(PIL.Image.open(source))
    face_locations = face_recognition.face_locations(image, model=model)
    log(f"created face_location={face_locations}")
    return {"face_locations": face_locations}, 201


@app.route("/health", methods=["GET"])
def health():
    return {"last_request_time": last_request_time}, 200


if __name__ == "__main__":
    log("service starting")
    server = WSGIServer(("0.0.0.0", 8005), app)
    server_thread = gevent.spawn(server.serve_forever)
    gevent.joinall([server_thread])


================================================
FILE: service/image_captioning/__init__.py
================================================


================================================
FILE: service/image_captioning/api/im2txt/README.md
================================================
# Image Captioning
The goal of image captioning is to convert a given input image into a natural language description. The encoder-decoder framework is widely used for this task. The image encoder is a convolutional neural network (CNN). In this tutorial, we used [resnet-152](https://arxiv.org/abs/1512.03385) model pretrained on the [ILSVRC-2012-CLS](http://www.image-net.org/challenges/LSVRC/2012/) image classification dataset. The decoder is a long short-term memory (LSTM) network. 

![alt text](png/model.png)

#### Training phase
For the encoder part, the pretrained CNN extracts the feature vector from a given input image. The feature vector is linearly transformed to have the same dimension as the input dimension of the LSTM network. For the decoder part, source and target texts are predefined. For example, if the image description is **"Giraffes standing next to each other"**, the source sequence is a list containing **['\<start\>', 'Giraffes', 'standing', 'next', 'to', 'each', 'other']** and the target sequence is a list containing **['Giraffes', 'standing', 'next', 'to', 'each', 'other', '\<end\>']**. Using these source and target sequences and the feature vector, the LSTM decoder is trained as a language model conditioned on the feature vector.

#### Test phase
In the test phase, the encoder part is almost same as the training phase. The only difference is that batchnorm layer uses moving average and variance instead of mini-batch statistics. This can be easily implemented using [encoder.eval()](https://github.com/yunjey/pytorch-tutorial/blob/master/tutorials/03-advanced/image_captioning/sample.py#L37). For the decoder part, there is a significant difference between the training phase and the test phase. In the test phase, the LSTM decoder can't see the image description. To deal with this problem, the LSTM decoder feeds back the previously generated word to the next input. This can be implemented using a [for-loop](https://github.com/yunjey/pytorch-tutorial/blob/master/tutorials/03-advanced/image_captioning/model.py#L48).


## Usage 


#### 1. Clone the repositories
```bash
$ git clone https://github.com/pdollar/coco.git
$ cd coco/PythonAPI/
$ make
$ python setup.py build
$ python setup.py install
$ cd ../../
$ git clone https://github.com/yunjey/pytorch-tutorial.git
$ cd pytorch-tutorial/tutorials/03-advanced/image_captioning/
```

#### 2. Download the dataset

```bash
$ pip install -r requirements.txt
$ chmod +x download.sh
$ ./download.sh
```

#### 3. Preprocessing

```bash
$ python build_vocab.py   
$ python resize.py
```

#### 4. Train the model

```bash
$ python train.py    
```

#### 5. Test the model 

```bash
$ python sample.py --image='png/example.png'
```

<br>

## Pretrained model
If you do not want to train the model from scratch, you can use a pretrained model. You can download the pretrained model [here](https://www.dropbox.com/s/ne0ixz5d58ccbbz/pretrained_model.zip?dl=0) and the vocabulary file [here](https://www.dropbox.com/s/26adb7y9m98uisa/vocap.zip?dl=0). You should extract pretrained_model.zip to `./models/` and vocab.pkl to `./data/` using `unzip` command.


================================================
FILE: service/image_captioning/api/im2txt/blip/blip.py
================================================
"""* Copyright (c) 2022, salesforce.com, inc.
* All rights reserved.
* SPDX-License-Identifier: BSD-3-Clause
* For full license text, see LICENSE.txt file in the repo root or https://opensource.org/licenses/BSD-3-Clause
* By Junnan Li
"""

import os
from urllib.parse import urlparse

import torch
from torch import nn
from transformers import BertTokenizer

from api.im2txt.blip.med import BertConfig, BertLMHeadModel, BertModel
from api.im2txt.blip.vit import VisionTransformer, interpolate_pos_embed


class BLIP_Base(nn.Module):
    def __init__(
        self,
        med_config="configs/med_config.json",
        image_size=224,
        vit="base",
        vit_grad_ckpt=False,
        vit_ckpt_layer=0,
    ):
        """Args:
        med_config (str): path for the mixture of encoder-decoder model's configuration file
        image_size (int): input image size
        vit (str): model size of vision transformer

        """
        super().__init__()

        self.visual_encoder, vision_width = create_vit(
            vit, image_size, vit_grad_ckpt, vit_ckpt_layer
        )
        self.tokenizer = init_tokenizer()
        med_config = BertConfig.from_json_file(med_config)
        med_config.encoder_width = vision_width
        self.text_encoder = BertModel(config=med_config, add_pooling_layer=False)

    def forward(self, image, caption, mode):
        assert mode in [
            "image",
            "text",
            "multimodal",
        ], "mode parameter must be image, text, or multimodal"
        text = self.tokenizer(caption, return_tensors="pt").to(image.device)

        if mode == "image":
            # return image features
            image_embeds = self.visual_encoder(image)
            return image_embeds

        elif mode == "text":
            # return text features
            text_output = self.text_encoder(
                text.input_ids,
                attention_mask=text.attention_mask,
                return_dict=True,
                mode="text",
            )
            return text_output.last_hidden_state

        elif mode == "multimodal":
            # return multimodel features
            image_embeds = self.visual_encoder(image)
            image_atts = torch.ones(image_embeds.size()[:-1], dtype=torch.long).to(
                image.device
            )

            text.input_ids[:, 0] = self.tokenizer.enc_token_id
            output = self.text_encoder(
                text.input_ids,
                attention_mask=text.attention_mask,
                encoder_hidden_states=image_embeds,
                encoder_attention_mask=image_atts,
                return_dict=True,
            )
            return output.last_hidden_state


class BLIP_Decoder(nn.Module):
    def __init__(
        self,
        med_config="configs/med_config.json",
        image_size=384,
        vit="base",
        vit_grad_ckpt=False,
        vit_ckpt_layer=0,
        prompt="a picture of ",
    ):
        """Args:
        med_config (str): path for the mixture of encoder-decoder model's configuration file
        image_size (int): input image size
        vit (str): model size of vision transformer

        """
        super().__init__()

        self.visual_encoder, vision_width = create_vit(
            vit, image_size, vit_grad_ckpt, vit_ckpt_layer
        )
        self.tokenizer = init_tokenizer()
        med_config = BertConfig.from_json_file(med_config)
        med_config.encoder_width = vision_width
        self.text_decoder = BertLMHeadModel(config=med_config)

        self.prompt = prompt
        self.prompt_length = len(self.tokenizer(self.prompt).input_ids) - 1

    def forward(self, image, caption):
        image_embeds = self.visual_encoder(image)
        image_atts = torch.ones(image_embeds.size()[:-1], dtype=torch.long).to(
            image.device
        )

        text = self.tokenizer(
            caption,
            padding="longest",
            truncation=True,
            max_length=40,
            return_tensors="pt",
        ).to(image.device)

        text.input_ids[:, 0] = self.tokenizer.bos_token_id

        decoder_targets = text.input_ids.masked_fill(
            text.input_ids == self.tokenizer.pad_token_id, -100
        )
        decoder_targets[:, : self.prompt_length] = -100

        decoder_output = self.text_decoder(
            text.input_ids,
            attention_mask=text.attention_mask,
            encoder_hidden_states=image_embeds,
            encoder_attention_mask=image_atts,
            labels=decoder_targets,
            return_dict=True,
        )
        loss_lm = decoder_output.loss

        return loss_lm

    def generate(
        self,
        image,
        sample=False,
        num_beams=3,
        max_length=30,
        min_length=10,
        top_p=0.9,
        repetition_penalty=1.0,
    ):
        image_embeds = self.visual_encoder(image)

        if not sample:
            image_embeds = image_embeds.repeat_interleave(num_beams, dim=0)

        image_atts = torch.ones(image_embeds.size()[:-1], dtype=torch.long).to(
            image.device
        )
        model_kwargs = {
            "encoder_hidden_states": image_embeds,
            "encoder_attention_mask": image_atts,
        }

        prompt = [self.prompt] * image.size(0)
        input_ids = self.tokenizer(prompt, return_tensors="pt").input_ids.to(
            image.device
        )
        input_ids[:, 0] = self.tokenizer.bos_token_id
        input_ids = input_ids[:, :-1]

        if sample:
            # nucleus sampling
            outputs = self.text_decoder.generate(
                input_ids=input_ids,
                max_length=max_length,
                min_length=min_length,
                do_sample=True,
                top_p=top_p,
                num_return_sequences=1,
                eos_token_id=self.tokenizer.sep_token_id,
                pad_token_id=self.tokenizer.pad_token_id,
                repetition_penalty=1.1,
                **model_kwargs,
            )
        else:
            # beam search
            outputs = self.text_decoder.generate(
                input_ids=input_ids,
                max_length=max_length,
                min_length=min_length,
                num_beams=num_beams,
                eos_token_id=self.tokenizer.sep_token_id,
                pad_token_id=self.tokenizer.pad_token_id,
                repetition_penalty=repetition_penalty,
                **model_kwargs,
            )

        captions = []
        for output in outputs:
            caption = self.tokenizer.decode(output, skip_special_tokens=True)
            captions.append(caption[len(self.prompt) :])
        return captions


def blip_decoder(pretrained="", **kwargs):
    model = BLIP_Decoder(**kwargs)
    if pretrained:
        model, msg = load_checkpoint(model, pretrained)
        assert len(msg.missing_keys) == 0
    return model


def blip_feature_extractor(pretrained="", **kwargs):
    model = BLIP_Base(**kwargs)
    if pretrained:
        model, msg = load_checkpoint(model, pretrained)
        assert len(msg.missing_keys) == 0
    return model


def init_tokenizer():
    tokenizer = BertTokenizer.from_pretrained("bert-base-uncased")
    tokenizer.add_special_tokens({"bos_token": "[DEC]"})
    tokenizer.add_special_tokens({"additional_special_tokens": ["[ENC]"]})
    tokenizer.enc_token_id = tokenizer.additional_special_tokens_ids[0]
    return tokenizer


def create_vit(vit, image_size, ckpt_layer=0, drop_path_rate=0):
    assert vit in ["base", "large"], "vit parameter must be base or large"
    if vit == "base":
        vision_width = 768
        visual_encoder = VisionTransformer(
            img_size=image_size,
            patch_size=16,
            embed_dim=vision_width,
            depth=12,
            num_heads=12,
            ckpt_layer=ckpt_layer,
            drop_path_rate=0 or drop_path_rate,
        )
    elif vit == "large":
        vision_width = 1024
        visual_encoder = VisionTransformer(
            img_size=image_size,
            patch_size=16,
            embed_dim=vision_width,
            depth=24,
            num_heads=16,
            ckpt_layer=ckpt_layer,
            drop_path_rate=0.1 or drop_path_rate,
        )
    return visual_encoder, vision_width


def is_url(url_or_filename):
    parsed = urlparse(url_or_filename)
    return parsed.scheme in ("http", "https")


def load_checkpoint(model, url_or_filename):
    if os.path.isfile(url_or_filename):
        checkpoint = torch.load(url_or_filename, map_location="cpu")
    else:
        raise RuntimeError("checkpoint url or path is invalid")

    state_dict = checkpoint["model"]

    state_dict["visual_encoder.pos_embed"] = interpolate_pos_embed(
        state_dict["visual_encoder.pos_embed"], model.visual_encoder
    )
    if "visual_encoder_m.pos_embed" in model.state_dict().keys():
        state_dict["visual_encoder_m.pos_embed"] = interpolate_pos_embed(
            state_dict["visual_encoder_m.pos_embed"], model.visual_encoder_m
        )
    for key in model.state_dict().keys():
        if key in state_dict.keys():
            if state_dict[key].shape != model.state_dict()[key].shape:
                del state_dict[key]

    msg = model.load_state_dict(state_dict, strict=False)
    print("load checkpoint from %s" % url_or_filename)
    return model, msg


================================================
FILE: service/image_captioning/api/im2txt/blip/med.py
================================================
"""* Copyright (c) 2022, salesforce.com, inc.
* All rights reserved.
* SPDX-License-Identifier: BSD-3-Clause
* For full license text, see LICENSE.txt file in the repo root or https://opensource.org/licenses/BSD-3-Clause
* By Junnan Li
* Based on huggingface code base
* https://github.com/huggingface/transformers/blob/v4.15.0/src/transformers/models/bert
"""

import math

import torch
import torch.utils.checkpoint
from torch import Tensor, device, nn
from torch.nn import CrossEntropyLoss
from transformers.activations import ACT2FN
from transformers.modeling_outputs import (
    BaseModelOutputWithPastAndCrossAttentions,
    BaseModelOutputWithPoolingAndCrossAttentions,
    CausalLMOutputWithCrossAttentions,
)
from transformers.modeling_utils import PreTrainedModel
try:  # Compatibility with transformers<4.37 where helpers lived in modeling_utils
    from transformers.modeling_utils import (
        find_pruneable_heads_and_indices,
        prune_linear_layer,
    )
except ImportError:  # pragma: no cover - fallback for transformers>=4.37
    from transformers.models.bert.modeling_bert import (
        find_pruneable_heads_and_indices,
        prune_linear_layer,
    )
try:  # Compatibility with transformers>=4.36 where apply_chunking_to_forward moved
    from transformers.modeling_utils import apply_chunking_to_forward
except ImportError:  # pragma: no cover - fallback for older/newer transformers versions
    from transformers.pytorch_utils import apply_chunking_to_forward
from transformers.models.bert.configuration_bert import BertConfig
from transformers.utils import logging

logger = logging.get_logger(__name__)


class BertEmbeddings(nn.Module):
    """Construct the embeddings from word and position embeddings."""

    def __init__(self, config):
        super().__init__()
        self.word_embeddings = nn.Embedding(
            config.vocab_size, config.hidden_size, padding_idx=config.pad_token_id
        )
        self.position_embeddings = nn.Embedding(
            config.max_position_embeddings, config.hidden_size
        )

        # self.LayerNorm is not snake-cased to stick with TensorFlow model variable name and be able to load
        # any TensorFlow checkpoint file
        self.LayerNorm = nn.LayerNorm(config.hidden_size, eps=config.layer_norm_eps)
        self.dropout = nn.Dropout(config.hidden_dropout_prob)

        # position_ids (1, len position emb) is contiguous in memory and exported when serialized
        self.register_buffer(
            "position_ids", torch.arange(config.max_position_embeddings).expand((1, -1))
        )
        self.position_embedding_type = getattr(
            config, "position_embedding_type", "absolute"
        )

        self.config = config

    def forward(
        self,
        input_ids=None,
        position_ids=None,
        inputs_embeds=None,
        past_key_values_length=0,
    ):
        if input_ids is not None:
            input_shape = input_ids.size()
        else:
            input_shape = inputs_embeds.size()[:-1]

        seq_length = input_shape[1]

        if position_ids is None:
            position_ids = self.position_ids[
                :, past_key_values_length : seq_length + past_key_values_length
            ]

        if inputs_embeds is None:
            inputs_embeds = self.word_embeddings(input_ids)

        embeddings = inputs_embeds

        if self.position_embedding_type == "absolute":
            position_embeddings = self.position_embeddings(position_ids)
            embeddings += position_embeddings
        embeddings = self.LayerNorm(embeddings)
        embeddings = self.dropout(embeddings)
        return embeddings


class BertSelfAttention(nn.Module):
    def __init__(self, config, is_cross_attention):
        super().__init__()
        self.config = config
        if config.hidden_size % config.num_attention_heads != 0 and not hasattr(
            config, "embedding_size"
        ):
            raise ValueError(
                "The hidden size (%d) is not a multiple of the number of attention "
                "heads (%d)" % (config.hidden_size, config.num_attention_heads)
            )

        self.num_attention_heads = config.num_attention_heads
        self.attention_head_size = int(config.hidden_size / config.num_attention_heads)
        self.all_head_size = self.num_attention_heads * self.attention_head_size

        self.query = nn.Linear(config.hidden_size, self.all_head_size)
        if is_cross_attention:
            self.key = nn.Linear(config.encoder_width, self.all_head_size)
            self.value = nn.Linear(config.encoder_width, self.all_head_size)
        else:
            self.key = nn.Linear(config.hidden_size, self.all_head_size)
            self.value = nn.Linear(config.hidden_size, self.all_head_size)

        self.dropout = nn.Dropout(config.attention_probs_dropout_prob)
        self.position_embedding_type = getattr(
            config, "position_embedding_type", "absolute"
        )
        if (
            self.position_embedding_type == "relative_key"
            or self.position_embedding_type == "relative_key_query"
        ):
            self.max_position_embeddings = config.max_position_embeddings
            self.distance_embedding = nn.Embedding(
                2 * config.max_position_embeddings - 1, self.attention_head_size
            )
        self.save_attention = False

    def save_attn_gradients(self, attn_gradients):
        self.attn_gradients = attn_gradients

    def get_attn_gradients(self):
        return self.attn_gradients

    def save_attention_map(self, attention_map):
        self.attention_map = attention_map

    def get_attention_map(self):
        return self.attention_map

    def transpose_for_scores(self, x):
        new_x_shape = x.size()[:-1] + (
            self.num_attention_heads,
            self.attention_head_size,
        )
        x = x.view(*new_x_shape)
        return x.permute(0, 2, 1, 3)

    def forward(
        self,
        hidden_states,
        attention_mask=None,
        head_mask=None,
        encoder_hidden_states=None,
        encoder_attention_mask=None,
        past_key_value=None,
        output_attentions=False,
    ):
        mixed_query_layer = self.query(hidden_states)

        # If this is instantiated as a cross-attention module, the keys
        # and values come from an encoder; the attention mask needs to be
        # such that the encoder's padding tokens are not attended to.
        is_cross_attention = encoder_hidden_states is not None

        if is_cross_attention:
            key_layer = self.transpose_for_scores(self.key(encoder_hidden_states))
            value_layer = self.transpose_for_scores(self.value(encoder_hidden_states))
            attention_mask = encoder_attention_mask
        elif past_key_value is not None:
            key_layer = self.transpose_for_scores(self.key(hidden_states))
            value_layer = self.transpose_for_scores(self.value(hidden_states))
            key_layer = torch.cat([past_key_value[0], key_layer], dim=2)
            value_layer = torch.cat([past_key_value[1], value_layer], dim=2)
        else:
            key_layer = self.transpose_for_scores(self.key(hidden_states))
            value_layer = self.transpose_for_scores(self.value(hidden_states))

        query_layer = self.transpose_for_scores(mixed_query_layer)

        past_key_value = (key_layer, value_layer)

        # Take the dot product between "query" and "key" to get the raw attention scores.
        attention_scores = torch.matmul(query_layer, key_layer.transpose(-1, -2))

        if (
            self.position_embedding_type == "relative_key"
            or self.position_embedding_type == "relative_key_query"
        ):
            seq_length = hidden_states.size()[1]
            position_ids_l = torch.arange(
                seq_length, dtype=torch.long, device=hidden_states.device
            ).view(-1, 1)
            position_ids_r = torch.arange(
                seq_length, dtype=torch.long, device=hidden_states.device
            ).view(1, -1)
            distance = position_ids_l - position_ids_r
            positional_embedding = self.distance_embedding(
                distance + self.max_position_embeddings - 1
            )
            positional_embedding = positional_embedding.to(
                dtype=query_layer.dtype
            )  # fp16 compatibility

            if self.position_embedding_type == "relative_key":
                relative_position_scores = torch.einsum(
                    "bhld,lrd->bhlr", query_layer, positional_embedding
                )
                attention_scores = attention_scores + relative_position_scores
            elif self.position_embedding_type == "relative_key_query":
                relative_position_scores_query = torch.einsum(
                    "bhld,lrd->bhlr", query_layer, positional_embedding
                )
                relative_position_scores_key = torch.einsum(
                    "bhrd,lrd->bhlr", key_layer, positional_embedding
                )
                attention_scores = (
                    attention_scores
                    + relative_position_scores_query
                    + relative_position_scores_key
                )

        attention_scores = attention_scores / math.sqrt(self.attention_head_size)
        if attention_mask is not None:
            # Apply the attention mask is (precomputed for all layers in BertModel forward() function)
            attention_scores = attention_scores + attention_mask

        # Normalize the attention scores to probabilities.
        attention_probs = nn.Softmax(dim=-1)(attention_scores)

        if is_cross_attention and self.save_attention:
            self.save_attention_map(attention_probs)
            attention_probs.register_hook(self.save_attn_gradients)

        # This is actually dropping out entire tokens to attend to, which might
        # seem a bit unusual, but is taken from the original Transformer paper.
        attention_probs_dropped = self.dropout(attention_probs)

        # Mask heads if we want to
        if head_mask is not None:
            attention_probs_dropped = attention_probs_dropped * head_mask

        context_layer = torch.matmul(attention_probs_dropped, value_layer)

        context_layer = context_layer.permute(0, 2, 1, 3).contiguous()
        new_context_layer_shape = context_layer.size()[:-2] + (self.all_head_size,)
        context_layer = context_layer.view(*new_context_layer_shape)

        outputs = (
            (context_layer, attention_probs) if output_attentions else (context_layer,)
        )

        outputs = outputs + (past_key_value,)
        return outputs


class BertSelfOutput(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.dense = nn.Linear(config.hidden_size, config.hidden_size)
        self.LayerNorm = nn.LayerNorm(config.hidden_size, eps=config.layer_norm_eps)
        self.dropout = nn.Dropout(config.hidden_dropout_prob)

    def forward(self, hidden_states, input_tensor):
        hidden_states = self.dense(hidden_states)
        hidden_states = self.dropout(hidden_states)
        hidden_states = self.LayerNorm(hidden_states + input_tensor)
        return hidden_states


class BertAttention(nn.Module):
    def __init__(self, config, is_cross_attention=False):
        super().__init__()
        self.self = BertSelfAttention(config, is_cross_attention)
        self.output = BertSelfOutput(config)
        self.pruned_heads = set()

    def prune_heads(self, heads):
        if len(heads) == 0:
            return
        heads, index = find_pruneable_heads_and_indices(
            heads,
            self.self.num_attention_heads,
            self.self.attention_head_size,
            self.pruned_heads,
        )

        # Prune linear layers
        self.self.query = prune_linear_layer(self.self.query, index)
        self.self.key = prune_linear_layer(self.self.key, index)
        self.self.value = prune_linear_layer(self.self.value, index)
        self.output.dense = prune_linear_layer(self.output.dense, index, dim=1)

        # Update hyper params and store pruned heads
        self.self.num_attention_heads = self.self.num_attention_heads - len(heads)
        self.self.all_head_size = (
            self.self.attention_head_size * self.self.num_attention_heads
        )
        self.pruned_heads = self.pruned_heads.union(heads)

    def forward(
        self,
        hidden_states,
        attention_mask=None,
        head_mask=None,
        encoder_hidden_states=None,
        encoder_attention_mask=None,
        past_key_value=None,
        output_attentions=False,
    ):
        self_outputs = self.self(
            hidden_states,
            attention_mask,
            head_mask,
            encoder_hidden_states,
            encoder_attention_mask,
            past_key_value,
            output_attentions,
        )
        attention_output = self.output(self_outputs[0], hidden_states)
        outputs = (attention_output,) + self_outputs[
            1:
        ]  # add attentions if we output them
        return outputs


class BertIntermediate(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.dense = nn.Linear(config.hidden_size, config.intermediate_size)
        if isinstance(config.hidden_act, str):
            self.intermediate_act_fn = ACT2FN[config.hidden_act]
        else:
            self.intermediate_act_fn = config.hidden_act

    def forward(self, hidden_states):
        hidden_states = self.dense(hidden_states)
        hidden_states = self.intermediate_act_fn(hidden_states)
        return hidden_states


class BertOutput(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.dense = nn.Linear(config.intermediate_size, config.hidden_size)
        self.LayerNorm = nn.LayerNorm(config.hidden_size, eps=config.layer_norm_eps)
        self.dropout = nn.Dropout(config.hidden_dropout_prob)

    def forward(self, hidden_states, input_tensor):
        hidden_states = self.dense(hidden_states)
        hidden_states = self.dropout(hidden_states)
        hidden_states = self.LayerNorm(hidden_states + input_tensor)
        return hidden_states


class BertLayer(nn.Module):
    def __init__(self, config, layer_num):
        super().__init__()
        self.config = config
        self.chunk_size_feed_forward = config.chunk_size_feed_forward
        self.seq_len_dim = 1
        self.attention = BertAttention(config)
        self.layer_num = layer_num
        if self.config.add_cross_attention:
            self.crossattention = BertAttention(
                config, is_cross_attention=self.config.add_cross_attention
            )
        self.intermediate = BertIntermediate(config)
        self.output = BertOutput(config)

    def forward(
        self,
        hidden_states,
        attention_mask=None,
        head_mask=None,
        encoder_hidden_states=None,
        encoder_attention_mask=None,
        past_key_value=None,
        output_attentions=False,
        mode=None,
    ):
        # decoder uni-directional self-attention cached key/values tuple is at positions 1,2
        self_attn_past_key_value = (
            past_key_value[:2] if past_key_value is not None else None
        )
        self_attention_outputs = self.attention(
            hidden_states,
            attention_mask,
            head_mask,
            output_attentions=output_attentions,
            past_key_value=self_attn_past_key_value,
        )
        attention_output = self_attention_outputs[0]

        outputs = self_attention_outputs[1:-1]
        present_key_value = self_attention_outputs[-1]

        if mode == "multimodal":
            assert encoder_hidden_states is not None, (
                "encoder_hidden_states must be given for cross-attention layers"
            )

            cross_attention_outputs = self.crossattention(
                attention_output,
                attention_mask,
                head_mask,
                encoder_hidden_states,
                encoder_attention_mask,
                output_attentions=output_attentions,
            )
            attention_output = cross_attention_outputs[0]
            outputs = (
                outputs + cross_attention_outputs[1:-1]
            )  # add cross attentions if we output attention weights
        layer_output = apply_chunking_to_forward(
            self.feed_forward_chunk,
            self.chunk_size_feed_forward,
            self.seq_len_dim,
            attention_output,
        )
        outputs = (layer_output,) + outputs

        outputs = outputs + (present_key_value,)

        return outputs

    def feed_forward_chunk(self, attention_output):
        intermediate_output = self.intermediate(attention_output)
        layer_output = self.output(intermediate_output, attention_output)
        return layer_output


class BertEncoder(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.config = config
        self.layer = nn.ModuleList(
            [BertLayer(config, i) for i in range(config.num_hidden_layers)]
        )
        self.gradient_checkpointing = False

    def forward(
        self,
        hidden_states,
        attention_mask=None,
        head_mask=None,
        encoder_hidden_states=None,
        encoder_attention_mask=None,
        past_key_values=None,
        use_cache=None,
        output_attentions=False,
        output_hidden_states=False,
        return_dict=True,
        mode="multimodal",
    ):
        all_hidden_states = () if output_hidden_states else None
        all_self_attentions = () if output_attentions else None
        all_cross_attentions = (
            () if output_attentions and self.config.add_cross_attention else None
        )

        next_decoder_cache = () if use_cache else None

        for i in range(self.config.num_hidden_layers):
            layer_module = self.layer[i]
            if output_hidden_states:
                all_hidden_states = all_hidden_states + (hidden_states,)

            layer_head_mask = head_mask[i] if head_mask is not None else None
            past_key_value = past_key_values[i] if past_key_values is not None else None

            if self.gradient_checkpointing and self.training:
                if use_cache:
                    logger.warning(
                        "`use_cache=True` is incompatible with gradient checkpointing. Setting `use_cache=False`..."
                    )
                    use_cache = False

                def create_custom_forward(module):
                    def custom_forward(*inputs):
                        return module(*inputs, past_key_value, output_attentions)

                    return custom_forward

                layer_outputs = torch.utils.checkpoint.checkpoint(
                    create_custom_forward(layer_module),
                    hidden_states,
                    attention_mask,
                    layer_head_mask,
                    encoder_hidden_states,
                    encoder_attention_mask,
                    mode=mode,
                )
            else:
                layer_outputs = layer_module(
                    hidden_states,
                    attention_mask,
                    layer_head_mask,
                    encoder_hidden_states,
                    encoder_attention_mask,
                    past_key_value,
                    output_attentions,
                    mode=mode,
                )

            hidden_states = layer_outputs[0]
            if use_cache:
                next_decoder_cache += (layer_outputs[-1],)
            if output_attentions:
                all_self_attentions = all_self_attentions + (layer_outputs[1],)

        if output_hidden_states:
            all_hidden_states = all_hidden_states + (hidden_states,)

        if not return_dict:
            return tuple(
                v
                for v in [
                    hidden_states,
                    next_decoder_cache,
                    all_hidden_states,
                    all_self_attentions,
                    all_cross_attentions,
                ]
                if v is not None
            )
        return BaseModelOutputWithPastAndCrossAttentions(
            last_hidden_state=hidden_states,
            past_key_values=next_decoder_cache,
            hidden_states=all_hidden_states,
            attentions=all_self_attentions,
            cross_attentions=all_cross_attentions,
        )


class BertPooler(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.dense = nn.Linear(config.hidden_size, config.hidden_size)
        self.activation = nn.Tanh()

    def forward(self, hidden_states):
        # We "pool" the model by simply taking the hidden state corresponding
        # to the first token.
        first_token_tensor = hidden_states[:, 0]
        pooled_output = self.dense(first_token_tensor)
        pooled_output = self.activation(pooled_output)
        return pooled_output


class BertPredictionHeadTransform(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.dense = nn.Linear(config.hidden_size, config.hidden_size)
        if isinstance(config.hidden_act, str):
            self.transform_act_fn = ACT2FN[config.hidden_act]
        else:
            self.transform_act_fn = config.hidden_act
        self.LayerNorm = nn.LayerNorm(config.hidden_size, eps=config.layer_norm_eps)

    def forward(self, hidden_states):
        hidden_states = self.dense(hidden_states)
        hidden_states = self.transform_act_fn(hidden_states)
        hidden_states = self.LayerNorm(hidden_states)
        return hidden_states


class BertLMPredictionHead(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.transform = BertPredictionHeadTransform(config)

        # The output weights are the same as the input embeddings, but there is
        # an output-only bias for each token.
        self.decoder = nn.Linear(config.hidden_size, config.vocab_size, bias=False)

        self.bias = nn.Parameter(torch.zeros(config.vocab_size))

        # Need a link between the two variables so that the bias is correctly resized with `resize_token_embeddings`
        self.decoder.bias = self.bias

    def forward(self, hidden_states):
        hidden_states = self.transform(hidden_states)
        hidden_states = self.decoder(hidden_states)
        return hidden_states


class BertOnlyMLMHead(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.predictions = BertLMPredictionHead(config)

    def forward(self, sequence_output):
        prediction_scores = self.predictions(sequence_output)
        return prediction_scores


class BertPreTrainedModel(PreTrainedModel):
    """An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
    models.
    """

    config_class = BertConfig
    base_model_prefix = "bert"
    _keys_to_ignore_on_load_missing = [r"position_ids"]

    def _init_weights(self, module):
        """Initialize the weights"""
        if isinstance(module, (nn.Linear, nn.Embedding)):
            # Slightly different from the TF version which uses truncated_normal for initialization
            # cf https://github.com/pytorch/pytorch/pull/5617
            module.weight.data.normal_(mean=0.0, std=self.config.initializer_range)
        elif isinstance(module, nn.LayerNorm):
            module.bias.data.zero_()
            module.weight.data.fill_(1.0)
        if isinstance(module, nn.Linear) and module.bias is not None:
            module.bias.data.zero_()


class BertModel(BertPreTrainedModel):
    """The model can behave as an encoder (with only self-attention) as well as a decoder, in which case a layer of
    cross-attention is added between the self-attention layers, following the architecture described in `Attention is
    all you need <https://arxiv.org/abs/1706.03762>`__ by Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit,
    Llion Jones, Aidan N. Gomez, Lukasz Kaiser and Illia Polosukhin.
    argument and :obj:`add_cross_attention` set to :obj:`True`; an :obj:`encoder_hidden_states` is then expected as an
    input to the forward pass.
    """

    def __init__(self, config, add_pooling_layer=True):
        super().__init__(config)
        self.config = config

        self.embeddings = BertEmbeddings(config)

        self.encoder = BertEncoder(config)

        self.pooler = BertPooler(config) if add_pooling_layer else None

        self.init_weights()

    def get_input_embeddings(self):
        return self.embeddings.word_embeddings

    def set_input_embeddings(self, value):
        self.embeddings.word_embeddings = value

    def _prune_heads(self, heads_to_prune):
        """Prunes heads of the model. heads_to_prune: dict of {layer_num: list of heads to prune in this layer} See base
        class PreTrainedModel
        """
        for layer, heads in heads_to_prune.items():
            self.encoder.layer[layer].attention.prune_heads(heads)

    def get_extended_attention_mask(
        self,
        attention_mask: Tensor,
        input_shape: tuple[int],
        device: device,
        is_decoder: bool,
    ) -> Tensor:
        """Makes broadcastable attention and causal masks so that future and masked tokens are ignored.

        Arguments:
            attention_mask (:obj:`torch.Tensor`):
                Mask with ones indicating tokens to attend to, zeros for tokens to ignore.
            input_shape (:obj:`Tuple[int]`):
                The shape of the input to the model.
            device: (:obj:`torch.device`):
                The device of the input to the model.

        Returns:
            :obj:`torch.Tensor` The extended attention mask, with a the same dtype as :obj:`attention_mask.dtype`.

        """
        # We can provide a self-attention mask of dimensions [batch_size, from_seq_length, to_seq_length]
        # ourselves in which case we just need to make it broadcastable to all heads.
        if attention_mask.dim() == 3:
            extended_attention_mask = attention_mask[:, None, :, :]
        elif attention_mask.dim() == 2:
            # Provided a padding mask of dimensions [batch_size, seq_length]
            # - if the model is a decoder, apply a causal mask in addition to the padding mask
            # - if the model is an encoder, make the mask broadcastable to [batch_size, num_heads, seq_length, seq_length]
            if is_decoder:
                batch_size, seq_length = input_shape

                seq_ids = torch.arange(seq_length, device=device)
                causal_mask = (
                    seq_ids[None, None, :].repeat(batch_size, seq_length, 1)
                    <= seq_ids[None, :, None]
                )
                # in case past_key_values are used we need to add a prefix ones mask to the causal mask
                # causal and attention masks must have same type with pytorch version < 1.3
                causal_mask = causal_mask.to(attention_mask.dtype)

                if causal_mask.shape[1] < attention_mask.shape[1]:
                    prefix_seq_len = attention_mask.shape[1] - causal_mask.shape[1]
                    causal_mask = torch.cat(
                        [
                            torch.ones(
                                (batch_size, seq_length, prefix_seq_len),
                                device=device,
                                dtype=causal_mask.dtype,
                            ),
                            causal_mask,
                        ],
                        axis=-1,
                    )

                extended_attention_mask = (
                    causal_mask[:, None, :, :] * attention_mask[:, None, None, :]
                )
            else:
                extended_attention_mask = attention_mask[:, None, None, :]
        else:
            raise ValueError(
                f"Wrong shape for input_ids (shape {input_shape}) or attention_mask (shape {attention_mask.shape})"
            )

        # Since attention_mask is 1.0 for positions we want to attend and 0.0 for
        # masked positions, this operation will create a tensor which is 0.0 for
        # positions we want to attend and -10000.0 for masked positions.
        # Since we are adding it to the raw scores before the softmax, this is
        # effectively the same as removing these entirely.
        extended_attention_mask = extended_attention_mask.to(
            dtype=self.dtype
        )  # fp16 compatibility
        extended_attention_mask = (1.0 - extended_attention_mask) * -10000.0
        return extended_attention_mask

    def forward(
        self,
        input_ids=None,
        attention_mask=None,
        position_ids=None,
        head_mask=None,
        inputs_embeds=None,
        encoder_embeds=None,
        encoder_hidden_states=None,
        encoder_attention_mask=None,
        past_key_values=None,
        use_cache=None,
        output_attentions=None,
        output_hidden_states=None,
        return_dict=None,
        is_decoder=False,
        mode="multimodal",
    ):
        r"""encoder_hidden_states  (:obj:`torch.FloatTensor` of shape :obj:`(batch_size, sequence_length, hidden_size)`, `optional`):
            Sequence of hidden-states at the output of the last layer of the encoder. Used in the cross-attention if
            the model is configured as a decoder.
        encoder_attention_mask (:obj:`torch.FloatTensor` of shape :obj:`(batch_size, sequence_length)`, `optional`):
            Mask to avoid performing attention on the padding token indices of the encoder input. This mask is used in
            the cross-attention if the model is configured as a decoder. Mask values selected in ``[0, 1]``:
            - 1 for tokens that are **not masked**,
            - 0 for tokens that are **masked**.
        past_key_values (:obj:`tuple(tuple(torch.FloatTensor))` of length :obj:`config.n_layers` with each tuple having 4 tensors of shape :obj:`(batch_size, num_heads, sequence_length - 1, embed_size_per_head)`):
            Contains precomputed key and value hidden states of the attention blocks. Can be used to speed up decoding.
            If :obj:`past_key_values` are used, the user can optionally input only the last :obj:`decoder_input_ids`
            (those that don't have their past key value states given to this model) of shape :obj:`(batch_size, 1)`
            instead of all :obj:`decoder_input_ids` of shape :obj:`(batch_size, sequence_length)`.
        use_cache (:obj:`bool`, `optional`):
            If set to :obj:`True`, :obj:`past_key_values` key value states are returned and can be used to speed up
            decoding (see :obj:`past_key_values`).
        """
        output_attentions = (
            output_attentions
            if output_attentions is not None
            else self.config.output_attentions
        )
        output_hidden_states = (
            output_hidden_states
            if output_hidden_states is not None
            else self.config.output_hidden_states
        )
        return_dict = (
            return_dict if return_dict is not None else self.config.use_return_dict
        )

        if is_decoder:
            use_cache = use_cache if use_cache is not None else self.config.use_cache
        else:
            use_cache = False

        if input_ids is not None and inputs_embeds is not None:
            raise ValueError(
                "You cannot specify both input_ids and inputs_embeds at the same time"
            )
        elif input_ids is not None:
            input_shape = input_ids.size()
            batch_size, seq_length = input_shape
            device = input_ids.device
        elif inputs_embeds is not None:
            input_shape = inputs_embeds.size()[:-1]
            batch_size, seq_length = input_shape
            device = inputs_embeds.device
        elif encoder_embeds is not None:
            input_shape = encoder_embeds.size()[:-1]
            batch_size, seq_length = input_shape
            device = encoder_embeds.device
        else:
            raise ValueError(
                "You have to specify either input_ids or inputs_embeds or encoder_embeds"
            )

        # past_key_values_length
        past_key_values_length = (
            past_key_values[0][0].shape[2] if past_key_values is not None else 0
        )

        if attention_mask is None:
            attention_mask = torch.ones(
                ((batch_size, seq_length + past_key_values_length)), device=device
            )

        # We can provide a self-attention mask of dimensions [batch_size, from_seq_length, to_seq_length]
        # ourselves in which case we just need to make it broadcastable to all heads.
        extended_attention_mask: torch.Tensor = self.get_extended_attention_mask(
            attention_mask, input_shape, device, is_decoder
        )

        # If a 2D or 3D attention mask is provided for the cross-attention
        # we need to make broadcastable to [batch_size, num_heads, seq_length, seq_length]
        if encoder_hidden_states is not None:
            if type(encoder_hidden_states) == list:
                encoder_batch_size, encoder_sequence_length, _ = encoder_hidden_states[
                    0
                ].size()
            else:
                (
                    encoder_batch_size,
                    encoder_sequence_length,
                    _,
                ) = encoder_hidden_states.size()
            encoder_hidden_shape = (encoder_batch_size, encoder_sequence_length)

            if type(encoder_attention_mask) == list:
                encoder_extended_attention_mask = [
                    self.invert_attention_mask(mask) for mask in encoder_attention_mask
                ]
            elif encoder_attention_mask is None:
                encoder_attention_mask = torch.ones(encoder_hidden_shape, device=device)
                encoder_extended_attention_mask = self.invert_attention_mask(
                    encoder_attention_mask
                )
            else:
                encoder_extended_attention_mask = self.invert_attention_mask(
                    encoder_attention_mask
                )
        else:
            encoder_extended_attention_mask = None

        # Prepare head mask if needed
        # 1.0 in head_mask indicate we keep the head
        # attention_probs has shape bsz x n_heads x N x N
        # input head_mask has shape [num_heads] or [num_hidden_layers x num_heads]
        # and head_mask is converted to shape [num_hidden_layers x batch x num_heads x seq_length x seq_length]
        head_mask = self.get_head_mask(head_mask, self.config.num_hidden_layers)

        if encoder_embeds is None:
            embedding_output = self.embeddings(
                input_ids=input_ids,
                position_ids=position_ids,
                inputs_embeds=inputs_embeds,
                past_key_values_length=past_key_values_length,
            )
        else:
            embedding_output = encoder_embeds

        encoder_outputs = self.encoder(
            embedding_output,
            attention_mask=extended_attention_mask,
            head_mask=head_mask,
            encoder_hidden_states=encoder_hidden_states,
            encoder_attention_mask=encoder_extended_attention_mask,
            past_key_values=past_key_values,
            use_cache=use_cache,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=return_dict,
            mode=mode,
        )
        sequence_output = encoder_outputs[0]
        pooled_output = (
            self.pooler(sequence_output) if self.pooler is not None else None
        )

        if not return_dict:
            return (sequence_output, pooled_output) + encoder_outputs[1:]

        return BaseModelOutputWithPoolingAndCrossAttentions(
            last_hidden_state=sequence_output,
            pooler_output=pooled_output,
            past_key_values=encoder_outputs.past_key_values,
            hidden_states=encoder_outputs.hidden_states,
            attentions=encoder_outputs.attentions,
            cross_attentions=encoder_outputs.cross_attentions,
        )


class BertLMHeadModel(BertPreTrainedModel):
    _keys_to_ignore_on_load_unexpected = [r"pooler"]
    _keys_to_ignore_on_load_missing = [r"position_ids", r"predictions.decoder.bias"]

    def __init__(self, config):
        super().__init__(config)

        self.bert = BertModel(config, add_pooling_layer=False)
        self.cls = BertOnlyMLMHead(config)

        self.init_weights()

    def get_output_embeddings(self):
        return self.cls.predictions.decoder

    def set_output_embeddings(self, new_embeddings):
        self.cls.predictions.decoder = new_embeddings

    def forward(
        self,
        input_ids=None,
        attention_mask=None,
        position_ids=None,
        head_mask=None,
        inputs_embeds=None,
        encoder_hidden_states=None,
        encoder_attention_mask=None,
        labels=None,
        past_key_values=None,
        use_cache=None,
        output_attentions=None,
        output_hidden_states=None,
        return_dict=None,
        return_logits=False,
        is_decoder=True,
        reduction="mean",
        mode="multimodal",
    ):
        r"""encoder_hidden_states  (:obj:`torch.FloatTensor` of shape :obj:`(batch_size, sequence_length, hidden_size)`, `optional`):
            Sequence of hidden-states at the output of the last layer of the encoder. Used in the cross-attention if
            the model is configured as a decoder.
        encoder_attention_mask (:obj:`torch.FloatTensor` of shape :obj:`(batch_size, sequence_length)`, `optional`):
            Mask to avoid performing attention on the padding token indices of the encoder input. This mask is used in
            the cross-attention if the model is configured as a decoder. Mask values selected in ``[0, 1]``:
            - 1 for tokens that are **not masked**,
            - 0 for tokens that are **masked**.
        labels (:obj:`torch.LongTensor` of shape :obj:`(batch_size, sequence_length)`, `optional`):
            Labels for computing the left-to-right language modeling loss (next word prediction). Indices should be in
            ``[-100, 0, ..., config.vocab_size]`` (see ``input_ids`` docstring) Tokens with indices set to ``-100`` are
            ignored (masked), the loss is only computed for the tokens with labels n ``[0, ..., config.vocab_size]``
        past_key_values (:obj:`tuple(tuple(torch.FloatTensor))` of length :obj:`config.n_layers` with each tuple having 4 tensors of shape :obj:`(batch_size, num_heads, sequence_length - 1, embed_size_per_head)`):
            Contains precomputed key and value hidden states of the attention blocks. Can be used to speed up decoding.
            If :obj:`past_key_values` are used, the user can optionally input only the last :obj:`decoder_input_ids`
            (those that don't have their past key value states given to this model) of shape :obj:`(batch_size, 1)`
            instead of all :obj:`decoder_input_ids` of shape :obj:`(batch_size, sequence_length)`.
        use_cache (:obj:`bool`, `optional`):
            If set to :obj:`True`, :obj:`past_key_values` key value states are returned and can be used to speed up
            decoding (see :obj:`past_key_values`).

        Returns:
        Example::
            >>> from transformers import BertTokenizer, BertLMHeadModel, BertConfig
            >>> import torch
            >>> tokenizer = BertTokenizer.from_pretrained('bert-base-cased')
            >>> config = BertConfig.from_pretrained("bert-base-cased")
            >>> model = BertLMHeadModel.from_pretrained('bert-base-cased', config=config)
            >>> inputs = tokenizer("Hello, my dog is cute", return_tensors="pt")
            >>> outputs = model(**inputs)
            >>> prediction_logits = outputs.logits

        """
        return_dict = (
            return_dict if return_dict is not None else self.config.use_return_dict
        )
        if labels is not None:
            use_cache = False

        outputs = self.bert(
            input_ids,
            attention_mask=attention_mask,
            position_ids=position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            encoder_hidden_states=encoder_hidden_states,
            encoder_attention_mask=encoder_attention_mask,
            past_key_values=past_key_values,
            use_cache=use_cache,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=return_dict,
            is_decoder=is_decoder,
            mode=mode,
        )

        sequence_output = outputs[0]
        prediction_scores = self.cls(sequence_output)

        if return_logits:
            return prediction_scores[:, :-1, :].contiguous()

        lm_loss = None
        if labels is not None:
            # we are doing next-token prediction; shift prediction scores and input ids by one
            shifted_prediction_scores = prediction_scores[:, :-1, :].contiguous()
            labels = labels[:, 1:].contiguous()
            loss_fct = CrossEntropyLoss(reduction=reduction, label_smoothing=0.1)
            lm_loss = loss_fct(
                shifted_prediction_scores.view(-1, self.config.vocab_size),
                labels.view(-1),
            )
            if reduction == "none":
                lm_loss = lm_loss.view(prediction_scores.size(0), -1).sum(1)

        if not return_dict:
            output = (prediction_scores,) + outputs[2:]
            return ((lm_loss,) + output) if lm_loss is not None else output

        return CausalLMOutputWithCrossAttentions(
            loss=lm_loss,
            logits=prediction_scores,
            past_key_values=outputs.past_key_values,
            hidden_states=outputs.hidden_states,
            attentions=outputs.attentions,
            cross_attentions=outputs.cross_attentions,
        )

    def prepare_inputs_for_generation(
        self, input_ids, past=None, attention_mask=None, **model_kwargs
    ):
        input_shape = input_ids.shape
        # if model is used as a decoder in encoder-decoder model, the decoder attention mask is created on the fly
        if attention_mask is None:
            attention_mask = input_ids.new_ones(input_shape)

        # cut decoder_input_ids if past is used
        if past is not None:
            input_ids = input_ids[:, -1:]

        return {
            "input_ids": input_ids,
            "attention_mask": attention_mask,
            "past_key_values": past,
            "encoder_hidden_states": model_kwargs.get("encoder_hidden_states", None),
            "encoder_attention_mask": model_kwargs.get("encoder_attention_mask", None),
            "is_decoder": True,
        }

    def _reorder_cache(self, past, beam_idx):
        reordered_past = ()
        for layer_past in past:
            reordered_past += (
                tuple(
                    past_state.index_select(0, beam_idx) for past_state in layer_past
                ),
            )
        return reordered_past


================================================
FILE: service/image_captioning/api/im2txt/blip/vit.py
================================================
"""* Copyright (c) 2022, salesforce.com, inc.
* All rights reserved.
* SPDX-License-Identifier: BSD-3-Clause
* For full license text, see LICENSE.txt file in the repo root or https://opensource.org/licenses/BSD-3-Clause
* By Junnan Li
* Based on timm code base
* https://github.com/rwightman/pytorch-image-models/tree/master/timm
"""

from functools import partial

import torch
from timm.models.helpers import adapt_input_conv
from timm.models.layers import DropPath, trunc_normal_
from timm.models.vision_transformer import PatchEmbed, resize_pos_embed
from torch import nn


class Mlp(nn.Module):
    """MLP as used in Vision Transformer, MLP-Mixer and related networks"""

    def __init__(
        self,
        in_features,
        hidden_features=None,
        out_features=None,
        act_layer=nn.GELU,
        drop=0.0,
    ):
        super().__init__()
        out_features = out_features or in_features
        hidden_features = hidden_features or in_features
        self.fc1 = nn.Linear(in_features, hidden_features)
        self.act = act_layer()
        self.fc2 = nn.Linear(hidden_features, out_features)
        self.drop = nn.Dropout(drop)

    def forward(self, x):
        x = self.fc1(x)
        x = self.act(x)
        x = self.drop(x)
        x = self.fc2(x)
        x = self.drop(x)
        return x


class Attention(nn.Module):
    def __init__(
        self,
        dim,
        num_heads=8,
        qkv_bias=False,
        qk_scale=None,
        attn_drop=0.0,
        proj_drop=0.0,
    ):
        super().__init__()
        self.num_heads = num_heads
        head_dim = dim // num_heads
        # NOTE scale factor was wrong in my original version, can set manually to be compat with prev weights
        self.scale = qk_scale or head_dim**-0.5
        self.qkv = nn.Linear(dim, dim * 3, bias=qkv_bias)
        self.attn_drop = nn.Dropout(attn_drop)
        self.proj = nn.Linear(dim, dim)
        self.proj_drop = nn.Dropout(proj_drop)
        self.attn_gradients = None
        self.attention_map = None

    def save_attn_gradients(self, attn_gradients):
        self.attn_gradients = attn_gradients

    def get_attn_gradients(self):
        return self.attn_gradients

    def save_attention_map(self, attention_map):
        self.attention_map = attention_map

    def get_attention_map(self):
        return self.attention_map

    def forward(self, x, register_hook=False):
        B, N, C = x.shape
        qkv = (
            self.qkv(x)
            .reshape(B, N, 3, self.num_heads, C // self.num_heads)
            .permute(2, 0, 3, 1, 4)
        )
        q, k, v = (
            qkv[0],
            qkv[1],
            qkv[2],
        )  # make torchscript happy (cannot use tensor as tuple)

        attn = (q @ k.transpose(-2, -1)) * self.scale
        attn = attn.softmax(dim=-1)
        attn = self.attn_drop(attn)

        if register_hook:
            self.save_attention_map(attn)
            attn.register_hook(self.save_attn_gradients)

        x = (attn @ v).transpose(1, 2).reshape(B, N, C)
        x = self.proj(x)
        x = self.proj_drop(x)
        return x


class Block(nn.Module):
    def __init__(
        self,
        dim,
        num_heads,
        mlp_ratio=4.0,
        qkv_bias=False,
        qk_scale=None,
        drop=0.0,
        attn_drop=0.0,
        drop_path=0.0,
        act_layer=nn.GELU,
        norm_layer=nn.LayerNorm,
    ):
        super().__init__()
        self.norm1 = norm_layer(dim)
        self.attn = Attention(
            dim,
            num_heads=num_heads,
            qkv_bias=qkv_bias,
            qk_scale=qk_scale,
            attn_drop=attn_drop,
            proj_drop=drop,
        )
        # NOTE: drop path for stochastic depth, we shall see if this is better than dropout here
        self.drop_path = DropPath(drop_path) if drop_path > 0.0 else nn.Identity()
        self.norm2 = norm_layer(dim)
        mlp_hidden_dim = int(dim * mlp_ratio)
        self.mlp = Mlp(
            in_features=dim,
            hidden_features=mlp_hidden_dim,
            act_layer=act_layer,
            drop=drop,
        )

    def forward(self, x, register_hook=False):
        x = x + self.drop_path(self.attn(self.norm1(x), register_hook=register_hook))
        x = x + self.drop_path(self.mlp(self.norm2(x)))
        return x


class VisionTransformer(nn.Module):
    """Vision Transformer
    A PyTorch impl of : `An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale`  -
        https://arxiv.org/abs/2010.11929
    """

    def __init__(
        self,
        img_size=224,
        patch_size=16,
        in_chans=3,
        num_classes=1000,
        embed_dim=768,
        depth=12,
        num_heads=12,
        mlp_ratio=4.0,
        qkv_bias=True,
        qk_scale=None,
        representation_size=None,
        drop_rate=0.0,
        attn_drop_rate=0.0,
        drop_path_rate=0.0,
        norm_layer=None,
        ckpt_layer=0,
    ):
        """Args:
        img_size (int, tuple): input image size
        patch_size (int, tuple): patch size
        in_chans (int): number of input channels
        num_classes (int): number of classes for classification head
        embed_dim (int): embedding dimension
        depth (int): depth of transformer
        num_heads (int): number of attention heads
        mlp_ratio (int): ratio of mlp hidden dim to embedding dim
        qkv_bias (bool): enable bias for qkv if True
        qk_scale (float): override default qk scale of head_dim ** -0.5 if set
        representation_size (Optional[int]): enable and set representation layer (pre-logits) to this value if set
        drop_rate (float): dropout rate
        attn_drop_rate (float): attention dropout rate
        drop_path_rate (float): stochastic depth rate
        norm_layer: (nn.Module): normalization layer

        """
        super().__init__()
        self.num_features = self.embed_dim = (
            embed_dim  # num_features for consistency with other models
        )
        norm_layer = norm_layer or partial(nn.LayerNorm, eps=1e-6)

        self.patch_embed = PatchEmbed(
            img_size=img_size,
            patch_size=patch_size,
            in_chans=in_chans,
            embed_dim=embed_dim,
        )

        num_patches = self.patch_embed.num_patches

        self.cls_token = nn.Parameter(torch.zeros(1, 1, embed_dim))
        self.pos_embed = nn.Parameter(torch.zeros(1, num_patches + 1, embed_dim))
        self.pos_drop = nn.Dropout(p=drop_rate)

        dpr = [
            x.item() for x in torch.linspace(0, drop_path_rate, depth)
        ]  # stochastic depth decay rule
        self.blocks = nn.ModuleList(
            [
                Block(
                    dim=embed_dim,
                    num_heads=num_heads,
                    mlp_ratio=mlp_ratio,
                    qkv_bias=qkv_bias,
                    qk_scale=qk_scale,
                    drop=drop_rate,
                    attn_drop=attn_drop_rate,
                    drop_path=dpr[i],
                    norm_layer=norm_layer,
                )
                for i in range(depth)
            ]
        )
        self.norm = norm_layer(embed_dim)

        trunc_normal_(self.pos_embed, std=0.02)
        trunc_normal_(self.cls_token, std=0.02)
        self.apply(self._init_weights)

    def _init_weights(self, m):
        if isinstance(m, nn.Linear):
            trunc_normal_(m.weight, std=0.02)
            if isinstance(m, nn.Linear) and m.bias is not None:
                nn.init.constant_(m.bias, 0)
        elif isinstance(m, nn.LayerNorm):
            nn.init.constant_(m.bias, 0)
            nn.init.constant_(m.weight, 1.0)

    @torch.jit.ignore
    def no_weight_decay(self):
        return {"pos_embed", "cls_token"}

    def forward(self, x, register_blk=-1):
        B = x.shape[0]
        x = self.patch_embed(x)

        cls_tokens = self.cls_token.expand(
            B, -1, -1
        )  # stole cls_tokens impl from Phil Wang, thanks
        x = torch.cat((cls_tokens, x), dim=1)

        x = x + self.pos_embed[:, : x.size(1), :]
        x = self.pos_drop(x)

        for i, blk in enumerate(self.blocks):
            x = blk(x, register_blk == i)
        x = self.norm(x)

        return x

    @torch.jit.ignore()
    def load_pretrained(self, checkpoint_path, prefix=""):
        _load_weights(self, checkpoint_path, prefix)


@torch.no_grad()
def _load_weights(model: VisionTransformer, checkpoint_path: str, prefix: str = ""):
    """Load weights from .npz checkpoints for official Google Brain Flax implementation"""
    import numpy as np

    def _n2p(w, t=True):
        if w.ndim == 4 and w.shape[0] == w.shape[1] == w.shape[2] == 1:
            w = w.flatten()
        if t:
            if w.ndim == 4:
                w = w.transpose([3, 2, 0, 1])
            elif w.ndim == 3:
                w = w.transpose([2, 0, 1])
            elif w.ndim == 2:
                w = w.transpose([1, 0])
        return torch.from_numpy(w)

    w = np.load(checkpoint_path)
    if not prefix and "opt/target/embedding/kernel" in w:
        prefix = "opt/target/"

    if hasattr(model.patch_embed, "backbone"):
        # hybrid
        backbone = model.patch_embed.backbone
        stem_only = not hasattr(backbone, "stem")
        stem = backbone if stem_only else backbone.stem
        stem.conv.weight.copy_(
            adapt_input_conv(
                stem.conv.weight.shape[1], _n2p(w[f"{prefix}conv_root/kernel"])
            )
        )
        stem.norm.weight.copy_(_n2p(w[f"{prefix}gn_root/scale"]))
        stem.norm.bias.copy_(_n2p(w[f"{prefix}gn_root/bias"]))
        if not stem_only:
            for i, stage in enumerate(backbone.stages):
                for j, block in enumerate(stage.blocks):
                    bp = f"{prefix}block{i + 1}/unit{j + 1}/"
                    for r in range(3):
                        getattr(block, f"conv{r + 1}").weight.copy_(
                            _n2p(w[f"{bp}conv{r + 1}/kernel"])
                        )
                        getattr(block, f"norm{r + 1}").weight.copy_(
                            _n2p(w[f"{bp}gn{r + 1}/scale"])
                        )
                        getattr(block, f"norm{r + 1}").bias.copy_(
                            _n2p(w[f"{bp}gn{r + 1}/bias"])
                        )
                    if block.downsample is not None:
                        block.downsample.conv.weight.copy_(
                            _n2p(w[f"{bp}conv_proj/kernel"])
                        )
                        block.downsample.norm.weight.copy_(
                            _n2p(w[f"{bp}gn_proj/scale"])
                        )
                        block.downsample.norm.bias.copy_(_n2p(w[f"{bp}gn_proj/bias"]))
        embed_conv_w = _n2p(w[f"{prefix}embedding/kernel"])
    else:
        embed_conv_w = adapt_input_conv(
            model.patch_embed.proj.weight.shape[1], _n2p(w[f"{prefix}embedding/kernel"])
        )
    model.patch_embed.proj.weight.copy_(embed_conv_w)
    model.patch_embed.proj.bias.copy_(_n2p(w[f"{prefix}embedding/bias"]))
    model.cls_token.copy_(_n2p(w[f"{prefix}cls"], t=False))
    pos_embed_w = _n2p(w[f"{prefix}Transformer/posembed_input/pos_embedding"], t=False)
    if pos_embed_w.shape != model.pos_embed.shape:
        pos_embed_w = resize_pos_embed(  # resize pos embedding when different size from pretrained weights
            pos_embed_w,
            model.pos_embed,
            getattr(model, "num_tokens", 1),
            model.patch_embed.grid_size,
        )
    model.pos_embed.copy_(pos_embed_w)
    model.norm.weight.copy_(_n2p(w[f"{prefix}Transformer/encoder_norm/scale"]))
    model.norm.bias.copy_(_n2p(w[f"{prefix}Transformer/encoder_norm/bias"]))
    for i, block in enumerate(model.blocks.children()):
        block_prefix = f"{prefix}Transformer/encoderblock_{i}/"
        mha_prefix = block_prefix + "MultiHeadDotProductAttention_1/"
        block.norm1.weight.copy_(_n2p(w[f"{block_prefix}LayerNorm_0/scale"]))
        block.norm1.bias.copy_(_n2p(w[f"{block_prefix}LayerNorm_0/bias"]))
        block.attn.qkv.weight.copy_(
            torch.cat(
                [
                    _n2p(w[f"{mha_prefix}{n}/kernel"], t=False).flatten(1).T
                    for n in ("query", "key", "value")
                ]
            )
        )
        block.attn.qkv.bias.copy_(
            torch.cat(
                [
                    _n2p(w[f"{mha_prefix}{n}/bias"], t=False).reshape(-1)
                    for n in ("query", "key", "value")
                ]
            )
        )
        block.attn.proj.weight.copy_(_n2p(w[f"{mha_prefix}out/kernel"]).flatten(1))
        block.attn.proj.bias.copy_(_n2p(w[f"{mha_prefix}out/bias"]))
        for r in range(2):
            getattr(block.mlp, f"fc{r + 1}").weight.copy_(
                _n2p(w[f"{block_prefix}MlpBlock_3/Dense_{r}/kernel"])
            )
            getattr(block.mlp, f"fc{r + 1}").bias.copy_(
                _n2p(w[f"{block_prefix}MlpBlock_3/Dense_{r}/bias"])
            )
        block.norm2.weight.copy_(_n2p(w[f"{block_prefix}LayerNorm_2/scale"]))
        block.norm2.bias.copy_(_n2p(w[f"{block_prefix}LayerNorm_2/bias"]))


def interpolate_pos_embed(pos_embed_checkpoint, visual_encoder):
    # interpolate position embedding
    embedding_size = pos_embed_checkpoint.shape[-1]
    num_patches = visual_encoder.patch_embed.num_patches
    num_extra_tokens = visual_encoder.pos_embed.shape[-2] - num_patches
    # height (== width) for the checkpoint position embedding
    orig_size = int((pos_embed_checkpoint.shape[-2] - num_extra_tokens) ** 0.5)
    # height (== width) for the new position embedding
    new_size = int(num_patches**0.5)

    if orig_size != new_size:
        # class_token and dist_token are kept unchanged
        extra_tokens = pos_embed_checkpoint[:, :num_extra_tokens]
        # only the position tokens are interpolated
        pos_tokens = pos_embed_checkpoint[:, num_extra_tokens:]
        pos_tokens = pos_tokens.reshape(
            -1, orig_size, orig_size, embedding_size
        ).permute(0, 3, 1, 2)
        pos_tokens = torch.nn.functional.interpolate(
            pos_tokens, size=(new_size, new_size), mode="bicubic", align_corners=False
        )
        pos_tokens = pos_tokens.permute(0, 2, 3, 1).flatten(1, 2)
        new_pos_embed = torch.cat((extra_tokens, pos_tokens), dim=1)
        print("reshape position embedding from %d to %d" % (orig_size**2, new_size**2))

        return new_pos_embed
    else:
        return pos_embed_checkpoint


================================================
FILE: service/image_captioning/api/im2txt/build_vocab.py
================================================
import pickle
from collections import Counter

from tqdm import tqdm

caption_path = "api/im2txt/data/annotations/captions_train2014.json"
vocab_path = "api/im2txt/data/vocab.pkl"
threshold = 4


class Vocabulary:
    """Simple vocabulary wrapper."""

    def __init__(self):
        self.word2idx = {}
        self.idx2word = {}
        self.idx = 0

    def add_word(self, word):
        if word not in self.word2idx:
            self.word2idx[word] = self.idx
            self.idx2word[self.idx] = word
            self.idx += 1

    def __call__(self, word):
        if word not in self.word2idx:
            return self.word2idx["<unk>"]
        return self.word2idx[word]

    def __len__(self):
        return len(self.word2idx)


def build_vocab(json, threshold):
    import nltk
    from pycocotools.coco import COCO

    """Build a simple vocabulary wrapper."""
    coco = COCO(json)
    counter = Counter()
    ids = coco.anns.keys()
    for i, id in tqdm(enumerate(ids)):
        caption = str(coco.anns[id]["caption"])
        tokens = nltk.tokenize.word_tokenize(caption.lower())
        counter.update(tokens)

    #         if (i+1) % 1000 == 0:
    #             print("[{}/{}] Tokenized the captions.".format(i+1, len(ids)))

    # If the word frequency is less than 'threshold', then the word is discarded.
    words = [word for word, cnt in counter.items() if cnt >= threshold]

    # Create a vocab wrapper and add some special tokens.
    vocab = Vocabulary()
    vocab.add_word("<pad>")
    vocab.add_word("<start>")
    vocab.add_word("<end>")
    vocab.add_word("<unk>")

    # Add the words to the vocabulary.
    for i, word in enumerate(words):
        vocab.add_word(word)
    return vocab


def main():
    vocab = build_vocab(json=caption_path, threshold=threshold)
    with open(vocab_path, "wb") as f:
        pickle.dump(vocab, f)
    print(f"Total vocabulary size: {len(vocab)}")
    print(f"Saved the vocabulary wrapper to '{vocab_path}'")


================================================
FILE: service/image_captioning/api/im2txt/data_loader.py
================================================
import os

import torch
from PIL import Image
from torch.utils import data


class CocoDataset(data.Dataset):
    """COCO Custom Dataset compatible with torch.utils.data.DataLoader."""

    def __init__(self, root, json, vocab, transform=None):
        """Set the path for images, captions and vocabulary wrapper.

        Args:
            root: image directory.
            json: coco annotation file path.
            vocab: vocabulary wrapper.
            transform: image transformer.

        """
        self.root = root

        from pycocotools.coco import COCO

        self.coco = COCO(json)
        self.ids = list(self.coco.anns.keys())
        self.vocab = vocab
        self.transform = transform

    def __getitem__(self, index):
        """Returns one data pair (image and caption)."""
        coco = self.coco
        vocab = self.vocab
        ann_id = self.ids[index]
        caption = coco.anns[ann_id]["caption"]
        img_id = coco.anns[ann_id]["image_id"]
        path = coco.loadImgs(img_id)[0]["file_name"]

        image = Image.open(os.path.join(self.root, path)).convert("RGB")
        if self.transform is not None:
            image = self.transform(image)

        # Convert caption (string) to word ids.

        import nltk

        tokens = nltk.tokenize.word_tokenize(str(caption).lower())
        caption = []
        caption.append(vocab("<start>"))
        caption.extend([vocab(token) for token in tokens])
        caption.append(vocab("<end>"))
        target = torch.Tensor(caption)
        return image, target

    def __len__(self):
        return len(self.ids)


def collate_fn(data):
    """Creates mini-batch tensors from the list of tuples (image, caption).

    We should build custom collate_fn rather than using default collate_fn,
    because merging caption (including padding) is not supported in default.

    Args:
        data: list of tuple (image, caption).
            - image: torch tensor of shape (3, 256, 256).
            - caption: torch tensor of shape (?); variable length.

    Returns:
        images: torch tensor of shape (batch_size, 3, 256, 256).
        targets: torch tensor of shape (batch_size, padded_length).
        lengths: list; valid length for each padded caption.

    """
    # Sort a data list by caption length (descending order).
    data.sort(key=lambda x: len(x[1]), reverse=True)
    images, captions = zip(*data)

    # Merge images (from tuple of 3D tensor to 4D tensor).
    images = torch.stack(images, 0)

    # Merge captions (from tuple of 1D tensor to 2D tensor).
    lengths = [len(cap) for cap in captions]
    targets = torch.zeros(len(captions), max(lengths)).long()
    for i, cap in enumerate(captions):
        end = lengths[i]
        targets[i, :end] = cap[:end]
    return images, targets, lengths


def get_loader(root, json, vocab, transform, batch_size, shuffle, num_workers):
    """Returns torch.utils.data.DataLoader for custom coco dataset."""
    # COCO caption dataset
    coco = CocoDataset(root=root, json=json, vocab=vocab, transform=transform)

    # Data loader for COCO dataset
    # This will return (images, captions, lengths) for each iteration.
    # images: a tensor of shape (batch_size, 3, 224, 224).
    # captions: a tensor of shape (batch_size, padded_length).
    # lengths: a list indicating valid length for each caption. length is (batch_size).
    data_loader = torch.utils.data.DataLoader(
        dataset=coco,
        batch_size=batch_size,
        shuffle=shuffle,
        num_workers=num_workers,
        collate_fn=collate_fn,
    )
    return data_loader


================================================
FILE: service/image_captioning/api/im2txt/model.py
================================================
import torch
from torch import nn
from torchvision import models


class EncoderCNN(nn.Module):
    def __init__(self, embed_size):
        """Load the pretrained ResNet-152 and replace top fc layer."""
        super(EncoderCNN, self).__init__()
        resnet = models.resnet152(pretrained=True)
        modules = list(resnet.children())[:-1]  # delete the last fc layer.
        self.resnet = nn.Sequential(*modules)
        self.linear = nn.Linear(resnet.fc.in_features, embed_size)
        self.bn = nn.BatchNorm1d(embed_size, momentum=0.01)

    def forward(self, images):
        """Extract feature vectors from input images."""
        with torch.no_grad():
            features = self.resnet(images)
        features = features.reshape(features.size(0), -1)
        features = self.bn(self.linear(features))
        return features


class DecoderRNN(nn.Module):
    def __init__(
        self, embed_size, hidden_size, vocab_size, num_layers, max_seq_length=20
    ):
        """Set the hyper-parameters and build the layers."""
        super(DecoderRNN, self).__init__()
        self.embed = nn.Embedding(vocab_size, embed_size)
        self.lstm = nn.LSTM(embed_size, hidden_size, num_layers, batch_first=True)
        self.linear = nn.Linear(hidden_size, vocab_size)
        self.max_seg_length = max_seq_length

    def forward(self, features):
        """Generate captions for given image features using greedy search."""
        sampled_ids = []
        states = None
        inputs = features.unsqueeze(1)
        for i in range(self.max_seg_length):
            hiddens, states = self.lstm(
                inputs, states
            )  # hiddens: (batch_size, 1, hidden_size)
            outputs = self.linear(
                hiddens.squeeze(1)
            )  # outputs:  (batch_size, vocab_size)
            _, predicted = outputs.max(1)  # predicted: (batch_size)
            sampled_ids.append(predicted)
            inputs = self.embed(predicted)  # inputs: (batch_size, embed_size)
            inputs = inputs.unsqueeze(1)  # inputs: (batch_size, 1, embed_size)
        sampled_ids = torch.stack(
            sampled_ids, 1
        )  # sampled_ids: (batch_size, max_seq_length)
        return sampled_ids


================================================
FILE: service/image_captioning/api/im2txt/resize.py
================================================
import os

from PIL import Image

image_dir = "api/im2txt/data/train2014/"
output_dir = "api/im2txt/data/resized2014/"
image_size = 256


def resize_image(image, size):
    """Resize an image to the given size."""
    return image.resize(size, Image.ANTIALIAS)


def resize_images(image_dir, output_dir, size):
    """Resize the images in 'image_dir' and save into 'output_dir'."""
    if not os.path.exists(output_dir):
        os.makedirs(output_dir)

    images = os.listdir(image_dir)
    num_images = len(images)
    for i, image in enumerate(images):
        with open(os.path.join(image_dir, image), "r+b") as f:
            with Image.open(f) as img:
                img = resize_image(img, size)
                img.save(os.path.join(output_dir, image), img.format)
        if (i + 1) % 100 == 0:
            print(
                f"[{i + 1}/{num_images}] Resized the images and saved into '{output_dir}'."
            )


def main():
    resize_images(image_dir, output_dir, [image_size, image_size])


================================================
FILE: service/image_captioning/api/im2txt/sample.py
================================================
import os
import pickle


import torch
from PIL import Image
from torchvision import transforms
from torchvision.transforms.functional import InterpolationMode

from api.im2txt.blip.blip import blip_decoder
from api.im2txt.model import DecoderRNN, EncoderCNN

blip_image_size = 384

embed_size = 256
hidden_size = 512
num_layers = 1

im2txt_models_path = "/protected_media/data_models/im2txt"

blip_models_path = "/protected_media/data_models/blip"

encoder_path = os.path.join(im2txt_models_path, "models", "encoder-10-1000.ckpt")
decoder_path = os.path.join(im2txt_models_path, "models", "decoder-10-1000.ckpt")
vocab_path = os.path.join(im2txt_models_path, "data", "vocab.pkl")


blip_model_url = os.path.join(blip_models_path, "model_base_capfilt_large.pth")
blip_config_url = os.path.join(blip_models_path, "med_config.json")


class Im2txt:
    def __init__(
        self,
        device=torch.device("cuda" if torch.cuda.is_available() else "cpu"),
        blip=False,
    ):
        self._instance = self
        self.encoder = None
        self.decoder = None
        self.vocab = None
        self.device = device
        self.blip = blip
        self.model = None

    def load_image(self, image_path, transform=None):
        image = Image.open(image_path)
        # Check if the image has 3 channels (RGB)
        if image.mode != "RGB":
            # Handle grayscale or other modes here (e.g., convert to RGB)
            image = image.convert("RGB")

        if transform is not None:
            image = transform(image).unsqueeze(0)

        return image

    def load_models(self, onnx=False):
        if self.encoder is not None or self.model is not None:
            return

        if self.blip:
            self.model = blip_decoder(
                pretrained=blip_model_url,
                image_size=blip_image_size,
                vit="base",
                med_config=blip_config_url,
            )
            self.model.eval()
            self.model.to(self.device)
            return

        with open(vocab_path, "rb") as f:
            self.vocab = pickle.load(f)

        # Build models
        self.encoder = EncoderCNN(
            embed_size
        ).eval()  # eval mode (batchnorm uses moving mean/variance)
        self.decoder = DecoderRNN(
            embed_size, hidden_size, len(self.vocab), num_layers
        )
        self.encoder = self.encoder.to(self.device)
        self.decoder = self.decoder.to(self.device)

        # Load the trained model parameters
        self.encoder.load_state_dict(
            torch.load(encoder_path, map_location=self.device)
        )
        self.decoder.load_state_dict(
            torch.load(decoder_path, map_location=self.device)
        )

        # self.encoder = torch.compile(self.encoder)
        # self.decoder = torch.compile(self.decoder)

    def unload_models(self):
        del self.encoder
        del self.decoder
        del self.model
        self.encoder = None
        self.decoder = None
        self.model = None

    def generate_caption(
        self,
        image_path,
        onnx=False,
    ):
        self.load_models(onnx=onnx)

        transform = transforms.Compose(
            [
                transforms.Resize((224, 224), interpolation=InterpolationMode.BICUBIC),
                transforms.ToTensor(),
                transforms.Normalize((0.485, 0.456, 0.406), (0.229, 0.224, 0.225)),
            ]
        )

        blip_transform = transforms.Compose(
            [
                transforms.Resize(
                    (blip_image_size, blip_image_size),
                    interpolation=InterpolationMode.BICUBIC,
                ),
                transforms.ToTensor(),
                transforms.Normalize(
                    (0.48145466, 0.4578275, 0.40821073),
                    (0.26862954, 0.26130258, 0.27577711),
                ),
            ]
        )

        if self.blip:
            image = self.load_image(image_path, blip_transform).to(self.device)
            with torch.no_grad():
                caption_blip = self.model.generate(
                    image, sample=True, num_beams=3, max_length=50, min_length=10
                )
                return caption_blip[0]

        # Prepare an image
        image = self.load_image(image_path, transform)
        image_tensor = image.to(self.device)
        feature = self.encoder(image_tensor)
        sampled_ids = self.decoder.forward(feature)
        sampled_ids = (
            sampled_ids[0].cpu().numpy()
        )  # (1, max_seq_length) -> (max_seq_length)

        # Convert word_ids to words
        sampled_caption = []
        for word_id in sampled_ids:
            word = self.vocab.idx2word[word_id]
            sampled_caption.append(word)
            if word == "<end>":
                break
        sentence = " ".join(sampled_caption)

        return sentence


================================================
FILE: service/image_captioning/api/im2txt/train.py
================================================
import os
import pickle

import numpy as np
import torch
from torch import nn
from torch.nn.utils.rnn import pack_padded_sequence
from torchvision import transforms

from api.im2txt.data_loader import get_loader
from api.im2txt.model import DecoderRNN, EncoderCNN

model_path = "api/im2txt/models/"
crop_size = 224
vocab_path = "api/im2txt/data/vocab.pkl"
image_dir = "api/im2txt/data/resized2014/"
caption_path = "api/im2txt/data/annotations/captions_train2014.json"
log_step = 10
save_step = 1000
embed_size = 256
hidden_size = 512
num_layers = 1
num_epochs = 5
batch_size = 128
num_workers = 2
learning_rate = 0.001


# Device configuration
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")


def main():
    # Create model directory
    if not os.path.exists(model_path):
        os.makedirs(model_path)

    # Image preprocessing, normalization for the pretrained resnet
    transform = transforms.Compose(
        [
            transforms.RandomCrop(crop_size),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            transforms.Normalize((0.485, 0.456, 0.406), (0.229, 0.224, 0.225)),
        ]
    )

    # Load vocabulary wrapper
    with open(vocab_path, "rb") as f:
        vocab = pickle.load(f)

    # Build data loader
    data_loader = get_loader(
        image_dir,
        caption_path,
        vocab,
        transform,
        batch_size,
        shuffle=True,
        num_workers=num_workers,
    )

    # Build the models
    encoder = EncoderCNN(embed_size).to(device)
    decoder = DecoderRNN(embed_size, hidden_size, len(vocab), num_layers).to(device)

    # Loss and optimizer
    criterion = nn.CrossEntropyLoss()
    params = (
        list(decoder.parameters())
        + list(encoder.linear.parameters())
        + list(encoder.bn.parameters())
    )
    optimizer = torch.optim.Adam(params, lr=learning_rate)

    # Train the models
    total_step = len(data_loader)
    for epoch in range(num_epochs):
        for i, (images, captions, lengths) in enumerate(data_loader):
            # Set mini-batch dataset
            images = images.to(device)
            captions = captions.to(device)
            targets = pack_padded_sequence(captions, lengths, batch_first=True)[0]

            # Forward, backward and optimize
            features = encoder(images)
            outputs = decoder(features, captions, lengths)
            loss = criterion(outputs, targets)
            decoder.zero_grad()
            encoder.zero_grad()
            loss.backward()
            optimizer.step()

            # Print log info
            if i % log_step == 0:
                print(
                    f"Epoch [{epoch}/{num_epochs}], Step [{i}/{total_step}], Loss: {loss.item():.4f}, Perplexity: {np.exp(loss.item()):5.4f}"
                )

            # Save the model checkpoints
            if (i + 1) % save_step == 0:
                torch.save(
                    decoder.state_dict(),
                    os.path.join(model_path, f"decoder-{epoch + 1}-{i + 1}.ckpt"),
                )
                torch.save(
                    encoder.state_dict(),
                    os.path.join(model_path, f"encoder-{epoch + 1}-{i + 1}.ckpt"),
                )


================================================
FILE: service/image_captioning/main.py
================================================
import time

import gevent
from flask import Flask, request
from gevent.pywsgi import WSGIServer

from api.im2txt.sample import Im2txt

app = Flask(__name__)

im2txt_instance = None
last_request_time = None


def log(message):
    print(f"image_captioning: {message}")


@app.route("/generate-caption", methods=["POST"])
def generate_caption():
    global last_request_time
    # Update last request time
    last_request_time = time.time()

    try:
        data = request.get_json()
        image_path = data["image_path"]
        onnx = data["onnx"]
        blip = data["blip"]
    except Exception as e:
        print(str(e))
        return "", 400

    global im2txt_instance

    if im2txt_instance is None:
        im2txt_instance = Im2txt(blip=blip)

    return {
        "caption": im2txt_instance.generate_caption(image_path=image_path, onnx=onnx)
    }, 201


@app.route("/unload-model", methods=["GET"])
def unload_model():
    global im2txt_instance
    im2txt_instance.unload_models()
    im2txt_instance = None
    return "", 200


@app.route("/health", methods=["GET"])
def health():
    return {"last_request_time": last_request_time}, 200


if __name__ == "__main__":
    log("service starting")
    server = WSGIServer(("0.0.0.0", 8007), app)
    server_thread = gevent.spawn(server.serve_forever)
    gevent.joinall([server_thread])


================================================
FILE: service/llm/__init__.py
================================================


================================================
FILE: service/llm/main.py
================================================
"""
LLM Service for LibrePhotos

This service provides Large Language Model capabilities for image captioning and analysis.

Note: CPU compatibility is checked by the main LibrePhotos application before starting this service.
Services with incompatible CPUs will not be started to prevent performance issues.

Usage:
- Normal operation: python main.py (started by LibrePhotos service manager)
"""

import gevent
import time
from pathlib import Path
from flask import Flask, request
from gevent.pywsgi import WSGIServer
from llama_cpp import Llama

app = Flask(__name__)

# Global model instance and last request time for health monitoring
llm_model = None
current_model_path = None
last_request_time = None


def log(message):
    print(f"llm: {message}")


def load_model(model_path, multimodal=False):
    """Load a model with optional multimodal support"""
    global llm_model, current_model_path

    if llm_model is None or current_model_path != model_path:
        try:
            log(f"Loading model from {model_path}, multimodal: {multimodal}")
            if multimodal:
                # For Moondream, we need to use the chat handler approach
                from llama_cpp.llama_chat_format import MoondreamChatHandler

                # Path to the mmproj file for Moondream
                mmproj_path = "/protected_media/data_models/moondream2-mmproj-f16.gguf"

                if not Path(mmproj_path).exists():
                    raise Exception(f"Moondream mmproj file not found at {mmproj_path}")

                log(f"Loading Moondream chat handler with mmproj: {mmproj_path}")
                chat_handler = MoondreamChatHandler(clip_model_path=mmproj_path)

                llm_model = Llama(
                    model_path=model_path,
                    chat_handler=chat_handler,
                    n_ctx=2048,  # Increase context window for image processing
                    verbose=False,
                )
            else:
                # For text-only models
                llm_model = Llama(model_path=model_path, verbose=False)

            current_model_path = model_path
            log("Model loaded successfully")
        except Exception as e:
            log(f"Error loading model: {str(e)}")
            raise


@app.route("/generate", methods=["POST"])
def generate():
    """Unified endpoint for text and multimodal generation"""
    global last_request_time
    last_request_time = time.time()

    try:
        data = request.get_json()
        image_data = data.get("image_data")  # Now expects base64 data URI directly
        prompt = data["prompt"]
        max_tokens = data.get("max_tokens", 128)
        model_path = data.get(
            "model_path", "/protected_media/data_models/moondream2-text-model-f16.gguf"
        )
    except Exception as e:
        log(f"Error parsing request: {str(e)}")
        return "", 400

    try:
        if image_data:
            # Multimodal prompt with image using Moondream
            load_model(model_path, multimodal=True)

            response = llm_model.create_chat_completion(
                messages=[
                    {
                        "role": "user",
                        "content": [
                            {"type": "text", "text": prompt},
                            {"type": "image_url", "image_url": {"url": image_data}},
                        ],
                    }
                ],
                max_tokens=max_tokens,
                temperature=0.1,
            )

            response_text = response["choices"][0]["message"]["content"]
        else:
            # Text-only prompt
            load_model(model_path, multimodal=False)

            output = llm_model(
                prompt,
                max_tokens=max_tokens,
                stop=["Q:", "\n"],
                echo=False,
            )
            response_text = (
                output["choices"][0]["text"] if "choices" in output else str(output)
            )

        log("Generated response")
        return {"response": response_text}, 201

    except Exception as e:
        log(f"Error generating response: {str(e)}")
        return {"error": str(e)}, 500


@app.route("/health", methods=["GET"])
def health():
    return {"status": "OK", "last_request_time": last_request_time}, 200


if __name__ == "__main__":
    log("LLM service with multimodal support starting")
    log(
        "Note: CPU compatibility is verified by LibrePhotos service manager before startup"
    )

    server = WSGIServer(("0.0.0.0", 8008), app)
    server_thread = gevent.spawn(server.serve_forever)
    gevent.joinall([server_thread])


================================================
FILE: service/tags/__init__.py
================================================


================================================
FILE: service/tags/main.py
================================================
import time

import gevent
from flask import Flask, request
from gevent.pywsgi import WSGIServer
from places365.places365 import Places365
from siglip2.siglip2 import SigLIP2

app = Flask(__name__)

places365_instance = None
siglip2_instance = None
last_request_time = None


def log(message):
    print(f"tags: {message}")


@app.route("/generate-tags", methods=["POST"])
def generate_tags():
    global last_request_time
    last_request_time = time.time()

    try:
        data = request.get_json()
        image_path = data["image_path"]
        confidence = data.get("confidence", 0.4)
        tagging_model = data.get("tagging_model", "places365")
    except Exception as e:
        print(str(e))
        return "", 400

    if tagging_model == "siglip2":
        global siglip2_instance
        if siglip2_instance is None:
            siglip2_instance = SigLIP2()
        # SigLIP 2 uses cosine similarity (range -1 to 1), not probability scores.
        # Always return the top 10 most relevant tags above a minimum threshold.
        result = siglip2_instance.predict(image_path, threshold=0.05, max_tags=10)
        return {"tags": result}, 201
    else:
        global places365_instance
        if places365_instance is None:
            places365_instance = Places365()
        result = places365_instance.inference_places365(image_path, confidence)
        return {"tags": result}, 201


@app.route("/health", methods=["GET"])
def health():
    return {"last_request_time": last_request_time}, 200


if __name__ == "__main__":
    log("service starting")
    server = WSGIServer(("0.0.0.0", 8011), app)
    server_thread = gevent.spawn(server.serve_forever)
    gevent.joinall([server_thread])


================================================
FILE: service/tags/places365/__init__.py
================================================


================================================
FILE: service/tags/places365/places365.py
================================================
# PlacesCNN to predict the scene category, attribute, and class activation map in a single pass
# by Bolei Zhou, sep 2, 2017
# last modified date: Dec. 27, 2017, migrating everything to python36 and latest pytorch and torchvision
import os

import numpy as np
import torch
from PIL import Image
from places365 import wideresnet
from torch.autograd import Variable as V
from torch.nn import functional as F
from torchvision import transforms as trn

# import warnings

torch.nn.Module.dump_patches = True
dir_places365_model = os.path.join(
    "/", "protected_media", "data_models", "places365", "model"
)


class Places365:
    labels_and_model_are_load = False

    def unload(self):
        del self.model
        del self.classes
        del self.W_attribute
        del self.labels_IO
        del self.labels_attribute
        del self.labels_and_model_are_load
        self.model = None
        self.classes = None
        self.W_attribute = None
        self.labels_IO = None
        self.labels_attribute = None
        self.labels_and_model_are_load = False

    def load(self):
        self.load_model()
        self.load_labels()
        self.labels_and_model_are_load = True

    def load_model(self):
        # this model has a last conv feature map as 14x14
        def hook_feature(module, input, output):
            self.features_blobs.append(np.squeeze(output.data.cpu().numpy()))

        model_file = os.path.join(dir_places365_model, "wideresnet18_places365.pth.tar")
        self.model = wideresnet.resnet18(num_classes=365)
        checkpoint = torch.load(model_file, map_location=lambda storage, loc: storage)
        state_dict = {
            str.replace(k, "module.", ""): v
            for k, v in checkpoint["state_dict"].items()
        }
        self.model.load_state_dict(state_dict)
        self.model.eval()
        # hook the feature extractor
        features_names = [
            "layer4",
            "avgpool",
        ]  # this is the last conv layer of the resnet
        for name in features_names:
            self.model._modules.get(name).register_forward_hook(hook_feature)

    def load_labels(self):
        # prepare all the labels
        # scene category relevant
        file_path_category = os.path.join(
            dir_places365_model, "categories_places365.txt"
        )
        self.classes = list()
        with open(file_path_category) as class_file:
            for line in class_file:
                self.classes.append(line.strip().split(" ")[0][3:])
        self.classes = tuple(self.classes)

        # indoor and outdoor relevant
        file_path_IO = os.path.join(dir_places365_model, "IO_places365.txt")
        with open(file_path_IO) as f:
            lines = f.readlines()
            self.labels_IO = []
            for line in lines:
                items = line.rstrip().split()
                self.labels_IO.append(int(items[-1]) - 1)  # 0 is indoor, 1 is outdoor
        self.labels_IO = np.array(self.labels_IO)

        # scene attribute relevant
        file_path_attribute = os.path.join(
            dir_places365_model, "labels_sunattribute.txt"
        )
        with open(file_path_attribute) as f:
            lines = f.readlines()
            self.labels_attribute = [item.rstrip() for item in lines]

        file_path_W = os.path.join(
            dir_places365_model, "W_sceneattribute_wideresnet18.npy"
        )
        self.W_attribute = np.load(file_path_W)
        self.labels_are_load = True

    def returnTF(self):
        # load the image transformer
        tf = trn.Compose(
            [
                trn.Resize((224, 224)),
                trn.ToTensor(),
                trn.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
            ]
        )
        return tf

    def remove_nonspace_separators(self, text):
        return " ".join(" ".join(" ".join(text.split("_")).split("/")).split("-"))

    def inference_places365(self, img_path, confidence):
        """@param img_path: path to the image to generate labels from
        @param confidence: minimum confidence before an category is selected
        @return: {'environment': 'indoor'/'outdoor', 'categories': [...], 'attributes': [...]}
        """
        try:
            if not self.labels_and_model_are_load:
                self.load()

            # load the model
            self.features_blobs = []

            # load the transformer
            tf = self.returnTF()  # image transformer

            # get the softmax weight
            params = list(self.model.parameters())
            weight_softmax = params[-2].data.numpy()
            weight_softmax[weight_softmax < 0] = 0

            # load the test image
            # img_url = 'http://places2.csail.mit.edu/imgs/3.jpg'
            # os.system('wget %s -q -O test.jpg' % img_url)
            img = Image.open(img_path)
            # Normalize the image for processing
            input_img = V(tf(img).unsqueeze(0))

            # forward pass
            logit = self.model.forward(input_img)
            h_x = F.softmax(logit, 1).data.squeeze()
            probs, idx = h_x.sort(0, True)
            probs = probs.numpy()
            idx = idx.numpy()

            res = {}

            # output the IO prediction
            # labels_IO[idx[:10]] returns a list of 0's and 1's: 0 -> inside, 1 -> outside
            # Determine the mean to reach a consensus
            io_image = np.mean(self.labels_IO[idx[:10]])
            if io_image < 0.5:
                res["environment"] = "indoor"
            else:
                res["environment"] = "outdoor"

            # output the prediction of scene category
            # idx[i] returns a index number for which class it corresponds to
            # classes[idx[i]], thus returns the class name
            # idx is sorted together with probs, with highest probabilities first
            res["categories"] = []
            for i in range(0, 5):
                if probs[i] > confidence:
                    res["categories"].append(
                        self.remove_nonspace_separators(self.classes[idx[i]])
                    )
                else:
                    break
            # TODO Should be replaced with more meaningful tags in the future
            # output the scene attributes
            # This is something I don't quiet grasp yet
            # Probs is not usable here anymore, we're not processing our input_image
            # Take the dot product of out W_attribute model and the feature blobs
            # And sort it along the -1 axis
            # This results in idx_a, with the last elements the index numbers of attributes, we have the most confidence in
            # Can't seem to get any confidence values, also all the attributes it detect are not really meaningful i.m.o.
            responses_attribute = self.W_attribute.dot(self.features_blobs[1])
            idx_a = np.argsort(responses_attribute)
            res["attributes"] = []
            for i in range(-1, -10, -1):
                res["attributes"].append(
                    self.remove_nonspace_separators(self.labels_attribute[idx_a[i]])
                )

            return res
        except Exception as e:
            print("tags: {}".format("Error in Places365 inference"))
            raise e


================================================
FILE: service/tags/places365/wideresnet.py
================================================
import math
import os

from torch import nn

model_path = os.path.join(
    "/", "protected_media", "data_models", "resnet18-5c106cde.pth"
)


def conv3x3(in_planes, out_planes, stride=1):
    """3x3 convolution with padding"""
    return nn.Conv2d(
        in_planes, out_planes, kernel_size=3, stride=stride, padding=1, bias=False
    )


class BasicBlock(nn.Module):
    expansion = 1

    def __init__(self, inplanes, planes, stride=1, downsample=None):
        super(BasicBlock, self).__init__()
        self.conv1 = conv3x3(inplanes, planes, stride)
        self.bn1 = nn.BatchNorm2d(planes)
        self.relu = nn.ReLU(inplace=True)
        self.conv2 = conv3x3(planes, planes)
        self.bn2 = nn.BatchNorm2d(planes)
        self.downsample = downsample
        self.stride = stride

    def forward(self, x):
        residual = x

        out = self.conv1(x)
        out = self.bn1(out)
        out = self.relu(out)

        out = self.conv2(out)
        out = self.bn2(out)

        if self.downsample is not None:
            residual = self.downsample(x)

        out += residual
        out = self.relu(out)

        return out


class ResNet(nn.Module):
    def __init__(self, block, layers, num_classes=1000):
        self.inplanes = 64
        super(ResNet, self).__init__()
        self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3, bias=False)
        self.bn1 = nn.BatchNorm2d(64)
        self.relu = nn.ReLU(inplace=True)
        # self.maxpool = nn.MaxPool2d(kernel_size=3, stride=1, padding=1) # previous stride is 2
        self.layer1 = self._make_layer(block, 64, layers[0])
        self.layer2 = self._make_layer(block, 128, layers[1], stride=2)
        self.layer3 = self._make_layer(block, 256, layers[2], stride=2)
        self.layer4 = self._make_layer(block, 512, layers[3], stride=2)
        self.avgpool = nn.AvgPool2d(14)
        self.fc = nn.Linear(512 * block.expansion, num_classes)

        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
                m.weight.data.normal_(0, math.sqrt(2.0 / n))
            elif isinstance(m, nn.BatchNorm2d):
                m.weight.data.fill_(1)
                m.bias.data.zero_()

    def _make_layer(self, block, planes, blocks, stride=1):
        downsample = None
        if stride != 1 or self.inplanes != planes * block.expansion:
            downsample = nn.Sequential(
                nn.Conv2d(
                    self.inplanes,
                    planes * block.expansion,
                    kernel_size=1,
                    stride=stride,
                    bias=False,
                ),
                nn.BatchNorm2d(planes * block.expansion),
            )

        layers = []
        layers.append(block(self.inplanes, planes, stride, downsample))
        self.inplanes = planes * block.expansion
        for i in range(1, blocks):
            layers.append(block(self.inplanes, planes))

        return nn.Sequential(*layers)

    def forward(self, x):
        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)
        # x = self.maxpool(x)

        x = self.layer1(x)
        x = self.layer2(x)
        x = self.layer3(x)
        x = self.layer4(x)

        x = self.avgpool(x)
        x = x.view(x.size(0), -1)
        x = self.fc(x)

        return x


def resnet18(pretrained=False, **kwargs):
    """Constructs a ResNet-18 model.

    Args:
        pretrained (bool): If True, returns a model pre-trained on ImageNet

    """
    model = ResNet(BasicBlock, [2, 2, 2, 2], **kwargs)
    if pretrained:
        model.load_state_dict(
            model_path,
            strict=False,
        )
    return model


================================================
FILE: service/tags/siglip2/__init__.py
================================================


================================================
FILE: service/tags/siglip2/siglip2.py
================================================
import os

import numpy as np
import onnxruntime as ort
import sentencepiece as spm
from PIL import Image

SIGLIP2_MODEL_DIR = os.path.join("/", "protected_media", "data_models", "siglip2")
SIGLIP2_VISION_PATH = os.path.join(SIGLIP2_MODEL_DIR, "vision_model.onnx")
SIGLIP2_TEXT_PATH = os.path.join(SIGLIP2_MODEL_DIR, "text_model.onnx")
SIGLIP2_TOKENIZER_PATH = os.path.join(SIGLIP2_MODEL_DIR, "tokenizer.model")
SIGLIP2_EMBEDDINGS_CACHE = os.path.join(SIGLIP2_MODEL_DIR, "tag_embeddings.npy")

TAGS_FILE = os.path.join(os.path.dirname(__file__), "tags.txt")

TARGET_SIZE = 384
IMAGE_MEAN = np.array([0.5, 0.5, 0.5], dtype=np.float32)
IMAGE_STD = np.array([0.5, 0.5, 0.5], dtype=np.float32)

MAX_TOKEN_LENGTH = 64
PAD_TOKEN_ID = 0
EOS_TOKEN_ID = 1


def _pool_embeddings(raw_output, attention_mask=None):
    """Pool model output to (batch, hidden_dim).

    If the output is already 2-D (batch, hidden_dim), return it directly.
    If it is 3-D (batch, seq_len, hidden_dim), pool by taking the last
    non-padding token per sequence (EOS-token pooling used by SigLIP).
    Falls back to taking the last sequence position if no attention mask.
    """
    if raw_output.ndim == 2:
        return raw_output

    # 3-D: (batch, seq_len, hidden_dim)
    if attention_mask is not None:
        # EOS token is the last attended position
        eos_indices = attention_mask.sum(axis=1) - 1  # (batch,)
        batch_idx = np.arange(raw_output.shape[0])
        pooled = raw_output[batch_idx, eos_indices]  # (batch, hidden_dim)
    else:
        # Fallback: take position 0 (CLS-style pooling for vision)
        pooled = raw_output[:, 0, :]

    return pooled


def _l2_normalize(embeddings):
    """L2-normalize along the last axis."""
    norms = np.linalg.norm(embeddings, axis=-1, keepdims=True)
    norms = np.maximum(norms, 1e-8)
    return embeddings / norms


class SigLIP2:
    def __init__(self):
        self.vision_session = None
        self.tokenizer = None
        self.tags = None
        self.tag_embeddings = None
        self.is_loaded = False

    def load(self):
        """Load the vision model, tokenizer, tag list, and pre-computed embeddings."""
        self.vision_session = ort.InferenceSession(
            SIGLIP2_VISION_PATH,
            providers=["CPUExecutionProvider"],
        )

        with open(TAGS_FILE, "r") as f:
            self.tags = [line.strip() for line in f if line.strip()]

        if os.path.exists(SIGLIP2_EMBEDDINGS_CACHE):
            self.tag_embeddings = np.load(SIGLIP2_EMBEDDINGS_CACHE)
            # Invalidate cache if tag count changed or embedding dimension is wrong
            needs_rebuild = False
            if self.tag_embeddings.ndim != 2:
                print(f"siglip2: cache has wrong shape {self.tag_embeddings.shape}, rebuilding...")
                needs_rebuild = True
            elif self.tag_embeddings.shape[0] != len(self.tags):
                print(
                    f"siglip2: cache has {self.tag_embeddings.shape[0]} tags "
                    f"but tags.txt has {len(self.tags)}, rebuilding..."
                )
                needs_rebuild = True
            elif self.tag_embeddings.shape[1] < 128:
                print(
                    f"siglip2: cache has dim={self.tag_embeddings.shape[1]} "
                    f"(likely stale from a failed build), rebuilding..."
                )
                needs_rebuild = True

            if needs_rebuild:
                os.remove(SIGLIP2_EMBEDDINGS_CACHE)
                self._build_tag_embeddings()
            else:
                print(
                    f"siglip2: loaded cached tag embeddings "
                    f"({self.tag_embeddings.shape[0]} tags, dim={self.tag_embeddings.shape[1]})"
                )
        else:
            self._build_tag_embeddings()

        self.is_loaded = True

    def unload(self):
        del self.vision_session
        del self.tag_embeddings
        del self.tokenizer
        self.vision_session = None
        self.tag_embeddings = None
        self.tokenizer = None
        self.tags = None
        self.is_loaded = False

    def _load_tokenizer(self):
        if self.tokenizer is None:
            self.tokenizer = spm.SentencePieceProcessor()
            self.tokenizer.Load(SIGLIP2_TOKENIZER_PATH)

    def _tokenize(self, texts, max_length=MAX_TOKEN_LENGTH):
        """Tokenize a list of texts using SentencePiece, returning input_ids and attention_mask."""
        self._load_tokenizer()

        batch_input_ids = []
        batch_attention_mask = []

        for text in texts:
            token_ids = self.tokenizer.Encode(text)
            # Truncate (leave room for EOS)
            token_ids = token_ids[: max_length - 1]
            # Append EOS
            token_ids.append(EOS_TOKEN_ID)

            attention_mask = [1] * len(token_ids)

            # Pad
            pad_length = max_length - len(token_ids)
            token_ids.extend([PAD_TOKEN_ID] * pad_length)
            attention_mask.extend([0] * pad_length)

            batch_input_ids.append(token_ids)
            batch_attention_mask.append(attention_mask)

        return (
            np.array(batch_input_ids, dtype=np.int64),
            np.array(batch_attention_mask, dtype=np.int64),
        )

    def _build_tag_embeddings(self):
        """Encode all tags with the text model and cache the embeddings."""
        print("siglip2: building tag embeddings (first run, this may take a minute)...")

        text_session = ort.InferenceSession(
            SIGLIP2_TEXT_PATH,
            providers=["CPUExecutionProvider"],
        )

        text_input_names = [inp.name for inp in text_session.get_inputs()]
        text_output_names = [out.name for out in text_session.get_outputs()]

        print(f"siglip2: text model inputs: {text_input_names}")
        print(f"siglip2: text model outputs: {text_output_names}")

        # Use prompt template for better zero-shot performance
        prompted_tags = [f"a photo of {tag}" for tag in self.tags]

        all_embeddings = []
        batch_size = 32

        for i in range(0, len(prompted_tags), batch_size):
            batch_texts = prompted_tags[i : i + batch_size]
            input_ids, attention_mask = self._tokenize(batch_texts)

            feed = {text_input_names[0]: input_ids}
            if len(text_input_names) > 1:
                feed[text_input_names[1]] = attention_mask

            # Run all outputs so we can pick the best one
            raw_outputs = text_session.run(None, feed)

            # Find the output that gives us pooled embeddings (batch, hidden_dim)
            # Prefer a 2-D output; if all are 3-D, pool the first one via EOS token
            embeddings = None
            for idx, out in enumerate(raw_outputs):
                if out.ndim == 2 and out.shape[0] == len(batch_texts):
                    embeddings = out
                    break

            if embeddings is None:
                # All outputs are 3-D; pool the first one using EOS token position
                embeddings = _pool_embeddings(raw_outputs[0], attention_mask)

            if i == 0:
                print(f"siglip2: text embedding shape per batch: {embeddings.shape}")

            embeddings = _l2_normalize(embeddings)
            all_embeddings.append(embeddings)

            if (i // batch_size) % 5 == 0:
                print(
                    f"siglip2: encoded {min(i + batch_size, len(prompted_tags))}"
                    f"/{len(prompted_tags)} tags"
                )

        del text_session

        self.tag_embeddings = np.concatenate(all_embeddings, axis=0)

        os.makedirs(os.path.dirname(SIGLIP2_EMBEDDINGS_CACHE), exist_ok=True)
        np.save(SIGLIP2_EMBEDDINGS_CACHE, self.tag_embeddings)
        print(
            f"siglip2: cached {self.tag_embeddings.shape[0]} tag embeddings "
            f"(dim={self.tag_embeddings.shape[1]}) to {SIGLIP2_EMBEDDINGS_CACHE}"
        )

    def prepare_image(self, image):
        """Resize, rescale, and normalize an image for SigLIP 2."""
        image = image.convert("RGB")
        image = image.resize((TARGET_SIZE, TARGET_SIZE), Image.BICUBIC)

        arr = np.array(image, dtype=np.float32) / 255.0
        arr = (arr - IMAGE_MEAN) / IMAGE_STD
        # HWC -> CHW
        arr = arr.transpose(2, 0, 1)
        # Add batch dimension
        return arr[np.newaxis, :]

    def predict(self, image_path, threshold=0.05, max_tags=10):
        """Run inference and return the top tags by cosine similarity.

        Args:
            image_path: Path to the image file.
            threshold: Minimum cosine similarity to include a tag.
            max_tags: Maximum number of tags to return.

        Returns:
            dict with "tags" key containing a list of predicted tag strings.
        """
        if not self.is_loaded:
            self.load()

        image = Image.open(image_path)
        pixel_values = self.prepare_image(image)

        vision_input_name = self.vision_session.get_inputs()[0].name

        # Run all outputs
        raw_outputs = self.vision_session.run(None, {vision_input_name: pixel_values})

        # Find the pooled image embedding (2-D preferred, else pool from 3-D)
        image_embeds = None
        for out in raw_outputs:
            if out.ndim == 2 and out.shape[0] == 1:
                image_embeds = out
                break

        if image_embeds is None:
            # 3-D output: pool via CLS token (position 0)
            image_embeds = _pool_embeddings(raw_outputs[0], attention_mask=None)

        image_embeds = _l2_normalize(image_embeds)

        # Compute cosine similarity: (1, dim) @ (n_tags, dim).T -> (1, n_tags)
        similarities = image_embeds @ self.tag_embeddings.T
        scores = similarities[0]

        # Get top tags sorted by score, filtered by threshold, capped at max_tags
        ranked_indices = np.argsort(scores)[::-1]
        predicted_tags = []
        for idx in ranked_indices:
            if scores[idx] < threshold:
                break
            predicted_tags.append(self.tags[idx])
            if len(predicted_tags) >= max_tags:
                break

        return {"tags": predicted_tags}


================================================
FILE: service/tags/siglip2/tags.txt
================================================
person
man
woman
child
baby
toddler
teenager
elderly person
couple
family
group of people
crowd
portrait
selfie
face
smile
laughing
glasses
sunglasses
hat
beard
mustache
tattoo
walking
running
jogging
swimming
dancing
cooking
eating
drinking
reading
writing
sleeping
working
playing
sitting
standing
jumping
climbing
hiking
cycling
surfing
skiing
snowboarding
skating
fishing
camping
gardening
painting
drawing
singing
shopping
traveling
driving
talking
hugging
kissing
waving
pointing
clapping
celebrating
praying
meditating
exercising
stretching
yoga
soccer
basketball
tennis
baseball
football
volleyball
golf
boxing
martial arts
gymnastics
weightlifting
cricket
rugby
hockey
badminton
table tennis
wrestling
archery
fencing
cat
dog
puppy
kitten
bird
fish
horse
cow
pig
sheep
goat
chicken
duck
rabbit
deer
bear
fox
wolf
lion
tiger
elephant
giraffe
zebra
monkey
gorilla
panda
snake
lizard
turtle
frog
butterfly
bee
dragonfly
spider
squirrel
hamster
parrot
owl
eagle
hawk
penguin
dolphin
whale
shark
octopus
crab
jellyfish
insect
ant
ladybug
snail
hedgehog
raccoon
swan
flamingo
peacock
coral
seal
food
fruit
apple
banana
orange
strawberry
grape
watermelon
pineapple
cherry
lemon
peach
mango
avocado
coconut
vegetable
tomato
carrot
broccoli
corn
potato
onion
pepper
mushroom
lettuce
cucumber
bread
cake
pie
cookie
pizza
burger
sandwich
pasta
noodles
rice
sushi
soup
salad
steak
chicken meat
seafood
shrimp
cheese
egg
pancake
waffle
donut
chocolate
candy
ice cream
coffee
tea
beer
wine
cocktail
juice
water bottle
breakfast
lunch
dinner
dessert
barbecue
picnic
car
truck
bus
van
motorcycle
bicycle
scooter
train
subway
tram
airplane
helicopter
boat
sailboat
yacht
ship
canoe
kayak
taxi
ambulance
fire truck
police car
tractor
construction vehicle
hot air balloon
skateboard
stroller
wheelchair
house
apartment building
skyscraper
office building
castle
church
cathedral
temple
mosque
tower
lighthouse
barn
cabin
cottage
palace
stadium
bridge
arch
monument
statue
fountain
windmill
factory
warehouse
greenhouse
gazebo
tent
ruins
kitchen
bedroom
bathroom
living room
dining room
office
classroom
library
museum
gallery
theater
cinema
hospital
restaurant
cafe
bar
pub
bakery
supermarket
mall
gym
spa
hotel room
lobby
hallway
staircase
balcony
rooftop
garden
park
forest
jungle
mountain
hill
valley
cliff
canyon
cave
island
volcano
glacier
desert
beach
ocean
sea
river
lake
pond
stream
waterfall
swamp
marsh
field
meadow
grassland
prairie
farmland
vineyard
orchard
city
town
village
street
road
highway
alley
sidewalk
crossroad
intersection
parking lot
playground
courtyard
pier
dock
harbor
marina
boardwalk
promenade
trail
path
tree
palm tree
pine tree
flower
rose
sunflower
tulip
daisy
lily
orchid
lavender
grass
bush
hedge
moss
fern
cactus
bamboo
vine
leaf
petal
branch
trunk
root
mushroom in nature
coral reef
seaweed
sky
cloud
sun
moon
star
rainbow
aurora
sunset
sunrise
dawn
dusk
golden hour
twilight
sunny
cloudy
rainy
snowy
foggy
misty
stormy
windy
overcast
hazy
frost
ice
thunder
lightning
rain
snow
hail
spring
summer
autumn
winter
phone
smartphone
laptop
computer
tablet
keyboard
monitor
camera
television
speaker
headphones
microphone
clock
watch
umbrella
bag
backpack
purse
wallet
suitcase
basket
box
bottle
jar
cup
mug
drinking glass
plate
bowl
fork
knife
spoon
chopsticks
pan
pot
book
newspaper
magazine
pen
pencil
scissors
key
lock
flashlight
candle
lamp
lantern
mirror
frame
painting on wall
map
globe
telescope
binoculars
compass
guitar
piano
violin
drums
flute
trumpet
saxophone
harmonica
bell
chair
table
desk
sofa
couch
bed
bench
stool
shelf
bookshelf
cabinet
drawer
wardrobe
rug
carpet
curtain
pillow
blanket
towel
shirt
dress
suit
jacket
coat
sweater
hoodie
jeans
shorts
skirt
uniform
costume
scarf
glove
boot
sneaker
sandal
high heel
ring
necklace
bracelet
earring
crown
mask
helmet
ribbon
bow tie
necktie
fireworks
balloon
confetti
banner
flag
gift
present
wrapped gift
birthday cake
candles
christmas tree
ornament
wreath
pumpkin
jack-o-lantern
easter egg
wedding dress
wedding ring
bouquet
champagne
trophy
medal
certificate
diploma
sign
billboard
traffic light
stop sign
street sign
neon sign
graffiti
mural
poster
banner sign
tattoo art
sculpture
wood
metal
glass
stone
brick
concrete
marble
ceramic
leather
fabric
paper
sand
rock
pebble
crystal
gold
silver
lace
wool
denim
silk
water
fire
smoke
steam
flame
spark
bubble
wave
foam
icicle
snowflake
shadow
reflection
silhouette
bokeh
lens flare
light beam
darkness
symmetry
pattern
texture
stripe
polka dot
plaid
geometric
abstract
colorful
black and white
vintage
retro
rustic
modern
minimalist
cozy
dramatic
peaceful
romantic
festive
spooky
scary
soothing
stressful
warm
cold
natural
man-made
aged
glossy
rusty
dirty
sterile
moist
dry
cluttered
open area
enclosed area
boating
biking
sunbathing
touring
diving
bathing
cleaning
socializing
studying
training
farming
constructing
competing
spectating
digging
gaming
sports
vegetation
foliage
shrubbery
leaves
flowers
asphalt
pavement
tiles
plastic
vinyl
dirt
running water
still water
natural light
indoor lighting
airfield
airplane cabin
airport terminal
alcove
amphitheater
amusement arcade
amusement park
aquarium
aqueduct
archaeological site
art gallery
art studio
assembly line
attic
auditorium
badlands
ballroom
bamboo forest
banquet hall
baseball field
basketball court
bazaar
beauty salon
beer garden
boat deck
boathouse
bookstore
botanical garden
bowling alley
boxing ring
building facade
burial chamber
campsite
campus
candy store
car interior
carousel
catacomb
cemetery
chalet
clothing store
coast
cockpit
coffee shop
computer room
conference room
construction site
corn field
corridor
courthouse
creek
crevasse
crosswalk
dam
delicatessen
department store
desert road
diner
discotheque
doorway
dorm room
downtown
dressing room
driveway
drugstore
elevator
embassy
engine room
entrance hall
escalator
excavation
fabric store
fast food restaurant
fire escape
fire station
fishpond
flea market
florist shop
food court
football field
forest path
formal garden
garage
gas station
gift shop
golf course
grotto
gymnasium
hangar
hardware store
hayfield
heliport
home office
home theater
hospital room
hot spring
hunting lodge
ice cream parlor
iceberg
igloo
industrial area
inn
jail cell
japanese garden
jewelry shop
junkyard
kindergarten
lagoon
landfill
landing deck
laundromat
lawn
lecture room
loading dock
locker room
mansion
market
mausoleum
moat
motel
mountain path
movie theater
music studio
natural history museum
nursery
nursing home
oil rig
operating room
orchestra pit
pagoda
pantry
parking garage
pasture
patio
pavilion
pet shop
pharmacy
phone booth
picnic area
pizzeria
playroom
plaza
porch
racecourse
raceway
raft
railroad track
rainforest
reception
recreation room
repair shop
residential neighborhood
restaurant kitchen
restaurant patio
rice paddy
rock arch
roof garden
rope bridge
runway
sandbox
sauna
schoolhouse
science museum
server room
shed
shoe shop
shopfront
shopping mall
shower
ski resort
ski slope
slum
snowfield
soccer field
stable
stage
storage room
subway station
sushi bar
swimming hole
swimming pool
synagogue
television studio
throne room
topiary garden
toy shop
train interior
train station
tree farm
tree house
trench
tundra
underwater
utility room
vegetable garden
veterinary office
viaduct
volleyball court
waiting room
water park
water tower
watering hole
wheat field
wind farm
yard
youth hostel
zen garden
christmas
birthday
halloween
easter
thanksgiving
new year
new year's eve
valentine's day
wedding
graduation
anniversary
engagement
baby shower
baptism
communion
funeral
memorial service
hanukkah
diwali
eid
carnival
mardi gras
st. patrick's day
independence day
fourth of july
mother's day
father's day
chinese new year
lunar new year
oktoberfest
prom
homecoming
retirement party
housewarming
reunion
concert
festival
parade
costume party
pool party
garden party
surprise party
bridal shower
bachelor party
bachelorette party
gender reveal
first day of school
award ceremony
charity event
gala
recital
school play
talent show
science fair
sports day
marathon
tournament
quinceañera
bar mitzvah
bat mitzvah


================================================
FILE: service/thumbnail/__init__.py
================================================


================================================
FILE: service/thumbnail/main.py
================================================
import gevent
from flask import Flask, request
from gevent.pywsgi import WSGIServer
from wand.image import Image

app = Flask(__name__)


def log(message):
    print(f"thumbnail: {message}")


@app.route("/", methods=["POST"])
def create_thumbnail():
    try:
        data = request.get_json()
        source = data["source"]
        destination = data["destination"]
        height = data["height"]
    except Exception:
        return "", 400
    log(f"creating for source={source} height={height}")
    with Image(filename=source) as img:
        with img.clone() as thumbnail:
            thumbnail.format = "webp"
            thumbnail.transform(resize=f"x{height}")
            thumbnail.compression_quality = 95
            thumbnail.auto_orient()
            thumbnail.save(filename=destination)
    log(f"created at location={destination}")
    return {"thumbnail": destination}, 201


@app.route("/health", methods=["GET"])
def health():
    return {"status": "OK"}, 200


if __name__ == "__main__":
    log("service starting")
    server = WSGIServer(("0.0.0.0", 8003), app)
    server_thread = gevent.spawn(server.serve_forever)
    gevent.joinall([server_thread])


================================================
FILE: service/thumbnail/test/.gitignore
================================================
samples/*
!samples/.gitkeep
!samples/README.md


================================================
FILE: service/thumbnail/test/__init__.py
================================================


================================================
FILE: service/thumbnail/test/samples/.gitkeep
================================================


================================================
FILE: service/thumbnail/test/samples/README.md
================================================
place any *image* files in this directory that you want to use as test data


================================================
FILE: service/thumbnail/test/test_thumbnail_worker.py
================================================
import os

from pytest import fixture

from service.thumbnail.main import app

HTTP_BAD_REQUEST = 400
HTTP_CREATED = 201


@fixture()
def client():
    return app.test_client()


def test_must_fail_when_passing_empty_string(client):
    response = client.post("/", data="")
    assert response.status_code == HTTP_BAD_REQUEST


def test_must_fail_when_passing_invalid_json(client):
    response = client.post("/", data="invalid json")
    assert response.status_code == HTTP_BAD_REQUEST


def test_must_fail_when_passing_incomplete_json(client):
    invalid_payloads = [
        {"source": "foo"},
        {"destination": "/tmp/result.webp"},
        {"height": 100},
        {"source": "foo", "destination": "/tmp/result.webp"},
        {"destination": "/tmp/result.webp", "height": 100},
        {"height": 100, "source": "foo"},
    ]
    for payload in invalid_payloads:
        response = client.post("/", json=payload)
        assert response.status_code == HTTP_BAD_REQUEST


def test_should_create_thumbnail(client):
    samples_dir = os.path.join(os.path.dirname(os.path.realpath(__file__)), "samples")
    samples = [f for f in os.listdir(samples_dir) if f not in [".gitkeep", "README.md"]]
    thumbnail_path = "/tmp/result.webp"
    for sample in samples:
        if os.path.exists(thumbnail_path):
            os.remove(thumbnail_path)
        source = os.path.join(samples_dir, sample)
        json = {"source": source, "destination": thumbnail_path, "height": 100}
        response = client.post("/", json=json)
        assert response.status_code == HTTP_CREATED