Repository: LibraryOfCongress/concordia
Branch: main
Commit: 80cc6e1b2573
Files: 673
Total size: 3.0 MB

Directory structure:
gitextract_frv4ewgf/

├── .cfnlintrc.yaml
├── .dockerignore
├── .github/
│   ├── ISSUE_TEMPLATE/
│   │   ├── bug_report.md
│   │   └── feature_request.md
│   ├── dependabot.yml
│   └── workflows/
│       ├── black.yml
│       ├── build.yml
│       ├── codeql.yml
│       ├── db_ops.yml
│       ├── dev-main-deploy.yml
│       ├── feature-branch-deploy.yml
│       ├── pip-audit.yml
│       ├── prod-deploy.yml
│       ├── renew_coverage.yml
│       ├── stage-hotfix-rel-deploy.yml
│       ├── stage-image-refresh.yml
│       ├── stage-release-deploy.yml
│       ├── test-main-deploy.yml
│       └── test.yml
├── .gitignore
├── Dockerfile
├── LICENSE.md
├── Loadtesting.md
├── MANIFEST.in
├── Makefile
├── Pipfile
├── README.md
├── build_containers.sh
├── celerybeat/
│   ├── Dockerfile
│   └── entrypoint.sh
├── cloudformation/
│   ├── LICENSE
│   ├── NOTICE
│   ├── README.md
│   ├── add_cloudflare_ips_to_sgs.py
│   ├── create_secrets.sh
│   ├── featurebranch.yaml
│   ├── images/
│   │   └── architecture-overview.graffle/
│   │       └── data.plist
│   ├── infrastructure/
│   │   ├── bastion-hosts.yaml
│   │   ├── data-load.yaml
│   │   ├── elasticache-feature.yaml
│   │   ├── elasticache.yaml
│   │   ├── elasticsearch.yaml
│   │   ├── fargate-cluster.yaml
│   │   ├── fargate-featurebranch.yaml
│   │   ├── jenkins-server.yaml
│   │   ├── network-acl.yaml
│   │   ├── opensearch.yaml
│   │   ├── rds.yaml
│   │   ├── search-proxy-task.yaml
│   │   ├── security-groups.yaml
│   │   └── vpc.yaml
│   ├── master.yaml
│   ├── stack_drift.sh
│   ├── sync_templates.sh
│   └── tests/
│       └── validate-templates.sh
├── concordia/
│   ├── __init__.py
│   ├── admin/
│   │   ├── __init__.py
│   │   ├── actions.py
│   │   ├── filters.py
│   │   ├── forms.py
│   │   ├── utils.py
│   │   └── views.py
│   ├── admin_site.py
│   ├── api/
│   │   ├── __init__.py
│   │   └── schemas.py
│   ├── api_views.py
│   ├── apps.py
│   ├── asgi.py
│   ├── authentication_backends.py
│   ├── celery.py
│   ├── consumers.py
│   ├── context_processors.py
│   ├── contextmanagers.py
│   ├── converters.py
│   ├── decorators.py
│   ├── documents.py
│   ├── exceptions.py
│   ├── forms.py
│   ├── logging.py
│   ├── maintenance.py
│   ├── management/
│   │   ├── __init__.py
│   │   └── commands/
│   │       ├── __init__.py
│   │       ├── calculate_difficulty_values.py
│   │       ├── create_load_test_fixtures.py
│   │       ├── ensure_initial_site_configuration.py
│   │       ├── import_site_reports.py
│   │       ├── prepare_load_test_db.py
│   │       └── print_frontend_test_urls.py
│   ├── middleware.py
│   ├── migrations/
│   │   ├── 0001_initial.py
│   │   ├── 0001_squashed_0040_remove_campaign_is_active.py
│   │   ├── 0002_auto_20181004_1848.py
│   │   ├── 0003_auto_20181004_2103.py
│   │   ├── 0004_auto_20181010_1715.py
│   │   ├── 0005_campaign_short_description.py
│   │   ├── 0006_campaignresource.py
│   │   ├── 0007_thumbnail_images.py
│   │   ├── 0008_auto_20181015_1711.py
│   │   ├── 0009_project_description.py
│   │   ├── 0010_auto_20181021_1659.py
│   │   ├── 0010_auto_20181022_1530.py
│   │   ├── 0011_auto_20181022_1532.py
│   │   ├── 0012_merge_20181022_1554.py
│   │   ├── 0013_auto_20181031_1305.py
│   │   ├── 0014_auto_20181115_1411.py
│   │   ├── 0015_auto_20181115_1436.py
│   │   ├── 0016_auto_20181115_1803.py
│   │   ├── 0017_change_transcription_supersedes_related_name.py
│   │   ├── 0018_auto_20181128_1611.py
│   │   ├── 0018_simplepage.py
│   │   ├── 0019_merge_20181128_1715.py
│   │   ├── 0020_auto_20181128_1718.py
│   │   ├── 0021_sitereport.py
│   │   ├── 0022_auto_20181211_1310.py
│   │   ├── 0023_auto_20190130_1555.py
│   │   ├── 0024_add_site_report_ordering.py
│   │   ├── 0024_auto_20190211_1420.py
│   │   ├── 0025_auto_20190329_1705.py
│   │   ├── 0025_unicode_slugs.py
│   │   ├── 0026_update_published_field_definition.py
│   │   ├── 0027_merge_20190423_1657.py
│   │   ├── 0028_asset_year.py
│   │   ├── 0029_assettranscriptionreservation_reservation_token.py
│   │   ├── 0030_auto_20190503_1559.py
│   │   ├── 0031_auto_20190509_1142.py
│   │   ├── 0032_topic_ordering.py
│   │   ├── 0033_simple_content_blocks.py
│   │   ├── 0034_auto_20190627_1438.py
│   │   ├── 0035_auto_20190627_1455.py
│   │   ├── 0036_auto_20190703_1203.py
│   │   ├── 0037_carouselslide.py
│   │   ├── 0038_sitereport_topic.py
│   │   ├── 0039_auto_20200129_1536.py
│   │   ├── 0040_auto_20200130_1756.py
│   │   ├── 0041_auto_20200203_1351.py
│   │   ├── 0042_auto_20200316_1623.py
│   │   ├── 0043_auto_20200323_1729.py
│   │   ├── 0044_auto_20200323_1827.py
│   │   ├── 0045_auto_20200323_1832.py
│   │   ├── 0046_auto_20200323_1907.py
│   │   ├── 0047_auto_20200324_1103.py
│   │   ├── 0048_auto_20200324_1820.py
│   │   ├── 0049_auto_20200324_2004.py
│   │   ├── 0050_auto_20210920_1544.py
│   │   ├── 0051_asset_storage_image.py
│   │   ├── 0052_auto_20220531_1331.py
│   │   ├── 0053_banner.py
│   │   ├── 0054_banner_active.py
│   │   ├── 0055_campaign_status.py
│   │   ├── 0056_auto_20220922_1508.py
│   │   ├── 0057_resource_resource_type.py
│   │   ├── 0058_banner_slug.py
│   │   ├── 0059_resourcefile.py
│   │   ├── 0060_alter_resourcefile_resource.py
│   │   ├── 0061_auto_20230201_1453.py
│   │   ├── 0061_sitereport_registered_contributors.py
│   │   ├── 0062_resourcefile_updated_on.py
│   │   ├── 0062_userretiredcampaign.py
│   │   ├── 0063_banner_alert_status.py
│   │   ├── 0064_alter_banner_alert_status.py
│   │   ├── 0065_alter_userretiredcampaign_unique_together.py
│   │   ├── 0066_auto_20230217_1302.py
│   │   ├── 0066_campaignretirementprogress.py
│   │   ├── 0067_alter_campaignretirementprogress_campaign.py
│   │   ├── 0068_campaignretirementprogress_complete.py
│   │   ├── 0069_merge_20230224_1446.py
│   │   ├── 0070_alter_campaign_options.py
│   │   ├── 0071_auto_20230306_1456.py
│   │   ├── 0072_merge_20230313_1047.py
│   │   ├── 0073_auto_20230314_1327.py
│   │   ├── 0074_auto_20230314_1341.py
│   │   ├── 0075_auto_20230327_1333.py
│   │   ├── 0076_sitereport_report_name.py
│   │   ├── 0077_alter_sitereport_report_name.py
│   │   ├── 0078_alter_sitereport_report_name.py
│   │   ├── 0079_auto_20230601_1234.py
│   │   ├── 0080_auto_20230602_0920.py
│   │   ├── 0081_sitereport_review_actions.py
│   │   ├── 0082_delete_userretiredcampaign.py
│   │   ├── 0083_sitereport_daily_active_users.py
│   │   ├── 0084_rename_review_actions_sitereport_daily_review_actions.py
│   │   ├── 0085_auto_20231016_1432.py
│   │   ├── 0086_auto_20231215_1311.py
│   │   ├── 0087_auto_20240213_0756.py
│   │   ├── 0088_alter_simplepage_body.py
│   │   ├── 0089_campaign_image_alt_text.py
│   │   ├── 0090_auto_20240408_1334.py
│   │   ├── 0091_guide_simple_page.py
│   │   ├── 0092_auto_20240509_1522.py
│   │   ├── 0093_asset_campaign.py
│   │   ├── 0094_alter_asset_campaign.py
│   │   ├── 0095_transcription_rolled_back_and_more.py
│   │   ├── 0096_transcription_source.py
│   │   ├── 0097_alter_sitereport_options_userprofile_review_count_and_more.py
│   │   ├── 0098_userprofile_create_and_population.py
│   │   ├── 0099_alter_campaign_display_on_homepage_and_more.py
│   │   ├── 0100_researchcenter.py
│   │   ├── 0101_auto_20241119_1215.py
│   │   ├── 0102_campaign_research_centers.py
│   │   ├── 0103_alter_item_title.py
│   │   ├── 0104_nexttranscribabletopicasset_and_more.py
│   │   ├── 0105_nextreviewablecampaignasset_concordia_n_transcr_aafdba_gin_and_more.py
│   │   ├── 0106_alter_nextreviewablecampaignasset_options_and_more.py
│   │   ├── 0107_alter_nextreviewablecampaignasset_options_and_more.py
│   │   ├── 0108_add_next_asset_cache_periodic_task.py
│   │   ├── 0109_alter_nextreviewablecampaignasset_asset_and_more.py
│   │   ├── 0110_remove_asset_media_url_alter_asset_storage_image.py
│   │   ├── 0111_auto_20250428_1023.py
│   │   ├── 0112_projecttopic_url_filter_alter_projecttopic_id.py
│   │   ├── 0113_create_asset_status_periodic_task.py
│   │   ├── 0114_create_daily_activity_periodic_task.py
│   │   ├── 0115_alter_asset_storage_image_alter_banner_link_and_more.py
│   │   ├── 0116_item_thumbnail_image.py
│   │   ├── 0117_alter_projecttopic_options_projecttopic_ordering.py
│   │   ├── 0118_asset_concordia_a_item_id_f10916_idx_and_more.py
│   │   ├── 0119_remove_asset_concordia_a_id_137ca8_idx_and_more.py
│   │   ├── 0120_sitereport_assets_started.py
│   │   ├── 0121_keymetricsreport.py
│   │   ├── 0122_alter_item_title.py
│   │   ├── 0123_alter_campaignretirementprogress_options.py
│   │   ├── 0124_update_periodic_task_paths.py
│   │   ├── 0125_update_userprofile_tasks.py
│   │   ├── 0126_concordiafile_helpfullink_remove_resource_campaign_and_more.py
│   │   ├── 0127_alter_campaignretirementprogress_options_and_more.py
│   │   ├── 0128_alter_campaignretirementprogress_options.py
│   │   └── __init__.py
│   ├── models.py
│   ├── parser.py
│   ├── passwords/
│   │   ├── LICENSE
│   │   ├── __init__.py
│   │   └── validators.py
│   ├── routing.py
│   ├── secrets.py
│   ├── settings_dev.py
│   ├── settings_docker.py
│   ├── settings_ecs.py
│   ├── settings_loadtest.py
│   ├── settings_local_test.py
│   ├── settings_template.py
│   ├── settings_test.py
│   ├── signals/
│   │   ├── __init__.py
│   │   ├── handlers.py
│   │   └── signals.py
│   ├── static/
│   │   ├── admin/
│   │   │   ├── custom-inline.js
│   │   │   └── editor-preview.js
│   │   ├── js/
│   │   │   └── src/
│   │   │       ├── about-accordions.js
│   │   │       ├── asset-reservation.js
│   │   │       ├── banner.js
│   │   │       ├── base.js
│   │   │       ├── campaign-selection.js
│   │   │       ├── contribute.js
│   │   │       ├── filter-assets.js
│   │   │       ├── guide.js
│   │   │       ├── homepage-carousel.js
│   │   │       ├── modules/
│   │   │       │   ├── accessible-colors.js
│   │   │       │   ├── chroma-esm.js
│   │   │       │   ├── concordia-visualization.js
│   │   │       │   ├── quick-tips.js
│   │   │       │   ├── turnstile.js
│   │   │       │   └── visualization-errors.js
│   │   │       ├── ocr.js
│   │   │       ├── password-validation.js
│   │   │       ├── profile-fields.js
│   │   │       ├── quick-tips-setup.js
│   │   │       ├── recent-pages.js
│   │   │       ├── viewer-split.js
│   │   │       ├── viewer.js
│   │   │       └── visualizations/
│   │   │           ├── asset-status-by-campaign.js
│   │   │           ├── asset-status-overview.js
│   │   │           └── daily-activity.js
│   │   ├── scss/
│   │   │   ├── _variables.scss
│   │   │   └── base.scss
│   │   └── vendor/
│   │       └── jquery.cookie.js
│   ├── storage.py
│   ├── storage_backends.py
│   ├── tasks/
│   │   ├── __init__.py
│   │   ├── assets.py
│   │   ├── blog.py
│   │   ├── housekeeping.py
│   │   ├── next_asset/
│   │   │   ├── __init__.py
│   │   │   ├── renew.py
│   │   │   ├── reviewable.py
│   │   │   └── transcribable.py
│   │   ├── reports/
│   │   │   ├── __init__.py
│   │   │   ├── backfill.py
│   │   │   ├── key_metrics.py
│   │   │   └── sitereport.py
│   │   ├── reservations.py
│   │   ├── retirement.py
│   │   ├── search_index.py
│   │   ├── thumbnails.py
│   │   ├── unusualactivity.py
│   │   ├── useractivity.py
│   │   └── visualizations.py
│   ├── templates/
│   │   ├── 404.html
│   │   ├── 429.html
│   │   ├── 500.html
│   │   ├── 503.html
│   │   ├── account/
│   │   │   ├── account_deletion.html
│   │   │   ├── email_reconfirmation_failed.html
│   │   │   └── profile.html
│   │   ├── admin/
│   │   │   ├── auth/
│   │   │   │   └── user/
│   │   │   │       └── change_form.html
│   │   │   ├── base_site.html
│   │   │   ├── bulk_change.html
│   │   │   ├── bulk_import.html
│   │   │   ├── bulk_review.html
│   │   │   ├── celery_task.html
│   │   │   ├── clear_cache.html
│   │   │   ├── concordia/
│   │   │   │   ├── asset/
│   │   │   │   │   ├── change_form.html
│   │   │   │   │   └── change_list.html
│   │   │   │   ├── campaign/
│   │   │   │   │   ├── change_form.html
│   │   │   │   │   └── retire.html
│   │   │   │   ├── item/
│   │   │   │   │   └── change_form.html
│   │   │   │   ├── project/
│   │   │   │   │   ├── change_form.html
│   │   │   │   │   └── item_import.html
│   │   │   │   ├── simplepage/
│   │   │   │   │   └── change_form.html
│   │   │   │   └── transcription/
│   │   │   │       └── change_form.html
│   │   │   ├── index.html
│   │   │   ├── long_name_filter.html
│   │   │   ├── process_bagit.html
│   │   │   └── project_level_export.html
│   │   ├── base.html
│   │   ├── django_registration/
│   │   │   ├── activation_complete.html
│   │   │   ├── activation_email_body.txt
│   │   │   ├── activation_email_subject.txt
│   │   │   ├── activation_failed.html
│   │   │   ├── registration_closed.html
│   │   │   ├── registration_complete.html
│   │   │   └── registration_form.html
│   │   ├── documents/
│   │   │   └── service_letter.html
│   │   ├── emails/
│   │   │   ├── delete_account_body.txt
│   │   │   ├── delete_account_subject.txt
│   │   │   ├── email_reconfirmation_body.txt
│   │   │   ├── email_reconfirmation_subject.txt
│   │   │   ├── unusual_activity.html
│   │   │   ├── unusual_activity.txt
│   │   │   ├── welcome_email_body.html
│   │   │   ├── welcome_email_body.txt
│   │   │   └── welcome_email_subject.txt
│   │   ├── error.html
│   │   ├── forms/
│   │   │   └── widgets/
│   │   │       ├── email.html
│   │   │       └── turnstile_widget.html
│   │   ├── fragments/
│   │   │   ├── _filter-buttons.html
│   │   │   ├── _modal_footer.html
│   │   │   ├── activity-filter-sort.html
│   │   │   ├── codemirror.html
│   │   │   ├── common-stylesheets.html
│   │   │   ├── featured_blog_posts.html
│   │   │   ├── recent-pages.html
│   │   │   ├── sharing-button-group.html
│   │   │   ├── standard-pagination.html
│   │   │   ├── transcription-progress-bar.html
│   │   │   ├── transcription-progress-row.html
│   │   │   └── transcription-status-filters.html
│   │   ├── home.html
│   │   ├── registration/
│   │   │   ├── activate.html
│   │   │   ├── login.html
│   │   │   ├── password_change_done.html
│   │   │   ├── password_change_form.html
│   │   │   ├── password_reset_complete.html
│   │   │   ├── password_reset_confirm.html
│   │   │   ├── password_reset_done.html
│   │   │   ├── password_reset_email.html
│   │   │   ├── password_reset_form.html
│   │   │   └── password_reset_subject.txt
│   │   ├── static-page.html
│   │   └── transcriptions/
│   │       ├── asset_detail/
│   │       │   ├── asset_reservation_failure_modal.html
│   │       │   ├── editor.html
│   │       │   ├── error_modal.html
│   │       │   ├── guide.html
│   │       │   ├── language_selection_modal.html
│   │       │   ├── navigation.html
│   │       │   ├── nothing_to_transcribe_modal.html
│   │       │   ├── ocr_help_modal.html
│   │       │   ├── ocr_transcription_modal.html
│   │       │   ├── quick_tips_modal.html
│   │       │   ├── review_accepted_modal.html
│   │       │   ├── successful_submission_modal.html
│   │       │   ├── tags.html
│   │       │   ├── viewer.html
│   │       │   └── viewer_filters.html
│   │       ├── asset_detail.html
│   │       ├── campaign_detail.html
│   │       ├── campaign_detail_completed.html
│   │       ├── campaign_detail_retired.html
│   │       ├── campaign_list.html
│   │       ├── campaign_list_small_blocks.html
│   │       ├── campaign_report.html
│   │       ├── campaign_small_block.html
│   │       ├── campaign_topic_list.html
│   │       ├── completed_campaigns_section.html
│   │       ├── item_detail.html
│   │       ├── project_detail.html
│   │       ├── topic_detail.html
│   │       └── transcription.html
│   ├── templatetags/
│   │   ├── __init__.py
│   │   ├── concordia_filtering_tags.py
│   │   ├── concordia_media_tags.py
│   │   ├── concordia_querystring.py
│   │   ├── concordia_sharing_tags.py
│   │   ├── concordia_text_tags.py
│   │   ├── custom_math.py
│   │   ├── group_list.py
│   │   ├── reject_filter.py
│   │   ├── truncation.py
│   │   └── visualization.py
│   ├── tests/
│   │   ├── README.md
│   │   ├── __init__.py
│   │   ├── axe.py
│   │   ├── data/
│   │   │   └── site_reports.csv
│   │   ├── test_account_views.py
│   │   ├── test_admin.py
│   │   ├── test_admin_actions.py
│   │   ├── test_admin_filters.py
│   │   ├── test_admin_forms.py
│   │   ├── test_admin_views.py
│   │   ├── test_api_views.py
│   │   ├── test_authentication.py
│   │   ├── test_celery.py
│   │   ├── test_consumers.py
│   │   ├── test_contextmanagers.py
│   │   ├── test_decorators.py
│   │   ├── test_fields.py
│   │   ├── test_logging.py
│   │   ├── test_maintenance.py
│   │   ├── test_management_commands.py
│   │   ├── test_models.py
│   │   ├── test_parser.py
│   │   ├── test_registration_views.py
│   │   ├── test_s3.py
│   │   ├── test_selenium.py
│   │   ├── test_sentry.py
│   │   ├── test_signals.py
│   │   ├── test_tasks_assets.py
│   │   ├── test_tasks_blog.py
│   │   ├── test_tasks_housekeeping.py
│   │   ├── test_tasks_next_asset.py
│   │   ├── test_tasks_reports_backfill.py
│   │   ├── test_tasks_reports_key_metrics.py
│   │   ├── test_tasks_reports_sitereport.py
│   │   ├── test_tasks_retirement.py
│   │   ├── test_tasks_search_index.py
│   │   ├── test_tasks_thumbnails.py
│   │   ├── test_tasks_unusualactivity.py
│   │   ├── test_tasks_useractivity.py
│   │   ├── test_tasks_visualizations.py
│   │   ├── test_templatetags.py
│   │   ├── test_top_level_views.py
│   │   ├── test_utils_celery.py
│   │   ├── test_utils_logging.py
│   │   ├── test_utils_next_asset_reviewable_campaign.py
│   │   ├── test_utils_next_asset_reviewable_topic.py
│   │   ├── test_utils_next_asset_transcribable_campaign.py
│   │   ├── test_utils_next_asset_transcribable_topic.py
│   │   ├── test_validators.py
│   │   ├── test_view_decorators.py
│   │   ├── test_views.py
│   │   ├── test_views_asset_reservation.py
│   │   ├── test_views_redirect_next_reviewable.py
│   │   ├── test_views_redirect_next_transcribable.py
│   │   ├── test_views_tags.py
│   │   ├── test_views_topics.py
│   │   ├── test_views_transcription_review.py
│   │   ├── test_views_transcription_save.py
│   │   ├── test_views_transcription_submit.py
│   │   ├── test_views_utils.py
│   │   ├── test_widgets.py
│   │   └── utils.py
│   ├── turnstile/
│   │   ├── LICENSE
│   │   ├── __init__.py
│   │   ├── context_processors.py
│   │   ├── fields.py
│   │   └── widgets.py
│   ├── urls.py
│   ├── utils/
│   │   ├── __init__.py
│   │   ├── celery.py
│   │   ├── constants.py
│   │   └── next_asset/
│   │       ├── __init__.py
│   │       ├── reviewable/
│   │       │   ├── __init__.py
│   │       │   ├── campaign.py
│   │       │   └── topic.py
│   │       └── transcribable/
│   │           ├── __init__.py
│   │           ├── campaign.py
│   │           └── topic.py
│   ├── validators.py
│   ├── version.py
│   ├── views/
│   │   ├── README.md
│   │   ├── __init__.py
│   │   ├── accounts.py
│   │   ├── ajax.py
│   │   ├── assets.py
│   │   ├── campaigns.py
│   │   ├── decorators.py
│   │   ├── items.py
│   │   ├── maintenance_mode.py
│   │   ├── projects.py
│   │   ├── rate_limit.py
│   │   ├── simple_pages.py
│   │   ├── topics.py
│   │   ├── utils.py
│   │   └── visualizations.py
│   ├── widgets.py
│   └── wsgi.py
├── configuration/
│   ├── __init__.py
│   ├── admin.py
│   ├── apps.py
│   ├── management/
│   │   ├── __init__.py
│   │   └── commands/
│   │       ├── __init__.py
│   │       └── configcache.py
│   ├── migrations/
│   │   ├── 0001_initial.py
│   │   ├── 0002_populate_configurations.py
│   │   ├── 0003_populate_retry_configurations.py
│   │   ├── 0004_alter_configuration_options.py
│   │   ├── 0005_alter_configuration_data_type.py
│   │   ├── 0006_populate_next_asset_rate_limit.py
│   │   └── __init__.py
│   ├── models.py
│   ├── signals.py
│   ├── templates/
│   │   └── admin/
│   │       └── configuration_confirm_update.html
│   ├── templatetags/
│   │   ├── __init__.py
│   │   └── configuration_tags.py
│   ├── tests/
│   │   ├── __init__.py
│   │   ├── test_admin.py
│   │   ├── test_models.py
│   │   ├── test_signals.py
│   │   ├── test_templatetags.py
│   │   ├── test_utils.py
│   │   └── test_validation.py
│   ├── utils.py
│   ├── validation.py
│   └── views.py
├── db_scripts/
│   ├── Dockerfile
│   ├── dump.sh
│   └── restore.sh
├── development/
│   ├── Containerfile
│   ├── README.md
│   └── compose.yml
├── docker-compose.yml
├── docs/
│   ├── accessibility-goals.md
│   ├── accessibility-techniques.md
│   ├── design-principles.md
│   ├── for-developers.md
│   └── how-we-work.md
├── entrypoint.sh
├── exporter/
│   ├── __init__.py
│   ├── admin.py
│   ├── apps.py
│   ├── exceptions.py
│   ├── migrations/
│   │   └── __init__.py
│   ├── models.py
│   ├── tabular_export/
│   │   ├── admin.py
│   │   └── core.py
│   ├── templates/
│   │   └── admin/
│   │       └── exporter/
│   │           └── unacceptable_character_report.html
│   ├── tests/
│   │   ├── __init__.py
│   │   ├── test_exceptions.py
│   │   ├── test_tabular_export.py
│   │   ├── test_utils.py
│   │   └── test_views.py
│   ├── utils.py
│   └── views.py
├── fixtures/
│   └── original-static-pages.json
├── frontend/
│   ├── .gitignore
│   ├── README.md
│   ├── eslint.config.js
│   ├── index.html
│   ├── package.json
│   ├── src/
│   │   ├── App.jsx
│   │   ├── ViewerSplit.jsx
│   │   ├── config.js
│   │   ├── editor/
│   │   │   ├── Buttons.jsx
│   │   │   ├── Editor.jsx
│   │   │   ├── Header.jsx
│   │   │   ├── StatusMessages.jsx
│   │   │   ├── TranscriptionTextarea.jsx
│   │   │   └── buttons/
│   │   │       ├── Editable.jsx
│   │   │       ├── Redo.jsx
│   │   │       ├── Review.jsx
│   │   │       ├── Save.jsx
│   │   │       ├── Submit.jsx
│   │   │       └── Undo.jsx
│   │   ├── main.jsx
│   │   ├── ocr/
│   │   │   ├── Button.jsx
│   │   │   ├── ConfirmModal.jsx
│   │   │   ├── Handler.jsx
│   │   │   ├── HelpModal.jsx
│   │   │   ├── LanguageModal.jsx
│   │   │   └── Section.jsx
│   │   └── viewer/
│   │       ├── Controls.jsx
│   │       ├── FilterTabNav.jsx
│   │       ├── GammaFilterForm.jsx
│   │       ├── ImageFilters.jsx
│   │       ├── InvertFilterForm.jsx
│   │       ├── KeyboardHelpModal.jsx
│   │       ├── KeyboardShortcutRow.jsx
│   │       ├── ThresholdFilterForm.jsx
│   │       └── Viewer.jsx
│   └── vite.config.js
├── importer/
│   ├── Dockerfile
│   ├── README.md
│   ├── __init__.py
│   ├── admin.py
│   ├── apps.py
│   ├── celery.py
│   ├── config.py
│   ├── entrypoint.sh
│   ├── exceptions.py
│   ├── migrations/
│   │   ├── 0001_initial.py
│   │   ├── 0001_squashed_0015_auto_20180925_1851.py
│   │   ├── 0002_auto_20180709_0833.py
│   │   ├── 0003_auto_20180709_0933.py
│   │   ├── 0004_auto_20180812_1007.py
│   │   ├── 0005_auto_20180816_1702.py
│   │   ├── 0006_auto_20180912_0229.py
│   │   ├── 0007_auto_20180917_1654.py
│   │   ├── 0008_campaigntaskdetails_project.py
│   │   ├── 0009_convert_project_text_to_keys.py
│   │   ├── 0010_auto_20180920_2013.py
│   │   ├── 0011_auto_20180922_0208.py
│   │   ├── 0012_auto_20180923_0231.py
│   │   ├── 0013_auto_20180924_1318.py
│   │   ├── 0014_auto_20180924_1943.py
│   │   ├── 0015_auto_20180925_1851.py
│   │   ├── 0016_importitem_failure_reason_and_more.py
│   │   ├── 0017_importitem_failure_history_importitem_retry_count_and_more.py
│   │   ├── 0018_importitem_status_history_and_more.py
│   │   ├── 0019_alter_downloadassetimagejob_batch_and_more.py
│   │   ├── 0020_alter_downloadassetimagejob_unique_together_and_more.py
│   │   └── __init__.py
│   ├── models.py
│   ├── setup.py
│   ├── tasks/
│   │   ├── __init__.py
│   │   ├── assets.py
│   │   ├── collections.py
│   │   ├── decorators.py
│   │   ├── images.py
│   │   └── items.py
│   ├── tests/
│   │   ├── README.md
│   │   ├── __init__.py
│   │   ├── test_admin.py
│   │   ├── test_celery.py
│   │   ├── test_models.py
│   │   ├── test_tasks_assets.py
│   │   ├── test_tasks_collections.py
│   │   ├── test_tasks_core.py
│   │   ├── test_tasks_decorators.py
│   │   ├── test_tasks_images.py
│   │   ├── test_tasks_items.py
│   │   ├── test_utils.py
│   │   └── utils.py
│   └── utils/
│       ├── __init__.py
│       ├── excel.py
│       └── verify_images.py
├── load_test.sh
├── locustfile.py
├── manage.py
├── package.json
├── postgresql/
│   └── create-multiple-postgresql-databases.sh
├── prometheus_metrics/
│   ├── LICENSE
│   ├── __init__.py
│   ├── apps.py
│   ├── middleware.py
│   ├── models.py
│   └── views.py
├── pylenium.json
├── pyproject.toml
├── setup.cfg
├── setup.py
├── src/
│   ├── about.js
│   ├── main.js
│   └── profile.js
├── static/
│   └── .gitignore
├── tools/
│   └── readme_symbol_check.py
└── vite.config.js

================================================
FILE CONTENTS
================================================

================================================
FILE: .cfnlintrc.yaml
================================================
# W2001 ("Check if Parameters are Used") is ignored because of the featurebranch.yaml
# DataLoadStackName parameter in the nested stack fargate-featurebranch.yaml, which is
# used to signal when the DataLoadHost UserData commands are complete.
ignore_checks:
    - W2001


================================================
FILE: .dockerignore
================================================
node_modules
static-files


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.md
================================================
---
name: Bug report
about: Create a report to help us improve
---

**What behavior did you observe? Please describe the bug**
A clear and concise description of what you experienced.

**How can we reproduce the bug?**
Steps to reproduce the behavior:

1. Go to '...'
2. Click on '....'
3. Scroll down to '....'
4. See error

**What is the expected behavior?**
A clear and concise description of what you expected to happen.

**Got screenshots? This helps us identify the issue**
Add screenshots to help explain your problem.

**Desktop (please complete the following information):**

-   OS: [e.g. Windows, macOS]
-   Browser: [e.g. Chrome, Safari]

**Additional context**
Add any other context about the problem here.


================================================
FILE: .github/ISSUE_TEMPLATE/feature_request.md
================================================
---
name: Feature request
about: Suggest an idea for this project
---

**User story/persona**
As {a user}, I want to {action} so that I can {goal}

**Is your feature request related to a problem? Please describe.**
A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]

**Additional context**
Add any other context or screenshots about the feature request here.

**Acceptance Criteria**
Add a list of items this new feature needs to meet. Ex: The user cannot submit a form unless all the mandatory fields are entered.

**Acceptance Test:**
Add a list of steps a user can follow to check whether the functionality satisfies the acceptance criteria.


================================================
FILE: .github/dependabot.yml
================================================
# To get started with Dependabot version updates, you'll need to specify which
# package ecosystems to update and where the package manifests are located.
# Please see the documentation for all configuration options:
# https://docs.github.com/code-security/dependabot/dependabot-version-updates/configuration-options-for-the-dependabot.yml-file

version: 2
updates:
    # For GitHub Actions the directory must be '/': Dependabot then scans
    # .github/workflows (plus any root-level action.yml / action.yaml) on its
    # own. Any other value is treated as a literal repository folder to search
    # for workflow files, so '/workflows' matched nothing in this repository.
    - package-ecosystem: 'github-actions' # See documentation for possible values
      directory: '/' # Location of package manifests
      schedule:
          interval: 'weekly'
    # JavaScript dependencies declared by the package.json at the repository root.
    - package-ecosystem: 'npm' # See documentation for possible values
      directory: '/' # Location of package manifests
      schedule:
          interval: 'daily'
    # Python dependencies declared by manifests at the repository root.
    - package-ecosystem: 'pip' # See documentation for possible values
      directory: '/' # Location of package manifests
      schedule:
          interval: 'daily'


================================================
FILE: .github/workflows/black.yml
================================================
# Lint workflow: runs the psf/black GitHub Action against the checked-out code.
name: Lint

# Triggers: manual dispatch, or a pull request targeting main, feature-* or
# release. A pull request that changes only files matching paths-ignore does
# not trigger the workflow.
on:
    workflow_dispatch:
    pull_request:
        branches: [main, 'feature-*', release]
        paths-ignore:
            - docs/**
            - README.md
            - .github/**
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**

jobs:
    lint:
        runs-on: ubuntu-latest
        steps:
            - uses: actions/checkout@v6
            # Python 3.12 is made available before the Black action runs.
            - uses: actions/setup-python@v6
              with:
                  python-version: '3.12'
            # No inputs are passed, so the action runs with its own defaults.
            - uses: psf/black@stable


================================================
FILE: .github/workflows/build.yml
================================================
# Build workflow: verifies that the three container images (main application,
# importer, celerybeat) can be built from the repository.
name: 'Build'

# Triggers: manual dispatch, or a pull request targeting main, feature-* or
# release. A pull request that changes only files matching paths-ignore does
# not trigger the workflow.
on:
    workflow_dispatch:
    pull_request:
        branches: [main, 'feature-*', release]
        paths-ignore:
            - docs/**
            - README.md
            - .github/**
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**

jobs:
    build:
        name: Build
        runs-on: ubuntu-latest

        steps:
            # Upgrades the runner's packages, then installs the listed
            # development libraries (memcached, zlib, freetype, tiff, jpeg,
            # openjpeg, webp, libpq) on the runner itself.
            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev

            - name: Install node and npm
              uses: actions/setup-node@v6
              with:
                  node-version: '20'

            - name: Checkout repository
              uses: actions/checkout@v6

            # NOTE(review): the only build commands below are `docker build`
            # invocations; whether the host-level Node/Python setup and system
            # packages are still required is not evident from this file — confirm.
            - name: Set up Python 3.12
              uses: actions/setup-python@v6
              with:
                  # Semantic version range syntax or exact version of a Python version
                  python-version: '3.12'
                  # Optional - x64 or x86 architecture, defaults to x64
                  architecture: 'x64'

            - name: Display Python version
              run: python -c "import sys; print(sys.version)"

            # All three images use the repository root as the build context;
            # the importer and celerybeat images use their own Dockerfiles.
            - name: build containers
              run: |
                  docker build -t concordia .
                  docker build -t concordia/importer --file importer/Dockerfile .
                  docker build -t concordia/celerybeat --file celerybeat/Dockerfile .


================================================
FILE: .github/workflows/codeql.yml
================================================
# CodeQL workflow: runs CodeQL analysis once per language in the matrix
# (javascript-typescript and python).
name: 'CodeQL Advanced'

# Triggers: manual dispatch; pushes to main or feature-*; pull requests
# targeting main, feature-* or release (skipped when only paths-ignore files
# change); and a weekly schedule.
on:
    workflow_dispatch:
    push:
        branches: [main, 'feature-*']
    pull_request:
        branches: [main, 'feature-*', release]
        paths-ignore:
            - docs/**
            - README.md
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**
    schedule:
        # 23:20 UTC every Tuesday.
        - cron: '20 23 * * 2'

jobs:
    analyze:
        name: Analyze (${{ matrix.language }})
        runs-on: ubuntu-latest

        # security-events: write lets the job upload analysis results; the
        # remaining scopes are read-only.
        permissions:
            actions: read
            contents: read
            security-events: write
            packages: read

        strategy:
            # One language failing does not cancel the other matrix entry.
            fail-fast: false
            matrix:
                include:
                    - language: javascript-typescript
                      build-mode: none
                    - language: python
                      build-mode: none

        steps:
            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev

            - name: Checkout repository
              uses: actions/checkout@v6

            # Python is only set up for the python matrix entry.
            - if: matrix.language == 'python'
              name: Setup python
              uses: actions/setup-python@v6
              with:
                  python-version: '3.12'

            # Initializes the CodeQL tools for scanning.
            - name: Initialize CodeQL
              uses: github/codeql-action/init@v4
              with:
                  languages: ${{ matrix.language }}
                  build-mode: ${{ matrix.build-mode }}

            # Python entry only: installs pipenv and then the project's
            # dependencies, including dev packages, from the Pipfile
            # (--deploy fails if Pipfile.lock is out of date).
            - if: matrix.language == 'python'
              run: |
                  pip install -U packaging
                  pip install -U setuptools
                  pip install pipenv
                  pipenv install --dev --deploy

            # The category keeps each language's results separate.
            - name: Perform CodeQL Analysis
              uses: github/codeql-action/analyze@v4
              with:
                  category: '/language:${{matrix.language}}'


================================================
FILE: .github/workflows/db_ops.yml
================================================
# Manually triggered pipeline that builds or promotes the database dump and
# restore images.
name: DB Operations Multi-Repo Pipeline

on:
    workflow_dispatch:
        inputs:
            # Which pipeline action to run.
            action_type:
                description: Action
                required: true
                default: build_test
                type: choice
                options:
                    - build_test
                    - promote_to_latest
            # Which of the two images the action applies to.
            operation:
                description: Operation
                required: true
                default: dump
                type: choice
                options:
                    - dump
                    - restore

env:
    AWS_REGION: us-east-1
    # ECR repository name used for each operation.
    DUMP_REPO: crowd-db-dump
    RESTORE_REPO: crowd-db-restore

jobs:
    process:
        runs-on: ubuntu-latest
        steps:
            - name: Checkout Code
              uses: actions/checkout@v6

            - name: Configure AWS Credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            # LOGIC: Determine Repo Name and Docker Stage Target
            # The user-supplied input is passed through an environment variable
            # instead of being expanded into the script text, so its value can
            # never be interpreted as shell code.
            - name: Set Variables
              id: vars
              env:
                  OPERATION: ${{ github.event.inputs.operation }}
              run: |
                  if [[ "$OPERATION" == "dump" ]]; then
                    echo "REPO_NAME=${{ env.DUMP_REPO }}" >> "$GITHUB_OUTPUT"
                    echo "STAGE_TARGET=dump" >> "$GITHUB_OUTPUT"
                  else
                    echo "REPO_NAME=${{ env.RESTORE_REPO }}" >> "$GITHUB_OUTPUT"
                    echo "STAGE_TARGET=restore" >> "$GITHUB_OUTPUT"
                  fi

            # ACTION 1: BUILD AND PUSH 'test'
            - name: Build and Push Test
              if: ${{ github.event.inputs.action_type == 'build_test' }}
              uses: docker/build-push-action@v7
              with:
                  # context: defines where the 'COPY' commands look for files
                  context: ./db_scripts
                  # file: path to the actual Dockerfile relative to repo root
                  file: ./db_scripts/Dockerfile
                  # target: tells Docker to stop at the 'dump' or 'restore' stage
                  target: ${{ steps.vars.outputs.STAGE_TARGET }}
                  push: true
                  tags: ${{ steps.login-ecr.outputs.registry }}/${{ steps.vars.outputs.REPO_NAME }}:test

            # ACTION 2: PROMOTE 'test' to 'latest'
            # Re-tags inside ECR by fetching the manifest of the 'test' image
            # and putting it back under the 'latest' tag; no image is pulled.
            - name: Promote Test to Latest
              if: ${{ github.event.inputs.action_type == 'promote_to_latest' }}
              env:
                  REPO: ${{ steps.vars.outputs.REPO_NAME }}
              run: |
                  MANIFEST=$(aws ecr batch-get-image \
                    --repository-name "$REPO" \
                    --image-ids imageTag=test \
                    --query 'images[0].imageManifest' \
                    --output text)

                  # With text output the CLI prints "None" when the query
                  # matches nothing, i.e. no image carries the 'test' tag.
                  if [[ -z "$MANIFEST" || "$MANIFEST" == "None" ]]; then
                    echo "::error::No image tagged 'test' found in ECR repository '$REPO'; run build_test first."
                    exit 1
                  fi

                  aws ecr put-image \
                    --repository-name "$REPO" \
                    --image-tag latest \
                    --image-manifest "$MANIFEST"


================================================
FILE: .github/workflows/dev-main-deploy.yml
================================================
# Builds the application images from main and rolls them out to the dev service.
name: Deploy to dev

on:
    workflow_dispatch:
    push:
        branches:
            - main
        # Path filter for pushes: changes under these paths are ignored when
        # deciding whether to run.
        # NOTE(review): cloudformation/tests/** is already matched by
        # cloudformation/**, so that entry is redundant.
        paths-ignore:
            - docs/**
            - README.md
            - .github/**
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**
            - cloudformation/tests/**
            - concordia/tests/**
            - exporter/tests/**
            - importer/tests/**

env:
    AWS_REGION: us-east-1

permissions:
    # NOTE(review): id-token: write allows requesting an OIDC token, but the
    # job authenticates with static access keys - confirm it is still needed.
    id-token: write
    contents: read

jobs:
    deploy:
        name: Deploy to Dev
        runs-on: ubuntu-latest
        environment:
            name: development

        steps:
            # Refresh the apt index, upgrade installed packages and add the
            # development headers listed below.
            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev

            - name: Install node and npm
              uses: actions/setup-node@v6
              with:
                  node-version: '20'

            # Full history and tags are fetched because the version number
            # below is derived from git metadata by setuptools_scm.
            - name: Checkout repository
              uses: actions/checkout@v6
              with:
                  fetch-depth: 0
                  fetch-tags: 'true'

            - name: Set up Python 3.12
              uses: actions/setup-python@v6
              with:
                  # Semantic version range syntax or exact version of a Python version
                  python-version: '3.12'
                  # Optional - x64 or x86 architecture, defaults to x64
                  architecture: 'x64'

            # Exports `version_number` to later steps: the setuptools_scm
            # version with everything from the first '+' onwards removed.
            - name: Install Python Dependencies and Retrieve Version Number
              id: python-build
              run: |
                  python3 -m pip install --upgrade pip
                  pip3 install -U setuptools
                  pip3 install -U setuptools-scm

                  FULL_VERSION_NUMBER="$(python3 -m setuptools_scm)"
                  echo "version_number=$(echo "${FULL_VERSION_NUMBER}" | cut -d '+' -f 1)" >> "$GITHUB_ENV"

            - name: configure aws credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            # Build the three images, publish each under both the computed
            # version and the environment's moving tag, then force the ECS
            # service to start a new deployment.
            - name: Build, tag and push docker images ECR
              env:
                  REGISTRY: ${{ steps.login-ecr.outputs.registry }}
                  IMAGE_TAG: ${{ secrets.IMAGE_TAG }}
                  CLUSTER: ${{ secrets.CLUSTER }}
                  TARGET_SERVICE: ${{ secrets.TARGET_SERVICE }}
              run: |
                  docker build -t concordia .
                  docker build -t concordia/importer --file importer/Dockerfile .
                  docker build -t concordia/celerybeat --file celerybeat/Dockerfile .

                  images=(concordia concordia/importer concordia/celerybeat)

                  # Tag every image first, then push, in the same order as the
                  # previous hand-written command list.
                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker tag "$image:latest" "$REGISTRY/$image:$tag"
                      done
                  done

                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker push "$REGISTRY/$image:$tag"
                      done
                  done

                  aws ecs update-service --region "${{ env.AWS_REGION }}" --force-new-deployment --cluster "$CLUSTER" --service "$TARGET_SERVICE"


================================================
FILE: .github/workflows/feature-branch-deploy.yml
================================================
# Builds the application images for a feature branch and rolls them out.
name: Deploy feature branch to test

on:
    workflow_dispatch:
    push:
        branches:
            - 'feature-*'
        # Path filter for pushes: changes under these paths are ignored when
        # deciding whether to run.
        paths-ignore:
            - docs/**
            - README.md
            - .github/**
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**

env:
    AWS_REGION: us-east-1

permissions:
    # NOTE(review): id-token: write allows requesting an OIDC token, but the
    # job authenticates with static access keys - confirm it is still needed.
    id-token: write
    contents: read

jobs:
    deploy:
        name: Deploy Feature Branch to Test
        runs-on: ubuntu-latest
        environment:
            name: feature
        steps:
            # Refresh the apt index, upgrade installed packages and add the
            # development headers listed below.
            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev

            - name: Install node and npm
              uses: actions/setup-node@v6
              with:
                  node-version: '20'

            # The ref comes from the FEATURE_BRANCH configuration variable, not
            # from the ref that triggered the run. Full history and tags are
            # fetched because the version number is derived from git metadata.
            - name: Checkout repository
              uses: actions/checkout@v6
              with:
                  ref: ${{ vars.FEATURE_BRANCH }}
                  fetch-depth: 0
                  fetch-tags: 'true'

            - name: Set up Python 3.12
              uses: actions/setup-python@v6
              with:
                  # Semantic version range syntax or exact version of a Python version
                  python-version: '3.12'
                  # Optional - x64 or x86 architecture, defaults to x64
                  architecture: 'x64'

            # Exports `version_number` to later steps: the setuptools_scm
            # version with everything from the first '+' onwards removed.
            - name: Install Python Dependencies and Retrieve Version Number
              id: python-build
              run: |
                  python3 -m pip install --upgrade pip
                  pip3 install -U setuptools
                  pip3 install -U setuptools-scm

                  FULL_VERSION_NUMBER="$(python3 -m setuptools_scm)"
                  echo "version_number=$(echo "${FULL_VERSION_NUMBER}" | cut -d '+' -f 1)" >> "$GITHUB_ENV"

            - name: configure aws credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            # Build the three images, publish each under both the computed
            # version and the environment's moving tag, then force the ECS
            # service to start a new deployment.
            - name: Build, tag and push docker images ECR
              env:
                  REGISTRY: ${{ steps.login-ecr.outputs.registry }}
                  IMAGE_TAG: ${{ secrets.IMAGE_TAG }}
                  CLUSTER: ${{ secrets.CLUSTER }}
                  TARGET_SERVICE: ${{ secrets.TARGET_SERVICE }}
              run: |
                  docker build -t concordia .
                  docker build -t concordia/importer --file importer/Dockerfile .
                  docker build -t concordia/celerybeat --file celerybeat/Dockerfile .

                  images=(concordia concordia/importer concordia/celerybeat)

                  # Tag every image first, then push, in the same order as the
                  # previous hand-written command list.
                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker tag "$image:latest" "$REGISTRY/$image:$tag"
                      done
                  done

                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker push "$REGISTRY/$image:$tag"
                      done
                  done

                  aws ecs update-service --region "${{ env.AWS_REGION }}" --force-new-deployment --cluster "$CLUSTER" --service "$TARGET_SERVICE"


================================================
FILE: .github/workflows/pip-audit.yml
================================================
# Audits the locked Python dependencies for known vulnerabilities.
name: pip-audit

on:
    workflow_dispatch:
    pull_request:
        branches:
            - main
            - release
        # Path filter for pull requests: changes under these paths are ignored
        # when deciding whether to run.
        paths-ignore:
            - docs/**
            - README.md
            - .github/**
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**

jobs:
    pip-audit:
        runs-on: ubuntu-latest
        steps:
            - uses: actions/checkout@v6
            - uses: actions/setup-python@v6
              with:
                  python-version: '3.12'

            # The audit action below is given a requirements file, so one is
            # generated from Pipfile.lock first.
            - name: Generate requirements.txt
              run: |
                  pipx run pipfile-requirements Pipfile.lock > requirements.txt

            - uses: pypa/gh-action-pip-audit@v1.1.0
              with:
                  inputs: requirements.txt
                  # One advisory ID per line.
                  # NOTE(review): record here why this advisory is ignored.
                  ignore-vulns: |
                      PYSEC-2023-312


================================================
FILE: .github/workflows/prod-deploy.yml
================================================
# Promotes already-built images to production by re-tagging them in ECR and
# forcing new deployments of the production services. Nothing is built here.
name: 'Deploy to production'

on:
    workflow_dispatch:

env:
    AWS_REGION: us-east-1

permissions:
    # NOTE(review): id-token: write allows requesting an OIDC token, but the
    # job authenticates with static access keys - confirm it is still needed.
    id-token: write
    contents: read

jobs:
    deploy:
        name: Deploy to Production
        runs-on: ubuntu-latest
        environment:
            name: production

        steps:
            - name: configure aws credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            # Pull the three images at IMAGE_TAG_PULL, re-tag them as IMAGE_TAG,
            # push the new tags, then redeploy both target services.
            - name: Pull, tag and push docker images ECR
              env:
                  REGISTRY: ${{ steps.login-ecr.outputs.registry }}
                  IMAGE_TAG_PULL: ${{ secrets.IMAGE_TAG_PULL }}
                  IMAGE_TAG: ${{ secrets.IMAGE_TAG }}
                  CLUSTER: ${{ secrets.CLUSTER }}
                  TARGET_SERVICE_A: ${{ secrets.TARGET_SERVICE_A }}
                  TARGET_SERVICE: ${{ secrets.TARGET_SERVICE }}
              run: |
                  images=(concordia concordia/importer concordia/celerybeat)

                  # Each phase finishes for all images before the next starts,
                  # matching the previous hand-written command order.
                  for image in "${images[@]}"; do
                      docker pull "$REGISTRY/$image:$IMAGE_TAG_PULL"
                  done

                  for image in "${images[@]}"; do
                      docker tag "$REGISTRY/$image:$IMAGE_TAG_PULL" "$REGISTRY/$image:$IMAGE_TAG"
                  done

                  for image in "${images[@]}"; do
                      docker push "$REGISTRY/$image:$IMAGE_TAG"
                  done

                  aws ecs update-service --region "${{ env.AWS_REGION }}" --force-new-deployment --cluster "$CLUSTER" --service "$TARGET_SERVICE_A"
                  aws ecs update-service --region "${{ env.AWS_REGION }}" --force-new-deployment --cluster "$CLUSTER" --service "$TARGET_SERVICE"


================================================
FILE: .github/workflows/renew_coverage.yml
================================================
# Keeps the cached release coverage value alive by accessing it on a schedule.
# Cached values are normally discarded once they have gone seven days without
# being accessed; this workflow simply accesses the value so that it is not
# lost if a seven-day period passes with no pull requests.
name: Renew Coverage Cache

on:
    workflow_dispatch:
    schedule:
        # Midnight UTC on days 1, 6, 11, 16, 21, 26 and 31 of each month,
        # so consecutive runs are never more than five days apart.
        - cron: '0 0 */5 * *'

jobs:
    renew-cache:
        runs-on: ubuntu-latest
        steps:
            # Looking the cache entry up is the whole point of this job;
            # nothing else is done with the restored file.
            - name: Access Coverage Cache to Renew Expiration
              uses: actions/cache@v5
              with:
                  path: coverage.txt
                  key: release-coverage
                  restore-keys: |
                      release-coverage


================================================
FILE: .github/workflows/stage-hotfix-rel-deploy.yml
================================================
# Builds the application images from the release branch for a hotfix and
# rolls them out to the stage service.
name: 'Deploy hotfix to stage'

on:
    workflow_dispatch:

env:
    AWS_REGION: us-east-1

permissions:
    # NOTE(review): id-token: write allows requesting an OIDC token, but the
    # job authenticates with static access keys - confirm it is still needed.
    id-token: write
    contents: read

jobs:
    deploy:
        # Previously "Deploy Release to Stage", copied from the release
        # workflow; renamed so runs of the two workflows can be told apart.
        name: Deploy Hotfix to Stage
        runs-on: ubuntu-latest
        environment:
            name: stage

        steps:
            # Refresh the apt index, upgrade installed packages and add the
            # development headers listed below.
            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev

            - name: Install node and npm
              uses: actions/setup-node@v6
              with:
                  node-version: '20'

            # Always builds from the release branch; full history and tags are
            # fetched because the version is read from git tags below.
            - name: Checkout repository
              uses: actions/checkout@v6
              with:
                  ref: release
                  fetch-depth: 0
                  fetch-tags: 'true'

            - name: Set up Python 3.12
              uses: actions/setup-python@v6
              with:
                  # Semantic version range syntax or exact version of a Python version
                  python-version: '3.12'
                  # Optional - x64 or x86 architecture, defaults to x64
                  architecture: 'x64'

            # Exports `version_number`: the `git describe` output up to the
            # first '-', with its first character removed (presumably a
            # leading "v" - confirm against the tag naming scheme).
            - name: Get version from Git
              run: |
                  # Get latest version tag number (e.g. release was tagged in GitHub for this hot fix)
                  HOTFIX_VERSION_NUMBER="$(git describe --tags)"
                  echo "version_number=$(echo "${HOTFIX_VERSION_NUMBER}" | cut -d '-' -f 1 | cut -c 2- )" >> "$GITHUB_ENV"

            - name: configure aws credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            # Build the three images, publish each under both the hotfix
            # version and the environment's moving tag, then force the ECS
            # service to start a new deployment.
            - name: Build, tag and push docker images ECR
              env:
                  REGISTRY: ${{ steps.login-ecr.outputs.registry }}
                  IMAGE_TAG: ${{ secrets.IMAGE_TAG }}
                  CLUSTER: ${{ secrets.CLUSTER }}
                  TARGET_SERVICE: ${{ secrets.TARGET_SERVICE }}
              run: |
                  echo "version number: $version_number"

                  docker build -t concordia .
                  docker build -t concordia/importer --file importer/Dockerfile .
                  docker build -t concordia/celerybeat --file celerybeat/Dockerfile .

                  images=(concordia concordia/importer concordia/celerybeat)

                  # Tag every image first, then push, in the same order as the
                  # previous hand-written command list.
                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker tag "$image:latest" "$REGISTRY/$image:$tag"
                      done
                  done

                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker push "$REGISTRY/$image:$tag"
                      done
                  done

                  aws ecs update-service --region "${{ env.AWS_REGION }}" --force-new-deployment --cluster "$CLUSTER" --service "$TARGET_SERVICE"


================================================
FILE: .github/workflows/stage-image-refresh.yml
================================================
# Rebuilds the application images from the release branch, rolls them out to
# the stage service, and adds a timestamped tag to the images identified by
# IT_IMAGE_TAG so they remain in the ECR history.
name: 'Deploy image refresh to stage'

on:
    workflow_dispatch:

env:
    AWS_REGION: us-east-1

permissions:
    # NOTE(review): id-token: write allows requesting an OIDC token, but the
    # job authenticates with static access keys - confirm it is still needed.
    id-token: write
    contents: read

jobs:
    deploy:
        name: Deploy Container Environment Update
        runs-on: ubuntu-latest
        environment:
            name: stage

        steps:
            # Refresh the apt index, upgrade installed packages and add the
            # development headers listed below.
            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev

            - name: Install node and npm
              uses: actions/setup-node@v6
              with:
                  node-version: '20'

            # Always builds from the release branch; full history and tags are
            # fetched because the version is read from git tags below.
            - name: Checkout repository
              uses: actions/checkout@v6
              with:
                  ref: release
                  fetch-depth: 0
                  fetch-tags: 'true'

            - name: Set up Python 3.12
              uses: actions/setup-python@v6
              with:
                  # Semantic version range syntax or exact version of a Python version
                  python-version: '3.12'
                  # Optional - x64 or x86 architecture, defaults to x64
                  architecture: 'x64'

            # Exports two values to later steps:
            #   version_number  - the most recent tag with its first character removed
            #   tag_stale_image - that same version plus a timestamp suffix
            - name: Create image tags
              run: |
                  # Get latest version tag number (e.g. main was tagged in GitHub for this Release)
                  FULL_VERSION_NUMBER="$(git describe --tags "$(git rev-list --tags --max-count=1)")"
                  VERSION_NUMBER="$(echo "${FULL_VERSION_NUMBER}" | cut -c2- )"
                  echo "version_number=${VERSION_NUMBER}" >> "$GITHUB_ENV"

                  # Create image tag for the image being replaced/refreshed/updated
                  echo "tag_stale_image=${VERSION_NUMBER}_$(date +%Y%m%dT%H%M%S)" >> "$GITHUB_ENV"

            - name: configure aws credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            # Build the three images, publish each under both the version and
            # the environment's moving tag, then force the ECS service to
            # start a new deployment.
            - name: Build, tag and push docker images ECR
              env:
                  REGISTRY: ${{ steps.login-ecr.outputs.registry }}
                  IMAGE_TAG: ${{ secrets.IMAGE_TAG }}
                  CLUSTER: ${{ secrets.CLUSTER }}
                  TARGET_SERVICE: ${{ secrets.TARGET_SERVICE }}
              run: |
                  docker build -t concordia .
                  docker build -t concordia/importer --file importer/Dockerfile .
                  docker build -t concordia/celerybeat --file celerybeat/Dockerfile .

                  images=(concordia concordia/importer concordia/celerybeat)

                  # Tag every image first, then push, in the same order as the
                  # previous hand-written command list.
                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker tag "$image:latest" "$REGISTRY/$image:$tag"
                      done
                  done

                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker push "$REGISTRY/$image:$tag"
                      done
                  done

                  aws ecs update-service --region "${{ env.AWS_REGION }}" --force-new-deployment --cluster "$CLUSTER" --service "$TARGET_SERVICE"

            # NOTE(review): this runs after the new images were pushed. If
            # IT_IMAGE_TAG names the same tag as IMAGE_TAG, the timestamped tag
            # lands on the fresh image rather than the replaced one - confirm.
            - name: Tag existing images
              env:
                  IT_TAG: ${{ secrets.IT_IMAGE_TAG }}
              run: |

                  # Add a new tag to existing concordia images to preserve the history of images after final deployment.
                  # The manifest of the image tagged IT_TAG is fetched and put back under the timestamped tag.
                  for repo in concordia concordia/celerybeat concordia/importer; do
                      MANIFEST="$(aws ecr batch-get-image --repository-name "$repo" --image-ids imageTag="${IT_TAG}" --output json | jq --raw-output --join-output '.images[0].imageManifest')"
                      aws ecr put-image --repository-name "$repo" --image-tag "$tag_stale_image" --image-manifest "$MANIFEST"
                  done


================================================
FILE: .github/workflows/stage-release-deploy.yml
================================================
# Builds the application images from the release branch and rolls them out to
# the stage service.
name: Deploy release to stage

on:
    workflow_dispatch:
    push:
        branches:
            - release
        # Path filter for pushes: changes under these paths are ignored when
        # deciding whether to run.
        # NOTE(review): cloudformation/tests/** is already matched by
        # cloudformation/**, so that entry is redundant.
        paths-ignore:
            - docs/**
            - README.md
            - .github/**
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**
            - cloudformation/tests/**
            - concordia/tests/**
            - exporter/tests/**
            - importer/tests/**

env:
    AWS_REGION: us-east-1

permissions:
    # NOTE(review): id-token: write allows requesting an OIDC token, but the
    # job authenticates with static access keys - confirm it is still needed.
    id-token: write
    contents: read

jobs:
    deploy:
        name: Deploy Release to Stage
        runs-on: ubuntu-latest
        environment:
            name: stage

        steps:
            # Refresh the apt index, upgrade installed packages and add the
            # development headers listed below.
            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev

            - name: Install node and npm
              uses: actions/setup-node@v6
              with:
                  node-version: '20'

            # Always builds from the release branch; full history and tags are
            # fetched because the version is read from git tags below.
            - name: Checkout repository
              uses: actions/checkout@v6
              with:
                  ref: release
                  fetch-depth: 0
                  fetch-tags: 'true'

            - name: Set up Python 3.12
              uses: actions/setup-python@v6
              with:
                  # Semantic version range syntax or exact version of a Python version
                  python-version: '3.12'
                  # Optional - x64 or x86 architecture, defaults to x64
                  architecture: 'x64'

            # Exports `version_number`: the description of the most recently
            # tagged commit with its first character removed (presumably a
            # leading "v" - confirm against the tag naming scheme).
            - name: Get version from Git
              run: |
                  # Get latest version tag number (e.g. main was tagged in GitHub for this Release)
                  FULL_VERSION_NUMBER="$(git describe --tags "$(git rev-list --tags --max-count=1)")"
                  echo "version_number=$(echo "${FULL_VERSION_NUMBER}" | cut -c2- )" >> "$GITHUB_ENV"

            - name: configure aws credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            # Build the three images, publish each under both the release
            # version and the environment's moving tag, then force the ECS
            # service to start a new deployment.
            - name: Build, tag and push docker images ECR
              env:
                  REGISTRY: ${{ steps.login-ecr.outputs.registry }}
                  IMAGE_TAG: ${{ secrets.IMAGE_TAG }}
                  CLUSTER: ${{ secrets.CLUSTER }}
                  TARGET_SERVICE: ${{ secrets.TARGET_SERVICE }}
              run: |
                  docker build -t concordia .
                  docker build -t concordia/importer --file importer/Dockerfile .
                  docker build -t concordia/celerybeat --file celerybeat/Dockerfile .

                  images=(concordia concordia/importer concordia/celerybeat)

                  # Tag every image first, then push, in the same order as the
                  # previous hand-written command list.
                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker tag "$image:latest" "$REGISTRY/$image:$tag"
                      done
                  done

                  for image in "${images[@]}"; do
                      for tag in "$version_number" "$IMAGE_TAG"; do
                          docker push "$REGISTRY/$image:$tag"
                      done
                  done

                  aws ecs update-service --region "${{ env.AWS_REGION }}" --force-new-deployment --cluster "$CLUSTER" --service "$TARGET_SERVICE"


================================================
FILE: .github/workflows/test-main-deploy.yml
================================================
# Manually triggered deployment to the test environment.
name: Deploy to test

on:
    workflow_dispatch:

env:
    AWS_REGION: us-east-1

permissions:
    # NOTE(review): id-token: write allows requesting an OIDC token, but the
    # job authenticates with static access keys - confirm it is still needed.
    id-token: write
    contents: read

jobs:
    deploy:
        name: Deploy to Test
        runs-on: ubuntu-latest
        environment:
            name: test

        steps:
            - name: configure aws credentials
              uses: aws-actions/configure-aws-credentials@v6
              with:
                  aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
                  aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
                  aws-region: ${{ env.AWS_REGION }}
                  role-session-name: github_to_aws_deploy

            - name: Login to Amazon ECR
              id: login-ecr
              uses: aws-actions/amazon-ecr-login@v2

            - name: Pull, tag and push docker images ECR
              env:
                  REGISTRY: ${{ steps.login-ecr.outputs.registry }}
                  IMAGE_TAG_PULL: ${{ secrets.IMAGE_TAG_PULL }}
                  IMAGE_TAG: ${{ secrets.IMAGE_TAG }}
                  CLUSTER: ${{ secrets.CLUSTER }}
                  TARGET_SERVICE: ${{ secrets.TARGET_SERVICE }}
                  TARGET_SERVICE_B: ${{ secrets.TARGET_SERVICE_B }}
              run: |
                  docker pull $REGISTRY/concordia:$IMAGE_TAG_PULL
                  docker pull $REGISTRY/concordia/importer:$IMAGE_TAG_PULL
                  docker pull $REGISTRY/concordia/celerybeat:$IMAGE_TAG_PULL

                  docker tag $REGISTRY/concordia:$IMAGE_TAG_PULL $REGISTRY/concordia:$IMAGE_TAG
                  docker tag $REGISTRY/concordia/importer:$IMAGE_TAG_PULL $REGISTRY/concordia/importer:$IMAGE_TAG
                  docker tag $REGISTRY/concordia/celerybeat:$IMAGE_TAG_PULL $REGISTRY/concordia/celerybeat:$IMAGE_TAG

                  docker push $REGISTRY/concordia:$IMAGE_TAG
                  docker push $REGISTRY/concordia/importer:$IMAGE_TAG
                  docker push $REGISTRY/concordia/celerybeat:$IMAGE_TAG

                  aws ecs update-service --region ${{ env.AWS_REGION }} --force-new-deployment --cluster $CLUSTER --service $TARGET_SERVICE
                  aws ecs update-service --region ${{ env.AWS_REGION }} --force-new-deployment --cluster $CLUSTER --service $TARGET_SERVICE_B


================================================
FILE: .github/workflows/test.yml
================================================
name: Test

on:
    workflow_dispatch:
    pull_request:
        branches: [main, 'feature-*', release]
        paths-ignore:
            - docs/**
            - README.md
            - .github/**
            - cloudformation/**
            - db_scripts/**
            - jenkins/**
            - search-proxy/**
            - postgresql/**

env:
    PIPENV_IGNORE_VIRTUALENVS: 1
    DJANGO_SETTINGS_MODULE: concordia.settings_test

jobs:
    test:
        runs-on: ubuntu-latest

        services:
            # Label used to access the service container
            postgres:
                # Docker Hub image
                image: postgres
                # Provide the password for postgres
                env:
                    POSTGRES_DB: concordia
                    POSTGRES_PASSWORD: postgres
                # Set health checks to wait until postgres has started
                options: >-
                    --health-cmd pg_isready
                    --health-interval 10s
                    --health-timeout 5s
                    --health-retries 5
                ports:
                    # Maps tcp port 5432 on service container to the host
                    - 5432:5432

        steps:
            - name: Remove Firefox
              # -y keeps the purge non-interactive even on runners whose apt
              # configuration does not already assume "yes" (there is no TTY to
              # answer the confirmation prompt).
              run: sudo apt-get purge -y firefox

            - name: Install system packages
              run: |
                  sudo apt-get update -qy && sudo apt-get dist-upgrade -qy && sudo apt-get install -qy \
                  libmemcached-dev libz-dev libfreetype6-dev libtiff-dev \
                  libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev libpq-dev \
                  tesseract-ocr tesseract-ocr-all

            - name: Install node and npm
              uses: actions/setup-node@v6
              with:
                  node-version: '20'

            - name: Checkout repository
              uses: actions/checkout@v6

            - name: Set up Python 3.12
              uses: actions/setup-python@v6
              with:
                  python-version: '3.12'
                  architecture: 'x64'
                  cache: 'pipenv'

            - name: Display Python version
              run: python -c "import sys; print(sys.version)"

            - name: Install Python Dependencies
              run: |
                  # Bring the packaging toolchain up to date before using pipenv.
                  python3 -m pip install --upgrade pip
                  pip3 install -U packaging
                  pip3 install -U setuptools
                  pip3 install -U pipenv
                  # --deploy fails if Pipfile.lock is out of date; --dev also
                  # installs [dev-packages], which already includes tblib (used
                  # for parallel test debugging). A separate `pipenv install
                  # tblib` is therefore not needed, and it would rewrite the
                  # Pipfile and re-lock after the locked install.
                  pipenv install --dev --deploy

            # Installs the JS dependencies. Adding node_modules/.bin to PATH is
            # currently disabled; the command that would do it is:
            #   echo "PATH=$PWD/node_modules/.bin:$PATH" >> $GITHUB_ENV
            - name: Install Node Dependencies #and Add .bin to Path
              run: npm install

            - name: Configure Logs
              run: |
                  mkdir logs
                  touch ./logs/concordia-celery.log

            - name: Bundle, Build (Vite) and Collect Static Files
              run: |
                  npm run build
                  pipenv run ./manage.py collectstatic --no-input --no-post-process

            # - name: Install Chrome for Testing and Set Path
            #   run: |
            #       chromepath=$(npx @puppeteer/browsers install chrome@latest)
            #       chromepath=${chromepath#* }
            #       echo "Chrome installed at: $chromepath"
            #       $chromepath --version
            #       chromepath=${chromepath%/chrome} # Remove the binary so we can add it to the PATH
            #       # Update PATH for subsequent steps
            #       echo "PATH=$chromepath:$PATH" >> $GITHUB_ENV

            - name: Run Tests with Coverage
              run: |
                  mkdir -p coverage_report
                  pipenv run coverage run --parallel-mode ./manage.py test --parallel auto
                  pipenv run coverage combine  # Merge results from parallel test workers
                  # Save full report to coverage_report/coverage.txt and just the total coverage percent to pr_coverage.txt.
                  # The percentage is the last field of the TOTAL row, so $NF finds it whether or not
                  # the report contains the extra branch-coverage columns.
                  pipenv run coverage report | tee coverage_report/coverage.txt | grep 'TOTAL' | awk '{print $NF}' > pr_coverage.txt
                  echo "Stored PR coverage:"
                  cat pr_coverage.txt  # Debugging output to verify correct storage
                  pipenv run coverage html
                  mv htmlcov coverage_report/html  # Move HTML report into a separate directory
              env:
                  PGPASSWORD: postgres
                  # The hostname used to communicate with the PostgreSQL service container
                  POSTGRES_HOST: localhost
                  # The default PostgreSQL port
                  POSTGRES_PORT: 5432
                  # COMMIT_RANGE: ${{ github.event.pull_request.base.sha }}..${{ github.event.pull_request.head.sha }}

            # Store coverage results if running on the release branch.
            # Copies this run's total (pr_coverage.txt) to coverage.txt, the
            # file the cache step below stores as the comparison baseline.
            # NOTE(review): this workflow is triggered by workflow_dispatch and
            # pull_request only; for pull_request runs github.ref is presumably
            # the PR merge ref, so this condition would only match manual runs
            # started on `release` — confirm.
            - name: Store Release Coverage (if running on release branch)
              if: github.ref == 'refs/heads/release'
              run: cp pr_coverage.txt coverage.txt

            # Cache coverage results if running on the release branch.
            # NOTE(review): the key is a fixed string. actions/cache restores an
            # existing entry on a key hit and does not save over it, so once a
            # `release-coverage` entry exists this step would presumably restore
            # the old coverage.txt over the copy made above and leave the cache
            # unchanged. Verify how the baseline is refreshed (e.g. by the
            # separate renew_coverage workflow).
            - name: Cache Release Coverage (if running on release branch)
              if: github.ref == 'refs/heads/release'
              uses: actions/cache@v5
              with:
                  path: coverage.txt
                  key: release-coverage

            # Upload full coverage report as an artifact
            - name: Upload Full Coverage Report
              uses: actions/upload-artifact@v7
              with:
                  name: coverage-report
                  path: coverage_report

            # Download the stored release branch coverage for PR comparison, if it exists
            - name: Restore Release Coverage (if running on PR)
              if: github.event_name == 'pull_request'
              uses: actions/cache@v5
              with:
                  path: coverage.txt
                  key: release-coverage
                  restore-keys: |
                      release-coverage

            # Compare PR coverage against stored release coverage and export
            # COVERAGE_CHANGE, RELEASE_COVERAGE and PR_COVERAGE for later steps.
            - name: Compare Coverage (if running on PR)
              if: github.event_name == 'pull_request'
              run: |
                  echo "Reading PR coverage from pr_coverage.txt..."
                  cat pr_coverage.txt || echo "⚠️ ERROR: pr_coverage.txt not found or empty"
                  # `|| true` keeps a missing file from aborting the step (the
                  # default shell runs with -e), so the N/A fallback is reachable.
                  PR_COVERAGE=$(cat pr_coverage.txt 2>/dev/null || true)
                  if [ -z "$PR_COVERAGE" ]; then
                      echo "⚠️ ERROR: PR_COVERAGE is empty!"
                      PR_COVERAGE="N/A"
                  fi

                  echo "PR Coverage: $PR_COVERAGE"
                  if [ -f "coverage.txt" ]; then
                      RELEASE_COVERAGE=$(cat coverage.txt)
                      COMPARISON_AVAILABLE=true
                      # An empty baseline file is reported as N/A, not as a blank.
                      [ -n "$RELEASE_COVERAGE" ] || RELEASE_COVERAGE="N/A"
                  else
                      COMPARISON_AVAILABLE=false
                      RELEASE_COVERAGE="N/A"
                  fi

                  # Strip '%' from PR_COVERAGE and RELEASE_COVERAGE for numerical comparison
                  PR_COVERAGE_NUM=${PR_COVERAGE%\%}
                  RELEASE_COVERAGE_NUM=${RELEASE_COVERAGE%\%}
                  NUMBER_PATTERN='^[0-9]+([.][0-9]+)?$'

                  if [ "$COMPARISON_AVAILABLE" != true ]; then
                      CHANGE="⚠️ No baseline coverage available from 'release' branch."
                  elif ! [[ "$PR_COVERAGE_NUM" =~ $NUMBER_PATTERN && "$RELEASE_COVERAGE_NUM" =~ $NUMBER_PATTERN ]]; then
                      # bc cannot evaluate values such as "N/A"; without this
                      # guard the chain below would fall through to "remained
                      # the same".
                      CHANGE="⚠️ Coverage could not be compared (PR: $PR_COVERAGE, release: $RELEASE_COVERAGE)."
                  elif (( $(echo "$PR_COVERAGE_NUM > $RELEASE_COVERAGE_NUM" | bc -l) )); then
                      CHANGE="🔼 Coverage increased (+$(echo "$PR_COVERAGE_NUM - $RELEASE_COVERAGE_NUM" | bc -l)%)!"
                  elif (( $(echo "$PR_COVERAGE_NUM < $RELEASE_COVERAGE_NUM" | bc -l) )); then
                      CHANGE="🔽 Coverage decreased (-$(echo "$RELEASE_COVERAGE_NUM - $PR_COVERAGE_NUM" | bc -l)%)!"
                  else
                      CHANGE="✅ Coverage remained the same."
                  fi

                  echo "COVERAGE_CHANGE=$CHANGE" >> "$GITHUB_ENV"
                  printf "RELEASE_COVERAGE=%s\n" "$RELEASE_COVERAGE" >> "$GITHUB_ENV"
                  printf "PR_COVERAGE=%s\n" "$PR_COVERAGE" >> "$GITHUB_ENV"

            # Generate and store the comment for display on the Action UI and PR (if any)
            - name: Generate Coverage Report Comment
              run: |
                  # The comparison step only runs on pull requests, so these
                  # variables are empty on other runs; substitute readable
                  # fallbacks instead of emitting blank bullets.
                  PR_COVERAGE="${{ env.PR_COVERAGE }}"
                  RELEASE_COVERAGE="${{ env.RELEASE_COVERAGE }}"
                  COVERAGE_CHANGE="${{ env.COVERAGE_CHANGE }}"
                  if [ -z "$PR_COVERAGE" ] && [ -s pr_coverage.txt ]; then
                      PR_COVERAGE=$(cat pr_coverage.txt)
                  fi

                  # The quotes around "Artifacts" are escaped so the shell
                  # keeps them in the output.
                  {
                      echo "**🛡 Test Coverage Report 🛡**"
                      echo "- **Current PR Coverage:** ${PR_COVERAGE:-N/A}"
                      echo "- **Release Branch Coverage:** ${RELEASE_COVERAGE:-N/A}"
                      echo "- **${COVERAGE_CHANGE:-ℹ️ Coverage comparison runs on pull requests only.}**"
                      echo "- 📊 **[Download Full Coverage Report (Under \"Artifacts\")](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}#artifacts)**"
                      echo ""
                      echo "<details>"
                      echo "<summary>📜 Click to view full text coverage report</summary>"
                      echo ""
                      echo '```text'
                      cat coverage_report/coverage.txt
                      echo '```'
                      echo "</details>"
                  } > coverage_comment.txt

            # Display the coverage summary in the GitHub Actions UI
            - name: Post Coverage Summary
              run: cat coverage_comment.txt >> $GITHUB_STEP_SUMMARY

            # Post a comment on the PR with the coverage results
            - name: Comment Coverage Change on PR
              if: github.event_name == 'pull_request'
              uses: mshick/add-pr-comment@v3
              with:
                  message-path: coverage_comment.txt


================================================
FILE: .gitignore
================================================
node_modules/
bin/
target/
local/
build/
.project
.classpath
.settings/
*.pyc
buildstatus.log
deploystatus.log
.metadata/
artifacts/
/.*
!.gitignore
!.cfnlintrc.yaml
!.github
!.dockerignore
.DS_Store
docs/build
env.ini
.venv
*.sqlite3
*.egg-info/
/temp/
/emails/
/logs/*
env-dev.ini
docs/_build
docs/modules
dist/
profile_pics/
mss*
*.swp
config-optional-override.json
env/
concordia/settings_dev_*.py
concordia/settings_test_*.py
concordia/settings_loadtest_*.py
version.txt
static-files


================================================
FILE: Dockerfile
================================================
# Base runtime: Debian 12 (bookworm) slim + Python 3.12.
FROM python:3.12-slim-bookworm

# Major Node.js version to install (e.g., 20, 22). This is used to select the
# NodeSource APT repository "node_<major>.x".
ARG NODE_MAJOR=20

# Add a small "wait for dependencies" helper used by the container command.
# It is downloaded at build time and placed at /wait.
ADD https://github.com/ufoscout/docker-compose-wait/releases/download/2.2.1/wait /wait
RUN chmod +x /wait

# Prevent interactive prompts during apt operations.
ENV DEBIAN_FRONTEND="noninteractive"

# Bootstrap minimal tooling needed later in the build:
# - curl: download files/keys
# - ca-certificates: validate HTTPS endpoints
# - gnupg: import and dearmor APT repository signing keys
RUN apt-get update -qy && apt-get install -qy curl ca-certificates gnupg

# Trust the Library's certificate authority so the HTTPS tampering proxy does
# not break TLS validation for clients inside the container. See
# https://staff.loc.gov/wikis/display/SE/Configuring+HTTPS+clients+for+the+HTTPS+tampering+proxy.
#
# This downloads the DER-encoded CA certificate, converts it to PEM, and runs
# c_rehash to refresh the OpenSSL certificate hashes so the CA is recognized
# by OpenSSL-based clients.
RUN curl -fso /etc/ssl/certs/LOC-ROOT-CA-1.crt http://crl.loc.gov/LOC-ROOT-CA-1.crt && openssl x509 -inform der -in /etc/ssl/certs/LOC-ROOT-CA-1.crt -outform pem -out /etc/ssl/certs/LOC-ROOT-CA-1.pem && c_rehash

# Install Node.js via the NodeSource APT repository (manual setup; no setup
# script). Debian bookworm ships Node 18; adding this repo allows installing a
# newer major version (e.g., Node 20) via apt.
#
# This step:
# - creates a dedicated keyring directory under /etc/apt/keyrings
# - downloads and installs the NodeSource signing key into a keyring file
# - registers the NodeSource repository for the selected Node.js major line
#
# Note: When installing Node.js from NodeSource, the `nodejs` package includes
# npm (and npm comes with node-gyp), so there is no separate `npm` or
# `node-gyp` APT package to install here.
#
# References: NodeSource "Repository Manual Installation" guide. https://github.com/nodesource/distributions/wiki/Repository-Manual-Installation
RUN \
    # Create a dedicated directory for third-party APT keyrings.
    mkdir -p /etc/apt/keyrings && \
    # Download the NodeSource repository signing key and store it as a keyring
    # file that apt can use to verify NodeSource packages.
    curl -fsSL https://deb.nodesource.com/gpgkey/nodesource-repo.gpg.key \
        | gpg --dearmor -o /etc/apt/keyrings/nodesource.gpg && \
    # Register the NodeSource repository for the selected Node.js major version.
    # The "signed-by=" option scopes trust to just this repository entry.
    echo "deb [signed-by=/etc/apt/keyrings/nodesource.gpg] https://deb.nodesource.com/node_${NODE_MAJOR}.x nodistro main" \
        > /etc/apt/sources.list.d/nodesource.list

# Bring the base OS packages fully up to date, then install system dependencies
# needed to build and run the application.
#
# Notes:
# - dist-upgrade pulls in security and point-release updates for the base image.
# - --force-confnew ensures updated config files are accepted when prompted.
# - autoremove/autoclean reduce image size after installing packages.
RUN apt-get update -qy && apt-get dist-upgrade -qy && apt-get install -o Dpkg::Options::='--force-confnew' -qy \
    build-essential \
    git \
    libmemcached-dev \
    # Pillow/Imaging: https://pillow.readthedocs.io/en/latest/installation.html#external-libraries
    libz-dev libfreetype6-dev \
    libtiff-dev libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev \
    # Postgres client library to build psycopg
    libpq-dev \
    locales \
    # Weasyprint requirements
    libpango-1.0-0 libharfbuzz0b libpangoft2-1.0-0 \
    # Tesseract
    tesseract-ocr tesseract-ocr-all \
    # Node.js runtime (from NodeSource) and build tooling for native addons.
    nodejs && apt-get -qy autoremove && apt-get -qy autoclean

# Generate and configure a UTF-8 locale for consistent string handling.
RUN locale-gen en_US.UTF-8
ENV LC_ALL=en_US.UTF-8
ENV LANG=en_US.UTF-8
ENV LANGUAGE=en_US.UTF-8

# Python runtime settings:
# - unbuffered output for log visibility in containers
# - add /app to PYTHONPATH for module resolution
ENV PYTHONUNBUFFERED=1 \
    PYTHONPATH=/app

# Default Django settings module for container runtime. It can be overridden
# at build time (--build-arg DJANGO_SETTINGS_MODULE=...) or at run time (-e).
# The ARG declaration gives the ${...:-default} expansion a declared variable
# to read; without it the variable is undefined during the build and the
# default is always used.
ARG DJANGO_SETTINGS_MODULE
ENV DJANGO_SETTINGS_MODULE=${DJANGO_SETTINGS_MODULE:-concordia.settings_docker}

# Ensure an up-to-date pip and install pipenv for dependency management.
# --no-cache-dir on both commands keeps pip's download cache out of the layer;
# a cleanup in a later RUN could not remove it from this one.
RUN pip install --no-cache-dir --upgrade pip && \
    pip install --no-cache-dir pipenv

# Copy application code into the image.
WORKDIR /app
COPY . /app

# Front-end build, Python dependencies and static files, done in ONE layer so
# that node_modules and the package-manager caches are deleted before the
# layer is committed. Removing them in a separate, later RUN would not reduce
# the image size, because the files would still be stored in the earlier layer.
RUN \
    # Update npm to a known major version, then install all JS dependencies
    # (including devDependencies for plugins).
    npm install --silent --global npm@10 && npm install --silent && \
    # Build assets (Vite): compile SCSS, bundle, hash and compress JS. This
    # populates concordia/static/dist with hashed and compressed files.
    npm run build && \
    # Create the log directory; it is required for Django logging
    # initialization when running collectstatic.
    mkdir -p /app/logs && \
    # Install Python dependencies into the system environment using Pipenv.
    pipenv install --system --dev --deploy && \
    # Bake static files into the image (fast, no post-processing). This runs
    # while node_modules is still present, as in the original step order.
    python manage.py collectstatic --no-input --no-post-process && \
    # Clean up node artifacts plus the Pipenv/pip (~/.cache) and npm (~/.npm)
    # caches to reduce image size.
    rm -rf node_modules ~/.cache/ ~/.npm

# Container listens on port 80.
EXPOSE 80

# Wait for dependencies (via /wait) and then run the application entrypoint.
# JSON (exec) form makes the shell explicit, and `exec` replaces that shell
# with the entrypoint process instead of leaving it as a child of `sh -c`,
# so signals sent to the container are delivered to the entrypoint itself.
CMD ["/bin/sh", "-c", "/wait && exec /bin/bash entrypoint.sh"]


================================================
FILE: LICENSE.md
================================================
As a work of the United States Government, this project is in the
public domain within the United States.

Additionally, we waive copyright and related rights in the work
worldwide through the CC0 1.0 Universal public domain dedication.

## CC0 1.0 Universal Summary

This is a human-readable summary of the
[Legal Code (read the full text)](https://creativecommons.org/publicdomain/zero/1.0/legalcode).

### No Copyright

The person who associated a work with this deed has dedicated the work to
the public domain by waiving all of his or her rights to the work worldwide
under copyright law, including all related and neighboring rights, to the
extent allowed by law.

You can copy, modify, distribute and perform the work, even for commercial
purposes, all without asking permission.

### Other Information

In no way are the patent or trademark rights of any person affected by CC0,
nor are the rights that other persons may have in the work or in how the
work is used, such as publicity or privacy rights.

Unless expressly stated otherwise, the person who associated a work with
this deed makes no warranties about the work, and disclaims liability for
all uses of the work, to the fullest extent permitted by applicable law.
When using or citing the work, you should not imply endorsement by the
author or the affirmer.


================================================
FILE: Loadtesting.md
================================================
# Load Testing Mode

This document describes the current (incomplete but runnable) "load testing mode"
implementation and how to run it end-to-end manually.

Load testing mode consists of:

-   A fixture generator that builds a single JSON fixture from an existing DB
-   A DB preparation command that creates a fresh load test DB, migrates it, and
    loads the fixture while suppressing all Django signals
-   A load test settings file that points the app at the load test DB and disables
    Turnstile blocking
-   A Locust script (`locustfile.py`) plus a wrapper shell script (`load_test.sh`)
    to run a headless load test

The intended lifecycle is:

1. Generate a fixture from a DB with real-ish data
2. Create and populate a fresh `concordia_lt` database from that fixture
3. Run the web app against `concordia_lt` using load test settings
4. Run Locust against that host

The load test database is intended to be single-use.

## Files

-   `concordia/management/commands/create_load_test_fixtures.py`
-   `concordia/management/commands/prepare_load_test_db.py`
-   `concordia/settings_loadtest.py` (or your own `concordia/settings_loadtest_<name>.py`)
-   `locustfile.py` (repo root)
-   `load_test.sh` (repo root)

## Safety notes

-   `create_load_test_fixtures` is read-only against the source DB and only
    writes a JSON file. It is safe to run against production, though it is
    normally run against a refreshed copy of production.
-   `prepare_load_test_db` creates and optionally drops a separate database
    (`concordia_lt`), runs migrations, and loads fixtures into it.
    -   It requires PostgreSQL credentials with `CREATE DATABASE` privileges.
    -   If recreating or dropping, it terminates active connections to the target DB.
-   During fixture load, all Django signals are suppressed to avoid side effects
    (Celery tasks, storage writes, cache updates, derived fields, etc).
-   Storage in load test mode is configured to use dev/staging buckets for safety.
    The workflow is designed to avoid writes to external systems.
-   Locust defaults to a non-production host to reduce risk.

## Prerequisites

-   VPN access to the target environment
-   PostgreSQL credentials available via environment variables
    -   The DB user must be able to connect to `dbname=postgres` and create databases
-   Python environment with the normal dev dependencies installed (Locust is a dev
    dependency)
-   Ability to restart the web app with a different settings module
-   A reachable host running the app in load test mode

## Fixture contents

The fixture generated by `create_load_test_fixtures` contains:

-   Up to 2 published Topics, chosen by ascending `ordering`
-   Up to 5 published Campaigns, preferring Topic-linked Campaigns and filling with
    additional published Campaigns by ascending `ordering`
-   Up to `--assets-limit` Assets (default 10,000), collected by walking:
    -   Topic-linked Projects first, then
    -   Campaign-linked Projects if needed
-   Closure of referenced Items, Projects, Campaigns and Topics for the chosen Assets
-   All Transcriptions for selected Assets
-   Anonymized fixtures for any Users referenced by those Transcriptions
    (`user` and `reviewed_by`)
-   A synthetic pool of test users:
    -   Default: 10,000 users named `locusttest00001`..`locusttest10000`
    -   All share the same password: `locustpass123`
    -   Email: `<username>@example.test`
    -   Users are created with explicit PKs beyond the existing fixture user PKs to
        avoid collisions
-   ProjectTopic rows for selected Topic+Project links (preserves the M2M)

Notes:

-   Selection is best-effort. If there are fewer than `--assets-limit` Assets, the
    fixture is still written.
-   The output is a single JSON file (default `loadtest_fixture.json`).
-   By default, the command validates the fixture by calling `prepare_load_test_db`
    unless `--no-validate` is provided.

## Commands

### 1) Create the fixture

Run against a DB with real data (usually a refreshed prod copy):

```bash
python manage.py create_load_test_fixtures
```

Common options:

```bash
python manage.py create_load_test_fixtures \
  --assets-limit 10000 \
  --test-users 10000 \
  --test-user-prefix locusttest \
  --test-user-password locustpass123 \
  --output loadtest_fixture.json
```

Validation options:

-   `--no-validate` to skip validation
-   `--validate-db-name NAME` to override the validation DB name
-   `--validate-recreate` to recreate the validation DB if it exists
-   `--validate-drop` to drop the validation DB after loading

### 2) Create and populate the load test DB

Standard DB name: `concordia_lt`

```bash
python manage.py prepare_load_test_db \
  --db-name concordia_lt \
  --recreate \
  --fixtures loadtest_fixture.json
```

Behavior:

-   Creates or recreates `concordia_lt`
-   Runs migrations
-   Loads fixtures with all signals suppressed by default

## Running the app in load test mode

### Settings file

`concordia/settings_loadtest.py` is an override layer on top of
`settings_template.py`. It:

-   Points the DB at `concordia_lt`
-   Disables rate limiting
-   Forces Turnstile to always-pass test keys by default
-   Uses console email backend
-   Uses dev buckets for safety
-   Adjusts logging to be visible in common run contexts

If you need a different DB name, do not edit `settings_loadtest.py` directly.
Create a personal settings file, following the local dev convention:

-   `concordia/settings_loadtest_<username>.py`
-   Override `DATABASES["default"]["NAME"]` (and any other local overrides)

### Selecting settings at runtime

Local example:

```bash
DJANGO_SETTINGS_MODULE=concordia.settings_loadtest \
  python manage.py runserver 0.0.0.0:8000
```

Server/container example:

-   Set `DJANGO_SETTINGS_MODULE=concordia.settings_loadtest`
-   Restart/redeploy the web process so it actually uses the load test settings

Important:

-   Creating `concordia_lt` does not affect any running web process.
    You must restart the app with the load test settings selected.

## Locust

### Overview

The load test simulates three flows:

-   Anonymous browsing/transcription page interactions
-   Authenticated users who transcribe
-   Authenticated users who review

The script uses these endpoints:

-   `/` (homepage)
-   `/next-transcribable-asset/` (redirect to next asset)
-   `/next-reviewable-asset/` (redirect to next reviewable asset)
-   `/account/login/` (login)
-   `/account/ajax-status/` and `/account/ajax-messages/` (simulates normal page load)

The script parses asset pages to find:

-   The transcription form action (`<form id="transcription-editor" ...>`)
-   Reservation endpoint (`<script id="asset-reservation-data" data-reserve-asset-url="...">`)
-   Review endpoints (`data-review-url`, `data-submit-url`)

If parsing fails, it is treated as a fundamental mismatch between the Locust
script and the UI.

### "No work" abort behavior

The Locust run aborts the entire test if it determines there is no work
available. "No work" is defined as either:

-   A `/next-*` redirect eventually landing on `/` (homepage), or
-   An asset page not containing the transcription form

This is controlled by:

-   `ABORT_WHEN_NO_WORK = True` (default)
-   `NO_WORK_DUMP_HTML = False` (set True to dump a debug HTML file on abort)

The abort is coordinated across master/workers in distributed mode via a custom
message (`global-abort`). Locust is forced to exit with a non-zero exit code.

### load_test.sh

`load_test.sh` runs Locust in headless mode with defaults that can be overridden
via environment variables.

Defaults:

-   Users: 100
-   Spawn rate: 2
-   Run time: 1m30s
-   Host: `https://crowd-dev.loc.gov`

Override example:

```bash
LOCUST_USERS=500 \
LOCUST_SPAWN_RATE=10 \
LOCUST_RUN_TIME=10m \
LOCUST_HOST=https://your-loadtest-host.example \
./load_test.sh
```

## End-to-end manual runbook

This is the current manual process. Nothing here is automated end-to-end yet.

1. Choose the environment to test

-   Typically your personal environment, dev, or staging, prepared from a refreshed copy of the production DB

2. Generate a fixture

```bash
python manage.py create_load_test_fixtures \
  --output loadtest_fixture.json
```

If you want a smaller dataset for quicker iteration, lower `--assets-limit`
and/or `--test-users`.

3. Create and populate the load test DB

```bash
python manage.py prepare_load_test_db \
  --db-name concordia_lt \
  --recreate \
  --fixtures loadtest_fixture.json
```

4. Switch the web app to load test settings and restart it

-   Set `DJANGO_SETTINGS_MODULE=concordia.settings_loadtest`
-   Restart/redeploy the web process so it uses:
    -   `DATABASES["default"]["NAME"] = "concordia_lt"`
    -   Turnstile always-pass test keys

Sanity checks:

-   Visit the site and confirm pages load without Turnstile blocking.
-   Attempt login with a known test user:
    -   Username: `locusttest00001`
    -   Password: `locustpass123`

5. Run Locust

```bash
./load_test.sh
```

Tune parameters if needed:

```bash
LOCUST_USERS=200 LOCUST_SPAWN_RATE=5 LOCUST_RUN_TIME=5m ./load_test.sh
```

6. Common failure modes

-   Immediate login failures:
    -   App not pointing at `concordia_lt`
    -   Fixture not loaded or test users missing
    -   Turnstile not disabled for load test mode
-   Global abort "no work":
    -   `next-*` redirects to `/` because there is no eligible work
    -   This is likely due to running the script multiple times without recreating the load test DB (rerun step 3 with `--recreate`)
-   Lots of 403s:
    -   Turnstile still active
    -   CSRF issues (the script attempts to seed and use CSRF correctly)

7. Cleanup

There is no automated cleanup step. The DB is intended to be thrown away or
recreated for each run.

To recreate on the next run, rerun step (3) with `--recreate`.

## Known gaps / Next development priorities

-   No single "one command" workflow; all steps are manual.
-   No automated mechanism to build and deploy a load-test-mode container in AWS.
-   No automated environment switching between normal and load test settings.
-   No automated teardown of the load test DB after a run.


================================================
FILE: MANIFEST.in
================================================
include README.md
include MANIFEST.in
recursive-include concordia *
recursive-include tests *.py


================================================
FILE: Makefile
================================================
# Convenience targets wrapping docker-compose for local development.
# None of the targets produce files, so all are declared phony.
.PHONY: allup firstup adminuser devup down clean

# First-time setup: start the stack in the background, then create the admin
# account. `adminuser` is a make target, not a shell command, so it has to be
# invoked through $(MAKE); a bare `adminuser` recipe line fails with
# "command not found".
firstup:
	docker-compose -f docker-compose.yml up -d
	$(MAKE) adminuser

# Create a Django superuser named "admin" inside a throwaway `app` container.
# The password is taken from CONCORDIA_ADMIN_PW (make variable or environment).
adminuser:
	docker-compose -f docker-compose.yml run --rm app ./manage.py shell -c "from django.contrib.auth.models import User; User.objects.create_superuser('admin', 'crowd@loc.gov', '${CONCORDIA_ADMIN_PW}')"

# Start all services in the background.
allup:
	docker-compose -f docker-compose.yml up -d

# Currently runs the same command as `allup`.
devup:
	docker-compose -f docker-compose.yml up -d

# Stop and remove the containers.
down:
	docker-compose -f docker-compose.yml down

# Run `down`, then also remove volumes and orphaned containers and delete the
# local postgresql-data/ directory.
clean:	down
	docker-compose -f docker-compose.yml down -v --remove-orphans
	rm -rf postgresql-data/


================================================
FILE: Pipfile
================================================
# Package index used to resolve every dependency below.
[[source]]
url = "https://pypi.org/simple"
verify_ssl = true
name = "pypi"

# Default (non-dev) dependencies. Most are pinned exactly (==); a few allow
# compatible releases (~=), an upper bound (<), or any version (*).
# NOTE(review): pre-commit is declared both here and in [dev-packages] with the
# same specifier; black and pre-commit look like development tools -- confirm
# whether they are intentionally part of the default set.
[packages]
gunicorn = "==23.0.0"
celery = { extras = ["redis"], version = "==5.5.3" }
django-tinymce = "==4.1.0"
whitenoise = "==6.9.0"
openpyxl = "==3.1.5"
markdown = "==3.10"
django-bootstrap5 = "==25.2"
django-robots = "==6.1"
setuptools-scm = "==9.2.2"
django-ratelimit = "==4.1.0"
pylibmc = "==1.6.3"
kombu = "==5.5.4"
django-flags = "==5.0.14"
sentry-sdk = "==2.57.0"
channels = { extras = ["daphne"], version = "==4.2.2" }
channels-redis = "==4.3.0"
more-itertools = "==10.7.0"
nh3 = "==0.3.4"
django-admin-multiple-choice-list-filter = "==0.1.1"
django-npm = "==1.0.1"
pymemcache = "==4.0.0"
weasyprint = "==68.1"
tesseract = "==0.1.3"
pytesseract = "==0.3.13"
django-redis = "==6.0.0"
twisted = { extras = ["http2", "tls"], version = "==25.5.0" }
pyleniumio = "==1.21.0"
django-maintenance-mode = "==0.22.0"
xlsxwriter = "==3.2.5"
psycopg2 = "==2.9.11"
django-storages = { extras = ["s3"], version = "==1.14.6" }
django-structlog = {extras = ["celery"], version = "==10.0.0"}
defusedxml = "==0.7.1"
django-ninja = "==1.4.3"
urllib3 = "==2.6.3"
bagit = "==1.9.0"
django-registration = "==3.4"
boto3 = "==1.39.17"
botocore = "==1.39.17"
certifi = "==2025.7.14"
websocket-client = "<1.8.0"
black = "*"
django-vite = "~=3.1.0"
pyasn1 = "~=0.6.3"
requests = "~=2.33.0"
hiredis = "~=3.3.0"
django-celery-beat = "~=2.8.1"
prometheus-client = "~=0.25.0"
aws-xray-sdk = "~=2.15.0"
pre-commit = "~=4.5.1"
django = "~=5.2.13"
django-opensearch-dsl = "==0.8.0"

# Development-only dependencies (installed with `pipenv install --dev`).
[dev-packages]
invoke = "==2.2.0"
django-extensions = "==3.2.3"
django-debug-toolbar = "==6.3.0"
coverage = "==7.9.2"
locust = "~=2.43"
tblib = "~=3.2.0"
pre-commit = "~=4.5.1"

# Python interpreter version the environment is expected to use.
[requires]
python_version = "3.12"


================================================
FILE: README.md
================================================
[![Lint](https://github.com/LibraryOfCongress/concordia/actions/workflows/black.yml/badge.svg)](https://github.com/LibraryOfCongress/concordia/actions/workflows/black.yml)
[![Test](https://github.com/LibraryOfCongress/concordia/actions/workflows/test.yml/badge.svg)](https://github.com/LibraryOfCongress/concordia/actions/workflows/test.yml)
[![Build](https://github.com/LibraryOfCongress/concordia/actions/workflows/build.yml/badge.svg)](https://github.com/LibraryOfCongress/concordia/actions/workflows/build.yml)
[![Coverage Status](https://coveralls.io/repos/github/LibraryOfCongress/concordia/badge.svg?branch=main)](https://coveralls.io/github/LibraryOfCongress/concordia?branch=main)

# Welcome to Concordia

Concordia is a platform developed by the Library of Congress (LOC) for crowdsourcing transcription and tagging of text in digitized images with the dual goals of collection enhancement and public engagement. Concordia is a user-centered project centering the principles of trust and approachability. [Read our full design principles here](https://github.com/LibraryOfCongress/concordia/blob/main/docs/design-principles.md). Learn more about the Concordia development process in [this Code4Lib article](https://journal.code4lib.org/articles/14901).

LOC launched the first iteration of Concordia as [By the People at crowd.loc.gov](https://crowd.loc.gov/) in October 2018.

The Library of Congress publishes transcriptions created by By the People volunteers on [loc.gov](https://www.loc.gov/) to improve search, readability, and access to handwritten and typed documents. Individual transcriptions are published alongside the transcribed images in digital collections and transcriptions are also published in bulk as [datasets](https://www.loc.gov/search/?fa=contributor:by+the+people+%28program%29). [Learn more about how we publish transcriptions](https://blogs.loc.gov/folklife/2022/05/etl-searching-the-lomax-family-papers-through-the-magic-of-crowdsourcing/).

Concordia code and the By the People transcriptions are released into the public domain. Anyone is free to use or reuse the data. [More info on our licensing page](https://github.com/LibraryOfCongress/concordia/blob/main/LICENSE.md).

As of May 2022 the Library of Congress Concordia development team has moved issues out of GitHub to an internal system due to reporting needs. Open GitHub issue tickets may not be active or up-to-date. We continue to publish our code here as it is released. Learn more about [How We Work](https://github.com/LibraryOfCongress/concordia/blob/main/docs/how-we-work.md).

_Concordia and By the People are supported by the National Digital Library Trust Fund._

## What Concordia does

The application invites volunteers to transcribe and tag digitized images of manuscript and typed materials from the Library’s collections. All transcriptions are made by volunteers and reviewed by volunteers. It takes at least one volunteer to transcribe a page and at least one other volunteer to review and mark it complete. Some complex documents may pass through both transcription and review many times before they are accepted as complete by a volunteer.

Concordia is a containerized Python-Django-Postgres-etc web application. The Library hosts its instance in the cloud.

Concordia leverages the publicly-available [loc.gov API](https://libraryofcongress.github.io/data-exploration/) to call collection metadata and images in JPEG format and save copies for use in Concordia. Completed transcriptions can be exported out of the application as a single CSV or individual TXT files in a BagIt bag.

## Want to use or reuse our code?

For more on our tech stack and to learn how to set up Concordia on your computer, check out the [For Developers page](docs/for-developers.md).

## Want to help?

We're excited that you want to be part of Concordia! Here are two ways to contribute:

**1. Report bugs by submitting an issue.** If you are reporting a bug, please include:

-   Your operating system name and version.
-   Any details about your local setup that might be helpful in troubleshooting.
-   Detailed steps to reproduce the bug.

**2. Create an issue to give feedback or suggest a new feature.** The best way to give feedback is to file an issue at https://github.com/LibraryOfCongress/concordia/issues. If you are proposing a feature:

-   Explain in detail how it would work.
-   Explain how it would serve Concordia via a user story.
-   Keep the scope as narrow as possible, to make it easier to implement.

If you use or build on our code, we'd love to hear from you! [Contact us here at ask.loc.gov](https://ask.loc.gov/).


================================================
FILE: build_containers.sh
================================================
#!/bin/bash
#
# Build the Concordia Docker images and, optionally, publish them to AWS ECR.
#
# Optional environment variables:
#   BUILD_ALL           1 to also build the importer and celerybeat images (default: 0)
#   BUILD_NUMBER        suffix for the per-build virtualenv directory (default: 1)
#   TAG                 extra tag applied alongside the version number (default: test)
#   PUBLISH_CONTAINERS  1 to log in to ECR and tag/push the images (default: 1)

set -eu -o pipefail

BUILD_ALL=${BUILD_ALL:=0}
BUILD_NUMBER=${BUILD_NUMBER:=1}
TAG=${TAG:-test}
PUBLISH_CONTAINERS=${PUBLISH_CONTAINERS:=1}

# Tag the local image "<name>:latest" with both the version number and ${TAG},
# then push both tags to the ECR registry.
#   $1 - local image name (e.g. "concordia" or "concordia/importer")
# Only call this after ECR_REGISTRY has been set (i.e. when publishing).
publish_image() {
    local image="$1"
    local remote="${ECR_REGISTRY}/${image}"

    docker tag "${image}:latest" "${remote}:${VERSION_NUMBER}"
    docker tag "${image}:latest" "${remote}:${TAG}"
    docker push "${remote}:${VERSION_NUMBER}"
    docker push "${remote}:${TAG}"
}

# Get an unique venv folder to use inside workspace
VENV=".venv-${BUILD_NUMBER}"

# Initialize new venv
python3 -m venv "${VENV}"
source "${VENV}/bin/activate"

# Update pip
pip3 install -U pip
pip3 install packaging
pip3 install -U setuptools
pip3 install -U pipenv

pipenv install --dev --system --deploy

# Drop any "+local" suffix from the version so it can be used as an image tag.
FULL_VERSION_NUMBER="$(python3 setup.py --version)"
VERSION_NUMBER=$(echo "${FULL_VERSION_NUMBER}" | cut -d '+' -f 1)

if [ "${PUBLISH_CONTAINERS}" -eq 1 ]; then
    AWS_ACCOUNT_ID="$(aws sts get-caller-identity  --output=text --query "Account")"
    ECR_REGISTRY="${AWS_ACCOUNT_ID}.dkr.ecr.us-east-1.amazonaws.com"
    # NOTE(review): `aws ecr get-login` exists only in AWS CLI v1; on CLI v2 the
    # equivalent is `aws ecr get-login-password | docker login --username AWS
    # --password-stdin <registry>`. Confirm which CLI the build hosts run.
    eval "$(aws ecr get-login --no-include-email --region us-east-1)"
fi

python3 setup.py build

docker build -t concordia .

if [ "${PUBLISH_CONTAINERS}" -eq 1 ]; then
    publish_image concordia
fi

if [ "${BUILD_ALL}" -eq 1 ]; then

    docker build -t concordia/importer --file importer/Dockerfile .
    docker build -t concordia/celerybeat --file celerybeat/Dockerfile .

    if [ "${PUBLISH_CONTAINERS}" -eq 1 ]; then
        publish_image concordia/importer
        publish_image concordia/celerybeat
    fi
fi


================================================
FILE: celerybeat/Dockerfile
================================================
# Image that runs celerybeat/entrypoint.sh (see CMD at the bottom).
FROM python:3.12-slim-bookworm

## Add the wait script to the image
ADD https://github.com/ufoscout/docker-compose-wait/releases/download/2.2.1/wait /wait
RUN chmod +x /wait

# Keep apt/dpkg from prompting during the package installs below.
ENV DEBIAN_FRONTEND="noninteractive"

# curl is needed by the certificate download in the next step.
RUN apt-get update -qy && apt-get install -qy curl

# Ensure that the Library's certificate authority is trusted so the tampering
# proxy will not break TLS validation. See
# https://staff.loc.gov/wikis/display/SE/Configuring+HTTPS+clients+for+the+HTTPS+tampering+proxy.

# Download the DER-encoded root CA, convert it to PEM and rehash the cert dir.
RUN curl -fso /etc/ssl/certs/LOC-ROOT-CA-1.crt http://crl.loc.gov/LOC-ROOT-CA-1.crt && openssl x509 -inform der -in /etc/ssl/certs/LOC-ROOT-CA-1.crt -outform pem -out /etc/ssl/certs/LOC-ROOT-CA-1.pem && c_rehash

# Upgrade the base system and install build/runtime libraries, then prune
# packages that are no longer needed.
RUN apt-get update -qy && apt-get dist-upgrade -qy && apt-get install -o Dpkg::Options::='--force-confnew' -qy \
    git \
    libmemcached-dev \
    # Pillow/Imaging: https://pillow.readthedocs.io/en/latest/installation.html#external-libraries
    libz-dev libfreetype6-dev \
    libtiff-dev libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev \
    # Postgres client library to build psycopg
    libpq-dev \
    locales \
    # Weasyprint requirements
    libpango-1.0-0 libharfbuzz0b libpangoft2-1.0-0 \
    gcc && apt-get -qy autoremove && apt-get -qy autoclean

# Generate the en_US.UTF-8 locale and make it the default.
RUN locale-gen en_US.UTF-8
ENV LC_ALL=en_US.UTF-8
ENV LANG=en_US.UTF-8
ENV LANGUAGE=en_US.UTF-8

# Unbuffered Python output; /app (the WORKDIR below) is put on the import path.
ENV PYTHONUNBUFFERED=1 \
    PYTHONPATH=/app

# Falls back to concordia.settings_docker when DJANGO_SETTINGS_MODULE is not
# already defined at build time.
ENV DJANGO_SETTINGS_MODULE=${DJANGO_SETTINGS_MODULE:-concordia.settings_docker}

RUN pip install --upgrade pip
RUN pip install --no-cache-dir pipenv

# Copy the whole build context into the image.
WORKDIR /app
COPY . /app

# Install locked dependencies (including dev packages) into the system
# interpreter, then drop the cache directory.
RUN pipenv install --system --dev --deploy && rm -rf ~/.cache/

# Run the wait script first; the entrypoint only starts if it exits successfully.
CMD /wait && ./celerybeat/entrypoint.sh


================================================
FILE: celerybeat/entrypoint.sh
================================================
#!/bin/bash
#
# Container entrypoint: prepare the log file, then run celery beat using the
# django_celery_beat database scheduler.

# Abort on any unhandled error or reference to an undefined variable.
set -eu

# Make sure the log directory and log file exist before celery starts.
log_dir=/app/logs
mkdir -p "${log_dir}"
touch "${log_dir}/concordia.log"

# Have the X-Ray SDK log an error instead of raising when no trace context
# is available.
export AWS_XRAY_CONTEXT_MISSING=LOG_ERROR

echo "Running celerybeat"
celery -A concordia beat \
    -l info \
    --scheduler django_celery_beat.schedulers:DatabaseScheduler


================================================
FILE: cloudformation/LICENSE
================================================
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      "License" shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      "Licensor" shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      "Legal Entity" shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      "control" means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      "You" (or "Your") shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      "Source" form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      "Object" form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      "Work" shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      "Derivative Works" shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      "Contribution" shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, "submitted"
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as "Not a Contribution."

      "Contributor" shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a "NOTICE" text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an "AS IS" BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets "{}"
      replaced with your own identifying information. (Don't include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same "printed page" as the copyright notice for easier
      identification within third-party archives.

   Copyright 2016 Amazon Web Services, Inc.

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.


================================================
FILE: cloudformation/NOTICE
================================================
ecs-refarch-cloudformation
Copyright 2011-2016 Amazon.com, Inc. or its affiliates. All Rights Reserved.


================================================
FILE: cloudformation/README.md
================================================
# Note Regarding Concordia Usage

This README, and set of CloudFormation templates, is based on the AWS sample templates at [ecs-refarch-cloudformation](https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml).

The sample templates have been modified and new templates have been added.

To use these templates:

1.  Upload this directory to an S3 bucket:

```
cd cloudformation
./sync_templates.sh
```

2.  Read [how to get started with AWS ECR](https://docs.aws.amazon.com/AmazonECR/latest/userguide/ECR_GetStarted.html) and follow the instructions to create an ECR repository for each docker image that will be deployed.
3.  Set a BUILD_NUMBER in your environment and run `./build_containers.sh`
4.  Create a KMS key for this project.
5.  Populate the secrets in `create_secrets.sh` and run that script to create a new set of secrets.
6.  Upload a certificate for the environment to IAM using the canonical host name.
7.  If you don't already have the ECS service linked role in your AWS account, run: `aws iam create-service-linked-role --aws-service-name ecs.amazonaws.com`
8.  Use CloudFormation to create a stack, using the `master.yaml` in the S3 bucket you uploaded in step 1 as the initial template.
9.  If your environment name is not dev, test, stage or prod: Create a new revision of the task definition, changing the ENV_NAME variable to point to the correct secret storage location. Update the service to use the newest task definition version.

![build-status](https://codebuild.eu-west-1.amazonaws.com/badges?uuid=eyJlbmNyeXB0ZWREYXRhIjoiKzBuNjJCUFk2STRvbDZENXlMUFJOenF2V2EyQ3FMbEtuWDlQeVp6TWlxdXhNMGVOZGo5bG9jdTl1YU16RmZIVVNxa3VqTVg3V3drSnJxOUQwSmhqV2g0PSIsIml2UGFyYW1ldGVyU3BlYyI6IlJJRE4wZGJaS25LL0s0dzkiLCJtYXRlcmlhbFNldFNlcmlhbCI6MX0%3D&branch=master)

# Deploying Microservices with Amazon ECS, AWS CloudFormation, and an Application Load Balancer

This reference architecture provides a set of YAML templates for deploying microservices to [Amazon EC2 Container Service (Amazon ECS)](http://docs.aws.amazon.com/AmazonECS/latest/developerguide/Welcome.html) with [AWS CloudFormation](https://aws.amazon.com/cloudformation/).

You can launch this CloudFormation stack in your account:

| AWS Region              | Short name |                                                                                                                                                                                                                                                             |
| ----------------------- | ---------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
| US East (Ohio)          | us-east-2  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-east-2#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |
| US East (N. Virginia)   | us-east-1  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-east-1#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |
| US West (N. California) | us-west-1  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-west-1#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |
| US West (Oregon)        | us-west-2  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-west-2#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |

## Overview

![infrastructure-overview](images/architecture-overview.png)

The repository consists of a set of nested templates that deploy the following:

-   A tiered [VPC](http://docs.aws.amazon.com/AmazonVPC/latest/UserGuide/VPC_Introduction.html) with public and private subnets, spanning an AWS region.
-   A highly available ECS cluster deployed across two [Availability Zones](http://docs.aws.amazon.com/AWSEC2/latest/UserGuide/using-regions-availability-zones.html) in an [Auto Scaling](https://aws.amazon.com/autoscaling/) group, with instances that are AWS SSM enabled.
-   A pair of [NAT gateways](http://docs.aws.amazon.com/AmazonVPC/latest/UserGuide/vpc-nat-gateway.html) (one in each zone) to handle outbound traffic.
-   Two interconnecting microservices deployed as [ECS services](http://docs.aws.amazon.com/AmazonECS/latest/developerguide/ecs_services.html) (website-service and product-service).
-   An [Application Load Balancer (ALB)](https://aws.amazon.com/elasticloadbalancing/applicationloadbalancer/) to the public subnets to handle inbound traffic.
-   ALB path-based routes for each ECS service to route the inbound traffic to the correct service.
-   Centralized container logging with [Amazon CloudWatch Logs](http://docs.aws.amazon.com/AmazonCloudWatch/latest/logs/WhatIsCloudWatchLogs.html).
-   A [Lambda Function](https://docs.aws.amazon.com/lambda/latest/dg/welcome.html) and [Auto Scaling Lifecycle Hook](https://docs.aws.amazon.com/autoscaling/ec2/userguide/lifecycle-hooks.html) to [drain Tasks from your Container Instances](https://docs.aws.amazon.com/AmazonECS/latest/developerguide/container-instance-draining.html) when an Instance is selected for Termination in your Auto Scaling Group.

## Why use AWS CloudFormation with Amazon ECS?

Using CloudFormation to deploy and manage services with ECS has a number of nice benefits over more traditional methods ([AWS CLI](https://aws.amazon.com/cli), scripting, etc.).

#### Infrastructure-as-Code

A template can be used repeatedly to create identical copies of the same stack (or to use as a foundation to start a new stack). Templates are simple YAML- or JSON-formatted text files that can be placed under your normal source control mechanisms, stored in private or public locations such as Amazon S3, and exchanged via email. With CloudFormation, you can see exactly which AWS resources make up a stack. You retain full control and have the ability to modify any of the AWS resources created as part of a stack.

#### Self-documenting

Fed up with outdated documentation on your infrastructure or environments? Still keep manual documentation of IP ranges, security group rules, etc.?

With CloudFormation, your template becomes your documentation. Want to see exactly what you have deployed? Just look at your template. If you keep it in source control, then you can also look back at exactly which changes were made and by whom.

#### Intelligent updating & rollback

CloudFormation not only handles the initial deployment of your infrastructure and environments, but it can also manage the whole lifecycle, including future updates. During updates, you have fine-grained control and visibility over how changes are applied, using functionality such as [change sets](https://aws.amazon.com/blogs/aws/new-change-sets-for-aws-cloudformation/), [rolling update policies](http://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/aws-attribute-updatepolicy.html) and [stack policies](http://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/protect-stack-resources.html).

## Template details

The templates below are included in this repository and reference architecture:

| Template                                                                       | Description                                                                                                                                                                                                                                                                                                                                                                          |
| ------------------------------------------------------------------------------ | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
| [master.yaml](master.yaml)                                                     | This is the master template - deploy it to CloudFormation and it includes all of the others automatically.                                                                                                                                                                                                                                                                           |
| [infrastructure/vpc.yaml](infrastructure/vpc.yaml)                             | This template deploys a VPC with a pair of public and private subnets spread across two Availability Zones. It deploys an [Internet gateway](http://docs.aws.amazon.com/AmazonVPC/latest/UserGuide/VPC_Internet_Gateway.html), with a default route on the public subnets. It deploys a pair of NAT gateways (one in each zone), and default routes for them in the private subnets. |
| [infrastructure/security-groups.yaml](infrastructure/security-groups.yaml)     | This template contains the [security groups](http://docs.aws.amazon.com/AmazonVPC/latest/UserGuide/VPC_SecurityGroups.html) required by the entire stack. They are created in a separate nested template, so that they can be referenced by all of the other nested templates.                                                                                                       |
| [infrastructure/load-balancers.yaml](infrastructure/load-balancers.yaml)       | This template deploys an ALB to the public subnets, which exposes the various ECS services. It is created in a separate nested template, so that it can be referenced by all of the other nested templates and so that the various ECS services can register with it.                                                                                                                |
| [infrastructure/ecs-cluster.yaml](infrastructure/ecs-cluster.yaml)             | This template deploys an ECS cluster to the private subnets using an Auto Scaling group and installs the AWS SSM agent with related policy requirements.                                                                                                                                                                                                                             |
| [infrastructure/lifecyclehook.yaml](infrastructure/lifecyclehook.yaml)         | This template deploys a Lambda Function and Auto Scaling Lifecycle Hook to drain Tasks from your Container Instances when an Instance is selected for Termination in your Auto Scaling Group.                                                                                                                                                                                        |
| [services/product-service/service.yaml](services/product-service/service.yaml) | This is an example of a long-running ECS service that serves a JSON API of products. For the full source for the service, see [services/product-service/src](services/product-service/src).                                                                                                                                                                                          |
| [services/website-service/service.yaml](services/website-service/service.yaml) | This is an example of a long-running ECS service that needs to connect to another service (product-service) via the load-balanced URL. We use an environment variable to pass the product-service URL to the containers. For the full source for this service, see [services/website-service/src](services/website-service/src).                                                     |

After the CloudFormation templates have been deployed, the [stack outputs](http://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/outputs-section-structure.html) contain a link to the load-balanced URLs for each of the deployed microservices.

![stack-outputs](images/stack-outputs.png)

The ECS instances should also appear in the Managed Instances section of the EC2 console.

## How do I...?

### Get started and deploy this into my AWS account

You can launch this CloudFormation stack in your account:

| AWS Region              | Short name |                                                                                                                                                                                                                                                             |
| ----------------------- | ---------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
| US East (Ohio)          | us-east-2  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-east-2#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |
| US East (N. Virginia)   | us-east-1  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-east-1#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |
| US West (Oregon)        | us-west-2  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-west-2#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |
| US West (N. California) | us-west-1  | [![cloudformation-launch-button](images/cloudformation-launch-stack.png)](https://console.aws.amazon.com/cloudformation/home?region=us-west-1#/stacks/new?stackName=Production&templateURL=https://s3.amazonaws.com/ecs-refarch-cloudformation/master.yaml) |

### Customize the templates

1. [Fork](https://github.com/awslabs/ecs-refarch-cloudformation#fork-destination-box) this GitHub repository.
1. Clone the forked GitHub repository to your local machine.
1. Modify the templates.
1. Verify your changes locally: `pipenv run cfn-lint path/to/template.yaml`
1. Upload them to an Amazon S3 bucket of your choice.
1. Either create a new CloudFormation stack by deploying the master.yaml template, or update your existing stack with your version of the templates.

### Create a new ECS service

1. Push your container to a registry somewhere (e.g., [Amazon ECR](https://aws.amazon.com/ecr/)).
2. Copy one of the existing service templates in [services/\*](services/).
3. Update the `ContainerName` and `Image` parameters to point to your container image instead of the example container.
4. Increment the `ListenerRule` priority number (no two services can have the same priority number - this is used to order the ALB path based routing rules).
5. Copy one of the existing service definitions in [master.yaml](master.yaml) and point it at your new service template. Specify the HTTP `Path` at which you want the service exposed.
6. Deploy the templates as a new stack, or as an update to an existing stack.

### Setup centralized container logging

By default, the containers in your ECS tasks/services are already configured to send log information to CloudWatch Logs and retain them for 365 days. Within each service's template (in [services/\*](services/)), a LogGroup is created that is named after the CloudFormation stack. All container logs are sent to that CloudWatch Logs log group.

You can view the logs by looking in your [CloudWatch Logs console](https://console.aws.amazon.com/cloudwatch/home?#logs:) (make sure you are in the correct AWS region).

ECS also supports other logging drivers, including `syslog`, `journald`, `splunk`, `gelf`, `json-file`, and `fluentd`. To configure those instead, adjust the service template to use the alternative `LogDriver`. You can also adjust the log retention period from the default 365 days by tweaking the `RetentionInDays` parameter.

For more information, see the [LogConfiguration](http://docs.aws.amazon.com/AmazonECS/latest/APIReference/API_LogConfiguration.html) API operation.

### Change the ECS host instance type

This is specified in the [master.yaml](master.yaml) template.

By default, [t2.large](https://aws.amazon.com/ec2/instance-types/) instances are used, but you can change this by modifying the following section:

```
ECS:
  Type: AWS::CloudFormation::Stack
  Properties:
    TemplateURL: ...
    Parameters:
      ...
      InstanceType: t2.large
      InstanceCount: 4
      ...
```

### Adjust the Auto Scaling parameters for ECS hosts and services

The Auto Scaling group scaling policy provided by default launches and maintains a cluster of 4 ECS hosts distributed across two Availability Zones (min: 4, max: 4, desired: 4).

It is **_not_** set up to scale automatically based on any policies (CPU, network, time of day, etc.).

If you would like to configure policy or time-based automatic scaling, you can add the [ScalingPolicy](http://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/aws-properties-as-policy.html) property to the AutoScalingGroup deployed in [infrastructure/ecs-cluster.yaml](infrastructure/ecs-cluster.yaml#L69).

As well as configuring Auto Scaling for the ECS hosts (your pool of compute), you can also configure scaling each individual ECS service. This can be useful if you want to run more instances of each container/task depending on the load or time of day (or a custom CloudWatch metric). To do this, you need to create [AWS::ApplicationAutoScaling::ScalingPolicy](http://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/aws-resource-applicationautoscaling-scalingpolicy.html) within your service template.

### Deploy multiple environments (e.g., dev, test, pre-production)

Deploy another CloudFormation stack from the same set of templates to create a new environment. The stack name provided when deploying the stack is prefixed to all taggable resources (e.g., EC2 instances, VPCs, etc.) so you can distinguish the different environment resources in the AWS Management Console.

### Change the VPC or subnet IP ranges

This set of templates deploys the following network design:

| Item           | CIDR Range     | Usable IPs | Description                                        |
| -------------- | -------------- | ---------- | -------------------------------------------------- |
| VPC            | 10.180.0.0/16  | 65,536     | The whole range used for the VPC and all subnets   |
| Public Subnet  | 10.180.8.0/21  | 2,041      | The public subnet in the first Availability Zone   |
| Public Subnet  | 10.180.16.0/21 | 2,041      | The public subnet in the second Availability Zone  |
| Private Subnet | 10.180.24.0/21 | 2,041      | The private subnet in the first Availability Zone  |
| Private Subnet | 10.180.32.0/21 | 2,041      | The private subnet in the second Availability Zone |

You can adjust the CIDR ranges used in this section of the [master.yaml](master.yaml) template:

```
VPC:
  Type: AWS::CloudFormation::Stack
  Properties:
    TemplateURL: !Sub ${TemplateLocation}/infrastructure/vpc.yaml
    Parameters:
      EnvironmentName:    !Ref AWS::StackName
      VpcCIDR:            10.180.0.0/16
      PublicSubnet1CIDR:  10.180.8.0/21
      PublicSubnet2CIDR:  10.180.16.0/21
      PrivateSubnet1CIDR: 10.180.24.0/21
      PrivateSubnet2CIDR: 10.180.32.0/21
```

### Update an ECS service to a new Docker image version

ECS has the ability to perform rolling upgrades to your ECS services to minimize downtime during deployments. For more information, see [Updating a Service](http://docs.aws.amazon.com/AmazonECS/latest/developerguide/update-service.html).

To update one of your services to a new version, adjust the `Image` parameter in the service template (in [services/\*](services/)) to point to the new version of your container image. For example, if `1.0.0` was currently deployed and you wanted to update to `1.1.0`, you could update it as follows:

```
TaskDefinition:
  Type: AWS::ECS::TaskDefinition
  Properties:
    ContainerDefinitions:
      - Name: your-container
        Image: registry.example.com/your-container:1.1.0
```

After you've updated the template, update the deployed CloudFormation stack; CloudFormation and ECS handle the rest.

To adjust the rollout parameters (min/max number of tasks/containers to keep in service at any time), you need to configure `DeploymentConfiguration` for the ECS service.

For example:

```
Service:
  Type: AWS::ECS::Service
  Properties:
    ...
    DesiredCount: 4
    DeploymentConfiguration:
      MaximumPercent: 200
      MinimumHealthyPercent: 50
```

### Use the SSM Run Command function to see details in the ECS instances

The AWS SSM Run Command function, in the EC2 console, can be used to execute commands at the shell on the ECS instances. These can be helpful for examining the installed configuration of the instances without requiring direct access to them.

### Spot Instances and the Hibernate Agent

In order to use Spot with this template, you will need to enable `SpotPrice` under the `AWS::AutoScaling::LaunchConfiguration` or add in `AWS::EC2::SpotFleet` support. To fully use Hibernation with Spot instances, please review [Spot Instance Interruptions](https://docs.aws.amazon.com/AWSEC2/latest/UserGuide/spot-interruptions.html).

### Add a new item to this list

If you found yourself wishing this set of frequently asked questions had an answer for a particular problem, please [submit a pull request](https://help.github.com/articles/creating-a-pull-request-from-a-fork/). The chances are that others will also benefit from having the answer listed here.

## Contributing

Please [create a new GitHub issue](https://github.com/awslabs/ecs-refarch-cloudformation/issues/new) for any feature requests, bugs, or documentation improvements.

Where possible, please also [submit a pull request](https://help.github.com/articles/creating-a-pull-request-from-a-fork/) for the change.

## License

Copyright 2011-2016 Amazon.com, Inc. or its affiliates. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License"). You may not use this file except in compliance with the License. A copy of the License is located at

[http://aws.amazon.com/apache2.0/](http://aws.amazon.com/apache2.0/)

or in the "license" file accompanying this file. This file is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.
​


================================================
FILE: cloudformation/add_cloudflare_ips_to_sgs.py
================================================
#!/usr/bin/env python3
"""
Ensure that every security group tagged with “AllowCloudFlareIngress” has
permissions for every public CloudFlare netblock
"""

import sys

import boto3
import requests
from botocore.exceptions import ClientError

EC2_CLIENT = boto3.client("ec2")


def _fetch_cloudflare_netblocks(url):
    """
    Download one of CloudFlare's published netblock lists.

    Returns the non-blank lines of the response body as a list of strings,
    one CIDR per entry. Raises ``requests.HTTPError`` on a non-2xx response so
    that the body of an error page is never treated as a list of netblocks.
    """
    response = requests.get(url, timeout=30)
    response.raise_for_status()
    return [line.strip() for line in response.text.splitlines() if line.strip()]


# Fetched once when the module is loaded; every security group is compared
# against these two lists.
CLOUDFLARE_IPV4 = _fetch_cloudflare_netblocks("https://www.cloudflare.com/ips-v4")
CLOUDFLARE_IPV6 = _fetch_cloudflare_netblocks("https://www.cloudflare.com/ips-v6")


def add_ingess_rules_for_group(sg_id, existing_permissions):
    """
    Authorize HTTPS ingress from every CloudFlare netblock the group lacks.

    ``sg_id`` is the security group ID. ``existing_permissions`` is that
    group's ``IpPermissions`` list (a list of dicts) as yielded by
    ``get_security_groups``.

    Only CIDRs that are not already present in a tcp/443 rule are submitted.
    When nothing is missing, no API call is made. A ``ClientError`` from EC2 is
    reported on stderr instead of being raised, so the caller can carry on
    with the remaining groups.
    """
    permissions = {"IpProtocol": "tcp", "FromPort": 443, "ToPort": 443}

    existing_ipv4 = set()
    existing_ipv6 = set()

    for existing in existing_permissions:
        # Not every rule carries FromPort/ToPort (e.g. IpProtocol "-1"), so
        # look the keys up with .get() rather than indexing, which would
        # raise KeyError and abort the whole run.
        if any(
            permissions[key] != existing.get(key)
            for key in ("IpProtocol", "FromPort", "ToPort")
        ):
            continue

        existing_ipv4.update(i["CidrIp"] for i in existing.get("IpRanges", ()))
        existing_ipv6.update(i["CidrIpv6"] for i in existing.get("Ipv6Ranges", ()))

    ipv4_ranges = [
        {"CidrIp": cidr, "Description": "CloudFlare"}
        for cidr in CLOUDFLARE_IPV4
        if cidr not in existing_ipv4
    ]
    ipv6_ranges = [
        {"CidrIpv6": cidr, "Description": "CloudFlare"}
        for cidr in CLOUDFLARE_IPV6
        if cidr not in existing_ipv6
    ]

    if not ipv4_ranges and not ipv6_ranges:
        # The group already allows every netblock; a permission without any
        # ranges has nothing to authorize, so skip the API call entirely.
        return

    permissions["IpRanges"] = ipv4_ranges
    permissions["Ipv6Ranges"] = ipv6_ranges

    try:
        EC2_CLIENT.authorize_security_group_ingress(
            GroupId=sg_id, IpPermissions=[permissions]
        )
    except ClientError as exc:
        print(f"Unable to add permssions for {sg_id}: {exc}", file=sys.stderr)


def get_security_groups():
    """
    Iterate over the security groups carrying the AllowCloudFlareIngress tag.

    Yields one ``(group_id, ip_permissions)`` tuple per group, taken from the
    ``GroupId`` and ``IpPermissions`` fields of each entry in every page of
    the ``describe_security_groups`` paginator.
    """
    tag_filter = {"Name": "tag-key", "Values": ["AllowCloudFlareIngress"]}
    pages = EC2_CLIENT.get_paginator("describe_security_groups").paginate(
        Filters=[tag_filter]
    )

    for result_page in pages:
        yield from (
            (group["GroupId"], group["IpPermissions"])
            for group in result_page["SecurityGroups"]
        )


if __name__ == "__main__":
    # Walk every tagged security group and add whichever CloudFlare ranges
    # it does not already allow.
    for group_id, current_rules in get_security_groups():
        add_ingess_rules_for_group(group_id, current_rules)


================================================
FILE: cloudformation/create_secrets.sh
================================================
#!/bin/bash
#
# Create the AWS Secrets Manager entries (Django secret key and database
# credentials) for one environment, encrypted with the KMS key below.
#
# Edit ENV_NAME, DJANGO_SECRET_KEY and DB_PASSWORD before running. The values
# are interpolated verbatim into JSON, so a value containing a double quote
# or a backslash would produce an invalid secret string.

set -eu

# If you create a new set of secrets using a new ENV_NAME here,
# then add the new ENV_NAME option to the list of allowed options in
# master.yaml and infrastructure/fargate-cluster.yaml

export ENV_NAME=cftest2

export DJANGO_SECRET_KEY=
export DB_PASSWORD=
export KMS_KEY_ARN=arn:aws:kms:us-east-1:619333082511:key/d300e73d-9170-4001-933a-37af0bcdb956

# Fail fast instead of storing secrets with an empty key or password when the
# placeholders above have not been filled in.
: "${DJANGO_SECRET_KEY:?DJANGO_SECRET_KEY is empty; set it in this script before running}"
: "${DB_PASSWORD:?DB_PASSWORD is empty; set it in this script before running}"

aws secretsmanager create-secret --name "crowd/${ENV_NAME}/Django/SecretKey" --kms-key-id "${KMS_KEY_ARN}" --secret-string "{\"DjangoSecretKey\": \"${DJANGO_SECRET_KEY}\"}"

aws secretsmanager create-secret --name "crowd/${ENV_NAME}/DB/MasterUserPassword" --kms-key-id "${KMS_KEY_ARN}" --secret-string "{\"username\": \"concordia\",\"engine\": \"postgres\",\"port\": 5432,\"dbname\": \"concordia\",\"password\": \"${DB_PASSWORD}\"}"

# aws secretsmanager create-secret --name "concordia/SMTP" --kms-key-id "${KMS_KEY_ARN}" --secret-string '{"Hostname": "email-smtp.us-east-1.amazonaws.com","Username": "","Password": ""}'


================================================
FILE: cloudformation/featurebranch.yaml
================================================
---
AWSTemplateFormatVersion: '2010-09-09'
Description: >
    Deploy a feature branch to a subdomain of crowd-test.loc.gov
    using pre-existing infrastructure.
    Assumes docker images have been published to ECR with
    tag matching the feature branch name.

# Inputs supplied for each feature-branch deployment.
Parameters:
    # Passed to the Fargate stack as ConcordiaVersion and used as the
    # subdomain label in CanonicalHostName (<branch>.crowd-test.loc.gov).
    ConcordiaBranch:
        Description: which branch name to deploy
        Type: String
        Default: release

    # Passed to the ElastiCache stack as its EnvironmentName.
    AbbreviatedName:
        Description: an abbreviation used for creating short-named cloudformation resources
        Type: String
        Default: rel

    # Forwarded unchanged to the Fargate stack's Priority parameter.
    Priority:
        Type: Number
        Description: Priority of the subdomain listener rule, must be unique in the set of listener rules
        Default: 100

# Four nested stacks, each loaded from the crowd-deployment S3 bucket.
# Security group, subnet and VPC IDs are hard-coded, and every environment
# name and secret path below refers to "test".
Resources:
    # Database stack. Credentials are resolved at deploy time from the
    # crowd/test/DB/MasterUserPassword secret via dynamic references.
    RDS:
        Type: AWS::CloudFormation::Stack
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/rds.yaml'
            Parameters:
                DbPassword: '{{resolve:secretsmanager:crowd/test/DB/MasterUserPassword:SecretString:password}}'
                DbUsername: '{{resolve:secretsmanager:crowd/test/DB/MasterUserPassword:SecretString:username}}'
                DatabaseSecurityGroup: 'sg-0496910b800de2869'
                PrivateSubnet1: 'subnet-0aa55b322229b945a'
                PrivateSubnet2: 'subnet-0f65558b319b2d4dc'

    # Data-load stack, pointed at the host name output by the RDS stack
    # above (the !GetAtt makes this stack depend on RDS).
    DataLoadHost:
        Type: AWS::CloudFormation::Stack
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/data-load.yaml'
            Parameters:
                PostgresqlHost: !GetAtt RDS.Outputs.DatabaseHostName
                PostgresqlPassword: '{{resolve:secretsmanager:crowd/test/DB/MasterUserPassword:SecretString:password}}'
                EnvironmentName: 'test'

    # Redis stack; its EnvironmentName is the AbbreviatedName parameter.
    ElastiCache:
        Type: AWS::CloudFormation::Stack
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/elasticache-feature.yaml'
            Parameters:
                EnvironmentName: !Ref AbbreviatedName
                SecurityGroup: 'sg-028ebfe14211447c4'

    # Fargate stack. It consumes outputs of all three stacks above
    # (Redis endpoint, database host name, data-load stack name).
    FargateCluster:
        Type: AWS::CloudFormation::Stack
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/fargate-featurebranch.yaml'
            Parameters:
                EnvName: 'test'
                FullEnvironmentName: 'test'
                S3BucketName: 'crowd-test-content'
                ExportS3BucketName: 'crowd-test-export'
                ConcordiaVersion: !Ref ConcordiaBranch
                CanonicalHostName: !Sub '${ConcordiaBranch}.crowd-test.loc.gov'
                VpcId: 'vpc-018e5a73079d0b350'
                SecurityGroup: 'sg-04de21574623caca7'
                RedisAddress: !GetAtt ElastiCache.Outputs.RedisAddress
                RedisPort: !GetAtt ElastiCache.Outputs.RedisPort
                DatabaseEndpoint: !GetAtt RDS.Outputs.DatabaseHostName
                Priority: !Ref Priority
                DataLoadStackName: !GetAtt DataLoadHost.Outputs.StackName


================================================
FILE: cloudformation/infrastructure/bastion-hosts.yaml
================================================
Description: This template deploys a bastion host in each of the public subnets.

Parameters:
    # Selects the per-environment column in EnvironmentMapping below and is
    # also used in the instances' Name tags and UserData.
    EnvironmentName:
        Description: An environment name that will be prefixed to resource names
        Type: String
        AllowedValues:
            - dev
            - test
            - stage
            - prod

    # Used as the KeyName of both bastion instances.
    KeyPairName:
        Description: key pair (within this region) for ECS instances access
        Type: String

Mappings:
    # Only us-east-1 has an entry, so the AMI lookup in Resources cannot
    # resolve in any other region.
    AWSRegionToAMI:
        us-east-1:
            AMI: ami-04e5276ebb8451442

    # Hard-coded identifiers, one value per allowed EnvironmentName.
    EnvironmentMapping:
        # Instance profile name assigned to the bastion instances.
        IamInstanceProfileName:
            dev: crowd-dev-FargateCluster-WFCY4I0U7JSM-ConcordiaInstanceProfile-RQHLRZADDM9M
            test: crowd-test-FargateCluster-1R5U1VT4HOYX2-ConcordiaInstanceProfile-1FJXY570ZM2O3
            stage: crowd-stage-FargateCluster-1TBKSIZQKLJHV-ConcordiaInstanceProfile-1XG3TR3LY42ND
            prod: crowd-prod-FargateCluster-1X1CI0J3HFJ9F-ConcordiaInstanceProfile-13SHE5FAB7D6Q

        # The ID of the public subnet in the first AZ
        # Type: AWS::EC2::Subnet::Id
        PublicSubnet1:
            dev: subnet-079b5dd4f9acf44e6
            test: subnet-06f443ea589879e8d
            stage: subnet-06f40e2fc8d891692
            prod: subnet-09fdaf1c5c73f588f

        # The ID of the public subnet in the second AZ
        # Type: AWS::EC2::Subnet::Id
        PublicSubnet2:
            dev: subnet-01d6614725c7dabd6
            test: subnet-05a15c6058ebdf54f
            stage: subnet-0a022eb0c614b0b00
            prod: subnet-01580e2a4d6d42b52

        # The security group for bastion hosts
        # Type: AWS::EC2::SecurityGroup::Id
        BastionHostsSecurityGroup:
            dev: sg-062afe8941ace25ad
            test: sg-0208b0df704b66c3c
            stage: sg-0a2175a2df32a4332
            prod: sg-066c68e77787b2a10

Resources:
    # Bastion host in PublicSubnet1 with a public IP address.
    # The UserData script records ENV_NAME in ec2-user's .bash_profile,
    # upgrades the system, installs git, the PostgreSQL 15 client and docker
    # (each dnf command is retried until it succeeds), and finally copies the
    # latest database dump from the crowd-deployment bucket.
    Bastion1:
        Type: AWS::EC2::Instance
        Properties:
            # AMI looked up by region (only us-east-1 is mapped).
            ImageId:
                Fn::FindInMap:
                    - AWSRegionToAMI
                    - Ref: 'AWS::Region'
                    - 'AMI'
            InstanceType: 't2.medium'
            IamInstanceProfile:
                Fn::FindInMap:
                    - EnvironmentMapping
                    - IamInstanceProfileName
                    - Ref: EnvironmentName
            KeyName:
                Ref: KeyPairName
            # Single network interface; security group and subnet come from
            # the per-environment mapping.
            NetworkInterfaces:
                - AssociatePublicIpAddress: true
                  DeviceIndex: '0'
                  GroupSet:
                      - Fn::FindInMap:
                            - EnvironmentMapping
                            - BastionHostsSecurityGroup
                            - Ref: EnvironmentName
                  SubnetId:
                      Fn::FindInMap:
                          - EnvironmentMapping
                          - PublicSubnet1
                          - Ref: EnvironmentName
            UserData:
                Fn::Base64: !Sub |
                    #!/bin/bash -xe
                    echo "Running userdata for ${EnvironmentName}"
                    echo "export ENV_NAME=${EnvironmentName}" >> /home/ec2-user/.bash_profile
                    source /home/ec2-user/.bash_profile
                    # TODO while true is a workaround for AL2023 Consistently Failing to boot
                    #  · Issue #3741· philips-labs/terraform-aws-github-runner
                    # https://github.com/amazonlinux/amazon-linux-2023/issues/397
                    while true; do
                      dnf -y upgrade --releasever=latest && break
                    done
                    while true; do
                      dnf -y install --assumeyes git && break
                    done
                    while true; do
                      dnf -y install --assumeyes postgresql15.x86_64 && break
                    done
                    while true; do
                      dnf -y install --assumeyes docker.x86_64 && break
                    done
                    aws s3 cp s3://crowd-deployment/database-dumps/concordia.latest.dmp concordia.dmp
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName}-BastionHost-1

    # Second bastion host, in PublicSubnet2 with a public IP address.
    # Its UserData runs the same steps as Bastion1: record ENV_NAME, upgrade
    # the system, install git, the PostgreSQL 15 client and docker (retrying
    # each dnf command until it succeeds), then copy the latest database dump
    # from the crowd-deployment bucket.
    Bastion2:
        Type: AWS::EC2::Instance
        Properties:
            # AMI looked up by region (only us-east-1 is mapped).
            ImageId:
                Fn::FindInMap:
                    - AWSRegionToAMI
                    - Ref: 'AWS::Region'
                    - 'AMI'
            InstanceType: 't2.medium'
            IamInstanceProfile:
                Fn::FindInMap:
                    - EnvironmentMapping
                    - IamInstanceProfileName
                    - Ref: EnvironmentName
            KeyName:
                Ref: KeyPairName
            # Single network interface; security group and subnet come from
            # the per-environment mapping.
            NetworkInterfaces:
                - AssociatePublicIpAddress: true
                  DeviceIndex: '0'
                  GroupSet:
                      - Fn::FindInMap:
                            - EnvironmentMapping
                            - BastionHostsSecurityGroup
                            - Ref: EnvironmentName
                  SubnetId:
                      Fn::FindInMap:
                          - EnvironmentMapping
                          - PublicSubnet2
                          - Ref: EnvironmentName
            UserData:
                Fn::Base64: !Sub |
                    #!/bin/bash -xe
                    echo "Running userdata for ${EnvironmentName}"
                    echo "export ENV_NAME=${EnvironmentName}" >> /home/ec2-user/.bash_profile
                    source /home/ec2-user/.bash_profile
                    while true; do
                      dnf -y upgrade --releasever=latest && break
                    done
                    while true; do
                      dnf -y install --assumeyes git && break
                    done
                    while true; do
                      dnf -y install --assumeyes postgresql15.x86_64 && break
                    done
                    while true; do
                      dnf -y install --assumeyes docker.x86_64 && break
                    done
                    aws s3 cp s3://crowd-deployment/database-dumps/concordia.latest.dmp concordia.dmp
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName}-BastionHost-2


================================================
FILE: cloudformation/infrastructure/data-load.yaml
================================================
Description:
    This template deploys a host in a private subnet and loads the most recent
    database dump to the specified database server.

Parameters:
    # Selects the per-environment column in EnvironmentMapping below and is
    # also used in the instance's Name tag and UserData.
    EnvironmentName:
        Description: An environment name that will be prefixed to resource names
        Type: String
        AllowedValues:
            - dev
            - test
            - stage
            - prod

    # Host name used for every psql / pg_restore call in UserData.
    PostgresqlHost:
        Description: the end point of the RDS database host to restore
        Type: String

    # Written to /root/.pgpass by the UserData script; NoEcho keeps it out of
    # console and API output.
    PostgresqlPassword:
        Description: the password for the RDS endpoint to restore
        Type: String
        NoEcho: true

Mappings:
    # Only us-east-1 has an entry, so the AMI lookup in Resources cannot
    # resolve in any other region.
    AWSRegionToAMI:
        us-east-1:
            AMI: ami-04e5276ebb8451442

    # Hard-coded identifiers, one value per allowed EnvironmentName.
    EnvironmentMapping:
        # Instance profile name assigned to the data-load instance.
        IamInstanceProfileName:
            dev: crowd-dev-FargateCluster-WFCY4I0U7JSM-ConcordiaInstanceProfile-RQHLRZADDM9M
            test: crowd-test-FargateCluster-1R5U1VT4HOYX2-ConcordiaInstanceProfile-1FJXY570ZM2O3
            stage: crowd-stage-FargateCluster-1TBKSIZQKLJHV-ConcordiaInstanceProfile-1XG3TR3LY42ND
            prod: crowd-prod-FargateCluster-1X1CI0J3HFJ9F-ConcordiaInstanceProfile-13SHE5FAB7D6Q

        # Subnet the data-load instance is launched into.
        PrivateSubnet1:
            dev: subnet-0c95a830ce007fa65
            test: subnet-0aa55b322229b945a
            stage: subnet-0f7c7d66b66d6dd90
            prod: subnet-0da84976b66c32ce4

        # The security group for bastion hosts
        # Type: AWS::EC2::SecurityGroup::Id
        BastionHostsSecurityGroup:
            dev: sg-062afe8941ace25ad
            test: sg-0208b0df704b66c3c
            stage: sg-0a2175a2df32a4332
            prod: sg-066c68e77787b2a10

Resources:
    # One-shot instance that restores the latest database dump and then
    # powers itself off (InstanceInitiatedShutdownBehavior: terminate).
    #
    # CloudFormation waits up to 30 minutes for a cfn-signal from the
    # UserData script: exit code 0 after a successful restore, exit code 1
    # from the ERR trap if any command fails.
    #
    # The script drops and recreates the "concordia" database. The drop uses
    # IF EXISTS so that a restore into a server that does not have the
    # database yet does not fail the stack.
    DataLoadHost:
        Type: AWS::EC2::Instance
        CreationPolicy:
            ResourceSignal:
                Timeout: PT30M
        Properties:
            # AMI looked up by region (only us-east-1 is mapped).
            ImageId:
                Fn::FindInMap:
                    - AWSRegionToAMI
                    - Ref: 'AWS::Region'
                    - 'AMI'
            InstanceType: 't2.medium'
            IamInstanceProfile:
                Fn::FindInMap:
                    - EnvironmentMapping
                    - IamInstanceProfileName
                    - Ref: EnvironmentName
            InstanceInitiatedShutdownBehavior: terminate
            # NOTE(review): a public IP is requested although the subnet comes
            # from the PrivateSubnet1 mapping - confirm this is intended.
            NetworkInterfaces:
                - AssociatePublicIpAddress: true
                  DeviceIndex: '0'
                  GroupSet:
                      - Fn::FindInMap:
                            - EnvironmentMapping
                            - BastionHostsSecurityGroup
                            - Ref: EnvironmentName
                  SubnetId:
                      Fn::FindInMap:
                          - EnvironmentMapping
                          - PrivateSubnet1
                          - Ref: EnvironmentName
            UserData:
                Fn::Base64: !Sub |
                    #!/bin/bash -xe
                    trap '/opt/aws/bin/cfn-signal --exit-code 1 --resource DataLoadHost --region ${AWS::Region} --stack ${AWS::StackName}' ERR
                    echo "Running userdata for ${EnvironmentName}"
                    echo "export ENV_NAME=${EnvironmentName}" >> /home/ec2-user/.bash_profile
                    source /home/ec2-user/.bash_profile
                    # TODO while true is a workaround for AL2023 Consistently Failing to boot
                    #  · Issue #3741· philips-labs/terraform-aws-github-runner
                    # https://github.com/amazonlinux/amazon-linux-2023/issues/397
                    while true; do
                      dnf -y upgrade --releasever=latest && break
                    done
                    while true; do
                      dnf -y install --assumeyes postgresql15.x86_64 && break
                    done
                    aws s3 cp s3://crowd-deployment/database-dumps/concordia.latest.dmp concordia.dmp
                    echo "${PostgresqlHost}:5432:*:concordia:${PostgresqlPassword}" >> /root/.pgpass
                    chmod 0600 /root/.pgpass
                    psql -U concordia -h ${PostgresqlHost} -d postgres -c "select pg_terminate_backend(pid) from pg_stat_activity where datname='concordia';"
                    psql -U concordia -h ${PostgresqlHost} -d postgres -c "drop database if exists concordia;"
                    pg_restore --create -Fc -U concordia -h ${PostgresqlHost} --dbname=postgres --no-password --no-owner --no-acl concordia.dmp
                    # Signal the status from cfn-init
                    /opt/aws/bin/cfn-signal --exit-code 0 --resource DataLoadHost --region ${AWS::Region} --stack ${AWS::StackName}
                    shutdown -h now
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName}-DataLoadHost
Outputs:
    # Name of this stack, exposed so a parent template can reference it.
    StackName:
        Description: 'Stackname for the DataLoadHost'
        Value: !Ref AWS::StackName


================================================
FILE: cloudformation/infrastructure/elasticache-feature.yaml
================================================
Description: >
    This template deploys an elasticache cluster to the provided VPC and subnets

Parameters:
    # Used as the prefix of the cache cluster name.
    EnvironmentName:
        Type: String
        Description: An environment name that will be prefixed to resource names

    # Security group attached to the cache cluster.
    SecurityGroup:
        Type: AWS::EC2::SecurityGroup::Id
        Description: Select the Security Group to use for the ECS cluster hosts

    # Node size of the cache cluster.
    CacheNodeType:
        Default: cache.m5.large
        Type: String

Resources:
    # Single-node Redis cache cluster. The subnet group name is hard-coded
    # (it is not created by this template).
    RedisService:
        Type: AWS::ElastiCache::CacheCluster
        Properties:
            ClusterName: !Sub "${EnvironmentName}-redis"
            Engine: redis
            NumCacheNodes: 1
            CacheNodeType: !Ref CacheNodeType
            CacheSubnetGroupName: crowd-cache-1frtjeewr57u7
            VpcSecurityGroupIds:
                - !Ref SecurityGroup
            AutoMinorVersionUpgrade: true
            SnapshotRetentionLimit: 1

Outputs:
    # Host name of the Redis endpoint of RedisService.
    RedisAddress:
        Value: !GetAtt RedisService.RedisEndpoint.Address
        Description: Redis endpoint address

    # Port of the Redis endpoint of RedisService.
    RedisPort:
        Value: !GetAtt RedisService.RedisEndpoint.Port
        Description: Redis endpoint port


================================================
FILE: cloudformation/infrastructure/elasticache.yaml
================================================
Description: >
    This template deploys an elasticache cluster to the provided VPC and subnets

Parameters:
    # Used as the prefix of the cache cluster name.
    EnvironmentName:
        Type: String
        Description: An environment name that will be prefixed to resource names

    # Subnets that make up the cache subnet group.
    PrivateSubnets:
        Type: List<AWS::EC2::Subnet::Id>
        Description: Choose which subnets this ECS cluster should be deployed to

    # Security group attached to the cache cluster.
    SecurityGroup:
        Type: AWS::EC2::SecurityGroup::Id
        Description: Select the Security Group to use for the ECS cluster hosts

    # Node size of the cache cluster.
    CacheNodeType:
        Default: cache.m1.small
        Type: String

Resources:
    # Subnet group built from the PrivateSubnets parameter; retained on
    # stack deletion and on replacement.
    CachePrivateSubnetGroup:
        Type: AWS::ElastiCache::SubnetGroup
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            SubnetIds: !Ref PrivateSubnets
            Description: Private subnet group
    # Single-node Redis cache cluster placed in CachePrivateSubnetGroup;
    # retained on stack deletion and on replacement.
    RedisService:
        Type: AWS::ElastiCache::CacheCluster
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            ClusterName: !Sub "${EnvironmentName}-redis"
            Engine: redis
            NumCacheNodes: 1
            CacheNodeType: !Ref CacheNodeType
            CacheSubnetGroupName: !Ref CachePrivateSubnetGroup
            VpcSecurityGroupIds:
                - !Ref SecurityGroup
            AutoMinorVersionUpgrade: true
            SnapshotRetentionLimit: 1

Outputs:
    # Host name of the Redis endpoint of RedisService.
    RedisAddress:
        Value: !GetAtt RedisService.RedisEndpoint.Address
        Description: Redis endpoint address

    # Port of the Redis endpoint of RedisService.
    RedisPort:
        Value: !GetAtt RedisService.RedisEndpoint.Port
        Description: Redis endpoint port


================================================
FILE: cloudformation/infrastructure/elasticsearch.yaml
================================================
Description: >
    This template deploys a VPC-based ElasticSearch cluster.

Parameters:
    # Short environment name; used in the access-policy ARN and the
    # Environment tag of the domain.
    EnvName:
        Type: String
        Description: which environment to target
        ConstraintDescription: Must match a location for secret storage in secretsmanager
        AllowedValues:
            - dev
            - test
            - stage
            - prod

    # Security group attached to the domain's VPC endpoint.
    SecurityGroup:
        Type: AWS::EC2::SecurityGroup::Id
        Description: Select the Security Group to use for the ECS cluster hosts

    # The single subnet the domain is placed in.
    PrivateSubnet2:
        Type: AWS::EC2::Subnet::Id
        Description: The private subnet in AZ2 for the VPC

Resources:
    # Single-instance Elasticsearch 7.10 domain attached to one subnet and
    # one security group.
    ESCluster:
        Type: AWS::Elasticsearch::Domain
        Properties:
            ElasticsearchVersion: "7.10"
            ElasticsearchClusterConfig:
                InstanceType: m5.xlarge.elasticsearch
                InstanceCount: 1
                ZoneAwarenessEnabled: false
            EBSOptions:
                EBSEnabled: true
                VolumeType: standard
                VolumeSize: 20
                Iops: 0
            SnapshotOptions:
                AutomatedSnapshotStartHour: 0
            VPCOptions:
                SubnetIds:
                    - !Ref PrivateSubnet2
                SecurityGroupIds:
                    - !Ref SecurityGroup
            # The policy allows every principal to perform every es: action on
            # the ARN below; region and account id in that ARN are hard-coded.
            AccessPolicies:
                Version: "2012-10-17"
                Statement:
                    - Effect: Allow
                      Principal:
                          AWS: "*"
                      Action: "es:*"
                      Resource: !Sub "arn:aws:es:us-east-1:619333082511:domain/crowd-${EnvName}-vpc/*"
            AdvancedOptions:
                # Must stay a string, hence the quotes.
                rest.action.multi.allow_explicit_index: "true"
            Tags:
                - Key: Environment
                  Value: !Ref EnvName


================================================
FILE: cloudformation/infrastructure/fargate-cluster.yaml
================================================
Description: >
    This template deploys a fargate cluster to the provided VPC and subnets

Parameters:
    # --- Naming -----------------------------------------------------------
    EnvironmentName:
        Type: String
        Description: An environment name that will be prefixed to resource names

    # --- Networking -------------------------------------------------------
    PublicSubnets:
        Type: List<AWS::EC2::Subnet::Id>
        Description: The subnets for the load balancer

    PrivateSubnets:
        Type: List<AWS::EC2::Subnet::Id>
        Description: Choose which subnets this ECS cluster should be deployed to

    SecurityGroup:
        Type: AWS::EC2::SecurityGroup::Id
        Description: Select the Security Group to use for the ECS cluster hosts

    LoadBalancerSecurityGroup:
        Type: AWS::EC2::SecurityGroup::Id
        Description: The SecurityGroup for load balancer

    VpcId:
        Type: AWS::EC2::VPC::Id
        Description: The Id of the VPC for this cluster

    # --- Application image ------------------------------------------------
    ConcordiaVersion:
        Type: String
        Default: latest
        Description: version of concordia docker images to pull and deploy

    # --- Secrets Manager ARN suffixes -------------------------------------
    DjangoKeyId:
        Type: String
        Default: xxxxx
        Description: unique ID appended to end of DjangoSecretKey ARN in secrets manager

    DbSecretId:
        Type: String
        Default: xxxxx
        Description: unique ID appended to end of DB password ARN in secrets manager

    # --- Environment selection --------------------------------------------
    EnvName:
        Type: String
        Description: which environment to target
        ConstraintDescription: Must match a location for secret storage in secretsmanager
        AllowedValues:
            - dev
            - test
            - stage
            - prod
            - cftest2

    FullEnvironmentName:
        Type: String
        Description: Full name of deployment environment
        AllowedValues:
            - development
            - test
            - staging
            - production

    # --- Backing services -------------------------------------------------
    RedisAddress:
        Type: String
        Description: Redis endpoint address

    RedisPort:
        Type: String
        Description: Redis endpoint port

    CanonicalHostName:
        Type: String
        Description: canonical host name of the application, e.g. crowd-test.loc.gov

    DatabaseEndpoint:
        Type: String
        Description: Host name of the Postgres RDS service

    # --- Storage ----------------------------------------------------------
    S3BucketName:
        Type: String
        Description: name of the S3 bucket (public) where collection images will be stored

    ExportS3BucketName:
        Type: String
        Description: name of the S3 bucket (public) where exported transcriptions will be stored

Resources:
    # Inline IAM policy, attached to the task role and the EC2 role, that
    # grants access to the crowd-<EnvironmentName>-content and
    # crowd-<EnvironmentName>-export buckets.
    #
    # S3 distinguishes object-level actions (authorized against
    # "arn:aws:s3:::bucket/*") from bucket-level actions (authorized against
    # "arn:aws:s3:::bucket"). The two kinds are therefore granted in separate
    # statements; listing actions placed on the "/*" resource never match.
    ConcordiaS3BucketAccessPolicy:
        UpdateReplacePolicy: Retain
        Type: AWS::IAM::Policy
        Metadata:
            cfn_nag:
                rules_to_suppress:
                    - id: W12
                      reason: 'S3 buckets must be specified with /* after the bucket name'
        DeletionPolicy: Retain
        Properties:
            PolicyName: !Sub ConcordiaServiceS3BucketAccess-${EnvironmentName}
            Roles:
                - !Ref 'ConcordiaTaskRole'
                - !Ref 'ConcordiaEC2Role'
            PolicyDocument:
                Version: '2012-10-17'
                Statement:
                    # Object-level actions: resource is every key in the bucket.
                    - Effect: Allow
                      Action:
                          - 's3:PutObject'
                          - 's3:GetObject'
                          - 's3:AbortMultipartUpload'
                          - 's3:ListMultipartUploadParts'
                      Resource:
                          - !Sub 'arn:aws:s3:::crowd-${EnvironmentName}-content/*'
                          - !Sub 'arn:aws:s3:::crowd-${EnvironmentName}-export/*'
                    # Bucket-level actions: resource is the bucket itself.
                    - Effect: Allow
                      Action:
                          - 's3:ListBucket'
                          - 's3:ListBucketMultipartUploads'
                      Resource:
                          - !Sub 'arn:aws:s3:::crowd-${EnvironmentName}-content'
                          - !Sub 'arn:aws:s3:::crowd-${EnvironmentName}-export'

    # Inline IAM policy, attached to the task role and the EC2 role, that
    # allows read/decrypt style operations on one hard-coded KMS key.
    ConcordiaKMSAccessPolicy:
        Type: AWS::IAM::Policy
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            PolicyName: !Sub "ConcordiaServiceKMSAccess-${EnvironmentName}"
            Roles:
                - !Ref ConcordiaTaskRole
                - !Ref ConcordiaEC2Role
            PolicyDocument:
                Version: "2012-10-17"
                Statement:
                    - Effect: Allow
                      Resource:
                          - arn:aws:kms:us-east-1:619333082511:key/d300e73d-9170-4001-933a-37af0bcdb956
                      Action:
                          - kms:GetParametersForImport
                          - kms:GetKeyRotationStatus
                          - kms:GetKeyPolicy
                          - kms:DescribeKey
                          - kms:ListResourceTags
                          - kms:Decrypt
                          - kms:GenerateDataKey

    # Inline IAM policy, attached to the task role and the EC2 role, that
    # allows reading three Secrets Manager secrets: the SMTP secret plus the
    # per-environment Django secret key and DB master password.
    ConcordiaServiceSecretAccessPolicy:
        Type: AWS::IAM::Policy
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            PolicyName: !Sub "ConcordiaServiceSecretAccess-${EnvironmentName}"
            Roles:
                - !Ref ConcordiaTaskRole
                - !Ref ConcordiaEC2Role
            PolicyDocument:
                Version: "2012-10-17"
                Statement:
                    - Effect: Allow
                      Resource:
                          - arn:aws:secretsmanager:us-east-1:619333082511:secret:concordia/SMTP-GVlolk
                          # The trailing ids come from the DjangoKeyId / DbSecretId parameters.
                          - !Sub "arn:aws:secretsmanager:us-east-1:619333082511:secret:crowd/${EnvName}/Django/SecretKey-${DjangoKeyId}"
                          - !Sub "arn:aws:secretsmanager:us-east-1:619333082511:secret:crowd/${EnvName}/DB/MasterUserPassword-${DbSecretId}"
                      Action:
                          - secretsmanager:GetResourcePolicy
                          - secretsmanager:GetSecretValue
                          - secretsmanager:DescribeSecret
                          - secretsmanager:ListSecretVersionIds

    # IAM role assumable by EC2, carrying the ECR read-only and ECS task
    # execution managed policies.
    ConcordiaEC2Role:
        Type: AWS::IAM::Role
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            Path: /
            ManagedPolicyArns:
                - arn:aws:iam::aws:policy/AmazonEC2ContainerRegistryReadOnly
                - arn:aws:iam::aws:policy/service-role/AmazonECSTaskExecutionRolePolicy
            AssumeRolePolicyDocument:
                Version: "2012-10-17"
                Statement:
                    - Effect: Allow
                      Action: sts:AssumeRole
                      Principal:
                          Service: ec2.amazonaws.com

    # Instance profile wrapping ConcordiaEC2Role.
    ConcordiaInstanceProfile:
        Type: AWS::IAM::InstanceProfile
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            Roles:
                - !Ref ConcordiaEC2Role
            Path: /

    # IAM role assumable by ECS tasks; ConcordiaTask uses it as both its
    # execution role and its task role.
    ConcordiaTaskRole:
        Type: AWS::IAM::Role
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            ManagedPolicyArns:
                - arn:aws:iam::aws:policy/AmazonEC2ContainerRegistryReadOnly
                - arn:aws:iam::aws:policy/service-role/AmazonECSTaskExecutionRolePolicy
            AssumeRolePolicyDocument:
                Version: "2012-10-17"
                Statement:
                    - Effect: Allow
                      Action:
                          - sts:AssumeRole
                      Principal:
                          Service: ecs-tasks.amazonaws.com

    # CloudWatch log group named after the stack; entries are kept 30 days.
    ConcordiaAppLogsGroup:
        Type: AWS::Logs::LogGroup
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            RetentionInDays: 30
            LogGroupName:
                Ref: AWS::StackName

    # IP-target group on HTTP port 80, health-checked via GET /healthz.
    ConcordiaExternalTargetGroup:
        Type: AWS::ElasticLoadBalancingV2::TargetGroup
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            VpcId: !Ref VpcId
            TargetType: ip
            Protocol: HTTP
            Port: 80
            # Health check: every 30s, 5s timeout, 2 passes to become healthy,
            # 10 failures to become unhealthy.
            HealthCheckProtocol: HTTP
            HealthCheckPath: /healthz
            HealthCheckIntervalSeconds: 30
            HealthCheckTimeoutSeconds: 5
            HealthyThresholdCount: 2
            UnhealthyThresholdCount: 10

    # Load balancer placed in the public subnets with its own security group.
    LoadBalancer:
        Type: AWS::ElasticLoadBalancingV2::LoadBalancer
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            SecurityGroups:
                - !Ref LoadBalancerSecurityGroup
            Subnets: !Ref PublicSubnets

    # Plain-HTTP listener (port 80) that forwards to the external target group.
    ExternalLoadBalancerListener:
        Type: AWS::ElasticLoadBalancingV2::Listener
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            LoadBalancerArn: !Ref LoadBalancer
            Protocol: HTTP
            Port: 80
            DefaultActions:
                # FIXME: When AWS CF supports it, redirect to https
                # instead of forward to target group
                - Type: forward
                  TargetGroupArn: !Ref ConcordiaExternalTargetGroup

    # HTTPS listener (port 443) that forwards to the external target group.
    # The certificate is an IAM server certificate named after CanonicalHostName.
    SecureExternalLoadBalancerListener:
        Type: AWS::ElasticLoadBalancingV2::Listener
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            LoadBalancerArn: !Ref LoadBalancer
            Protocol: HTTPS
            Port: 443
            Certificates:
                - CertificateArn: !Sub "arn:aws:iam::${AWS::AccountId}:server-certificate/${CanonicalHostName}"
            DefaultActions:
                - Type: forward
                  TargetGroupArn: !Ref ConcordiaExternalTargetGroup

    # ECS cluster whose name is the EnvironmentName parameter.
    ECSCluster:
        Type: AWS::ECS::Cluster
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            ClusterName:
                Ref: EnvironmentName

    # Fargate task definition (family crowd-<EnvName>) made of three containers:
    #   app        - web container, exposes port 80
    #   importer   - image concordia/importer
    #   celerybeat - image concordia/celerybeat
    # All three images are pulled from this account's ECR at tag ConcordiaVersion,
    # log to ConcordiaAppLogsGroup, and receive the same environment variables.
    ConcordiaTask:
        UpdateReplacePolicy: Retain
        Type: AWS::ECS::TaskDefinition
        DeletionPolicy: Retain
        Properties:
            Family: !Sub crowd-${EnvName}
            # Task-level sizing; the container Cpu values below
            # (2048 + 1024 + 1024) add up to this 4096.
            Cpu: '4096'
            Memory: '16384'
            NetworkMode: awsvpc
            RequiresCompatibilities:
                - FARGATE
            # The same role is used for both execution and task permissions.
            ExecutionRoleArn: !GetAtt ConcordiaTaskRole.Arn
            TaskRoleArn: !GetAtt ConcordiaTaskRole.Arn
            # Volume mounted by app and importer at /concordia_images.
            Volumes:
                - Name: images_volume
            ContainerDefinitions:
                # --- app: the container the load balancer targets (port 80) ---
                - Name: app
                  Cpu: 2048
                  Image: !Sub '${AWS::AccountId}.dkr.ecr.${AWS::Region}.amazonaws.com/concordia:${ConcordiaVersion}'
                  LogConfiguration:
                      LogDriver: awslogs
                      Options:
                          awslogs-group: !Ref 'ConcordiaAppLogsGroup'
                          awslogs-region: !Ref 'AWS::Region'
                          awslogs-stream-prefix: ConcordiaServer
                  Environment:
                      - Name: AWS
                        Value: '1'
                      - Name: ENV_NAME
                        Value: !Ref EnvName
                      - Name: CONCORDIA_ENVIRONMENT
                        Value: !Ref FullEnvironmentName
                      - Name: S3_BUCKET_NAME
                        Value: !Ref S3BucketName
                      - Name: EXPORT_S3_BUCKET_NAME
                        Value: !Ref ExportS3BucketName
                      # Redis database 0 on the endpoint passed in as parameters.
                      - Name: CELERY_BROKER_URL
                        Value: !Sub 'redis://${RedisAddress}:${RedisPort}/0'
                      - Name: AWS_DEFAULT_REGION
                        Value: !Ref AWS::Region
                      - Name: SENTRY_BACKEND_DSN
                        Value: https://6727341eabcd47e3a48ce300432e840b@errorlogging.loc.gov/5
                      - Name: SENTRY_FRONTEND_DSN
                        Value: https://77a13a941ffd485dbf41dbf8e7a0bdd0@errorlogging.loc.gov/4
                      - Name: REDIS_ADDRESS
                        Value: !Ref RedisAddress
                      - Name: REDIS_PORT
                        Value: !Ref RedisPort
                      - Name: POSTGRESQL_HOST
                        Value: !Ref DatabaseEndpoint
                      - Name: HOST_NAME
                        Value: !Ref CanonicalHostName
                      - Name: DJANGO_SETTINGS_MODULE
                        Value: concordia.settings_ecs
                  MountPoints:
                      - SourceVolume: images_volume
                        ContainerPath: /concordia_images
                  PortMappings:
                      - ContainerPort: 80
                # --- importer: same environment as app, no port mapping ---
                - Name: importer
                  Cpu: 1024
                  Image: !Sub '${AWS::AccountId}.dkr.ecr.${AWS::Region}.amazonaws.com/concordia/importer:${ConcordiaVersion}'
                  LogConfiguration:
                      LogDriver: awslogs
                      Options:
                          awslogs-group: !Ref 'ConcordiaAppLogsGroup'
                          awslogs-region: !Ref 'AWS::Region'
                          awslogs-stream-prefix: ConcordiaWorker
                  Environment:
                      - Name: AWS
                        Value: '1'
                      - Name: ENV_NAME
                        Value: !Ref EnvName
                      - Name: CONCORDIA_ENVIRONMENT
                        Value: !Ref FullEnvironmentName
                      - Name: S3_BUCKET_NAME
                        Value: !Ref S3BucketName
                      - Name: EXPORT_S3_BUCKET_NAME
                        Value: !Ref ExportS3BucketName
                      - Name: CELERY_BROKER_URL
                        Value: !Sub 'redis://${RedisAddress}:${RedisPort}/0'
                      - Name: AWS_DEFAULT_REGION
                        Value: !Ref AWS::Region
                      - Name: SENTRY_BACKEND_DSN
                        Value: https://6727341eabcd47e3a48ce300432e840b@errorlogging.loc.gov/5
                      - Name: SENTRY_FRONTEND_DSN
                        Value: https://77a13a941ffd485dbf41dbf8e7a0bdd0@errorlogging.loc.gov/4
                      - Name: REDIS_ADDRESS
                        Value: !Ref RedisAddress
                      - Name: REDIS_PORT
                        Value: !Ref RedisPort
                      - Name: POSTGRESQL_HOST
                        Value: !Ref DatabaseEndpoint
                      - Name: HOST_NAME
                        Value: !Ref CanonicalHostName
                      - Name: DJANGO_SETTINGS_MODULE
                        Value: concordia.settings_ecs
                  MountPoints:
                      - SourceVolume: images_volume
                        ContainerPath: /concordia_images
                # --- celerybeat: same environment; no mount points or ports.
                # Shares the ConcordiaWorker log stream prefix with importer.
                - Name: celerybeat
                  Cpu: 1024
                  Image: !Sub '${AWS::AccountId}.dkr.ecr.${AWS::Region}.amazonaws.com/concordia/celerybeat:${ConcordiaVersion}'
                  LogConfiguration:
                      LogDriver: awslogs
                      Options:
                          awslogs-group: !Ref 'ConcordiaAppLogsGroup'
                          awslogs-region: !Ref 'AWS::Region'
                          awslogs-stream-prefix: ConcordiaWorker
                  Environment:
                      - Name: AWS
                        Value: '1'
                      - Name: ENV_NAME
                        Value: !Ref EnvName
                      - Name: CONCORDIA_ENVIRONMENT
                        Value: !Ref FullEnvironmentName
                      - Name: S3_BUCKET_NAME
                        Value: !Ref S3BucketName
                      - Name: EXPORT_S3_BUCKET_NAME
                        Value: !Ref ExportS3BucketName
                      - Name: CELERY_BROKER_URL
                        Value: !Sub 'redis://${RedisAddress}:${RedisPort}/0'
                      - Name: AWS_DEFAULT_REGION
                        Value: !Ref AWS::Region
                      - Name: SENTRY_BACKEND_DSN
                        Value: https://6727341eabcd47e3a48ce300432e840b@errorlogging.loc.gov/5
                      - Name: SENTRY_FRONTEND_DSN
                        Value: https://77a13a941ffd485dbf41dbf8e7a0bdd0@errorlogging.loc.gov/4
                      - Name: REDIS_ADDRESS
                        Value: !Ref RedisAddress
                      - Name: REDIS_PORT
                        Value: !Ref RedisPort
                      - Name: POSTGRESQL_HOST
                        Value: !Ref DatabaseEndpoint
                      - Name: HOST_NAME
                        Value: !Ref CanonicalHostName
                      - Name: DJANGO_SETTINGS_MODULE
                        Value: concordia.settings_ecs

    # Fargate service running one copy of ConcordiaTask in the private
    # subnets, with the "app" container (port 80) registered in the external
    # target group. Created only after the HTTP listener exists.
    ConcordiaExternalService:
        Type: AWS::ECS::Service
        DependsOn: ExternalLoadBalancerListener
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            Cluster: !Ref ECSCluster
            TaskDefinition: !Ref ConcordiaTask
            LaunchType: FARGATE
            DesiredCount: 1
            DeploymentConfiguration:
                MinimumHealthyPercent: 75
                MaximumPercent: 200
            NetworkConfiguration:
                AwsvpcConfiguration:
                    Subnets: !Ref PrivateSubnets
                    SecurityGroups:
                        - !Ref SecurityGroup
            LoadBalancers:
                - TargetGroupArn: !Ref ConcordiaExternalTargetGroup
                  ContainerName: app
                  ContainerPort: 80

Outputs:
    # DNS name of the LoadBalancer resource.
    LoadBalancerUrl:
        Value: !GetAtt LoadBalancer.DNSName
        Description: The URL of the ALB


================================================
FILE: cloudformation/infrastructure/fargate-featurebranch.yaml
================================================
Description: >
    This template deploys a fargate cluster to the provided VPC and subnets

Parameters:
    # --- Networking -------------------------------------------------------
    SecurityGroup:
        Type: AWS::EC2::SecurityGroup::Id
        Description: Select the Security Group to use for the ECS cluster hosts

    VpcId:
        Type: AWS::EC2::VPC::Id
        Description: The Id of the VPC for this cluster

    # --- Application image ------------------------------------------------
    ConcordiaVersion:
        Type: String
        Default: latest
        Description: docker tag of concordia app image to pull and deploy

    # --- Environment selection --------------------------------------------
    EnvName:
        Type: String
        Description: which environment to target
        ConstraintDescription: Must match a location for secret storage in secretsmanager
        AllowedValues:
            - dev
            - test
            - stage
            - prod

    FullEnvironmentName:
        Type: String
        Description: Full name of deployment environment
        AllowedValues:
            - development
            - test
            - staging
            - production

    # --- Backing services -------------------------------------------------
    RedisAddress:
        Type: String
        Description: Redis endpoint address

    RedisPort:
        Type: String
        Description: Redis endpoint port

    CanonicalHostName:
        Type: String
        Description: canonical host name of the application, e.g. crowd-test.loc.gov

    DatabaseEndpoint:
        Type: String
        Description: Host name of the Postgres RDS service

    # --- Storage ----------------------------------------------------------
    S3BucketName:
        Type: String
        Description: name of the S3 bucket (public) where collection images will be stored

    ExportS3BucketName:
        Type: String
        Description: name of the S3 bucket (public) where exported transcriptions will be stored

    # --- Listener rule ----------------------------------------------------
    Priority:
        Type: Number
        Default: 100
        Description: Priority of the subdomain listener rule, must be unique in the set of listener rules

    # --- Ordering ---------------------------------------------------------
    # Not referenced by any resource visible in this template.
    DataLoadStackName:
        Type: String
        Description: Signal that the DataLoadHost UserData has completed

Resources:
    # CloudWatch log group named after the stack; entries are kept 30 days.
    ConcordiaAppLogsGroup:
        Type: AWS::Logs::LogGroup
        Properties:
            RetentionInDays: 30
            LogGroupName:
                Ref: AWS::StackName

    # IP-target group on HTTP port 80, health-checked via GET /healthz.
    ConcordiaExternalTargetGroup:
        Type: AWS::ElasticLoadBalancingV2::TargetGroup
        Properties:
            VpcId: !Ref VpcId
            TargetType: ip
            Protocol: HTTP
            Port: 80
            # Health check: every 30s, 5s timeout, 2 passes to become healthy,
            # 10 failures to become unhealthy.
            HealthCheckProtocol: HTTP
            HealthCheckPath: /healthz
            HealthCheckIntervalSeconds: 30
            HealthCheckTimeoutSeconds: 5
            HealthyThresholdCount: 2
            UnhealthyThresholdCount: 10

    # Host-header rule on a hard-coded listener ARN: requests whose Host
    # matches CanonicalHostName are forwarded to this stack's target group.
    SubdomainListenerRule:
        Type: AWS::ElasticLoadBalancingV2::ListenerRule
        Properties:
            ListenerArn: arn:aws:elasticloadbalancing:us-east-1:619333082511:listener/app/crowd-test/81e4820e354ea810/187fd94e534ad833
            Priority: !Ref Priority
            Conditions:
                - Field: host-header
                  Values:
                      - !Ref CanonicalHostName
            Actions:
                - Type: forward
                  TargetGroupArn: !Ref ConcordiaExternalTargetGroup

    # Fargate task definition (family crowd-<ConcordiaVersion>) made of three
    # containers:
    #   app        - web container, exposes port 80
    #   importer   - image concordia/importer
    #   celerybeat - image concordia/celerybeat
    # All three images are pulled from this account's ECR at tag ConcordiaVersion,
    # log to ConcordiaAppLogsGroup, and receive the same environment variables.
    ConcordiaTask:
        Type: AWS::ECS::TaskDefinition
        Properties:
            Family: !Sub crowd-${ConcordiaVersion}
            # Task-level sizing; the container Cpu values below
            # (2048 + 1024 + 1024) add up to this 4096.
            Cpu: '4096'
            Memory: '30720'
            NetworkMode: awsvpc
            RequiresCompatibilities:
                - FARGATE
            # Both roles point at a role referenced by name rather than one
            # created in this template.
            ExecutionRoleArn: !Sub 'arn:aws:iam::${AWS::AccountId}:role/ConcordiaServerTaskRole-crowd-test'
            TaskRoleArn: !Sub 'arn:aws:iam::${AWS::AccountId}:role/ConcordiaServerTaskRole-crowd-test'
            # Volume mounted by app and importer at /concordia_images.
            Volumes:
                - Name: images_volume
            ContainerDefinitions:
                # --- app: the container the load balancer targets (port 80) ---
                - Name: app
                  Cpu: 2048
                  Image: !Sub '${AWS::AccountId}.dkr.ecr.${AWS::Region}.amazonaws.com/concordia:${ConcordiaVersion}'
                  LogConfiguration:
                      LogDriver: awslogs
                      Options:
                          awslogs-group: !Ref 'ConcordiaAppLogsGroup'
                          awslogs-region: !Ref 'AWS::Region'
                          awslogs-stream-prefix: ConcordiaServer
                  Environment:
                      - Name: AWS
                        Value: '1'
                      - Name: ENV_NAME
                        Value: !Ref EnvName
                      - Name: CONCORDIA_ENVIRONMENT
                        Value: !Ref FullEnvironmentName
                      - Name: S3_BUCKET_NAME
                        Value: !Ref S3BucketName
                      - Name: EXPORT_S3_BUCKET_NAME
                        Value: !Ref ExportS3BucketName
                      # Redis database 0 on the endpoint passed in as parameters.
                      - Name: CELERY_BROKER_URL
                        Value: !Sub 'redis://${RedisAddress}:${RedisPort}/0'
                      - Name: AWS_DEFAULT_REGION
                        Value: !Ref AWS::Region
                      - Name: SENTRY_BACKEND_DSN
                        Value: https://6727341eabcd47e3a48ce300432e840b@errorlogging.loc.gov/5
                      - Name: SENTRY_FRONTEND_DSN
                        Value: https://77a13a941ffd485dbf41dbf8e7a0bdd0@errorlogging.loc.gov/4
                      - Name: REDIS_ADDRESS
                        Value: !Ref RedisAddress
                      - Name: REDIS_PORT
                        Value: !Ref RedisPort
                      - Name: POSTGRESQL_HOST
                        Value: !Ref DatabaseEndpoint
                      - Name: HOST_NAME
                        Value: !Ref CanonicalHostName
                      - Name: DJANGO_SETTINGS_MODULE
                        Value: concordia.settings_ecs
                  MountPoints:
                      - SourceVolume: images_volume
                        ContainerPath: /concordia_images
                  PortMappings:
                      - ContainerPort: 80
                # --- importer: same environment as app, no port mapping ---
                - Name: importer
                  Cpu: 1024
                  Image: !Sub '${AWS::AccountId}.dkr.ecr.${AWS::Region}.amazonaws.com/concordia/importer:${ConcordiaVersion}'
                  LogConfiguration:
                      LogDriver: awslogs
                      Options:
                          awslogs-group: !Ref 'ConcordiaAppLogsGroup'
                          awslogs-region: !Ref 'AWS::Region'
                          awslogs-stream-prefix: ConcordiaWorker
                  Environment:
                      - Name: AWS
                        Value: '1'
                      - Name: ENV_NAME
                        Value: !Ref EnvName
                      - Name: CONCORDIA_ENVIRONMENT
                        Value: !Ref FullEnvironmentName
                      - Name: S3_BUCKET_NAME
                        Value: !Ref S3BucketName
                      - Name: EXPORT_S3_BUCKET_NAME
                        Value: !Ref ExportS3BucketName
                      - Name: CELERY_BROKER_URL
                        Value: !Sub 'redis://${RedisAddress}:${RedisPort}/0'
                      - Name: AWS_DEFAULT_REGION
                        Value: !Ref AWS::Region
                      - Name: SENTRY_BACKEND_DSN
                        Value: https://6727341eabcd47e3a48ce300432e840b@errorlogging.loc.gov/5
                      - Name: SENTRY_FRONTEND_DSN
                        Value: https://77a13a941ffd485dbf41dbf8e7a0bdd0@errorlogging.loc.gov/4
                      - Name: REDIS_ADDRESS
                        Value: !Ref RedisAddress
                      - Name: REDIS_PORT
                        Value: !Ref RedisPort
                      - Name: POSTGRESQL_HOST
                        Value: !Ref DatabaseEndpoint
                      - Name: HOST_NAME
                        Value: !Ref CanonicalHostName
                      - Name: DJANGO_SETTINGS_MODULE
                        Value: concordia.settings_ecs
                  MountPoints:
                      - SourceVolume: images_volume
                        ContainerPath: /concordia_images
                # --- celerybeat: same environment; no mount points or ports.
                # Shares the ConcordiaWorker log stream prefix with importer.
                - Name: celerybeat
                  Cpu: 1024
                  Image: !Sub '${AWS::AccountId}.dkr.ecr.${AWS::Region}.amazonaws.com/concordia/celerybeat:${ConcordiaVersion}'
                  LogConfiguration:
                      LogDriver: awslogs
                      Options:
                          awslogs-group: !Ref 'ConcordiaAppLogsGroup'
                          awslogs-region: !Ref 'AWS::Region'
                          awslogs-stream-prefix: ConcordiaWorker
                  Environment:
                      - Name: AWS
                        Value: '1'
                      - Name: ENV_NAME
                        Value: !Ref EnvName
                      - Name: CONCORDIA_ENVIRONMENT
                        Value: !Ref FullEnvironmentName
                      - Name: S3_BUCKET_NAME
                        Value: !Ref S3BucketName
                      - Name: EXPORT_S3_BUCKET_NAME
                        Value: !Ref ExportS3BucketName
                      - Name: CELERY_BROKER_URL
                        Value: !Sub 'redis://${RedisAddress}:${RedisPort}/0'
                      - Name: AWS_DEFAULT_REGION
                        Value: !Ref AWS::Region
                      - Name: SENTRY_BACKEND_DSN
                        Value: https://6727341eabcd47e3a48ce300432e840b@errorlogging.loc.gov/5
                      - Name: SENTRY_FRONTEND_DSN
                        Value: https://77a13a941ffd485dbf41dbf8e7a0bdd0@errorlogging.loc.gov/4
                      - Name: REDIS_ADDRESS
                        Value: !Ref RedisAddress
                      - Name: REDIS_PORT
                        Value: !Ref RedisPort
                      - Name: POSTGRESQL_HOST
                        Value: !Ref DatabaseEndpoint
                      - Name: HOST_NAME
                        Value: !Ref CanonicalHostName
                      - Name: DJANGO_SETTINGS_MODULE
                        Value: concordia.settings_ecs

    # ECS service that runs the ConcordiaTask task definition on Fargate and
    # registers its 'app' container (port 80) with ConcordiaExternalTargetGroup.
    # NOTE(review): the cluster name and the subnet IDs below are hard-coded
    # rather than parameterized, so this service can only be deployed into the
    # account/VPC where those exact resources exist.
    ConcordiaExternalService:
        Type: AWS::ECS::Service
        Properties:
            Cluster: crowd-test
            LaunchType: FARGATE
            DeploymentConfiguration:
                # The circuit breaker is enabled but Rollback is off, so a failed
                # deployment is not automatically reverted.
                DeploymentCircuitBreaker:
                    Enable: true
                    Rollback: false
                MaximumPercent: 200
                MinimumHealthyPercent: 75
            DesiredCount: 1
            # Allows `aws ecs execute-command` sessions into running tasks.
            EnableExecuteCommand: true
            NetworkConfiguration:
                AwsvpcConfiguration:
                    SecurityGroups:
                        - !Ref SecurityGroup
                    Subnets:
                        - subnet-0aa55b322229b945a
                        - subnet-0f65558b319b2d4dc
            TaskDefinition: !Ref ConcordiaTask
            LoadBalancers:
                # ContainerName must match a container in ConcordiaTask.
                - ContainerName: 'app'
                  ContainerPort: 80
                  TargetGroupArn: !Ref ConcordiaExternalTargetGroup


================================================
FILE: cloudformation/infrastructure/jenkins-server.yaml
================================================
Description: This template deploys an Ubuntu jenkins server in the default VPC.

Resources:
    # Single EC2 instance that bootstraps a Jenkins server through UserData.
    # NOTE(review): the AMI, instance profile, security group and subnet are
    # hard-coded IDs/names, so this template only works in the account and
    # region where they exist.
    Jenkins:
        Type: AWS::EC2::Instance
        Properties:
            ImageId: 'ami-042e8287309f5df03'
            InstanceType: 't2.xlarge'
            IamInstanceProfile: 'concordia-jenkins-ec2-role'
            BlockDeviceMappings:
                # 128 GiB gp3 root volume, removed together with the instance.
                - DeviceName: /dev/sda1
                  Ebs:
                      VolumeSize: 128
                      VolumeType: gp3
                      DeleteOnTermination: true
            NetworkInterfaces:
                - AssociatePublicIpAddress: true
                  DeviceIndex: '0'
                  GroupSet:
                      - 'sg-02ff28781d04fd191'
                  SubnetId: 'subnet-3748107d'
            # Bootstrap script: registers the Jenkins and Docker apt repositories
            # (both over HTTPS), installs build dependencies, Docker, Java,
            # Jenkins, nginx and the AWS CLI, then lets the jenkins user run docker.
            # Only ${AWS::StackName} is substituted by !Sub; $(...) is left to bash.
            UserData:
                Fn::Base64: !Sub |
                    #!/bin/bash -xe
                    echo "Running userdata for ${AWS::StackName}"
                    wget -q -O - https://pkg.jenkins.io/debian/jenkins.io.key | apt-key add -
                    curl -fsSL https://download.docker.com/linux/ubuntu/gpg | apt-key add -
                    sh -c 'echo deb https://pkg.jenkins.io/debian-stable binary/ > /etc/apt/sources.list.d/jenkins.list'
                    add-apt-repository \
                      "deb [arch=amd64] https://download.docker.com/linux/ubuntu \
                      $(lsb_release -cs) \
                      stable"
                    apt-get update
                    apt-get install -qy -o Dpkg::Options::='--force-confnew' \
                      python3 python3-dev python3-venv python3-pip \
                      libtiff-dev libmemcached-dev libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev \
                      graphviz apt-transport-https libpq-dev \
                      ca-certificates \
                      curl \
                      gnupg-agent \
                      software-properties-common \
                      docker-ce docker-ce-cli containerd.io \
                      openjdk-8-jdk jenkins \
                      nginx awscli
                    usermod -aG docker jenkins
                    snap install postgresql12
                    pip3 install awscli --upgrade
            Tags:
                - Key: Name
                  Value: Jenkins
                - Key: Environment
                  Value: dev


================================================
FILE: cloudformation/infrastructure/network-acl.yaml
================================================
Description: >
    This template contains the network ACL, its entries and the subnet
    associations required by our entire stack. We create them in a separate
    nested template, so they can be managed apart from the other nested templates.

# Inputs: the environment name (used for the Name tag), the VPC that owns the
# network ACL, and the four subnets the ACL is associated with.
Parameters:
    EnvironmentName:
        Description: An environment name that will be prefixed to resource names
        Type: String

    VPC:
        Type: AWS::EC2::VPC::Id
        Description: Choose which VPC the network ACL should be deployed to

    PublicSubnet1:
        Description: A reference to the public subnet in the 1st Availability Zone
        Type: AWS::EC2::Subnet::Id

    PublicSubnet2:
        Description: A reference to the public subnet in the 2nd Availability Zone
        Type: AWS::EC2::Subnet::Id

    PrivateSubnet1:
        Description: A reference to the private subnet in the 1st Availability Zone
        Type: AWS::EC2::Subnet::Id

    PrivateSubnet2:
        Description: A reference to the private subnet in the 2nd Availability Zone
        Type: AWS::EC2::Subnet::Id

Resources:
    # The network ACL itself; rules and subnet associations attach to it below.
    # Retained when the stack is deleted or the resource is replaced.
    NetworkAcl:
        Type: AWS::EC2::NetworkAcl
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            Tags:
                - Key: Name
                  Value: !Ref EnvironmentName

    # TODO: Update these ACLs to the latest OCIO standard ones
    # NOTE: These rules are for dev / test / stage only

    # Egress rule 100: allow all outbound traffic, any protocol, to anywhere.
    acl4:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            Egress: true
            RuleNumber: 100
            RuleAction: allow
            Protocol: -1
            CidrBlock: 0.0.0.0/0
    # Rule 10: deny all traffic from the single host 140.147.236.152.
    # No Egress key is set, so this applies to inbound traffic.
    acl5:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 10
            RuleAction: deny
            Protocol: -1
            CidrBlock: 140.147.236.152/32
    # Rule 11: deny all traffic from the single host 140.147.236.214.
    # No Egress key is set, so this applies to inbound traffic.
    acl6:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 11
            RuleAction: deny
            Protocol: -1
            CidrBlock: 140.147.236.214/32
    # Rule 12: deny all traffic from the single host 140.147.236.213.
    # No Egress key is set, so this applies to inbound traffic.
    acl6b:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 12
            RuleAction: deny
            Protocol: -1
            CidrBlock: 140.147.236.213/32
    # Inbound rule 100: allow SSH (TCP port 22) from 140.147.0.0/16.
    # Shares number 100 with acl4, which is an egress rule.
    acl7:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 100
            RuleAction: allow
            Protocol: 6
            CidrBlock: 140.147.0.0/16
            PortRange:
                From: 22
                To: 22
    # Inbound rule 110: allow TCP ports 1024-65535 from anywhere.
    acl8:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 110
            RuleAction: allow
            Protocol: 6
            CidrBlock: 0.0.0.0/0
            PortRange:
                From: 1024
                To: 65535
    # Inbound rule 200: allow HTTP (TCP port 80) from anywhere.
    acl9:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 200
            RuleAction: allow
            Protocol: 6
            CidrBlock: 0.0.0.0/0
            PortRange:
                From: 80
                To: 80
    # Inbound rule 210: allow HTTPS (TCP port 443) from anywhere.
    acl10:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 210
            RuleAction: allow
            Protocol: 6
            CidrBlock: 0.0.0.0/0
            PortRange:
                From: 443
                To: 443

    # Inbound rule 300: allow all traffic, any protocol, from anywhere.
    # NOTE(review): as the highest-numbered allow, this catch-all admits
    # everything not denied by rules 10-12, which makes the narrower allow
    # rules 100-210 redundant - confirm that is intended.
    acl11:
        Type: AWS::EC2::NetworkAclEntry
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            NetworkAclId: !Ref NetworkAcl
            RuleNumber: 300
            RuleAction: allow
            Protocol: -1
            CidrBlock: 0.0.0.0/0

    # Attaches the network ACL to the private subnet in the 1st AZ.
    subnetacl5:
        Type: AWS::EC2::SubnetNetworkAclAssociation
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            SubnetId: !Ref PrivateSubnet1
            NetworkAclId: !Ref NetworkAcl

    # Attaches the network ACL to the private subnet in the 2nd AZ.
    subnetacl6:
        Type: AWS::EC2::SubnetNetworkAclAssociation
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            SubnetId: !Ref PrivateSubnet2
            NetworkAclId: !Ref NetworkAcl

    # Attaches the network ACL to the public subnet in the 1st AZ.
    subnetacl7:
        Type: AWS::EC2::SubnetNetworkAclAssociation
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            SubnetId: !Ref PublicSubnet1
            NetworkAclId: !Ref NetworkAcl

    # Attaches the network ACL to the public subnet in the 2nd AZ.
    subnetacl8:
        Type: AWS::EC2::SubnetNetworkAclAssociation
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            SubnetId: !Ref PublicSubnet2
            NetworkAclId: !Ref NetworkAcl


================================================
FILE: cloudformation/infrastructure/opensearch.yaml
================================================
Description: >
    This template deploys a VPC-based OpenSearch cluster.

# Inputs for the OpenSearch domain: target environment plus the security group
# and the single private subnet that ESCluster's VPCOptions attach to.
Parameters:
    # Used for the Environment tag and the domain name in the access-policy ARN.
    EnvName:
        Type: String
        Description: which environment to target
        AllowedValues:
            - 'dev'
            - 'test'
            - 'stage'
            - 'prod'
        ConstraintDescription: Must match a location for secret storage in secretsmanager

    # NOTE(review): the description mentions ECS hosts, but in this template the
    # group is attached to the OpenSearch domain (VPCOptions.SecurityGroupIds).
    SecurityGroup:
        Description: Select the Security Group to use for the ECS cluster hosts
        Type: AWS::EC2::SecurityGroup::Id

    PrivateSubnet2:
        Description: The private subnet in AZ2 for the VPC
        Type: AWS::EC2::Subnet::Id

Resources:
    # Single-node OpenSearch domain attached to one private subnet and one
    # security group (see VPCOptions).
    ESCluster:
        Type: AWS::OpenSearchService::Domain
        Properties:
            ClusterConfig:
                InstanceCount: 1
                ZoneAwarenessEnabled: false
                InstanceType: 'm7g.xlarge.search'
            # AWS::OpenSearchService::Domain requires the engine-prefixed form
            # (OpenSearch_X.Y / Elasticsearch_X.Y); a bare '1.3' is rejected.
            EngineVersion: 'OpenSearch_1.3'
            EBSOptions:
                EBSEnabled: true
                Iops: 0
                VolumeSize: 30
                VolumeType: 'gp3'
            SnapshotOptions:
                AutomatedSnapshotStartHour: 0
            # The resource policy allows every principal and every es:* action on
            # the domain. NOTE(review): this presumably relies on the VPC
            # placement and security group for access control - confirm.
            # No DomainName is set in this resource; the ARN assumes the domain
            # is named crowd-<EnvName>-vpc.
            AccessPolicies:
                Version: '2012-10-17'
                Statement:
                    - Effect: 'Allow'
                      Principal:
                          AWS: '*'
                      Action: 'es:*'
                      # Region and account come from pseudo parameters instead of
                      # being hard-coded, so the ARN follows the deploying stack.
                      Resource: !Sub 'arn:aws:es:${AWS::Region}:${AWS::AccountId}:domain/crowd-${EnvName}-vpc/*'
            AdvancedOptions:
                rest.action.multi.allow_explicit_index: 'true'
            Tags:
                - Key: Environment
                  Value: !Ref EnvName
            VPCOptions:
                SubnetIds:
                    - Ref: PrivateSubnet2
                SecurityGroupIds:
                    - Ref: SecurityGroup


================================================
FILE: cloudformation/infrastructure/rds.yaml
================================================
AWSTemplateFormatVersion: '2010-09-09'
# Inputs for the PostgreSQL instance: the security group and two private
# subnets it lives in, plus the master credentials.
Parameters:
    DatabaseSecurityGroup:
        Description: Sets the security group to use for RDS database access
        Type: AWS::EC2::SecurityGroup::Id

    PrivateSubnet1:
        Description: A reference to the private subnet in the 1st Availability Zone
        Type: AWS::EC2::Subnet::Id

    PrivateSubnet2:
        Description: A reference to the private subnet in the 2nd Availability Zone
        Type: AWS::EC2::Subnet::Id

    # NoEcho masks the value in CloudFormation console/API output.
    DbUsername:
        Description: The username to use for the database
        Type: String
        NoEcho: true

    # NoEcho masks the value in CloudFormation console/API output.
    DbPassword:
        Description: The password to use for the database
        Type: String
        NoEcho: true

Resources:
    # DB subnet group spanning both private subnets; PostgresService is placed
    # in it. Retained on stack deletion or replacement.
    PostgresSubnetGroup:
        Type: AWS::RDS::DBSubnetGroup
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            DBSubnetGroupDescription: Created from the RDS Management Console
            SubnetIds:
                - !Ref PrivateSubnet1
                - !Ref PrivateSubnet2

    # The PostgreSQL RDS instance backing the application ("concordia" database).
    # Retain policies keep the instance if the stack is deleted or the resource
    # would be replaced.
    PostgresService:
        UpdateReplacePolicy: Retain
        Type: AWS::RDS::DBInstance
        DeletionPolicy: Retain
        Properties:
            AllocatedStorage: '20'
            # Minor versions are upgraded automatically; major upgrades are blocked.
            AllowMajorVersionUpgrade: false
            AutoMinorVersionUpgrade: true
            DBInstanceClass: db.t4g.medium
            Port: '5432'
            PubliclyAccessible: false
            StorageType: gp3
            StorageEncrypted: True
            # Automated backups are kept for 31 days.
            BackupRetentionPeriod: 31
            MasterUsername: !Ref DbUsername
            MasterUserPassword: !Ref DbPassword
            PreferredBackupWindow: 03:47-04:17
            PreferredMaintenanceWindow: tue:03:14-tue:03:44
            DBName: concordia
            Engine: postgres
            EngineVersion: '15.5'
            LicenseModel: postgresql-license
            DBSubnetGroupName:
                Ref: PostgresSubnetGroup
            VPCSecurityGroups:
                - Ref: DatabaseSecurityGroup
            Tags:
                - Key: workload-type
                  Value: other

# Exposes the instance's endpoint address so a parent stack can read it.
Outputs:
    DatabaseHostName:
        Description: 'Hostname for the relational database service'
        Value: !GetAtt PostgresService.Endpoint.Address


================================================
FILE: cloudformation/infrastructure/search-proxy-task.yaml
================================================
Description: >
    This template deploys an opensearch dashboard proxy server to the specified VPC

# Inputs for the dashboard proxy: the VPC for the target group, the environment
# key used for every EnvironmentMapping lookup, and the listener-rule priority.
Parameters:
    VpcId:
        Description: The Id of the VPC for this cluster
        Type: AWS::EC2::VPC::Id

    # Selects the per-environment values in EnvironmentMapping and is
    # interpolated into the ECS cluster name and task family.
    EnvName:
        Type: String
        Description: which environment to target
        AllowedValues:
            - 'dev'
            - 'test'
            - 'stage'
            - 'prod'
        ConstraintDescription: Must match a location for secret storage in secretsmanager

    Priority:
        Type: Number
        Description: Priority of the subdomain listener rule, must be unique in the set of listener rules
        Default: 100

# Per-environment lookup tables, keyed by EnvName (dev/test/stage/prod).
# All values are hard-coded identifiers of existing resources; they are not
# created by this template.
Mappings:
    EnvironmentMapping:
        # Load balancer listener that SubdomainListenerRule is attached to.
        ListenerArn:
            dev: 'arn:aws:elasticloadbalancing:us-east-1:619333082511:listener/app/crowd-dev/112d22a79e25de0b/8bb4cb9c8b054e91'
            test: 'arn:aws:elasticloadbalancing:us-east-1:619333082511:listener/app/crowd-test/81e4820e354ea810/187fd94e534ad833'
            stage: 'arn:aws:elasticloadbalancing:us-east-1:619333082511:listener/app/crowd-stage/7d954bca84b62358/ab34414a68f355f2'
            prod: 'arn:aws:elasticloadbalancing:us-east-1:619333082511:listener/app/crowd-prod/746d0ae14ecc23e4/747212dd4e5706be'

        # IAM role assumed by the proxy task (DashboardTask.TaskRoleArn).
        TaskRoleArn:
            dev: 'arn:aws:iam::619333082511:role/ConcordiaServerTaskRole-crowd-dev'
            test: 'arn:aws:iam::619333082511:role/ConcordiaServerTaskRole-crowd-test'
            stage: 'arn:aws:iam::619333082511:role/ConcordiaServerTaskRole-crowd-stage'
            prod: 'arn:aws:iam::619333082511:role/ConcordiaServerTaskRole-crowd-prod'

        # The ID of a private subnet
        # Type: AWS::EC2::Subnet::Id
        PrivateSubnet1:
            dev: subnet-0c95a830ce007fa65
            test: subnet-0aa55b322229b945a
            stage: subnet-0f7c7d66b66d6dd90
            prod: subnet-0da84976b66c32ce4

        # Full https:// URL of the OpenSearch domain; DashboardTask strips the
        # scheme to obtain the bare host name for the proxy's command line.
        OpensearchEndpoint:
            dev: 'https://vpc-crowd-dev-vpc-6xqqrxn5naqkvtdl6r6uanlhbe.us-east-1.es.amazonaws.com'
            test: 'https://vpc-crowd-test-vpc-63g3ylzduyzywhqbsqotnnm7ke.us-east-1.es.amazonaws.com'
            stage: 'https://vpc-crowd-stage-vpc-x5lgoj5yo76dvrxpfhmusss2b4.us-east-1.es.amazonaws.com'
            prod: 'https://vpc-crowd-prod-vpc-zl5xdhmtpr7squr6mtl7znqyqa.us-east-1.es.amazonaws.com'

        # The security group
        # Type: AWS::EC2::SecurityGroup::Id
        SecurityGroup:
            dev: sg-0ceb6b1dc0de899b3
            test: sg-09bc01194e6c52cb9
            stage: sg-0f6145067777b1cc3
            prod: sg-031594e2cfc8b25c7

Resources:
    # CloudWatch log group for the proxy container, named after the stack;
    # log events expire after 30 days.
    DashboardLogsGroup:
        Type: AWS::Logs::LogGroup
        Properties:
            RetentionInDays: 30
            LogGroupName: !Ref AWS::StackName

    # Target group (IP targets, HTTP/80) that the listener rule forwards
    # dashboard traffic to; DashboardService registers its tasks here.
    DashboardTargetGroup:
        Type: AWS::ElasticLoadBalancingV2::TargetGroup
        Properties:
            HealthCheckIntervalSeconds: 30
            HealthCheckPath: /
            HealthCheckProtocol: HTTP
            HealthCheckTimeoutSeconds: 5
            HealthyThresholdCount: 2
            UnhealthyThresholdCount: 10
            TargetType: ip
            Port: 80
            Protocol: HTTP
            VpcId: !Ref VpcId
            Matcher:
                # Both 200 and 301 responses count as a healthy check.
                HttpCode: '200,301'
            Tags:
                - Key: Project
                  Value: Concordia
                - Key: Department
                  Value: OCIO
                - Key: ArcherID
                  Value: LIB-361
                # NOTE(review): still hard-coded; test/stage/prod stacks are
                # tagged "Development" too. Needs an EnvName -> label mapping.
                - Key: Environment
                  Value: Development
                # Derived from EnvName so non-dev stacks are no longer tagged
                # as crowd-dev-searchproxy (value for dev is unchanged).
                - Key: StackManaged
                  Value: !Sub 'crowd-${EnvName}-searchproxy'

    # Listener rule on the environment's load balancer listener: requests whose
    # path matches /_dashboards* are forwarded to DashboardTargetGroup.
    # Despite the resource name, the condition is a path pattern, not a host.
    SubdomainListenerRule:
        Type: AWS::ElasticLoadBalancingV2::ListenerRule
        Properties:
            ListenerArn: !FindInMap [EnvironmentMapping, ListenerArn, !Ref EnvName]
            Priority: !Ref Priority
            Conditions:
                - Field: path-pattern
                  Values:
                      - '/_dashboards*'
            Actions:
                - Type: forward
                  TargetGroupArn: !Ref DashboardTargetGroup

    # Fargate task definition running the aws-sigv4-proxy container, which
    # listens on port 80 and is pointed at the environment's OpenSearch endpoint.
    DashboardTask:
        Type: AWS::ECS::TaskDefinition
        Properties:
            Family: !Sub crowd-${EnvName}-searchproxy
            Cpu: '256'
            Memory: '512'
            NetworkMode: awsvpc
            RequiresCompatibilities:
                - FARGATE
            ExecutionRoleArn: !Sub 'arn:aws:iam::${AWS::AccountId}:role/ecsTaskExecutionRole'
            TaskRoleArn:
                Fn::FindInMap:
                    - EnvironmentMapping
                    - TaskRoleArn
                    - Ref: EnvName
            ContainerDefinitions:
                - Name: sigv4proxy
                  Image: public.ecr.aws/aws-observability/aws-sigv4-proxy:1.10
                  Cpu: 256
                  Memory: 512
                  Essential: true
                  PortMappings:
                      - ContainerPort: 80
                        Protocol: tcp
                  LogConfiguration:
                      LogDriver: awslogs
                      Options:
                          awslogs-group: !Ref 'DashboardLogsGroup'
                          awslogs-region: !Ref 'AWS::Region'
                          awslogs-stream-prefix: ConcordiaDashboardProxy
                  Environment:
                      - Name: OPENSEARCH_ENDPOINT
                        Value:
                            Fn::FindInMap:
                                - EnvironmentMapping
                                - OpensearchEndpoint
                                - Ref: EnvName
                  # Proxy arguments. --host and --sign-host both receive the
                  # endpoint with its "https://" scheme removed: Split on '://'
                  # and take element 1 (the host part).
                  Command:
                      - --name
                      - es
                      - --region
                      - !Ref AWS::Region
                      - --host
                      - !Select
                        - 1
                        - !Split
                          - '://'
                          - !FindInMap [
                                EnvironmentMapping,
                                OpensearchEndpoint,
                                !Ref EnvName,
                            ]
                      - --port
                      - '0.0.0.0:80'
                      - --sign-host
                      - !Select
                        - 1
                        - !Split
                          - '://'
                          - !FindInMap [
                                EnvironmentMapping,
                                OpensearchEndpoint,
                                !Ref EnvName,
                            ]
                      # NOTE(review): per its name this flag turns off TLS
                      # certificate verification towards the upstream - confirm
                      # it is still required.
                      - --no-verify-ssl
            Tags:
                - Key: Project
                  Value: Concordia
                - Key: Department
                  Value: OCIO
                - Key: ArcherID
                  Value: LIB-361
                # NOTE(review): still hard-coded; test/stage/prod stacks are
                # tagged "Development" too. Needs an EnvName -> label mapping.
                - Key: Environment
                  Value: Development
                # Derived from EnvName so non-dev stacks are no longer tagged
                # as crowd-dev-searchproxy (value for dev is unchanged).
                - Key: StackManaged
                  Value: !Sub 'crowd-${EnvName}-searchproxy'

    # ECS Fargate service that keeps one proxy task running in the
    # crowd-<EnvName> cluster and registers it with DashboardTargetGroup.
    DashboardService:
        Type: AWS::ECS::Service
        Properties:
            Cluster: !Sub crowd-${EnvName}
            LaunchType: FARGATE
            DeploymentConfiguration:
                MaximumPercent: 200
                MinimumHealthyPercent: 100
            DesiredCount: 1
            NetworkConfiguration:
                AwsvpcConfiguration:
                    SecurityGroups:
                        - Fn::FindInMap:
                              - EnvironmentMapping
                              - SecurityGroup
                              - Ref: EnvName
                    # Only one subnet is configured for the service's tasks.
                    Subnets:
                        - Fn::FindInMap:
                              - EnvironmentMapping
                              - PrivateSubnet1
                              - Ref: EnvName
            TaskDefinition: !Ref DashboardTask
            LoadBalancers:
                # ContainerName must match the container in DashboardTask.
                - ContainerName: 'sigv4proxy'
                  ContainerPort: 80
                  TargetGroupArn: !Ref DashboardTargetGroup
            EnableExecuteCommand: true
            Tags:
                - Key: Project
                  Value: Concordia
                - Key: Department
                  Value: OCIO
                - Key: ArcherID
                  Value: LIB-361
                # NOTE(review): still hard-coded; test/stage/prod stacks are
                # tagged "Development" too. Needs an EnvName -> label mapping.
                - Key: Environment
                  Value: Development
                # Derived from EnvName so non-dev stacks are no longer tagged
                # as crowd-dev-searchproxy (value for dev is unchanged).
                - Key: StackManaged
                  Value: !Sub 'crowd-${EnvName}-searchproxy'


================================================
FILE: cloudformation/infrastructure/security-groups.yaml
================================================
Description: >
    This template contains the security groups required by our entire stack.
    We create them in a separate nested template, so they can be referenced
    by all of the other nested templates.

# Inputs: the environment name (prefix of the Name tags) and the VPC in which
# every security group below is created.
Parameters:
    EnvironmentName:
        Description: An environment name that will be prefixed to resource names
        Type: String

    VPC:
        Type: AWS::EC2::VPC::Id
        Description: Choose which VPC the security groups should be deployed to

Resources:
    # This security group defines who/where is allowed to access the ECS hosts directly.
    # Two sources are allowed: any traffic from the load balancer security group, and
    # SSH (tcp/22) from the bastion host security group. If you want to expose
    # non-load balanced services you can open their ports here.
    ECSHostSecurityGroup:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SecurityGroup
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            GroupDescription: Access to the ECS hosts and the tasks/containers that run on them
            SecurityGroupIngress:
                # IpProtocol '-1' means all protocols and ports.
                - Description: 'Open access to container hosts from the load balancer'
                  SourceSecurityGroupId: !Ref LoadBalancerSecurityGroup
                  IpProtocol: '-1'
                - Description: 'SSH access to container hosts from bastion hosts'
                  SourceSecurityGroupId: !Ref BastionHostSecurityGroup
                  IpProtocol: tcp
                  FromPort: 22
                  ToPort: 22
            # Unrestricted outbound traffic, declared explicitly.
            SecurityGroupEgress:
                - Description: 'Explicit outbound access'
                  IpProtocol: '-1'
                  CidrIp: 0.0.0.0/0

            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName}-ECS-Hosts

    # Security group for the load balancer in front of ECS: HTTP and HTTPS are
    # accepted from 140.147.0.0/16 only; outbound traffic is unrestricted.
    LoadBalancerSecurityGroup:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SecurityGroup
        # Suppresses cfn_nag warning W9 for the /16 ingress CIDR used below.
        Metadata:
            cfn_nag:
                rules_to_suppress:
                    - id: W9
                      reason: 'The CIDR block should only allow 140.147.*.* IPs so it should end in /16'
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            GroupDescription: Access to the load balancer that sits in front of ECS
            SecurityGroupIngress:
                - Description: 'Allow HTTP access from the LC network to our ECS services'
                  CidrIp: 140.147.0.0/16
                  IpProtocol: tcp
                  FromPort: 80
                  ToPort: 80
                - Description: 'Allow HTTPS access from the LC network to our ECS services'
                  CidrIp: 140.147.0.0/16
                  IpProtocol: tcp
                  FromPort: 443
                  ToPort: 443
            SecurityGroupEgress:
                - Description: 'Explicit outbound access'
                  IpProtocol: '-1'
                  CidrIp: 0.0.0.0/0
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName}-LoadBalancers
                # NOTE(review): presumably a marker read by external tooling
                # (e.g. cloudformation/add_cloudflare_ips_to_sgs.py) to add
                # Cloudflare ingress rules - confirm against that script.
                - Key: AllowCloudFlareIngress
                  Value: 'true'

    # Security group for the RDS Postgres database: inbound tcp/5432 is allowed
    # only from members of ECSHostSecurityGroup; outbound is unrestricted.
    # Unlike the ECS, load balancer and bastion groups, this one has no Name tag.
    DatabaseSecurityGroup:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SecurityGroup
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            GroupDescription: Access to the RDS Postgres database
            SecurityGroupIngress:
                - Description: 'Postgresql access to RDS from container hosts'
                  SourceSecurityGroupId: !Ref ECSHostSecurityGroup
                  IpProtocol: tcp
                  FromPort: 5432
                  ToPort: 5432
            SecurityGroupEgress:
                - Description: 'Explicit outbound access'
                  IpProtocol: '-1'
                  CidrIp: 0.0.0.0/0

    # Security group for bastion hosts: inbound SSH (tcp/22) from 140.147.0.0/16
    # only; outbound is unrestricted. ECSHostSecurityGroup in turn accepts SSH
    # from members of this group.
    BastionHostSecurityGroup:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SecurityGroup
        # Suppresses cfn_nag warning W9 for the /16 ingress CIDR used below.
        Metadata:
            cfn_nag:
                rules_to_suppress:
                    - id: W9
                      reason: 'The CIDR block should only allow 140.147.*.* IPs so it should end in /16'
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            GroupDescription: Bastion hosts for ECS access
            SecurityGroupIngress:
                - Description: 'SSH access from LC network to bastion hosts'
                  CidrIp: 140.147.0.0/16
                  IpProtocol: tcp
                  FromPort: 22
                  ToPort: 22
            SecurityGroupEgress:
                - Description: 'Explicit outbound access'
                  IpProtocol: '-1'
                  CidrIp: 0.0.0.0/0
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName}-BastionHosts

    # Security group for the cache service: inbound Redis (tcp/6379) is allowed
    # only from members of ECSHostSecurityGroup; outbound is unrestricted.
    CacheServiceSecurityGroup:
        Type: AWS::EC2::SecurityGroup
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            GroupDescription: Access to cache services for ECS hosts
            VpcId: !Ref VPC
            SecurityGroupIngress:
                - Description: 'Redis service access from container hosts'
                  IpProtocol: tcp
                  FromPort: 6379
                  ToPort: 6379
                  SourceSecurityGroupId: !Ref ECSHostSecurityGroup
            SecurityGroupEgress:
                - Description: 'Explicit outbound access'
                  IpProtocol: '-1'
                  CidrIp: 0.0.0.0/0

# Each output returns the !Ref of one security group defined above so that the
# parent stack can pass it on to the other nested templates.
Outputs:
    ECSHostSecurityGroup:
        Description: A reference to the security group for ECS hosts
        Value: !Ref ECSHostSecurityGroup

    LoadBalancerSecurityGroup:
        Description: A reference to the security group for load balancers
        Value: !Ref LoadBalancerSecurityGroup

    DatabaseSecurityGroup:
        Description: A reference to the security group for RDS
        Value: !Ref DatabaseSecurityGroup

    BastionHostSecurityGroup:
        Description: A reference to the security group for bastion hosts
        Value: !Ref BastionHostSecurityGroup

    CacheServiceSecurityGroup:
        Description: A reference to the security group for cache services
        Value: !Ref CacheServiceSecurityGroup


================================================
FILE: cloudformation/infrastructure/vpc.yaml
================================================
Description: >
    This template deploys a VPC, with a pair of public and private subnets spread
    across two Availability Zones. It deploys an Internet Gateway, with a default
    route on the public subnets. It deploys a pair of NAT Gateways (one in each AZ),
    and default routes for them in the private subnets.

# Inputs for the VPC layout. Every *CIDR parameter shares the same
# AllowedPattern: four dot-separated octets (0-255) followed by a /0-/32 prefix.
Parameters:
    EnvironmentName:
        Description: An environment name that will be prefixed to resource names
        Type: String

    VpcCIDR:
        Description: Please enter the IP range (CIDR notation) for this VPC
        Type: String
        Default: 10.192.0.0/16
        AllowedPattern: '^(([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.){3}([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])(\/([0-9]|[1-2][0-9]|3[0-2]))$'

    PublicSubnet1CIDR:
        Description: Please enter the IP range (CIDR notation) for the public subnet in the first Availability Zone
        Type: String
        Default: 10.192.10.0/24
        AllowedPattern: '^(([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.){3}([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])(\/([0-9]|[1-2][0-9]|3[0-2]))$'

    PublicSubnet2CIDR:
        Description: Please enter the IP range (CIDR notation) for the public subnet in the second Availability Zone
        Type: String
        Default: 10.192.11.0/24
        AllowedPattern: '^(([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.){3}([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])(\/([0-9]|[1-2][0-9]|3[0-2]))$'

    PrivateSubnet1CIDR:
        Description: Please enter the IP range (CIDR notation) for the private subnet in the first Availability Zone
        Type: String
        Default: 10.192.20.0/24
        AllowedPattern: '^(([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.){3}([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])(\/([0-9]|[1-2][0-9]|3[0-2]))$'

    PrivateSubnet2CIDR:
        Description: Please enter the IP range (CIDR notation) for the private subnet in the second Availability Zone
        Type: String
        Default: 10.192.21.0/24
        AllowedPattern: '^(([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.){3}([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])(\/([0-9]|[1-2][0-9]|3[0-2]))$'

    # Zero-based index into the region's AZ list (!GetAZs ''), used by the
    # subnet resources via !Select.
    AvailabilityZone1:
        Description: The index of the availability zone for private and public subnet 1
        Type: Number
        Default: 0

    # Zero-based index into the region's AZ list (!GetAZs ''), used by the
    # subnet resources via !Select.
    AvailabilityZone2:
        Description: The index of availability zone for private and public subnet 2
        Type: Number
        Default: 1

Resources:
    # The VPC itself, sized by VpcCIDR, with DNS resolution and DNS hostnames
    # enabled. Retained on stack deletion or replacement.
    VPC:
        Type: AWS::EC2::VPC
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            CidrBlock: !Ref VpcCIDR
            EnableDnsSupport: true
            EnableDnsHostnames: true
            InstanceTenancy: default
            Tags:
                - Key: Name
                  Value: !Ref EnvironmentName

    # Internet gateway, attached to the VPC by InternetGatewayAttachment.
    InternetGateway:
        Type: AWS::EC2::InternetGateway
        UpdateReplacePolicy: Retain
        DeletionPolicy: Retain
        Properties:
            Tags:
                - Key: Name
                  Value: !Ref EnvironmentName

    InternetGatewayAttachment:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::VPCGatewayAttachment
        DeletionPolicy: Retain
        Properties:
            InternetGatewayId: !Ref InternetGateway
            VpcId: !Ref VPC

    # Public subnets: instances launched here receive a public IP
    # (MapPublicIpOnLaunch: true). The cfn_nag W33 suppression records that
    # this is intentional.
    PublicSubnet1:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::Subnet
        Metadata:
            cfn_nag:
                rules_to_suppress:
                    - id: W33
                      reason: "It's a public subnet"
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            # Zone chosen by index from the region's availability zone list.
            AvailabilityZone: !Select [!Ref AvailabilityZone1, !GetAZs '']
            CidrBlock: !Ref PublicSubnet1CIDR
            MapPublicIpOnLaunch: true
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName} Public Subnet (AZ1)

    PublicSubnet2:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::Subnet
        Metadata:
            cfn_nag:
                rules_to_suppress:
                    - id: W33
                      reason: "It's a public subnet"
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            AvailabilityZone: !Select [!Ref AvailabilityZone2, !GetAZs '']
            CidrBlock: !Ref PublicSubnet2CIDR
            MapPublicIpOnLaunch: true
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName} Public Subnet (AZ2)

    # Private subnets: same zones as the matching public subnets, but no
    # public IP is assigned on launch.
    PrivateSubnet1:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::Subnet
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            AvailabilityZone: !Select [!Ref AvailabilityZone1, !GetAZs '']
            CidrBlock: !Ref PrivateSubnet1CIDR
            MapPublicIpOnLaunch: false
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName} Private Subnet (AZ1)

    PrivateSubnet2:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::Subnet
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            AvailabilityZone: !Select [!Ref AvailabilityZone2, !GetAZs '']
            CidrBlock: !Ref PrivateSubnet2CIDR
            MapPublicIpOnLaunch: false
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName} Private Subnet (AZ2)

    # Elastic IPs for the NAT gateways. They wait for the internet gateway
    # attachment before being created.
    NatGateway1EIP:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::EIP
        DependsOn: InternetGatewayAttachment
        DeletionPolicy: Retain
        Properties:
            Domain: vpc

    NatGateway2EIP:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::EIP
        DependsOn: InternetGatewayAttachment
        DeletionPolicy: Retain
        Properties:
            Domain: vpc

    # One NAT gateway per public subnet, each bound to its own Elastic IP.
    # The private route tables send their default route through these.
    NatGateway1:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::NatGateway
        DeletionPolicy: Retain
        Properties:
            AllocationId: !GetAtt NatGateway1EIP.AllocationId
            SubnetId: !Ref PublicSubnet1

    NatGateway2:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::NatGateway
        DeletionPolicy: Retain
        Properties:
            AllocationId: !GetAtt NatGateway2EIP.AllocationId
            SubnetId: !Ref PublicSubnet2

    # A single route table shared by both public subnets.
    PublicRouteTable:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::RouteTable
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName} Public Routes

    # Default route (0.0.0.0/0) of the public route table goes to the
    # internet gateway; created only after the gateway is attached to the VPC.
    DefaultPublicRoute:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::Route
        DependsOn: InternetGatewayAttachment
        DeletionPolicy: Retain
        Properties:
            RouteTableId: !Ref PublicRouteTable
            DestinationCidrBlock: 0.0.0.0/0
            GatewayId: !Ref InternetGateway

    # Associate both public subnets with the shared public route table.
    PublicSubnet1RouteTableAssociation:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SubnetRouteTableAssociation
        DeletionPolicy: Retain
        Properties:
            RouteTableId: !Ref PublicRouteTable
            SubnetId: !Ref PublicSubnet1

    PublicSubnet2RouteTableAssociation:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SubnetRouteTableAssociation
        DeletionPolicy: Retain
        Properties:
            RouteTableId: !Ref PublicRouteTable
            SubnetId: !Ref PublicSubnet2

    # Each private subnet has its own route table whose default route goes
    # through the NAT gateway with the matching number.
    PrivateRouteTable1:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::RouteTable
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName} Private Routes (AZ1)

    # Default route (0.0.0.0/0) for private subnet 1 via NatGateway1.
    DefaultPrivateRoute1:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::Route
        DeletionPolicy: Retain
        Properties:
            RouteTableId: !Ref PrivateRouteTable1
            DestinationCidrBlock: 0.0.0.0/0
            NatGatewayId: !Ref NatGateway1

    PrivateSubnet1RouteTableAssociation:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SubnetRouteTableAssociation
        DeletionPolicy: Retain
        Properties:
            RouteTableId: !Ref PrivateRouteTable1
            SubnetId: !Ref PrivateSubnet1

    PrivateRouteTable2:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::RouteTable
        DeletionPolicy: Retain
        Properties:
            VpcId: !Ref VPC
            Tags:
                - Key: Name
                  Value: !Sub ${EnvironmentName} Private Routes (AZ2)

    # Default route (0.0.0.0/0) for private subnet 2 via NatGateway2.
    DefaultPrivateRoute2:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::Route
        DeletionPolicy: Retain
        Properties:
            RouteTableId: !Ref PrivateRouteTable2
            DestinationCidrBlock: 0.0.0.0/0
            NatGatewayId: !Ref NatGateway2

    PrivateSubnet2RouteTableAssociation:
        UpdateReplacePolicy: Retain
        Type: AWS::EC2::SubnetRouteTableAssociation
        DeletionPolicy: Retain
        Properties:
            RouteTableId: !Ref PrivateRouteTable2
            SubnetId: !Ref PrivateSubnet2

# Values exposed to a parent stack. master.yaml reads them with
# `!GetAtt VPC.Outputs.<name>` and passes them to the other nested stacks.
Outputs:
    VPC:
        Description: A reference to the created VPC
        Value: !Ref VPC

    # Comma-joined subnet ID lists, for consumers that take both subnets as
    # one parameter.
    PublicSubnets:
        Description: A list of the public subnets
        Value: !Join [',', [!Ref PublicSubnet1, !Ref PublicSubnet2]]

    PrivateSubnets:
        Description: A list of the private subnets
        Value: !Join [',', [!Ref PrivateSubnet1, !Ref PrivateSubnet2]]

    # Individual subnet IDs, for consumers that need one subnet at a time.
    PublicSubnet1:
        Description: A reference to the public subnet in the 1st Availability Zone
        Value: !Ref PublicSubnet1

    PublicSubnet2:
        Description: A reference to the public subnet in the 2nd Availability Zone
        Value: !Ref PublicSubnet2

    PrivateSubnet1:
        Description: A reference to the private subnet in the 1st Availability Zone
        Value: !Ref PrivateSubnet1

    PrivateSubnet2:
        Description: A reference to the private subnet in the 2nd Availability Zone
        Value: !Ref PrivateSubnet2


================================================
FILE: cloudformation/master.yaml
================================================
---
AWSTemplateFormatVersion: '2010-09-09'
Description: >

    This template deploys a VPC, with a pair of public and private subnets spread
    across two Availability Zones. It deploys an Internet Gateway, with a default
    route on the public subnets. It deploys a pair of NAT Gateways (one in each AZ),
    and default routes for them in the private subnets.

    It then deploys a Fargate ECS cluster distributed across multiple
    Availability Zones.

    Finally, it deploys crowd ECS services from containers published in
    Amazon EC2 Container Registry (Amazon ECR).
# Per-environment settings. Each second-level map is keyed by the EnvName
# parameter and read in Resources with
# `!FindInMap [EnvironmentMapping, <MapName>, !Ref EnvName]`.
Mappings:
    EnvironmentMapping:
        # Indexes into the region's availability zone list, passed to the VPC
        # nested stack as AvailabilityZone1 / AvailabilityZone2.
        AvailabilityZone1Map:
            dev: 0
            test: 2
            stage: 2
            prod: 0
            cftest2: 0
        AvailabilityZone2Map:
            dev: 1
            test: 3
            stage: 3
            prod: 1
            cftest2: 1
        # Each environment gets its own /16; the subnet maps below carve /24
        # ranges out of it (.10/.11 public, .20/.21 private).
        VPCCIDRMap:
            dev: 10.192.0.0/16
            test: 10.193.0.0/16
            stage: 10.194.0.0/16
            prod: 10.195.0.0/16
            cftest2: 10.196.0.0/16
        PublicSubnet1CIDRMap:
            dev: 10.192.10.0/24
            test: 10.193.10.0/24
            stage: 10.194.10.0/24
            prod: 10.195.10.0/24
            cftest2: 10.196.10.0/24
        PublicSubnet2CIDRMap:
            dev: 10.192.11.0/24
            test: 10.193.11.0/24
            stage: 10.194.11.0/24
            prod: 10.195.11.0/24
            cftest2: 10.196.11.0/24
        PrivateSubnet1CIDRMap:
            dev: 10.192.20.0/24
            test: 10.193.20.0/24
            stage: 10.194.20.0/24
            prod: 10.195.20.0/24
            cftest2: 10.196.20.0/24
        PrivateSubnet2CIDRMap:
            dev: 10.192.21.0/24
            test: 10.193.21.0/24
            stage: 10.194.21.0/24
            prod: 10.195.21.0/24
            cftest2: 10.196.21.0/24
        # Bucket names handed to the Fargate cluster stack. Note that cftest2
        # reuses the dev buckets.
        S3BucketNameMap:
            dev: crowd-dev-content
            test: crowd-test-content
            stage: crowd-stage-content
            prod: crowd-content
            cftest2: crowd-dev-content
        ExportS3BucketNameMap:
            dev: crowd-dev-export
            test: crowd-test-export
            stage: crowd-stage-export
            prod: crowd-export
            cftest2: crowd-dev-export

Parameters:
    # Passed through unchanged to the Fargate cluster nested stack.
    ConcordiaVersion:
        Description: which version of the docker images to deploy
        Type: String
        Default: latest

    # Short environment key. It selects the row in every EnvironmentMapping
    # map and is interpolated into the Secrets Manager path used by the RDS
    # nested stack.
    EnvName:
        Description: which type of environment we are setting up
        Type: String
        AllowedValues:
            - 'dev'
            - 'test'
            - 'stage'
            - 'prod'
            - 'cftest2'

    # NOTE(review): unlike EnvName, the two parameters below have no value
    # specific to cftest2; a cftest2 deployment has to pick one of the
    # listed values.
    FullEnvironmentName:
        Type: String
        Description: Full name of deployment environment
        AllowedValues:
            - 'development'
            - 'test'
            - 'staging'
            - 'production'

    CanonicalHostName:
        Description: the canonical host name for this environment
        Type: String
        AllowedValues:
            - 'crowd-dev.loc.gov'
            - 'crowd-test.loc.gov'
            - 'crowd-stage.loc.gov'
            - 'crowd.loc.gov'

    # Secret ARN suffixes; both are forwarded to the Fargate cluster stack.
    DjangoKeyId:
        Type: String
        Description: unique ID appended to end of DjangoSecretKey ARN in secrets manager

    DbSecretId:
        Type: String
        Description: unique ID appended to end of DB password ARN in secrets manager

Resources:
    # Nested stack that builds the network (VPC, subnets, gateways, routes).
    # CIDR ranges and availability zone indexes come from EnvironmentMapping,
    # keyed by EnvName.
    VPC:
        Type: AWS::CloudFormation::Stack
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            # Parameterized alternative, currently disabled:
            # TemplateURL: !Join [ "/", [ !Ref BasePath, "/infrastructure/vpc.yaml" ]]
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/vpc.yaml'
            Parameters:
                EnvironmentName: !Ref AWS::StackName
                VpcCIDR: !FindInMap [EnvironmentMapping, VPCCIDRMap, !Ref EnvName]
                PublicSubnet1CIDR: !FindInMap [EnvironmentMapping, PublicSubnet1CIDRMap, !Ref EnvName]
                PublicSubnet2CIDR: !FindInMap [EnvironmentMapping, PublicSubnet2CIDRMap, !Ref EnvName]
                PrivateSubnet1CIDR: !FindInMap [EnvironmentMapping, PrivateSubnet1CIDRMap, !Ref EnvName]
                PrivateSubnet2CIDR: !FindInMap [EnvironmentMapping, PrivateSubnet2CIDRMap, !Ref EnvName]
                AvailabilityZone1: !FindInMap [EnvironmentMapping, AvailabilityZone1Map, !Ref EnvName]
                AvailabilityZone2: !FindInMap [EnvironmentMapping, AvailabilityZone2Map, !Ref EnvName]

    # Nested stack for the network ACLs; it receives the VPC and all four
    # subnet IDs from the VPC stack's outputs.
    NetworkACL:
        Type: AWS::CloudFormation::Stack
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            # Parameterized alternative, currently disabled:
            # TemplateURL: !Join [ "/", [ !Ref BasePath, "/infrastructure/network-acl.yaml" ]]
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/network-acl.yaml'
            Parameters:
                EnvironmentName: !Ref AWS::StackName
                VPC: !GetAtt VPC.Outputs.VPC
                PrivateSubnet1: !GetAtt VPC.Outputs.PrivateSubnet1
                PrivateSubnet2: !GetAtt VPC.Outputs.PrivateSubnet2
                PublicSubnet1: !GetAtt VPC.Outputs.PublicSubnet1
                PublicSubnet2: !GetAtt VPC.Outputs.PublicSubnet2

    # Nested stack for the security groups, created inside the VPC built
    # above. Its outputs are consumed by the RDS, ElastiCache and
    # FargateCluster stacks.
    SecurityGroups:
        Type: AWS::CloudFormation::Stack
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/security-groups.yaml'
            Parameters:
                VPC: !GetAtt VPC.Outputs.VPC
                EnvironmentName: !Ref AWS::StackName

    # Nested stack for the database. Credentials are never stored in the
    # template: they are resolved at deploy time from the Secrets Manager
    # secret crowd/<EnvName>/DB/MasterUserPassword.
    RDS:
        Type: AWS::CloudFormation::Stack
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/rds.yaml'
            Parameters:
                PrivateSubnet1: !GetAtt VPC.Outputs.PrivateSubnet1
                PrivateSubnet2: !GetAtt VPC.Outputs.PrivateSubnet2
                DatabaseSecurityGroup: !GetAtt SecurityGroups.Outputs.DatabaseSecurityGroup
                DbUsername: !Sub '{{resolve:secretsmanager:crowd/${EnvName}/DB/MasterUserPassword:SecretString:username}}'
                DbPassword: !Sub '{{resolve:secretsmanager:crowd/${EnvName}/DB/MasterUserPassword:SecretString:password}}'

    # Nested stack for the cache, placed in the private subnets. Its
    # RedisAddress and RedisPort outputs feed the FargateCluster stack.
    ElastiCache:
        Type: AWS::CloudFormation::Stack
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/elasticache.yaml'
            Parameters:
                EnvironmentName: !Ref AWS::StackName
                PrivateSubnets: !GetAtt VPC.Outputs.PrivateSubnets
                SecurityGroup: !GetAtt SecurityGroups.Outputs.CacheServiceSecurityGroup

    # Nested stack for the Fargate cluster and its services. It is wired to
    # every other nested stack: network and security groups, the cache and
    # database endpoints, plus the per-environment bucket names.
    FargateCluster:
        Type: AWS::CloudFormation::Stack
        DeletionPolicy: Retain
        UpdateReplacePolicy: Retain
        Properties:
            TemplateURL: 'https://s3.amazonaws.com/crowd-deployment/infrastructure/fargate-cluster.yaml'
            Parameters:
                # Environment identity
                EnvironmentName: !Ref AWS::StackName
                EnvName: !Ref EnvName
                FullEnvironmentName: !Ref FullEnvironmentName
                CanonicalHostName: !Ref CanonicalHostName
                ConcordiaVersion: !Ref ConcordiaVersion
                # Networking
                VpcId: !GetAtt VPC.Outputs.VPC
                PrivateSubnets: !GetAtt VPC.Outputs.PrivateSubnets
                PublicSubnets: !GetAtt VPC.Outputs.PublicSubnets
                SecurityGroup: !GetAtt SecurityGroups.Outputs.ECSHostSecurityGroup
                LoadBalancerSecurityGroup: !GetAtt SecurityGroups.Outputs.LoadBalancerSecurityGroup
                # Backing services
                RedisAddress: !GetAtt ElastiCache.Outputs.RedisAddress
                RedisPort: !GetAtt ElastiCache.Outputs.RedisPort
                DatabaseEndpoint: !GetAtt RDS.Outputs.DatabaseHostName
                # Secrets
                DjangoKeyId: !Ref DjangoKeyId
                DbSecretId: !Ref DbSecretId
                # Storage
                S3BucketName: !FindInMap [EnvironmentMapping, S3BucketNameMap, !Ref EnvName]
                ExportS3BucketName: !FindInMap [EnvironmentMapping, ExportS3BucketNameMap, !Ref EnvName]

Outputs:
    # Load balancer URL reported by the FargateCluster stack, with a
    # trailing slash appended.
    WebsiteServiceUrl:
        Description: The URL endpoint for the concordia website service
        Value: !Join
            - ''
            - - !GetAtt FargateCluster.Outputs.LoadBalancerUrl
              - '/'


================================================
FILE: cloudformation/stack_drift.sh
================================================
#!/bin/bash
#
# Collect CloudFormation drift details for the nested stacks of a parent stack.
#
# Usage: stack_drift.sh STACK_NAME
#
# For every nested stack of STACK_NAME, the resources whose recorded drift
# status is MODIFIED or DELETED are passed to `detect-stack-resource-drift`
# and the JSON results are appended to stack-drift-<stack>-<date>.json.
# Progress messages are written to stack-drift-<stack>-<date>.log.

set -eu -o pipefail

# Default to an empty string so `set -u` does not abort on a missing argument
# before the usage message below can be printed.
STACK_NAME=${1:-}
if [[ -z "${STACK_NAME}" ]]; then
    echo "STACK_NAME must be set prior to running this script."
    exit 1
fi

TODAY=$(date +%Y%m%d)
# job log and json output file names
LOG_FILE="stack-drift-${STACK_NAME}-${TODAY}.log"
# This first write starts a fresh log, replacing one from an earlier run on
# the same day.
echo "$STACK_NAME" | tee "${LOG_FILE}"

OUTPUT_FILE="stack-drift-${STACK_NAME}-${TODAY}.json"
# Append (-a) so the stack name logged above is not overwritten.
echo "$OUTPUT_FILE" | tee -a "${LOG_FILE}"

# Append drift details for every resource of a nested stack whose recorded
# drift status matches the requested one.
#   $1 - nested stack name
#   $2 - drift status to report (MODIFIED or DELETED)
report_drift() {
    local stack_name=$1
    local drift_status=$2
    local label
    local resource_ids
    local id

    label="$(echo "${drift_status}" | tr '[:upper:]' '[:lower:]')"

    resource_ids="$(aws cloudformation describe-stack-resources \
        --stack-name "${stack_name}" \
        --query "StackResources[?DriftInformation.StackResourceDriftStatus==\`${drift_status}\`].LogicalResourceId" \
        --output text)"
    echo "LOGICAL_RESOURCE_IDS_${drift_status}: $resource_ids" | tee -a "${LOG_FILE}"

    # Logical resource IDs are alphanumeric, so word splitting is safe here.
    for id in $resource_ids; do
        echo "${label} resource id: $id" | tee -a "${LOG_FILE}"
        aws cloudformation detect-stack-resource-drift \
            --stack-name "${stack_name}" \
            --logical-resource-id "$id" >> "${OUTPUT_FILE}"
    done
}

# Fetch the ARNs of the nested stacks. The query keeps only resources of type
# AWS::CloudFormation::Stack and text output yields whitespace-separated ARNs
# without JSON brackets, quotes or commas.
NESTED_STACK_ARNS="$(aws cloudformation list-stack-resources \
    --stack-name "${STACK_NAME}" \
    --query 'StackResourceSummaries[?ResourceType==`AWS::CloudFormation::Stack`].PhysicalResourceId' \
    --output text)"
echo "NESTED_STACK_ARNS: $NESTED_STACK_ARNS" | tee -a "${LOG_FILE}"

COUNT=1

for ARN in $NESTED_STACK_ARNS; do
    # A stack ARN ends in "stack/<name>/<uuid>"; the name is the second
    # '/'-separated field.
    NESTED_STACK_NAME="$(echo "${ARN}" | awk -F'/' '{ print $2 }')"

    # Anything without a '/' is not a stack ARN - skip it.
    if [[ -z "${NESTED_STACK_NAME}" ]]; then
        echo "skip not a valid value: ${ARN}" | tee -a "${LOG_FILE}"
        continue
    fi

    echo "Nested stack name: $NESTED_STACK_NAME" | tee -a "${LOG_FILE}"
    echo "$COUNT"

    # fetch logical resources names where drift exists to report out the details
    report_drift "${NESTED_STACK_NAME}" MODIFIED
    report_drift "${NESTED_STACK_NAME}" DELETED

    # Plain arithmetic assignment: unlike ((COUNT++)), its exit status can
    # never trip `set -e`.
    COUNT=$((COUNT + 1))
done

# With `set -e` any failing command has already aborted the script, so
# reaching this point means every step succeeded.
RETURNCODE=0

echo "$RETURNCODE" | tee -a "${LOG_FILE}"

echo "Drift results saved to $OUTPUT_FILE" | tee -a "${LOG_FILE}"
exit $RETURNCODE


================================================
FILE: cloudformation/sync_templates.sh
================================================
#!/bin/bash
#
# Upload the contents of the current working directory to the
# crowd-deployment S3 bucket.
#
# NOTE(review): master.yaml loads its nested templates from
# crowd-deployment/infrastructure/, so this is presumably meant to be run
# from the cloudformation/ directory - confirm.

# Abort on the first failing command or on use of an unset variable.
set -o errexit -o nounset

aws s3 sync . s3://crowd-deployment


================================================
FILE: cloudformation/tests/validate-templates.sh
================================================
#!/bin/bash
#
# Validate every *.yaml file below the current directory with
# `aws cloudformation validate-template`.
#
# Prints one [pass]/[fail] line per template and exits with status 1 when at
# least one template fails validation.
ERROR_COUNT=0

echo "Validating AWS CloudFormation templates..."

# Loop through the YAML templates in this repository. Paths are read
# NUL-delimited so names containing whitespace or glob characters survive
# intact; process substitution keeps the loop in the current shell so
# ERROR_COUNT is still visible after it ends.
while IFS= read -r -d '' TEMPLATE; do

    # Validate the template with CloudFormation. Only stderr is captured;
    # the JSON printed on success is discarded.
    if ERRORS=$(aws cloudformation validate-template --template-body "file://${TEMPLATE}" 2>&1 >/dev/null); then
        echo "[pass] $TEMPLATE"
    else
        ERROR_COUNT=$((ERROR_COUNT + 1))
        echo "[fail] $TEMPLATE: $ERRORS"
    fi

done < <(find . -name '*.yaml' -print0)

echo "$ERROR_COUNT template validation error(s)"
if [ "$ERROR_COUNT" -gt 0 ]; then
    exit 1
fi


================================================
FILE: concordia/__init__.py
================================================
from __future__ import absolute_import, unicode_literals

# Import the Celery application whenever the `concordia` package is imported
# and re-export it under the name `celery_app`.
# NOTE(review): presumably the usual Celery/Django wiring so that the app is
# loaded when Django starts - confirm against concordia/celery.py.
from concordia.celery import app as celery_app

__all__ = ["celery_app"]


================================================
FILE: concordia/admin/__init__.py
================================================
import io
import logging
import zipfile
from typing import Any

from django.contrib import admin, messages
from django.contrib.admin.models import CHANGE, LogEntry
from django.contrib.admin.options import get_content_type_for_model
from django.contrib.auth import get_permission_codename
from django.contrib.auth.admin import UserAdmin
from django.contrib.auth.decorators import permission_required
from django.contrib.auth.models import User
from django.db.models import Exists, OuterRef, QuerySet
from django.http import Http404, HttpRequest, HttpResponse, HttpResponseRedirect
from django.shortcuts import get_object_or_404, render
from django.template.defaultfilters import truncatechars
from django.template.response import TemplateResponse
from django.urls import path, reverse
from django.utils.decorators import method_decorator
from django.utils.html import format_html
from django.utils.http import url_has_allowed_host_and_scheme
from django.views.decorators.csrf import csrf_protect

from exporter import views as exporter_views
from exporter.tabular_export.admin import export_to_csv_action, export_to_excel_action
from exporter.tabular_export.core import export_to_csv_response, flatten_queryset
from importer.tasks.items import import_items_into_project_from_url

from ..models import (
    Asset,
    AssetTranscriptionReservation,
    Banner,
    Campaign,
    CampaignRetirementProgress,
    Card,
    CardFamily,
    CarouselSlide,
    ConcordiaFile,
    Guide,
    HelpfulLink,
    Item,
    KeyMetricsReport,
    NextReviewableCampaignAsset,
    NextReviewableTopicAsset,
    NextTranscribableCampaignAsset,
    NextTranscribableTopicAsset,
    Project,
    ProjectTopic,
    SimplePage,
    SiteReport,
    Tag,
    Topic,
    Transcription,
    TutorialCard,
    UserAssetTagCollection,
    UserProfileActivity,
)
from ..tasks.retirement import retire_campaign
from ..views.campaigns import ReportCampaignView
from .actions import (
    anonymize_action,
    change_status_to_completed,
    change_status_to_in_progress,
    change_status_to_needs_review,
    publish_action,
    publish_item_action,
    unpublish_action,
    unpublish_item_action,
    verify_assets_action,
)
from .filters import (
    AcceptedFilter,
    AssetCampaignListFilter,
    AssetCampaignStatusListFilter,
    AssetProjectListFilter,
    CardCampaignListFilter,
    HelpfulLinkCampaignListFilter,
    HelpfulLinkCampaignStatusListFilter,
    ItemCampaignListFilter,
    ItemCampaignStatusListFilter,
    ItemProjectListFilter,
    NextAssetCampaignListFilter,
    OcrGeneratedFilter,
    OcrOriginatedFilter,
    ProjectCampaignListFilter,
    ProjectCampaignStatusListFilter,
    RejectedFilter,
    SiteReportCampaignListFilter,
    SiteReportSortedCampaignListFilter,
    SubmittedFilter,
    SupersededListFilter,
    TagCampaignListFilter,
    TagCampaignStatusListFilter,
    TopicListFilter,
    TranscriptionCampaignListFilter,
    TranscriptionCampaignStatusListFilter,
    TranscriptionProjectListFilter,
    UserAssetTagCollectionCampaignListFilter,
    UserAssetTagCollectionCampaignStatusListFilter,
    UserProfileActivityCampaignListFilter,
    UserProfileActivityCampaignStatusListFilter,
)
from .forms import (
    AdminItemImportForm,
    AssetStatusActionForm,
    CampaignAdminForm,
    CardAdminForm,
    GuideAdminForm,
    ItemAdminForm,
    KeyMetricsReportAdminForm,
    ProjectAdminForm,
    ProjectTopicInlineForm,
    TopicAdminForm,
)

logger = logging.getLogger(__name__)


class ConcordiaUserAdmin(UserAdmin):
    """
    Django admin for `User` objects with activity counters and exports.

    The changelist shows each user's transcription and review counts, read
    from the related profile. The action menu offers anonymization plus CSV
    and Excel exports.
    """

    list_display = (
        "username",
        "email",
        "is_staff",
        "date_joined",
        "transcription_count",
        "review_count",
    )

    # Fields written by the CSV and Excel export actions, in column order.
    EXPORT_FIELDS = (
        "username",
        "email",
        "first_name",
        "last_name",
        "is_active",
        "is_staff",
        "is_superuser",
        "date_joined",
        "last_login",
        "profile__transcribe_count",
        "profile__review_count",
    )

    # Column labels for the export fields that traverse the profile relation.
    EXTRA_VERBOSE_NAMES = {
        "profile__transcribe_count": "transcription count",
        "profile__review_count": "review count",
    }

    def get_queryset(self, request: HttpRequest) -> QuerySet[User]:
        """
        Return the changelist queryset with each user's profile preloaded.

        Joining the profile up front avoids one extra query per row when the
        counter columns are rendered.

        Args:
            request (HttpRequest): Current admin request.

        Returns:
            QuerySet[User]: The base queryset with `select_related("profile")`
                applied.
        """
        return super().get_queryset(request).select_related("profile")

    @admin.display(
        description="Transcription Count",
        ordering="profile__transcribe_count",
    )
    def transcription_count(self, obj: User) -> int:
        """Return the transcription counter stored on the user's profile."""
        profile = obj.profile
        return profile.transcribe_count

    @admin.display(
        description="Review Count",
        ordering="profile__review_count",
    )
    def review_count(self, obj: User) -> int:
        """Return the review counter stored on the user's profile."""
        profile = obj.profile
        return profile.review_count

    def export_users_as_csv(
        self,
        request: HttpRequest,
        queryset: QuerySet[User],
    ) -> HttpResponse:
        """
        Admin action: download the selected users as CSV.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[User]): Users selected in the changelist.

        Returns:
            HttpResponse: The response produced by `export_to_csv_action`.
        """
        export_options = {
            "field_names": self.EXPORT_FIELDS,
            "extra_verbose_names": self.EXTRA_VERBOSE_NAMES,
        }
        return export_to_csv_action(self, request, queryset, **export_options)

    def export_users_as_excel(
        self,
        request: HttpRequest,
        queryset: QuerySet[User],
    ) -> HttpResponse:
        """
        Admin action: download the selected users as an Excel file.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[User]): Users selected in the changelist.

        Returns:
            HttpResponse: The response produced by `export_to_excel_action`.
        """
        export_options = {
            "field_names": self.EXPORT_FIELDS,
            "extra_verbose_names": self.EXTRA_VERBOSE_NAMES,
        }
        return export_to_excel_action(self, request, queryset, **export_options)

    # Must follow the two export methods: the tuple refers to the function
    # objects defined above in this class body.
    actions = (anonymize_action, export_users_as_csv, export_users_as_excel)


# Swap the admin registered for `User` for the customized
# `ConcordiaUserAdmin`: the existing registration has to be removed before
# the model can be registered again.
admin.site.unregister(User)
admin.site.register(User, ConcordiaUserAdmin)


@admin.register(Banner)
class BannerAdmin(admin.ModelAdmin):
    """Admin for `Banner` objects; the changelist shows `text` and `active`."""

    list_display = ("text", "active")


class CustomListDisplayFieldsMixin:
    """
    Shared changelist columns for admin classes.

    Supplies shortened renderings of an object's `description` and
    `metadata` so long values do not blow up the changelist table.
    """

    @admin.display(description="Description")
    def truncated_description(self, obj):
        """Return `obj.description` passed through `truncatechars` at 200."""
        shortened = truncatechars(obj.description, 200)
        return shortened

    @admin.display(description="Metadata")
    def truncated_metadata(self, obj):
        """
        Return `obj.metadata` truncated at 200 and wrapped in `<code>`.

        An empty string is returned when the object has no metadata.
        """
        if not obj.metadata:
            return ""

        shortened = truncatechars(obj.metadata, 200)
        # format_html escapes the value before inserting it into the markup.
        return format_html("<code>{}</code>", shortened)


@admin.register(Campaign)
class CampaignAdmin(admin.ModelAdmin, CustomListDisplayFieldsMixin):
    """
    Admin configuration for `Campaign` objects.

    Adds filters, publishing actions, export links and a custom retirement
    workflow.
    """

    form = CampaignAdminForm

    # Django requires every name in `list_editable` to also appear in
    # `list_display` (system check admin.E122), so "unlisted" has to be a
    # changelist column for it to be editable there.
    list_display = (
        "title",
        "status",
        "published",
        "unlisted",
        "display_on_homepage",
        "next_transcription_campaign",
        "next_review_campaign",
        "ordering",
        "launch_date",
        "completed_date",
    )
    list_editable = (
        "display_on_homepage",
        "next_transcription_campaign",
        "next_review_campaign",
        "ordering",
        "published",
        "unlisted",
        "status",
        "launch_date",
        "completed_date",
    )
    list_display_links = ("title",)
    fields = (
        "published",
        "unlisted",
        "status",
        "next_transcription_campaign",
        "next_review_campaign",
        "ordering",
        "display_on_homepage",
        "title",
        "slug",
        "card_family",
        "thumbnail_image",
        "image_alt_text",
        "launch_date",
        "completed_date",
        "description",
        "short_description",
        "metadata",
        "disable_ocr",
        "research_centers",
    )
    prepopulated_fields = {"slug": ("title",)}
    raw_id_fields = ("card_family",)
    search_fields = ["title", "description"]
    list_filter = (
        "published",
        "display_on_homepage",
        "unlisted",
        "status",
        "next_transcription_campaign",
        "next_review_campaign",
    )

    actions = (publish_action, unpublish_action, verify_assets_action)

    def get_form(
        self,
        request: HttpRequest,
        obj: Campaign | None = None,
        **kwargs: Any,
    ):
        """
        Build the model form used to edit a campaign.

        Updates some field labels to be clearer for staff users before
        returning the base form from `ModelAdmin`.

        Args:
            request (HttpRequest): Current admin request.
            obj (Campaign | None): Campaign being edited, or `None` when
                creating a new one.
            **kwargs (Any): Extra keyword arguments passed to
                `ModelAdmin.get_form`.

        Returns:
            forms.ModelForm: Form class used by the admin for this model.
        """
        form = super().get_form(request, obj, **kwargs)
        form.base_fields["display_on_homepage"].label = "Display on homepage"
        form.base_fields["next_transcription_campaign"].label = (
            "Next transcription campaign"
        )
        form.base_fields["next_review_campaign"].label = "Next review campaign"
        return form

    def get_urls(self):
        """
        Add custom admin URLs for campaign exports, reports and retirement.

        The custom patterns are placed before the default ones so they are
        matched first.

        Returns:
            list: List of URL patterns including the default admin URLs and
            the custom campaign URLs.
        """
        urls = super().get_urls()

        app_label = self.model._meta.app_label
        model_name = self.model._meta.model_name

        custom_urls = [
            path(
                "exportCSV/<path:campaign_slug>",
                exporter_views.ExportCampaignToCSV.as_view(),
                name=f"{app_label}_{model_name}_export-csv",
            ),
            path(
                "exportBagIt/<path:campaign_slug>",
                exporter_views.ExportCampaignToBagIt.as_view(),
                name=f"{app_label}_{model_name}_export-bagit",
            ),
            path(
                "report/<path:campaign_slug>",
                ReportCampaignView.as_view(),
                name=f"{app_label}_{model_name}_report",
            ),
            path(
                "retire/<path:campaign_slug>",
                self.admin_site.admin_view(self.retire),
                name=f"{app_label}_{model_name}_retire",
            ),
        ]

        return custom_urls + urls

    @method_decorator(csrf_protect)
    @method_decorator(
        permission_required("concordia.retire_campaign", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.delete_project", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.delete_item", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.delete_asset", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.delete_transcription", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.delete_import_item_asset", raise_exception=True)
    )
    def retire(
        self,
        request: HttpRequest,
        campaign_slug: str,
    ) -> HttpResponse:
        """
        Start the retirement process for a campaign.

        Without POST data this view renders a confirmation page listing how
        many projects, items, assets and transcriptions belong to the
        campaign. With POST data it logs the retirement, calls
        `retire_campaign` and redirects to the admin change page of the
        returned progress object.

        Args:
            request (HttpRequest): Current admin request.
            campaign_slug (str): Slug of the campaign being retired.

        Returns:
            HttpResponse: Confirmation page, redirect to the progress
            object, or the admin's "object does not exist" redirect when no
            campaign has the given slug.
        """
        try:
            campaign = Campaign.objects.filter(slug=campaign_slug)[0]
        except IndexError:
            return self._get_obj_does_not_exist_redirect(
                request, self.opts, campaign_slug
            )

        if request.POST:
            # This means the user confirmed the retirement
            obj_display = str(campaign)
            self.log_retirement(request, campaign, obj_display)
            progress = retire_campaign(campaign.id)
            self.message_user(
                request,
                'The retirement process for %(name)s "%(obj)s" has begun.'
                % {
                    "name": self.opts.verbose_name,
                    "obj": obj_display,
                },
                messages.SUCCESS,
            )
            post_url = reverse(
                "admin:concordia_campaignretirementprogress_change",
                args=[progress.id],
                current_app=self.admin_site.name,
            )
            return HttpResponseRedirect(post_url)

        # The counts are only needed for the confirmation page. The id
        # querysets are used as subqueries and counted with `count()` so the
        # database does the counting instead of every id being loaded into
        # memory.
        project_ids = campaign.project_set.values_list("id", flat=True)
        item_ids = Item.objects.filter(project__id__in=project_ids).values_list(
            "id", flat=True
        )
        asset_ids = Asset.objects.filter(item__id__in=item_ids).values_list(
            "id", flat=True
        )
        transcriptions = Transcription.objects.filter(asset__id__in=asset_ids)

        model_count = {
            "project": project_ids.count(),
            "item": item_ids.count(),
            "asset": asset_ids.count(),
            "transcription": transcriptions.count(),
        }

        context = {
            **self.admin_site.each_context(request),
            "title": "Are you sure?",
            "subtitle": None,
            "object_name": "Campaign",
            "object": campaign,
            "model_count": model_count.items(),
            "opts": self.opts,
            "app_label": self.opts.app_label,
            "preserved_filters": self.get_preserved_filters(request),
        }

        return TemplateResponse(
            request, "admin/concordia/campaign/retire.html", context
        )

    def log_retirement(
        self,
        request: HttpRequest,
        obj: Campaign,
        object_repr: str,
    ) -> LogEntry:
        """
        Create an admin log entry for a campaign retirement.

        The entry is recorded with the `CHANGE` action flag.

        Args:
            request (HttpRequest): Current admin request.
            obj (Campaign): Campaign that is being retired.
            object_repr (str): Text representation of the campaign used in
                the log entry.

        Returns:
            LogEntry: The created log entry instance.
        """
        return LogEntry.objects.log_action(
            user_id=request.user.pk,
            content_type_id=get_content_type_for_model(obj).pk,
            object_id=obj.pk,
            object_repr=object_repr,
            action_flag=CHANGE,
        )


@admin.register(HelpfulLink)
class HelpfulLinkAdmin(admin.ModelAdmin, CustomListDisplayFieldsMixin):
    """Admin configuration for `HelpfulLink` objects."""

    list_display = ("campaign", "topic", "sequence", "title", "link_url")
    # Every column except the URL links to the change form.
    list_display_links = ("campaign", "topic", "sequence", "title")
    list_filter = (
        "link_type",
        HelpfulLinkCampaignStatusListFilter,
        TopicListFilter,
        HelpfulLinkCampaignListFilter,
    )

    def formfield_for_foreignkey(
        self,
        db_field: Any,
        request: HttpRequest,
        **kwargs: Any,
    ) -> Any:
        """
        Build the form field for a foreign key on the change form.

        For the `campaign` field the choices are taken from campaigns
        ordered by title; every other field uses the default behaviour.

        Args:
            db_field (Any): Model field being rendered.
            request (HttpRequest): Current admin request.
            **kwargs (Any): Extra keyword arguments forwarded to the base
                implementation.

        Returns:
            Any: Form field instance for the foreign key.
        """
        is_campaign_field = db_field.name == "campaign"
        if is_campaign_field:
            kwargs.update(queryset=Campaign.objects.order_by("title"))
        return super().formfield_for_foreignkey(db_field, request, **kwargs)


@admin.register(ConcordiaFile)
class ConcordiaFileAdmin(admin.ModelAdmin):
    """Admin configuration for `ConcordiaFile` objects."""

    # Bulk delete bypasses file deletion, so we do not want any bulk actions
    actions = None
    list_display = ("name", "file_url", "updated_on")
    readonly_fields = ("file_url", "updated_on")

    def file_url(self, obj: ConcordiaFile) -> str:
        """
        Return the uploaded file's URL with any query string removed.

        Args:
            obj (ConcordiaFile): File instance.

        Returns:
            str: The part of `obj.uploaded_file.url` before the first `?`.
        """
        # Boto3 appends querystring parameters to the URL so private files
        # can be accessed. All of these files are public, so the parameters
        # are just noise and everything from the first "?" on is dropped.
        # Plain string handling keeps this free of third-party helpers.
        raw_url = obj.uploaded_file.url
        base_url, _, _ = raw_url.partition("?")
        return base_url

    def get_fields(
        self,
        request: HttpRequest,
        obj: ConcordiaFile | None = None,
    ) -> tuple[str, ...]:
        """
        Choose the fields shown on the add and change forms.

        The add form only offers the editable fields. The change form also
        shows `file_url` and `updated_on`, which this admin declares as
        read only.

        Args:
            request (HttpRequest): Current admin request.
            obj (ConcordiaFile | None): File being edited, or
                `None` when adding a new one.

        Returns:
            tuple[str, ...]: Field names to display in the form.
        """
        if not obj:
            return ("name", "uploaded_file")
        return ("name", "file_url", "uploaded_file", "updated_on")


class TopicProjectInline(admin.TabularInline):
    """Tabular inline for `ProjectTopic` rows, used by `TopicAdmin`."""

    model = ProjectTopic
    # Foreign key on `ProjectTopic` that points back at the parent object.
    fk_name = "topic"
    form = ProjectTopicInlineForm
    fields = ["project", "url_filter", "ordering"]
    autocomplete_fields = ["project"]
    # Number of blank extra rows offered.
    extra = 1


@admin.register(Topic)
class TopicAdmin(admin.ModelAdmin):
    """Admin configuration for `Topic` objects."""

    form = TopicAdminForm
    inlines = [TopicProjectInline]

    # Changelist columns; the first three link to the change form.
    list_display = (
        "id",
        "title",
        "slug",
        "short_description",
        "published",
        "unlisted",
        "ordering",
    )
    list_display_links = ("id", "title", "slug")

    # The slug input is pre-filled from the title on the add form.
    prepopulated_fields = {"slug": ("title",)}
    search_fields = ["title"]


class ProjectTopicInline(admin.TabularInline):
    """Tabular inline for `ProjectTopic` rows, used by `ProjectAdmin`."""

    model = ProjectTopic
    form = ProjectTopicInlineForm
    fields = ["topic", "url_filter"]
    autocomplete_fields = ["topic"]
    # Number of blank extra rows offered.
    extra = 1


@admin.register(Project)
class ProjectAdmin(admin.ModelAdmin, CustomListDisplayFieldsMixin):
    """
    Admin configuration for `Project` objects.

    Adds campaign-based filters, publishing actions, an item import view
    and a CSV export URL.
    """

    form = ProjectAdminForm

    inlines = [ProjectTopicInline]

    list_display = ("id", "title", "slug", "campaign", "published", "ordering")
    list_editable = ("ordering",)
    list_display_links = ("id", "title", "slug")
    prepopulated_fields = {"slug": ("title",)}
    search_fields = ["title", "campaign__title"]
    list_filter = (
        "published",
        "topics",
        ProjectCampaignStatusListFilter,
        ProjectCampaignListFilter,
    )

    actions = (publish_action, unpublish_action, verify_assets_action)

    def lookup_allowed(self, key: str, value: str) -> bool:
        """
        Allow filtering by campaign id in the changelist.

        Args:
            key (str): Lookup parameter key.
            value (str): Lookup parameter value.

        Returns:
            bool: True if the lookup is allowed.
        """
        # The trailing comma matters: without it the parentheses hold a bare
        # string and `in` becomes a substring test, which would also allow
        # keys such as "id" or "campaign".
        if key in ("campaign__id__exact",):
            return True
        return super().lookup_allowed(key, value)

    def get_urls(self):
        """
        Add custom URLs for project item import and CSV export.

        The custom patterns are placed before the default ones so they are
        matched first.

        Returns:
            list: Custom URL patterns combined with the default admin URLs.
        """
        urls = super().get_urls()

        app_label = self.model._meta.app_label
        model_name = self.model._meta.model_name

        custom_urls = [
            path(
                "<path:object_id>/item-import/",
                self.admin_site.admin_view(self.item_import_view),
                name=f"{app_label}_{model_name}_item-import",
            ),
            path(
                "exportCSV/<path:campaign_slug>/<path:project_slug>/",
                exporter_views.ExportProjectToCSV.as_view(),
                name=f"{app_label}_{model_name}_export-csv",
            ),
        ]

        return custom_urls + urls

    @method_decorator(
        permission_required("concordia.add_campaign", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.change_campaign", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.add_project", raise_exception=True)
    )
    @method_decorator(
        permission_required("concordia.change_project", raise_exception=True)
    )
    @method_decorator(permission_required("concordia.add_item", raise_exception=True))
    @method_decorator(
        permission_required("concordia.change_item", raise_exception=True)
    )
    def item_import_view(
        self,
        request: HttpRequest,
        object_id: str,
    ) -> HttpResponse:
        """
        Display and process the admin item import form for a project.

        On `GET` an empty `AdminItemImportForm` is shown. On `POST` the
        submitted form is validated; when valid,
        `import_items_into_project_from_url` is called with the requesting
        user, the project and the submitted URL, and its result is passed to
        the template as `import_job`. In every other case `import_job` is
        `None`.

        Args:
            request (HttpRequest): Current admin request.
            object_id (str): Primary key of the project being imported
                into.

        Returns:
            HttpResponse: Rendered admin page for the import form.

        Raises:
            Http404: If no project has the given primary key.
        """
        project = get_object_or_404(Project, pk=object_id)

        # There is no import job unless a valid form is submitted below.
        import_job = None
        if request.method == "POST":
            form = AdminItemImportForm(request.POST)
            if form.is_valid():
                import_job = import_items_into_project_from_url(
                    request.user, project, form.cleaned_data["import_url"]
                )
        else:
            form = AdminItemImportForm()

        media = self.media

        # Besides the import-specific entries, the context carries the flags
        # the standard admin change-form templates expect.
        context = {
            **self.admin_site.each_context(request),
            "app_label": self.model._meta.app_label,
            "add": False,
            "change": False,
            "save_as": False,
            "save_on_top": False,
            "opts": self.model._meta,
            "title": f"Import Items into “{project.title}”",
            "object_id": object_id,
            "original": project,
            "media": media,
            "preserved_filters": self.get_preserved_filters(request),
            "is_popup": False,
            "has_view_permission": True,
            "has_add_permission": True,
            "has_change_permission": True,
            "has_delete_permission": False,
            "has_editable_inline_admin_formsets": False,
            "project": project,
            "form": form,
            "import_job": import_job,
        }

        return render(request, "admin/concordia/project/item_import.html", context)


@admin.register(Item)
class ItemAdmin(admin.ModelAdmin):
    """
    Admin configuration for `Item` objects.

    Provides campaign and project filters, publishing actions and a
    condensed delete confirmation summary.
    """

    form = ItemAdminForm
    list_display = ("title", "item_id", "campaign_title", "project", "published")
    list_display_links = ("title", "item_id")
    search_fields = [
        "title",
        "item_id",
        "item_url",
        "project__campaign__title",
        "project__title",
    ]

    list_filter = (
        "published",
        "project__topics",
        ItemCampaignStatusListFilter,
        ItemCampaignListFilter,
        ItemProjectListFilter,
    )

    actions = (publish_item_action, unpublish_item_action, verify_assets_action)

    def lookup_allowed(self, key: str, value: str) -> bool:
        """
        Decide whether a changelist lookup may be used for filtering.

        The campaign id lookup is always permitted; anything else is left
        to the default `ModelAdmin` rules.

        Args:
            key (str): Lookup parameter key.
            value (str): Lookup parameter value.

        Returns:
            bool: True if the lookup is allowed.
        """
        always_allowed = ("project__campaign__id__exact",)
        if key not in always_allowed:
            return super().lookup_allowed(key, value)
        return True

    def get_deleted_objects(
        self,
        objs: list[Item],
        request: HttpRequest,
    ):
        """
        Summarize what deleting the given items would remove.

        Fewer than 30 items are listed individually; otherwise only the
        first three are listed, followed by a line giving the number of
        remaining items. The summary also counts the assets and
        transcriptions attached to the items and reports which of the
        item, asset and transcription delete permissions the user lacks.

        Args:
            objs (list[Item]): Items selected for deletion.
            request (HttpRequest): Current admin request.

        Returns:
            tuple[list[str], dict[str, int], set[str], list]:
                Deleted object labels, counts per model, verbose names of
                models the user may not delete and a (always empty) list of
                protected objects.
        """
        total = len(objs)
        if total >= 30:
            # Long selections are abbreviated to keep the page readable.
            deleted_objects = [str(item) for item in objs[:3]]
            deleted_objects.append(
                f"… and {total - 3} more {Item._meta.verbose_name_plural}"
            )
        else:
            deleted_objects = [str(item) for item in objs]

        perms_needed = set()
        for model in (Item, Asset, Transcription):
            model_opts = model._meta
            codename = get_permission_codename("delete", model_opts)
            if request.user.has_perm(f"{model_opts.app_label}.{codename}"):
                continue
            perms_needed.add(model_opts.verbose_name)

        asset_total = Asset.objects.filter(item__in=objs).count()
        transcription_total = Transcription.objects.filter(
            asset__item__in=objs
        ).count()
        model_count = {
            Item._meta.verbose_name_plural: total,
            Asset._meta.verbose_name_plural: asset_total,
            Transcription._meta.verbose_name_plural: transcription_total,
        }

        protected = []
        return (deleted_objects, model_count, perms_needed, protected)

    def get_queryset(
        self,
        request: HttpRequest,
    ):
        """
        Return the admin queryset with project and campaign joined in.

        `select_related` is applied for the project and its campaign so
        that reading them per row does not need further queries.
        """
        base_queryset = super().get_queryset(request)
        return base_queryset.select_related("project", "project__campaign")

    def campaign_title(self, obj: Item) -> str:
        """
        Return the title of the campaign that owns the item's project.

        Args:
            obj (Item): Item instance.

        Returns:
            str: Title of the related campaign.
        """
        campaign = obj.project.campaign
        return campaign.title


@admin.register(AssetTranscriptionReservation)
class AssetTranscriptionReservationAdmin(
    admin.ModelAdmin, CustomListDisplayFieldsMixin
):
    """Admin configuration for `AssetTranscriptionReservation` objects."""

    # Changelist columns.
    list_display = (
        "created_on",
        "updated_on",
        "asset",
        "reservation_token",
        "tombstoned",
    )
    # Columns that link to the change form.
    list_display_links = ("reservation_token", "created_on")

    # Shown on the change form but not editable.
    readonly_fields = ("asset", "created_on", "updated_on")


@admin.register(Asset)
class AssetAdmin(admin.ModelAdmin, CustomListDisplayFieldsMixin):
    """
    Admin configuration for `Asset` objects.

    Provides campaign and project filters, publishing, status-change and
    export actions, an optional post-action redirect and a change form that
    also lists the asset's transcriptions.
    """

    list_display = (
        "published",
        "transcription_status",
        "item_id",
        "year",
        "sequence",
        "difficulty",
        "truncated_storage_image",
        "media_type",
        "truncated_metadata",
    )
    list_display_links = ("item_id", "sequence")
    prepopulated_fields = {"slug": ("title",)}
    search_fields = [
        "title",
        "storage_image",
        "item__project__campaign__title",
        "item__project__title",
        "item__item_id",
    ]
    list_filter = (
        "transcription_status",
        "published",
        "item__project__topics",
        AssetCampaignStatusListFilter,
        AssetCampaignListFilter,
        AssetProjectListFilter,
        "media_type",
    )
    actions = (
        publish_action,
        change_status_to_completed,
        change_status_to_in_progress,
        change_status_to_needs_review,
        unpublish_action,
        export_to_csv_action,
        export_to_excel_action,
        verify_assets_action,
    )
    # Names of the actions that `change_view` offers in its status form.
    status_action_names = (
        "change_status_to_completed",
        "change_status_to_needs_review",
        "change_status_to_in_progress",
    )
    autocomplete_fields = ("item",)
    ordering = ("item__item_id", "sequence")
    change_list_template = "admin/concordia/asset/change_list.html"

    def get_queryset(
        self,
        request: HttpRequest,
    ):
        """
        Optimize the queryset used on the asset changelist.

        Selects related items so fields displayed in the changelist do not
        trigger per-row database queries, and orders by item id and
        sequence.
        """
        qs = super().get_queryset(request)
        return qs.select_related("item").order_by("item__item_id", "sequence")

    def lookup_allowed(self, key: str, value: str) -> bool:
        """
        Allow filtering by project and campaign id on the changelist.

        Args:
            key (str): Lookup parameter key.
            value (str): Lookup parameter value.

        Returns:
            bool: True if the lookup is allowed.
        """
        if key in ("item__project__id__exact", "item__project__campaign__id__exact"):
            return True
        return super().lookup_allowed(key, value)

    def response_action(
        self,
        request: HttpRequest,
        queryset: QuerySet[Asset],
    ) -> HttpResponse:
        """
        Run the selected action and optionally redirect to a `next` URL.

        After the base implementation runs the action, this override checks
        for a `next` parameter in `POST` and, if it is a safe URL, redirects
        to it instead of returning the base implementation's response.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[Asset]): Selected assets for the action.

        Returns:
            HttpResponse: Response from the base implementation or a
            redirect to the `next` URL.
        """
        # Let Django run the chosen action(s) normally
        response = super().response_action(request, queryset)

        # If a "next" came from our form, redirect there, after confirming
        # it is either a relative path that starts with "/" or an absolute
        # URL pointing to our hostname
        next_url = request.POST.get("next")
        if next_url and url_has_allowed_host_and_scheme(
            url=next_url,
            allowed_hosts={request.get_host()},
            require_https=request.is_secure(),
        ):
            return HttpResponseRedirect(next_url)

        # Otherwise, return whatever Django gave us
        return response

    def item_id(self, obj: Asset) -> str:
        """Return the `item_id` of the item this asset belongs to."""
        return obj.item.item_id

    @admin.display(description="Media URL")
    def truncated_storage_image(self, obj: Asset) -> str:
        """
        Return a link to the asset's storage image.

        The link opens in a new tab and is labelled with the storage image
        filename truncated to 100 characters.
        """
        return format_html(
            '<a target="_blank" href="{}">{}</a>',
            obj.storage_image.url,
            truncatechars(obj.get_existing_storage_image_filename(), 100),
        )

    def get_readonly_fields(
        self,
        request: HttpRequest,
        obj: Asset | None = None,
    ) -> tuple[str, ...]:
        """
        Mark some fields as read only after an asset has been created.

        The item and campaign cannot be changed on existing assets but
        remain editable when creating a new asset.

        Args:
            request (HttpRequest): Current admin request.
            obj (Asset | None): Asset being edited, or `None` when adding.

        Returns:
            tuple[str, ...]: Names of fields that should be read only.
        """
        if obj:
            return self.readonly_fields + ("item", "campaign")
        return self.readonly_fields

    def change_view(
        self,
        request: HttpRequest,
        object_id: str,
        extra_context: dict[str, Any] | None = None,
        **kwargs: Any,
    ) -> HttpResponse:
        """
        Render the asset change form with extra status and transcription data.

        This override injects a form offering the status-change actions and
        a list of the asset's transcriptions into the template context. If
        the asset cannot be found, neither is built and the base
        implementation is left to handle the missing object.

        Args:
            request (HttpRequest): Current admin request.
            object_id (str): Primary key of the asset being edited.
            extra_context (dict[str, Any] | None): Extra template context,
                if any.
            **kwargs (Any): Extra keyword arguments passed to the base
                implementation.

        Returns:
            HttpResponse: Response from the admin change view.
        """
        extra_context = extra_context or {}

        # `get_object` returns None for unknown or malformed ids; guard
        # against that so the base view can produce its usual response
        # instead of this method failing with an AttributeError.
        asset = self.get_object(request, object_id) if object_id else None

        if asset is not None:
            current_status = asset.transcription_status
            # Dealing with this one special case lets us simplify the
            # desired_actions filtering code here significantly
            if current_status == "submitted":
                current_status = "needs_review"
            # We need the name of the action (for example,
            # 'change_status_to_in_progress') and the description to show
            # in the form (for example, "Change status to In Progress").
            # We filter out any action matching the current status, since
            # that is unneeded and potentially confusing.
            desired_actions = [
                (name, data[2])
                for name, data in self.get_actions(request).items()
                if name in self.status_action_names and current_status not in name
            ]
            status_form = AssetStatusActionForm(available_actions=desired_actions)
            extra_context["status_action_form"] = status_form

            extra_context["transcriptions"] = (
                Transcription.objects.filter(asset__pk=object_id)
                .select_related("user", "reviewed_by")
                .order_by("-pk")
            )
        else:
            # Nothing to list, and filtering on a malformed id could raise.
            extra_context["transcriptions"] = Transcription.objects.none()

        return super().change_view(
            request, object_id, extra_context=extra_context, **kwargs
        )

    def has_reopen_permission(self, request: HttpRequest) -> bool:
        """
        Check whether the user has the custom `reopen` permission.

        Args:
            request (HttpRequest): Current admin request.

        Returns:
            bool: True if the user has permission to reopen assets.
        """
        opts = self.opts
        codename = get_permission_codename("reopen", opts)
        return request.user.has_perm(f"{opts.app_label}.{codename}")


@admin.register(Tag)
class TagAdmin(admin.ModelAdmin):
    """Admin configuration for `Tag` objects, including a CSV export."""

    list_display = ("id", "value")
    list_display_links = ("id", "value")
    list_filter = (TagCampaignStatusListFilter, TagCampaignListFilter)

    search_fields = ["value"]

    # Referenced by name; the action is the method defined below.
    actions = ("export_tags_as_csv",)

    def lookup_allowed(self, key: str, value: str) -> bool:
        """
        Decide whether a changelist lookup may be used for filtering.

        The campaign id lookup (reached through the tag collections) is
        always permitted; anything else is left to the default
        `ModelAdmin` rules.

        Args:
            key (str): Lookup parameter key.
            value (str): Lookup parameter value.

        Returns:
            bool: True if the lookup is allowed.
        """
        always_allowed = (
            "userassettagcollection__asset__item__project__campaign__id__exact",
        )
        if key not in always_allowed:
            return super().lookup_allowed(key, value)
        return True

    def export_tags_as_csv(
        self,
        request: HttpRequest,
        queryset: QuerySet[Tag],
    ) -> HttpResponse:
        """
        Admin action that exports tag usage details as `tags.csv`.

        The selected tags are ordered by the asset id of their tag
        collections, flattened with `flatten_queryset` and handed to
        `export_to_csv_response`.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[Tag]): Selected tags to export.

        Returns:
            HttpResponse: Response produced by `export_to_csv_response`.
        """
        # Exported field -> column heading, in output order.
        columns = {
            "value": "tag value",
            "userassettagcollection__created_on": "user asset tag collection date created",  # noqa: E501
            "userassettagcollection__user_id": "user asset tag collection user_id",
            "userassettagcollection__asset_id": "asset id",
            "userassettagcollection__asset__title": "asset title",
            "userassettagcollection__asset__download_url": "asset download url",
            "userassettagcollection__asset__resource_url": "asset resource url",
            "userassettagcollection__asset__item__project__campaign__slug": "campaign slug",  # noqa: E501
        }

        ordered_tags = queryset.prefetch_related(
            "userassettagcollection", "userassettagcollection__asset"
        ).order_by("userassettagcollection__asset_id")

        headers, data = flatten_queryset(
            ordered_tags,
            field_names=list(columns),
            extra_verbose_names=columns,
        )

        return export_to_csv_response("tags.csv", headers, data)


@admin.register(UserAssetTagCollection)
class UserAssetTagCollectionAdmin(admin.ModelAdmin):
    """Admin configuration for `UserAssetTagCollection` objects."""

    list_display = ("id", "asset", "user", "created_on", "updated_on")
    list_display_links = ("id", "asset")

    # Date drill-down navigation on the changelist.
    date_hierarchy = "created_on"

    # NOTE(review): "asset__project__title" assumes Asset has a direct
    # "project" relation, while other lookups in this file reach the project
    # through "item__project" - confirm this path resolves.
    search_fields = ["asset__title", "asset__campaign__title", "asset__project__title"]

    list_filter = (
        UserAssetTagCollectionCampaignStatusListFilter,
        UserAssetTagCollectionCampaignListFilter,
        "asset__item__project",
        "user__is_staff",
    )


@admin.register(Transcription)
class TranscriptionAdmin(admin.ModelAdmin):
    """
    Admin configuration for `Transcription` records.

    The changelist is read-mostly: the fields in `readonly_fields` cannot be
    edited, the queryset is annotated so the "Superseded?" column needs no
    per-row query, and two export actions (CSV and Excel) are offered.
    """

    list_display = (
        "id",
        "asset",
        "user",
        "campaign_slug",
        "truncated_text",
        "created_on",
        "accepted",
        "rejected",
        "reviewed_by",
        "superseded",
    )
    list_display_links = ("id", "asset")

    list_filter = (
        SubmittedFilter,
        AcceptedFilter,
        RejectedFilter,
        SupersededListFilter,
        OcrGeneratedFilter,
        OcrOriginatedFilter,
        TranscriptionCampaignStatusListFilter,
        TranscriptionCampaignListFilter,
        TranscriptionProjectListFilter,
    )

    search_fields = ["text", "user__username", "user__email"]

    readonly_fields = (
        "asset",
        "user",
        "created_on",
        "updated_on",
        "submitted",
        "accepted",
        "rejected",
        "reviewed_by",
        "supersedes",
        "text",
        "source",
    )

    # Columns written by both export actions, in output order.
    EXPORT_FIELDS = (
        "id",
        "asset__id",
        "asset__slug",
        "user",
        "created_on",
        "updated_on",
        "supersedes",
        "submitted",
        "accepted",
        "rejected",
        "reviewed_by",
        "text",
        "ocr_generated",
        "ocr_originated",
    )

    # Skip the unfiltered total count on the changelist.
    show_full_result_count = False

    def get_queryset(
        self,
        request: HttpRequest,
    ) -> QuerySet[Transcription]:
        """
        Build the changelist queryset with joins and a superseded flag.

        The related asset, user and reviewer are joined in, and each row is
        annotated with `is_superseded`, which is true when another
        transcription points at it through `supersedes`.

        Args:
            request (HttpRequest): Current admin request.

        Returns:
            QuerySet[Transcription]: Joined and annotated queryset.
        """
        # Correlated subquery: any transcription that supersedes this row.
        superseding = Transcription.objects.filter(supersedes=OuterRef("pk"))
        return (
            super()
            .get_queryset(request)
            .select_related("asset", "user", "reviewed_by")
            .annotate(is_superseded=Exists(superseding))
        )

    @admin.display(description="Text")
    def truncated_text(self, obj: Transcription) -> str:
        """
        Give the transcription text cut down to at most 100 characters.

        Args:
            obj (Transcription): Transcription instance.

        Returns:
            str: Result of `truncatechars` applied to the text.
        """
        max_chars = 100
        return truncatechars(obj.text, max_chars)

    @admin.display(boolean=True, description="Superseded?")
    def superseded(self, obj: Transcription) -> bool:
        """
        Report whether another transcription supersedes this one.

        Reads the `is_superseded` annotation set in `get_queryset`; when the
        attribute is absent the result is False.

        Args:
            obj (Transcription): Transcription instance.

        Returns:
            bool: Truthiness of the `is_superseded` annotation.
        """
        flag = getattr(obj, "is_superseded", False)
        return bool(flag)

    def lookup_allowed(self, key: str, value: str) -> bool:
        """
        Permit the campaign id lookup in addition to the default lookups.

        Args:
            key (str): Lookup parameter key.
            value (str): Lookup parameter value.

        Returns:
            bool: True for the campaign id lookup, otherwise whatever the
            parent implementation decides.
        """
        extra_lookups = ("asset__item__project__campaign__id__exact",)
        return key in extra_lookups or super().lookup_allowed(key, value)

    def export_to_csv(
        self,
        request: HttpRequest,
        queryset: QuerySet[Transcription],
    ) -> HttpResponse:
        """
        Admin action: export the selected transcriptions as CSV.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[Transcription]): Transcriptions to export.

        Returns:
            HttpResponse: Whatever `export_to_csv_action` returns for the
            `EXPORT_FIELDS` columns.
        """
        columns = self.EXPORT_FIELDS
        return export_to_csv_action(self, request, queryset, field_names=columns)

    def export_to_excel(
        self,
        request: HttpRequest,
        queryset: QuerySet[Transcription],
    ) -> HttpResponse:
        """
        Admin action: export the selected transcriptions as Excel.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[Transcription]): Transcriptions to export.

        Returns:
            HttpResponse: Whatever `export_to_excel_action` returns for the
            `EXPORT_FIELDS` columns.
        """
        columns = self.EXPORT_FIELDS
        return export_to_excel_action(self, request, queryset, field_names=columns)

    # Must follow the method definitions: the tuple holds the functions.
    actions = (export_to_csv, export_to_excel)


@admin.register(CarouselSlide)
class CarouselSlideAdmin(admin.ModelAdmin):
    """Admin configuration for `CarouselSlide`; declarative only."""

    # Changelist columns.
    list_display = ("headline", "published", "ordering")
    # Timestamps are shown on the change form but cannot be edited.
    readonly_fields = ("created_on", "updated_on")


@admin.register(SimplePage)
class SimplePageAdmin(admin.ModelAdmin):
    """
    Admin configuration for `SimplePage`; declarative only.

    The change form is split into an untitled metadata section and a "Body"
    section that carries the `markdown-preview` CSS class.
    """

    # Changelist columns.
    list_display = ("path", "title", "created_on", "updated_on")
    # Timestamps are shown on the change form but cannot be edited.
    readonly_fields = ("created_on", "updated_on")

    fieldsets = (
        (None, {"fields": ("created_on", "updated_on", "path", "title")}),
        # NOTE(review): the `markdown-preview` class is presumably picked up
        # by admin JS/CSS defined elsewhere — confirm.
        ("Body", {"classes": ("markdown-preview",), "fields": ("body",)}),
    )


@admin.register(SiteReport)
class SiteReportAdmin(admin.ModelAdmin):
    """
    Admin configuration for `SiteReport` records.

    Adds computed read-only fields (a report type label, links to the
    neighbouring reports in the same series and a JSON dump) and offers CSV
    and Excel export actions.
    """

    list_display = ("created_on", "report_type")
    readonly_fields = (
        "created_on",
        "report_type",
        "previous_in_series_link",
        "next_in_series_link",
        "report_json",
    )
    fieldsets = (
        ("Summary", {"fields": ("created_on", "report_type")}),
        (
            "Navigation within series",
            {"fields": ("previous_in_series_link", "next_in_series_link")},
        ),
        (
            "Data",
            {
                "fields": (
                    "report_name",
                    "campaign",
                    "topic",
                    "assets_total",
                    "assets_published",
                    "assets_not_started",
                    "assets_in_progress",
                    "assets_waiting_review",
                    "assets_completed",
                    "assets_unpublished",
                    "assets_started",
                    "items_published",
                    "items_unpublished",
                    "projects_published",
                    "projects_unpublished",
                    "anonymous_transcriptions",
                    "transcriptions_saved",
                    "daily_review_actions",
                    "distinct_tags",
                    "tag_uses",
                    "campaigns_published",
                    "campaigns_unpublished",
                    "users_registered",
                    "users_activated",
                    "registered_contributors",
                    "daily_active_users",
                )
            },
        ),
        ("Debug", {"fields": ("report_json",)}),
    )

    list_filter = (
        "report_name",
        SiteReportSortedCampaignListFilter,
        SiteReportCampaignListFilter,
        "topic",
    )

    @staticmethod
    def _series_change_link(report: "SiteReport | None") -> str:
        """
        Render a link to a report's admin change page.

        Args:
            report (SiteReport | None): Neighbouring report, or a falsy value
                when the series has no such neighbour.

        Returns:
            str: HTML anchor labelled with the creation time and id, or a
            dash when `report` is falsy.
        """
        if not report:
            return "—"
        meta = report._meta
        url = reverse(
            f"admin:{meta.app_label}_{meta.model_name}_change",
            args=[report.pk],
        )
        label = f"{report.created_on:%Y-%m-%d %H:%M:%S} (id {report.pk})"
        return format_html('<a href="{}">{}</a>', url, label)

    @admin.display(description="Report type")
    def report_type(self, obj: "SiteReport") -> str:
        """
        Label the report by the first identifying attribute that is set.

        Precedence is report name, then campaign, then topic; when none is
        set the label falls back to the report id.

        Args:
            obj (SiteReport): Site report instance.

        Returns:
            str: Human readable label for the report.
        """
        if obj.report_name:
            return f"Report name: {obj.report_name}"
        if obj.campaign:
            return f"Campaign: {obj.campaign}"
        if obj.topic:
            return f"Topic: {obj.topic}"
        return f"SiteReport: <{obj.id}>"

    @admin.display(description="SiteReport as JSON")
    def report_json(self, obj: "SiteReport") -> str:
        """
        Show the output of `to_debug_json()` inside a wrapping `<pre>` block.

        Args:
            obj (SiteReport): Site report instance.

        Returns:
            str: HTML snippet with the escaped debug JSON.
        """
        template = (
            "<pre style='white-space:pre-wrap;word-break:break-word;margin:0'>"
            "{}</pre>"
        )
        return format_html(template, obj.to_debug_json())

    @admin.display(description="Previous in series")
    def previous_in_series_link(self, obj: "SiteReport") -> str:
        """
        Link to the report returned by `previous_in_series()`, if any.

        Args:
            obj (SiteReport): Site report instance.

        Returns:
            str: HTML anchor for the previous report, or a dash when there
            is none.
        """
        return self._series_change_link(obj.previous_in_series())

    @admin.display(description="Next in series")
    def next_in_series_link(self, obj: "SiteReport") -> str:
        """
        Link to the report returned by `next_in_series()`, if any.

        Args:
            obj (SiteReport): Site report instance.

        Returns:
            str: HTML anchor for the next report, or a dash when there is
            none.
        """
        return self._series_change_link(obj.next_in_series())

    def export_to_csv(
        self,
        request: HttpRequest,
        queryset: QuerySet[SiteReport],
    ) -> HttpResponse:
        """
        Admin action: export the selected site reports as CSV.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[SiteReport]): Site reports to export.

        Returns:
            HttpResponse: Whatever `export_to_csv_action` returns for the
            model's default export field names.
        """
        columns = SiteReport.DEFAULT_EXPORT_FIELDNAMES
        return export_to_csv_action(self, request, queryset, field_names=columns)

    def export_to_excel(
        self,
        request: HttpRequest,
        queryset: QuerySet[SiteReport],
    ) -> HttpResponse:
        """
        Admin action: export the selected site reports as Excel.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[SiteReport]): Site reports to export.

        Returns:
            HttpResponse: Whatever `export_to_excel_action` returns for the
            model's default export field names.
        """
        columns = SiteReport.DEFAULT_EXPORT_FIELDNAMES
        return export_to_excel_action(self, request, queryset, field_names=columns)

    # Must follow the method definitions: the tuple holds the functions.
    actions = (export_to_csv, export_to_excel)


@admin.register(UserProfileActivity)
class UserProfileActivityAdmin(admin.ModelAdmin):
    """
    Admin configuration for `UserProfileActivity` records.

    Declarative only: configures the changelist columns, campaign filters,
    raw-id widgets, read-only fields and username search.
    """

    list_display = (
        "id",
        "user",
        "campaign",
        "get_status",
        "transcribe_count",
        "review_count",
    )
    list_filter = (
        UserProfileActivityCampaignStatusListFilter,
        UserProfileActivityCampaignListFilter,
    )
    raw_id_fields = ["user", "campaign"]
    # The ModelAdmin option is `readonly_fields`. The previous spelling,
    # `read_only_fields`, is not recognised by Django and was silently
    # ignored, leaving every one of these fields editable.
    readonly_fields = (
        "user",
        "campaign",
        "asset_count",
        "asset_tag_count",
        "transcribe_count",
        "review_count",
    )
    search_fields = [
        "user__username",
    ]


@admin.register(CampaignRetirementProgress)
class CampaignRetirementProgressAdmin(admin.ModelAdmin):
    """
    Admin configuration for `CampaignRetirementProgress` records.

    Every displayed field is read-only. A computed `completion` field shows
    how much of the campaign's content has been removed so far, and the
    removal log sits in a collapsed section.
    """

    list_display = ("campaign", "started_on", "complete", "completed_on")
    readonly_fields = (
        "campaign",
        "completion",
        "projects_removed",
        "project_total",
        "items_removed",
        "item_total",
        "assets_removed",
        "asset_total",
        "complete",
        "started_on",
        "completed_on",
        "removal_log",
    )
    fieldsets = (
        (
            None,
            {
                "fields": (
                    "campaign",
                    "completion",
                    "projects_removed",
                    "project_total",
                    "items_removed",
                    "item_total",
                    "assets_removed",
                    "asset_total",
                    "complete",
                    "started_on",
                    "completed_on",
                ),
            },
        ),
        (
            "Log",
            {
                "fields": ("removal_log",),
                "classes": ("collapse",),
            },
        ),
    )

    @admin.display(description="Completion percentage")
    def completion(self, obj: CampaignRetirementProgress) -> str:
        """
        Compute a human readable completion percentage for display.

        The percentage is the number of removed projects, items and assets
        divided by their combined totals, rounded to two decimals.

        Args:
            obj (CampaignRetirementProgress): Progress instance.

        Returns:
            str: Percentage text such as `"100%"`. Returns `"0%"` when the
            record is not complete and all totals are zero.
        """
        if obj.complete:
            return "100%"
        total = obj.project_total + obj.item_total + obj.asset_total
        if not total:
            # Nothing is recorded as needing removal; avoid dividing by zero,
            # which would otherwise turn the change page into a server error.
            return "0%"
        removed = obj.projects_removed + obj.items_removed + obj.assets_removed
        return "{}%".format(round(removed / total * 100, 2))


@admin.register(Card)
class CardAdmin(admin.ModelAdmin):
    """Admin configuration for `Card`; declarative only."""

    # Custom form class used for add and change views.
    form = CardAdminForm
    # Fields shown on the form, in display order.
    fields = ("title", "display_heading", "body_text", "image", "image_alt_text")
    list_display = ["title", "display_heading", "created_on", "updated_on"]
    # Custom campaign filter plus a plain filter on the update timestamp.
    list_filter = (CardCampaignListFilter, "updated_on")


class TutorialInline(admin.TabularInline):
    """Tabular inline for `TutorialCard` rows, used by `CardFamilyAdmin`."""

    model = TutorialCard
    # One blank extra row is offered for adding a new entry.
    extra = 1
    # The card relation uses a raw id input rather than a select box.
    raw_id_fields = ("card",)


@admin.register(CardFamily)
class CardFamilyAdmin(admin.ModelAdmin):
    """Admin configuration for `CardFamily`, editing its cards inline."""

    inlines = (TutorialInline,)

    class Media:
        # Extra JavaScript loaded on this admin's pages.
        # NOTE(review): the literal `HASH` in the filename looks like a
        # build-time placeholder — confirm it is substituted before serving.
        js = ("dist/js/admin_custom-HASH.js",)


@admin.register(Guide)
class GuideAdmin(admin.ModelAdmin):
    """Admin configuration for `Guide`; only swaps in a custom form."""

    form = GuideAdminForm


@admin.register(NextTranscribableCampaignAsset)
class NextTranscribableCampaignAssetAdmin(admin.ModelAdmin):
    """
    Admin configuration for `NextTranscribableCampaignAsset` records.

    Declarative only. Every field listed in `readonly_fields` is shown
    read-only, and the changelist is ordered newest first.
    """

    list_display = (
        "asset",
        "transcription_status",
        "campaign",
        "created_on",
    )
    list_filter = (
        NextAssetCampaignListFilter,
        "transcription_status",
    )
    # Search matches titles of the related asset, item, project and campaign.
    search_fields = (
        "asset__title",
        "item__title",
        "project__title",
        "campaign__title",
    )
    readonly_fields = (
        "asset",
        "sequence",
        "item",
        "item_item_id",
        "project",
        "project_slug",
        "campaign",
        "created_on",
    )
    # Newest rows first.
    ordering = ("-created_on",)


@admin.register(NextReviewableCampaignAsset)
class NextReviewableCampaignAssetAdmin(admin.ModelAdmin):
    """
    Admin configuration for `NextReviewableCampaignAsset` records.

    Declarative only. Every field listed in `readonly_fields` is shown
    read-only, and the changelist is ordered newest first.
    """

    list_display = (
        "asset",
        "campaign",
        "created_on",
    )
    list_filter = (NextAssetCampaignListFilter,)
    # Search matches related titles and the `transcriber_ids` field.
    search_fields = (
        "asset__title",
        "item__title",
        "project__title",
        "campaign__title",
        "transcriber_ids",
    )
    readonly_fields = (
        "asset",
        "item",
        "project",
        "campaign",
        "transcriber_ids",
        "created_on",
    )
    # Newest rows first.
    ordering = ("-created_on",)


@admin.register(NextTranscribableTopicAsset)
class NextTranscribableTopicAssetAdmin(admin.ModelAdmin):
    """
    Admin configuration for `NextTranscribableTopicAsset` records.

    Declarative only. Every field listed in `readonly_fields` is shown
    read-only, and the changelist is ordered newest first.
    """

    list_display = (
        "asset",
        "transcription_status",
        "topic",
        "created_on",
    )
    list_filter = (
        TopicListFilter,
        "transcription_status",
    )
    # Search matches titles of the related asset, item, project and topic.
    search_fields = (
        "asset__title",
        "item__title",
        "project__title",
        "topic__title",
    )
    readonly_fields = (
        "asset",
        "sequence",
        "item",
        "item_item_id",
        "project",
        "project_slug",
        "topic",
        "created_on",
    )
    # Newest rows first.
    ordering = ("-created_on",)


@admin.register(NextReviewableTopicAsset)
class NextReviewableTopicAssetAdmin(admin.ModelAdmin):
    """
    Admin configuration for `NextReviewableTopicAsset` records.

    Declarative only. Every field listed in `readonly_fields` is shown
    read-only, and the changelist is ordered newest first.
    """

    list_display = (
        "asset",
        "topic",
        "created_on",
    )
    list_filter = (TopicListFilter,)
    # Search matches related titles and the `transcriber_ids` field.
    search_fields = (
        "asset__title",
        "item__title",
        "project__title",
        "topic__title",
        "transcriber_ids",
    )
    readonly_fields = (
        "asset",
        "item",
        "project",
        "topic",
        "transcriber_ids",
        "created_on",
    )
    # Newest rows first.
    ordering = ("-created_on",)


@admin.register(KeyMetricsReport)
class KeyMetricsReportAdmin(admin.ModelAdmin):
    """
    Admin configuration for `KeyMetricsReport` records.

    Period metadata is read-only; the manual and calculated metric fields are
    editable. A custom admin URL serves one report as CSV, and a bulk action
    bundles the CSVs of the selected reports into a ZIP archive.
    """

    form = KeyMetricsReportAdminForm

    readonly_fields = (
        "created_on",
        "updated_on",
        "period_type",
        "period_start",
        "period_end",
        "fiscal_year",
        "fiscal_quarter",
        "month",
        "download_csv_link",
    )

    list_display = (
        "period_type",
        "fiscal_year",
        "fiscal_quarter",
        "month",
        "period_start",
        "period_end",
        "updated_on",
    )
    list_filter = (
        "period_type",
        "fiscal_year",
        "fiscal_quarter",
        "month",
    )
    search_fields = ("period_type",)
    ordering = ("-period_start", "-period_end", "period_type")

    fieldsets = (
        (
            "Report details",
            {
                "description": (
                    "These fields describe which period this report covers and "
                    "when it was last updated. They cannot be edited here."
                ),
                "fields": (
                    "period_type",
                    "period_start",
                    "period_end",
                    "fiscal_year",
                    "fiscal_quarter",
                    "month",
                    "created_on",
                    "updated_on",
                    "download_csv_link",
                ),
            },
        ),
        (
            "Manual Fields (editable)",
            {
                "description": (
                    "You can type values here if you track them outside of "
                    "Concordia. Blank values are not included in quarterly or "
                    "fiscal-year totals. If you later add values for the "
                    "underlying months, those totals may update the quarterly "
                    "and fiscal-year reports when reports are rebuilt."
                ),
                "fields": (
                    "crowd_emails_and_libanswers_sent",
                    "crowd_visits",
                    "crowd_page_views",
                    "crowd_unique_visitors",
                    "avg_visit_seconds",
                    "transcriptions_added_to_loc_gov",
                    "datasets_added_to_loc_gov",
                ),
            },
        ),
        (
            "Calculated metrics (editable, may be overwritten)",
            {
                "description": (
                    "These numbers are usually calculated from Site Reports. "
                    "You can edit them here if needed, but they may be "
                    "overwritten when reports are rebuilt. Monthly reports can "
                    "be recomputed when new daily Site Reports arrive. "
                    "Quarterly reports can be recomputed when any monthly "
                    "report in the quarter is updated. Fiscal-year reports can "
                    "be recomputed when any quarterly report in the year is "
                    "updated."
                ),
                "fields": (
                    "assets_published",
                    "assets_started",
                    "assets_completed",
                    "users_activated",
                    "anonymous_transcriptions",
                    "transcriptions_saved",
                    "tag_uses",
                ),
            },
        ),
    )

    @admin.display(description="Download CSV")
    def download_csv_link(self, obj: "KeyMetricsReport") -> str:
        """
        Provide a link to download this report as a CSV file.

        Args:
            obj (KeyMetricsReport): Report instance.

        Returns:
            str: HTML anchor tag pointing at the `download_csv` admin URL
            registered in `get_urls`.
        """
        url = reverse(
            f"admin:{obj._meta.app_label}_{obj._meta.model_name}_download_csv",
            args=[obj.pk],
        )
        return format_html('<a class="button" href="{}">Download CSV</a>', url)

    def get_urls(self):
        """
        Register a custom admin view to serve CSV files for reports.

        The custom pattern is placed ahead of the default admin URLs so it is
        matched first.

        Returns:
            list: Custom URL patterns combined with the default admin URLs.
        """
        urls = super().get_urls()
        opts = self.model._meta
        custom_urls = [
            path(
                "<path:object_id>/download_csv/",
                self.admin_site.admin_view(self.download_csv_view),
                name=f"{opts.app_label}_{opts.model_name}_download_csv",
            ),
        ]
        return custom_urls + urls

    def download_csv_view(
        self,
        request: HttpRequest,
        object_id: str,
    ) -> HttpResponse:
        """
        Serve the CSV for a single KeyMetricsReport instance.

        The view checks for view or change permission on the model itself,
        instead of relying only on the `admin_view` wrapper applied in
        `get_urls`.

        Args:
            request (HttpRequest): Current admin request.
            object_id (str): Primary key of the report to download.

        Returns:
            HttpResponse: CSV download response.

        Raises:
            PermissionDenied: If the user lacks view and change permission.
            Http404: If the report cannot be found.
        """
        # Imported locally so this block does not depend on a module-level
        # import that may not be present.
        from django.core.exceptions import PermissionDenied

        obj = self.get_object(request, object_id)
        # Permission is checked before the existence check.
        if not self.has_view_or_change_permission(request, obj):
            raise PermissionDenied
        if obj is None:
            raise Http404("Report not found.")
        csv_bytes = obj.render_csv()
        response = HttpResponse(csv_bytes, content_type="text/csv")
        response["Content-Disposition"] = f'attachment; filename="{obj.csv_filename()}"'
        return response

    @admin.action(description="Download CSVs of selected reports as a ZIP")
    def download_selected_as_zip(
        self,
        request: HttpRequest,
        queryset: QuerySet[KeyMetricsReport],
    ) -> HttpResponse:
        """
        Return a ZIP file containing one CSV per selected report.

        The archive is assembled fully in memory, with reports written in
        `period_start`, `period_type` order.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet[KeyMetricsReport]): Reports to export.

        Returns:
            HttpResponse: ZIP download response.
        """
        memory_file = io.BytesIO()
        with zipfile.ZipFile(
            memory_file, mode="w", compression=zipfile.ZIP_DEFLATED
        ) as zf:
            for report in queryset.order_by("period_start", "period_type"):
                zf.writestr(report.csv_filename(), report.render_csv())
        memory_file.seek(0)

        response = HttpResponse(memory_file.getvalue(), content_type="application/zip")
        response["Content-Disposition"] = (
            'attachment; filename="key_metrics_reports.zip"'
        )
        return response

    actions = ("download_selected_as_zip",)


================================================
FILE: concordia/admin/actions.py
================================================
import uuid
from logging import getLogger

from django.contrib import admin, messages
from django.db.models import QuerySet
from django.http import HttpRequest
from django.utils.timezone import now

from importer.utils import create_verify_asset_image_job_batch

from ..models import (
    Asset,
    Campaign,
    Item,
    Project,
    Transcription,
    TranscriptionStatus,
)
from .utils import _bulk_change_status

logger = getLogger(__name__)


@admin.action(
    permissions=["change"],
    description="Anonymize and disable user accounts",
)
def anonymize_action(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet,
) -> None:
    """
    Scrub and deactivate every selected user account.

    Each account gets a random placeholder username, empty name and email
    fields and an unusable password, and loses its staff, superuser and
    active flags. An info message reports how many accounts were selected.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet): Selected user accounts to anonymize.

    Returns:
        None
    """
    # Counted up front, before any account is modified.
    selected_total = queryset.count()

    # Attribute values applied identically to every account.
    scrubbed_values = {
        "first_name": "",
        "last_name": "",
        "email": "",
        "is_staff": False,
        "is_superuser": False,
        "is_active": False,
    }

    for account in queryset:
        account.username = f"Anonymized {uuid.uuid4()}"
        for attr_name, attr_value in scrubbed_values.items():
            setattr(account, attr_name, attr_value)
        account.set_unusable_password()
        account.save()

    summary = f"Anonymized and disabled {selected_total} user accounts"
    messages.info(request, summary, fail_silently=True)


@admin.action(permissions=["change"], description="Publish selected items and assets")
def publish_item_action(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[Item],
) -> None:
    """
    Publish the selected items together with their assets.

    Two bulk updates run: one flips unpublished selected items to published,
    the other does the same for unpublished assets of any selected item. An
    info message reports both row counts.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet[Item]): Selected items to publish.

    Returns:
        None
    """
    unpublished_items = queryset.filter(published=False)
    item_total = unpublished_items.update(published=True)

    unpublished_assets = Asset.objects.filter(item__in=queryset, published=False)
    asset_total = unpublished_assets.update(published=True)

    summary = f"Published {item_total} items and {asset_total} assets"
    messages.info(request, summary, fail_silently=True)


@admin.action(
    permissions=["change"],
    description="Unpublish selected items and assets",
)
def unpublish_item_action(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[Item],
) -> None:
    """
    Unpublish the selected items together with their assets.

    Two bulk updates run: one flips published selected items to unpublished,
    the other does the same for published assets of any selected item. An
    info message reports both row counts.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet[Item]): Selected items to unpublish.

    Returns:
        None
    """
    published_items = queryset.filter(published=True)
    item_total = published_items.update(published=False)

    published_assets = Asset.objects.filter(item__in=queryset, published=True)
    asset_total = published_assets.update(published=False)

    summary = f"Unpublished {item_total} items and {asset_total} assets"
    messages.info(request, summary, fail_silently=True)


@admin.action(permissions=["change"], description="Publish selected")
def publish_action(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet,
) -> None:
    """
    Flip every unpublished selected object to published.

    Works on any model whose queryset can be filtered and updated on a
    boolean `published` field. An info message reports how many rows the
    bulk update touched.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet): Selected objects to publish.

    Returns:
        None
    """
    not_yet_published = queryset.filter(published=False)
    updated_total = not_yet_published.update(published=True)
    summary = f"Published {updated_total} objects"
    messages.info(request, summary, fail_silently=True)


@admin.action(permissions=["change"], description="Unpublish selected")
def unpublish_action(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet,
) -> None:
    """
    Flip every published selected object to unpublished.

    Works on any model whose queryset can be filtered and updated on a
    boolean `published` field. An info message reports how many rows the
    bulk update touched.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet): Selected objects to unpublish.

    Returns:
        None
    """
    currently_published = queryset.filter(published=True)
    updated_total = currently_published.update(published=False)
    summary = f"Unpublished {updated_total} objects"
    messages.info(request, summary, fail_silently=True)


@admin.action(permissions=["reopen"], description="Change status to Completed")
def change_status_to_completed(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[Asset],
) -> None:
    """
    Accept a transcription on every selected asset that is not yet completed.

    Assets already at `TranscriptionStatus.COMPLETED` are skipped. For the
    rest, the transcription with the highest primary key is used, or a new
    one owned by the current user is built when the asset has none. That
    transcription is stamped as accepted now, its rejection is cleared, the
    current user is recorded as reviewer, and it is validated and saved.

    The info message names the asset when exactly one qualified, otherwise
    it reports the count.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet[Asset]): Selected assets to mark as completed.

    Returns:
        None
    """
    pending = queryset.exclude(transcription_status=TranscriptionStatus.COMPLETED)
    pending_total = pending.count()
    # Fetched before the loop so a single changed asset can be named later.
    single_asset = pending.first() if pending_total == 1 else False

    for asset in pending:
        transcription = asset.transcription_set.order_by("-pk").first()
        if transcription is None:
            transcription = Transcription(asset=asset, user=request.user)

        transcription.accepted = now()
        transcription.rejected = None
        transcription.reviewed_by = request.user
        transcription.clean_fields()
        transcription.validate_unique()
        transcription.save()

    if single_asset:
        summary = f"Changed status of {single_asset.title} to Complete"
    else:
        summary = f"Changed status of {pending_total} assets to Complete"
    messages.info(request, summary, fail_silently=True)


@admin.action(permissions=["reopen"], description="Change status to Needs Review")
def change_status_to_needs_review(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[Asset],
) -> None:
    """
    Move selected assets to the Needs Review workflow status.

    Filters out assets that are already submitted, then passes one row per
    remaining asset (its slug and the target status) to
    `_bulk_change_status` together with the current user. Records a message
    describing which assets were changed.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet[Asset]): Selected assets to move to Needs Review.

    Returns:
        None
    """
    # Materialise the eligible assets now: the message below needs the asset
    # that was actually processed, and re-querying afterwards would no longer
    # match it once its status has changed.
    eligible = list(
        queryset.exclude(transcription_status=TranscriptionStatus.SUBMITTED)
    )
    rows = [
        {"slug": asset.slug, "status": TranscriptionStatus.SUBMITTED}
        for asset in eligible
    ]
    # NOTE(review): the return value is treated as the number of assets
    # changed — confirm against `_bulk_change_status`.
    count = _bulk_change_status(request.user, rows)

    if count == 1 and len(eligible) == 1:
        # Name the eligible asset, not `queryset.first()`: the first selected
        # asset may have been skipped because it was already submitted.
        message = f"Changed status of {eligible[0].title} to Needs Review"
    else:
        message = f"Changed status of {count} assets to Needs Review"
    messages.info(request, message, fail_silently=True)


@admin.action(permissions=["reopen"], description="Change status to In Progress")
def change_status_to_in_progress(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[Asset],
) -> None:
    """
    Move selected assets to the In Progress workflow status.

    Filters out assets that are already in progress, then passes one row per
    remaining asset (its slug and the target status) to
    `_bulk_change_status` together with the current user. Records a message
    describing which assets were changed.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet[Asset]): Selected assets to move to In Progress.

    Returns:
        None
    """
    # Materialise the eligible assets now: the message below needs the asset
    # that was actually processed, and re-querying afterwards would no longer
    # match it once its status has changed.
    eligible = list(
        queryset.exclude(transcription_status=TranscriptionStatus.IN_PROGRESS)
    )
    rows = [
        {"slug": asset.slug, "status": TranscriptionStatus.IN_PROGRESS}
        for asset in eligible
    ]
    # NOTE(review): the return value is treated as the number of assets
    # changed — confirm against `_bulk_change_status`.
    count = _bulk_change_status(request.user, rows)

    if count == 1 and len(eligible) == 1:
        # Name the eligible asset, not `queryset.first()`: the first selected
        # asset may have been skipped because it was already in progress.
        message = f"Changed status of {eligible[0].title} to In Progress"
    else:
        message = f"Changed status of {count} assets to In Progress"
    messages.info(request, message, fail_silently=True)


@admin.action(
    permissions=["change"],
    description="Verify images for all assets for selected objects",
)
def verify_assets_action(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet,
) -> None:
    """
    Queue image verification jobs for the assets behind the selected rows.

    The admin's model decides how asset primary keys are gathered: directly
    from the selection for `Asset`, or through the matching relation for
    `Campaign`, `Project` and `Item`. The keys are handed to
    `create_verify_asset_image_job_batch` together with a freshly generated
    batch identifier, and a message linking to the created jobs is shown.
    Any other model gets an error message and no jobs are created.

    Args:
        modeladmin (admin.ModelAdmin): Admin class that owns this action.
        request (HttpRequest): Current request.
        queryset (QuerySet): Selected objects used to look up assets.

    Returns:
        None
    """
    batch = str(uuid.uuid4())
    model = modeladmin.model

    # Relation path from Asset back to each supported parent model
    parent_lookups = (
        (Campaign, "campaign__in"),
        (Project, "item__project__in"),
        (Item, "item__in"),
    )

    if model == Asset:
        asset_pks = queryset.values_list("id", flat=True)
    else:
        lookup = next(
            (path for parent, path in parent_lookups if model == parent),
            None,
        )
        if lookup is None:
            modeladmin.message_user(
                request, "This action is not available for this model.", level="error"
            )
            return
        asset_pks = Asset.objects.filter(**{lookup: queryset}).values_list(
            "id", flat=True
        )

    job_count, url = create_verify_asset_image_job_batch(asset_pks, batch)

    summary = (
        f"Created {job_count} VerifyAssetImageJobs as part of batch {batch}. "
        f'<a href="{url}" target="_blank">View the created jobs</a>'
    )
    modeladmin.message_user(request, summary, extra_tags="marked-safe")


================================================
FILE: concordia/admin/filters.py
================================================
from django.contrib import admin
from django.db.models import Exists, OuterRef
from django.utils.translation import gettext_lazy as _

from ..models import Campaign, Project, Topic, Transcription


class NullableTimestampFilter(admin.SimpleListFilter):
    """
    Base admin list filter that splits rows on whether a field is null.

    Offers two choices, "null" and "not-null", and applies an `__isnull`
    lookup on the field named by `parameter_name`. Subclasses supply the
    title, the field name and the two display labels.
    """

    # Heading shown for this filter in the changelist
    title = ""
    # Model field to test; also the query-string parameter name
    parameter_name = ""
    # Display labels for the "null" and "not-null" choices, in that order
    lookup_labels = ("NULL", "NOT NULL")

    def lookups(self, request, model_admin):
        choice_values = ("null", "not-null")
        return zip(choice_values, self.lookup_labels, strict=False)

    def queryset(self, request, queryset):
        selected = self.value()
        if selected not in ("null", "not-null"):
            return queryset

        isnull_lookup = {"%s__isnull" % self.parameter_name: True}
        if selected == "null":
            return queryset.filter(**isnull_lookup)
        return queryset.exclude(**isnull_lookup)


class SubmittedFilter(NullableTimestampFilter):
    """
    Split rows on whether `submitted` is null ("Pending") or set ("Submitted").
    """

    parameter_name = "submitted"
    title = "Submitted"
    lookup_labels = ("Pending", "Submitted")


class AcceptedFilter(NullableTimestampFilter):
    """
    Split rows on whether `accepted` is null ("Pending") or set ("Accepted").
    """

    parameter_name = "accepted"
    title = "Accepted"
    lookup_labels = ("Pending", "Accepted")


class RejectedFilter(NullableTimestampFilter):
    """
    Split rows on whether `rejected` is null ("Pending") or set ("Rejected").
    """

    parameter_name = "rejected"
    title = "Rejected"
    lookup_labels = ("Pending", "Rejected")


class CampaignListFilter(admin.SimpleListFilter):
    """
    Base class for campaign filters used in admin changelists.

    Filters by a campaign identifier stored in `parameter_name` and
    optionally narrows the offered campaigns by status when the query
    parameter named by `status_filter_parameter` is present. Retired
    campaigns are never offered as choices.

    Subclasses set `parameter_name` and, when status narrowing is wanted,
    `status_filter_parameter`.
    """

    title = "Campaign"
    template = "admin/long_name_filter.html"
    # Name of the query parameter carrying a campaign status. Declared here
    # so subclasses that omit it do not raise AttributeError in `lookups`;
    # None disables status narrowing.
    status_filter_parameter = None

    def lookups(self, request, model_admin):
        queryset = Campaign.objects.exclude(status=Campaign.Status.RETIRED)
        status_parameter = self.status_filter_parameter
        if status_parameter and status_parameter in request.GET:
            queryset = queryset.filter(status=request.GET[status_parameter])
        return queryset.values_list("id", "title").order_by("title")

    def queryset(self, request, queryset):
        if self.value():
            return queryset.filter(**{self.parameter_name: self.value()})
        return queryset


class CardCampaignListFilter(admin.SimpleListFilter):
    """
    Filter cards by the campaign that owns their card family.

    Shows only campaigns with a non-null `card_family` and restricts
    cards to those within the selected campaign's family. A campaign value
    that does not resolve to an existing campaign yields an empty result.
    """

    title = _("campaign")
    parameter_name = "campaign"

    def lookups(self, request, model_admin):
        return Campaign.objects.exclude(card_family__isnull=True).values_list(
            "pk", "title"
        )

    def queryset(self, request, queryset):
        campaign_id = self.value()
        if not campaign_id:
            return queryset

        try:
            card_family = Campaign.objects.get(pk=campaign_id).card_family
        except (Campaign.DoesNotExist, ValueError):
            # The value comes from the query string, so it may name a deleted
            # campaign or not be a valid key at all. Show no cards instead of
            # letting the exception propagate out of the changelist.
            return queryset.none()

        if card_family is None:
            pks = []
        else:
            pks = card_family.cards.values_list("pk", flat=True)
        return queryset.filter(id__in=pks)


class TopicListFilter(admin.SimpleListFilter):
    """
    Admin list filter that narrows a changelist to a single topic.

    Choices are every topic, ordered by title; the selected value is applied
    as a lookup on `parameter_name`.
    """

    parameter_name = "topic__id__exact"
    title = "Topic"
    template = "admin/long_name_filter.html"

    def lookups(self, request, model_admin):
        return Topic.objects.all().values_list("id", "title").order_by("title")

    def queryset(self, request, queryset):
        topic_id = self.value()
        if not topic_id:
            return queryset
        return queryset.filter(**{self.parameter_name: topic_id})


class ProjectCampaignListFilter(CampaignListFilter):
    """
    Campaign filter keyed on `campaign__id__exact`, with choices narrowed by
    the `campaign__status` query parameter.
    """

    status_filter_parameter = "campaign__status"
    parameter_name = "campaign__id__exact"


class ItemCampaignListFilter(CampaignListFilter):
    """
    Campaign filter keyed on `project__campaign__id__exact`, with choices
    narrowed by the `project__campaign__status` query parameter.
    """

    status_filter_parameter = "project__campaign__status"
    parameter_name = "project__campaign__id__exact"


class AssetCampaignListFilter(CampaignListFilter):
    """
    Campaign filter keyed on `item__project__campaign__id__exact`, with
    choices narrowed by the `item__project__campaign__status` query parameter.
    """

    status_filter_parameter = "item__project__campaign__status"
    parameter_name = "item__project__campaign__id__exact"


class UserProfileActivityCampaignListFilter(CampaignListFilter):
    """
    Campaign filter keyed on `campaign__id__exact`, with choices narrowed by
    the `campaign__status` query parameter.
    """

    status_filter_parameter = "campaign__status"
    parameter_name = "campaign__id__exact"


class SiteReportCampaignListBaseFilter(CampaignListFilter):
    """
    Base filter for site report campaigns that supports empty-campaign rows.

    Extends `CampaignListFilter` to optionally include an explicit "no
    campaign" choice controlled by `include_empty_choice` and the
    `lookup_kwarg_isnull` query parameter.
    """

    # Query parameter used by the "no campaign" choice
    lookup_kwarg_isnull = "campaign__isnull"
    # When true, an extra choice for rows without a campaign is offered
    include_empty_choice = True

    def __init__(self, request, params, model, model_admin):
        # Both attributes are set before the parent initializer runs, as in
        # the original ordering.
        self.empty_value_display = model_admin.get_empty_value_display()
        self.lookup_val_isnull = params.get(self.lookup_kwarg_isnull)
        super().__init__(request, params, model, model_admin)

    def has_output(self):
        # The empty choice counts as one extra option
        extra = 1 if self.include_empty_choice else 0
        return len(self.lookup_choices) + extra > 1

    def expected_parameters(self):
        return [self.parameter_name, self.lookup_kwarg_isnull]

    def choices(self, changelist):
        # "All": neither a campaign nor the isnull flag is active
        yield {
            "selected": self.value() is None and not self.lookup_val_isnull,
            "query_string": changelist.get_query_string(
                remove=[self.parameter_name, self.lookup_kwarg_isnull]
            ),
            "display": "All",
        }
        for lookup, title in self.lookup_choices:
            yield {
                "selected": self.value() == str(lookup),
                # `remove` must be a list of parameter prefixes. A bare
                # string is iterated character by character, which strips
                # every query parameter starting with any of those
                # characters.
                "query_string": changelist.get_query_string(
                    {self.parameter_name: lookup}, [self.lookup_kwarg_isnull]
                ),
                "display": title,
            }
        if self.include_empty_choice:
            # "No campaign": set the isnull flag and drop any campaign id
            yield {
                "selected": bool(self.lookup_val_isnull),
                "query_string": changelist.get_query_string(
                    {self.lookup_kwarg_isnull: "True"}, [self.parameter_name]
                ),
                "display": self.empty_value_display,
            }


class SiteReportSortedCampaignListFilter(SiteReportCampaignListBaseFilter):
    """
    Site report campaign filter titled "Sorted Campaign" that keeps the
    inherited `lookups`, keyed on `campaign__id__exact`.
    """

    status_filter_parameter = "campaign__status"
    parameter_name = "campaign__id__exact"
    title = "Sorted Campaign"


class SiteReportCampaignListFilter(SiteReportCampaignListBaseFilter):
    """
    Site report campaign filter whose choices are every campaign, with no
    status narrowing and no explicit ordering applied in `lookups`.
    """

    status_filter_parameter = "campaign__status"
    parameter_name = "campaign__id__exact"

    def lookups(self, request, model_admin):
        all_campaigns = Campaign.objects
        return all_campaigns.values_list("id", "title")


class HelpfulLinkCampaignListFilter(CampaignListFilter):
    """
    Campaign filter titled "Campaign Sorted", keyed on `campaign__id__exact`
    with choices narrowed by the `campaign__status` query parameter.
    """

    status_filter_parameter = "campaign__status"
    parameter_name = "campaign__id__exact"
    title = "Campaign Sorted"


class TagCampaignListFilter(CampaignListFilter):
    """
    Campaign filter that reaches the campaign through
    `userassettagcollection__asset__item__project__campaign`.
    """

    status_filter_parameter = (
        "userassettagcollection__asset__item__project__campaign__status"
    )
    parameter_name = "userassettagcollection__asset__item__project__campaign__id__exact"


class TranscriptionCampaignListFilter(CampaignListFilter):
    """
    Campaign filter that reaches the campaign through
    `asset__item__project__campaign`.
    """

    status_filter_parameter = "asset__item__project__campaign__status"
    parameter_name = "asset__item__project__campaign__id__exact"


class UserAssetTagCollectionCampaignListFilter(CampaignListFilter):
    """
    Campaign filter that reaches the campaign through
    `asset__item__project__campaign`.
    """

    status_filter_parameter = "asset__item__project__campaign__status"
    parameter_name = "asset__item__project__campaign__id__exact"


class NextAssetCampaignListFilter(CampaignListFilter):
    """
    Campaign filter whose choices are limited to campaigns referenced by at
    least one row of the admin's own model (via its `campaign_id` column).
    """

    parameter_name = "campaign__id__exact"

    def lookups(self, request, model_admin):
        referenced_campaign_ids = model_admin.model.objects.values_list(
            "campaign_id", flat=True
        ).distinct()
        referenced = Campaign.objects.filter(pk__in=referenced_campaign_ids)
        return referenced.values_list("id", "title").order_by("title")


class CampaignProjectListFilter(admin.SimpleListFilter):
    """
    Base admin list filter offering projects, optionally scoped to a campaign.

    When the query string contains the parameter named by
    `related_filter_parameter`, only that campaign's projects are offered.
    The chosen project is applied to the changelist through the lookup named
    by `project_ref`.
    """

    title = "ProjectRedux"
    parameter_name = "project"
    # Query parameter of the companion campaign filter
    related_filter_parameter = ""
    # Lookup used to apply the selected project to the changelist
    project_ref = ""
    template = "admin/long_name_filter.html"

    def lookups(self, request, model_admin):
        projects = Project.objects.order_by("campaign_id")
        campaign_parameter = self.related_filter_parameter
        if campaign_parameter in request.GET:
            projects = projects.filter(campaign_id=request.GET[campaign_parameter])

        choices = [(str(project.id), project.title) for project in projects]
        # Present the choices alphabetically by project title
        choices.sort(key=lambda choice: choice[1])
        return choices

    def queryset(self, request, queryset):
        project_id = self.value()
        if not project_id:
            return queryset
        return queryset.filter(**{self.project_ref: project_id})


class ItemProjectListFilter(CampaignProjectListFilter):
    """
    Project filter applied through `project_id`, scoped by the
    `project__campaign__id__exact` query parameter.
    """

    project_ref = "project_id"
    related_filter_parameter = "project__campaign__id__exact"
    parameter_name = "project__in"


class AssetProjectListFilter(CampaignProjectListFilter):
    """
    Project filter applied through `item__project_id`, scoped by the
    `item__project__campaign__id__exact` query parameter.
    """

    project_ref = "item__project_id"
    related_filter_parameter = "item__project__campaign__id__exact"
    parameter_name = "item__project__in"


class TranscriptionProjectListFilter(CampaignProjectListFilter):
    """
    Project filter applied through `asset__item__project_id`, scoped by the
    `asset__item__project__campaign__id__exact` query parameter.
    """

    project_ref = "asset__item__project_id"
    related_filter_parameter = "asset__item__project__campaign__id__exact"
    parameter_name = "asset__item__project__in"


class CampaignStatusListFilter(admin.SimpleListFilter):
    """
    Base admin list filter that narrows rows by campaign status.

    Choices come from `Campaign.Status.choices`; the selected value is
    applied as a lookup on the subclass-provided `parameter_name`.
    """

    title = "Campaign status"

    def lookups(self, request, model_admin):
        return Campaign.Status.choices

    def queryset(self, request, queryset):
        status = self.value()
        if not status:
            return queryset
        return queryset.filter(**{self.parameter_name: status})


class AssetCampaignStatusListFilter(CampaignStatusListFilter):
    """Campaign status filter applied via `item__project__campaign__status`."""

    parameter_name = "item__project__campaign__status"


class ItemCampaignStatusListFilter(CampaignStatusListFilter):
    """Campaign status filter applied via `project__campaign__status`."""

    parameter_name = "project__campaign__status"


class ProjectCampaignStatusListFilter(CampaignStatusListFilter):
    """Campaign status filter applied via `campaign__status`."""

    parameter_name = "campaign__status"


class HelpfulLinkCampaignStatusListFilter(CampaignStatusListFilter):
    """Campaign status filter applied via `campaign__status`."""

    parameter_name = "campaign__status"


class TranscriptionCampaignStatusListFilter(CampaignStatusListFilter):
    """
    Campaign status filter applied via
    `asset__item__project__campaign__status`.
    """

    parameter_name = "asset__item__project__campaign__status"


class TagCampaignStatusListFilter(CampaignStatusListFilter):
    """
    Campaign status filter applied via
    `userassettagcollection__asset__item__project__campaign__status`.
    """

    parameter_name = "userassettagcollection__asset__item__project__campaign__status"


class UserAssetTagCollectionCampaignStatusListFilter(CampaignStatusListFilter):
    """
    Campaign status filter applied via
    `asset__item__project__campaign__status`.
    """

    parameter_name = "asset__item__project__campaign__status"


class UserProfileActivityCampaignStatusListFilter(CampaignStatusListFilter):
    """Campaign status filter applied via `campaign__status`."""

    parameter_name = "campaign__status"


class BooleanFilter(admin.SimpleListFilter):
    """
    Base admin list filter with "Yes" and "No" choices.

    The selected value is applied as a lookup on the subclass-provided
    `parameter_name`; with no selection the changelist is left untouched.
    """

    def lookups(self, request, model_admin):
        yes_choice = (True, _("Yes"))
        no_choice = (False, _("No"))
        return [yes_choice, no_choice]

    def queryset(self, request, queryset):
        selected = self.value()
        if selected is None:
            return queryset
        return queryset.filter(**{self.parameter_name: selected})


class OcrGeneratedFilter(BooleanFilter):
    """Yes/No filter applied to the `ocr_generated` lookup."""

    parameter_name = "ocr_generated"
    title = "OCR Generated"


class OcrOriginatedFilter(BooleanFilter):
    """Yes/No filter applied to the `ocr_originated` lookup."""

    parameter_name = "ocr_originated"
    title = "OCR Originated"


class SupersededListFilter(admin.SimpleListFilter):
    """
    Admin list filter on whether another transcription supersedes the row.

    Annotates the changelist with an `Exists` subquery that looks for a
    `Transcription` whose `supersedes` points at the row, then keeps rows
    where that annotation matches the selected choice.
    """

    title = "superseded"
    parameter_name = "superseded"

    def lookups(self, request, model_admin):
        return (("yes", "Superseded"), ("no", "Not superseded"))

    def queryset(self, request, queryset):
        choice = self.value()
        if choice not in ("yes", "no"):
            return queryset

        # Exists keeps this a correlated subquery rather than a join
        has_successor = Exists(Transcription.objects.filter(supersedes=OuterRef("pk")))
        annotated = queryset.annotate(_is_superseded=has_successor)
        return annotated.filter(_is_superseded=(choice == "yes"))


================================================
FILE: concordia/admin/forms.py
================================================
import nh3
from django import forms
from django.core.cache import caches
from tinymce.widgets import TinyMCE

from ..models import (
    Campaign,
    Card,
    Guide,
    Item,
    KeyMetricsReport,
    Project,
    ProjectTopic,
    Topic,
    TranscriptionStatus,
)

# HTML tags kept by the sanitizer for `short_description` fields
# (passed as `tags=` to `nh3.clean` in `clean_short_description`).
FRAGMENT_ALLOWED_TAGS = {
    "a",
    "abbr",
    "acronym",
    "b",
    "blockquote",
    "br",
    "code",
    "em",
    "i",
    "kbd",
    "li",
    "ol",
    "p",
    "span",
    "strong",
    "ul",
}

# HTML tags kept by the sanitizer for `description` fields: everything in
# FRAGMENT_ALLOWED_TAGS plus the structural tags listed here
# (passed as `tags=` to `nh3.clean` in `clean_description`).
BLOCK_ALLOWED_TAGS = FRAGMENT_ALLOWED_TAGS | {
    "div",
    "h1",
    "h2",
    "h3",
    "h4",
    "h5",
    "h6",
    "hr",
    "section",
}

# Per-tag attribute allow-list, passed as `attributes=` to `nh3.clean` by
# both sanitizing clean methods.
ALLOWED_ATTRIBUTES = {
    "a": {"class", "id", "href", "title"},
    "abbr": {"title"},
    "acronym": {"title"},
    "div": {"class", "id"},
    "span": {"class", "id"},
    "p": {"class", "id"},
}


class AdminItemImportForm(forms.Form):
    """
    Admin form that collects the URL to import items from.

    Its only field, `import_url`, is a required URL pointing at an item,
    collection or search page.
    """

    import_url = forms.URLField(
        label="URL of the item/collection/search page to import",
        required=True,
    )


class AdminProjectBulkImportForm(forms.Form):
    """
    Admin form for importing campaigns, projects and items in bulk.

    Takes a required spreadsheet upload listing what to import and an
    optional `redownload` checkbox asking whether existing items should be
    redownloaded.
    """

    spreadsheet_file = forms.FileField(
        label="Spreadsheet containing the campaigns, projects, and items to import",
        required=True,
    )

    redownload = forms.BooleanField(
        label="Should existing items be redownloaded?",
        required=False,
    )


class AdminAssetsBulkChangeStatusForm(forms.Form):
    """
    Admin form for bulk status changes driven by an uploaded file.

    Takes a single required upload, `spreadsheet_file`, containing the items
    to change.
    """

    spreadsheet_file = forms.FileField(
        label="Spreadsheet containing the items to change",
        required=True,
    )


class SanitizedDescriptionAdminForm(forms.ModelForm):
    """
    Base admin model form that runs HTML description fields through `nh3`.

    `description` is cleaned against the block-level tag allow-list and
    `short_description` against the smaller fragment allow-list; both share
    the same per-tag attribute allow-list.
    """

    class Meta:
        model = Campaign
        fields = "__all__"

    def clean_description(self) -> str:
        """
        Sanitize the submitted `description` with the block-level tag set.

        Returns:
            str: `description` with disallowed tags and attributes removed.
        """
        submitted_html = self.cleaned_data["description"]
        return nh3.clean(
            submitted_html,
            attributes=ALLOWED_ATTRIBUTES,
            tags=BLOCK_ALLOWED_TAGS,
        )

    def clean_short_description(self) -> str:
        """
        Sanitize the submitted `short_description` with the fragment tag set.

        Returns:
            str: `short_description` with disallowed tags and attributes
                removed.
        """
        submitted_html = self.cleaned_data["short_description"]
        return nh3.clean(
            submitted_html,
            attributes=ALLOWED_ATTRIBUTES,
            tags=FRAGMENT_ALLOWED_TAGS,
        )


class TopicAdminForm(SanitizedDescriptionAdminForm):
    """
    Sanitizing admin form for `Topic`, editing both description fields with
    the TinyMCE widget.
    """

    class Meta(SanitizedDescriptionAdminForm.Meta):
        model = Topic
        widgets = {
            "short_description": TinyMCE(),
            "description": TinyMCE(),
        }


class CampaignAdminForm(SanitizedDescriptionAdminForm):
    """
    Sanitizing admin form for `Campaign`, editing both description fields
    with the TinyMCE widget.
    """

    class Meta(SanitizedDescriptionAdminForm.Meta):
        model = Campaign
        fields = "__all__"
        widgets = {
            "description": TinyMCE(),
            "short_description": TinyMCE(),
        }


class ProjectAdminForm(SanitizedDescriptionAdminForm):
    """
    Sanitizing admin form for `Project`, editing `description` with the
    TinyMCE widget.
    """

    class Meta(SanitizedDescriptionAdminForm.Meta):
        model = Project
        widgets = {"description": TinyMCE()}


class ProjectTopicInlineForm(forms.ModelForm):
    """
    Model form for `ProjectTopic` exposing `topic` and `url_filter`.

    `url_filter` is an optional choice field whose options are an empty
    "all statuses" entry followed by `TranscriptionStatus.CHOICES`.
    """

    url_filter = forms.ChoiceField(
        required=False,
        choices=[("", "-- All Statuses --"), *TranscriptionStatus.CHOICES],
    )

    class Meta:
        model = ProjectTopic
        fields = ["topic", "url_filter"]


class ItemAdminForm(forms.ModelForm):
    """
    Admin model form for `Item` covering all fields, with `description`
    edited through the TinyMCE widget.
    """

    class Meta:
        model = Item
        fields = "__all__"
        widgets = {"description": TinyMCE()}


class CardAdminForm(forms.ModelForm):
    """
    Admin model form for `Card` covering all fields, with `body_text`
    edited through the TinyMCE widget.
    """

    class Meta:
        model = Card
        fields = "__all__"
        widgets = {"body_text": TinyMCE()}


class GuideAdminForm(forms.ModelForm):
    """
    Admin model form for `Guide` covering all fields, with `body` edited
    through the TinyMCE widget.
    """

    class Meta:
        model = Guide
        fields = "__all__"
        widgets = {"body": TinyMCE()}


def get_cache_name_choices() -> list[tuple[str, str]]:
    """
    List the configured caches that may be cleared from the admin.

    Every cache alias except `default` is offered; the label shows the alias
    followed by its backend path in parentheses.

    Returns:
        list[tuple[str, str]]: `(cache_name, label)` pairs for non-default
            cache aliases.
    """
    choices = []
    for alias, config in caches.settings.items():
        # The default cache is meant to hold semi-persistent data, so it is
        # never offered for clearing
        if alias == "default":
            continue
        choices.append((alias, f"{alias} ({config['BACKEND']})"))
    return choices


class ClearCacheForm(forms.Form):
    """
    Admin form for picking which cache to clear.

    The `cache_name` choices are supplied by the `get_cache_name_choices`
    callable.
    """

    cache_name = forms.ChoiceField(choices=get_cache_name_choices)


class AssetStatusActionForm(forms.Form):
    """
    Admin form offering a dropdown of asset status actions.

    The `action` field starts with no choices; they are filled in at
    construction time from the required `available_actions` keyword
    argument, preceded by a blank placeholder entry. The form only builds
    the choice list and does not execute the selected action itself.
    """

    action = forms.ChoiceField(
        label="Change status",
        choices=(),
        widget=forms.Select(attrs={"class": "vSelectField"}),
    )

    def __init__(
        self,
        *args,
        available_actions: list[tuple[str, str]],
        **kwargs,
    ) -> None:
        """
        Build the form and populate the `action` dropdown.

        Args:
            available_actions (list[tuple[str, str]]): Pairs of action name
                and human-readable label, listed in the order they should
                appear after the blank placeholder.
        """
        super().__init__(*args, **kwargs)

        placeholder: tuple[str, str] = ("", "---------")
        self.fields["action"].choices = [placeholder] + [
            (action_name, action_label)
            for action_name, action_label in available_actions
        ]


# Help text shared by the optional, manually entered metric fields
_MANUAL_METRIC_HELP = (
    "Optional. Leave blank if not known. "
    "Blank values are not included in quarterly or fiscal-year "
    "totals."
)

# Help text shared by the metric fields that are normally calculated
_CALCULATED_METRIC_HELP = (
    "Usually calculated from Site Reports. "
    "If you edit this, it may be overwritten when reports are "
    "rebuilt."
)


class KeyMetricsReportAdminForm(forms.ModelForm):
    """
    Admin model form for `KeyMetricsReport` covering all fields.

    Attaches help text to the manually entered metrics (explaining that
    blanks are left out of rollups) and to the normally calculated metrics
    (warning that edits may be overwritten on rebuild).
    """

    class Meta:
        model = KeyMetricsReport
        fields = "__all__"
        help_texts = {
            # Manual fields
            "crowd_emails_and_libanswers_sent": _MANUAL_METRIC_HELP,
            "crowd_visits": _MANUAL_METRIC_HELP,
            "crowd_page_views": _MANUAL_METRIC_HELP,
            "crowd_unique_visitors": _MANUAL_METRIC_HELP,
            "avg_visit_seconds": (
                "Optional average visit length in seconds. "
                "If blank, no average is used for quarterly or fiscal-year "
                "rollups."
            ),
            "transcriptions_added_to_loc_gov": _MANUAL_METRIC_HELP,
            "datasets_added_to_loc_gov": _MANUAL_METRIC_HELP,
            # Calculated fields (still editable)
            "assets_published": _CALCULATED_METRIC_HELP,
            "assets_started": _CALCULATED_METRIC_HELP,
            "assets_completed": _CALCULATED_METRIC_HELP,
            "users_activated": _CALCULATED_METRIC_HELP,
            "anonymous_transcriptions": _CALCULATED_METRIC_HELP,
            "transcriptions_saved": _CALCULATED_METRIC_HELP,
            "tag_uses": _CALCULATED_METRIC_HELP,
        }


================================================
FILE: concordia/admin/utils.py
================================================
from django.contrib.auth.models import User
from django.db.models import Prefetch
from django.utils.timezone import now

from ..models import Asset, Transcription, TranscriptionStatus
from ..utils import get_anonymous_user


def _change_status(
    request_user: User,
    asset: Asset,
    status: str = TranscriptionStatus.SUBMITTED,
    transcription_user: User | None = None,
) -> int:
    """
    Create a transcription that moves one asset to a new workflow status.

    A new `Transcription` is created for `asset`. When the asset already has
    a transcription, the new one supersedes the latest and copies its text.
    Fields set on the new transcription depend on `status`:

    - SUBMITTED: `submitted` is set to the current time.
    - COMPLETED: `accepted` is set to the current time and `reviewed_by` to
      `request_user`.
    - IN_PROGRESS: `reviewed_by` is set to `request_user`; `rejected` is set
      to the current time only when the latest transcription is COMPLETED.
    - NOT_STARTED: nothing is created.

    The transcription is validated with `full_clean()` and saved
    individually with `save()`.

    Args:
        request_user (User): User performing the change; recorded as the
            reviewer for COMPLETED and IN_PROGRESS.
        asset (Asset): Asset whose status should be updated. If it carries a
            `prefetched_transcriptions` attribute, its first element is used
            as the latest transcription instead of querying.
        status (str): Target workflow status, one of the `TranscriptionStatus`
            constants. Defaults to SUBMITTED.
        transcription_user (User | None): User credited on the new
            transcription. Defaults to the anonymous user when not given.

    Returns:
        int: 1 if a transcription was created, otherwise 0.
    """
    # Nothing is created for NOT_STARTED, so bail out before doing any
    # lookup work.
    if status == TranscriptionStatus.NOT_STARTED:
        return 0

    if hasattr(asset, "prefetched_transcriptions"):
        prefetched = asset.prefetched_transcriptions
        latest_transcription = prefetched[0] if prefetched else None
    else:
        latest_transcription = asset.transcription_set.order_by("-pk").first()

    kwargs = {
        "asset": asset,
        "user": transcription_user or get_anonymous_user(),
    }
    if latest_transcription is not None:
        kwargs["supersedes"] = latest_transcription
        kwargs["text"] = latest_transcription.text

    if status == TranscriptionStatus.SUBMITTED:
        kwargs["submitted"] = now()
    elif status == TranscriptionStatus.COMPLETED:
        kwargs["reviewed_by"] = request_user
        kwargs["accepted"] = now()
    elif status == TranscriptionStatus.IN_PROGRESS:
        # Only a previously completed transcription is marked as rejected
        if (
            latest_transcription
            and latest_transcription.status == TranscriptionStatus.COMPLETED
        ):
            kwargs["rejected"] = now()
        kwargs["reviewed_by"] = request_user

    transcription = Transcription(**kwargs)
    transcription.full_clean()
    transcription.save()
    return 1


def _bulk_change_status(
    request_user: User,
    rows: list,
) -> int:
    """
    Apply status changes to many assets by delegating to `_change_status`.

    Assets are loaded in one query by slug, with their transcriptions
    prefetched newest-first into `prefetched_transcriptions`. Rows whose slug
    is missing or matches no loaded asset are skipped.

    NOTE(review): assets are matched on `slug` alone; if slugs are not unique
    across all assets, a row may resolve to a different asset than intended.
    Confirm against the `Asset` model.

    Args:
        request_user: the staff user performing the bulk change.
        rows: list of dicts with a "slug" key identifying the asset, a
            "status" key holding the target `TranscriptionStatus` value and
            an optional "user" key for the user to credit.

    Returns:
        int: Sum of the values returned by `_change_status` for each row.
    """
    wanted_slugs = {row["slug"] for row in rows if row.get("slug")}
    newest_first = Prefetch(
        "transcription_set",
        queryset=Transcription.objects.order_by("-pk"),
        to_attr="prefetched_transcriptions",
    )
    matching_assets = Asset.objects.filter(slug__in=wanted_slugs).prefetch_related(
        newest_first
    )
    assets_by_slug = {asset.slug: asset for asset in matching_assets}

    changed = 0
    for row in rows:
        asset = assets_by_slug.get(row.get("slug"))
        if not asset:
            continue
        changed += _change_status(request_user, asset, row["status"], row.get("user"))

    return changed


================================================
FILE: concordia/admin/views.py
================================================
import logging
import re
import tempfile
import time
from http import HTTPStatus
from typing import Any

from django.apps import apps
from django.contrib import messages
from django.contrib.admin.views.decorators import staff_member_required
from django.contrib.auth.decorators import permission_required, user_passes_test
from django.contrib.auth.models import User
from django.core.cache import caches
from django.core.exceptions import ValidationError
from django.db.models import OuterRef, Prefetch, Subquery
from django.http import HttpRequest, HttpResponse, JsonResponse
from django.shortcuts import render
from django.urls import reverse_lazy
from django.utils.decorators import method_decorator
from django.utils.text import slugify
from django.views import View
from django.views.decorators.cache import never_cache
from django.views.generic.edit import FormView

from concordia.models import (
    Asset,
    Item,
    Transcription,
    TranscriptionStatus,
    validated_get_or_create,
)
from exporter.tabular_export.core import export_to_csv_response, flatten_queryset
from exporter.views import do_bagit_export
from importer.models import ImportItem, ImportItemAsset, ImportJob
from importer.tasks import fetch_all_urls
from importer.tasks.items import import_items_into_project_from_url
from importer.utils import slurp_excel

from ..models import Campaign, Project, SiteReport
from .forms import (
    AdminAssetsBulkChangeStatusForm,
    AdminProjectBulkImportForm,
    ClearCacheForm,
)
from .utils import _bulk_change_status

# Module-level logger named after this module's import path.
logger = logging.getLogger(__name__)


@never_cache
@staff_member_required
@permission_required("concordia.add_campaign")
@permission_required("concordia.change_campaign")
@permission_required("concordia.add_project")
@permission_required("concordia.change_project")
@permission_required("concordia.add_item")
@permission_required("concordia.change_item")
def project_level_export(request: HttpRequest) -> HttpResponse:
    """
    Render the project-level BagIt export admin view and run exports.

    When called with `GET`, shows either the list of non-retired campaigns
    or, when `id` is supplied, the projects of that campaign. When called
    with `POST`, builds a BagIt export of the assets belonging to items in
    the selected projects, keeping only items that have no asset in the
    not-started, in-progress or submitted state.

    If the campaign slug is unknown or the campaign id is not an integer,
    an error message is added and the selection page is rendered instead
    of raising.

    Request Parameters:
        `id` (str, optional): Campaign primary key used to filter projects.
        `slug` (str, optional): Campaign slug used to select items and to
            build the export filename.
        `project_name` (list, `POST`): Primary keys of the projects to export.

    Args:
        request (HttpRequest): Current admin request.

    Returns:
        HttpResponse: HTML response for the selection view or the response
            produced by `do_bagit_export`.
    """
    request.current_app = "admin"
    context = {
        "title": "Project Level Bagit Exporter",
        "campaigns": [],
        "projects": [],
    }
    idx = request.GET.get("id")

    if request.method == "POST":
        project_list = request.POST.getlist("project_name")
        campaign_slug = request.GET.get("slug")

        # The slug used for the temp-directory prefix and filename is read
        # back from the database rather than taken from the query string.
        # NOTE(review): presumably so raw request input never reaches a
        # filesystem path - confirm.
        try:
            campaign_slug_dbv = Campaign.objects.get(slug__exact=campaign_slug).slug
        except Campaign.DoesNotExist:
            campaign_slug_dbv = None
            messages.error(
                request,
                f"Unable to export: no campaign found with slug {campaign_slug!r}",
            )

        if campaign_slug_dbv is not None:
            item_qs = Item.objects.filter(
                project__campaign__slug=campaign_slug, project__id__in=project_list
            )
            incomplete_item_assets = Asset.objects.filter(
                item__in=item_qs,
                transcription_status__in=(
                    TranscriptionStatus.NOT_STARTED,
                    TranscriptionStatus.IN_PROGRESS,
                    TranscriptionStatus.SUBMITTED,
                ),
            )
            # Drop every item that still has at least one unfinished asset.
            item_qs = item_qs.exclude(asset__in=incomplete_item_assets)
            asset_qs = Asset.objects.filter(item__in=item_qs).order_by(
                "item__project", "item", "sequence"
            )

            # Text of the transcription with the highest primary key per asset.
            latest_trans_subquery = (
                Transcription.objects.filter(asset=OuterRef("pk"))
                .order_by("-pk")
                .values("text")
            )
            assets = asset_qs.annotate(
                latest_transcription=Subquery(latest_trans_subquery[:1])
            )

            export_filename_base = f"{campaign_slug_dbv}_projects"

            with tempfile.TemporaryDirectory(
                prefix=export_filename_base
            ) as export_base_dir:
                return do_bagit_export(
                    assets, export_base_dir, export_filename_base, request
                )

    campaign_id = None
    if idx is not None:
        try:
            campaign_id = int(idx)
        except ValueError:
            # Fall back to the campaign picker instead of failing the request.
            messages.error(request, f"Invalid campaign id: {idx}")

    if campaign_id is not None:
        context["projects"] = [
            {"title": project.title, "id": project.pk, "campaign_id": idx}
            for project in Project.objects.filter(campaign_id=campaign_id)
        ]
    else:
        context["campaigns"] = list(
            Campaign.objects.exclude(status=Campaign.Status.RETIRED)
        )

    context["form"] = AdminProjectBulkImportForm()
    return render(request, "admin/project_level_export.html", context)


@never_cache
@staff_member_required
@permission_required("concordia.add_campaign")
@permission_required("concordia.change_campaign")
@permission_required("concordia.add_project")
@permission_required("concordia.change_project")
@permission_required("concordia.add_item")
@permission_required("concordia.change_item")
def celery_task_review(request: HttpRequest) -> HttpResponse:
    """
    Summarize importer task outcomes for every project in a campaign.

    Without an `id` query parameter, renders a picker listing non-retired
    campaigns ordered by launch date, newest first. With an `id`, walks
    each project's import jobs, their import items and the item assets,
    classifying every asset task as failed, incomplete, unstarted or
    successful. Each task produces one admin message and per-project
    counts are placed in the template context.

    Request Parameters:
        `id` (str, optional): Campaign primary key used to select which
            projects to inspect.

    Args:
        request (HttpRequest): Current admin request.

    Returns:
        HttpResponse: HTML response showing task counts by project or a
            campaign picker.
    """
    request.current_app = "admin"
    context = {
        "title": "Importer Tasks",
        "campaigns": [],
        "projects": [],
    }
    campaign_pk = request.GET.get("id")

    if campaign_pk is None:
        context["campaigns"] = Campaign.objects.exclude(
            status=Campaign.Status.RETIRED
        ).order_by("-launch_date")
        return render(request, "admin/celery_task.html", context)

    grand_total = 0
    for project in Project.objects.filter(campaign_id=int(campaign_pk)):
        # Fresh counters for each project.
        tally = {"successful": 0, "incomplete": 0, "unstarted": 0, "failure": 0}
        messages.info(request, f"{project.title}")

        jobs = ImportJob.objects.filter(project_id=project.pk).order_by("-created")
        for job in jobs:
            import_items = ImportItem.objects.filter(job_id=job.pk).order_by(
                "-created"
            )
            for import_item in import_items:
                for task in ImportItemAsset.objects.filter(
                    import_item_id=import_item.pk
                ):
                    was_started = task.last_started is not None
                    # Order matters: a started task with a failure timestamp
                    # counts as failed even if it is also not completed.
                    if task.failed is not None and was_started:
                        bucket, notify = "failure", messages.warning
                    elif task.completed is None and was_started:
                        bucket, notify = "incomplete", messages.warning
                    elif task.completed is None and not was_started:
                        bucket, notify = "unstarted", messages.warning
                    else:
                        bucket, notify = "successful", messages.info

                    tally[bucket] += 1
                    notify(request, f"{task.url}-{task.status}")
                    grand_total += 1

        context["projects"].append(
            {
                "title": project.title,
                "id": project.pk,
                "campaign_id": campaign_pk,
                **tally,
            }
        )

    messages.info(request, f"{grand_total} Total Assets Processed")
    context["totalassets"] = grand_total

    return render(request, "admin/celery_task.html", context)


@never_cache
@staff_member_required
@permission_required("concordia.add_campaign")
@permission_required("concordia.change_campaign")
@permission_required("concordia.add_project")
@permission_required("concordia.change_project")
@permission_required("concordia.add_item")
@permission_required("concordia.change_item")
def admin_bulk_import_review(request: HttpRequest) -> HttpResponse:
    """
    Preview a bulk import spreadsheet without creating campaigns or items.

    Parses the uploaded spreadsheet, checks that required columns are
    present, warns about slugs that do not match the slug pattern and
    collects every import URL that starts with `http`. The URLs are passed
    to `fetch_all_urls` in batches of 50, with a pause after each batch,
    and the results and total asset count are reported as admin messages.

    No batch is sent when the spreadsheet yields no usable URLs, and no
    empty trailing batch is sent when the URL count is a multiple of the
    batch size.

    Request Parameters:
        Uploaded file `spreadsheet_file` (multipart): Spreadsheet with one
            row per campaign and project definition.

    Args:
        request (HttpRequest): Current admin request.

    Returns:
        HttpResponse: HTML response containing the review form and any
            status messages.
    """
    request.current_app = "admin"
    # NOTE(review): the `+` inside the character class is a literal plus
    # sign, so slugs containing `+` are accepted - confirm that is intended.
    url_regex = r"[-\w+]+"
    pattern = re.compile(url_regex)
    context = {"title": "Bulk Import Review"}

    batch_size = 50
    # NOTE(review): the pause looks like throttling between preflight
    # batches - confirm before changing it.
    batch_pause_seconds = 7

    if request.method == "POST":
        form = AdminProjectBulkImportForm(request.POST, request.FILES)

        if form.is_valid():
            rows = slurp_excel(request.FILES["spreadsheet_file"])
            required_fields = [
                "Campaign",
                "Campaign Short Description",
                "Campaign Long Description",
                "Campaign Slug",
                "Project Slug",
                "Project",
                "Project Description",
                "Import URLs",
            ]
            urls = []
            sum_count = 0
            try:
                for idx, row in enumerate(rows):
                    missing_fields = [i for i in required_fields if i not in row]
                    if missing_fields:
                        messages.warning(
                            request,
                            f"Skipping row {idx}: missing fields {missing_fields}",
                        )
                        continue

                    campaign_title = row["Campaign"]
                    project_title = row["Project"]
                    import_url_blob = row["Import URLs"]

                    if not all((campaign_title, project_title, import_url_blob)):
                        if not any(row.values()):
                            # No messages for completely blank rows
                            continue

                        warning_message = (
                            f"Skipping row {idx}: at least one required field "
                            "(Campaign, Project, Import URLs) is empty"
                        )
                        messages.warning(request, warning_message)
                        continue

                    # A slug mismatch only produces a warning; the row's
                    # URLs are still collected.
                    campaign_slug = row["Campaign Slug"]
                    if campaign_slug and not pattern.fullmatch(campaign_slug):
                        messages.warning(
                            request, "Campaign slug doesn't match pattern."
                        )

                    project_slug = row["Project Slug"]
                    if project_slug and not pattern.fullmatch(project_slug):
                        messages.warning(request, "Project slug doesn't match pattern.")

                    potential_urls = filter(None, re.split(r"[\s]+", import_url_blob))

                    for url in potential_urls:
                        if not url.startswith("http"):
                            messages.warning(
                                request, f"Skipping unrecognized URL value: {url}"
                            )
                            continue

                        urls.append(url)

                # Slicing produces only non-empty batches, so nothing is
                # fetched (and no pause happens) when there are no URLs.
                for start in range(0, len(urls), batch_size):
                    return_result = fetch_all_urls(urls[start : start + batch_size])
                    for res in return_result[0]:
                        messages.info(request, f"{res}")

                    sum_count = sum_count + return_result[1]
                    time.sleep(batch_pause_seconds)

                messages.info(request, f"Total Asset Count:{sum_count}")
            finally:
                # Emitted even if processing above raised.
                messages.info(request, "All Processes Completed")

    else:
        form = AdminProjectBulkImportForm()

    context["form"] = form

    return render(request, "admin/bulk_review.html", context)


@method_decorator(staff_member_required, name="dispatch")
@method_decorator(never_cache, name="dispatch")
class AdminBulkChangeAssetStatusView(FormView):
    """
    Admin view that changes the status of many assets from a spreadsheet.

    Each spreadsheet row is read for an `asset__slug` column, an optional
    `New Status` column (defaulting to the submitted status when the
    column is absent) and an optional `user` column holding a user id.
    Rows with a slug and a recognised status are forwarded to
    `_bulk_change_status`; all other rows are counted as invalid.
    """

    template_name = "admin/bulk_change.html"
    form_class = AdminAssetsBulkChangeStatusForm

    @staticmethod
    def _normalize_status(status):
        """
        Return the canonical status key for a spreadsheet value.

        The value is stringified, stripped and lower-cased, then accepted
        only if it equals one of the `TranscriptionStatus` keys.

        Args:
            status: Raw cell value from the spreadsheet, or `None`.

        Returns:
            The normalized status string, or `None` if the value is
            missing or not a recognised status.
        """
        if status is None:
            return None
        candidate = str(status).strip().lower()
        valid = {
            TranscriptionStatus.NOT_STARTED,
            TranscriptionStatus.IN_PROGRESS,
            TranscriptionStatus.SUBMITTED,
            TranscriptionStatus.COMPLETED,
        }
        return candidate if candidate in valid else None

    def form_valid(self, form):
        """
        Process the uploaded spreadsheet and report the outcome.

        Adds an error message if the spreadsheet cannot be read, a warning
        if none of the slugs match an asset and otherwise a success message
        summarising updated, invalid and unmatched counts. The form page is
        re-rendered in every case.

        Args:
            form: The validated bulk change form.

        Returns:
            HttpResponse: The rendered form page with status messages.
        """
        try:
            rows = slurp_excel(self.request.FILES["spreadsheet_file"])
        except Exception as e:
            messages.error(self.request, f"Could not read spreadsheet: {e}")

            return self.render_to_response(self.get_context_data(form=form))
        total_in_sheet = len(rows)

        normalized_rows = []
        invalid_rows = 0
        slugs_all = set()

        # Load every referenced user in one query.
        user_ids = {row.get("user") for row in rows if row.get("user")}
        users = {u.id: u for u in User.objects.filter(id__in=user_ids)}

        for row in rows:
            slug = row.get("asset__slug")
            status_raw = row.get("New Status", TranscriptionStatus.SUBMITTED)
            user_id = row.get("user", None)
            status = self._normalize_status(status_raw)
            # Require the validated status, not just a non-empty raw cell,
            # so unrecognised values are counted as invalid instead of
            # being forwarded as None.
            if slug and status:
                slugs_all.add(slug)
                normalized_row = {
                    "slug": slug,
                    "status": status,
                }
                if user_id:
                    normalized_row["user"] = users.get(user_id)
                normalized_rows.append(normalized_row)
            else:
                invalid_rows += 1

        # Only the number of matching assets is needed here; the assets
        # themselves are loaded by _bulk_change_status.
        matched = Asset.objects.filter(slug__in=slugs_all).count()

        if matched == 0:
            messages.warning(
                self.request,
                (
                    f"No matching assets found in database. "
                    f"Spreadsheet contained {total_in_sheet} rows."
                ),
            )
            return self.render_to_response(self.get_context_data(form=form))

        updated_total = _bulk_change_status(self.request.user, normalized_rows)

        unmatched = len(slugs_all) - matched

        messages.success(
            self.request,
            (
                f"Processed spreadsheet with {total_in_sheet} rows. "
                f"Updated {updated_total} assets. "
                f"{invalid_rows} invalid rows. "
                f"{unmatched} unmatched asset slugs. "
            ),
        )
        return self.render_to_response(self.get_context_data(form=form))


@never_cache
@staff_member_required
@permission_required("concordia.add_campaign")
@permission_required("concordia.change_campaign")
@permission_required("concordia.add_project")
@permission_required("concordia.change_project")
@permission_required("concordia.add_item")
@permission_required("concordia.change_item")
def admin_bulk_import_view(request: HttpRequest) -> HttpResponse:
    """
    Queue bulk import jobs described by an uploaded spreadsheet.

    For each usable row, gets or creates the `Campaign` and `Project` via
    `validated_get_or_create`, then calls
    `import_items_into_project_from_url` once per URL that starts with
    `http`. Progress, warnings and errors are reported through the admin
    message framework and the returned jobs are exposed to the template
    as `import_jobs`.

    Request Parameters:
        Uploaded file `spreadsheet_file` (multipart): Spreadsheet defining
            campaigns, projects and URLs.
        Field `redownload` (bool, optional): Passed through to
            `import_items_into_project_from_url`; defaults to false.

    Args:
        request (HttpRequest): Current admin request.

    Returns:
        HttpResponse: HTML response containing the bulk import form and
            any queued job information.
    """
    request.current_app = "admin"
    slug_matcher = re.compile(r"[-\w+]+")
    context = {"title": "Bulk Import"}

    if request.method != "POST":
        context["form"] = AdminProjectBulkImportForm()
        return render(request, "admin/bulk_import.html", context)

    form = AdminProjectBulkImportForm(request.POST, request.FILES)
    context["form"] = form
    if not form.is_valid():
        return render(request, "admin/bulk_import.html", context)

    queued_jobs = context["import_jobs"] = []
    force_redownload = form.cleaned_data.get("redownload", False)
    sheet_rows = slurp_excel(request.FILES["spreadsheet_file"])
    expected_columns = (
        "Campaign",
        "Campaign Short Description",
        "Campaign Long Description",
        "Campaign Slug",
        "Project Slug",
        "Project",
        "Project Description",
        "Import URLs",
    )

    for row_number, row in enumerate(sheet_rows):
        absent = [column for column in expected_columns if column not in row]
        if absent:
            messages.warning(
                request, f"Skipping row {row_number}: missing fields {absent}"
            )
            continue

        campaign_title = row["Campaign"]
        project_title = row["Project"]
        url_blob = row["Import URLs"]

        if not (campaign_title and project_title and url_blob):
            # Entirely blank rows are skipped silently.
            if any(row.values()):
                messages.warning(
                    request,
                    f"Skipping row {row_number}: at least one required field "
                    "(Campaign, Project, Import URLs) is empty",
                )
            continue

        # A slug that fails the pattern only triggers a warning; creation
        # is still attempted with the supplied value.
        campaign_slug = row["Campaign Slug"]
        if campaign_slug and not slug_matcher.fullmatch(campaign_slug):
            messages.warning(request, "Campaign slug doesn't match pattern.")
        campaign_defaults = {
            "slug": campaign_slug or slugify(campaign_title, allow_unicode=True),
            "description": row["Campaign Long Description"] or "",
            "short_description": row["Campaign Short Description"] or "",
        }
        try:
            campaign, campaign_is_new = validated_get_or_create(
                Campaign,
                title=campaign_title,
                defaults=campaign_defaults,
            )
        except ValidationError as exc:
            messages.error(
                request, f"Unable to create campaign {campaign_title}: {exc}"
            )
            continue

        messages.info(
            request,
            (
                f"Created new campaign {campaign_title}"
                if campaign_is_new
                else f"Reusing campaign {campaign_title} without modification"
            ),
        )

        project_slug = row["Project Slug"]
        if project_slug and not slug_matcher.fullmatch(project_slug):
            messages.warning(request, "Project slug doesn't match pattern.")
        project_defaults = {
            "slug": project_slug or slugify(project_title, allow_unicode=True),
            "description": row["Project Description"] or "",
            "campaign": campaign,
        }
        try:
            project, project_is_new = validated_get_or_create(
                Project,
                title=project_title,
                campaign=campaign,
                defaults=project_defaults,
            )
        except ValidationError as exc:
            messages.error(request, f"Unable to create project {project_title}: {exc}")
            continue

        messages.info(
            request,
            (
                f"Created new project {project_title}"
                if project_is_new
                else f"Reusing project {project_title} without modification"
            ),
        )

        candidate_urls = [
            token for token in re.split(r"[\s]+", url_blob) if token
        ]
        for url in candidate_urls:
            if not url.startswith("http"):
                messages.warning(request, f"Skipping unrecognized URL value: {url}")
                continue

            try:
                queued_jobs.append(
                    import_items_into_project_from_url(
                        request.user, project, url, force_redownload
                    )
                )
                messages.info(
                    request,
                    f"Queued {campaign_title} {project_title} import for {url}",
                )
            except Exception as exc:
                # One failing URL must not stop the remaining URLs and rows.
                messages.error(
                    request,
                    f"Unhandled error attempting to import {url}: {exc}",
                )

    return render(request, "admin/bulk_import.html", context)


@never_cache
@staff_member_required
def admin_site_report_view(request: HttpRequest) -> HttpResponse:
    """
    Download every `SiteReport` record as a CSV file.

    The queryset is flattened with `flatten_queryset` using the model's
    default export field names, with `created_on` labelled "Date" and
    `campaign__title` labelled "Campaign".

    Args:
        request (HttpRequest): Current admin request.

    Returns:
        HttpResponse: CSV response named `site-report.csv`.
    """
    column_labels = {"created_on": "Date", "campaign__title": "Campaign"}
    csv_headers, csv_rows = flatten_queryset(
        SiteReport.objects.all(),
        field_names=SiteReport.DEFAULT_EXPORT_FIELDNAMES,
        extra_verbose_names=column_labels,
    )
    return export_to_csv_response("site-report.csv", csv_headers, csv_rows)


@never_cache
@staff_member_required
def admin_retired_site_report_view(request: HttpRequest) -> HttpResponse:
    """
    Download a CSV with the newest `SiteReport` of each retired campaign.

    Reports are ordered by campaign and descending creation date, then
    reduced to one row per campaign. A final `RETIRED TOTAL` row sums every
    export field after the first four, treating empty values as zero.

    Args:
        request (HttpRequest): Current admin request.

    Returns:
        HttpResponse: CSV response named `retired-site-report.csv`
            containing the per-campaign rows followed by the totals row.
    """
    latest_reports = (
        SiteReport.objects.filter(campaign__status=Campaign.Status.RETIRED)
        .order_by("campaign_id", "-created_on")
        .distinct("campaign_id")
    )

    csv_headers, flattened = flatten_queryset(
        latest_reports,
        field_names=SiteReport.DEFAULT_EXPORT_FIELDNAMES,
        extra_verbose_names={"created_on": "Date", "campaign__title": "Campaign"},
    )
    csv_rows = list(flattened)

    # aggregate() cannot be combined with distinct(*fields), so the column
    # sums are computed in Python.
    totals_row = ["", "RETIRED TOTAL", "", ""]
    for field_name in SiteReport.DEFAULT_EXPORT_FIELDNAMES[4:]:
        column_sum = sum(
            getattr(report, field_name) or 0 for report in latest_reports
        )
        totals_row.append(column_sum)
    csv_rows.append(totals_row)

    return export_to_csv_response("retired-site-report.csv", csv_headers, csv_rows)


class SerializedObjectView(View):
    """
    Return a single field from a Concordia model instance as JSON.

    The model, instance and field to fetch are provided through query
    string parameters. This is intended for lightweight admin tools that
    need to inspect or preview stored values.

    NOTE(review): unlike the other views in this module, no
    access-control decorator is applied to this class here. Confirm that
    access is restricted where the view is routed.
    """

    def get(
        self,
        request: HttpRequest,
        *args: Any,
        **kwargs: Any,
    ) -> JsonResponse:
        """
        Handle `GET` requests and serialize the requested field.

        Request Parameters:
            `model_name` (str): Name of the `concordia` app model to query.
            `object_id` (str): Primary key of the model instance.
            `field_name` (str): Name of the attribute or field to return.

        Args:
            request (HttpRequest): Current HTTP request.
            *args (Any): Positional arguments passed by the URLconf.
            **kwargs (Any): Keyword arguments passed by the URLconf.

        Returns:
            JsonResponse: JSON object containing the field value. Returns
                `{"status": "false"}` with a 400 status if a parameter is
                missing, or with a 404 status if the model, instance or
                attribute does not exist or the primary key is malformed.
        """
        model_name = request.GET.get("model_name")
        object_id = request.GET.get("object_id")
        field_name = request.GET.get("field_name")

        def failure(status: HTTPStatus) -> JsonResponse:
            return JsonResponse({"status": "false"}, status=status)

        if not (model_name and object_id and field_name):
            return failure(HTTPStatus.BAD_REQUEST)

        try:
            model = apps.get_model(app_label="concordia", model_name=model_name)
        except LookupError:
            # Unknown model name.
            return failure(HTTPStatus.NOT_FOUND)

        try:
            instance = model.objects.get(pk=object_id)
            value = getattr(instance, field_name)
        except (model.DoesNotExist, ValueError, ValidationError, AttributeError):
            # Missing row, primary key that cannot be converted, or an
            # attribute the instance does not have.
            return failure(HTTPStatus.NOT_FOUND)

        return JsonResponse({field_name: value})


@method_decorator(never_cache, name="dispatch")
@method_decorator(user_passes_test(lambda u: u.is_superuser), name="dispatch")
class ClearCacheView(FormView):
    """
    Admin view for clearing a Django cache chosen through `ClearCacheForm`.

    Calls `clear()` on the cache whose alias was selected in the form.
    Only superusers pass the access test applied to `dispatch`.
    """

    form_class = ClearCacheForm
    template_name = "admin/clear_cache.html"
    success_url = reverse_lazy("admin:clear-cache")

    def form_valid(self, form: ClearCacheForm) -> HttpResponse:
        """
        Clear the selected cache and redirect back to the form.

        On success, adds a success message. On failure, adds an error
        message describing the exception, then continues with the normal
        `FormView` redirect.

        Args:
            form (ClearCacheForm): Validated form containing the selected
                cache alias.

        Returns:
            HttpResponse: Redirect to the configured `success_url` after
                processing.
        """
        # Bound before the try block so the error handler below can always
        # reference it, even when the lookup or clear fails.
        cache_name = form.cleaned_data.get("cache_name")
        try:
            caches[cache_name].clear()
            messages.success(self.request, f"Successfully cleared '{cache_name}' cache")
        except Exception as err:
            messages.error(
                self.request,
                (
                    f"Couldn't clear cache '{cache_name}', "
                    f"something went wrong. Received error: {err}"
                ),
            )
        return super().form_valid(form)


================================================
FILE: concordia/admin_site.py
================================================
"""Admin site customizations for Concordia.

Provides a subclass of Django's ``AdminSite`` that adds project-specific
admin URLs alongside the default admin views.
"""

from django.contrib import admin
from django.urls import path


class ConcordiaAdminSite(admin.AdminSite):
    """Admin site subclass that registers Concordia's extra admin views."""

    site_header = "Concordia Admin"
    site_title = "Concordia"

    def get_urls(self) -> list:
        """Build the admin URL patterns with Concordia routes placed first.

        The project routes cover bulk import, bulk review, Celery task
        review, the site reports, project-level export, JSON object
        inspection, cache clearing and bulk status change. They are
        placed ahead of the patterns produced by
        ``admin.AdminSite.get_urls``, which are appended unchanged.

        Returns:
            list: Concordia URL patterns followed by the default admin
            URL patterns.
        """
        # Imported here rather than at module level.
        from concordia.admin import views

        default_patterns = super().get_urls()

        # (route, view callable, URL name) in registration order.
        route_table = (
            ("bulk-import/", views.admin_bulk_import_view, "bulk-import"),
            ("bulk-review/", views.admin_bulk_import_review, "bulk-review"),
            ("celery-review/", views.celery_task_review, "celery-review"),
            ("site-report/", views.admin_site_report_view, "site-report"),
            (
                "retired-site-report/",
                views.admin_retired_site_report_view,
                "retired-site-report",
            ),
            (
                "project-level-export/",
                views.project_level_export,
                "project-level-export",
            ),
            (
                "serialized_object/",
                views.SerializedObjectView.as_view(),
                "serialized_object",
            ),
            ("clear-cache/", views.ClearCacheView.as_view(), "clear-cache"),
            (
                "bulk-change/",
                views.AdminBulkChangeAssetStatusView.as_view(),
                "bulk-change",
            ),
        )
        concordia_patterns = [
            path(route, view, name=url_name) for route, view, url_name in route_table
        ]

        return concordia_patterns + default_patterns


================================================
FILE: concordia/api/__init__.py
================================================
"""
Experimental API endpoints backing the React transcription page.

Status
------
This module is in active development and not yet in its final form. Interfaces
and behavior may change without deprecation.

Intended Use
------------
These endpoints exist to support the React app's transcription page during
ongoing development and trial rollout.

Duplication and Future Plan
---------------------------
To enable rapid iteration, this module currently duplicates substantial logic
from existing Django views (e.g., validation, submission/review workflows,
rollback/rollforward and serialization). When the React transcription page is
ready for production, one of the following will occur:

1. Shared logic will be factored into reusable helpers imported by both these
   endpoints and the legacy views; or
2. The legacy views that these endpoints duplicate will be removed.

Until then, expect overlap and keep changes synchronized across both places.

Note
----
The React app still requires significant development work. Treat these endpoints
as provisional and subject to change.
"""

import re
from time import time
from typing import Optional

from django.conf import settings
from django.db.transaction import atomic
from django.http import HttpRequest
from django.shortcuts import get_object_or_404
from django.urls import reverse
from django.utils.timezone import now
from ninja import NinjaAPI, Router
from ninja.errors import HttpError

from concordia.exceptions import RateLimitExceededError
from concordia.logging import ConcordiaLogger
from concordia.models import (
    Asset,
    CardFamily,
    ConcordiaUser,
    Guide,
    Transcription,
    TranscriptionStatus,
    TutorialCard,
    UserAssetTagCollection,
)
from concordia.templatetags.concordia_media_tags import asset_media_url
from concordia.utils import get_anonymous_user
from concordia.utils.constants import URL_REGEX
from configuration.utils import configuration_value

from .schemas import CamelSchema

# Module-level structured logger, named after this module.
structured_logger = ConcordiaLogger.get_logger(__name__)

# Root Ninja API object. The routers defined in this module are mounted on it
# at the bottom of the file, and URL names are reversed under the "api"
# namespace (e.g. "api:submit_transcription").
api = NinjaAPI(version=None, urls_namespace="api")


class AssetOut(CamelSchema):
    """
    Serialized representation of an Asset for API responses.

    Fields mirror what the web client needs to render the asset view,
    including navigation context, image URLs, tagging, tutorial cards,
    available languages and undo/redo availability.

    Instances are built by `serialize_asset`. Attribute names are snake_case
    in Python; the endpoints in this module respond with `by_alias=True`, so
    the aliases configured on `CamelSchema` are used in the JSON output.
    """

    id: int  # noqa: A003
    title: str
    item_id: str
    project_slug: str
    campaign_slug: str
    # Summary of the most recent transcription ("id", "status", "text",
    # "contributors"), or None when the asset has no transcriptions.
    transcription: Optional[dict]
    # A `TranscriptionStatus` key; NOT_STARTED when there is no transcription.
    transcription_status: str
    # Either "transcribe" or "review".
    activity_mode: str
    disable_ocr: bool
    # URLs of the neighbouring published assets in the same item (by
    # sequence), or None at either end.
    previous_asset_url: Optional[str]
    next_asset_url: Optional[str]
    # (sequence, slug) pairs for every published asset of the item, ordered
    # by sequence.
    asset_navigation: list[tuple[int, str]]
    image_url: str
    thumbnail_url: str
    # Absolute URI of the request that produced this payload.
    current_asset_url: str
    # Sorted, de-duplicated tag values.
    tags: list[str]
    registered_contributors: int
    # Titles of the tutorial cards, in display order.
    cards: list[str]
    # Each entry has "title" and "body"; None when no guides exist.
    guides: Optional[list[dict[str, str]]]
    # Key/value pairs taken from `settings.LANGUAGE_CODES`.
    languages: list[tuple[str, str]]
    undo_available: bool
    redo_available: bool


class ReviewIn(CamelSchema):
    """
    Request body for reviewing a submitted transcription.

    The schema itself accepts any string; the allowed values are enforced by
    the `review_transcription` endpoint, which answers 400 for anything else.

    Request Parameters:
        action (str): Review action, either `"accept"` or `"reject"`.
    """

    action: str  # "accept" or "reject"


class TranscriptionIn(CamelSchema):
    """
    Request body for saving a draft transcription.

    Request Parameters:
        text (str): The transcription text to save.
        supersedes (Optional[int]): The ID of the transcription being
            superseded. May be omitted or sent as null when the asset has no
            transcription yet.
    """

    text: str
    # Explicit default so clients may leave the key out entirely. Without it,
    # Pydantic v2 treats an `Optional[...]` annotation as required-but-nullable
    # and rejects bodies that omit the key.
    supersedes: Optional[int] = None


class OcrTranscriptionIn(CamelSchema):
    """
    Request body for generating an OCR transcription.

    Request Parameters:
        language (str): The ISO 639-3 code of the OCR language to use.
        supersedes (Optional[int]): The ID of the transcription being
            superseded. May be omitted or sent as null when the asset has no
            transcription yet.
    """

    language: str
    # Explicit default so clients may leave the key out entirely. Without it,
    # Pydantic v2 treats an `Optional[...]` annotation as required-but-nullable
    # and rejects bodies that omit the key.
    supersedes: Optional[int] = None


class TranscriptionOut(CamelSchema):
    """
    Serialized representation of a Transcription event/result returned
    by API endpoints that create or mutate transcriptions.

    The nested `asset` payload reflects the asset state after the change, so
    a client can refresh its view from a single response.
    """

    id: int  # noqa: A003
    text: str
    # Server timestamp (seconds since the epoch, from `time()`) taken when
    # the response was built.
    sent: float
    # URL of the submit endpoint for this transcription. The submit and
    # review endpoints do not set it, so it stays None there.
    submission_url: Optional[str] = None
    asset: AssetOut
    undo_available: bool
    redo_available: bool


def serialize_asset(asset: Asset, request: HttpRequest) -> AssetOut:
    """
    Build the `AssetOut` payload for a single asset.

    Args:
        asset (Asset): Asset instance to serialize. Its item, project and
            campaign are traversed, so callers benefit from loading it with
            `select_related("item__project__campaign")`.
        request (HttpRequest): Current request; its absolute URI is reported
            as `current_asset_url`.

    Returns:
        AssetOut: Serialized asset suitable for API responses.
    """
    item = asset.item
    project = item.project
    campaign = project.campaign

    # Used both inside the transcription summary and as a top-level field, so
    # compute it once instead of repeating the underlying work.
    contributor_count = asset.get_contributor_count()

    # Latest transcription and the status key derived from it
    transcription = asset.transcription_set.order_by("-pk").first()
    transcription_out = None
    transcription_status = TranscriptionStatus.NOT_STARTED
    if transcription:
        status_label = transcription.status
        transcription_out = {
            "id": transcription.pk,
            "status": status_label,
            "text": transcription.text,
            "contributors": contributor_count,
        }
        # `status` is compared against CHOICE_MAP values, so map it back to
        # the corresponding key; unknown values fall back to NOT_STARTED.
        transcription_status = next(
            (
                key
                for key, label in TranscriptionStatus.CHOICE_MAP.items()
                if label == status_label
            ),
            TranscriptionStatus.NOT_STARTED,
        )

    if transcription_status in (
        TranscriptionStatus.NOT_STARTED,
        TranscriptionStatus.IN_PROGRESS,
    ):
        activity_mode = "transcribe"
        disable_ocr = asset.turn_off_ocr()
    elif transcription_status == TranscriptionStatus.SUBMITTED:
        activity_mode = "review"
        disable_ocr = True
    else:
        activity_mode = "transcribe"
        disable_ocr = True

    current_asset_url = request.build_absolute_uri()

    # Neighbouring published assets within the same item, by sequence
    previous_asset = (
        item.asset_set.published()
        .filter(sequence__lt=asset.sequence)
        .order_by("sequence")
        .last()
    )
    next_asset = (
        item.asset_set.published()
        .filter(sequence__gt=asset.sequence)
        .order_by("sequence")
        .first()
    )
    previous_asset_url = previous_asset.get_absolute_url() if previous_asset else None
    next_asset_url = next_asset.get_absolute_url() if next_asset else None

    # Navigation list
    asset_navigation = list(
        item.asset_set.published().order_by("sequence").values_list("sequence", "slug")
    )

    # Image and thumbnail URLs: IIIF download URLs are rewritten to HTTPS and
    # to a bounded 512x512 rendition; otherwise the full image is reused.
    image_url = asset_media_url(asset)
    if asset.download_url and "iiif" in asset.download_url:
        thumbnail_url = asset.download_url.replace(
            "http://tile.loc.gov", "https://tile.loc.gov"
        ).replace("/pct:100/", "/!512,512/")
    else:
        thumbnail_url = image_url

    # Tags. Filter on the asset itself rather than on its slug: the slug route
    # in this module needs campaign, project and item to identify an asset, so
    # a slug alone may match unrelated assets. Prefetching avoids issuing one
    # tag query per collection.
    tag_groups = UserAssetTagCollection.objects.filter(asset=asset).prefetch_related(
        "tags"
    )
    tags = sorted({tag.value for group in tag_groups for tag in group.tags.all()})

    # Cards: the campaign's own family, else the default family (if any)
    card_family = (
        campaign.card_family or CardFamily.objects.filter(default=True).first()
    )
    if card_family:
        cards = list(
            TutorialCard.objects.filter(tutorial=card_family)
            .order_by("order")
            .values_list("card__title", flat=True)
        )
    else:
        cards = []

    # Guides: a single query; an empty result is reported as None
    guides = list(Guide.objects.order_by("order").values("title", "body")) or None

    # Undo/redo availability
    undo_available = asset.can_rollback()[0] if transcription else False
    redo_available = asset.can_rollforward()[0] if transcription else False

    return AssetOut(
        id=asset.id,
        title=asset.title,
        item_id=item.item_id,
        project_slug=project.slug,
        campaign_slug=campaign.slug,
        transcription=transcription_out,
        transcription_status=transcription_status,
        activity_mode=activity_mode,
        disable_ocr=disable_ocr,
        current_asset_url=current_asset_url,
        previous_asset_url=previous_asset_url,
        next_asset_url=next_asset_url,
        asset_navigation=asset_navigation,
        image_url=image_url,
        thumbnail_url=thumbnail_url,
        tags=tags,
        registered_contributors=contributor_count,
        cards=cards,
        guides=guides,
        languages=list(settings.LANGUAGE_CODES.items()),
        undo_available=undo_available,
        redo_available=redo_available,
    )


# Router for asset-scoped endpoints; mounted on `api` under "/assets" at the
# bottom of this module.
assets: Router = Router(tags=["assets"])


@assets.get(
    "/{campaign_slug}/{project_slug}/{item_id}/{asset_slug}/",
    response=AssetOut,
    by_alias=True,
)
def asset_detail_by_slugs(
    request: HttpRequest,
    campaign_slug: str,
    project_slug: str,
    item_id: str,
    asset_slug: str,
) -> AssetOut:
    """
    Look up a published asset by its slug path and serialize it.

    Path Parameters:
        campaign_slug (str): Slug of the campaign.
        project_slug (str): Slug of the project within that campaign.
        item_id (str): Identifier of the item within that project.
        asset_slug (str): Slug of the asset within that item.

    Returns:
        AssetOut: Serialized asset record. A 404 is raised when no published
        asset matches all four path components.
    """
    published_assets = Asset.objects.published().select_related(
        "item__project__campaign"
    )
    lookup = {
        "item__project__campaign__slug": campaign_slug,
        "item__project__slug": project_slug,
        "item__item_id": item_id,
        "slug": asset_slug,
    }
    matched_asset = get_object_or_404(published_assets, **lookup)
    return serialize_asset(matched_asset, request)


@assets.get("/{asset_id}", response=AssetOut, by_alias=True)
def asset_detail(request: HttpRequest, asset_id: int) -> AssetOut:
    """
    Return the serialized record of a published asset, looked up by ID.

    Path Parameters:
        asset_id (int): Primary key of the asset.

    Returns:
        AssetOut: Serialized asset record. A 404 is raised when no published
        asset has that primary key.
    """
    published_assets = Asset.objects.published().select_related(
        "item__project__campaign"
    )
    matched_asset = get_object_or_404(published_assets, pk=asset_id)
    return serialize_asset(matched_asset, request)


@assets.post("/{asset_id}/transcriptions", response=TranscriptionOut, by_alias=True)
@atomic
def create_transcription(
    request: HttpRequest, asset_id: int, payload: TranscriptionIn
) -> TranscriptionOut:
    """
    Create a new draft transcription for the given asset.

    Replaces any open draft transcription and validates content. Mirrors
    the legacy `save_transcription` view.

    The whole operation runs inside a transaction, like the other mutating
    asset endpoints in this module, so the supersede checks and the insert
    are committed or rolled back together.

    Path Parameters:
        asset_id (int): Primary key of a published asset.

    Request Parameters:
        text (str): The transcription text; must not contain URLs.
        supersedes (Optional[int]): ID of the transcription being replaced.

    Returns:
        TranscriptionOut: The saved transcription and refreshed asset state.

    Raises:
        HttpError: 400 if the text contains a URL or `supersedes` does not
            refer to a transcription of this asset; 409 if an open
            transcription already exists or the referenced transcription
            has already been superseded.
    """
    asset = get_object_or_404(
        Asset.objects.published().select_related("item__project__campaign"), pk=asset_id
    )

    user = request.user if not request.user.is_anonymous else get_anonymous_user()

    structured_logger.info(
        "API transcription save start",
        event_code="transcription_save_start",
        user=user,
        asset=asset,
    )

    # Validate transcription text (disallow URLs)
    if re.search(URL_REGEX, payload.text):
        structured_logger.warning(
            "API transcription rejected due to URL",
            event_code="transcription_save_rejected",
            reason="URL detected in transcription",
            reason_code="url_detected",
            user=user,
            asset=asset,
        )
        raise HttpError(
            400,
            "It looks like your text contains URLs. Please remove them and try again.",
        )

    # Supersede logic
    supersedes_pk = payload.supersedes
    superseded = None

    if not supersedes_pk:
        # Without a `supersedes` value this must be the asset's first
        # transcription; any existing root transcription is a conflict.
        if asset.transcription_set.filter(supersedes=None).exists():
            structured_logger.warning(
                "API transcription save failed: open transcription exists",
                event_code="transcription_save_aborted",
                reason="Open transcription already exists",
                reason_code="already_exists",
                user=user,
                asset=asset,
            )
            raise HttpError(409, "An open transcription already exists")
    else:
        # The referenced transcription must not have a successor already.
        if asset.transcription_set.filter(supersedes=supersedes_pk).exists():
            structured_logger.warning(
                "API transcription save failed: already superseded",
                event_code="transcription_save_aborted",
                reason="Superseded transcription is invalid",
                reason_code="superseded_invalid",
                user=user,
                asset=asset,
                supersedes_pk=supersedes_pk,
            )
            raise HttpError(409, "This transcription has been superseded")

        try:
            superseded = asset.transcription_set.get(pk=supersedes_pk)
        except Transcription.DoesNotExist as err:
            structured_logger.warning(
                "API transcription save failed: supersedes not found",
                event_code="transcription_save_aborted",
                reason="Superseded transcription not found",
                reason_code="not_found",
                user=user,
                asset=asset,
                supersedes_pk=supersedes_pk,
            )
            raise HttpError(400, "Invalid supersedes value") from err

    # OCR provenance is inherited from the transcription being replaced.
    ocr_originated = bool(
        superseded and (superseded.ocr_generated or superseded.ocr_originated)
    )

    transcription = Transcription(
        asset=asset,
        user=user,
        supersedes=superseded,
        text=payload.text,
        ocr_originated=ocr_originated,
    )
    transcription.full_clean()
    transcription.save()

    structured_logger.info(
        "API transcription save success",
        event_code="transcription_save_success",
        user=user,
        transcription=transcription,
    )

    return TranscriptionOut(
        id=transcription.pk,
        sent=time(),
        text=transcription.text,
        submission_url=reverse("api:submit_transcription", args=[transcription.pk]),
        asset=serialize_asset(asset, request),
        undo_available=asset.can_rollback()[0],
        redo_available=asset.can_rollforward()[0],
    )


@assets.post("/{asset_id}/transcriptions/ocr", response=TranscriptionOut, by_alias=True)
@atomic
def create_ocr_transcription(
    request: HttpRequest, asset_id: int, payload: OcrTranscriptionIn
) -> TranscriptionOut:
    """
    Create and save a new OCR-generated transcription for an asset.

    When `supersedes` is not supplied, an empty transcription owned by the
    anonymous user is created first so the OCR result has something to
    supersede. That is only allowed when the asset has no root transcription
    yet, matching the check performed by `create_transcription`.

    Path Parameters:
        asset_id (int): Primary key of a published asset.

    Request Parameters:
        language (str): OCR language code passed to the asset's OCR routine.
        supersedes (Optional[int]): ID of the transcription being replaced.

    Returns:
        TranscriptionOut: The OCR transcription and refreshed asset state.

    Raises:
        HttpError: 400 if `supersedes` does not refer to a transcription of
            this asset; 409 if that transcription has already been
            superseded, or if `supersedes` is missing while an open
            transcription already exists.
    """
    asset = get_object_or_404(
        Asset.objects.published().select_related("item__project__campaign"),
        pk=asset_id,
    )
    user = request.user if not request.user.is_anonymous else get_anonymous_user()

    supersedes_pk = payload.supersedes
    language = payload.language

    structured_logger.info(
        "API OCR transcription generation start",
        event_code="ocr_generation_start",
        user=user,
        asset=asset,
        supersedes_pk=supersedes_pk,
        language=language,
    )

    # Determine superseded transcription
    superseded = None
    if supersedes_pk:
        if asset.transcription_set.filter(supersedes=supersedes_pk).exists():
            structured_logger.warning(
                "API OCR generation aborted: superseded transcription is invalid.",
                event_code="ocr_generation_aborted",
                reason="Superseded transcription is already superseded",
                reason_code="superseded_invalid",
                user=user,
                asset=asset,
                supersedes_pk=supersedes_pk,
            )
            raise HttpError(409, "This transcription has already been superseded")
        try:
            superseded = asset.transcription_set.get(pk=supersedes_pk)
        except Transcription.DoesNotExist as err:
            structured_logger.warning(
                "API OCR generation aborted: superseded transcription not found.",
                event_code="ocr_generation_aborted",
                reason="Superseded transcription not found",
                reason_code="not_found",
                user=user,
                asset=asset,
                supersedes_pk=supersedes_pk,
            )
            raise HttpError(400, "Invalid supersedes value") from err
    else:
        # A missing `supersedes` is only valid for an asset without any root
        # transcription; otherwise a second, parallel history would be
        # started alongside the existing one.
        if asset.transcription_set.filter(supersedes=None).exists():
            structured_logger.warning(
                "API OCR generation aborted: open transcription exists.",
                event_code="ocr_generation_aborted",
                reason="Open transcription already exists",
                reason_code="already_exists",
                user=user,
                asset=asset,
            )
            raise HttpError(409, "An open transcription already exists")

        # No transcription exists, so we create a blank one
        structured_logger.info(
            "No existing transcription; creating blank for OCR supersession",
            event_code="ocr_blank_supersede",
            user=user,
            asset=asset,
        )
        superseded = Transcription(
            asset=asset,
            user=get_anonymous_user(),
            text="",
        )
        superseded.full_clean()
        superseded.save()

        structured_logger.info(
            "Blank transcription created for OCR supersession",
            event_code="ocr_blank_transcription_created",
            user=user,
            transcription=superseded,
        )

    transcription_text = asset.get_ocr_transcript(language)

    transcription = Transcription(
        asset=asset,
        user=user,
        supersedes=superseded,
        text=transcription_text,
        ocr_generated=True,
        ocr_originated=True,
    )
    transcription.full_clean()
    transcription.save()

    structured_logger.info(
        "API OCR transcription successfully created",
        event_code="ocr_generation_success",
        user=user,
        transcription=transcription,
    )

    return TranscriptionOut(
        id=transcription.pk,
        sent=time(),
        text=transcription.text,
        submission_url=reverse("api:submit_transcription", args=[transcription.pk]),
        asset=serialize_asset(asset, request),
        undo_available=asset.can_rollback()[0],
        redo_available=asset.can_rollforward()[0],
    )


@assets.post(
    "/{asset_id}/transcriptions/rollback",
    response=TranscriptionOut,
    by_alias=True,
)
@atomic
def rollback(request: HttpRequest, asset_id: int) -> TranscriptionOut:
    """
    Undo: move the asset's transcription back one step in its history.

    Path Parameters:
        asset_id (int): Primary key of the asset.

    Returns:
        TranscriptionOut: The transcription produced by the rollback together
        with the refreshed asset state.

    Raises:
        HttpError: 400 when the asset reports no transcription to roll back
            to.
    """
    asset = get_object_or_404(Asset, pk=asset_id)
    if request.user.is_anonymous:
        user = get_anonymous_user()
    else:
        user = request.user

    try:
        restored = asset.rollback_transcription(user)
    except ValueError as exc:
        structured_logger.warning(
            "Rollback failed: no previous transcription to revert to.",
            event_code="rollback_failed",
            reason_code="no_valid_target",
            reason=str(exc),
            asset=asset,
            user=user,
        )
        raise HttpError(400, "No previous transcription available") from exc

    structured_logger.info(
        "Rollback successfully performed.",
        event_code="rollback_success",
        user=user,
        transcription=restored,
    )

    # Assemble the response pieces in the same order the fields are declared.
    sent_at = time()
    submit_url = reverse("api:submit_transcription", args=[restored.pk])
    asset_payload = serialize_asset(asset, request)
    can_undo = asset.can_rollback()[0]
    can_redo = asset.can_rollforward()[0]

    return TranscriptionOut(
        id=restored.pk,
        sent=sent_at,
        text=restored.text,
        submission_url=submit_url,
        asset=asset_payload,
        undo_available=can_undo,
        redo_available=can_redo,
    )


@assets.post(
    "/{asset_id}/transcriptions/rollforward",
    response=TranscriptionOut,
    by_alias=True,
)
@atomic
def rollforward(request: HttpRequest, asset_id: int) -> TranscriptionOut:
    """
    Redo: move the asset's transcription forward one step in its history.

    Path Parameters:
        asset_id (int): Primary key of the asset.

    Returns:
        TranscriptionOut: The transcription produced by the rollforward
        together with the refreshed asset state.

    Raises:
        HttpError: 400 when the asset reports no transcription to restore.
    """
    asset = get_object_or_404(Asset, pk=asset_id)
    if request.user.is_anonymous:
        user = get_anonymous_user()
    else:
        user = request.user

    try:
        restored = asset.rollforward_transcription(user)
    except ValueError as exc:
        structured_logger.warning(
            "Rollforward failed: no transcription available to restore.",
            event_code="rollforward_failed",
            reason_code="no_valid_target",
            reason=str(exc),
            asset=asset,
            user=user,
        )
        raise HttpError(400, "No transcription to restore") from exc

    structured_logger.info(
        "Rollforward successfully performed.",
        event_code="rollforward_success",
        user=user,
        transcription=restored,
    )

    # Assemble the response pieces in the same order the fields are declared.
    sent_at = time()
    submit_url = reverse("api:submit_transcription", args=[restored.pk])
    asset_payload = serialize_asset(asset, request)
    can_undo = asset.can_rollback()[0]
    can_redo = asset.can_rollforward()[0]

    return TranscriptionOut(
        id=restored.pk,
        sent=sent_at,
        text=restored.text,
        submission_url=submit_url,
        asset=asset_payload,
        undo_available=can_undo,
        redo_available=can_redo,
    )


# Router for transcription-scoped endpoints; mounted on `api` under
# "/transcriptions" at the bottom of this module.
transcriptions: Router = Router(tags=["transcriptions"])


@transcriptions.post("/{pk}/submit", response=TranscriptionOut, by_alias=True)
@atomic
def submit_transcription(request: HttpRequest, pk: int) -> TranscriptionOut:
    """
    Submit a transcription for review (API version of legacy view).

    Runs inside a transaction, like the other mutating endpoints in this
    module, so the state checks and the update are applied together.

    Path Parameters:
        pk (int): Primary key of the transcription to submit.

    Returns:
        TranscriptionOut: The submitted transcription and refreshed asset
        state. Undo and redo are reported as unavailable.

    Raises:
        HttpError: 400 if the transcription has been superseded, or is
            already submitted and not rejected.
    """
    transcription = get_object_or_404(Transcription, pk=pk)
    asset = transcription.asset

    user = request.user if not request.user.is_anonymous else get_anonymous_user()

    structured_logger.info(
        "API transcription submit start",
        event_code="transcription_submit_start",
        user=user,
        transcription=transcription,
    )

    # Cannot submit already-submitted or superseded transcription
    is_superseded = asset.transcription_set.filter(supersedes=pk).exists()
    # Coerced to a real boolean so the logged value is not a timestamp/None.
    is_already_submitted = bool(
        transcription.submitted and not transcription.rejected
    )

    if is_superseded or is_already_submitted:
        structured_logger.warning(
            "API transcription submit failed: already submitted or superseded",
            event_code="transcription_submit_rejected",
            reason="Transcription already submitted or superseded",
            reason_code="already_updated",
            user=user,
            transcription=transcription,
            is_superseded=is_superseded,
            is_already_submitted=is_already_submitted,
        )
        raise HttpError(
            400,
            "This transcription has already been updated. "
            "Reload the current status before continuing.",
        )

    # Perform the submission; clearing `rejected` lets a previously rejected
    # transcription be submitted again.
    transcription.submitted = now()
    transcription.rejected = None
    transcription.full_clean()
    transcription.save()

    structured_logger.info(
        "API transcription submitted",
        event_code="transcription_submit_success",
        user=user,
        transcription=transcription,
    )

    return TranscriptionOut(
        id=transcription.pk,
        text=transcription.text,
        sent=time(),
        asset=serialize_asset(asset, request),
        undo_available=False,
        redo_available=False,
    )


@transcriptions.patch(
    "/{pk}/review",
    response=TranscriptionOut,
    by_alias=True,
)
def review_transcription(
    request: HttpRequest, pk: int, payload: ReviewIn
) -> TranscriptionOut:
    """
    Accept or reject a submitted transcription.

    Path Parameters:
        pk (int): Primary key of the transcription under review.

    Request Parameters:
        action (str): `"accept"` to accept or `"reject"` to reject.

    Returns:
        TranscriptionOut: The reviewed transcription and refreshed asset
        state. Undo and redo are reported as unavailable.

    Raises:
        HttpError: If the action is invalid, the transcription was already
            reviewed, the user attempts a self-accept, or the review rate
            limit is exceeded.
    """
    transcription = get_object_or_404(Transcription, pk=pk)
    asset = transcription.asset
    user = request.user if not request.user.is_anonymous else get_anonymous_user()

    # NOTE(review): the block below swaps the acting user for the most
    # recently joined account whenever someone accepts their own
    # transcription. That sidesteps the self-accept check further down (it
    # can then only trigger when the latest account is the author) and
    # attributes the review and the rate-limit tracking to that other
    # account. It is marked temporary; confirm it is removed before this
    # endpoint is used outside testing.
    # Temporary workaround to allow self-accepts for testing
    if payload.action == "accept" and transcription.user.pk == user.pk:
        user = ConcordiaUser.objects.latest("date_joined")
    # End workaround

    structured_logger.info(
        "API transcription review start",
        event_code="transcription_review_start",
        user=user,
        transcription_id=pk,
        action=payload.action,
    )

    # The schema accepts any string, so the allowed actions are enforced here.
    if payload.action not in ("accept", "reject"):
        structured_logger.warning(
            "API review rejected: invalid action",
            event_code="transcription_review_rejected",
            reason="Invalid review action",
            reason_code="invalid_action",
            user=user,
            transcription_id=pk,
        )
        raise HttpError(400, "Invalid action")

    # A transcription can only be reviewed once.
    if transcription.accepted or transcription.rejected:
        structured_logger.warning(
            "API review rejected: already reviewed",
            event_code="transcription_review_rejected",
            reason="Transcription has already been reviewed",
            reason_code="already_reviewed",
            user=user,
            transcription=transcription,
        )
        raise HttpError(400, "This transcription has already been reviewed")

    if payload.action == "accept" and transcription.user.pk == user.pk:
        # Logged with `request.user` (the original requester) rather than the
        # possibly swapped `user`.
        structured_logger.warning(
            "API review rejected: self-accept",
            event_code="transcription_review_rejected",
            reason="User attempted to accept their own transcription",
            reason_code="self_accept",
            user=request.user,
            transcription=transcription,
        )
        raise HttpError(400, "You cannot accept your own transcription")

    transcription.reviewed_by = user

    if payload.action == "accept":
        # Only accepts go through the rate-limit check; rejects do not.
        concordia_user = ConcordiaUser.objects.get(pk=user.pk)
        try:
            concordia_user.check_and_track_accept_limit(transcription)
        except RateLimitExceededError as err:
            structured_logger.warning(
                "API review rejected: rate limit exceeded",
                event_code="transcription_review_rejected",
                reason="User exceeded review rate limit",
                reason_code="rate_limit_exceeded",
                user=user,
                transcription=transcription,
            )
            raise HttpError(
                429, configuration_value("review_rate_limit_banner_message")
            ) from err
        transcription.accepted = now()
    else:
        transcription.rejected = now()

    transcription.full_clean()
    transcription.save()

    structured_logger.info(
        "API transcription review success",
        event_code="transcription_review_success",
        user=user,
        transcription=transcription,
        action=payload.action,
    )

    return TranscriptionOut(
        id=transcription.pk,
        text=transcription.text,
        sent=time(),
        asset=serialize_asset(asset, request),
        undo_available=False,
        redo_available=False,
    )


# Mount the routers on the root API object under their URL prefixes.
api.add_router("/assets", assets)
api.add_router("/transcriptions", transcriptions)


================================================
FILE: concordia/api/schemas.py
================================================
from ninja import Schema


def to_camel(string: str) -> str:
    """
    Turn a snake_case identifier into its camelCase form.

    Args:
        string (str): Identifier written in snake_case.

    Returns:
        str: The camelCase equivalent. Text before the first underscore is
        kept exactly as given; each later underscore-separated segment is
        capitalized (first character upper, rest lower) and appended.
    """
    head, *tail = string.split("_")
    return head + "".join(map(str.capitalize, tail))


class CamelSchema(Schema):
    """
    Base schema for Django Ninja that renders JSON with camelCase field names
    while keeping snake_case attribute names in Python code.

    Subclasses declare fields in snake_case; the camelCase names are the
    aliases produced by `to_camel`.
    """

    class Config(Schema.Config):
        """
        Pydantic-style configuration (ninja.Schema is a thin wrapper around Pydantic)
        that enables automatic camelCase aliases and allows population using original
        snake_case field names.
        """

        # Derive every field's alias from its snake_case name.
        alias_generator = to_camel
        # Accept the original field name as well as the alias on input.
        populate_by_name = True


================================================
FILE: concordia/api_views.py
================================================
"""
Very simple generic API views

These provide base classes for Django CBVs which behave differently when the URL
ends with ".json".

You register the view twice in urls.py and it will default to the stock Django
behaviour for the non-JSON endpoint:

    path("transcribe/", views.TranscribeListView.as_view()),
    path("transcribe.json", views.TranscribeListView.as_view()),

The base APIViewMixin implements a base implementation of serialize_object which
uses the generic django.forms.models.model_to_dict and can be overridden as needed.
"""

from time import time

from django.core.serializers.json import DjangoJSONEncoder
from django.forms.models import model_to_dict
from django.http import JsonResponse
from django.views.generic import DetailView, ListView
from django.views.generic.base import TemplateResponseMixin


class URLAwareEncoder(DjangoJSONEncoder):
    """
    DjangoJSONEncoder variant that encodes URL-bearing objects (for example
    ImageFieldFile) as their URL.
    """

    def default(self, obj):
        """
        Encode objects the stock encoder does not handle.

        Falsy objects become None, objects with a `url` attribute become that
        URL, objects with `get_absolute_url()` become its result, and anything
        else is delegated to the parent encoder.
        """
        # Falsy check first: besides the obvious cases, FileField values (and
        # subclasses such as ImageField) expose a `url` property that raises
        # ValueError when the file name is empty, so they must not reach the
        # attribute probes below.
        if not obj:
            return None

        if hasattr(obj, "url"):
            return obj.url

        if hasattr(obj, "get_absolute_url"):
            return obj.get_absolute_url()

        return super().default(obj)


class APIViewMixin(TemplateResponseMixin):
    """
    TemplateResponseMixin variant that answers with a JSON rendering of the
    context data when the URL path ends in .json or the querystring contains
    "format=json", and with the normal template response otherwise.
    """

    def render_to_response(self, context, **response_kwargs):
        """Pick the JSON or the template response for the current request."""
        # Content negotiation via Accept headers is deliberately not done
        # here; it could be added at the cost of extra support overhead.
        request = self.request
        wants_json = (
            request.path.endswith(".json") or request.GET.get("format") == "json"
        )
        if not wants_json:
            return super().render_to_response(context, **response_kwargs)
        return self.render_to_json_response(context)

    def render_to_json_response(self, context):
        """Serialize the context, absolutize its URLs and wrap it as JSON."""
        payload = self.serialize_context(context)
        self.make_absolute_urls(payload)
        return JsonResponse(payload, encoder=URLAwareEncoder)

    def serialize_context(self, context):
        """
        Return the data to encode for `context`.

        The base implementation hands the context back untouched; subclasses
        are expected to narrow it down.
        """
        return context

    def serialize_object(self, obj):
        """
        Convert a model instance to a dict via `model_to_dict`, adding a
        "url" entry when the object defines `get_absolute_url`.
        """
        serialized = model_to_dict(obj)
        if hasattr(obj, "get_absolute_url"):
            serialized["url"] = obj.get_absolute_url()
        return serialized

    def make_absolute_urls(self, data):
        """
        Recursively rewrite, in place, every string value that starts with
        "/" and is stored under a key ending in "url" into an absolute URI.
        Nested dicts and lists are walked; anything else is left alone.
        """
        if isinstance(data, list):
            for element in data:
                self.make_absolute_urls(element)
            return

        if not isinstance(data, dict):
            return

        for key, value in data.items():
            is_relative_url = (
                key.endswith("url") and isinstance(value, str) and value.startswith("/")
            )
            if is_relative_url:
                data[key] = self.request.build_absolute_uri(value)
            elif isinstance(value, (dict, list)):
                self.make_absolute_urls(value)


class APIDetailView(APIViewMixin, DetailView):
    """DetailView that can additionally answer with JSON."""

    def serialize_context(self, context):
        """Expose only the serialized detail object, under "object"."""
        serialized = self.serialize_object(context["object"])
        return {"object": serialized}


class APIListView(APIViewMixin, ListView):
    """ListView which can also return JSON with consistent pagination"""

    def render_to_response(self, context, **response_kwargs):
        """
        Render the list, adding pagination links to the context and to the
        response's ``Link`` header when a page object is present.
        """
        page_obj = context.get("page_obj")

        if page_obj:
            per_page = context["paginator"].per_page

            pagination = {
                "first": self.build_url_for_page(1, per_page),
                "last": self.build_url_for_page(page_obj.paginator.num_pages, per_page),
            }
            if page_obj.has_next():
                pagination["next"] = self.build_url_for_page(
                    page_obj.next_page_number(), per_page
                )
            context["pagination"] = pagination

        response = super().render_to_response(context, **response_kwargs)

        if "pagination" in context:
            # Read the links back from the context rather than from a local
            # that is only bound when this method built them itself.
            response["Link"] = ", ".join(
                f'<{url}>; rel="{rel}"' for rel, url in context["pagination"].items()
            )

        return response

    def build_url_for_page(self, page_number, per_page):
        """
        Return the absolute URL of the current path for the given page,
        preserving the other query-string parameters of the request.
        """
        qs = self.request.GET.copy()
        qs["page"] = page_number
        qs["per_page"] = per_page
        return self.request.build_absolute_uri(
            "%s?%s" % (self.request.path, qs.urlencode())
        )

    def get_paginate_by(self, queryset):
        """
        Return the page size: a valid positive ``per_page`` query parameter
        if one was supplied, otherwise the view's ``paginate_by``.
        """
        per_page = self.request.GET.get("per_page", "")

        # `str.isdigit()` alone also accepts characters such as "²" which
        # `int()` rejects, so restrict the input to ASCII digits.
        if per_page.isascii() and per_page.isdigit():
            try:
                page_size = int(per_page)
            except ValueError:
                # e.g. a digit string too long for int() to convert
                page_size = 0
            # A page size of zero would switch pagination off entirely, so
            # treat it like any other invalid value.
            if page_size > 0:
                return page_size

        return self.paginate_by

    def serialize_context(self, context):
        """
        Return the JSON payload: the serialized objects, a server timestamp
        and, when available, the pagination links.
        """
        data = {
            "objects": [self.serialize_object(i) for i in context["object_list"]],
            "sent": time(),
        }

        if "pagination" in context:
            data["pagination"] = context["pagination"]

        return data


================================================
FILE: concordia/apps.py
================================================
from django.apps.config import AppConfig
from django.contrib.admin.apps import AdminConfig
from django.contrib.staticfiles.apps import StaticFilesConfig


class ConcordiaAppConfig(AppConfig):
    """Django application configuration for the ``concordia`` app."""

    name = "concordia"

    def ready(self) -> None:
        """Import the signal handlers module once the app is ready."""
        # Imported for its side effects only (presumably receiver
        # registration — confirm in concordia/signals/handlers.py); the name
        # is otherwise unused, hence the NOQA marker.
        from .signals import handlers  # NOQA


class ConcordiaAdminConfig(AdminConfig):
    """Admin application configuration that selects the project's admin site."""

    # Dotted path of the admin site class used as the default site.
    default_site = "concordia.admin_site.ConcordiaAdminSite"

    def ready(self) -> None:
        """Run admin autodiscovery on the configured admin module."""
        # NOTE(review): this override does not call ``super().ready()``;
        # confirm that skipping the parent implementation is intentional.
        self.module.autodiscover()


class ConcordiaStaticFilesConfig(StaticFilesConfig):
    """Static files application configuration with custom ignore patterns."""

    # Patterns to ignore — presumably keeps SCSS and unbuilt JavaScript
    # sources out of collected static files (confirm against the build).
    ignore_patterns = ["scss", "js/src/*"]


================================================
FILE: concordia/asgi.py
================================================
"""
ASGI entrypoint — see https://channels.readthedocs.io/en/latest/asgi.html
"""

import django
from channels.routing import get_default_application

# Initialize Django first; the Channels application is resolved afterwards.
django.setup()

# Module-level ASGI application object exposed by this entrypoint.
application = get_default_application()


================================================
FILE: concordia/authentication_backends.py
================================================
from typing import Any

from django.contrib.auth import get_user_model
from django.contrib.auth.backends import ModelBackend
from django.contrib.auth.models import AbstractBaseUser
from django.db.models import Q
from django.http import HttpRequest


class EmailOrUsernameModelBackend(ModelBackend):
    """
    Authentication backend that accepts either username or email.

    Behavior:
      * Returns ``None`` immediately when no username or no password was
        supplied, without touching the database.
      * Looks up users by ``USERNAME_FIELD`` or case-insensitive ``email``.
      * If multiple accounts match (e.g., same email in different fields),
        iterates through matches and returns the first with a valid password.
      * When no user matches, runs the hasher once to reduce timing
        differences between existing and non-existing users.

    Usage:
        In ``settings.py``:

            AUTHENTICATION_BACKENDS = [
                "concordia.authentication_backends.EmailOrUsernameModelBackend",
                "django.contrib.auth.backends.ModelBackend",
            ]

    Security notes:
      * The fallback hash on a miss helps mitigate user enumeration via
        timing side channels.
    """

    def authenticate(
        self,
        request: HttpRequest | None,
        username: str | None = None,
        password: str | None = None,
        **kwargs: Any,
    ) -> AbstractBaseUser | None:
        """
        Authenticate with either a username or an email address.

        Args:
            request:
                The current HTTP request or ``None`` (older Django may pass
                ``None``).
            username:
                The credential provided by the client. May be a username or an
                email address. If ``None``, the method will read the
                ``USERNAME_FIELD`` from ``kwargs``.
            password:
                The plaintext password to validate.

        Returns:
            The authenticated user instance, or ``None`` if authentication
            fails or the credentials are incomplete.
        """
        # n.b. Django <2.1 does not pass the `request`
        user_model = get_user_model()

        if username is None:
            username = kwargs.get(user_model.USERNAME_FIELD)

        # Without both credentials nothing can match. Bail out before the
        # query below, which would otherwise run with ``None`` as the lookup
        # value (e.g. when this backend is offered other kinds of
        # credentials through ``**kwargs``).
        if username is None or password is None:
            return None

        # The `username` field is allowed to contain `@` characters so
        # technically a given email address could be present in either field,
        # possibly even for different users, so we'll query for all matching
        # records and test each one.
        users = user_model._default_manager.filter(
            Q(**{user_model.USERNAME_FIELD: username}) | Q(email__iexact=username)
        )

        # Test whether any matched user has the provided password:
        for user in users:
            if user.check_password(password):
                return user
        if not users:
            # Run the default password hasher once to reduce the timing
            # difference between an existing and a non-existing user (see
            # https://code.djangoproject.com/ticket/20760)
            user_model().set_password(password)
        return None


================================================
FILE: concordia/celery.py
================================================
import importlib
import os
import pkgutil

import sentry_sdk
from celery import Celery
from sentry_sdk.integrations.celery import CeleryIntegration

from concordia.version import get_concordia_version

# Sentry DSN from the environment; Sentry is only initialized when it is set.
SENTRY_BACKEND_DSN = os.environ.get("SENTRY_BACKEND_DSN", None)

if SENTRY_BACKEND_DSN:
    # Pass the deployment environment and the Concordia version to Sentry,
    # and enable its Celery integration.
    CONCORDIA_ENVIRONMENT = os.environ.get("CONCORDIA_ENVIRONMENT", None)
    sentry_sdk.init(
        SENTRY_BACKEND_DSN,
        environment=CONCORDIA_ENVIRONMENT,
        release=get_concordia_version(),
        integrations=[CeleryIntegration()],
    )

# The Celery application instance for this project.
app = Celery("concordia")

# Using a string here means the worker doesn't have to serialize
# the configuration object to child processes.
# - namespace='CELERY' means all celery-related configuration keys
#   should have a `CELERY_` prefix.
app.config_from_object("django.conf:settings", namespace="CELERY")

# Load task modules from all registered Django app configs.
app.autodiscover_tasks()


def import_all_submodules(package_name: str):
    """
    Import ``package_name`` and every module found beneath it.

    A plain module (one without a ``__path__``) is imported and nothing more
    is done. For a package, each module reported by
    ``pkgutil.walk_packages`` is imported by its fully qualified name.

    Args:
        package_name: Dotted name of the package or module to import.

    Returns:
        None.
    """
    package = importlib.import_module(package_name)

    try:
        search_path = package.__path__
    except AttributeError:
        # Not a package, so there are no submodules to walk.
        return

    prefix = package.__name__ + "."
    for _finder, module_name, _is_package in pkgutil.walk_packages(search_path, prefix):
        importlib.import_module(module_name)


# Celery's autodiscovery only finds tasks.py or tasks/__init__.py, so every
# other module under these packages is imported explicitly. The work is
# attached to on_after_finalize so it is deferred until after Django is
# fully loaded.
@app.on_after_finalize.connect
def _load_all_task_modules(sender, **kwargs):
    """Import every submodule of the project's task packages."""
    for task_package in ("concordia.tasks", "importer.tasks"):
        import_all_submodules(task_package)


================================================
FILE: concordia/consumers.py
================================================
import time

from channels.generic.websocket import AsyncJsonWebsocketConsumer


class AssetConsumer(AsyncJsonWebsocketConsumer):
    """
    WebSocket consumer that relays asset events as JSON.

    Each connection joins the ``asset_updates`` group on connect and leaves
    it on disconnect. Every handled event is sent to the client as
    ``{"message": <event>, "sent": <integer Unix time>}``.
    """

    async def connect(self):
        # Join the group before accepting the socket.
        await self.channel_layer.group_add("asset_updates", self.channel_name)
        await self.accept()

    async def disconnect(self, code):
        await self.channel_layer.group_discard("asset_updates", self.channel_name)

    async def _relay(self, message):
        """Send ``message`` to the client together with the send time."""
        payload = {"message": message, "sent": int(time.time())}
        await self.send_json(payload)

    async def asset_update(self, message):
        await self._relay(message)

    async def asset_reservation_obtained(self, message):
        await self._relay(message)

    async def asset_reservation_released(self, message):
        await self._relay(message)


================================================
FILE: concordia/context_processors.py
================================================
from typing import Any, Dict

from django.conf import settings
from django.core.cache import cache
from django.http import HttpRequest


def system_configuration(request: HttpRequest) -> Dict[str, Any]:
    """
    Context processor exposing a few settings values to templates.

    Keys added:
      * SENTRY_FRONTEND_DSN: the setting's value, or None when it is absent
      * CONCORDIA_ENVIRONMENT: read directly from settings (must be defined)
      * S3_BUCKET_NAME: the setting's value, or None when it is absent
      * APPLICATION_VERSION: the setting's value, or None when it is absent

    Args:
        request:
            The current HTTP request. Required by the context processor
            signature; not used.

    Returns:
        dict: Mapping of the keys above to their values.
    """

    def optional(setting_name: str) -> Any:
        # Settings that may be missing resolve to None instead of raising.
        return getattr(settings, setting_name, None)

    context: Dict[str, Any] = {}
    context["SENTRY_FRONTEND_DSN"] = optional("SENTRY_FRONTEND_DSN")
    context["CONCORDIA_ENVIRONMENT"] = settings.CONCORDIA_ENVIRONMENT
    context["S3_BUCKET_NAME"] = optional("S3_BUCKET_NAME")
    context["APPLICATION_VERSION"] = optional("APPLICATION_VERSION")
    return context


def site_navigation(request: HttpRequest) -> Dict[str, Any]:
    """
    Context processor deriving navigation helpers from the request.

    Keys added:
      * VIEW_NAME: ``request.resolver_match.view_name`` when a resolver
        match is present
      * VIEW_NAME_FOR_CSS: VIEW_NAME with every ``:`` replaced by ``--``
      * PATH_LEVEL_N: the N-th path segment, counting from 1

    Example:
        ``/campaigns/demo/item/123/`` produces::

            {
                "PATH_LEVEL_1": "campaigns",
                "PATH_LEVEL_2": "demo",
                "PATH_LEVEL_3": "item",
                "PATH_LEVEL_4": "123",
            }

    Args:
        request:
            The current HTTP request; its ``resolver_match`` and ``path``
            are read.

    Returns:
        dict: Mapping of helper keys to values for templates.
    """
    helpers: Dict[str, Any] = {}

    resolved = request.resolver_match
    if resolved:
        view_name = resolved.view_name
        helpers["VIEW_NAME"] = view_name
        helpers["VIEW_NAME_FOR_CSS"] = view_name.replace(":", "--")

    # Leading and trailing slashes are dropped before splitting, so the root
    # path yields a single empty segment.
    segments = request.path.strip("/").split("/")
    helpers.update(
        ("PATH_LEVEL_%d" % position, segment)
        for position, segment in enumerate(segments, start=1)
    )

    return helpers


def maintenance_mode_frontend_available(request: HttpRequest) -> Dict[str, Any]:
    """
    Context processor exposing the front-end maintenance mode flag.

    Looks up the ``maintenance_mode_frontend_available`` cache key, using
    ``False`` when the key is missing, and returns the value under the same
    name.

    Args:
        request:
            The current HTTP request. Required by the context processor
            signature; not used.

    Returns:
        dict: ``{"maintenance_mode_frontend_available": <cached value>}``.
    """
    return {
        "maintenance_mode_frontend_available": cache.get(
            "maintenance_mode_frontend_available", False
        )
    }


def request_id_context(request: HttpRequest) -> Dict[str, Any]:
    """
    Context processor exposing the request's identifier to templates.

    Reads ``request.request_id`` (expected to be attached by middleware) and
    falls back to ``None`` when the attribute is missing.

    Args:
        request:
            The current HTTP request, which may carry ``request_id``.

    Returns:
        dict: ``{"request_id": str | None}``.
    """
    request_id = getattr(request, "request_id", None)
    return {"request_id": request_id}


================================================
FILE: concordia/contextmanagers.py
================================================
# Based on code from
# https://docs.celeryq.dev/en/v5.5.0/tutorials/task-cookbook.html#ensuring-a-task-is-only-executed-one-at-a-time

import logging
import time
from collections.abc import Generator
from contextlib import contextmanager

from django.core.cache import cache

logger = logging.getLogger(__name__)

DEFAULT_LOCK_DURATION = 60 * 10  # 10 minutes


@contextmanager
def cache_lock(
    lock_id: str,
    oid: str,
    lock_duration: int = DEFAULT_LOCK_DURATION,
) -> Generator[bool, None, None]:
    """
    Context manager to acquire a distributed cache-based lock.

    Ensures that only one process or thread can execute a block of code
    associated with a given lock ID at a time. Uses Django's cache backend
    and `cache.add` to store the lock key, then `cache.delete` to release the
    lock when exiting the context if it was acquired and has not expired.

    Args:
        lock_id (str): Unique key identifying the lock in the cache.
        oid (str): Identifier for the owner of the lock. Stored as the cache
            value but not otherwise used.
        lock_duration (int): How long to hold the lock in seconds. Defaults
            to 10 minutes.

    Yields:
        bool: True if the lock was acquired, False otherwise.

    Raises:
        Exception: Whatever `cache.add` raises is propagated unchanged; in
            that case the body of the `with` block does not run and no
            release is attempted.

    Usage:
        with cache_lock("my-task-lock", "worker-1") as acquired:
            if acquired:
                # Do protected work here
            else:
                # Skip or retry later
    """
    timeout_at = time.monotonic() + lock_duration
    # cache.add does nothing and returns False if the key already exists.
    # Acquire outside the try block: if this call fails, the finally clause
    # must not run and reference a status that was never assigned, which
    # would replace the real error with an UnboundLocalError.
    status = cache.add(lock_id, oid, lock_duration)
    try:
        yield status
    finally:
        if status and time.monotonic() < timeout_at:
            # Don't release the lock if we did not acquire it
            # Also, don't release the lock if we exceeded the timeout
            # to reduce the chance of releasing an expired lock
            # owned by someone else
            cache.delete(lock_id)


================================================
FILE: concordia/converters.py
================================================
from django.urls.converters import SlugConverter, StringConverter


class UnicodeSlugConverter(SlugConverter):
    """URL path converter for slugs, with a custom match pattern."""

    # This is similar to the slug_unicode_re pattern but is not anchored to the
    # start of the string:
    # NOTE(review): the ``+`` inside the character class matches a literal
    # plus sign in addition to ``-`` and ``\w`` — confirm this is intended.
    regex = r"[-\w+]+"


class ItemIdConverter(StringConverter):
    """URL path converter for item IDs."""

    # Allows . in the item ID
    # Matches one or more of: ASCII letters, digits, ``-``, ``_`` and ``.``.
    regex = r"[-a-zA-Z0-9_\.]+"


================================================
FILE: concordia/decorators.py
================================================
# Based on code from https://gist.github.com/dmwyatt/d09da3f03cbdcad217db35f5cf8a9f94
import hashlib
import logging
from functools import wraps

from celery import Task

from concordia.contextmanagers import cache_lock

logger = logging.getLogger(__name__)


def locked_task(function=None, lock_by_args: bool = True):
    """
    Decorator which prevents a Celery task from running concurrently.

    The task must be bound (``bind=True``) and the Celery task decorator must
    be placed above this one, because the wrapper reads ``self.name`` and
    ``self.request.hostname``.

    Locking by task and arguments (the default)
        The lock key is the task name plus a SHA-256 digest of the call's
        positional and keyword arguments, so calls with different arguments
        may run side by side while a repeated call is skipped::

            @task(bind=True)
            @locked_task                      # no-argument form
            def a_task(self, some_arg):
                ...

            a_task.delay("foo")   # runs
            a_task.delay("foo")   # skipped while the first is still running
            a_task.delay("bar")   # runs; different arguments

    Locking by task only
        With ``lock_by_args=False`` the key is just the task name, so any
        concurrent call is skipped regardless of its arguments::

            @task(bind=True)
            @locked_task(lock_by_args=False)
            def a_task(self, some_arg):
                ...

    Forcing a run
        Passing ``force=True`` as a keyword argument runs the task even when
        the lock could not be acquired, which helps when a lock is stuck.
        The flag is removed before the task function is called and is not
        part of the lock key. It works for direct calls and via the
        ``kwargs`` of ``apply_async``::

            a_task(some_arg, force=True)
            a_task.apply_async(args=(some_arg,), kwargs={"force": True})

    Args:
        function: The task function when used without parentheses; ``None``
            when the decorator is called with arguments.
        lock_by_args: Whether the call arguments take part in the lock key.

    Returns:
        The wrapped task function, or a decorator awaiting the function. The
        wrapped function returns the task's result, or ``None`` when the
        call was skipped because the lock is held elsewhere.
    """

    def decorator(f):
        @wraps(f)
        def wrapped(self: Task, *args, **kwargs):
            # 'force' is consumed here and never reaches the task itself.
            force = kwargs.pop("force", False)

            if not lock_by_args:
                # The task name alone identifies the lock.
                key = self.name
            else:
                # Task name plus hashed arguments: a change in either the
                # positional or the keyword arguments gives a different
                # lock, so that call is allowed to run.
                try:
                    # Hashing keeps the arguments safe for use as a cache key
                    arg_repr = f"{repr(args)}:{repr(sorted(kwargs.items()))}"
                    digest = hashlib.sha256(arg_repr.encode()).hexdigest()
                    key = f"{self.name}:{digest}"
                except Exception:
                    logger.exception(
                        "Unable to create cache key from arguments for %s.", self.name
                    )
                    raise

            with cache_lock(key, self.request.hostname) as acquired:
                if not (acquired or force):
                    logger.info(
                        "Task %s with key %s is already running; skipping",
                        self.name,
                        key,
                    )
                    return None

                if not acquired:
                    logger.warning(
                        "Force-running task %s with key %s; lock not acquired",
                        self.name,
                        key,
                    )
                return f(self, *args, **kwargs)

        return wrapped

    if function:
        return decorator(function)
    return decorator


================================================
FILE: concordia/documents.py
================================================
# Contains OpenSearch documents for indexing models in the Concordia application.
from django.contrib.auth.models import User
from django.db.models import Count
from django_opensearch_dsl import Document, fields
from django_opensearch_dsl.registries import registry

from .models import Asset, SiteReport, Transcription, UserAssetTagCollection


@registry.register_document
class UserDocument(Document):
    """OpenSearch document for the ``User`` model, stored in the ``users`` index."""

    class Index:
        # Name of the Opensearch index
        name = "users"
        # See Opensearch Indices API reference for available settings
        settings = {"number_of_shards": 1, "number_of_replicas": 0}

    # Not a model field; presumably populated from
    # ``prepare_transcription_count`` by the document framework (confirm).
    transcription_count = fields.IntegerField()

    class Django:
        model = User
        # Model fields listed for inclusion in the document.
        fields = ["last_login", "date_joined", "is_active", "id"]

    def prepare_transcription_count(self, instance):
        """Return the number of ``transcription`` relations of ``instance``."""
        # Re-query the same user with an annotated count and read it from
        # the single resulting row.
        qs = User.objects.filter(id=instance.id).annotate(Count("transcription"))
        return qs[0].transcription__count


@registry.register_document
class SiteReportDocument(Document):
    """OpenSearch document for ``SiteReport``, stored in ``site_reports``."""

    class Index:
        # Name of the Opensearch index
        name = "site_reports"
        # See Opensearch Indices API reference for available settings
        settings = {"number_of_shards": 1, "number_of_replicas": 0}

    # Related objects are represented by their slug only.
    campaign = fields.ObjectField(properties={"slug": fields.KeywordField()})
    topic = fields.ObjectField(properties={"slug": fields.KeywordField()})

    class Django:
        model = SiteReport

        # Model fields listed for inclusion in the document.
        fields = [
            "created_on",
            "report_name",
            "assets_total",
            "assets_published",
            "assets_not_started",
            "assets_in_progress",
            "assets_waiting_review",
            "assets_completed",
            "assets_unpublished",
            "items_published",
            "items_unpublished",
            "projects_published",
            "projects_unpublished",
            "anonymous_transcriptions",
            "transcriptions_saved",
            "daily_review_actions",
            "distinct_tags",
            "tag_uses",
            "campaigns_published",
            "campaigns_unpublished",
            "users_registered",
            "users_activated",
            "registered_contributors",
            "daily_active_users",
        ]


@registry.register_document
class TagCollectionDocument(Document):
    """OpenSearch document for ``UserAssetTagCollection``, stored in ``tags``."""

    class Index:
        # Name of the Opensearch index
        name = "tags"
        # See Opensearch Indices API reference for available settings
        settings = {"number_of_shards": 1, "number_of_replicas": 0}

    tags = fields.NestedField(properties={"value": fields.TextField()})
    # Nested mapping of the asset and, beneath it, its item, project and
    # campaign.
    asset = fields.ObjectField(
        properties={
            "title": fields.TextField(),
            "slug": fields.TextField(),
            "transcription_status": fields.KeywordField(),
            "item": fields.ObjectField(
                properties={
                    "item_id": fields.TextField(),
                    "project": fields.ObjectField(
                        properties={
                            "slug": fields.KeywordField(),
                            "campaign": fields.ObjectField(
                                properties={"slug": fields.KeywordField()}
                            ),
                        }
                    ),
                }
            ),
        }
    )
    user = fields.ObjectField(properties={"id": fields.IntegerField()})

    class Django:
        model = UserAssetTagCollection
        fields = ["created_on", "updated_on"]

    def get_queryset(self, *args, **kwargs):
        """Return the parent queryset ordered by ``pk`` with relations prefetched."""
        # The prefetched paths match the relations named in the ``asset``
        # mapping above.
        return (
            super()
            .get_queryset(*args, **kwargs)
            .order_by("pk")
            .prefetch_related(
                "asset__item", "asset__item__project", "asset__item__project__campaign"
            )
        )


@registry.register_document
class TranscriptionDocument(Document):
    """OpenSearch document for ``Transcription``, stored in ``transcriptions``."""

    class Index:
        # Name of the Opensearch index
        name = "transcriptions"
        # See Opensearch Indices API reference for available settings
        settings = {"number_of_shards": 1, "number_of_replicas": 0}

    # Nested mapping of the asset and, beneath it, its item, project,
    # campaign and topics.
    asset = fields.ObjectField(
        properties={
            "title": fields.TextField(),
            "slug": fields.TextField(),
            "transcription_status": fields.KeywordField(),
            "item": fields.ObjectField(
                properties={
                    "item_id": fields.TextField(),
                    "project": fields.ObjectField(
                        properties={
                            "slug": fields.KeywordField(),
                            "campaign": fields.ObjectField(
                                properties={"slug": fields.KeywordField()}
                            ),
                            "topics": fields.NestedField(
                                properties={"slug": fields.KeywordField()}
                            ),
                        }
                    ),
                }
            ),
        }
    )
    # Related objects below are represented by their id only.
    user = fields.ObjectField(properties={"id": fields.IntegerField()})
    reviewed_by = fields.ObjectField(properties={"id": fields.IntegerField()})
    supersedes = fields.ObjectField(properties={"id": fields.IntegerField()})

    class Django:
        model = Transcription

        # Model fields listed for inclusion in the document.
        fields = [
            "id",
            "created_on",
            "updated_on",
            "text",
            "accepted",
            "rejected",
            "submitted",
        ]

    def get_queryset(self, *args, **kwargs):
        """Return the parent queryset ordered by ``pk`` with relations prefetched."""
        # The prefetched paths match the relations named in the ``asset``
        # mapping above.
        return (
            super()
            .get_queryset(*args, **kwargs)
            .order_by("pk")
            .prefetch_related(
                "asset__item",
                "asset__item__project",
                "asset__item__project__topics",
                "asset__item__project__campaign",
            )
        )


@registry.register_document
class AssetDocument(Document):
    """OpenSearch document for the ``Asset`` model, stored in the ``assets`` index."""

    class Index:
        # Name of the Opensearch index
        name = "assets"
        # See Opensearch Indices API reference for available settings
        settings = {"number_of_shards": 1, "number_of_replicas": 0}

    # Nested mapping of the item and, beneath it, its project, campaign and
    # topics.
    item = fields.ObjectField(
        properties={
            "item_id": fields.KeywordField(),
            "project": fields.ObjectField(
                properties={
                    "slug": fields.KeywordField(),
                    "campaign": fields.ObjectField(
                        properties={"slug": fields.KeywordField()}
                    ),
                    "topics": fields.NestedField(
                        properties={"slug": fields.KeywordField()}
                    ),
                }
            ),
        }
    )

    transcription_status = fields.KeywordField()

    # Date fields taken from the asset's ``latest_transcription``.
    latest_transcription = fields.ObjectField(
        properties={
            "created_on": fields.DateField(),
            "updated_on": fields.DateField(),
            "accepted": fields.DateField(),
            "rejected": fields.DateField(),
            "submitted": fields.DateField(),
        }
    )

    # Not a model field; presumably populated from
    # ``prepare_submission_count`` by the document framework (confirm).
    submission_count = fields.IntegerField()

    def prepare_submission_count(self, instance):
        """Count the transcriptions of ``instance`` whose ``submitted`` is null."""
        # NOTE(review): the filter selects rows where ``submitted`` IS NULL,
        # i.e. transcriptions that were not submitted, yet the value is
        # stored as ``submission_count`` — confirm whether
        # ``submitted__isnull=False`` was intended.
        return Transcription.objects.filter(
            asset=instance, submitted__isnull=True
        ).count()

    class Django:
        model = Asset
        # Model fields listed for inclusion in the document.
        fields = ["published", "difficulty", "slug", "sequence", "year"]

    def get_queryset(self, *args, **kwargs):
        """Return the parent queryset ordered by ``pk`` with relations prefetched."""
        # The prefetched paths match the relations named in the ``item``
        # mapping above.
        return (
            super()
            .get_queryset(*args, **kwargs)
            .order_by("pk")
            .prefetch_related(
                "item",
                "item__project",
                "item__project__topics",
                "item__project__campaign",
            )
        )


================================================
FILE: concordia/exceptions.py
================================================
# Creating a specific error for this, since our pre-commit
# checks will not allow us to test for generic exceptions
class CacheLockedError(Exception):
    """
    Exception carrying a message and optional extra details.

    Args:
        message: Text passed to the base ``Exception``.
        details: Optional additional data, stored unchanged on the instance
            as ``details``.
    """

    def __init__(self, message, details=None):
        super().__init__(message)
        # Kept exactly as supplied by the code raising the error.
        self.details = details


class RateLimitExceededError(Exception):
    """Exception type with no extra state beyond ``Exception``."""

    # Presumably raised when a rate limit is exceeded; the raise sites are
    # not visible in this module — confirm with the callers.
    pass


================================================
FILE: concordia/forms.py
================================================
from logging import getLogger
from typing import Any, Iterator

from django import forms
from django.contrib.auth import get_user_model
from django.contrib.auth.forms import (
    AuthenticationForm,
    PasswordResetForm,
    SetPasswordForm,
    UsernameField,
)
from django.http import HttpRequest
from django_registration.backends.activation.views import RegistrationView
from django_registration.forms import RegistrationForm
from django_registration.signals import user_activated

from .turnstile.fields import TurnstileField

User = get_user_model()

logger = getLogger(__name__)


class AllowInactivePasswordResetForm(PasswordResetForm):
    """
    Password reset form that does not exclude inactive users.

    Behavior:
        Replaces the user lookup so that any user with a matching email and
        a usable password is returned, active or not. This lets one reset
        flow both confirm the email address and activate the account.
    """

    def get_users(self, email: str) -> Iterator[User]:
        """
        Return the users who may reset the password for ``email``.

        Args:
            email: Email address to look up, compared case-insensitively.

        Returns:
            Iterator over the matching users that have a usable password.
        """
        # No ``is_active`` filter: inactive users may reset their password
        # and confirm their email address in a single step.
        email_lookup = "%s__iexact" % User.get_email_field_name()
        candidates = User._default_manager.filter(**{email_lookup: email})
        return (
            candidate for candidate in candidates if candidate.has_usable_password()
        )


class ActivateAndSetPasswordForm(SetPasswordForm):
    """
    Set-password form which activates the user on successful save.

    Behavior:
        If the associated user is inactive, mark the user active, perform the
        normal password save, and then emit the django-registration
        ``user_activated`` signal to trigger the welcome email.
    """

    # A successful password reset means the user
    # has confirmed their email address, so
    # set is_active to True.
    def save(self, commit: bool = True) -> User:
        """
        Save the new password and ensure the user is marked active.

        Emits ``user_activated`` when activation occurs. The signal is sent
        only after the parent ``save`` has returned, so a failure while
        saving does not send a welcome email for an account that was never
        activated.

        Args:
            commit: Whether to persist changes immediately.

        Returns:
            The updated user instance.
        """
        activating = not self.user.is_active
        if activating:
            # Set the flag before saving so it is written together with the
            # new password.
            self.user.is_active = True

        user = super().save(commit=commit)

        if activating:
            logger.info("Activated user %s due to password reset", self.user.username)
            # send user_activation signal so that the user will
            # receive a welcome email
            user_activated.send(sender=self.__class__, user=self.user, request=None)

        return user


class UserRegistrationForm(RegistrationForm):
    """
    Registration form with newsletter opt-in.

    Adds a boolean field which, when selected, is later used to add the new
    user to the newsletter group during signal handling.
    """

    # Optional checkbox that is ticked by default.
    newsletterOptIn = forms.BooleanField(
        label="Newsletter",
        initial=True,
        required=False,
        help_text=(
            "Email me 2-3 times a month about campaign updates, upcoming "
            "events and new features."
        ),
    )

    class Meta(RegistrationForm.Meta):
        # Replaces the username help text; the string contains HTML
        # (``<kbd>``) markup.
        help_texts = {
            "username": (
                "Can only contain letters, numbers and any of these symbols:"
                " <kbd>@</kbd>, <kbd>.</kbd>, <kbd>+</kbd>, <kbd>-</kbd>"
                " or <kbd>_</kbd>. 150 characters or fewer."
            )
        }


class UserLoginForm(AuthenticationForm):
    """
    Login form that re-sends the activation email to inactive users.

    Behavior:
        When the credentials are valid but the account is inactive, a new
        activation email is sent and the login is rejected with a message
        telling the user to check their inbox.
    """

    username = UsernameField(
        label="Username or email address",
        widget=forms.TextInput(attrs={"autofocus": True}),
    )

    def confirm_login_allowed(self, user: Any) -> None:
        """
        Block inactive accounts, re-sending their activation email first.

        Args:
            user: The authenticated user instance.

        Raises:
            forms.ValidationError: With code ``inactive`` when the user
                account is not active.
        """
        if user.is_active:
            return

        # Correct username and password, but the email address was never
        # confirmed: send the activation request again and explain why the
        # login was refused.
        logger.warning("Inactive user tried to log in with valid credentials.")
        RegistrationView(request=self.request).send_activation_email(user)

        raise forms.ValidationError(
            "This account has not yet been activated. "
            "An activation email has been sent to the email "
            "address associated with this account. "
            "Please check for this message and click the link "
            "to finish your account registration.",
            code="inactive",
        )


class UserNameForm(forms.Form):
    """
    Minimal form for updating a user's first and last name.

    Fields:
        first_name: Optional first name.
        last_name: Optional last name.
    """

    # Both fields are optional and declared with an empty label.
    first_name = forms.CharField(label="", required=False)
    last_name = forms.CharField(label="", required=False)


class UserProfileForm(forms.Form):
    """
    Profile form for changing the user's email address.

    The submitted address is rejected when any account already uses it,
    including the current user's own account, so that an unchanged address
    does not start a needless confirmation flow.
    """

    email = forms.EmailField(label="", required=True)

    def __init__(self, *, request: HttpRequest, **kwargs) -> None:
        """
        Keep a reference to the request, then initialize the form.

        Args:
            request: The current HTTP request (keyword-only).
            **kwargs: Passed through to ``forms.Form``.
        """
        self.request = request
        super().__init__(**kwargs)

    def clean_email(self) -> str:
        """
        Check that the submitted email address is not already taken.

        The comparison is case-insensitive and covers every account, so the
        current user's existing address is rejected as well.

        Returns:
            The cleaned email string.

        Raises:
            forms.ValidationError: If an account already uses the address.
        """
        submitted = self.cleaned_data["email"]

        # The user's own account is deliberately not excluded: re-submitting
        # the current address would otherwise start the email confirmation
        # process although nothing changed.
        already_used = User.objects.filter(email__iexact=submitted).exists()
        if already_used:
            raise forms.ValidationError("That email address is not available")

        return submitted


class AccountDeletionForm(forms.Form):
    """
    Trivial form that retains the request for view logic.

    Declares no fields of its own. Used where the view needs the request
    object after validation.
    """

    def __init__(self, *, request: HttpRequest, **kwargs) -> None:
        """
        Store the request for later use.

        Args:
            request: The current HTTP request (keyword-only).
            **kwargs: Passed through unchanged to ``forms.Form``.
        """
        # Kept on the instance so it is available as ``form.request``.
        self.request = request
        super().__init__(**kwargs)


class TurnstileForm(forms.Form):
    """
    Simple form embedding the Cloudflare Turnstile verification field.

    Fields:
        turnstile: A TurnstileField created with its default arguments.
            NOTE(review): presumably required and validated against the
            Turnstile API -- confirm against the TurnstileField implementation.
    """

    turnstile = TurnstileField()


================================================
FILE: concordia/logging.py
================================================
import warnings
from types import MappingProxyType
from typing import Any, Callable, Optional

import structlog


def get_logging_user_id(user: Any) -> str:
    """
    Produce the identifier that log entries should use for a user.

    Args:
        user (Any): A Django user object (possibly anonymous), or any object;
            missing attributes are treated as absent.

    Returns:
        user_id (str): ``str(user.id)`` for an authenticated user, or
            "anonymous" when the user is unauthenticated, has the username
            "anonymous" (the Concordia anonymous user), or has no ID.
    """
    is_real_user = (
        getattr(user, "is_authenticated", False)
        and getattr(user, "username", None) != "anonymous"
    )
    if is_real_user:
        identifier = getattr(user, "id", None)
        if identifier is not None:
            return str(identifier)

    return "anonymous"


# Default global registry for semantic context extractors.
# Maps a context key (e.g. "user") to a callable that receives the object
# passed under that key and returns a dict of fields to add to the log entry.
_DEFAULT_EXTRACTORS: dict[str, Callable[[Any], dict[str, Any]]] = {}


def _register_default_extractor(
    context_key: str, extractor_function: Callable[[Any], dict[str, Any]]
) -> None:
    """
    Add (or replace) an entry in the module-level default extractor registry.

    Intended for use while this module is being imported: the registry name is
    later rebound to a read-only ``MappingProxyType``, which does not support
    item assignment.

    Args:
        context_key: Context key the extractor handles (e.g. "asset").
        extractor_function: Callable that takes the object passed under
            ``context_key`` and returns a dict of log fields.
    """
    _DEFAULT_EXTRACTORS[context_key] = extractor_function


# Built-in extractors
_register_default_extractor("user", lambda user: {"user_id": get_logging_user_id(user)})

# Extractors that delegate to other extractors are registered after the ones
# they call: campaign before item, item before asset, asset before
# transcription. Each one looks up its parent extractor in _DEFAULT_EXTRACTORS
# when it is called and merges the parent's fields into its own result.
# Every attribute is read with getattr(..., None), so a missing attribute or a
# None object yields None values rather than raising.
_register_default_extractor(
    "campaign",
    lambda campaign: {
        "campaign_slug": getattr(campaign, "slug", None),
    },
)

_register_default_extractor(
    "item",
    lambda item: {
        **_DEFAULT_EXTRACTORS["campaign"](getattr(item, "campaign", None)),
        "item_id": getattr(item, "item_id", None),
    },
)

_register_default_extractor(
    "asset",
    lambda asset: {
        **_DEFAULT_EXTRACTORS["item"](getattr(asset, "item", None)),
        "asset_id": getattr(asset, "pk", None),
    },
)

_register_default_extractor(
    "transcription",
    lambda transcription: {
        **_DEFAULT_EXTRACTORS["asset"](getattr(transcription, "asset", None)),
        "transcription_id": getattr(transcription, "pk", None),
    },
)

_register_default_extractor(
    "topic",
    lambda topic: {
        "topic_slug": getattr(topic, "slug", None),
    },
)

# Freeze default extractors to prevent mutation: from here on the module-level
# name refers to a read-only view of the dict populated above.
_DEFAULT_EXTRACTORS = MappingProxyType(_DEFAULT_EXTRACTORS)


class ConcordiaLogger:
    """
    A structured logging wrapper around structlog that enforces consistent logging
    conventions across the Concordia application.

    Features:
        - Requires 'message' and 'event_code' for all logs, and 'reason'/'reason_code'
          for warnings/errors.
        - Automatically extracts common context from objects like Asset, User
          and Transcription.
        - Allows semantic binding of objects (e.g., asset=self) which are expanded
          at log time.
        - Supports binding persistent fields via `.bind()`.

    Usage:
    -----

    Create a logger:
        ```python
        structured_logger = ConcordiaLogger.get_logger(__name__)
        ```

    Log an info-level event:
        ```python
        structured_logger.info(
            "Started OCR processing.",
            event_code="asset_ocr_started",
            asset=my_asset,
            user=request.user,
        )
        ```

    Log a warning with reason:
        ```python
        structured_logger.warning(
            "Rollback failed.",
            event_code="rollback_attempt_failed",
            reason="No eligible transcription found.",
            reason_code="no_valid_target",
            asset=my_asset,
            user=request.user,
        )
        ```

    Bind a logger for repeated use:
        ```python
        logger = ConcordiaLogger.get_logger(__name__)
        my_logger = logger.bind(asset=asset)
        my_logger.info("Transcription updated.", event_code="transcription_updated")
        ```

        This is the equivalent of:
        ```python
        logger = ConcordiaLogger.get_logger(__name__)
        logger.info(
            "Transcription updated.",
            event_code="transcription_updated",
            asset=asset
        )
        ```

        This can save you from having to repeatedly pass in the same data to every
        logging call. For instance, if you bind a logger to a particular model
        instance like `.bind(asset=self)`, that bound logger will automatically
        include the instance as context for all the logging statements done by it.

        A bound logger also starts with a copy of the extractors registered on
        the logger it was created from.

    Special Context Expansion:
    --------------------------

    The logger recognizes certain context object names and extracts fields from them
    automatically. With the default extractors these are:

    - `user` -> `user_id`
    - `campaign` -> `campaign_slug`
    - `item` -> `item_id`, plus the `campaign` fields of `item.campaign`
    - `asset` -> `asset_id`, plus the `item` fields of `asset.item`
    - `transcription` -> `transcription_id`, plus the `asset` fields of
      `transcription.asset`
    - `topic` -> `topic_slug`

    If these objects are passed directly (e.g., as `user=request.user`), their relevant
    fields will be included automatically in the log entry.

    Explicit values passed (e.g., `item_id=...`) override extracted ones. Fields with
    `None` values are omitted from the final log output.

    Extractor System:
    -----------------

    The logger uses a registry of extractor functions to convert common objects
    (e.g., Asset, User, Transcription) into structured logging fields.

    Each extractor is a callable that takes an object and returns a dictionary of
    field names and values. Fields with `None` values are omitted.

    Extractors can be:

    - Global defaults (defined in concordia.logging and shared by all loggers)
    - Per-logger overrides (via `register_extractor()`)

    The default extractors may internally invoke other extractors to avoid code
    duplication. For example, the `transcription` extractor invokes the `asset`
    extractor, which calls the `item` extractor, which uses the `campaign` extractor.

    Registering a new extractor on a logger overrides the default for that logger
    (and for loggers subsequently derived from it with `.bind()`) only.

    Extractors are callables that take a single object and return a dictionary.

    Example:
        ```python
        logger = ConcordiaLogger.get_logger(__name__)
        logger.register_extractor("session", lambda s: {"session_id": s.id})
        ```

        Now, passing `session=session_obj` to `.info()` (or any other logging method)
        will include `session_id`.

    Note:
        Chained extractors (e.g., `transcription` -> `asset` -> `item`) are hardcoded to
        use the default global extractors. If you override an extractor on a logger,
        chained calls will not reflect that override. So, if you override the "asset"
        extractor, if you pass in "transcription", that extractor will use the default
        `asset` extractor, rather than your newly registered one.
    """

    def __init__(self, logger, context: Optional[dict[str, Any]] = None):
        """
        Wrap an underlying logger.

        Args:
            logger: Object exposing level methods (``debug``, ``info``, ...)
                that accept a message plus keyword fields.
            context (dict, optional): Context bound to every log call made
                through this instance.
        """
        self._logger = logger
        self._context = context or {}
        # Per-instance, mutable copy so register/unregister never touch the
        # shared (read-only) defaults.
        self._extractors = _DEFAULT_EXTRACTORS.copy()

    @classmethod
    def get_logger(cls, name: str) -> "ConcordiaLogger":
        """
        Factory method to create a ConcordiaLogger from a given logger name.

        Args:
            name (str): The logger name (typically ``__name__``). The
                ``structlog.`` prefix is added here, so callers should not
                include it themselves.

        Returns:
            ConcordiaLogger: A logger instance with enriched behavior.
        """
        return cls(structlog.get_logger(f"structlog.{name}"))

    def register_extractor(
        self, key: str, extractor: Callable[[Any], dict[str, Any]]
    ) -> None:
        """
        Register a custom context extractor for this logger instance only.

        Emits a ``UserWarning`` when ``key`` shadows a default extractor,
        because the defaults that chain to it keep using the original.

        Args:
            key (str): The context key to extract (e.g., "custom_object").
            extractor (Callable): A function that returns a dict of fields to log.
        """
        self._extractors[key] = extractor
        if key in _DEFAULT_EXTRACTORS:
            warnings.warn(
                f"Extractor for '{key}' registered but default extractors may still "
                f"reference the original implementation via chaining. Overriding it "
                f"here will not affect those chained uses.",
                UserWarning,
                stacklevel=2,
            )

    def unregister_extractor(self, key: str) -> None:
        """
        Remove a previously registered extractor from this logger instance.

        Unknown keys are ignored.

        Args:
            key (str): The context key to remove.
        """
        self._extractors.pop(key, None)

    def log(
        self,
        level: str,
        message: str,
        *,
        event_code: str,
        reason: Optional[str] = None,
        reason_code: Optional[str] = None,
        **context: Any,
    ) -> None:
        """
        Emit structured logs with standardized context. This shouldn't be called
        directly under ordinary circumstances, with one of the level methods (
        debug, info, warning, error) used instead.

        Args:
            level (str): Logging level ('debug', 'info', 'warning', 'error').
            message (str): Human-readable log message.
            event_code (str): Required short machine-readable identifier.
            reason (str, optional): Human-readable reason for failure (required for
                warnings/errors).
            reason_code (str, optional): Short identifier for reason (required for
                warnings/errors).
            context (Any): Additional structured context for the log.

        Raises:
            ValueError: If required fields are missing for the given log level.
        """
        if not message:
            raise ValueError("Log message is required.")
        if not event_code:
            raise ValueError("Structured logs must include an 'event_code' field.")
        if level in ("warning", "error") and (not reason or not reason_code):
            raise ValueError(
                "Warnings and errors must include both 'reason' and 'reason_code'."
            )

        context_data = {"event_code": event_code}
        if reason:
            context_data["reason"] = reason
        if reason_code:
            context_data["reason_code"] = reason_code

        bound_context = self._context

        # Extract data from provided context, falling back to the bound context
        # if it exists. The semantic object itself is removed from `context`
        # so only its extracted fields reach the log entry.
        for context_key, extractor_function in self._extractors.items():
            context_object = context.pop(context_key, bound_context.get(context_key))
            if context_object:
                extracted_fields = extractor_function(context_object)
                for key, value in extracted_fields.items():
                    if value is not None:
                        # setdefault: the first extractor to supply a field
                        # wins, and event_code/reason are never overwritten.
                        context_data.setdefault(key, value)

        # Add remaining values in bound_context
        # (i.e., keys that weren't already extracted)
        for key, value in bound_context.items():
            if key not in self._extractors and key not in context and value is not None:
                context_data[key] = value

        # Override extracted and bound context with any explicit values passed in
        # For instance, if `asset` and `asset_id` were both passed in, we would
        # have extracted `asset`.`asset_id`, `asset`.`item`.`item_id`, etc., and
        # now the extracted `asset_id` would be overridden by the explicit `asset_id`
        # in the passed-in context.
        for key, value in context.items():
            if value is not None:
                context_data[key] = value

        getattr(self._logger, level)(message, **context_data)

    def debug(self, message: str, *, event_code: str, **kwargs):
        """Emit a debug-level structured log."""
        self.log("debug", message, event_code=event_code, **kwargs)

    def info(self, message: str, *, event_code: str, **kwargs):
        """Emit an info-level structured log."""
        self.log("info", message, event_code=event_code, **kwargs)

    def warning(
        self, message: str, *, event_code: str, reason: str, reason_code: str, **kwargs
    ):
        """Emit a warning-level structured log. Requires reason and reason_code."""
        self.log(
            "warning",
            message,
            event_code=event_code,
            reason=reason,
            reason_code=reason_code,
            **kwargs,
        )

    def error(
        self, message: str, *, event_code: str, reason: str, reason_code: str, **kwargs
    ):
        """Emit an error-level structured log. Requires reason and reason_code."""
        self.log(
            "error",
            message,
            event_code=event_code,
            reason=reason,
            reason_code=reason_code,
            **kwargs,
        )

    def exception(
        self,
        message: str,
        *,
        event_code: str,
        reason: str,
        reason_code: str,
        **kwargs: Any,
    ) -> None:
        """
        Emit an error-level structured log with exception info.

        This is equivalent to calling `.error(..., exc_info=True)` and should be used
        within an exception handler to capture tracebacks.
        """
        self.log(
            "error",
            message,
            event_code=event_code,
            reason=reason,
            reason_code=reason_code,
            exc_info=True,
            **kwargs,
        )

    def bind(self, **kwargs: Any) -> "ConcordiaLogger":
        """
        Return a new ConcordiaLogger with additional context permanently bound.

        Bound context can include semantic objects like asset, user or transcription,
        in addition to primitive data types. Objects with registered extractors
        will be expanded into structured fields at log time.

        The returned logger receives its own copy of this logger's extractor
        table, so extractors added or removed with `register_extractor()` /
        `unregister_extractor()` before binding remain in effect, while later
        changes on either logger do not affect the other.

        Args:
            **kwargs: Context to bind.

        Returns:
            ConcordiaLogger: A logger with the provided context bound.
        """
        # We make our own bound context rather than using structlog's
        # .bind so we can safely access it ourselves
        new_context = self._context.copy()
        new_context.update(kwargs)
        bound_logger = ConcordiaLogger(self._logger, context=new_context)
        # Carry over per-logger extractor customizations instead of silently
        # resetting the bound logger to the global defaults.
        bound_logger._extractors = self._extractors.copy()
        return bound_logger


================================================
FILE: concordia/maintenance.py
================================================
"""
Maintenance-mode helpers for conditional frontend availability.

This module wraps ``maintenance_mode.http.need_maintenance_response`` to allow
staff or superusers limited frontend access during maintenance when a cache
flag is set.
"""

from django.core.cache import cache
from django.http import HttpRequest
from maintenance_mode.http import (
    need_maintenance_response as base_need_maintenance_response,
)


def _need_maintenence_frontend(request: HttpRequest) -> bool | None:
    """
    Decide whether a privileged user may bypass maintenance mode.

    Returns ``False`` (do not block) only when the cache key
    ``maintenance_mode_frontend_available`` holds a truthy value and the
    request's user has ``is_staff`` or ``is_superuser`` set. In every other
    case, including a request without a ``user`` attribute, returns ``None``
    so the caller can apply its default handling.

    Args:
        request: Current HTTP request.

    Returns:
        False to allow access, None to defer to default handling.
    """
    try:
        current_user = request.user
    except AttributeError:
        # No user attached to this request.
        return None

    if not cache.get("maintenance_mode_frontend_available", False):
        return None

    if current_user.is_staff or current_user.is_superuser:
        return False
    return None


def need_maintenance_response(request: HttpRequest) -> bool:
    """
    Report whether maintenance mode should block this request.

    The upstream ``maintenance_mode`` check runs first. Only when it returns
    exactly ``True`` is ``_need_maintenence_frontend`` consulted, which may
    downgrade the answer to ``False`` for privileged users. Any result that is
    not a ``bool`` at the end (for example ``None`` from the helper) is treated
    as "block".

    Args:
        request: Current HTTP request.

    Returns:
        True if maintenance mode should block the request, else False.
    """
    decision = base_need_maintenance_response(request)
    if decision is True:
        decision = _need_maintenence_frontend(request)
    return decision if isinstance(decision, bool) else True


================================================
FILE: concordia/management/__init__.py
================================================


================================================
FILE: concordia/management/commands/__init__.py
================================================


================================================
FILE: concordia/management/commands/calculate_difficulty_values.py
================================================
"""
Management command to populate initial difficulty values.

Usage:
    python manage.py calculate_difficulty_values
    python manage.py calculate_difficulty_values --verbosity 2
"""

from timeit import default_timer

from django.core.management.base import BaseCommand

from concordia.tasks.assets import calculate_difficulty_values


class Command(BaseCommand):
    """
    Management command wrapper around the difficulty-calculation task.

    Calls `concordia.tasks.assets.calculate_difficulty_values()` directly and,
    for verbosity levels above 1, prints the number of updated records together
    with the elapsed time.
    """

    def handle(self, *, verbosity: int, **kwargs) -> None:
        """
        Run the calculation and optionally report the outcome.

        Args:
            verbosity (int): Django's verbosity level (0, 1, 2, or 3).

        Returns:
            None
        """
        started_at = default_timer()
        record_count = calculate_difficulty_values()

        if verbosity <= 1:
            return

        elapsed_seconds = default_timer() - started_at
        print("Updated %d records in %0.1f seconds" % (record_count, elapsed_seconds))


================================================
FILE: concordia/management/commands/create_load_test_fixtures.py
================================================
# ruff: noqa: ERA001 A003
# bandit:skip-file

import json
import uuid
from pathlib import Path

from django.contrib.auth import get_user_model
from django.contrib.auth.hashers import make_password
from django.core import serializers
from django.core.management import BaseCommand, call_command

from concordia.models import (
    Asset,
    Campaign,
    CardFamily,
    Item,
    Project,
    ProjectTopic,
    ResearchCenter,
    Topic,
    Transcription,
)

# Defaults for the command-line options defined in Command.add_arguments.
# Default for --assets-limit: maximum number of assets to include.
ASSETS_LIMIT_DEFAULT = 10_000
# Default for --test-users: number of synthetic test users to generate.
TEST_USERS_DEFAULT = 10_000
# Default for --test-user-prefix: prefix of each generated test username.
TEST_USER_PREFIX_DEFAULT = "locusttest"
# Default for --test-user-password: password shared by all generated test users.
TEST_USER_PASSWORD_DEFAULT = "locustpass123"  # nosec B105


def _serialize_qs(qs):
    """Serialize ``qs`` with Django's JSON serializer and return the parsed list."""
    serialized_json = serializers.serialize("json", qs)
    return json.loads(serialized_json)


def _serialize_list(objs):
    """Serialize ``objs`` with Django's JSON serializer and return the parsed list."""
    serialized_json = serializers.serialize("json", objs)
    return json.loads(serialized_json)


class Command(BaseCommand):
    """
    Build a single JSON fixture for load testing from existing database rows.

    The command selects a capped set of assets (from the projects of the first
    two published topics, then from additional published campaigns if the cap
    has not been reached), gathers the items, projects, campaigns, topics,
    card families, research centers and transcriptions those assets depend on,
    replaces the referenced users with anonymized stand-ins, appends generated
    test users, and writes everything to one JSON file. Unless
    ``--no-validate`` is given, the ``prepare_load_test_db`` command is then
    invoked with the written fixture.
    """

    help = (
        "Build a single JSON fixture for load-testing:\n"
        "- 2 published Topics by ascending `ordering`\n"
        "- Consider 5 published Campaigns by ascending `ordering`\n"
        "- Walk Items/Assets from Topic projects first (cap 10,000 assets),\n"
        "  then from Campaign projects if needed, until the cap\n"
        "- Include closure of Items/Projects/Campaigns/Topics actually used "
        "by chosen Assets\n"
        "- Include all Transcriptions for those Assets and anonymized Users "
        "from those Transcriptions\n"
        "- Add 10,000 new test users (locusttest00001..locusttest10000) "
        "with a known password\n"
        "- Include ProjectTopic rows for selected Topic+Project links\n"
        "- Write one JSON fixture"
    )

    def add_arguments(self, p):
        """
        Register the command-line options.

        Args:
            p: The argument parser supplied by Django.
        """
        p.add_argument(
            "--assets-limit",
            type=int,
            default=ASSETS_LIMIT_DEFAULT,
            help=f"Max assets to include (default {ASSETS_LIMIT_DEFAULT})",
        )
        p.add_argument(
            "--test-users",
            type=int,
            default=TEST_USERS_DEFAULT,
            help=f"How many new test users to include (default {TEST_USERS_DEFAULT})",
        )
        p.add_argument(
            "--test-user-prefix",
            default=TEST_USER_PREFIX_DEFAULT,
            help=f"Prefix for test usernames (default '{TEST_USER_PREFIX_DEFAULT}')",
        )
        p.add_argument(
            "--test-user-password",
            default=TEST_USER_PASSWORD_DEFAULT,
            help=(
                f"Password for all test users (default "
                f"'{TEST_USER_PASSWORD_DEFAULT}')"
            ),
        )
        p.add_argument(
            "--output",
            default="loadtest_fixture.json",
            help="Path to write the fixture JSON (default loadtest_fixture.json)",
        )
        p.add_argument(
            "--no-validate",
            action="store_true",
            help=(
                "Do not load the fixture into a test database. "
                "WARNING: fixture will not be verified."
            ),
        )
        p.add_argument(
            "--validate-drop",
            action="store_true",
            help=(
                "Validate by loading into a fresh test DB, "
                "then drop it after loading."
            ),
        )
        p.add_argument(
            "--validate-db-name",
            default=None,
            help=(
                "Override the test DB name used for validation "
                "(default: <default.NAME>_lt)."
            ),
        )
        p.add_argument(
            "--validate-recreate",
            action="store_true",
            help="Force recreation of the validation DB if it already exists.",
        )

    def _collect_asset_ids(
        self, candidate_project_ids, assets_limit, asset_ids, item_ids, project_ids
    ):
        """
        Walk projects -> items -> assets in ascending id order up to the cap.

        The three id sets are updated in place. Walking stops as soon as
        ``asset_ids`` holds ``assets_limit`` entries; a project or item is
        recorded only if the cap had not been reached when it was visited.

        Args:
            candidate_project_ids: Ids of the projects to walk.
            assets_limit: Maximum size of ``asset_ids``.
            asset_ids: Set receiving the selected asset ids.
            item_ids: Set receiving the ids of visited items.
            project_ids: Set receiving the ids of visited projects.
        """
        for proj in (
            Project.objects.filter(id__in=candidate_project_ids)
            .order_by("id")
            .iterator()
        ):
            if len(asset_ids) >= assets_limit:
                break
            project_ids.add(proj.id)

            for item in (
                Item.objects.filter(project_id=proj.id).order_by("id").iterator()
            ):
                if len(asset_ids) >= assets_limit:
                    break
                item_ids.add(item.id)

                for a in (
                    Asset.objects.filter(item_id=item.id)
                    .order_by("id")
                    .values_list("id", flat=True)
                    .iterator()
                ):
                    if len(asset_ids) >= assets_limit:
                        break
                    asset_ids.add(int(a))

    def handle(self, *args, **o):
        """
        Select the data, write the fixture file and optionally validate it.

        Args:
            *args: Unused positional arguments.
            **o: Parsed command options (see ``add_arguments``).
        """
        assets_limit = int(o["assets_limit"])
        out_path = Path(o["output"]).resolve()

        # Select 2 published Topics by ordering
        topics_qs = Topic.objects.filter(published=True).order_by("ordering")[:2]
        topics = list(topics_qs)
        topic_ids = {t.id for t in topics}
        if not topics:
            self.stderr.write(
                self.style.WARNING(
                    "No published Topics found. "
                    "Proceeding with Campaign-only selection."
                )
            )

        # Projects in those topics via ProjectTopics
        proj_ids_from_topics = set(
            ProjectTopic.objects.filter(topic_id__in=topic_ids).values_list(
                "project_id", flat=True
            )
        )

        # ensure we consider 5 published Campaigns
        # campaigns connected to the topic-derived projects:
        campaigns_from_topics_qs = Campaign.objects.filter(
            published=True,
            id__in=Project.objects.filter(id__in=proj_ids_from_topics).values_list(
                "campaign_id", flat=True
            ),
        ).distinct()

        needed = max(0, 5 - campaigns_from_topics_qs.count())
        if needed > 0:
            # take extra published campaigns (not already counted) by ordering ASC
            extra_campaigns_qs = (
                Campaign.objects.filter(published=True)
                .exclude(id__in=campaigns_from_topics_qs.values_list("id", flat=True))
                .order_by("ordering")[:needed]
            )
            selected_campaigns_qs = campaigns_from_topics_qs.union(extra_campaigns_qs)
        else:
            selected_campaigns_qs = campaigns_from_topics_qs

        # We might end up with <5 if not enough published; that's fine

        # Collect assets up to cap
        asset_ids = set()
        item_ids = set()
        project_ids = set()

        # walk projects from Topics first
        self._collect_asset_ids(
            proj_ids_from_topics, assets_limit, asset_ids, item_ids, project_ids
        )

        # If needed, walk projects from selected campaigns (not already included)
        if len(asset_ids) < assets_limit and selected_campaigns_qs.exists():
            proj_ids_from_campaigns = set(
                Project.objects.filter(
                    campaign_id__in=selected_campaigns_qs.values_list("id", flat=True)
                )
                .exclude(id__in=project_ids)
                .values_list("id", flat=True)
            )
            self._collect_asset_ids(
                proj_ids_from_campaigns, assets_limit, asset_ids, item_ids, project_ids
            )

        # recompute exact asset set
        assets_qs = Asset.objects.filter(id__in=asset_ids)

        # Items actually referenced by chosen assets
        items_qs = Item.objects.filter(
            id__in=assets_qs.values_list("item_id", flat=True).distinct()
        )
        item_ids = set(items_qs.values_list("id", flat=True))

        # Projects from those items
        projects_qs = Project.objects.filter(
            id__in=items_qs.values_list("project_id", flat=True).distinct()
        )
        project_ids = set(projects_qs.values_list("id", flat=True))

        # Campaigns from those projects
        campaigns_qs = Campaign.objects.filter(
            id__in=projects_qs.values_list("campaign_id", flat=True).distinct()
        )

        # CardFamilies referenced by the selected Campaigns (FK target)
        card_families_qs = CardFamily.objects.filter(
            id__in=campaigns_qs.exclude(card_family__isnull=True)
            .values_list("card_family_id", flat=True)
            .distinct()
        )

        # ResearchCenters referenced by the selected Campaigns (M2M target)
        rc_through = Campaign.research_centers.through
        rc_ids = (
            rc_through.objects.filter(
                campaign_id__in=campaigns_qs.values_list("id", flat=True)
            )
            .values_list("researchcenter_id", flat=True)
            .distinct()
        )
        research_centers_qs = ResearchCenter.objects.filter(id__in=rc_ids)

        # Topics linked to those projects
        topics_from_projects_qs = Topic.objects.filter(
            id__in=ProjectTopic.objects.filter(project_id__in=project_ids)
            .values_list("topic_id", flat=True)
            .distinct()
        )
        # Merge with the initial two topics (won't duplicate)
        topics_final_qs = Topic.objects.filter(
            id__in=set(topics_from_projects_qs.values_list("id", flat=True)) | topic_ids
        )

        # ProjectTopic rows for selected Topic+Project pairs (needed to preserve M2M)
        project_topics_final_qs = ProjectTopic.objects.filter(
            topic_id__in=topics_final_qs.values_list("id", flat=True),
            project_id__in=project_ids,
        )

        # transcriptions + users (anonymize users in-memory)
        trans_qs = Transcription.objects.filter(asset_id__in=asset_ids)
        User = get_user_model()

        # Collect users from both author and reviewer fields, dropping Nones
        author_ids = set(trans_qs.values_list("user_id", flat=True))
        reviewer_ids = set(trans_qs.values_list("reviewed_by_id", flat=True))
        user_ids = {uid for uid in (author_ids | reviewer_ids) if uid is not None}

        users_qs = User.objects.filter(id__in=user_ids)

        # Build anonymized user fixtures explicitly (no M2M)
        user_app_label = User._meta.app_label
        user_model_name = User._meta.model_name
        user_model_label = f"{user_app_label}.{user_model_name}"
        anonymized_user_fixtures = []
        for u in users_qs:
            anonymized_user_fixtures.append(
                {
                    "model": user_model_label,
                    "pk": int(u.pk) if u.pk is not None else None,
                    "fields": {
                        User.USERNAME_FIELD: f"Anonymized {uuid.uuid4()}",
                        "email": f"anon-{uuid.uuid4()}@example.com",
                        "password": "!",
                        # Anonymized stand-ins are always inactive and
                        # unprivileged.
                        "is_active": False,
                        "is_staff": False,
                        "is_superuser": False,
                        **({"first_name": ""} if hasattr(u, "first_name") else {}),
                        **({"last_name": ""} if hasattr(u, "last_name") else {}),
                        # no groups / permissions
                    },
                }
            )

        # build test users
        test_user_count = int(o["test_users"])
        test_prefix = o["test_user_prefix"]
        test_pw_hash = make_password(o["test_user_password"])

        # ensure test user PKs cannot collide with anonymized users;
        # default=0 covers the case of no (non-None) anonymized PKs.
        max_existing_pk = max(
            (
                int(obj["pk"])
                for obj in anonymized_user_fixtures
                if obj["pk"] is not None
            ),
            default=0,
        )
        start_test_pk = max_existing_pk + 10_000

        test_user_fixtures = []
        for i in range(1, test_user_count + 1):
            uname = f"{test_prefix}{i:05d}"
            test_user_fixtures.append(
                {
                    "model": user_model_label,
                    # explicit PKs to avoid sequence collisions
                    "pk": start_test_pk + i,
                    "fields": {
                        User.USERNAME_FIELD: uname,
                        "password": test_pw_hash,
                        "email": f"{uname}@example.test",
                        # Test users are active but unprivileged.
                        "is_active": True,
                        "is_staff": False,
                        "is_superuser": False,
                        **({"first_name": ""} if hasattr(User, "first_name") else {}),
                        **({"last_name": ""} if hasattr(User, "last_name") else {}),
                        # no groups / permissions
                    },
                }
            )

        # Serialize everything into one fixture list
        fixture_objs = []
        # Core, ensure FK/M2M targets appear before dependents
        fixture_objs += _serialize_qs(topics_final_qs.order_by("id"))
        fixture_objs += _serialize_qs(card_families_qs.order_by("id"))
        fixture_objs += _serialize_qs(research_centers_qs.order_by("id"))
        fixture_objs += _serialize_qs(campaigns_qs.order_by("id"))
        fixture_objs += _serialize_qs(projects_qs.order_by("id"))
        fixture_objs += _serialize_qs(items_qs.order_by("id"))
        fixture_objs += _serialize_qs(assets_qs.order_by("id"))
        # Users must appear before Transcriptions (FK dependency)
        fixture_objs += anonymized_user_fixtures
        fixture_objs += test_user_fixtures
        # Transcriptions
        fixture_objs += _serialize_qs(trans_qs.order_by("id"))
        # Through model rows
        fixture_objs += _serialize_qs(project_topics_final_qs.order_by("id"))

        # Warn if below cap, but we don't need to abort
        if len(asset_ids) < assets_limit:
            self.stderr.write(
                self.style.WARNING(
                    f"Collected {len(asset_ids)} assets "
                    f"(cap {assets_limit}). Proceeding."
                )
            )

        # write file
        out_path.parent.mkdir(parents=True, exist_ok=True)
        out_path.write_text(json.dumps(fixture_objs, indent=2), encoding="utf-8")
        self.stdout.write(
            self.style.SUCCESS(
                f"Wrote fixture with {len(fixture_objs)} objects -> {out_path}"
            )
        )

        # optionally validate by loading into a test DB (migrate + loaddata)
        if o["no_validate"]:
            self.stderr.write(
                self.style.WARNING("Fixture NOT validated (--no-validate set).")
            )
        else:
            call_command(
                "prepare_load_test_db",
                db_alias="default",
                db_name=o["validate_db_name"] or None,
                recreate=bool(o["validate_recreate"]),
                fixtures=[str(out_path)],
                drop_after=bool(o["validate_drop"]),
            )


================================================
FILE: concordia/management/commands/ensure_initial_site_configuration.py
================================================
"""
Ensure that basic site configuration has been applied.

This command is intended for automated scenarios: a fresh database should be
configured on first run, but a newly launched container should not make any
changes. For convenience with Docker, default values for each argument are
read from environment variables.

Usage:
    python manage.py ensure_initial_site_configuration
    python manage.py ensure_initial_site_configuration \
        --admin-username admin --admin-email admin@example.com \
        --site-name "Example" --site-domain example.com

Environment defaults:
    CONCORDIA_ADMIN_USERNAME -> --admin-username (default: "admin")
    CONCORDIA_ADMIN_EMAIL    -> --admin-email    (default: "crowd@loc.gov")
    HOST_NAME                -> --site-name and --site-domain
                                (default: "example.com")

Tasks performed:
  1. Ensure at least one admin user exists. If missing, create one with an
     unusable password so the password reset flow must be used.
  2. Ensure the Sites framework has the intended site name and domain.
"""

import os
from argparse import ArgumentParser

from django.contrib.auth.models import User
from django.contrib.sites.models import Site
from django.core.management.base import BaseCommand
from django.db.transaction import atomic


class Command(BaseCommand):
    help = "Ensure that core site configuration has been applied"  # NOQA: A003

    def add_arguments(self, parser: ArgumentParser) -> None:
        """
        Register the four options, each defaulting to an environment variable.

        Notes:
            ``HOST_NAME`` feeds the default of both ``--site-name`` and
            ``--site-domain``. The literal fallbacks are used when a variable
            is not set, which lets the command run without any arguments.
        """
        env = os.environ
        option_specs = (
            (
                "--admin-username",
                env.get("CONCORDIA_ADMIN_USERNAME", "admin"),
                "Admin user's username (default=%(default)s)",
            ),
            (
                "--admin-email",
                env.get("CONCORDIA_ADMIN_EMAIL", "crowd@loc.gov"),
                "Admin user's email address (default=%(default)s)",
            ),
            (
                "--site-name",
                env.get("HOST_NAME", "example.com"),
                "Site name (default=%(default)s)",
            ),
            (
                "--site-domain",
                env.get("HOST_NAME", "example.com"),
                "Site domain (default=%(default)s)",
            ),
        )
        for flag, default_value, help_text in option_specs:
            parser.add_argument(flag, default=default_value, help=help_text)

    @atomic
    def handle(
        self,
        *,
        admin_username: str,
        admin_email: str,
        site_name: str,
        site_domain: str,
        **options,
    ) -> None:
        """
        Bring the admin account and the Site rows into the requested state.

        The whole method runs inside a single transaction (``@atomic``).

        Steps:
            - Fetch the user named ``admin_username``, creating it with
              ``admin_email`` when absent, and flag it as staff and superuser.
            - Overwrite the stored email when it differs from ``admin_email``.
            - Give a newly created user an unusable password.
            - Validate and save the user.
            - Unless ``site_domain`` is the placeholder "example.com", update
              every Site row with ``site_name`` and ``site_domain``.

        Args:
            admin_username (str): Username for the admin user.
            admin_email (str): Email for the admin user.
            site_name (str): Desired Site.name value.
            site_domain (str): Desired Site.domain value.

        Returns:
            None
        """
        admin, is_new = User.objects.get_or_create(
            username=admin_username, defaults={"email": admin_email}
        )
        admin.is_staff = True
        admin.is_superuser = True

        if admin.email != admin_email:
            # Report the old address before it is overwritten.
            self.stdout.write(
                f"Changing {admin_username} email from {admin.email} to {admin_email}"
            )
            admin.email = admin_email

        if is_new:
            admin.set_unusable_password()

        admin.full_clean()
        admin.save()

        if is_new:
            self.stdout.write(
                f"Created superuser {admin_username} account for {admin_email}."
                " Use the password reset form to change the unusable password."
            )

        # The placeholder domain means "not configured": leave Site rows alone.
        if site_domain == "example.com":
            return

        if Site.objects.update(name=site_name, domain=site_domain):
            self.stdout.write(
                f"Configured site with name {site_name} and domain {site_domain}"
            )


================================================
FILE: concordia/management/commands/import_site_reports.py
================================================
"""
Import CSV Site Report data into the database.

This command reads a CSV file, maps each row to `SiteReport` fields and
creates `SiteReport` rows. If a "campaign" column is present and non-empty,
its value is treated as a `Campaign.id` and looked up before creation.

Usage:
    python manage.py import_site_reports --csv-file path/to/file.csv

Arguments:
    --csv-file  Path to the CSV file. Defaults to "site_reports.csv".

CSV expectations:
    - The first row is a header. Field names must match `SiteReport` fields,
      except:
        * "time" is combined with "created_on" to form a single datetime.
    - Empty strings are ignored and not included in the create kwargs.
    - "created_on" and "time" are combined then parsed with the format:
        %m/%d/%Y %I:%M %p %Z
      Example: "04/30/2024 09:15 AM UTC"
    - "campaign" is optional. If present and non-empty, it must be a valid
      `Campaign.id`.

Notes:
    - Rows are created one by one. This is intentional to match current
      behavior.
"""

import csv
from argparse import ArgumentParser
from datetime import datetime

from django.core.management.base import BaseCommand

from concordia.models import Campaign, SiteReport


class Command(BaseCommand):
    help = "Import CSV Site Report data"  # NOQA: A003

    def add_arguments(self, parser: ArgumentParser) -> None:
        """
        Add the --csv-file argument with a sensible default.

        Args:
            parser: The Django command argument parser.
        """
        parser.add_argument(
            "--csv-file",
            default="site_reports.csv",
            help="Path to CSV file to import (default=%(default)s)",
        )

    def handle(self, *, csv_file: str, **options) -> None:
        """
        Read the CSV, normalize fields and create `SiteReport` rows.

        Behavior:
            - Reads the header row to build a name->value mapping for each row.
              An empty file (no header) is reported on stderr and nothing is
              imported.
            - Skips completely blank lines.
            - Drops keys with empty-string values.
            - Concatenates "created_on" and "time" to a single string,
              parses with `%m/%d/%Y %I:%M %p %Z`, assigns to "created_on".
            - Removes the "time" key.
            - If "campaign" is present, replaces it with the model instance
              using `Campaign.objects.get(id=...)`.
            - Creates a `SiteReport` with the remaining data, one row at a
              time.

        Args:
            csv_file: Path to the CSV file to import.

        Returns:
            None

        Raises:
            KeyError: If a row has no "created_on" or "time" value.
            ValueError: If a row's length differs from the header's, or the
                combined timestamp does not match the expected format.
        """
        # newline="" hands newline handling to the csv module, as its
        # documentation requires; otherwise quoted fields containing line
        # breaks can be split incorrectly.
        with open(csv_file, "r", newline="") as csv_handle:
            reader = csv.reader(csv_handle, delimiter=",")

            header = next(reader, None)
            if header is None:
                self.stderr.write(f"{csv_file} is empty; nothing to import")
                return

            for row in reader:
                if not row:
                    # csv.reader yields [] for a blank line (for example a
                    # trailing newline); there is nothing to import from it.
                    continue

                # strict=True rejects rows whose length differs from the header.
                site_report = {
                    key: value
                    for key, value in zip(header, row, strict=True)
                    if value != ""
                }

                timestamp = "%s %s" % (
                    site_report["created_on"],
                    site_report.pop("time"),
                )
                # NOTE(review): %Z only matches a zone name; strptime still
                # returns a naive datetime. Confirm this is what SiteReport
                # expects under the project's time zone settings.
                site_report["created_on"] = datetime.strptime(
                    timestamp, "%m/%d/%Y %I:%M %p %Z"
                )

                campaign_id = site_report.get("campaign")
                if campaign_id:
                    site_report["campaign"] = Campaign.objects.get(id=campaign_id)

                SiteReport.objects.create(**site_report)


================================================
FILE: concordia/management/commands/prepare_load_test_db.py
================================================
# ruff: noqa: ERA001 A003
# bandit:skip-file

from contextlib import contextmanager
from pathlib import Path

from django.conf import settings
from django.core.management import BaseCommand, CommandError, call_command
from django.db import connections


def _dbinfo(alias: str):
    cfg = settings.DATABASES[alias]
    return {
        "engine": cfg["ENGINE"],
        "name": cfg["NAME"],
        "user": cfg.get("USER"),
        "password": cfg.get("PASSWORD"),
        "host": cfg.get("HOST"),
        "port": cfg.get("PORT"),
    }


def _require_postgres(engine: str):
    if "postgresql" not in engine:
        raise CommandError(f"PostgreSQL only. ENGINE={engine!r}.")


def _maintenance_dsn(info: dict) -> str:
    parts = ["dbname=postgres"]
    if info.get("user"):
        parts.append(f"user={info['user']}")
    if info.get("password"):
        parts.append(f"password={info['password']}")
    if info.get("host"):
        parts.append(f"host={info['host']}")
    if info.get("port"):
        parts.append(f"port={info['port']}")
    return " ".join(parts)


def _pg_connect(dsn: str):
    """
    Return a live psycopg connection (supports psycopg3 or psycopg2).
    """
    try:
        import psycopg  # psycopg3

        return psycopg.connect(dsn)
    except Exception:
        try:
            import psycopg2  # type: ignore

            return psycopg2.connect(dsn)  # type: ignore
        except Exception as e2:
            raise CommandError(
                "Could not import psycopg (v3) or psycopg2. "
                "Install one of them to manage databases."
            ) from e2


def _db_exists(cur, name: str) -> bool:
    cur.execute("SELECT 1 FROM pg_database WHERE datname = %s", (name,))
    return cur.fetchone() is not None


def _create_db_if_needed(src_info: dict, name: str, *, recreate: bool = False):
    dsn = _maintenance_dsn(src_info)
    conn = _pg_connect(dsn)
    try:
        conn.autocommit = True
        with conn.cursor() as cur:
            if _db_exists(cur, name):
                if recreate:
                    cur.execute(
                        "SELECT pg_terminate_backend(pid) FROM pg_stat_activity "
                        "WHERE datname = %s AND pid <> pg_backend_pid()",
                        (name,),
                    )
                    cur.execute(f'DROP DATABASE "{name}"')
                else:
                    return
            cur.execute(f'CREATE DATABASE "{name}"')
    finally:
        conn.close()


def _drop_db(src_info: dict, name: str):
    dsn = _maintenance_dsn(src_info)
    conn = _pg_connect(dsn)
    try:
        conn.autocommit = True
        with conn.cursor() as cur:
            cur.execute(
                "SELECT pg_terminate_backend(pid) FROM pg_stat_activity "
                "WHERE datname = %s AND pid <> pg_backend_pid()",
                (name,),
            )
            cur.execute(f'DROP DATABASE IF EXISTS "{name}"')
    finally:
        conn.close()


def _switch_process_db(alias: str, new_name: str):
    settings.DATABASES[alias]["NAME"] = new_name
    connections.close_all()


@contextmanager
def _suppress_all_django_signals(active: bool):
    """
    Monkey-patch Django's Signal dispatch to no-op while active is True.
    This suppresses all signals (model and custom) during fixture loading.
    """
    if not active:
        yield
        return

    from django.dispatch import dispatcher as _dispatcher

    orig_send = _dispatcher.Signal.send
    orig_send_robust = _dispatcher.Signal.send_robust

    def _no_send(self, sender, **named):
        return []

    def _no_send_robust(self, sender, **named):
        return []

    _dispatcher.Signal.send = _no_send
    _dispatcher.Signal.send_robust = _no_send_robust
    try:
        yield
    finally:
        _dispatcher.Signal.send = orig_send
        _dispatcher.Signal.send_robust = orig_send_robust


class Command(BaseCommand):
    """Prepare a PostgreSQL database from fixtures for load testing."""

    help = (
        "Create (or reuse) a PostgreSQL database, switch the process to it, run "
        "migrate, and load one or more fixtures. Optionally drop the DB afterward."
    )

    def add_arguments(self, p):
        """Register the database-selection, fixture and cleanup options."""
        p.add_argument(
            "--db-alias",
            default="default",
            help="DATABASES alias (default: default).",
        )
        p.add_argument(
            "--db-name",
            default=None,
            help=(
                "Target DB name (default: <alias.NAME>_lt). If it exists and "
                "--recreate is not set, it will be reused."
            ),
        )
        p.add_argument(
            "--recreate",
            action="store_true",
            help="Drop existing DB first, then create.",
        )
        p.add_argument(
            "--fixtures",
            nargs="+",
            default=["loadtest_fixture.json"],
            help="Fixture file(s) to load. Defaults to loadtest_fixture.json.",
        )
        p.add_argument(
            "--drop-after",
            action="store_true",
            help="Drop the DB after loading (validation-only).",
        )
        p.add_argument(
            "--enable-signals",
            action="store_true",
            help="Do NOT suppress Django signals during loaddata (default suppresses).",
        )

    def handle(self, *args, **o):
        """
        Create or reuse the target database, migrate it and load the fixtures.

        Steps:
            1. Read the alias configuration and require a PostgreSQL engine.
            2. Resolve the fixture paths and fail if any is missing.
            3. Create the target database (dropping it first with --recreate).
            4. Repoint the alias at the target database and run ``migrate``.
            5. Run ``loaddata`` for each fixture, with Django signals
               suppressed unless --enable-signals was given.
            6. With --drop-after, switch back to the original database name
               and drop the target database.

        Raises:
            CommandError: If the engine is not PostgreSQL, the alias has an
                empty NAME, or a fixture file does not exist.
        """
        write = self.stdout.write
        notice = self.style.NOTICE
        success = self.style.SUCCESS

        alias = o["db_alias"]
        source = _dbinfo(alias)
        _require_postgres(source["engine"])

        original_name = source["name"]
        if not original_name:
            raise CommandError(f"DATABASES[{alias!r}]['NAME'] is empty.")

        target = o["db_name"] or f"{original_name}_lt"

        # Validate every fixture before touching the database.
        fixture_paths = []
        not_found = []
        for raw_path in o["fixtures"]:
            resolved = Path(raw_path).resolve()
            fixture_paths.append(resolved)
            if not resolved.exists():
                not_found.append(str(resolved))
        if not_found:
            raise CommandError(f"Fixture(s) not found: {', '.join(not_found)}")

        write(notice(f"Preparing DB {target!r}"))
        _create_db_if_needed(source, target, recreate=bool(o["recreate"]))

        write(success(f"Switching process to DB {target!r}"))
        _switch_process_db(alias, target)

        write(notice("Applying migrations..."))
        call_command("migrate", database=alias, interactive=False, run_syncdb=True)

        # Signals are suppressed by default; --enable-signals opts out.
        signals_enabled = bool(o.get("enable_signals"))
        if signals_enabled:
            write(notice("Signals ENABLED during loaddata."))
        else:
            write(notice("Suppressing Django signals during loaddata..."))

        write(notice("Loading fixtures..."))
        with _suppress_all_django_signals(active=not signals_enabled):
            for fixture in fixture_paths:
                call_command("loaddata", str(fixture), database=alias)

        if not o["drop_after"]:
            write(success(f"Loaded fixtures into {target!r}"))
            return

        write(notice(f"Dropping DB {target!r}"))
        # Point the alias back at the original name first so this process is
        # not connected to the database it is about to drop.
        _switch_process_db(alias, original_name)
        _drop_db(source, target)
        write(success(f"Dropped {target!r}"))


================================================
FILE: concordia/management/commands/print_frontend_test_urls.py
================================================
"""
Print a list of URLs (derived from local database content) suitable for
front-end testing.

Usage:
    python manage.py print_frontend_test_urls \
        --base-url "http://localhost:8000/"

Notes:
    - Always prints a core set of static paths.
    - If a visible Asset exists it also prints detail pages for that
      asset, its item, project and campaign.
"""

import argparse
from urllib.parse import urljoin

from django.core.management.base import BaseCommand
from django.urls import reverse

from concordia.models import Asset


class Command(BaseCommand):
    """Management command to emit front-end test URLs."""

    help = "Print URLs for front-end testing"  # NOQA: A003

    def add_arguments(self, parser: "argparse.ArgumentParser") -> None:
        """Register command-line arguments."""
        parser.add_argument(
            "--base-url",
            default="http://localhost:8000/",
            help="Change the base URL for all generated URLs from %(default)s",
        )

    def handle(self, *, base_url: str, **options) -> None:
        """
        Generate and print URLs, prefixed by ``base_url``.

        A fixed set of static pages is always included. When at least one
        asset is published along with its item, project and campaign, the
        detail pages for that asset and its ancestors are added. The final
        list is printed sorted by path, one URL per line.

        Args:
            base_url: Base URL that each reversed path is joined onto.

        Returns:
            None
        """
        paths = [
            reverse("homepage"),
            reverse("about"),
            reverse("contact"),
            # Help pages
            reverse("help-center"),
            reverse("welcome-guide"),
            reverse("transcription-basic-rules"),
            reverse("how-to-review"),
            reverse("how-to-tag"),
            reverse("for-educators"),
            reverse("questions"),
            # Account pages
            reverse("registration_register"),
            reverse("registration_login"),
            reverse("password_reset"),
            reverse("login"),
            reverse("transcriptions:campaign-list"),
            reverse("campaign-topic-list"),
        ]

        # Database content
        # Find an asset which is actually visible. A single first() call
        # replaces the earlier exists()-then-first() pair, which cost an extra
        # query and could see the row vanish between the two. select_related
        # loads the item, project and campaign in that same query.
        asset = (
            Asset.objects.filter(
                published=True,
                item__published=True,
                item__project__published=True,
                item__project__campaign__published=True,
            )
            .select_related("item__project__campaign")
            .first()
        )
        if asset is not None:
            item = asset.item
            project = item.project
            campaign = project.campaign

            paths.extend(
                [
                    reverse(
                        "transcriptions:asset-detail",
                        kwargs={
                            "campaign_slug": campaign.slug,
                            "project_slug": project.slug,
                            "item_id": item.item_id,
                            "slug": asset.slug,
                        },
                    ),
                    reverse(
                        "transcriptions:item-detail",
                        kwargs={
                            "campaign_slug": campaign.slug,
                            "project_slug": project.slug,
                            "item_id": item.item_id,
                        },
                    ),
                    reverse(
                        "transcriptions:project-detail",
                        kwargs={"campaign_slug": campaign.slug, "slug": project.slug},
                    ),
                    reverse(
                        "transcriptions:campaign-detail", kwargs={"slug": campaign.slug}
                    ),
                ]
            )
        for path in sorted(paths):
            print(urljoin(base_url, path))


================================================
FILE: concordia/middleware.py
================================================
from maintenance_mode.http import get_maintenance_response
from maintenance_mode.middleware import (
    MaintenanceModeMiddleware as BaseMaintenanceModeMiddleware,
)

from .maintenance import need_maintenance_response


class MaintenanceModeMiddleware(BaseMaintenanceModeMiddleware):
    """Maintenance-mode middleware that defers to the project's own check."""

    def process_request(self, request):
        """
        Return the maintenance response when the project check asks for one.

        Returns None otherwise, so request processing continues normally.
        """
        if not need_maintenance_response(request):
            return None
        return get_maintenance_response(request)


================================================
FILE: concordia/migrations/0001_initial.py
================================================
# Generated by Django 2.0.4 on 2018-04-17 18:59

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Initial schema for the app: creates the ``UserProfile`` model."""

    # Marks this as the app's initial migration.
    initial = True

    # UserProfile points at the user model, so the migration depends on
    # whichever model AUTH_USER_MODEL names.
    dependencies = [migrations.swappable_dependency(settings.AUTH_USER_MODEL)]

    operations = [
        migrations.CreateModel(
            name="UserProfile",
            fields=[
                # Auto-incrementing primary key.
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                # Uploaded file, stored under "profile_pics/".
                ("myfile", models.FileField(upload_to="profile_pics/")),
                # Owning user; profiles are deleted together with the user.
                (
                    "user",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        )
    ]


================================================
FILE: concordia/migrations/0001_squashed_0040_remove_campaign_is_active.py
================================================
# Generated by Django 2.0.9 on 2018-10-03 20:04

import django.contrib.postgres.fields.jsonb
import django.core.validators
import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


def create_groups(apps, schema_editor):
    """
    Ensure the community-manager and newsletter auth groups exist.

    Uses the historical ``auth.Group`` model from the migration app registry;
    the group names come from ``settings.COMMUNITY_MANAGER_GROUP_NAME`` and
    ``settings.NEWSLETTER_GROUP_NAME``. Existing groups are left as they are.
    """
    group_manager = apps.get_model("auth", "Group").objects
    group_manager.get_or_create(name=settings.COMMUNITY_MANAGER_GROUP_NAME)
    group_manager.get_or_create(name=settings.NEWSLETTER_GROUP_NAME)


class Migration(migrations.Migration):
    replaces = [
        ("concordia", "0001_initial"),
        ("concordia", "0002_auto_20180511_1722"),
        ("concordia", "0003_campaign_is_active"),
        ("concordia", "0004_auto_20180712_1857"),
        ("concordia", "0005_auto_20180713_1753"),
        ("concordia", "0006_auto_20180713_1759"),
        ("concordia", "0007_pageinuse"),
        ("concordia", "0008_auto_20180727_2021"),
        ("concordia", "0009_auto_20180730_2017"),
        ("concordia", "0010_auto_20180730_2032"),
        ("concordia", "0011_auto_20180730_2046"),
        ("concordia", "0007_campaign_s3_storage"),
        ("concordia", "0012_merge_20180806_1254"),
        ("concordia", "0013_auto_20180826_0928"),
        ("concordia", "0014_auto_20180904_1758"),
        ("concordia", "0015_auto_20180905_1756"),
        ("concordia", "0016_auto_20180906_1720"),
        ("concordia", "0017_auto_20180912_0229"),
        ("concordia", "0018_auto_20180917_1654"),
        ("concordia", "0019_auto_20180920_1503"),
        ("concordia", "0020_auto_20180922_0139"),
        ("concordia", "0021_auto_20180922_0202"),
        ("concordia", "0022_auto_20180924_1511"),
        ("concordia", "0023_auto_20180924_1511"),
        ("concordia", "0024_auto_20180924_1529"),
        ("concordia", "0025_auto_20180924_2022"),
        ("concordia", "0026_auto_20180925_2000"),
        ("concordia", "0027_auto_20180926_1705"),
        ("concordia", "0026_creategroups"),
        ("concordia", "0028_merge_20180927_1529"),
        ("concordia", "0029_remove_userprofile_myfile"),
        ("concordia", "0029_auto_20180928_1437"),
        ("concordia", "0030_merge_20181002_1350"),
        ("concordia", "0031_auto_20181002_1900"),
        ("concordia", "0032_auto_20181002_1901"),
        ("concordia", "0033_auto_20181002_1909"),
        ("concordia", "0034_remove_transcription_parent"),
        ("concordia", "0035_auto_20181002_1914"),
        ("concordia", "0036_remove_item_slug"),
        ("concordia", "0037_auto_20181002_1939"),
        ("concordia", "0030_merge_20180928_1740"),
        ("concordia", "0031_merge_20181002_1846"),
        ("concordia", "0038_merge_20181002_1949"),
        ("concordia", "0039_remove_campaign_s3_storage"),
        ("concordia", "0040_remove_campaign_is_active"),
    ]

    initial = True

    dependencies = [
        ("auth", "0001_initial"),
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
    ]

    operations = [
        migrations.CreateModel(
            name="UserProfile",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                (
                    "user",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        migrations.CreateModel(
            name="Asset",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(max_length=100)),
                ("slug", models.SlugField(max_length=100)),
                ("description", models.TextField(blank=True)),
                ("media_url", models.URLField(max_length=255)),
                (
                    "media_type",
                    models.CharField(
                        choices=[("IMG", "Image"), ("AUD", "Audio"), ("VID", "Video")],
                        db_index=True,
                        max_length=4,
                    ),
                ),
                ("sequence", models.PositiveIntegerField(default=1)),
                (
                    "metadata",
                    django.contrib.postgres.fields.jsonb.JSONField(default=dict),
                ),
                (
                    "status",
                    models.CharField(
                        choices=[
                            ("0", "0%"),
                            ("25", "25%"),
                            ("50", "50%"),
                            ("75", "75%"),
                            ("100", "100%"),
                            ("DONE", "Complete"),
                        ],
                        default="0",
                        max_length=4,
                    ),
                ),
            ],
            options={"ordering": ["title", "sequence"]},
        ),
        migrations.CreateModel(
            name="Campaign",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(max_length=50)),
                ("slug", models.SlugField(unique=True)),
                ("description", models.TextField(blank=True)),
                ("start_date", models.DateTimeField(blank=True, null=True)),
                ("end_date", models.DateTimeField(blank=True, null=True)),
                (
                    "metadata",
                    django.contrib.postgres.fields.jsonb.JSONField(default=dict),
                ),
                (
                    "status",
                    models.CharField(
                        choices=[
                            ("0", "0%"),
                            ("25", "25%"),
                            ("50", "50%"),
                            ("75", "75%"),
                            ("100", "100%"),
                            ("DONE", "Complete"),
                        ],
                        default="0",
                        max_length=4,
                    ),
                ),
            ],
        ),
        migrations.CreateModel(
            name="Project",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(max_length=50)),
                ("slug", models.SlugField()),
                ("category", models.CharField(blank=True, max_length=12)),
                (
                    "metadata",
                    django.contrib.postgres.fields.jsonb.JSONField(default=dict),
                ),
                (
                    "status",
                    models.CharField(
                        choices=[
                            ("Edit", "Open for Edit"),
                            ("Submitted", "Submitted for Review"),
                            ("Completed", "Transcription Completed"),
                            ("Inactive", "Inactive"),
                            ("Active", "Active"),
                        ],
                        default="Edit",
                        max_length=10,
                    ),
                ),
                (
                    "campaign",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Campaign",
                    ),
                ),
                ("is_publish", models.BooleanField(default=False)),
            ],
            options={"ordering": ["title"]},
        ),
        migrations.CreateModel(
            name="Tag",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("value", models.CharField(max_length=50, unique=True)),
            ],
        ),
        migrations.CreateModel(
            name="Transcription",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("user_id", models.PositiveIntegerField(db_index=True)),
                ("text", models.TextField(blank=True)),
                (
                    "status",
                    models.CharField(
                        choices=[
                            ("Edit", "Open for Edit"),
                            ("Submitted", "Submitted for Review"),
                            ("Completed", "Transcription Completed"),
                            ("Inactive", "Inactive"),
                            ("Active", "Active"),
                        ],
                        default="Edit",
                        max_length=10,
                    ),
                ),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                (
                    "asset",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Asset",
                    ),
                ),
            ],
        ),
        migrations.CreateModel(
            name="UserAssetTagCollection",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("user_id", models.PositiveIntegerField(db_index=True)),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                (
                    "asset",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Asset",
                    ),
                ),
                ("tags", models.ManyToManyField(blank=True, to="concordia.Tag")),
            ],
        ),
        migrations.AlterUniqueTogether(
            name="project", unique_together={("slug", "campaign")}
        ),
        migrations.AlterField(
            model_name="asset",
            name="status",
            field=models.CharField(
                choices=[
                    ("Edit", "Open for Edit"),
                    ("Submitted", "Submitted for Review"),
                    ("Completed", "Transcription Completed"),
                ],
                default="Edit",
                max_length=4,
            ),
        ),
        migrations.AlterField(
            model_name="asset",
            name="status",
            field=models.CharField(
                choices=[
                    ("Edit", "Open for Edit"),
                    ("Submitted", "Submitted for Review"),
                    ("Completed", "Transcription Completed"),
                ],
                default="Edit",
                max_length=10,
            ),
        ),
        migrations.AlterField(
            model_name="asset",
            name="status",
            field=models.CharField(
                choices=[
                    ("Edit", "Open for Edit"),
                    ("Submitted", "Submitted for Review"),
                    ("Completed", "Transcription Completed"),
                    ("Inactive", "Inactive"),
                    ("Active", "Active"),
                ],
                default="Edit",
                max_length=10,
            ),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="status",
            field=models.CharField(
                choices=[
                    ("Edit", "Open for Edit"),
                    ("Submitted", "Submitted for Review"),
                    ("Completed", "Transcription Completed"),
                ],
                default="Edit",
                max_length=4,
            ),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="status",
            field=models.CharField(
                choices=[
                    ("Edit", "Open for Edit"),
                    ("Submitted", "Submitted for Review"),
                    ("Completed", "Transcription Completed"),
                ],
                default="Edit",
                max_length=10,
            ),
        ),
        migrations.CreateModel(
            name="PageInUse",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("page_url", models.CharField(max_length=256)),
                ("created_on", models.DateTimeField(editable=False)),
                ("updated_on", models.DateTimeField()),
                (
                    "user",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.DO_NOTHING,
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        migrations.AddField(
            model_name="campaign",
            name="is_publish",
            field=models.BooleanField(default=False),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="status",
            field=models.CharField(
                choices=[
                    ("Edit", "Open for Edit"),
                    ("Submitted", "Submitted for Review"),
                    ("Completed", "Transcription Completed"),
                    ("Inactive", "Inactive"),
                    ("Active", "Active"),
                ],
                default="Edit",
                max_length=10,
            ),
        ),
        migrations.CreateModel(
            name="Item",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(max_length=100)),
                ("description", models.TextField(blank=True)),
                ("item_url", models.URLField(max_length=255)),
                ("item_id", models.CharField(blank=True, max_length=100)),
                (
                    "metadata",
                    django.contrib.postgres.fields.jsonb.JSONField(
                        blank=True, default=dict, null=True
                    ),
                ),
                (
                    "thumbnail_url",
                    models.URLField(blank=True, max_length=255, null=True),
                ),
                (
                    "status",
                    models.CharField(
                        choices=[
                            ("Edit", "Open for Edit"),
                            ("Submitted", "Submitted for Review"),
                            ("Completed", "Transcription Completed"),
                            ("Inactive", "Inactive"),
                            ("Active", "Active"),
                        ],
                        default="Edit",
                        max_length=10,
                    ),
                ),
                ("is_publish", models.BooleanField(default=False)),
                (
                    "project",
                    models.ForeignKey(
                        blank=True,
                        null=True,
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Project",
                    ),
                ),
            ],
            options={"ordering": ["item_id"]},
        ),
        migrations.AlterModelOptions(
            name="asset", options={"ordering": ["item", "sequence"]}
        ),
        migrations.AddField(
            model_name="asset",
            name="item",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                to="concordia.Item",
            ),
        ),
        migrations.AlterModelOptions(
            name="asset", options={"ordering": ["title", "sequence"]}
        ),
        migrations.AddField(
            model_name="asset",
            name="download_url",
            field=models.CharField(blank=True, max_length=255, null=True),
        ),
        migrations.AddField(
            model_name="asset",
            name="resource_id",
            field=models.CharField(blank=True, max_length=100, null=True),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="slug",
            field=models.SlugField(max_length=500, unique=True),
        ),
        migrations.AlterField(
            model_name="campaign", name="title", field=models.CharField(max_length=500)
        ),
        migrations.AlterField(
            model_name="project", name="slug", field=models.SlugField(max_length=500)
        ),
        migrations.AlterField(
            model_name="project", name="title", field=models.CharField(max_length=500)
        ),
        migrations.AlterField(
            model_name="campaign",
            name="slug",
            field=models.SlugField(max_length=80, unique=True),
        ),
        migrations.AlterField(
            model_name="campaign", name="title", field=models.CharField(max_length=80)
        ),
        migrations.AlterField(
            model_name="project", name="slug", field=models.SlugField(max_length=80)
        ),
        migrations.AlterField(
            model_name="project", name="title", field=models.CharField(max_length=80)
        ),
        migrations.AlterField(
            model_name="asset",
            name="metadata",
            field=django.contrib.postgres.fields.jsonb.JSONField(
                blank=True, default=dict, null=True
            ),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="metadata",
            field=django.contrib.postgres.fields.jsonb.JSONField(
                blank=True, default=dict, null=True
            ),
        ),
        migrations.AlterField(
            model_name="project",
            name="metadata",
            field=django.contrib.postgres.fields.jsonb.JSONField(
                blank=True, default=dict, null=True
            ),
        ),
        migrations.AlterField(
            model_name="asset",
            name="media_url",
            field=models.TextField(
                max_length=255, verbose_name="Path component of the URL"
            ),
        ),
        migrations.AlterField(
            model_name="asset",
            name="item",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.Item"
            ),
        ),
        migrations.AlterField(
            model_name="item", name="title", field=models.CharField(max_length=300)
        ),
        migrations.AlterField(
            model_name="item",
            name="metadata",
            field=django.contrib.postgres.fields.jsonb.JSONField(
                blank=True,
                default=dict,
                help_text="Raw metadata returned by the remote API",
                null=True,
            ),
        ),
        migrations.AlterField(
            model_name="tag", name="value", field=models.CharField(max_length=50)
        ),
        migrations.RenameField(
            model_name="campaign", old_name="is_publish", new_name="published"
        ),
        migrations.RenameField(
            model_name="item", old_name="is_publish", new_name="published"
        ),
        migrations.RenameField(
            model_name="project", old_name="is_publish", new_name="published"
        ),
        migrations.RunPython(code=create_groups),
        migrations.AlterField(
            model_name="tag",
            name="value",
            field=models.CharField(
                max_length=50,
                validators=[django.core.validators.RegexValidator("^[- _'\\w]{1,50}$")],
            ),
        ),
        migrations.RenameField(
            model_name="transcription", old_name="user_id", new_name="user"
        ),
        migrations.RenameField(
            model_name="userassettagcollection", old_name="user_id", new_name="user"
        ),
        migrations.AlterField(
            model_name="transcription",
            name="user",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AlterField(
            model_name="userassettagcollection",
            name="user",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AlterField(
            model_name="pageinuse",
            name="user",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to=settings.AUTH_USER_MODEL
            ),
        ),
        migrations.AlterUniqueTogether(
            name="item", unique_together={("item_id", "project")}
        ),
        migrations.AlterUniqueTogether(
            name="asset", unique_together={("slug", "item")}
        ),
        migrations.AlterModelOptions(name="item", options={}),
        migrations.AlterField(
            model_name="item",
            name="item_id",
            field=models.CharField(
                help_text="Unique item ID assigned by the upstream source",
                max_length=100,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0002_auto_20181004_1848.py
================================================
# Generated by Django 2.0.9 on 2018-10-04 18:48

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine three ``PageInUse`` fields: both timestamps and the page URL."""

    dependencies = [("concordia", "0001_squashed_0040_remove_campaign_is_active")]

    operations = [
        # created_on: set automatically when the row is first created.
        migrations.AlterField(
            model_name="pageinuse",
            name="created_on",
            field=models.DateTimeField(auto_now_add=True),
        ),
        # page_url: becomes a URLField with room for 768 characters.
        migrations.AlterField(
            model_name="pageinuse",
            name="page_url",
            field=models.URLField(max_length=768),
        ),
        # updated_on: refreshed automatically on every save.
        migrations.AlterField(
            model_name="pageinuse",
            name="updated_on",
            field=models.DateTimeField(auto_now=True),
        ),
    ]


================================================
FILE: concordia/migrations/0003_auto_20181004_2103.py
================================================
# Generated by Django 2.0.9 on 2018-10-04 21:03

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Create ``AssetTranscriptionReservation`` and remove ``PageInUse``."""

    dependencies = [
        # The new model has a foreign key to the (swappable) user model.
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0002_auto_20181004_1848"),
    ]

    operations = [
        migrations.CreateModel(
            name="AssetTranscriptionReservation",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                (
                    # One-to-one: an asset can have at most one reservation row.
                    "asset",
                    models.OneToOneField(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Asset",
                    ),
                ),
                (
                    "user",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
        # Drop the user foreign key first, then the PageInUse model itself.
        migrations.RemoveField(model_name="pageinuse", name="user"),
        migrations.DeleteModel(name="PageInUse"),
    ]


================================================
FILE: concordia/migrations/0004_auto_20181010_1715.py
================================================
# Generated by Django 2.0.9 on 2018-10-10 17:15

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Replace the per-model ``status`` fields with review-workflow fields.

    Removes ``status`` from asset, campaign, item, project and transcription,
    then adds ``published``/``transcription_status`` to asset and the
    ``accepted``, ``rejected``, ``reviewed_by``, ``submitted`` and
    ``supersedes`` fields to transcription.
    """

    dependencies = [
        # transcription.reviewed_by points at the (swappable) user model.
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0003_auto_20181004_2103"),
    ]

    operations = [
        # Drop the old status column from every model that carried one.
        migrations.RemoveField(model_name="asset", name="status"),
        migrations.RemoveField(model_name="campaign", name="status"),
        migrations.RemoveField(model_name="item", name="status"),
        migrations.RemoveField(model_name="project", name="status"),
        migrations.RemoveField(model_name="transcription", name="status"),
        migrations.AddField(
            model_name="asset",
            name="published",
            field=models.BooleanField(default=False),
        ),
        # Non-editable status column on the asset; new rows start as "edit".
        migrations.AddField(
            model_name="asset",
            name="transcription_status",
            field=models.CharField(
                choices=[
                    ("edit", "Open for Edit"),
                    ("submitted", "Submitted for Review"),
                    ("completed", "Completed"),
                ],
                default="edit",
                editable=False,
                max_length=10,
            ),
        ),
        # Optional (nullable) timestamps on the transcription.
        migrations.AddField(
            model_name="transcription",
            name="accepted",
            field=models.DateTimeField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="transcription",
            name="rejected",
            field=models.DateTimeField(blank=True, null=True),
        ),
        # SET_NULL: deleting the reviewing user keeps the transcription and
        # clears this reference.
        migrations.AddField(
            model_name="transcription",
            name="reviewed_by",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                related_name="transcription_reviewers",
                to=settings.AUTH_USER_MODEL,
            ),
        ),
        migrations.AddField(
            model_name="transcription",
            name="submitted",
            field=models.DateTimeField(
                blank=True,
                help_text="Timestamp when the creator submitted this for review",
                null=True,
            ),
        ),
        # Self-referential link to the transcription this one replaces.
        # CASCADE: deleting the referenced transcription also deletes the
        # rows that point to it.
        migrations.AddField(
            model_name="transcription",
            name="supersedes",
            field=models.ForeignKey(
                blank=True,
                help_text="A previous transcription record which is replaced by this one",  # NOQA
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                to="concordia.Transcription",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0005_campaign_short_description.py
================================================
# Generated by Django 2.0.9 on 2018-10-10 19:31

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add an optional ``short_description`` text field to ``Campaign``."""

    dependencies = [("concordia", "0004_auto_20181010_1715")]

    operations = [
        migrations.AddField(
            model_name="campaign",
            name="short_description",
            field=models.TextField(blank=True),
        )
    ]


================================================
FILE: concordia/migrations/0006_campaignresource.py
================================================
# Generated by Django 2.0.9 on 2018-10-10 20:19

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the ``Resource`` model, an ordered titled URL tied to a campaign."""

    dependencies = [("concordia", "0005_campaign_short_description")]

    operations = [
        migrations.CreateModel(
            name="Resource",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("sequence", models.PositiveIntegerField(default=1)),
                # NOTE(review): max_length on a TextField is not enforced at the
                # database level in Django; it only affects form widgets.
                ("title", models.TextField(max_length=255)),
                ("resource_url", models.URLField()),
                (
                    # CASCADE: resources are deleted along with their campaign.
                    "campaign",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Campaign",
                    ),
                ),
            ],
        )
    ]


================================================
FILE: concordia/migrations/0007_thumbnail_images.py
================================================
# Generated by Django 2.0.9 on 2018-10-10 18:20

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add an optional ``thumbnail_image`` to ``Campaign`` and ``Project``."""

    dependencies = [("concordia", "0006_campaignresource")]

    operations = [
        # preserve_default=False: the default="" below is used only while this
        # migration runs and is not kept in the field's migration state.
        migrations.AddField(
            model_name="campaign",
            name="thumbnail_image",
            field=models.ImageField(
                blank=True, null=True, default="", upload_to="campaign-thumbnails"
            ),
            preserve_default=False,
        ),
        # Same field for projects, stored under a separate upload directory.
        migrations.AddField(
            model_name="project",
            name="thumbnail_image",
            field=models.ImageField(
                blank=True, null=True, default="", upload_to="project-thumbnails"
            ),
            preserve_default=False,
        ),
    ]


================================================
FILE: concordia/migrations/0008_auto_20181015_1711.py
================================================
# Generated by Django 2.0.9 on 2018-10-15 17:11

from django.db import migrations


class Migration(migrations.Migration):
    """Reset ``Asset`` Meta options and add ordering/uniqueness to ``Resource``."""

    dependencies = [("concordia", "0007_thumbnail_images")]

    operations = [
        # Empty options: clears any Meta options previously recorded for asset.
        migrations.AlterModelOptions(name="asset", options={}),
        # Resources sort by campaign, then by their sequence number.
        migrations.AlterModelOptions(
            name="resource", options={"ordering": ["campaign", "sequence"]}
        ),
        # A sequence number may be used only once within a campaign.
        migrations.AlterUniqueTogether(
            name="resource", unique_together={("campaign", "sequence")}
        ),
    ]


================================================
FILE: concordia/migrations/0009_project_description.py
================================================
# Generated by Django 2.0.9 on 2018-10-17 15:13

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add an optional ``description`` text field to ``Project``."""

    dependencies = [("concordia", "0008_auto_20181015_1711")]

    operations = [
        migrations.AddField(
            model_name="project", name="description", field=models.TextField(blank=True)
        )
    ]


================================================
FILE: concordia/migrations/0010_auto_20181021_1659.py
================================================
# Generated by Django 2.0.9 on 2018-10-21 16:59

from django.db import migrations, models


class Migration(migrations.Migration):
    """Drop ``Asset.resource_id`` and add a nullable ``Asset.resource_url``.

    No data is copied between the two fields by this migration.
    """

    dependencies = [("concordia", "0009_project_description")]

    operations = [
        migrations.RemoveField(model_name="asset", name="resource_id"),
        migrations.AddField(
            model_name="asset",
            name="resource_url",
            field=models.URLField(blank=True, max_length=255, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0010_auto_20181022_1530.py
================================================
# Generated by Django 2.0.9 on 2018-10-22 15:30

from django.db import migrations


def handle_items_without_projects(apps, schema_editor):
    """Delete every ``Item`` row whose ``project`` is unset.

    Args:
        apps: Migration-time app registry; used to look up the historical
            ``Item`` model.
        schema_editor: Supplied by ``RunPython``; not used here.
    """
    item_model = apps.get_model("concordia", "Item")
    orphaned_items = item_model.objects.filter(project=None)
    orphaned_items.delete()


class Migration(migrations.Migration):
    """Data migration that runs ``handle_items_without_projects``.

    No ``reverse_code`` is passed to ``RunPython``, so Django treats this
    migration as irreversible.
    """

    dependencies = [("concordia", "0009_project_description")]

    operations = [migrations.RunPython(handle_items_without_projects)]


================================================
FILE: concordia/migrations/0011_auto_20181022_1532.py
================================================
# Generated by Django 2.0.9 on 2018-10-22 15:32

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``Item.project`` as a foreign key without ``null``/``blank``."""

    dependencies = [("concordia", "0010_auto_20181022_1530")]

    operations = [
        # With no null=True/blank=True, every item must reference a project.
        # CASCADE: items are deleted along with their project.
        migrations.AlterField(
            model_name="item",
            name="project",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.Project"
            ),
        )
    ]


================================================
FILE: concordia/migrations/0012_merge_20181022_1554.py
================================================
# Generated by Django 2.0.9 on 2018-10-22 15:54

from django.db import migrations


class Migration(migrations.Migration):
    """Merge migration joining the two branches listed in ``dependencies``.

    It performs no schema or data changes of its own.
    """

    dependencies = [
        ("concordia", "0010_auto_20181021_1659"),
        ("concordia", "0011_auto_20181022_1532"),
    ]

    # Intentionally empty: this migration only linearises the graph.
    operations = []


================================================
FILE: concordia/migrations/0013_auto_20181031_1305.py
================================================
# Generated by Django 2.0.9 on 2018-10-31 17:05

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``Resource.title`` as a ``CharField`` limited to 255 characters."""

    dependencies = [("concordia", "0012_merge_20181022_1554")]

    operations = [
        migrations.AlterField(
            model_name="resource", name="title", field=models.CharField(max_length=255)
        )
    ]


================================================
FILE: concordia/migrations/0014_auto_20181115_1411.py
================================================
# Generated by Django 2.0.9 on 2018-11-15 19:11

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``Asset.transcription_status`` with a four-value choice list.

    The choices become not_started / in_progress / submitted / completed, the
    default becomes ``"not_started"`` and ``max_length`` is set to 20. Existing
    row values are not rewritten by this migration.
    """

    dependencies = [("concordia", "0013_auto_20181031_1305")]

    operations = [
        migrations.AlterField(
            model_name="asset",
            name="transcription_status",
            field=models.CharField(
                choices=[
                    ("not_started", "Not Started"),
                    ("in_progress", "In Progress"),
                    ("submitted", "Submitted for Review"),
                    ("completed", "Completed"),
                ],
                default="not_started",
                editable=False,
                max_length=20,
            ),
        )
    ]


================================================
FILE: concordia/migrations/0015_auto_20181115_1436.py
================================================
# Generated by Django 2.0.9 on 2018-11-15 19:36

from django.db import migrations

from concordia.models import TranscriptionStatus


def split_edit_statuses(apps, schema_editor):
    """Split the legacy ``"edit"`` asset status into two statuses.

    Assets still marked ``"edit"`` that are referenced by at least one
    ``Transcription`` row become ``"in_progress"``; every remaining ``"edit"``
    asset becomes ``"not_started"``.

    Args:
        apps: Migration-time app registry; used to look up the historical
            ``Transcription`` and ``Asset`` models.
        schema_editor: Supplied by ``RunPython``; not used here.
    """
    Transcription = apps.get_model("concordia", "Transcription")
    Asset = apps.get_model("concordia", "Asset")

    # The stored values are frozen as literals (matching the choices declared
    # for Asset.transcription_status) instead of being read from the live
    # concordia.models.TranscriptionStatus class. A data migration must write
    # the same values no matter how the application constants change later.
    in_progress = "in_progress"
    not_started = "not_started"

    # Order matters: the first update claims the "edit" assets that already
    # have transcriptions, so the second only sees the untouched remainder.
    Asset.objects.filter(
        pk__in=Transcription.objects.values("asset_id"), transcription_status="edit"
    ).update(transcription_status=in_progress)
    Asset.objects.filter(transcription_status="edit").update(
        transcription_status=not_started
    )


class Migration(migrations.Migration):
    """Data migration that runs ``split_edit_statuses``.

    No ``reverse_code`` is passed to ``RunPython``, so Django treats this
    migration as irreversible.
    """

    dependencies = [("concordia", "0014_auto_20181115_1411")]

    operations = [migrations.RunPython(split_edit_statuses)]


================================================
FILE: concordia/migrations/0016_auto_20181115_1803.py
================================================
# Generated by Django 2.0.9 on 2018-11-15 23:03

from django.db import migrations

from concordia.models import TranscriptionStatus


def update_new_statuses(apps, schema_editor):
    """Rewrite space-separated asset statuses to their underscore form.

    Assets whose ``transcription_status`` is ``"in progress"`` become
    ``"in_progress"`` and those with ``"not started"`` become
    ``"not_started"``.

    Args:
        apps: Migration-time app registry; used to look up the historical
            ``Asset`` model.
        schema_editor: Supplied by ``RunPython``; not used here.
    """
    Asset = apps.get_model("concordia", "Asset")

    # The target values are frozen as literals instead of being read from the
    # live concordia.models.TranscriptionStatus class, so this migration keeps
    # writing the same values even if the application constants change.
    in_progress = "in_progress"
    not_started = "not_started"

    Asset.objects.filter(transcription_status="in progress").update(
        transcription_status=in_progress
    )
    Asset.objects.filter(transcription_status="not started").update(
        transcription_status=not_started
    )


class Migration(migrations.Migration):
    """Data migration that runs ``update_new_statuses``.

    No ``reverse_code`` is passed to ``RunPython``, so Django treats this
    migration as irreversible.
    """

    dependencies = [("concordia", "0015_auto_20181115_1436")]

    operations = [migrations.RunPython(update_new_statuses)]


================================================
FILE: concordia/migrations/0017_change_transcription_supersedes_related_name.py
================================================
# Generated by Django 2.0.9 on 2018-11-20 17:07

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``Transcription.supersedes`` with ``related_name="superseded_by"``."""

    dependencies = [("concordia", "0016_auto_20181115_1803")]

    operations = [
        migrations.AlterField(
            model_name="transcription",
            name="supersedes",
            field=models.ForeignKey(
                blank=True,
                help_text="A previous transcription record which is replaced by this one",  # NOQA
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                # Reverse accessor from a transcription to the rows replacing it.
                related_name="superseded_by",
                to="concordia.Transcription",
            ),
        )
    ]


================================================
FILE: concordia/migrations/0018_auto_20181128_1611.py
================================================
# Generated by Django 2.0.9 on 2018-11-28 21:11

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add ``display_on_homepage`` and ``ordering`` fields to ``Campaign``."""

    dependencies = [("concordia", "0017_change_transcription_supersedes_related_name")]

    operations = [
        # Existing and new campaigns default to being shown on the homepage.
        migrations.AddField(
            model_name="campaign",
            name="display_on_homepage",
            field=models.BooleanField(default=True),
        ),
        # Integer sort override; the help text describes the intended direction.
        migrations.AddField(
            model_name="campaign",
            name="ordering",
            field=models.IntegerField(
                default=0,
                help_text="Sort order override: higher values will be listed first",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0018_simplepage.py
================================================
# Generated by Django 2.0.9 on 2018-11-26 21:58

import django.core.validators
from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the ``SimplePage`` model: a path, a title and a text body."""

    dependencies = [("concordia", "0017_change_transcription_supersedes_related_name")]

    operations = [
        migrations.CreateModel(
            name="SimplePage",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                (
                    "path",
                    models.CharField(
                        help_text="URL path where this page will be accessible from",
                        max_length=255,
                        # The pattern requires a leading and a trailing slash
                        # with at least one character between them.
                        validators=[django.core.validators.RegexValidator("^/.+/$")],
                    ),
                ),
                ("title", models.CharField(max_length=200)),
                ("body", models.TextField()),
            ],
        )
    ]


================================================
FILE: concordia/migrations/0019_merge_20181128_1715.py
================================================
# Generated by Django 2.0.9 on 2018-11-28 22:15

from django.db import migrations


class Migration(migrations.Migration):
    """Merge migration joining the two ``0018_*`` branches.

    It performs no schema or data changes of its own.
    """

    dependencies = [
        ("concordia", "0018_simplepage"),
        ("concordia", "0018_auto_20181128_1611"),
    ]

    # Intentionally empty: this migration only linearises the graph.
    operations = []


================================================
FILE: concordia/migrations/0020_auto_20181128_1718.py
================================================
# Generated by Django 2.0.9 on 2018-11-28 22:18

from django.db import migrations


class Migration(migrations.Migration):
    """Remove the ``end_date`` and ``start_date`` fields from ``Campaign``."""

    dependencies = [("concordia", "0019_merge_20181128_1715")]

    operations = [
        migrations.RemoveField(model_name="campaign", name="end_date"),
        migrations.RemoveField(model_name="campaign", name="start_date"),
    ]


================================================
FILE: concordia/migrations/0021_sitereport.py
================================================
# Generated by Django 2.0.9 on 2018-12-04 18:26

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the ``SiteReport`` model: a timestamped row of integer counters.

    Each report may optionally reference a campaign.
    """

    dependencies = [("concordia", "0020_auto_20181128_1718")]

    operations = [
        migrations.CreateModel(
            name="SiteReport",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                # Required counters.
                ("assets_total", models.IntegerField()),
                ("assets_published", models.IntegerField()),
                ("assets_not_started", models.IntegerField()),
                ("assets_in_progress", models.IntegerField()),
                ("assets_waiting_review", models.IntegerField()),
                ("assets_completed", models.IntegerField()),
                ("assets_unpublished", models.IntegerField()),
                ("items_published", models.IntegerField()),
                ("items_unpublished", models.IntegerField()),
                ("projects_published", models.IntegerField()),
                ("projects_unpublished", models.IntegerField()),
                ("anonymous_transcriptions", models.IntegerField()),
                ("transcriptions_saved", models.IntegerField()),
                ("distinct_tags", models.IntegerField()),
                ("tag_uses", models.IntegerField()),
                # Optional (nullable) counters.
                ("campaigns_published", models.IntegerField(blank=True, null=True)),
                ("campaigns_unpublished", models.IntegerField(blank=True, null=True)),
                ("users_registered", models.IntegerField(blank=True, null=True)),
                ("users_activated", models.IntegerField(blank=True, null=True)),
                (
                    # DO_NOTHING: Django takes no action on report rows when the
                    # referenced campaign is deleted; any integrity enforcement
                    # is left to the database.
                    "campaign",
                    models.ForeignKey(
                        blank=True,
                        null=True,
                        on_delete=django.db.models.deletion.DO_NOTHING,
                        to="concordia.Campaign",
                    ),
                ),
            ],
        )
    ]


================================================
FILE: concordia/migrations/0022_auto_20181211_1310.py
================================================
# Generated by Django 2.0.9 on 2018-12-11 18:10

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``campaign.ordering`` as an integer sort key defaulting to 0."""

    dependencies = [
        ("concordia", "0021_sitereport"),
    ]

    operations = [
        migrations.AlterField(
            "campaign",
            "ordering",
            field=models.IntegerField(
                help_text="Sort order override: lower values will be listed first",
                default=0,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0023_auto_20190130_1555.py
================================================
# Generated by Django 2.1.5 on 2019-01-30 20:55

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``asset.transcription_status`` with its four workflow choices."""

    dependencies = [
        ("concordia", "0022_auto_20181211_1310"),
    ]

    operations = [
        migrations.AlterField(
            "asset",
            "transcription_status",
            field=models.CharField(
                max_length=20,
                editable=False,
                default="not_started",
                # Stored value first, human-readable label second.
                choices=[
                    ("not_started", "Not Started"),
                    ("in_progress", "In Progress"),
                    ("submitted", "Needs Review"),
                    ("completed", "Completed"),
                ],
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0024_add_site_report_ordering.py
================================================
# Generated by Django 2.2 on 2019-04-19 15:25

from django.db import migrations


class Migration(migrations.Migration):
    """Set the default ordering of ``sitereport`` to ``created_on``."""

    dependencies = [
        ("concordia", "0023_auto_20190130_1555"),
    ]

    operations = [
        migrations.AlterModelOptions(
            "sitereport",
            {"ordering": ("created_on",)},
        ),
    ]


================================================
FILE: concordia/migrations/0024_auto_20190211_1420.py
================================================
# Generated by Django 2.1.7 on 2019-02-11 19:20

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Add ``asset.difficulty`` and refresh several field definitions.

    Besides the new nullable ``difficulty`` column, this sets the
    ``sitereport`` ordering to ``created_on``, redefines the ``published``
    flags on asset/campaign/item/project, and redefines the asset, campaign
    and project slugs with ``allow_unicode=True``.
    """

    dependencies = [
        ("concordia", "0023_auto_20190130_1555"),
    ]

    operations = [
        migrations.AlterModelOptions(
            "sitereport",
            {"ordering": ("created_on",)},
        ),
        migrations.AddField(
            "asset",
            "difficulty",
            field=models.PositiveIntegerField(null=True, blank=True),
        ),
        # --- asset ---
        migrations.AlterField(
            "asset",
            "published",
            field=models.BooleanField(default=False, blank=True),
        ),
        migrations.AlterField(
            "asset",
            "slug",
            field=models.SlugField(max_length=100, allow_unicode=True),
        ),
        # --- campaign ---
        migrations.AlterField(
            "campaign",
            "published",
            field=models.BooleanField(default=False, blank=True),
        ),
        migrations.AlterField(
            "campaign",
            "slug",
            field=models.SlugField(max_length=80, unique=True, allow_unicode=True),
        ),
        # --- item ---
        migrations.AlterField(
            "item",
            "published",
            field=models.BooleanField(default=False, blank=True),
        ),
        # --- project ---
        migrations.AlterField(
            "project",
            "published",
            field=models.BooleanField(default=False, blank=True),
        ),
        migrations.AlterField(
            "project",
            "slug",
            field=models.SlugField(max_length=80, allow_unicode=True),
        ),
    ]


================================================
FILE: concordia/migrations/0025_auto_20190329_1705.py
================================================
# Generated by Django 2.1.7 on 2019-03-29 21:05

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``asset.difficulty`` as a nullable positive integer defaulting to 0."""

    dependencies = [
        ("concordia", "0024_auto_20190211_1420"),
    ]

    operations = [
        migrations.AlterField(
            "asset",
            "difficulty",
            field=models.PositiveIntegerField(default=0, null=True, blank=True),
        ),
    ]


================================================
FILE: concordia/migrations/0025_unicode_slugs.py
================================================
# Generated by Django 2.2 on 2019-04-19 15:31

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine the asset, campaign and project slugs with ``allow_unicode=True``."""

    dependencies = [
        ("concordia", "0024_add_site_report_ordering"),
    ]

    # One AlterField per model; only the length/uniqueness options differ.
    operations = [
        migrations.AlterField(
            model_name=model_name,
            name="slug",
            field=models.SlugField(allow_unicode=True, **slug_options),
        )
        for model_name, slug_options in (
            ("asset", {"max_length": 100}),
            ("campaign", {"max_length": 80, "unique": True}),
            ("project", {"max_length": 80}),
        )
    ]


================================================
FILE: concordia/migrations/0026_update_published_field_definition.py
================================================
# Generated by Django 2.2 on 2019-04-19 15:41

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``published`` on asset, campaign, item and project.

    Each becomes ``BooleanField(blank=True, default=False)``.
    """

    dependencies = [
        ("concordia", "0025_unicode_slugs"),
    ]

    # The same field definition is applied to every model, in this order.
    operations = [
        migrations.AlterField(
            model_name=model_name,
            name="published",
            field=models.BooleanField(blank=True, default=False),
        )
        for model_name in ("asset", "campaign", "item", "project")
    ]


================================================
FILE: concordia/migrations/0027_merge_20190423_1657.py
================================================
# Generated by Django 2.2 on 2019-04-23 20:57

from django.db import migrations


class Migration(migrations.Migration):
    """Merge point for two migration branches; performs no operations."""

    # Both listed migrations must be applied before anything that depends on
    # this one.
    dependencies = [
        ("concordia", name)
        for name in (
            "0025_auto_20190329_1705",
            "0026_update_published_field_definition",
        )
    ]

    operations = []


================================================
FILE: concordia/migrations/0028_asset_year.py
================================================
# Generated by Django 2.2 on 2019-04-23 20:57

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional ``asset.year`` character field (up to 50 characters)."""

    dependencies = [
        ("concordia", "0027_merge_20190423_1657"),
    ]

    operations = [
        migrations.AddField(
            "asset",
            "year",
            field=models.CharField(max_length=50, blank=True),
        ),
    ]


================================================
FILE: concordia/migrations/0029_assettranscriptionreservation_reservation_token.py
================================================
# Generated by Django 2.2 on 2019-04-23 15:13

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add ``assettranscriptionreservation.reservation_token``.

    The field is created with the default value ``"migration"``.
    """

    dependencies = [
        ("concordia", "0028_asset_year"),
    ]

    operations = [
        migrations.AddField(
            "assettranscriptionreservation",
            "reservation_token",
            field=models.CharField(default="migration", max_length=50),
        ),
    ]


================================================
FILE: concordia/migrations/0030_auto_20190503_1559.py
================================================
# Generated by Django 2.2 on 2019-05-03 19:59

from django.db import migrations, models


class Migration(migrations.Migration):
    """Drop ``assettranscriptionreservation.user`` and redefine the token field.

    ``reservation_token`` is redefined without a default value.
    """

    dependencies = [
        ("concordia", "0029_assettranscriptionreservation_reservation_token"),
    ]

    operations = [
        migrations.RemoveField("assettranscriptionreservation", "user"),
        migrations.AlterField(
            "assettranscriptionreservation",
            "reservation_token",
            field=models.CharField(max_length=50),
        ),
    ]


================================================
FILE: concordia/migrations/0031_auto_20190509_1142.py
================================================
# Generated by Django 2.2 on 2019-05-09 15:42

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Introduce the ``Topic`` model and link projects and resources to it.

    Also removes ``project.category``, clears the ``resource`` model options
    and unique-together constraint, and redefines ``resource.campaign`` as a
    nullable foreign key.
    """

    dependencies = [
        ("concordia", "0030_auto_20190503_1559"),
    ]

    operations = [
        migrations.CreateModel(
            "Topic",
            [
                (
                    "id",
                    models.AutoField(
                        verbose_name="ID",
                        serialize=False,
                        primary_key=True,
                        auto_created=True,
                    ),
                ),
                ("published", models.BooleanField(default=False, blank=True)),
                ("title", models.CharField(max_length=255)),
                ("slug", models.SlugField(max_length=80, allow_unicode=True)),
                ("description", models.TextField(blank=True)),
                (
                    "thumbnail_image",
                    models.ImageField(
                        upload_to="topic-thumbnails", null=True, blank=True
                    ),
                ),
                ("short_description", models.TextField(blank=True)),
            ],
            options={"ordering": ["title"]},
        ),
        migrations.AlterModelOptions("resource", {}),
        migrations.RemoveField("project", "category"),
        migrations.AlterField(
            "resource",
            "campaign",
            field=models.ForeignKey(
                to="concordia.Campaign",
                on_delete=django.db.models.deletion.CASCADE,
                null=True,
                blank=True,
            ),
        ),
        migrations.AlterUniqueTogether("resource", unique_together=set()),
        # The new relations are added after the Topic model has been created.
        migrations.AddField(
            "project",
            "topics",
            field=models.ManyToManyField(to="concordia.Topic"),
        ),
        migrations.AddField(
            "resource",
            "topic",
            field=models.ForeignKey(
                to="concordia.Topic",
                on_delete=django.db.models.deletion.CASCADE,
                null=True,
                blank=True,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0032_topic_ordering.py
================================================
# Generated by Django 2.2 on 2019-05-29 18:11

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the integer ``topic.ordering`` sort key, defaulting to 0."""

    dependencies = [
        ("concordia", "0031_auto_20190509_1142"),
    ]

    operations = [
        migrations.AddField(
            "topic",
            "ordering",
            field=models.IntegerField(
                help_text="Sort order override: lower values will be listed first",
                default=0,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0033_simple_content_blocks.py
================================================
# Generated by Django 2.2.2 on 2019-06-21 18:39

from django.db import migrations, models


def load_legacy_content_blocks(apps, schema_editor):
    """
    Seed the two legacy quick-tips content blocks.

    Creates one ``SimpleContentBlock`` row labelled ``prototype_quicktips``
    and one labelled ``classic_quicktips``, using the module-level
    ``PROTOTYPE_QUICKTIPS`` and ``CLASSIC_QUICKTIPS`` strings as their bodies.

    ``apps`` is used to look up the model; ``schema_editor`` is accepted but
    not used.
    """
    block_model = apps.get_model("concordia", "SimpleContentBlock")

    legacy_blocks = (
        ("prototype_quicktips", PROTOTYPE_QUICKTIPS),
        ("classic_quicktips", CLASSIC_QUICKTIPS),
    )

    for block_label, block_body in legacy_blocks:
        content_block = block_model(label=block_label, body=block_body)
        # Run model validation before each row is written.
        content_block.full_clean()
        content_block.save()


class Migration(migrations.Migration):
    """
    Create ``SimpleContentBlock`` and seed it with the legacy quick-tips text.

    The model is first created with a ``label`` field, the seed rows are
    written by ``load_legacy_content_blocks``, and only then is ``label``
    renamed to ``slug`` and redefined as a ``SlugField``. The data step must
    therefore stay between the ``CreateModel`` and ``RenameField`` operations,
    because it populates the field under its original ``label`` name.
    """

    dependencies = [("concordia", "0032_topic_ordering")]

    operations = [
        migrations.AlterModelOptions(name="topic", options={}),
        migrations.CreateModel(
            name="SimpleContentBlock",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                (
                    "label",
                    models.CharField(
                        help_text="Label that is used to refer to this content in the code",
                        max_length=255,
                        unique=True,
                    ),
                ),
                ("body", models.TextField()),
            ],
        ),
        # Without reverse_code, RunPython makes the whole migration
        # irreversible. A no-op is a sufficient reverse here: unapplying the
        # CreateModel above drops the table, and the seeded rows with it.
        migrations.RunPython(
            code=load_legacy_content_blocks,
            reverse_code=migrations.RunPython.noop,
        ),
        migrations.RenameField(
            model_name="simplecontentblock", old_name="label", new_name="slug"
        ),
        migrations.AlterField(
            model_name="simplecontentblock",
            name="slug",
            field=models.SlugField(
                help_text="Label that templates use to retrieve this block",
                max_length=255,
                unique=True,
            ),
        ),
    ]


# HTML body stored in the "prototype_quicktips" SimpleContentBlock by
# load_legacy_content_blocks(). It contains transcription tips, review tips,
# a Help Center link and a table of viewer keyboard shortcuts. The text is
# written to the database verbatim, so any edit here changes the seeded data.
PROTOTYPE_QUICKTIPS = """
<h2 class="sr-only">Help</h2>
<section>
    <h3>Transcription tips</h3>
    <ul>
        <li>Type what you see: Preserve line breaks, original spelling, and punctuation.</li>
        <li>Use brackets [ ] around deleted, illegible or partially legible text.</li>
        <li>Use question mark ? for any words or letters you can't identify.</li>
        <li>Use square brackets and asterisks [ * * ] around text from margins.</li>
        <li>Include insertions where you would read them in the text.</li>
        <li>Click “Save” to save work in progress and “Submit” when complete</li>
    </ul>
</section>
<hr />
<section>
    <h3>Review tips</h3>
    <ul>
        <li>Carefully compare each line of the transcription to the original.</li>
        <li>Use “Transcription tips” as a guide.</li>
        <li>Click “Accept” if accurate or “Edit” if page needs correction.</li>
    </ul>
</section>
<hr />
<section>
    <h3 class="sr-only">More information</h3>
    <p>
    Find more detailed instructions in the <a href="/help-center/" target="_blank">Help Center</a>
    </p>
</section>
<hr />
<section>
    <h3>Keyboard Shortcuts</h3>
    <ul class="list-unstyled d-table">
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>w</kbd> or <kbd>up</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2 w-60">Scroll the viewport up</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>s</kbd> or <kbd>down</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Scroll the viewport down</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>a</kbd> or <kbd>left</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Scroll the viewport left</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>d</kbd> or <kbd>right</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Scroll the viewport right</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>0</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Fit the entire image to the viewport</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>-</kbd> or <kbd>_</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Zoom the viewport out</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>=</kbd> or <kbd>+</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Zoom the viewport in</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>r</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Rotate the viewport clockwise</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>R</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Rotate the viewport counterclockwise</div>
        </li>
        <li class="d-table-row">
            <div class="d-table-cell align-middle border-top py-2"><kbd>f</kbd></div>
            <div class="d-table-cell align-middle border-top py-2 pl-2">Flip the viewport horizontally</div>
        </li>
    </ul>
</section>
"""

# HTML body stored in the "classic_quicktips" SimpleContentBlock by
# load_legacy_content_blocks(): a short list of transcription tips followed by
# a Help Center link. The text is written to the database verbatim.
CLASSIC_QUICKTIPS = """
<ul>
    <li>Transcribe original spelling, punctuation, word order, and any page numbers or catalog marks.</li>
    <li>Preserve line breaks except when a word breaks over a line or page. Then transcribe it on the line or page where it starts.</li>
    <li>Use brackets [ ] around deleted, illegible or partially legible text, and square brackets and asterisks around text in margins [ * * ].</li>
    <li>Transcribe any words or letters you can't identify as [?].</li>
    <li>Include insertions where you would read them in the text.</li>
</ul>
Find more detailed instructions in the <a href="/help-center/">Help Center</a>
"""


================================================
FILE: concordia/migrations/0034_auto_20190627_1438.py
================================================
# Generated by Django 2.2.2 on 2019-06-27 18:38

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Redefine fifteen ``sitereport`` counters as nullable integers.

    Every listed field becomes ``IntegerField(blank=True, null=True)``.
    """

    dependencies = [
        ("concordia", "0034_auto_20190627_1438".replace("0034_auto_20190627_1438", "0033_simple_content_blocks")),
    ]

    # One AlterField per counter, in this order; each operation gets its own
    # field instance.
    operations = [
        migrations.AlterField(
            model_name="sitereport",
            name=counter_name,
            field=models.IntegerField(blank=True, null=True),
        )
        for counter_name in (
            "anonymous_transcriptions",
            "assets_completed",
            "assets_in_progress",
            "assets_not_started",
            "assets_published",
            "assets_total",
            "assets_unpublished",
            "assets_waiting_review",
            "distinct_tags",
            "items_published",
            "items_unpublished",
            "projects_published",
            "projects_unpublished",
            "tag_uses",
            "transcriptions_saved",
        )
    ]


================================================
FILE: concordia/migrations/0035_auto_20190627_1455.py
================================================
# Generated by Django 2.2.2 on 2019-06-27 18:55

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``sitereport.created_on`` as a non-editable ``DateTimeField``."""

    dependencies = [
        ("concordia", "0034_auto_20190627_1438"),
    ]

    operations = [
        migrations.AlterField(
            "sitereport",
            "created_on",
            field=models.DateTimeField(editable=False),
        ),
    ]


================================================
FILE: concordia/migrations/0036_auto_20190703_1203.py
================================================
# Generated by Django 2.2.2 on 2019-07-03 16:09

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``sitereport.created_on`` with ``auto_now_add=True``."""

    dependencies = [
        ("concordia", "0035_auto_20190627_1455"),
    ]

    operations = [
        migrations.AlterField(
            "sitereport",
            "created_on",
            field=models.DateTimeField(auto_now_add=True),
        ),
    ]


================================================
FILE: concordia/migrations/0037_carouselslide.py
================================================
# Generated by Django 2.2.3 on 2019-07-31 16:29

from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the ``CarouselSlide`` model."""

    dependencies = [
        ("concordia", "0036_auto_20190703_1203"),
    ]

    operations = [
        migrations.CreateModel(
            "CarouselSlide",
            [
                (
                    "id",
                    models.AutoField(
                        verbose_name="ID",
                        serialize=False,
                        primary_key=True,
                        auto_created=True,
                    ),
                ),
                # Timestamps maintained automatically on insert / update.
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                (
                    "ordering",
                    models.IntegerField(
                        help_text="Sort order: lower values will be listed first",
                        default=0,
                    ),
                ),
                ("published", models.BooleanField(default=False, blank=True)),
                (
                    "overlay_position",
                    models.CharField(
                        max_length=5,
                        choices=[("left", "Left"), ("right", "Right")],
                    ),
                ),
                ("headline", models.CharField(max_length=255)),
                ("body", models.TextField(blank=True)),
                ("image_alt_text", models.TextField(blank=True)),
                (
                    "carousel_image",
                    models.ImageField(
                        upload_to="carousel-slides", null=True, blank=True
                    ),
                ),
                ("lets_go_url", models.CharField(max_length=255)),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0038_sitereport_topic.py
================================================
# Generated by Django 2.2.3 on 2019-07-31 22:09

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the nullable ``sitereport.topic`` foreign key (``DO_NOTHING`` on delete)."""

    dependencies = [
        ("concordia", "0037_carouselslide"),
    ]

    operations = [
        migrations.AddField(
            "sitereport",
            "topic",
            field=models.ForeignKey(
                to="concordia.Topic",
                on_delete=django.db.models.deletion.DO_NOTHING,
                null=True,
                blank=True,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0039_auto_20200129_1536.py
================================================
# Generated by Django 2.2.7 on 2020-01-29 20:36

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Redefine ``item.title`` and the ``sitereport`` foreign keys.

    ``item.title`` becomes a 500-character ``CharField``; the ``campaign``
    and ``topic`` foreign keys on ``sitereport`` are redefined with
    ``on_delete=SET_NULL``.
    """

    dependencies = [("concordia", "0038_sitereport_topic")]

    operations = [
        migrations.AlterField(
            "item",
            "title",
            field=models.CharField(max_length=500),
        ),
        migrations.AlterField(
            "sitereport",
            "campaign",
            field=models.ForeignKey(
                to="concordia.Campaign",
                on_delete=django.db.models.deletion.SET_NULL,
                null=True,
                blank=True,
            ),
        ),
        migrations.AlterField(
            "sitereport",
            "topic",
            field=models.ForeignKey(
                to="concordia.Topic",
                on_delete=django.db.models.deletion.SET_NULL,
                null=True,
                blank=True,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0040_auto_20200130_1756.py
================================================
# Generated by Django 2.2.7 on 2020-01-30 22:56

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Add ``assettranscriptionreservation.tombstoned`` and redefine ``asset``.

    ``tombstoned`` is a nullable boolean defaulting to ``False``; ``asset``
    is redefined as a cascading foreign key to ``concordia.Asset``.
    """

    dependencies = [("concordia", "0039_auto_20200129_1536")]

    operations = [
        migrations.AddField(
            "assettranscriptionreservation",
            "tombstoned",
            field=models.BooleanField(default=False, null=True, blank=True),
        ),
        migrations.AlterField(
            "assettranscriptionreservation",
            "asset",
            field=models.ForeignKey(
                to="concordia.Asset",
                on_delete=django.db.models.deletion.CASCADE,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0041_auto_20200203_1351.py
================================================
# Generated by Django 2.2.7 on 2020-02-03 18:51

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``item.title`` as a 600-character ``CharField``."""

    dependencies = [("concordia", "0040_auto_20200130_1756")]

    operations = [
        migrations.AlterField(
            "item",
            "title",
            field=models.CharField(max_length=600),
        ),
    ]


================================================
FILE: concordia/migrations/0042_auto_20200316_1623.py
================================================
# Generated by Django 2.2.10 on 2020-03-16 20:23

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add a boolean ``unlisted`` flag (default ``False``) to campaign and topic."""

    dependencies = [("concordia", "0041_auto_20200203_1351")]

    # The same field definition is added to each model, in this order.
    operations = [
        migrations.AddField(
            model_name=model_name,
            name="unlisted",
            field=models.BooleanField(blank=True, default=False),
        )
        for model_name in ("campaign", "topic")
    ]


================================================
FILE: concordia/migrations/0043_auto_20200323_1729.py
================================================
# Generated by Django 2.2.11 on 2020-03-23 21:29

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Redefine the ``published`` / ``unlisted`` flags with ``db_index=True``.

    Every listed (model, field) pair becomes
    ``BooleanField(blank=True, db_index=True, default=False)``.
    """

    dependencies = [("concordia", "0042_auto_20200316_1623")]

    # One AlterField per (model, field) pair, in this order.
    operations = [
        migrations.AlterField(
            model_name=model_name,
            name=flag_name,
            field=models.BooleanField(blank=True, db_index=True, default=False),
        )
        for model_name, flag_name in (
            ("asset", "published"),
            ("campaign", "published"),
            ("campaign", "unlisted"),
            ("item", "published"),
            ("project", "published"),
            ("topic", "published"),
            ("topic", "unlisted"),
        )
    ]


================================================
FILE: concordia/migrations/0044_auto_20200323_1827.py
================================================
# Generated by Django 2.2.11 on 2020-03-23 22:27

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add multi-column indexes on asset, campaign and topic."""

    dependencies = [("concordia", "0043_auto_20200323_1729")]

    # (model, indexed columns, index name), applied in this order.
    operations = [
        migrations.AddIndex(
            model_name=model_name,
            index=models.Index(fields=indexed_fields, name=index_name),
        )
        for model_name, indexed_fields, index_name in (
            (
                "asset",
                ["id", "published", "transcription_status"],
                "concordia_a_id_0c37bf_idx",
            ),
            (
                "campaign",
                ["published", "unlisted"],
                "concordia_c_publish_2c3b1c_idx",
            ),
            (
                "topic",
                ["published", "unlisted"],
                "concordia_t_publish_7f5b9d_idx",
            ),
        )
    ]


================================================
FILE: concordia/migrations/0045_auto_20200323_1832.py
================================================
# Generated by Django 2.2.11 on 2020-03-23 22:32

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add an index on ``asset`` over ``published`` and ``transcription_status``."""

    dependencies = [("concordia", "0044_auto_20200323_1827")]

    operations = [
        migrations.AddIndex(
            "asset",
            models.Index(
                name="concordia_a_publish_4761f1_idx",
                fields=["published", "transcription_status"],
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0046_auto_20200323_1907.py
================================================
# Generated by Django 2.2.11 on 2020-03-23 23:07

from django.db import migrations, models


class Migration(migrations.Migration):
    """Alter asset.transcription_status.

    The field is declared as a non-editable, indexed CharField (max_length 20)
    with four status choices and a default of "not_started".
    """

    dependencies = [
        ("concordia", "0045_auto_20200323_1832"),
    ]

    operations = [
        migrations.AlterField(
            model_name="asset",
            name="transcription_status",
            field=models.CharField(
                # (stored value, display label) pairs
                choices=[
                    ("not_started", "Not Started"),
                    ("in_progress", "In Progress"),
                    ("submitted", "Needs Review"),
                    ("completed", "Completed"),
                ],
                db_index=True,
                default="not_started",
                editable=False,
                max_length=20,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0047_auto_20200324_1103.py
================================================
# Generated by Django 2.2.11 on 2020-03-24 15:03

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add an index on transcription (asset, user)."""

    dependencies = [
        ("concordia", "0046_auto_20200323_1907"),
    ]

    operations = [
        migrations.AddIndex(
            model_name="transcription",
            index=models.Index(
                fields=["asset", "user"], name="concordia_t_asset_i_4fcaa1_idx"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0048_auto_20200324_1820.py
================================================
# Generated by Django 2.2.11 on 2020-03-24 22:20

from django.db import migrations, models


class Migration(migrations.Migration):
    """Rework publication-related indexes on asset, item and project.

    Removes one asset index, redeclares item.published and project.published
    without db_index, and adds three multi-column indexes.
    """

    dependencies = [
        ("concordia", "0047_auto_20200324_1103"),
    ]

    operations = [
        # This is the (id, published, transcription_status) index that
        # migration 0044 created under the same name.
        migrations.RemoveIndex(
            model_name="asset",
            name="concordia_a_id_0c37bf_idx",
        ),
        # Neither published field below carries db_index in this declaration.
        migrations.AlterField(
            model_name="item",
            name="published",
            field=models.BooleanField(blank=True, default=False),
        ),
        migrations.AlterField(
            model_name="project",
            name="published",
            field=models.BooleanField(blank=True, default=False),
        ),
        # Replacement asset index: same columns as the removed one plus "item".
        migrations.AddIndex(
            model_name="asset",
            index=models.Index(
                fields=["id", "item", "published", "transcription_status"],
                name="concordia_a_id_137ca8_idx",
            ),
        ),
        migrations.AddIndex(
            model_name="item",
            index=models.Index(
                fields=["project", "published"], name="concordia_i_project_d8caf0_idx"
            ),
        ),
        migrations.AddIndex(
            model_name="project",
            index=models.Index(
                fields=["id", "campaign", "published"], name="concordia_p_id_17c9c9_idx"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0049_auto_20200324_2004.py
================================================
# Generated by Django 2.2.11 on 2020-03-25 00:04

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redeclare project.published with db_index=True."""

    dependencies = [
        ("concordia", "0048_auto_20200324_1820"),
    ]

    operations = [
        # Migration 0048 declared this field without db_index; this adds it.
        migrations.AlterField(
            model_name="project",
            name="published",
            field=models.BooleanField(blank=True, db_index=True, default=False),
        ),
    ]


================================================
FILE: concordia/migrations/0050_auto_20210920_1544.py
================================================
# Generated by Django 2.2.20 on 2021-09-20 19:44

import django.core.validators
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add project.ordering and redeclare tag.value with a regex validator."""

    dependencies = [
        ("concordia", "0049_auto_20200324_2004"),
    ]

    operations = [
        migrations.AddField(
            model_name="project",
            name="ordering",
            field=models.IntegerField(
                default=0,
                help_text="Sort order override: lower values will be listed first",
            ),
        ),
        migrations.AlterField(
            model_name="tag",
            name="value",
            field=models.CharField(
                max_length=50,
                # The pattern accepts 1 to 50 characters drawn from: hyphen,
                # space, underscore, the À-ž range, apostrophe and \w.
                validators=[
                    django.core.validators.RegexValidator("^[- _À-ž'\\w]{1,50}$")
                ],
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0051_asset_storage_image.py
================================================
# Generated by Django 2.2.24 on 2022-01-11 18:14

from django.db import migrations, models

import concordia.models


class Migration(migrations.Migration):
    """Add the optional asset.storage_image ImageField."""

    dependencies = [
        ("concordia", "0050_auto_20210920_1544"),
    ]

    operations = [
        migrations.AddField(
            model_name="asset",
            name="storage_image",
            field=models.ImageField(
                blank=True,
                max_length=255,
                null=True,
                # Upload path is delegated to a callable on the Asset model,
                # so this migration imports concordia.models.
                upload_to=concordia.models.Asset.get_storage_path,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0052_auto_20220531_1331.py
================================================
# Generated by Django 3.2.13 on 2022-05-31 17:31

from django.db import migrations, models


class Migration(migrations.Migration):
    """Set default orderings and redeclare the metadata JSON fields.

    Resource is ordered by "sequence" and sitereport by "-created_on". The
    metadata fields on asset, campaign, item and project are declared as
    nullable models.JSONField with a dict default.
    """

    dependencies = [
        ("concordia", "0051_asset_storage_image"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="resource",
            options={"ordering": ("sequence",)},
        ),
        migrations.AlterModelOptions(
            name="sitereport",
            options={"ordering": ("-created_on",)},
        ),
        migrations.AlterField(
            model_name="asset",
            name="metadata",
            field=models.JSONField(blank=True, default=dict, null=True),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="metadata",
            field=models.JSONField(blank=True, default=dict, null=True),
        ),
        # Item is the only one of the four that also carries help_text.
        migrations.AlterField(
            model_name="item",
            name="metadata",
            field=models.JSONField(
                blank=True,
                default=dict,
                help_text="Raw metadata returned by the remote API",
                null=True,
            ),
        ),
        migrations.AlterField(
            model_name="project",
            name="metadata",
            field=models.JSONField(blank=True, default=dict, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0053_banner.py
================================================
# Generated by Django 3.2.14 on 2022-08-09 17:28

from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the Banner model.

    Fields: auto id, created_on/updated_on timestamps, text, link and the
    open_in_new_window_tab flag (default True).
    """

    dependencies = [
        ("concordia", "0052_auto_20220531_1331"),
    ]

    operations = [
        migrations.CreateModel(
            name="Banner",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                ("text", models.CharField(max_length=255)),
                # link is a plain CharField here, not a URLField.
                ("link", models.CharField(max_length=255)),
                (
                    "open_in_new_window_tab",
                    models.BooleanField(blank=True, default=True),
                ),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0054_banner_active.py
================================================
# Generated by Django 3.2.14 on 2022-09-16 17:10

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add banner.active, a BooleanField defaulting to False."""

    dependencies = [
        ("concordia", "0053_banner"),
    ]

    operations = [
        migrations.AddField(
            model_name="banner",
            name="active",
            field=models.BooleanField(blank=True, default=False),
        ),
    ]


================================================
FILE: concordia/migrations/0055_campaign_status.py
================================================
# Generated by Django 3.2.15 on 2022-09-19 19:16

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add campaign.status, an integer choice field defaulting to 1 (Active)."""

    dependencies = [
        ("concordia", "0054_banner_active"),
    ]

    operations = [
        migrations.AddField(
            model_name="campaign",
            name="status",
            # Choices are (stored integer, display label) pairs.
            field=models.IntegerField(
                choices=[(1, "Active"), (2, "Completed"), (3, "Retired")], default=1
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0056_auto_20220922_1508.py
================================================
# Generated by Django 3.2.15 on 2022-09-22 19:08

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the nullable campaign.completed_date and campaign.launch_date."""

    dependencies = [
        ("concordia", "0055_campaign_status"),
    ]

    operations = [
        # Both fields are optional (blank=True, null=True) DateFields.
        migrations.AddField(
            model_name="campaign",
            name="completed_date",
            field=models.DateField(blank=True, null=True),
        ),
        migrations.AddField(
            model_name="campaign",
            name="launch_date",
            field=models.DateField(blank=True, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0057_resource_resource_type.py
================================================
# Generated by Django 3.2.15 on 2022-09-26 17:20

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add resource.resource_type, an integer choice field defaulting to 1."""

    dependencies = [
        ("concordia", "0056_auto_20220922_1508"),
    ]

    operations = [
        migrations.AddField(
            model_name="resource",
            name="resource_type",
            # Default 1 corresponds to the "Related Link" choice.
            field=models.IntegerField(
                choices=[(1, "Related Link"), (2, "Completed Transcription Link")],
                default=1,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0058_banner_slug.py
================================================
# Generated by Django 3.2.14 on 2022-10-18 17:28

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add banner.slug, a unique SlugField (max_length 80, unicode allowed)."""

    dependencies = [
        ("concordia", "0057_resource_resource_type"),
    ]

    operations = [
        migrations.AddField(
            model_name="banner",
            name="slug",
            # default="banner_1" together with preserve_default=False is a
            # one-off value for this operation, not a lasting model default.
            # NOTE(review): the field is unique, so applying this where more
            # than one banner row already exists would presumably fail on the
            # uniqueness constraint - confirm against deployed data.
            field=models.SlugField(
                allow_unicode=True, default="banner_1", max_length=80, unique=True
            ),
            preserve_default=False,
        ),
    ]


================================================
FILE: concordia/migrations/0059_resourcefile.py
================================================
# Generated by Django 3.2.15 on 2022-12-17 20:47

from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the ResourceFile model (name + uploaded file), ordered by name."""

    dependencies = [
        ("concordia", "0058_banner_slug"),
    ]

    operations = [
        migrations.CreateModel(
            name="ResourceFile",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("name", models.CharField(max_length=255)),
                # Files are uploaded under the fixed "cm-uploads/" prefix.
                ("resource", models.FileField(upload_to="cm-uploads/")),
            ],
            options={
                "ordering": ["name"],
            },
        ),
    ]


================================================
FILE: concordia/migrations/0060_alter_resourcefile_resource.py
================================================
# Generated by Django 3.2.15 on 2022-12-17 21:53

from django.db import migrations, models


class Migration(migrations.Migration):
    """Change the upload_to prefix of resourcefile.resource."""

    dependencies = [
        ("concordia", "0059_resourcefile"),
    ]

    operations = [
        # Migration 0059 used "cm-uploads/"; this moves uploads to a
        # "cm-uploads/resources/%Y/" pattern.
        migrations.AlterField(
            model_name="resourcefile",
            name="resource",
            field=models.FileField(upload_to="cm-uploads/resources/%Y/"),
        ),
    ]


================================================
FILE: concordia/migrations/0061_auto_20230201_1453.py
================================================
# Generated by Django 3.2.15 on 2023-02-01 19:53

from django.db import migrations, models

import concordia.models


class Migration(migrations.Migration):
    """Add resourcefile.path and make the upload location a callable."""

    dependencies = [
        ("concordia", "0060_alter_resourcefile_resource"),
    ]

    operations = [
        migrations.AddField(
            model_name="resourcefile",
            name="path",
            field=models.CharField(blank=True, default="", max_length=255),
        ),
        # upload_to switches from a string pattern to the function
        # concordia.models.resource_file_upload_path.
        migrations.AlterField(
            model_name="resourcefile",
            name="resource",
            field=models.FileField(
                upload_to=concordia.models.resource_file_upload_path
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0061_sitereport_registered_contributors.py
================================================
# Generated by Django 3.2.15 on 2022-12-15 01:18

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the nullable sitereport.registered_contributors integer field."""

    # This migration and 0061_auto_20230201_1453 both depend on 0060, so the
    # migration graph has two branches from this point.
    dependencies = [
        ("concordia", "0060_alter_resourcefile_resource"),
    ]

    operations = [
        migrations.AddField(
            model_name="sitereport",
            name="registered_contributors",
            field=models.IntegerField(blank=True, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0062_resourcefile_updated_on.py
================================================
# Generated by Django 3.2.15 on 2023-02-07 20:45

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add resourcefile.updated_on, a DateTimeField with auto_now=True."""

    dependencies = [
        ("concordia", "0061_auto_20230201_1453"),
    ]

    operations = [
        migrations.AddField(
            model_name="resourcefile",
            name="updated_on",
            field=models.DateTimeField(auto_now=True),
        ),
    ]


================================================
FILE: concordia/migrations/0062_userretiredcampaign.py
================================================
# Generated by Django 3.2.14 on 2023-01-20 18:42

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the UserRetiredCampaign model.

    Each row links a user and a campaign (both cascading foreign keys) and
    holds four nullable integer counts.
    """

    dependencies = [
        # The user foreign key targets the swappable AUTH_USER_MODEL.
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0061_sitereport_registered_contributors"),
    ]

    operations = [
        migrations.CreateModel(
            name="UserRetiredCampaign",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("asset_count", models.IntegerField(blank=True, null=True)),
                ("asset_tag_count", models.IntegerField(blank=True, null=True)),
                (
                    "transcribe_count",
                    models.IntegerField(
                        blank=True,
                        null=True,
                        verbose_name="transcription save/submit count",
                    ),
                ),
                (
                    "review_count",
                    models.IntegerField(
                        blank=True, null=True, verbose_name="transcription review count"
                    ),
                ),
                (
                    "campaign",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.campaign",
                    ),
                ),
                (
                    "user",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0063_banner_alert_status.py
================================================
# Generated by Django 3.2.17 on 2023-02-16 17:33

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add banner.alert_status, a choice CharField defaulting to "SUCCESS"."""

    dependencies = [
        ("concordia", "0062_resourcefile_updated_on"),
    ]

    operations = [
        migrations.AddField(
            model_name="banner",
            name="alert_status",
            field=models.CharField(
                choices=[
                    ("DANGER", "Danger"),
                    ("INFO", "Information"),
                    ("SUCCESS", "Success"),
                    ("WARN", "Warning"),
                ],
                default="SUCCESS",
                # 7 is the length of the longest key above ("SUCCESS").
                max_length=7,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0064_alter_banner_alert_status.py
================================================
# Generated by Django 3.2.17 on 2023-02-23 17:37

from django.db import migrations, models


class Migration(migrations.Migration):
    """Relabel banner.alert_status choices as colors and add two more.

    The display labels become color names, "PRIMARY" and "SECONDA" are added
    as keys, and the field gets the verbose name "Color".
    """

    dependencies = [
        ("concordia", "0063_banner_alert_status"),
    ]

    operations = [
        migrations.AlterField(
            model_name="banner",
            name="alert_status",
            field=models.CharField(
                choices=[
                    ("DANGER", "Red"),
                    ("INFO", "Teal"),
                    ("PRIMARY", "Blue"),
                    ("SECONDA", "Grey"),
                    ("SUCCESS", "Green"),
                    ("WARN", "Yellow"),
                ],
                default="SUCCESS",
                # max_length stays 7; every key above is at most 7 characters.
                max_length=7,
                verbose_name="Color",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0065_alter_userretiredcampaign_unique_together.py
================================================
# Generated by Django 3.2.14 on 2023-02-13 20:51

from django.conf import settings
from django.db import migrations


class Migration(migrations.Migration):
    """Make (user, campaign) unique together on userretiredcampaign."""

    dependencies = [
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0062_userretiredcampaign"),
    ]

    operations = [
        migrations.AlterUniqueTogether(
            name="userretiredcampaign",
            unique_together={("user", "campaign")},
        ),
    ]


================================================
FILE: concordia/migrations/0066_auto_20230217_1302.py
================================================
# Generated by Django 3.2.17 on 2023-02-17 13:02

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Rename labels on userretiredcampaign and swap its uniqueness rule.

    Sets verbose names on the model and its two foreign keys, clears
    unique_together, and adds a UniqueConstraint on (user, campaign).
    """

    dependencies = [
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0065_alter_userretiredcampaign_unique_together"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="userretiredcampaign",
            options={"verbose_name": "user completed campaign count"},
        ),
        migrations.AlterField(
            model_name="userretiredcampaign",
            name="campaign",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE,
                to="concordia.campaign",
                verbose_name="Campaign Id",
            ),
        ),
        migrations.AlterField(
            model_name="userretiredcampaign",
            name="user",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE,
                to=settings.AUTH_USER_MODEL,
                verbose_name="User Id",
            ),
        ),
        # The unique_together rule from migration 0065 is dropped first, then
        # re-expressed as a named UniqueConstraint on the same two fields.
        migrations.AlterUniqueTogether(
            name="userretiredcampaign",
            unique_together=set(),
        ),
        migrations.AddConstraint(
            model_name="userretiredcampaign",
            constraint=models.UniqueConstraint(
                fields=("user", "campaign"), name="user_profile_activity"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0066_campaignretirementprogress.py
================================================
# Generated by Django 3.2.16 on 2023-02-22 20:26

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the CampaignRetirementProgress model.

    It holds total/removed integer counters for projects, items and assets
    (all defaulting to 0) and a cascading foreign key to campaign.
    """

    # Shares its parent (0065) with 0066_auto_20230217_1302.
    dependencies = [
        ("concordia", "0065_alter_userretiredcampaign_unique_together"),
    ]

    operations = [
        migrations.CreateModel(
            name="CampaignRetirementProgress",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("project_total", models.IntegerField(default=0)),
                ("projects_removed", models.IntegerField(default=0)),
                ("item_total", models.IntegerField(default=0)),
                ("items_removed", models.IntegerField(default=0)),
                ("asset_total", models.IntegerField(default=0)),
                ("assets_removed", models.IntegerField(default=0)),
                (
                    "campaign",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.campaign",
                    ),
                ),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0067_alter_campaignretirementprogress_campaign.py
================================================
# Generated by Django 3.2.16 on 2023-02-22 20:56

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Turn campaignretirementprogress.campaign into a OneToOneField."""

    dependencies = [
        ("concordia", "0066_campaignretirementprogress"),
    ]

    operations = [
        # Migration 0066 created this relation as a ForeignKey.
        migrations.AlterField(
            model_name="campaignretirementprogress",
            name="campaign",
            field=models.OneToOneField(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.campaign"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0068_campaignretirementprogress_complete.py
================================================
# Generated by Django 3.2.16 on 2023-02-23 20:35

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add campaignretirementprogress.complete, defaulting to False."""

    dependencies = [
        ("concordia", "0067_alter_campaignretirementprogress_campaign"),
    ]

    operations = [
        migrations.AddField(
            model_name="campaignretirementprogress",
            name="complete",
            field=models.BooleanField(default=False),
        ),
    ]


================================================
FILE: concordia/migrations/0069_merge_20230224_1446.py
================================================
# Generated by Django 3.2.16 on 2023-02-24 19:46

from django.db import migrations


class Migration(migrations.Migration):
    """Merge migration joining the two branches that forked after 0065."""

    # One parent per branch: the userretiredcampaign changes (0066_auto) and
    # the campaignretirementprogress chain (0066 -> 0067 -> 0068).
    dependencies = [
        ("concordia", "0066_auto_20230217_1302"),
        ("concordia", "0068_campaignretirementprogress_complete"),
    ]

    # No schema changes; this migration only reunites the graph.
    operations = []


================================================
FILE: concordia/migrations/0070_alter_campaign_options.py
================================================
# Generated by Django 3.2.16 on 2023-02-27 16:29

from django.db import migrations


class Migration(migrations.Migration):
    """Declare the custom "retire_campaign" permission on campaign."""

    dependencies = [
        ("concordia", "0069_merge_20230224_1446"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="campaign",
            # (codename, human-readable name)
            options={"permissions": [("retire_campaign", "Can retire campaign")]},
        ),
    ]


================================================
FILE: concordia/migrations/0071_auto_20230306_1456.py
================================================
# Generated by Django 3.2.16 on 2023-03-06 19:56

import django.utils.timezone
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add completed_on, removal_log and started_on to the progress model."""

    dependencies = [
        ("concordia", "0070_alter_campaign_options"),
    ]

    operations = [
        migrations.AddField(
            model_name="campaignretirementprogress",
            name="completed_on",
            field=models.DateTimeField(null=True),
        ),
        migrations.AddField(
            model_name="campaignretirementprogress",
            name="removal_log",
            # The callable `list` is the default, not a shared list instance.
            field=models.JSONField(default=list),
        ),
        migrations.AddField(
            model_name="campaignretirementprogress",
            name="started_on",
            # timezone.now is a one-off default for this operation only
            # (preserve_default=False); the field itself is auto_now_add.
            field=models.DateTimeField(
                auto_now_add=True, default=django.utils.timezone.now
            ),
            preserve_default=False,
        ),
    ]


================================================
FILE: concordia/migrations/0072_merge_20230313_1047.py
================================================
# Generated by Django 3.2.18 on 2023-03-13 14:47

from django.db import migrations


class Migration(migrations.Migration):
    """Merge migration joining the two branches that forked after 0060."""

    # One parent per branch: the banner/resourcefile chain ending at 0064 and
    # the campaign-retirement chain ending at 0071.
    dependencies = [
        ("concordia", "0064_alter_banner_alert_status"),
        ("concordia", "0071_auto_20230306_1456"),
    ]

    # No schema changes; this migration only reunites the graph.
    operations = []


================================================
FILE: concordia/migrations/0073_auto_20230314_1327.py
================================================
# Generated by Django 3.2.18 on 2023-03-14 13:27

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Revise banner colors and create the UserProfileActivity model.

    Redeclares banner.alert_status with four choices, creates
    UserProfileActivity (per-user, per-campaign nullable counts) and adds a
    unique constraint on its (user, campaign) pair.
    """

    dependencies = [
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0072_merge_20230313_1047"),
    ]

    operations = [
        migrations.AlterField(
            model_name="banner",
            name="alert_status",
            field=models.CharField(
                # Compared with migration 0064, the keys "PRIMARY", "SECONDA"
                # and "WARN" are no longer listed and "WARNING" is new.
                # NOTE(review): no data operation in this migration rewrites
                # rows holding the dropped keys - confirm none exist.
                choices=[
                    ("DANGER", "Red"),
                    ("INFO", "Blue"),
                    ("SUCCESS", "Green"),
                    ("WARNING", "Grey"),
                ],
                default="SUCCESS",
                max_length=7,
                verbose_name="Color",
            ),
        ),
        # The field list below mirrors userretiredcampaign as it stands after
        # migration 0066_auto (same counts, same verbose names on the FKs).
        migrations.CreateModel(
            name="UserProfileActivity",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("asset_count", models.IntegerField(blank=True, null=True)),
                ("asset_tag_count", models.IntegerField(blank=True, null=True)),
                (
                    "transcribe_count",
                    models.IntegerField(
                        blank=True,
                        null=True,
                        verbose_name="transcription save/submit count",
                    ),
                ),
                (
                    "review_count",
                    models.IntegerField(
                        blank=True, null=True, verbose_name="transcription review count"
                    ),
                ),
                (
                    "campaign",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.campaign",
                        verbose_name="Campaign Id",
                    ),
                ),
                (
                    "user",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to=settings.AUTH_USER_MODEL,
                        verbose_name="User Id",
                    ),
                ),
            ],
        ),
        # NOTE(review): this constraint is named "user_campaign_count" while
        # the one on userretiredcampaign (0066_auto) is named
        # "user_profile_activity"; the names look swapped relative to the
        # models - confirm before relying on them.
        migrations.AddConstraint(
            model_name="userprofileactivity",
            constraint=models.UniqueConstraint(
                fields=("user", "campaign"), name="user_campaign_count"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0074_auto_20230314_1341.py
================================================
# Generated by Django 3.2.18 on 2023-03-14 13:41

from django.db import migrations


def forwards_func(apps, schema_editor):
    """Do nothing when this migration is applied.

    The work this step used to perform now lives in tasks.py. The migration is
    kept as a placeholder in case any environment still references it.
    """
    return None


def reverse_func(apps, schema_editor):
    """Delete every UserProfileActivity row when the migration is unapplied.

    The deletion is issued against the database alias of the connection that
    `schema_editor` is bound to.
    """
    activity_model = apps.get_model("concordia", "UserProfileActivity")
    activities = activity_model.objects.using(schema_editor.connection.alias)
    activities.all().delete()


class Migration(migrations.Migration):
    """Data-migration wrapper around forwards_func and reverse_func."""

    dependencies = [
        ("concordia", "0073_auto_20230314_1327"),
    ]

    operations = [
        # forwards_func is passed as the forward callable and reverse_func as
        # the reverse callable.
        migrations.RunPython(forwards_func, reverse_func),
    ]


================================================
FILE: concordia/migrations/0075_auto_20230327_1333.py
================================================
# Generated by Django 3.2.18 on 2023-03-27 17:33

from django.db import migrations


class Migration(migrations.Migration):
    """Add the "reopen_asset" permission and a plural name for activities."""

    dependencies = [
        ("concordia", "0074_auto_20230314_1341"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="asset",
            # (codename, human-readable name)
            options={"permissions": [("reopen_asset", "Can reopen asset")]},
        ),
        migrations.AlterModelOptions(
            name="userprofileactivity",
            options={"verbose_name_plural": "User profile activities"},
        ),
    ]


================================================
FILE: concordia/migrations/0076_sitereport_report_name.py
================================================
# Generated by Django 3.2.18 on 2023-04-27 17:17

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add sitereport.report_name, an optional CharField (max_length 80)."""

    dependencies = [
        ("concordia", "0075_auto_20230327_1333"),
    ]

    operations = [
        migrations.AddField(
            model_name="sitereport",
            name="report_name",
            # The empty string, not NULL, is the default for this field.
            field=models.CharField(blank=True, default="", max_length=80),
        ),
    ]


================================================
FILE: concordia/migrations/0077_alter_sitereport_report_name.py
================================================
# Generated by Django 3.2.18 on 2023-05-04 15:33

from django.db import migrations, models


def update_report_names(apps, schema_editor):
    """Normalize existing SiteReport.report_name values to the choice keys.

    Rows are rewritten one at a time, in this order:

    * "RETIRED TOTAL" and "Retired campaigns" become "RETIRED_TOTAL".
    * "Active and completed campaigns" becomes "TOTAL".
    * Rows with an empty report_name and neither a campaign nor a topic
      become "TOTAL".

    All queries and saves are routed through the database alias of the
    connection being migrated rather than the default manager's database.

    Args:
        apps: Historical app registry; used to look up the SiteReport model.
        schema_editor: Schema editor for the migration; only its
            ``connection.alias`` is read.

    Returns:
        None.
    """
    SiteReport = apps.get_model("concordia", "SiteReport")
    db_alias = schema_editor.connection.alias
    reports = SiteReport.objects.using(db_alias)

    # (filter lookups, replacement name) pairs, applied in order. Each filter
    # is evaluated only after the previous rewrites have been saved.
    renames = (
        ({"report_name": "RETIRED TOTAL"}, "RETIRED_TOTAL"),
        ({"report_name": "Retired campaigns"}, "RETIRED_TOTAL"),
        ({"report_name": "Active and completed campaigns"}, "TOTAL"),
        (
            {"report_name": "", "campaign__isnull": True, "topic__isnull": True},
            "TOTAL",
        ),
    )
    for lookups, new_name in renames:
        for report in reports.filter(**lookups):
            report.report_name = new_name
            # Per-row save keeps the field handling of the original loops.
            report.save(using=db_alias)


def backwards(apps, schema_editor):
    """Reverse step for the report-name rewrite: intentionally does nothing.

    The forward rewrite cannot be undone, so ``report_name`` values are left
    exactly as they are.
    """
    return None


class Migration(migrations.Migration):
    """Restrict ``sitereport.report_name`` to choices and rewrite stored values."""

    dependencies = [
        ("concordia", "0076_sitereport_report_name"),
    ]

    operations = [
        # Introduce the TOTAL / RETIRED_TOTAL choice keys on report_name.
        migrations.AlterField(
            model_name="sitereport",
            name="report_name",
            field=models.CharField(
                blank=True,
                choices=[
                    ("TOTAL", "Active and completed campaigns"),
                    ("RETIRED_TOTAL", "Retired campaigns"),
                ],
                default="",
                max_length=80,
            ),
        ),
        # Rewrite existing rows to the new keys; the reverse step is a no-op.
        migrations.RunPython(update_report_names, backwards),
    ]


================================================
FILE: concordia/migrations/0078_alter_sitereport_report_name.py
================================================
# Generated by Django 3.2.18 on 2023-05-08 15:13

from django.db import migrations, models


def update_report_names(apps, schema_editor):
    """Replace the short ``report_name`` keys with their human-readable names.

    ``"RETIRED_TOTAL"`` becomes ``"Retired campaigns"`` and ``"TOTAL"`` becomes
    ``"Active and completed campaigns"``.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython``; its connection
            alias selects the database being migrated.
    """
    SiteReport = apps.get_model("concordia", "SiteReport")
    # Operate on the database that is actually being migrated rather than
    # always on the default connection.
    db_alias = schema_editor.connection.alias
    reports = SiteReport.objects.using(db_alias)

    renames = (
        ("RETIRED_TOTAL", "Retired campaigns"),
        ("TOTAL", "Active and completed campaigns"),
    )
    for old_name, new_name in renames:
        # One UPDATE statement per rename instead of saving each row.
        reports.filter(report_name=old_name).update(report_name=new_name)


def backwards(apps, schema_editor):
    """Restore the short ``report_name`` keys from the human-readable names.

    ``"Retired campaigns"`` becomes ``"RETIRED_TOTAL"`` and
    ``"Active and completed campaigns"`` becomes ``"TOTAL"``.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython``; its connection
            alias selects the database being migrated.
    """
    SiteReport = apps.get_model("concordia", "SiteReport")
    # Operate on the database that is actually being migrated rather than
    # always on the default connection.
    db_alias = schema_editor.connection.alias
    reports = SiteReport.objects.using(db_alias)

    renames = (
        ("Retired campaigns", "RETIRED_TOTAL"),
        ("Active and completed campaigns", "TOTAL"),
    )
    for old_name, new_name in renames:
        # One UPDATE statement per rename instead of saving each row.
        reports.filter(report_name=old_name).update(report_name=new_name)


class Migration(migrations.Migration):
    """Switch ``sitereport.report_name`` choices to human-readable stored values."""

    dependencies = [
        ("concordia", "0077_alter_sitereport_report_name"),
    ]

    operations = [
        # Each choice now stores the same text that it displays.
        migrations.AlterField(
            model_name="sitereport",
            name="report_name",
            field=models.CharField(
                blank=True,
                choices=[
                    (
                        "Active and completed campaigns",
                        "Active and completed campaigns",
                    ),
                    ("Retired campaigns", "Retired campaigns"),
                ],
                default="",
                max_length=80,
            ),
        ),
        # Rewrite existing rows to match; the reverse step restores the keys.
        migrations.RunPython(update_report_names, backwards),
    ]


================================================
FILE: concordia/migrations/0079_auto_20230601_1234.py
================================================
# Generated by Django 3.2.18 on 2023-06-01 16:34

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine the four counter fields on ``userprofileactivity``.

    Each counter becomes an ``IntegerField`` defaulting to 0; the review and
    transcribe counters also get explicit verbose names.
    """

    dependencies = [
        ("concordia", "0078_alter_sitereport_report_name"),
    ]

    operations = [
        migrations.AlterField(
            model_name="userprofileactivity",
            name="asset_count",
            field=models.IntegerField(default=0),
        ),
        migrations.AlterField(
            model_name="userprofileactivity",
            name="asset_tag_count",
            field=models.IntegerField(default=0),
        ),
        migrations.AlterField(
            model_name="userprofileactivity",
            name="review_count",
            field=models.IntegerField(
                default=0, verbose_name="transcription review count"
            ),
        ),
        migrations.AlterField(
            model_name="userprofileactivity",
            name="transcribe_count",
            field=models.IntegerField(
                default=0, verbose_name="transcription save/submit count"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0080_auto_20230602_0920.py
================================================
# Generated by Django 3.2.19 on 2023-06-02 13:20

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the OCR provenance flags to ``transcription``."""

    dependencies = [
        ("concordia", "0079_auto_20230601_1234"),
    ]

    operations = [
        # Both flags default to False, so existing transcriptions are unmarked.
        migrations.AddField(
            model_name="transcription",
            name="ocr_generated",
            field=models.BooleanField(
                default=False,
                help_text="Flags transcription as generated directly by OCR",
            ),
        ),
        migrations.AddField(
            model_name="transcription",
            name="ocr_originated",
            field=models.BooleanField(
                default=False,
                help_text="Flags transcription as originated from an OCR transcription",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0081_sitereport_review_actions.py
================================================
# Generated by Django 3.2.19 on 2023-06-28 16:53

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the nullable ``review_actions`` integer field to ``sitereport``."""

    dependencies = [
        ("concordia", "0080_auto_20230602_0920"),
    ]

    operations = [
        # Nullable, so existing report rows need no backfill.
        migrations.AddField(
            model_name="sitereport",
            name="review_actions",
            field=models.IntegerField(blank=True, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0082_delete_userretiredcampaign.py
================================================
# Generated by Django 3.2.19 on 2023-07-10 13:06

from django.db import migrations


class Migration(migrations.Migration):
    """Delete the ``UserRetiredCampaign`` model."""

    dependencies = [
        ("concordia", "0081_sitereport_review_actions"),
    ]

    operations = [
        migrations.DeleteModel(
            name="UserRetiredCampaign",
        ),
    ]


================================================
FILE: concordia/migrations/0083_sitereport_daily_active_users.py
================================================
# Generated by Django 3.2.19 on 2023-07-10 14:47

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the nullable ``daily_active_users`` integer field to ``sitereport``."""

    dependencies = [
        ("concordia", "0082_delete_userretiredcampaign"),
    ]

    operations = [
        # Nullable, so existing report rows need no backfill.
        migrations.AddField(
            model_name="sitereport",
            name="daily_active_users",
            field=models.IntegerField(blank=True, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0084_rename_review_actions_sitereport_daily_review_actions.py
================================================
# Generated by Django 3.2.19 on 2023-07-21 14:36

from django.db import migrations


class Migration(migrations.Migration):
    """Rename ``sitereport.review_actions`` to ``daily_review_actions``."""

    dependencies = [
        ("concordia", "0083_sitereport_daily_active_users"),
    ]

    operations = [
        migrations.RenameField(
            model_name="sitereport",
            old_name="review_actions",
            new_name="daily_review_actions",
        ),
    ]


================================================
FILE: concordia/migrations/0085_auto_20231016_1432.py
================================================
# Generated by Django 3.2.22 on 2023-10-16 18:32

from django.db import migrations, models

import concordia.models


class Migration(migrations.Migration):
    """Redefine ``asset.storage_image`` with a 255-character path limit."""

    dependencies = [
        ("concordia", "0084_rename_review_actions_sitereport_daily_review_actions"),
    ]

    operations = [
        # upload_to references concordia.models.Asset.get_storage_path directly,
        # so that attribute must stay importable for this migration to load.
        migrations.AlterField(
            model_name="asset",
            name="storage_image",
            field=models.ImageField(
                max_length=255, upload_to=concordia.models.Asset.get_storage_path
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0086_auto_20231215_1311.py
================================================
# Generated by Django 3.2.23 on 2023-12-15 18:11

import django.contrib.auth.models
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the ``ConcordiaUser`` proxy model and two campaign flags."""

    dependencies = [
        ("auth", "0012_alter_user_first_name_max_length"),
        ("concordia", "0085_auto_20231016_1432"),
    ]

    operations = [
        # Proxy over auth.user: no fields of its own, only Django's UserManager.
        migrations.CreateModel(
            name="ConcordiaUser",
            fields=[],
            options={
                "proxy": True,
                "indexes": [],
                "constraints": [],
            },
            bases=("auth.user",),
            managers=[
                ("objects", django.contrib.auth.models.UserManager()),
            ],
        ),
        # Indexed boolean flags on campaign, both defaulting to False.
        migrations.AddField(
            model_name="campaign",
            name="next_review_campaign",
            field=models.BooleanField(blank=True, db_index=True, default=False),
        ),
        migrations.AddField(
            model_name="campaign",
            name="next_transcription_campaign",
            field=models.BooleanField(blank=True, db_index=True, default=False),
        ),
    ]


================================================
FILE: concordia/migrations/0087_auto_20240213_0756.py
================================================
# Generated by Django 3.2.23 on 2024-02-13 12:56

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Introduce the card/tutorial and guide models.

    Creates ``Card``, ``CardFamily``, ``Guide`` and ``TutorialCard``, deletes
    ``SimpleContentBlock``, links card families to cards through
    ``TutorialCard``, and adds an optional ``card_family`` to ``campaign``.
    """

    dependencies = [
        ("concordia", "0086_auto_20231215_1311"),
    ]

    operations = [
        migrations.CreateModel(
            name="Card",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("image_alt_text", models.TextField(blank=True)),
                (
                    "image",
                    models.ImageField(blank=True, null=True, upload_to="card_images"),
                ),
                ("title", models.CharField(max_length=80)),
                ("body_text", models.TextField(blank=True)),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True, null=True)),
                (
                    "display_heading",
                    models.CharField(blank=True, max_length=80, null=True),
                ),
            ],
            options={
                "ordering": ("title",),
            },
        ),
        migrations.CreateModel(
            name="CardFamily",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                (
                    "slug",
                    models.SlugField(allow_unicode=True, max_length=80, unique=True),
                ),
                ("default", models.BooleanField(default=False)),
            ],
            options={
                "verbose_name_plural": "card families",
            },
        ),
        migrations.CreateModel(
            name="Guide",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(max_length=80)),
                ("body", models.TextField(blank=True)),
                ("order", models.IntegerField(default=1)),
                ("link_text", models.CharField(blank=True, max_length=80, null=True)),
                ("link_url", models.CharField(blank=True, max_length=255, null=True)),
            ],
        ),
        # Through model joining a card family ("tutorial") to a card, with an
        # integer "order" column.
        migrations.CreateModel(
            name="TutorialCard",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("order", models.IntegerField(default=0)),
                (
                    "card",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE, to="concordia.card"
                    ),
                ),
                (
                    "tutorial",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.cardfamily",
                    ),
                ),
            ],
            options={
                "verbose_name_plural": "cards",
            },
        ),
        migrations.DeleteModel(
            name="SimpleContentBlock",
        ),
        # Added after TutorialCard exists because the M2M goes through it.
        migrations.AddField(
            model_name="cardfamily",
            name="cards",
            field=models.ManyToManyField(
                through="concordia.TutorialCard", to="concordia.Card"
            ),
        ),
        # NOTE(review): on_delete=CASCADE here means deleting a card family
        # also deletes every campaign that points at it -- confirm intended.
        migrations.AddField(
            model_name="campaign",
            name="card_family",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                to="concordia.cardfamily",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0088_alter_simplepage_body.py
================================================
# Generated by Django 3.2.24 on 2024-02-21 18:37

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``simplepage.body`` as an optional, nullable ``TextField``."""

    dependencies = [
        ("concordia", "0087_auto_20240213_0756"),
    ]

    operations = [
        migrations.AlterField(
            model_name="simplepage",
            name="body",
            field=models.TextField(blank=True, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0089_campaign_image_alt_text.py
================================================
# Generated by Django 3.2.24 on 2024-02-26 14:13

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional ``image_alt_text`` field to ``campaign``."""

    dependencies = [
        ("concordia", "0088_alter_simplepage_body"),
    ]

    operations = [
        # Nullable, so existing campaigns need no backfill.
        migrations.AddField(
            model_name="campaign",
            name="image_alt_text",
            field=models.TextField(blank=True, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0090_auto_20240408_1334.py
================================================
# Generated by Django 3.2.25 on 2024-04-09 15:25

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add a ``disable_ocr`` flag to ``asset``, ``campaign``, ``item`` and ``project``.

    Every flag defaults to False.
    """

    dependencies = [
        ("concordia", "0089_campaign_image_alt_text"),
    ]

    operations = [
        migrations.AddField(
            model_name="asset",
            name="disable_ocr",
            field=models.BooleanField(
                default=False, help_text="Turn OCR off for this asset"
            ),
        ),
        migrations.AddField(
            model_name="campaign",
            name="disable_ocr",
            field=models.BooleanField(
                default=False, help_text="Turn OCR off for all assets of this campaign"
            ),
        ),
        migrations.AddField(
            model_name="item",
            name="disable_ocr",
            field=models.BooleanField(
                default=False, help_text="Turn OCR off for all assets of this item"
            ),
        ),
        migrations.AddField(
            model_name="project",
            name="disable_ocr",
            field=models.BooleanField(
                default=False, help_text="Turn OCR off for all assets of this project"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0091_guide_simple_page.py
================================================
# Generated by Django 4.2.13 on 2024-05-09 19:21

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional ``page`` foreign key from ``guide`` to ``simplepage``."""

    dependencies = [
        ("concordia", "0090_auto_20240408_1334"),
    ]

    operations = [
        # SET_NULL: deleting the page clears guide.page and keeps the guide.
        migrations.AddField(
            model_name="guide",
            name="page",
            field=models.ForeignKey(
                blank=True,
                null=True,
                on_delete=django.db.models.deletion.SET_NULL,
                to="concordia.simplepage",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0092_auto_20240509_1522.py
================================================
# Generated by Django 4.2.13 on 2024-05-09 19:22

from django.db import migrations


def set_simplepages(apps, schema_editor):
    """Link each ``Guide`` to the ``SimplePage`` that has the same title.

    A guide with no matching page is left untouched rather than aborting the
    migration with ``DoesNotExist``; ``Guide.page`` is nullable, so an unlinked
    guide is a valid state. If several pages share the title, the first one in
    the model's default ordering is used instead of failing with
    ``MultipleObjectsReturned``.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython``; its connection
            alias selects the database being migrated.
    """
    SimplePage = apps.get_model("concordia", "SimplePage")
    Guide = apps.get_model("concordia", "Guide")
    # Operate on the database that is actually being migrated rather than
    # always on the default connection.
    db_alias = schema_editor.connection.alias
    pages = SimplePage.objects.using(db_alias)
    for guide in Guide.objects.using(db_alias).all():
        page = pages.filter(title=guide.title).first()
        if page is None:
            # Nothing to link; leave the guide as it is.
            continue
        guide.page = page
        guide.save()


def backwards(apps, schema_editor):
    """Clear ``Guide.page`` on every guide, undoing the forward linking step.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython``; its connection
            alias selects the database being migrated.
    """
    Guide = apps.get_model("concordia", "Guide")
    # Operate on the database that is actually being migrated rather than
    # always on the default connection.
    db_alias = schema_editor.connection.alias
    # A single UPDATE replaces loading and saving every guide row.
    Guide.objects.using(db_alias).update(page=None)


class Migration(migrations.Migration):
    """Data migration that populates ``guide.page`` via ``set_simplepages``."""

    dependencies = [
        ("concordia", "0091_guide_simple_page"),
    ]

    operations = [
        # Reversible: the backwards step clears guide.page again.
        migrations.RunPython(set_simplepages, backwards),
    ]


================================================
FILE: concordia/migrations/0093_asset_campaign.py
================================================
# Generated by Django 4.2.13 on 2024-06-17 17:13

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add a nullable ``campaign`` foreign key to ``asset``."""

    dependencies = [
        ("concordia", "0092_auto_20240509_1522"),
    ]

    operations = [
        # Added as nullable so existing asset rows need no value yet.
        migrations.AddField(
            model_name="asset",
            name="campaign",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                to="concordia.campaign",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0094_alter_asset_campaign.py
================================================
# Generated by Django 4.2.13 on 2024-06-17 17:13

import django.db.models.deletion
from django.db import migrations, models


def set_field_values(apps, schema_editor):
    """Backfill ``Asset.campaign`` from each asset's item -> project -> campaign.

    Assets are streamed from the database and written back in fixed-size
    batches so that only one batch is held in memory at a time. Reads and
    writes both go through the connection being migrated.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython``; its connection
            alias selects the database being migrated.
    """
    Asset = apps.get_model("concordia", "asset")
    db_alias = schema_editor.connection.alias
    # Used for both the read chunk size and the write batch size.
    batch_size = 10000
    assets = (
        Asset.objects.using(db_alias)
        .select_related("item__project__campaign")
        .only("item__project__campaign", "campaign")
        .iterator(chunk_size=batch_size)
    )

    pending = []
    for asset in assets:
        # Can't use an F object across tables
        # using update/bulk_update, so we have
        # to loop through all of them
        asset.campaign = asset.item.project.campaign
        pending.append(asset)
        # To avoid running out of memory, we only
        # keep one batch of assets in memory at a time
        if len(pending) >= batch_size:
            # Write to the same database the rows were read from.
            Asset.objects.using(db_alias).bulk_update(pending, ["campaign"])
            pending = []
    if pending:
        Asset.objects.using(db_alias).bulk_update(pending, ["campaign"])


def revert_field_values(apps, schema_editor):
    """Reverse step for the campaign backfill: intentionally does nothing.

    The data cannot actually be reverted, and it does not need to be; this
    function exists only so that the migration can be reversed.
    """
    return None


class Migration(migrations.Migration):
    """Backfill ``asset.campaign`` and then make the column non-nullable."""

    dependencies = [
        ("concordia", "0093_asset_campaign"),
    ]

    operations = [
        # The backfill must run first: the AlterField below drops null=True.
        # NOTE(review): Django's migration docs warn that on PostgreSQL,
        # combining RunPython data changes with schema changes in one
        # migration can fail with "pending trigger events" -- confirm this
        # applies cleanly in every environment.
        migrations.RunPython(set_field_values, revert_field_values),
        migrations.AlterField(
            model_name="asset",
            name="campaign",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.campaign"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0095_transcription_rolled_back_and_more.py
================================================
# Generated by Django 4.2.13 on 2024-06-26 23:26

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the ``rolled_back`` and ``rolled_forward`` flags to ``transcription``."""

    dependencies = [
        ("concordia", "0094_alter_asset_campaign"),
    ]

    operations = [
        # Both flags default to False, so existing transcriptions are unmarked.
        migrations.AddField(
            model_name="transcription",
            name="rolled_back",
            field=models.BooleanField(
                default=False,
                help_text="Flags transcription as being the result of a rollback (undo)",
            ),
        ),
        migrations.AddField(
            model_name="transcription",
            name="rolled_forward",
            field=models.BooleanField(
                default=False,
                help_text="Flags transcription as being the result of a rollforward (redo)",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0096_transcription_source.py
================================================
# Generated by Django 4.2.13 on 2024-06-26 23:41

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional self-referential ``source`` key to ``transcription``."""

    dependencies = [
        ("concordia", "0095_transcription_rolled_back_and_more"),
    ]

    operations = [
        # Points at another transcription; the reverse accessor is "source_of".
        # on_delete=CASCADE: deleting the source transcription also deletes
        # the transcriptions that reference it.
        migrations.AddField(
            model_name="transcription",
            name="source",
            field=models.ForeignKey(
                blank=True,
                help_text="The transcription source for the roll back or roll forward",
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                related_name="source_of",
                to="concordia.transcription",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0097_alter_sitereport_options_userprofile_review_count_and_more.py
================================================
# Generated by Django 4.2.13 on 2024-07-29 17:30

import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Update ``sitereport`` ordering options and extend ``userprofile``.

    Adds ``review_count`` and ``transcribe_count`` to ``userprofile`` and
    redefines ``userprofile.user`` as a one-to-one link with the reverse
    accessor ``profile``.
    """

    dependencies = [
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0096_transcription_source"),
    ]

    operations = [
        # Newest-first default ordering; latest() resolves by created_on.
        migrations.AlterModelOptions(
            name="sitereport",
            options={"get_latest_by": "created_on", "ordering": ("-created_on",)},
        ),
        # Both counters start at 0 for existing profiles.
        migrations.AddField(
            model_name="userprofile",
            name="review_count",
            field=models.IntegerField(
                default=0, verbose_name="transcription review count"
            ),
        ),
        migrations.AddField(
            model_name="userprofile",
            name="transcribe_count",
            field=models.IntegerField(
                default=0, verbose_name="transcription save/submit count"
            ),
        ),
        migrations.AlterField(
            model_name="userprofile",
            name="user",
            field=models.OneToOneField(
                on_delete=django.db.models.deletion.CASCADE,
                related_name="profile",
                to=settings.AUTH_USER_MODEL,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0098_userprofile_create_and_population.py
================================================
# Generated by Django 4.2.13 on 2024-07-29 17:40

from django.conf import settings
from django.db import migrations


def create_and_populate_profiles(apps, schema_editor):
    """Ensure every user has a ``UserProfile`` holding their activity totals.

    For each user, the profile is fetched or created and its
    ``transcribe_count`` and ``review_count`` are set to the sums of the
    matching counters over the user's ``userprofileactivity_set`` rows.

    The totals are assigned rather than added onto the stored values. The
    reverse step does nothing, so reversing and re-applying this migration
    would otherwise double every count.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython``; its connection
            alias selects the database being migrated.
    """
    User = apps.get_model("auth", "User")
    UserProfile = apps.get_model("concordia", "UserProfile")
    db_alias = schema_editor.connection.alias
    for user in User.objects.using(db_alias).all().iterator(chunk_size=10000):
        profile, _created = UserProfile.objects.using(db_alias).get_or_create(user=user)
        transcribe_total = 0
        review_total = 0
        for activity in user.userprofileactivity_set.all():
            transcribe_total += activity.transcribe_count
            review_total += activity.review_count
        # Overwrite instead of incrementing so re-running is idempotent.
        profile.transcribe_count = transcribe_total
        profile.review_count = review_total
        profile.save()


def revert_create_and_populate_profiles(apps, schema_editor):
    """Reverse step for the profile population: intentionally does nothing.

    The data cannot be restored to its earlier state, and it does not need to
    be; this function exists only so that the migration can be reversed.
    """
    return None


class Migration(migrations.Migration):
    """Data migration that creates and populates user profiles."""

    dependencies = [
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        (
            "concordia",
            "0097_alter_sitereport_options_userprofile_review_count_and_more",
        ),
    ]

    operations = [
        # Reversible in name only: the reverse callable leaves the data as is.
        migrations.RunPython(
            create_and_populate_profiles, revert_create_and_populate_profiles
        ),
    ]


================================================
FILE: concordia/migrations/0099_alter_campaign_display_on_homepage_and_more.py
================================================
# Generated by Django 4.2.16 on 2024-11-01 17:49

from django.db import migrations, models


class Migration(migrations.Migration):
    """Give three ``campaign`` boolean fields short verbose names."""

    dependencies = [
        ("concordia", "0098_userprofile_create_and_population"),
    ]

    operations = [
        migrations.AlterField(
            model_name="campaign",
            name="display_on_homepage",
            field=models.BooleanField(default=True, verbose_name="Homepage"),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="next_review_campaign",
            field=models.BooleanField(
                blank=True, db_index=True, default=False, verbose_name="Next-rev."
            ),
        ),
        migrations.AlterField(
            model_name="campaign",
            name="next_transcription_campaign",
            field=models.BooleanField(
                blank=True, db_index=True, default=False, verbose_name="Next-tran."
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0100_researchcenter.py
================================================
# Generated by Django 4.2.16 on 2024-11-19 17:15

from django.db import migrations, models


class Migration(migrations.Migration):
    """Create the ``ResearchCenter`` model (auto ``id`` plus an 80-char ``title``)."""

    dependencies = [
        ("concordia", "0099_alter_campaign_display_on_homepage_and_more"),
    ]

    operations = [
        migrations.CreateModel(
            name="ResearchCenter",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("title", models.CharField(max_length=80)),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0101_auto_20241119_1215.py
================================================
# Generated by Django 4.2.16 on 2024-11-19 17:15

from django.db import migrations

# Titles of the research centers seeded by this migration. Both the forward
# and the reverse step read this tuple so they cannot drift apart.
TITLES = (
    "American Folklife Center",
    "Law Library",
    "Manuscript",
    "Performing Arts",
    "Rare Book",
)


def forwards_func(apps, schema_editor):
    """Create one ``ResearchCenter`` row for each title in ``TITLES``.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython``; its connection
            alias selects the database being migrated.
    """
    # create initial data
    ResearchCenter = apps.get_model("concordia", "ResearchCenter")
    db_alias = schema_editor.connection.alias
    ResearchCenter.objects.using(db_alias).bulk_create(
        [ResearchCenter(title=title) for title in TITLES]
    )


def reverse_func(apps, schema_editor):
    """Delete the ``ResearchCenter`` rows whose title appears in ``TITLES``."""
    center_model = apps.get_model("concordia", "ResearchCenter")
    alias = schema_editor.connection.alias
    for seeded_title in TITLES:
        matching = center_model.objects.using(alias).filter(title=seeded_title)
        matching.delete()


class Migration(migrations.Migration):
    """Data migration that seeds the initial ``ResearchCenter`` rows."""

    dependencies = [
        ("concordia", "0100_researchcenter"),
    ]

    # Reversible: the reverse callable deletes the rows matching TITLES.
    operations = [migrations.RunPython(forwards_func, reverse_func)]


================================================
FILE: concordia/migrations/0102_campaign_research_centers.py
================================================
# Generated by Django 4.2.16 on 2024-11-20 12:06

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional ``research_centers`` many-to-many to ``campaign``."""

    dependencies = [
        ("concordia", "0101_auto_20241119_1215"),
    ]

    operations = [
        migrations.AddField(
            model_name="campaign",
            name="research_centers",
            field=models.ManyToManyField(blank=True, to="concordia.researchcenter"),
        ),
    ]


================================================
FILE: concordia/migrations/0103_alter_item_title.py
================================================
# Generated by Django 4.2.16 on 2024-12-16 18:03

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``item.title`` as a ``CharField`` with ``max_length=700``."""

    dependencies = [
        ("concordia", "0102_campaign_research_centers"),
    ]

    operations = [
        migrations.AlterField(
            model_name="item",
            name="title",
            field=models.CharField(max_length=700),
        ),
    ]


================================================
FILE: concordia/migrations/0104_nexttranscribabletopicasset_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-04-04 18:55

import uuid

import django.contrib.postgres.fields
import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Create the four "next asset" models.

    The models are NextTranscribableTopicAsset, NextTranscribableCampaignAsset,
    NextReviewableTopicAsset and NextReviewableCampaignAsset. All four share a
    UUID primary key, ``item_item_id``, ``project_slug``, ``sequence``,
    ``created_on``, a one-to-one link to Asset and foreign keys to Item and
    Project. The topic variants add a foreign key to Topic and the campaign
    variants a foreign key to Campaign. The transcribable variants store a
    ``transcription_status``; the reviewable variants store an integer array
    of ``transcriber_ids``.
    """

    dependencies = [
        ("concordia", "0103_alter_item_title"),
    ]

    operations = [
        # Transcribable asset entry scoped to a topic.
        migrations.CreateModel(
            name="NextTranscribableTopicAsset",
            fields=[
                (
                    "id",
                    models.UUIDField(
                        default=uuid.uuid4,
                        editable=False,
                        primary_key=True,
                        serialize=False,
                    ),
                ),
                ("item_item_id", models.CharField(max_length=100)),
                ("project_slug", models.SlugField(allow_unicode=True, max_length=80)),
                ("sequence", models.PositiveIntegerField(default=1)),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                (
                    "transcription_status",
                    models.CharField(
                        choices=[
                            ("not_started", "Not Started"),
                            ("in_progress", "In Progress"),
                            ("submitted", "Needs Review"),
                            ("completed", "Completed"),
                        ],
                        db_index=True,
                        default="not_started",
                        editable=False,
                        max_length=20,
                    ),
                ),
                (
                    "asset",
                    models.OneToOneField(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.asset",
                    ),
                ),
                (
                    "item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE, to="concordia.item"
                    ),
                ),
                (
                    "project",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.project",
                    ),
                ),
                (
                    "topic",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.topic",
                    ),
                ),
            ],
            options={
                "abstract": False,
            },
        ),
        # Transcribable asset entry scoped to a campaign.
        migrations.CreateModel(
            name="NextTranscribableCampaignAsset",
            fields=[
                (
                    "id",
                    models.UUIDField(
                        default=uuid.uuid4,
                        editable=False,
                        primary_key=True,
                        serialize=False,
                    ),
                ),
                ("item_item_id", models.CharField(max_length=100)),
                ("project_slug", models.SlugField(allow_unicode=True, max_length=80)),
                ("sequence", models.PositiveIntegerField(default=1)),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                (
                    "transcription_status",
                    models.CharField(
                        choices=[
                            ("not_started", "Not Started"),
                            ("in_progress", "In Progress"),
                            ("submitted", "Needs Review"),
                            ("completed", "Completed"),
                        ],
                        db_index=True,
                        default="not_started",
                        editable=False,
                        max_length=20,
                    ),
                ),
                (
                    "asset",
                    models.OneToOneField(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.asset",
                    ),
                ),
                (
                    "campaign",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.campaign",
                    ),
                ),
                (
                    "item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE, to="concordia.item"
                    ),
                ),
                (
                    "project",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.project",
                    ),
                ),
            ],
            options={
                "abstract": False,
            },
        ),
        # Reviewable asset entry scoped to a topic.
        migrations.CreateModel(
            name="NextReviewableTopicAsset",
            fields=[
                (
                    "id",
                    models.UUIDField(
                        default=uuid.uuid4,
                        editable=False,
                        primary_key=True,
                        serialize=False,
                    ),
                ),
                ("item_item_id", models.CharField(max_length=100)),
                ("project_slug", models.SlugField(allow_unicode=True, max_length=80)),
                ("sequence", models.PositiveIntegerField(default=1)),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                (
                    "transcriber_ids",
                    django.contrib.postgres.fields.ArrayField(
                        base_field=models.IntegerField(),
                        blank=True,
                        default=list,
                        size=None,
                    ),
                ),
                (
                    "asset",
                    models.OneToOneField(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.asset",
                    ),
                ),
                (
                    "item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE, to="concordia.item"
                    ),
                ),
                (
                    "project",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.project",
                    ),
                ),
                (
                    "topic",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.topic",
                    ),
                ),
            ],
            options={
                "abstract": False,
            },
        ),
        # Reviewable asset entry scoped to a campaign.
        migrations.CreateModel(
            name="NextReviewableCampaignAsset",
            fields=[
                (
                    "id",
                    models.UUIDField(
                        default=uuid.uuid4,
                        editable=False,
                        primary_key=True,
                        serialize=False,
                    ),
                ),
                ("item_item_id", models.CharField(max_length=100)),
                ("project_slug", models.SlugField(allow_unicode=True, max_length=80)),
                ("sequence", models.PositiveIntegerField(default=1)),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                (
                    "transcriber_ids",
                    django.contrib.postgres.fields.ArrayField(
                        base_field=models.IntegerField(),
                        blank=True,
                        default=list,
                        size=None,
                    ),
                ),
                (
                    "asset",
                    models.OneToOneField(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.asset",
                    ),
                ),
                (
                    "campaign",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.campaign",
                    ),
                ),
                (
                    "item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE, to="concordia.item"
                    ),
                ),
                (
                    "project",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.project",
                    ),
                ),
            ],
            options={
                "abstract": False,
            },
        ),
    ]


================================================
FILE: concordia/migrations/0105_nextreviewablecampaignasset_concordia_n_transcr_aafdba_gin_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-04-04 19:09

import django.contrib.postgres.indexes
from django.db import migrations


class Migration(migrations.Migration):
    """Add GIN indexes on ``transcriber_ids`` for both reviewable-asset models."""

    dependencies = [
        ("concordia", "0104_nexttranscribabletopicasset_and_more"),
    ]

    operations = [
        # Index the transcriber_ids array on the campaign-scoped model.
        migrations.AddIndex(
            model_name="nextreviewablecampaignasset",
            index=django.contrib.postgres.indexes.GinIndex(
                fields=["transcriber_ids"], name="concordia_n_transcr_aafdba_gin"
            ),
        ),
        # Index the transcriber_ids array on the topic-scoped model.
        migrations.AddIndex(
            model_name="nextreviewabletopicasset",
            index=django.contrib.postgres.indexes.GinIndex(
                fields=["transcriber_ids"], name="concordia_n_transcr_415832_gin"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0106_alter_nextreviewablecampaignasset_options_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-04-09 17:44

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Adjust options, asset relations and uniqueness on the next-asset models.

    * All four models get ``get_latest_by="created_on"`` and a default
      ordering of ``-created_on``.
    * ``asset`` on the two reviewable models is redefined as a ForeignKey.
    * The two topic-scoped models become unique on ``(asset, topic)``.
    """

    dependencies = [
        (
            "concordia",
            "0105_nextreviewablecampaignasset_concordia_n_transcr_aafdba_gin_and_more",
        ),
    ]

    operations = [
        # Model Meta options: state-level ordering / get_latest_by settings.
        migrations.AlterModelOptions(
            name="nextreviewablecampaignasset",
            options={"get_latest_by": "created_on", "ordering": ("-created_on",)},
        ),
        migrations.AlterModelOptions(
            name="nextreviewabletopicasset",
            options={"get_latest_by": "created_on", "ordering": ("-created_on",)},
        ),
        migrations.AlterModelOptions(
            name="nexttranscribablecampaignasset",
            options={"get_latest_by": "created_on", "ordering": ("-created_on",)},
        ),
        migrations.AlterModelOptions(
            name="nexttranscribabletopicasset",
            options={"get_latest_by": "created_on", "ordering": ("-created_on",)},
        ),
        # Redefine the asset relation on the reviewable models as a ForeignKey.
        migrations.AlterField(
            model_name="nextreviewablecampaignasset",
            name="asset",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.asset"
            ),
        ),
        migrations.AlterField(
            model_name="nextreviewabletopicasset",
            name="asset",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.asset"
            ),
        ),
        # Each (asset, topic) pair may appear at most once per topic model.
        migrations.AlterUniqueTogether(
            name="nextreviewabletopicasset",
            unique_together={("asset", "topic")},
        ),
        migrations.AlterUniqueTogether(
            name="nexttranscribabletopicasset",
            unique_together={("asset", "topic")},
        ),
    ]


================================================
FILE: concordia/migrations/0107_alter_nextreviewablecampaignasset_options_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-04-09 17:50

from django.db import migrations


class Migration(migrations.Migration):
    """
    Switch the default ordering of all four next-asset models to ascending
    ``created_on`` while keeping ``get_latest_by="created_on"``.
    """

    dependencies = [
        ("concordia", "0106_alter_nextreviewablecampaignasset_options_and_more"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="nextreviewablecampaignasset",
            options={"get_latest_by": "created_on", "ordering": ("created_on",)},
        ),
        migrations.AlterModelOptions(
            name="nextreviewabletopicasset",
            options={"get_latest_by": "created_on", "ordering": ("created_on",)},
        ),
        migrations.AlterModelOptions(
            name="nexttranscribablecampaignasset",
            options={"get_latest_by": "created_on", "ordering": ("created_on",)},
        ),
        migrations.AlterModelOptions(
            name="nexttranscribabletopicasset",
            options={"get_latest_by": "created_on", "ordering": ("created_on",)},
        ),
    ]


================================================
FILE: concordia/migrations/0108_add_next_asset_cache_periodic_task.py
================================================
# Generated by Django 4.2.16 on 2025-04-10 13:52

from django.db import migrations


def add_renew_next_asset_cache_task(apps, schema_editor):
    """
    Create or refresh the "Renew next asset cache" periodic task.

    A one-hour IntervalSchedule is fetched (or created), then the PeriodicTask
    with that name is created or updated so it points at
    ``concordia.tasks.renew_next_asset_cache`` on that schedule and is enabled.
    """
    task_model = apps.get_model("django_celery_beat", "PeriodicTask")
    interval_model = apps.get_model("django_celery_beat", "IntervalSchedule")

    # get_or_create returns (object, created); only the schedule is needed.
    hourly = interval_model.objects.get_or_create(every=1, period="hours")[0]

    task_fields = {
        "interval": hourly,
        "task": "concordia.tasks.renew_next_asset_cache",
        "enabled": True,
        "description": (
            "Run every hour to refresh cache of transcribable and reviewable assets"
        ),
    }
    # The task name is the lookup key; everything else is (re)applied.
    task_model.objects.update_or_create(
        name="Renew next asset cache", defaults=task_fields
    )


def remove_renew_next_asset_cache_task(apps, schema_editor):
    """Reverse step: delete the periodic task named "Renew next asset cache"."""
    task_model = apps.get_model("django_celery_beat", "PeriodicTask")
    matching_tasks = task_model.objects.filter(name="Renew next asset cache")
    matching_tasks.delete()


class Migration(migrations.Migration):
    """Data migration registering the "Renew next asset cache" periodic task."""

    # Depends on django_celery_beat because the callables load its
    # PeriodicTask and IntervalSchedule models through the app registry.
    dependencies = [
        ("concordia", "0107_alter_nextreviewablecampaignasset_options_and_more"),
        ("django_celery_beat", "0019_alter_periodictasks_options"),
    ]

    operations = [
        # Forward adds/updates the task; reverse deletes it by name.
        migrations.RunPython(
            add_renew_next_asset_cache_task,
            reverse_code=remove_renew_next_asset_cache_task,
        ),
    ]


================================================
FILE: concordia/migrations/0109_alter_nextreviewablecampaignasset_asset_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-04-10 19:19

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Redefine two ``asset`` relations on the next-asset models:
    NextReviewableCampaignAsset.asset becomes a OneToOneField and
    NextTranscribableTopicAsset.asset becomes a ForeignKey.
    """

    dependencies = [
        ("concordia", "0108_add_next_asset_cache_periodic_task"),
    ]

    operations = [
        migrations.AlterField(
            model_name="nextreviewablecampaignasset",
            name="asset",
            field=models.OneToOneField(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.asset"
            ),
        ),
        migrations.AlterField(
            model_name="nexttranscribabletopicasset",
            name="asset",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.asset"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0110_remove_asset_media_url_alter_asset_storage_image.py
================================================
# Generated by Django 4.2.20 on 2025-04-23 19:22

import storages.backends.s3
from django.db import migrations, models

import concordia.models


class Migration(migrations.Migration):
    """
    Drop ``Asset.media_url`` and redefine ``Asset.storage_image`` as an
    ImageField stored through S3Storage with query-string auth disabled.
    """

    dependencies = [
        ("concordia", "0109_alter_nextreviewablecampaignasset_asset_and_more"),
    ]

    operations = [
        migrations.RemoveField(
            model_name="asset",
            name="media_url",
        ),
        migrations.AlterField(
            model_name="asset",
            name="storage_image",
            field=models.ImageField(
                max_length=255,
                storage=storages.backends.s3.S3Storage(querystring_auth=False),
                # Upload path is computed by Asset.get_storage_path.
                upload_to=concordia.models.Asset.get_storage_path,
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0111_auto_20250428_1023.py
================================================
# Generated by Django 4.2.20 on 2025-04-28 14:23

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    State-only migration that introduces ``ProjectTopic`` as the explicit
    ``through`` model for ``Project.topics``.

    ProjectTopic is mapped onto the ``concordia_project_topics`` table and no
    database operations are issued.
    """

    dependencies = [
        ("concordia", "0110_remove_asset_media_url_alter_asset_storage_image"),
    ]

    operations = [
        # We need to update Django so it knows about our intermediate
        # model, but since we're re-using the existing intermediate
        # table, we don't want to change anything in the database itself
        migrations.SeparateDatabaseAndState(
            database_operations=[],  # No DB changes, only Django state
            state_operations=[
                migrations.CreateModel(
                    name="ProjectTopic",
                    fields=[
                        (
                            "id",
                            models.AutoField(
                                auto_created=True,
                                primary_key=True,
                                serialize=False,
                                verbose_name="ID",
                            ),
                        ),
                        (
                            "project",
                            models.ForeignKey(
                                on_delete=models.CASCADE, to="concordia.project"
                            ),
                        ),
                        (
                            "topic",
                            models.ForeignKey(
                                on_delete=models.CASCADE, to="concordia.topic"
                            ),
                        ),
                    ],
                    options={
                        # Explicit table name so the model maps onto this table.
                        "db_table": "concordia_project_topics",
                        "unique_together": {("project", "topic")},
                    },
                ),
                # Point Project.topics at the explicit through model.
                migrations.AlterField(
                    model_name="project",
                    name="topics",
                    field=models.ManyToManyField(
                        to="concordia.Topic",
                        through="concordia.ProjectTopic",
                    ),
                ),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0112_projecttopic_url_filter_alter_projecttopic_id.py
================================================
# Generated by Django 4.2.20 on 2025-04-28 14:26

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional ``url_filter`` status choice field to ProjectTopic."""

    dependencies = [
        ("concordia", "0111_auto_20250428_1023"),
    ]

    operations = [
        # Nullable and blank-able, so existing rows need no default value.
        migrations.AddField(
            model_name="projecttopic",
            name="url_filter",
            field=models.CharField(
                blank=True,
                null=True,
                max_length=20,
                choices=[
                    ("not_started", "Not Started"),
                    ("in_progress", "In Progress"),
                    ("submitted", "Needs Review"),
                    ("completed", "Completed"),
                ],
                help_text="Optional filter on the status for this project-topic link",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0113_create_asset_status_periodic_task.py
================================================
# Generated by Django 4.2.21 on 2025-06-05 14:03

from django.db import migrations


def create_asset_status_task(apps, schema_editor):
    """
    Register the periodic task that fills the asset status visualization cache.

    A five-minute IntervalSchedule is fetched (or created) and a PeriodicTask
    named "Populate asset status visualization cache" is created on that
    schedule if no task with that name exists yet. An existing task with the
    same name is left untouched.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython`` (unused).
    """
    IntervalSchedule = apps.get_model("django_celery_beat", "IntervalSchedule")
    PeriodicTask = apps.get_model("django_celery_beat", "PeriodicTask")

    # Ensure an IntervalSchedule of every 5 minutes exists (or get it).
    interval, _ = IntervalSchedule.objects.get_or_create(
        every=5,
        period="minutes",
    )

    # Look the task up by name only. django-celery-beat declares
    # PeriodicTask.name as unique, so also matching on task/interval would
    # miss an existing row whose schedule or task path differs and then fail
    # with an IntegrityError on the INSERT.
    PeriodicTask.objects.get_or_create(
        name="Populate asset status visualization cache",
        defaults={
            "task": "concordia.tasks.populate_asset_status_visualization_cache",
            "interval": interval,
            "enabled": True,
            "description": (
                "Populates the cache for the asset-status-overview and "
                "asset-status-by-campaign visualizations"
            ),
        },
    )


def delete_asset_status_task(apps, schema_editor):
    """Reverse step: remove the asset status visualization periodic task."""
    task_model = apps.get_model("django_celery_beat", "PeriodicTask")
    # Matches on the exact task name, nothing else.
    task_name = "Populate asset status visualization cache"
    matching_tasks = task_model.objects.filter(name=task_name)
    matching_tasks.delete()


class Migration(migrations.Migration):
    """Data migration registering the asset status visualization periodic task."""

    # Depends on django_celery_beat because the callables load its
    # IntervalSchedule and PeriodicTask models through the app registry.
    dependencies = [
        ("concordia", "0112_projecttopic_url_filter_alter_projecttopic_id"),
        ("django_celery_beat", "0019_alter_periodictasks_options"),
    ]

    operations = [
        # Forward creates the task; reverse deletes it by name.
        migrations.RunPython(create_asset_status_task, delete_asset_status_task),
    ]


================================================
FILE: concordia/migrations/0114_create_daily_activity_periodic_task.py
================================================
# Generated by Django 4.2.21 on 2025-06-05 14:10

from django.db import migrations


def create_daily_activity_task(apps, schema_editor):
    """
    Register the periodic task that fills the daily activity visualization cache.

    A CrontabSchedule for 04:00 every day in the America/New_York timezone is
    fetched (or created) and a PeriodicTask named "Populate daily activity
    visualization cache" is created on that schedule if no task with that name
    exists yet. An existing task with the same name is left untouched.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor supplied by ``RunPython`` (unused).
    """
    CrontabSchedule = apps.get_model("django_celery_beat", "CrontabSchedule")
    PeriodicTask = apps.get_model("django_celery_beat", "PeriodicTask")

    # Ensure a CrontabSchedule for daily at 4:00 AM exists.
    crontab, _ = CrontabSchedule.objects.get_or_create(
        minute="0",
        hour="4",
        day_of_week="*",
        day_of_month="*",
        month_of_year="*",
        timezone="America/New_York",
    )

    # Look the task up by name only. django-celery-beat declares
    # PeriodicTask.name as unique, so also matching on task/crontab would
    # miss an existing row whose schedule or task path differs and then fail
    # with an IntegrityError on the INSERT.
    PeriodicTask.objects.get_or_create(
        name="Populate daily activity visualization cache",
        defaults={
            "task": "concordia.tasks.populate_daily_activity_visualization_cache",
            "crontab": crontab,
            "enabled": True,
            "description": "Populates the cache for the daily-activity visualization",
        },
    )


def delete_daily_activity_task(apps, schema_editor):
    """Reverse step: remove the daily activity visualization periodic task."""
    task_model = apps.get_model("django_celery_beat", "PeriodicTask")
    task_name = "Populate daily activity visualization cache"
    matching_tasks = task_model.objects.filter(name=task_name)
    matching_tasks.delete()


class Migration(migrations.Migration):
    """Data migration registering the daily activity visualization periodic task."""

    # Depends on django_celery_beat because the callables load its
    # CrontabSchedule and PeriodicTask models through the app registry.
    dependencies = [
        ("concordia", "0113_create_asset_status_periodic_task"),
        ("django_celery_beat", "0019_alter_periodictasks_options"),
    ]

    operations = [
        # Forward creates the task; reverse deletes it by name.
        migrations.RunPython(create_daily_activity_task, delete_daily_activity_task),
    ]


================================================
FILE: concordia/migrations/0115_alter_asset_storage_image_alter_banner_link_and_more.py
================================================
# Generated by Django 4.2.22 on 2025-06-16 13:24

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``Banner.link`` as an optional, nullable 255-character CharField."""

    dependencies = [
        ("concordia", "0114_create_daily_activity_periodic_task"),
    ]

    operations = [
        migrations.AlterField(
            model_name="banner",
            name="link",
            field=models.CharField(blank=True, max_length=255, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0116_item_thumbnail_image.py
================================================
# Generated by Django 4.2.22 on 2025-08-13 17:43

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional ``thumbnail_image`` ImageField to Item."""

    dependencies = [
        ("concordia", "0115_alter_asset_storage_image_alter_banner_link_and_more"),
    ]

    operations = [
        # Nullable and blank-able; files are uploaded under "item-thumbnails".
        migrations.AddField(
            model_name="item",
            name="thumbnail_image",
            field=models.ImageField(blank=True, null=True, upload_to="item-thumbnails"),
        ),
    ]


================================================
FILE: concordia/migrations/0117_alter_projecttopic_options_projecttopic_ordering.py
================================================
# Generated by Django 4.2.22 on 2025-08-25 18:39

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Add an integer ``ordering`` field (default 0) to ProjectTopic and make it
    the model's default sort key.
    """

    dependencies = [
        ("concordia", "0116_item_thumbnail_image"),
    ]

    operations = [
        # The Meta option is declared first; the field it names is added by
        # the next operation in this same migration.
        migrations.AlterModelOptions(
            name="projecttopic",
            options={"ordering": ("ordering",)},
        ),
        migrations.AddField(
            model_name="projecttopic",
            name="ordering",
            field=models.IntegerField(
                default=0,
                help_text="Sort order override: lower values will be listed first",
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0118_asset_concordia_a_item_id_f10916_idx_and_more.py
================================================
# Generated by Django 4.2.22 on 2025-08-26 13:27

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Add composite indexes: one on Asset, one on Project and three on
    ProjectTopic (all three ProjectTopic indexes lead with ``topic``).
    """

    dependencies = [
        ("concordia", "0117_alter_projecttopic_options_projecttopic_ordering"),
    ]

    operations = [
        # Asset: (item, published, transcription_status)
        migrations.AddIndex(
            model_name="asset",
            index=models.Index(
                fields=["item", "published", "transcription_status"],
                name="concordia_a_item_id_f10916_idx",
            ),
        ),
        # Project: (published, campaign, title)
        migrations.AddIndex(
            model_name="project",
            index=models.Index(
                fields=["published", "campaign", "title"],
                name="concordia_p_publish_0a0f1e_idx",
            ),
        ),
        # ProjectTopic: (topic, project), (topic, ordering), (topic, url_filter)
        migrations.AddIndex(
            model_name="projecttopic",
            index=models.Index(
                fields=["topic", "project"], name="concordia_p_topic_i_bf12cc_idx"
            ),
        ),
        migrations.AddIndex(
            model_name="projecttopic",
            index=models.Index(
                fields=["topic", "ordering"], name="concordia_p_topic_i_dcbe8c_idx"
            ),
        ),
        migrations.AddIndex(
            model_name="projecttopic",
            index=models.Index(
                fields=["topic", "url_filter"], name="concordia_p_topic_i_ee5c9d_idx"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0119_remove_asset_concordia_a_id_137ca8_idx_and_more.py
================================================
# Generated by Django 4.2.22 on 2025-09-08 14:19

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Rework the Asset indexes: drop two existing indexes and add four new
    composite indexes, each of which includes ``sequence``.
    """

    dependencies = [
        ("concordia", "0118_asset_concordia_a_item_id_f10916_idx_and_more"),
    ]

    operations = [
        migrations.RemoveIndex(
            model_name="asset",
            name="concordia_a_id_137ca8_idx",
        ),
        # This is the (item, published, transcription_status) index that
        # migration 0118 added; a variant with sequence appended follows.
        migrations.RemoveIndex(
            model_name="asset",
            name="concordia_a_item_id_f10916_idx",
        ),
        migrations.AddIndex(
            model_name="asset",
            index=models.Index(
                fields=["item", "published", "transcription_status", "sequence"],
                name="concordia_a_item_id_0926c0_idx",
            ),
        ),
        migrations.AddIndex(
            model_name="asset",
            index=models.Index(
                fields=["published", "transcription_status", "item", "sequence"],
                name="concordia_a_publish_b60d2f_idx",
            ),
        ),
        migrations.AddIndex(
            model_name="asset",
            index=models.Index(
                fields=["item", "sequence"], name="concordia_a_item_id_24ea05_idx"
            ),
        ),
        migrations.AddIndex(
            model_name="asset",
            index=models.Index(
                fields=["campaign", "sequence"], name="concordia_a_campaig_d64e2f_idx"
            ),
        ),
    ]


================================================
FILE: concordia/migrations/0120_sitereport_assets_started.py
================================================
# Generated by Django 4.2.22 on 2025-09-10 16:09

from django.db import migrations, models


class Migration(migrations.Migration):
    """Add the optional, nullable ``assets_started`` integer to SiteReport."""

    dependencies = [
        ("concordia", "0119_remove_asset_concordia_a_id_137ca8_idx_and_more"),
    ]

    operations = [
        migrations.AddField(
            model_name="sitereport",
            name="assets_started",
            field=models.IntegerField(blank=True, null=True),
        ),
    ]


================================================
FILE: concordia/migrations/0121_keymetricsreport.py
================================================
# Generated by Django 4.2.22 on 2025-09-11 16:13

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Create the KeyMetricsReport model.

    Each row describes one reporting period (``period_type`` of MONTHLY,
    QUARTERLY or FISCAL_YEAR, with start/end dates and fiscal year, plus
    optional quarter and month) together with a set of nullable metric
    columns. Rows are unique on ``(period_type, period_start, period_end)``.
    """

    dependencies = [
        ("concordia", "0120_sitereport_assets_started"),
    ]

    operations = [
        migrations.CreateModel(
            name="KeyMetricsReport",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created_on", models.DateTimeField(auto_now_add=True)),
                ("updated_on", models.DateTimeField(auto_now=True)),
                # Period identification.
                (
                    "period_type",
                    models.CharField(
                        choices=[
                            ("MONTHLY", "Monthly"),
                            ("QUARTERLY", "Quarterly"),
                            ("FISCAL_YEAR", "Fiscal year"),
                        ],
                        max_length=20,
                    ),
                ),
                ("period_start", models.DateField()),
                ("period_end", models.DateField()),
                ("fiscal_year", models.IntegerField()),
                ("fiscal_quarter", models.IntegerField(blank=True, null=True)),
                ("month", models.IntegerField(blank=True, null=True)),
                # Metric columns; every one of them is optional and nullable.
                ("assets_published", models.IntegerField(blank=True, null=True)),
                ("assets_started", models.IntegerField(blank=True, null=True)),
                ("assets_completed", models.IntegerField(blank=True, null=True)),
                ("users_activated", models.IntegerField(blank=True, null=True)),
                (
                    "anonymous_transcriptions",
                    models.IntegerField(blank=True, null=True),
                ),
                ("transcriptions_saved", models.IntegerField(blank=True, null=True)),
                ("tag_uses", models.IntegerField(blank=True, null=True)),
                (
                    "crowd_emails_and_libanswers_sent",
                    models.IntegerField(blank=True, null=True),
                ),
                ("crowd_visits", models.IntegerField(blank=True, null=True)),
                ("crowd_page_views", models.IntegerField(blank=True, null=True)),
                ("crowd_unique_visitors", models.IntegerField(blank=True, null=True)),
                (
                    "avg_visit_seconds",
                    models.DecimalField(
                        blank=True, decimal_places=2, max_digits=8, null=True
                    ),
                ),
                (
                    "transcriptions_added_to_loc_gov",
                    models.IntegerField(blank=True, null=True),
                ),
                (
                    "datasets_added_to_loc_gov",
                    models.IntegerField(blank=True, null=True),
                ),
            ],
            options={
                "ordering": ("period_start", "period_end", "period_type"),
                # All four indexes lead with period_type.
                "indexes": [
                    models.Index(
                        fields=["period_type", "period_start", "period_end"],
                        name="concordia_k_period__d8d9b6_idx",
                    ),
                    models.Index(
                        fields=["period_type", "fiscal_year"],
                        name="concordia_k_period__3d99e1_idx",
                    ),
                    models.Index(
                        fields=["period_type", "fiscal_year", "fiscal_quarter"],
                        name="concordia_k_period__420f19_idx",
                    ),
                    models.Index(
                        fields=["period_type", "fiscal_year", "month"],
                        name="concordia_k_period__06112a_idx",
                    ),
                ],
                "unique_together": {("period_type", "period_start", "period_end")},
            },
        ),
    ]


================================================
FILE: concordia/migrations/0122_alter_item_title.py
================================================
# Generated by Django 4.2.22 on 2025-10-06 18:05

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Alter ``Item.title`` to a ``CharField`` with ``max_length=1000``.
    """

    dependencies = [
        ("concordia", "0121_keymetricsreport"),
    ]

    operations = [
        migrations.AlterField(
            model_name="item",
            name="title",
            field=models.CharField(max_length=1000),
        ),
    ]


================================================
FILE: concordia/migrations/0123_alter_campaignretirementprogress_options.py
================================================
# Generated by Django 4.2.22 on 2025-10-06 18:11

from django.db import migrations


class Migration(migrations.Migration):
    """
    Set the plural verbose name of ``campaignretirementprogress`` to
    "campaign retirement progresses".
    """

    dependencies = [
        ("concordia", "0122_alter_item_title"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="campaignretirementprogress",
            options={"verbose_name_plural": "campaign retirement progresses"},
        ),
    ]


================================================
FILE: concordia/migrations/0124_update_periodic_task_paths.py
================================================
# Generated by Django 4.2.22 on 2025-10-22 16:03

from django.db import migrations

# Maps the dotted task path previously stored on periodic tasks
# ("concordia.tasks.<name>") to its replacement path inside a submodule of
# ``concordia.tasks``. The comment above each group names the target module.
OLD_TO_NEW = {
    # reservations.py
    "concordia.tasks.expire_inactive_asset_reservations": "concordia.tasks.reservations.expire_inactive_asset_reservations",
    "concordia.tasks.tombstone_old_active_asset_reservations": "concordia.tasks.reservations.tombstone_old_active_asset_reservations",
    "concordia.tasks.delete_old_tombstoned_reservations": "concordia.tasks.reservations.delete_old_tombstoned_reservations",
    # reports/sitereport.py
    "concordia.tasks.site_report": "concordia.tasks.reports.sitereport.site_report",
    # visualizations.py
    "concordia.tasks.populate_asset_status_visualization_cache": "concordia.tasks.visualizations.populate_asset_status_visualization_cache",
    "concordia.tasks.populate_daily_activity_visualization_cache": "concordia.tasks.visualizations.populate_daily_activity_visualization_cache",
    # next_asset/renew.py
    "concordia.tasks.renew_next_asset_cache": "concordia.tasks.next_asset.renew.renew_next_asset_cache",
    # search_index.py
    "concordia.tasks.create_opensearch_indices": "concordia.tasks.search_index.create_opensearch_indices",
    "concordia.tasks.delete_opensearch_indices": "concordia.tasks.search_index.delete_opensearch_indices",
    "concordia.tasks.rebuild_opensearch_indices": "concordia.tasks.search_index.rebuild_opensearch_indices",
    "concordia.tasks.populate_opensearch_users_indices": "concordia.tasks.search_index.populate_opensearch_users_indices",
    "concordia.tasks.populate_opensearch_assets_indices": "concordia.tasks.search_index.populate_opensearch_assets_indices",
    "concordia.tasks.populate_opensearch_indices": "concordia.tasks.search_index.populate_opensearch_indices",
    # assets.py
    "concordia.tasks.calculate_difficulty_values": "concordia.tasks.assets.calculate_difficulty_values",
    "concordia.tasks.populate_asset_years": "concordia.tasks.assets.populate_asset_years",
    "concordia.tasks.fix_storage_images": "concordia.tasks.assets.fix_storage_images",
    # resources.py
    "concordia.tasks.populate_resource_files": "concordia.tasks.resources.populate_resource_files",
    # housekeeping.py
    "concordia.tasks.clear_sessions": "concordia.tasks.housekeeping.clear_sessions",
    # unusualactivity.py
    "concordia.tasks.unusual_activity": "concordia.tasks.unusualactivity.unusual_activity",
    # useractivity.py
    "concordia.tasks.populate_completed_campaign_counts": "concordia.tasks.useractivity.populate_completed_campaign_counts",
    "concordia.tasks.populate_active_campaign_counts": "concordia.tasks.useractivity.populate_active_campaign_counts",
    "concordia.tasks.update_userprofileactivity_from_cache": "concordia.tasks.useractivity.update_userprofileactivity_from_cache",
    # thumbnails.py
    "concordia.tasks.download_missing_thumbnails_task": "concordia.tasks.thumbnails.download_missing_thumbnails_task",
}

# Inverse mapping (new path -> old path) used when the migration is reversed.
NEW_TO_OLD = {v: k for k, v in OLD_TO_NEW.items()}


def forwards(apps, schema_editor):
    """
    Point stored periodic tasks at the new task module paths.

    For every ``old -> new`` pair in ``OLD_TO_NEW``, all ``PeriodicTask`` rows
    whose ``task`` equals the old dotted path are rewritten to the new path
    with one filtered ``UPDATE``. Rows whose ``task`` is not a key of the
    mapping are left untouched.

    Queries are routed to the database being migrated
    (``schema_editor.connection.alias``) instead of the default alias.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor for the database being migrated.
    """
    db_alias = schema_editor.connection.alias
    PeriodicTask = apps.get_model("django_celery_beat", "PeriodicTask")
    periodic_tasks = PeriodicTask.objects.using(db_alias)
    # No new path in OLD_TO_NEW is itself an old path, so applying the pairs
    # one after another cannot rewrite the same row twice.
    for old_path, new_path in OLD_TO_NEW.items():
        if old_path != new_path:
            periodic_tasks.filter(task=old_path).update(task=new_path)


def backwards(apps, schema_editor):
    """
    Restore the original flat ``concordia.tasks.<name>`` task paths.

    For every ``new -> old`` pair in ``NEW_TO_OLD``, all ``PeriodicTask`` rows
    whose ``task`` equals the new dotted path are rewritten to the old path
    with one filtered ``UPDATE``. Rows whose ``task`` is not a key of the
    mapping are left untouched.

    Queries are routed to the database being migrated
    (``schema_editor.connection.alias``) instead of the default alias.

    Args:
        apps: Historical app registry supplied by ``RunPython``.
        schema_editor: Schema editor for the database being migrated.
    """
    db_alias = schema_editor.connection.alias
    PeriodicTask = apps.get_model("django_celery_beat", "PeriodicTask")
    periodic_tasks = PeriodicTask.objects.using(db_alias)
    # No old path in NEW_TO_OLD is itself a new path, so applying the pairs
    # one after another cannot rewrite the same row twice.
    for new_path, old_path in NEW_TO_OLD.items():
        if old_path != new_path:
            periodic_tasks.filter(task=new_path).update(task=old_path)


class Migration(migrations.Migration):
    """
    Data migration that rewrites ``PeriodicTask.task`` paths after the
    ``concordia.tasks`` module was split into submodules. Reversible.
    """

    dependencies = [
        ("concordia", "0123_alter_campaignretirementprogress_options"),
        # The RunPython callables load ``django_celery_beat.PeriodicTask`` from
        # the historical app registry. Declaring the dependency guarantees
        # that model is present in the migration state whatever order the
        # planner picks for the two apps. ``0001_initial`` already defines
        # ``PeriodicTask.task``, the only field these callables touch.
        ("django_celery_beat", "0001_initial"),
    ]

    operations = [
        migrations.RunPython(forwards, backwards),
    ]


================================================
FILE: concordia/migrations/0125_update_userprofile_tasks.py
================================================
# Generated by Django 4.2.26 on 2025-11-14 15:05

from django.db import migrations

# Title of the ResearchCenter row this migration creates (and removes on reverse).
TITLE = "Geography and Map"


def forwards(apps, schema_editor):
    """
    Insert a ``ResearchCenter`` row titled ``TITLE``.

    The row is created through the historical model on the database that is
    currently being migrated.
    """
    research_center_model = apps.get_model("concordia", "ResearchCenter")
    target_db = schema_editor.connection.alias
    research_center_model.objects.using(target_db).create(title=TITLE)


def reverse_func(apps, schema_editor):
    """
    Remove the ``ResearchCenter`` row(s) titled ``TITLE``.

    A filtered bulk delete is used instead of ``get(...).delete()`` so that
    rolling back does not abort with ``DoesNotExist`` when the row has since
    been renamed or removed, or with ``MultipleObjectsReturned`` when more
    than one row carries the title (``title`` is not unique).
    """
    db_alias = schema_editor.connection.alias
    ResearchCenter = apps.get_model("concordia", "ResearchCenter")
    ResearchCenter.objects.using(db_alias).filter(title=TITLE).delete()


class Migration(migrations.Migration):
    """
    Data migration that adds one ``ResearchCenter`` row; reversible.

    NOTE(review): the module name mentions "userprofile tasks", but the only
    operation here creates a research center. Confirm the name is intentional.
    """

    dependencies = [
        ("concordia", "0124_update_periodic_task_paths"),
    ]

    operations = [migrations.RunPython(forwards, reverse_func)]


================================================
FILE: concordia/migrations/0126_concordiafile_helpfullink_remove_resource_campaign_and_more.py
================================================
# Generated by Django 4.2.24 on 2025-12-15 15:49

from django.db import migrations


class Migration(migrations.Migration):
    """
    State-only rename of ``Resource`` -> ``HelpfulLink`` and
    ``ResourceFile`` -> ``ConcordiaFile``, including their renamed fields.

    ``database_operations`` is empty, so this migration changes Django's
    migration state only and runs no SQL against the database.
    """

    dependencies = [
        ("concordia", "0125_update_userprofile_tasks"),
    ]

    operations = [
        migrations.SeparateDatabaseAndState(
            # Nothing is executed against the database.
            database_operations=[],
            state_operations=[
                migrations.RenameModel(
                    old_name="Resource",
                    new_name="HelpfulLink",
                ),
                migrations.RenameField(
                    model_name="helpfullink",
                    old_name="resource_type",
                    new_name="link_type",
                ),
                migrations.RenameField(
                    model_name="helpfullink",
                    old_name="resource_url",
                    new_name="link_url",
                ),
                migrations.RenameModel(
                    old_name="ResourceFile",
                    new_name="ConcordiaFile",
                ),
                migrations.RenameField(
                    model_name="concordiafile",
                    old_name="resource",
                    new_name="uploaded_file",
                ),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0127_alter_campaignretirementprogress_options_and_more.py
================================================
# Generated by Django 4.2.24 on 2025-12-15 16:37

from django.db import migrations, models

import concordia.models


class Migration(migrations.Migration):
    """
    State-only follow-up to the ``HelpfulLink`` / ``ConcordiaFile`` renames.

    Records in the migration state that the renamed fields and models keep
    their original column names (``db_column``) and table names
    (``AlterModelTable``). ``database_operations`` is empty, so no SQL is run.
    """

    dependencies = [
        (
            "concordia",
            "0126_concordiafile_helpfullink_remove_resource_campaign_and_more",
        ),
    ]

    operations = [
        migrations.SeparateDatabaseAndState(
            # Nothing is executed against the database.
            database_operations=[],
            state_operations=[
                migrations.AlterField(
                    model_name="concordiafile",
                    name="uploaded_file",
                    field=models.FileField(
                        db_column="resource",
                        upload_to=concordia.models.resource_file_upload_path,
                    ),
                ),
                migrations.AlterField(
                    model_name="helpfullink",
                    name="link_type",
                    field=models.IntegerField(
                        choices=[
                            (1, "Related Link"),
                            (2, "Completed Transcription Link"),
                        ],
                        db_column="resource_type",
                        default=1,
                    ),
                ),
                migrations.AlterField(
                    model_name="helpfullink",
                    name="link_url",
                    field=models.URLField(db_column="resource_url"),
                ),
                migrations.AlterModelTable(
                    name="concordiafile",
                    table="concordia_resourcefile",
                ),
                migrations.AlterModelTable(
                    name="helpfullink",
                    table="concordia_resource",
                ),
            ],
        ),
    ]


================================================
FILE: concordia/migrations/0128_alter_campaignretirementprogress_options.py
================================================
# Generated by Django 4.2.24 on 2025-12-15 16:41

from django.db import migrations


class Migration(migrations.Migration):
    """
    Set the plural verbose name of ``campaignretirementprogress`` to
    "campaign retirement progress".
    """

    dependencies = [
        ("concordia", "0127_alter_campaignretirementprogress_options_and_more"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="campaignretirementprogress",
            options={"verbose_name_plural": "campaign retirement progress"},
        ),
    ]


================================================
FILE: concordia/migrations/__init__.py
================================================


================================================
FILE: concordia/models.py
================================================
import calendar
import csv
import datetime
import io
import json
import os.path
import time
import uuid
from decimal import Decimal
from itertools import chain
from logging import getLogger
from typing import Optional, Tuple, Union

import pytesseract
from django.conf import settings
from django.contrib.auth.models import User
from django.contrib.postgres.fields import ArrayField
from django.contrib.postgres.indexes import GinIndex
from django.core import signing
from django.core.cache import cache
from django.core.exceptions import ObjectDoesNotExist, ValidationError
from django.core.serializers.json import DjangoJSONEncoder
from django.core.validators import RegexValidator
from django.db import models
from django.db.models import (
    Avg,
    Case,
    Count,
    ExpressionWrapper,
    F,
    JSONField,
    Q,
    Sum,
    Value,
    When,
)
from django.db.models.functions import Round
from django.db.models.signals import post_save
from django.urls import reverse
from django.utils import timezone
from django.utils.functional import cached_property
from PIL import Image

from concordia.exceptions import RateLimitExceededError
from concordia.logging import ConcordiaLogger
from concordia.storage import ASSET_STORAGE
from configuration.utils import configuration_value
from prometheus_metrics.models import MetricsModelMixin

# Standard-library logger and the project's structured logger for this module.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)

# Callable passed as ``default=`` to the JSON ``metadata`` fields below.
metadata_default = dict

# Sets the private ``_unique`` flag on the built-in ``User.email`` field object
# at import time.
# NOTE(review): presumably so email is treated as unique without replacing
# ``auth.User``; confirm a matching database constraint exists, since none is
# visible in this module.
User._meta.get_field("email").__dict__["_unique"] = True

ONE_MINUTE = datetime.timedelta(minutes=1)
ONE_DAY = datetime.timedelta(days=1)
# NOTE(review): evaluated once, when this module is imported. In a long-running
# process the value keeps drifting further than one day into the past.
ONE_DAY_AGO = timezone.now() - ONE_DAY
# Default ``threshold`` for ``ConcordiaUser.review_incidents``.
THRESHOLD = 2


def resource_file_upload_path(instance, filename):
    """
    Return the upload path for a ConcordiaFile instance.

    If the instance already has a primary key and a stored path, that path is
    reused so the file is not moved on subsequent saves. Otherwise, a dated
    path is generated under ``cm-uploads/resources/<year>/`` using the
    lowercased filename.

    Args:
        instance: Object exposing ``id`` and ``path`` attributes.
        filename (str): Name of the uploaded file.

    Returns:
        str: The storage-relative path for the file.
    """
    if instance.id and instance.path:
        return instance.path
    # Only the year goes through strftime. The filename is user supplied and
    # must never be part of the format string, otherwise "%"-sequences in it
    # (e.g. "100%done.pdf") would be expanded as date directives or rejected.
    return "cm-uploads/resources/{0}/{1}".format(
        time.strftime("%Y"), filename.lower()
    )


class ConcordiaUser(User):
    """
    Proxy model adding Concordia-specific helpers and rate-limit tracking.

    This avoids changing the base ``auth.User`` model while still attaching
    project-specific behavior such as email reconfirmation flow and review
    rate limiting.
    """

    class Meta:
        proxy = True

    @property
    def email_reconfirmation_cache_key(self):
        """
        Return the cache key used to store the pending reconfirmation email.
        """
        return settings.EMAIL_RECONFIRMATION_KEY.format(id=self.id)

    def set_email_for_reconfirmation(self, email):
        """
        Store a pending reconfirmation email address in the cache.

        The value is stored under :attr:`email_reconfirmation_cache_key` for
        the duration configured by ``EMAIL_RECONFIRMATION_TIMEOUT``.
        """
        cache.set(
            self.email_reconfirmation_cache_key,
            email,
            settings.EMAIL_RECONFIRMATION_TIMEOUT,
        )

    def get_email_for_reconfirmation(self):
        """
        Return the cached reconfirmation email address, if present.

        Returns:
            str | None: The pending reconfirmation email, or None if no value
            is cached.
        """
        return cache.get(self.email_reconfirmation_cache_key)

    def delete_email_for_reconfirmation(self):
        """
        Remove any cached reconfirmation email address for this user.
        """
        cache.delete(self.email_reconfirmation_cache_key)

    def get_email_reconfirmation_key(self):
        """
        Build a signed reconfirmation token for the cached email address.

        The token encodes the username and pending email address using
        Django's :mod:`signing` utilities.

        Returns:
            str: A signed string suitable for use in reconfirmation URLs.

        Raises:
            ValueError: If no email address has been cached for this user.
        """
        email = self.get_email_for_reconfirmation()
        if email:
            return signing.dumps(obj={"username": self.get_username(), "email": email})
        else:
            raise ValueError("No email cached for reconfirmation")

    def validate_reconfirmation_email(self, email):
        """
        Check whether the supplied email matches the cached reconfirmation one.

        Args:
            email (str): Email address to validate.

        Returns:
            bool: True if the email matches the cached value, otherwise False.
        """
        return email == self.get_email_for_reconfirmation()

    def review_incidents(self, recent_accepts, threshold=THRESHOLD):
        """
        Count review-rate incidents for this user within a queryset.

        Each accept is taken in turn as the start of a window. An incident is
        counted for that start when ``threshold`` accepts (the start included)
        fall within 60 whole seconds of it. At most one incident is counted
        per starting accept.

        Args:
            recent_accepts (QuerySet): Transcription queryset filtered to rows
                with non-null ``accepted`` timestamps.
            threshold (int): Minimum number of accepts in a 60-second window
                required to count as one incident.

        Returns:
            int: Number of detected review incidents.
        """
        accepts = recent_accepts.filter(reviewed_by=self).values_list(
            "accepted", flat=True
        )
        timestamps = sorted(accepts)
        incidents = 0
        for i in range(len(timestamps)):
            count = 1
            for j in range(i + 1, len(timestamps)):
                elapsed = timestamps[j] - timestamps[i]
                # Use the full elapsed time. ``timedelta.seconds`` is only the
                # seconds component and drops whole days, so accepts that are
                # days apart could look like they are seconds apart. Truncating
                # to whole seconds keeps the original sub-second boundary.
                if int(elapsed.total_seconds()) <= 60:
                    count += 1
                    if count == threshold:
                        incidents += 1
                        break
                else:
                    # Timestamps are sorted, so every later accept is also
                    # outside this window.
                    break
        return incidents

    def transcribe_incidents(self, transcriptions):
        """
        Count transcription-speed incidents for this user.

        An incident is counted for each of the user's transcriptions that is
        followed, within the next 60 seconds, by a submission from the same
        user on a different asset.

        Args:
            transcriptions (QuerySet): Transcription queryset to inspect,
                already limited to the desired time range. It is filtered to
                this user here.

        Returns:
            int: Number of detected transcription incidents.
        """
        transcriptions = transcriptions.filter(user=self).order_by("submitted")
        incidents = 0
        for transcription in transcriptions:
            start = transcription.submitted
            end = transcription.submitted + datetime.timedelta(minutes=1)
            if (
                transcriptions.filter(submitted__lte=end, submitted__gt=start)
                .exclude(asset=transcription.asset)
                .count()
                > 0
            ):
                incidents += 1
        return incidents

    @property
    def transcription_accepted_cache_key(self):
        """
        Return the cache key used to track this user's recent accept timestamps.
        """
        return settings.TRANSCRIPTION_ACCEPTED_TRACKING_KEY.format(user_id=self.id)

    def check_and_track_accept_limit(self, transcription):
        """
        Enforce and update the per-minute accept-rate limit for this user.

        For non-superusers, this loads the recent acceptance timestamps from
        the cache, discards values older than one minute, and checks the
        resulting count against the ``review_rate_limit`` configuration
        value. If recording another acceptance would exceed that limit, a
        :class:`RateLimitExceededError` is raised. Otherwise, the current
        timestamp is appended and written back to the cache.

        Args:
            transcription (Transcription): The transcription being accepted.
                (The argument is not inspected, but kept for call-site
                clarity.)

        Raises:
            RateLimitExceededError: If the user would exceed the configured
                rate limit.
        """
        if not self.is_superuser:
            key = self.transcription_accepted_cache_key
            now = timezone.now()
            one_minute_ago = now - ONE_MINUTE

            timestamps = cache.get(key, [])
            valid_timestamps = [ts for ts in timestamps if ts >= one_minute_ago]

            # The leading length check lets the first accept through without
            # consulting the configured limit.
            if len(valid_timestamps) and len(valid_timestamps) >= configuration_value(
                "review_rate_limit"
            ):
                raise RateLimitExceededError()

            valid_timestamps.append(now)
            # Entries are only relevant for one minute, so the cache entry
            # expires after 60 seconds.
            cache.set(key, valid_timestamps, 60)


class UserProfile(MetricsModelMixin("userprofile"), models.Model):
    """
    Per-user activity counters linked one-to-one to ``auth.User``.

    The profile is reachable from a user as ``user.profile`` and is deleted
    together with the user (``on_delete=CASCADE``).
    """

    user = models.OneToOneField(User, on_delete=models.CASCADE, related_name="profile")
    transcribe_count = models.IntegerField(
        default=0, verbose_name="transcription save/submit count"
    )
    review_count = models.IntegerField(
        default=0, verbose_name="transcription review count"
    )


class OverlayPosition:
    """
    Left/right position constants used in carousel slide content management.

    ``CHOICES`` holds ``(value, label)`` pairs and ``CHOICE_MAP`` maps each
    value to its label.
    """

    LEFT, RIGHT = "left", "right"

    CHOICE_MAP = {LEFT: "Left", RIGHT: "Right"}
    CHOICES = tuple(CHOICE_MAP.items())


class TranscriptionStatus:
    """
    Rollup status values summarising an asset's transcription state, so that
    views do not need nested queries to determine it.

    ``CHOICES`` holds ``(value, label)`` pairs and ``CHOICE_MAP`` maps each
    value to its label. Note that ``SUBMITTED`` is labelled "Needs Review".
    """

    NOT_STARTED, IN_PROGRESS, SUBMITTED, COMPLETED = (
        "not_started",
        "in_progress",
        "submitted",
        "completed",
    )

    CHOICE_MAP = {
        NOT_STARTED: "Not Started",
        IN_PROGRESS: "In Progress",
        SUBMITTED: "Needs Review",
        COMPLETED: "Completed",
    }
    CHOICES = tuple(CHOICE_MAP.items())


# Maps every transcription status value to the name "<status>_count", which is
# used as the annotation name for the per-status asset counts.
STATUS_COUNT_KEYS = {
    status_value: "{}_count".format(status_value)
    for status_value, _label in TranscriptionStatus.CHOICES
}


class MediaType:
    """
    Supported asset media types.

    Each constant is the stored three-letter code. ``CHOICES`` pairs every
    code with its human-readable label.
    """

    IMAGE, AUDIO, VIDEO = "IMG", "AUD", "VID"

    CHOICES = tuple(zip((IMAGE, AUDIO, VIDEO), ("Image", "Audio", "Video")))


class PublicationQuerySet(models.QuerySet):
    """
    QuerySet helpers for models that carry a boolean ``published`` field.
    """

    def published(self):
        """
        Return queryset filtered to published objects.
        """
        return self.filter(published=True)

    def unpublished(self):
        """
        Return queryset filtered to unpublished objects.
        """
        return self.filter(published=False)


class UnlistedPublicationQuerySet(PublicationQuerySet):
    """
    QuerySet used as the manager for ``Campaign`` and ``Topic``.

    Adds filters on ``unlisted``, campaign status and the "next campaign"
    flags, plus :meth:`annotated` for asset-count rollups.

    NOTE(review): ``active``/``completed``/``retired`` and the
    ``get_next_*_campaigns`` helpers filter on fields that ``Campaign``
    declares but ``Topic`` does not. Confirm they are only called on
    ``Campaign`` querysets.
    """

    def annotated(self):
        """
        Return campaigns/topics annotated with asset counts and completion data.

        The returned queryset includes:

        - ``asset_count``: Number of published assets reachable through the
          associated projects and items.
        - Per-status counts based on :data:`STATUS_COUNT_KEYS`, such as
          ``completed_count`` and ``submitted_count``.
        - ``completed_percent`` and ``needs_review_percent``: Rounded
          percentages of assets in the completed or needs-review state,
          clamped so that 100 percent is only returned if all assets are in
          that state.

        Objects with no published assets (``asset_count`` of zero) are
        excluded from the result.
        """
        return (
            self.annotate(
                asset_count=Count(
                    "project__item__asset",
                    filter=Q(
                        project__published=True,
                        project__item__published=True,
                        project__item__asset__published=True,
                    ),
                )
            )
            # Dropping empty objects here also keeps the divisions below from
            # dividing by zero.
            .filter(asset_count__gt=0)
            .annotate(
                **{
                    v: Count(
                        "project__item__asset",
                        filter=Q(
                            project__published=True,
                            project__item__published=True,
                            project__item__asset__published=True,
                            project__item__asset__transcription_status=k,
                        ),
                    )
                    for k, v in STATUS_COUNT_KEYS.items()
                }
            )
            # PostgreSQL does integer division when given two integers, which results
            # in the decimal results being dropped. We implicitly cast one field to
            # be a float through multiplication in order to do floating point division
            .annotate(
                completed_raw_percent=ExpressionWrapper(
                    100 * F("completed_count") * 1.0 / F("asset_count"),
                    output_field=models.FloatField(),
                ),
                needs_review_raw_percent=ExpressionWrapper(
                    100 * F("submitted_count") * 1.0 / F("asset_count"),
                    output_field=models.FloatField(),
                ),
            )
            # Due to rounding issues, we explicitly only allow a 100% value if all
            # assets are in a particular status. Otherwise, we clamp to a maximum of
            # 99%
            .annotate(
                completed_percent=Case(
                    When(
                        completed_raw_percent__gte=99,
                        completed_raw_percent__lt=100,
                        then=Value(99),
                    ),
                    default=Round(F("completed_raw_percent")),
                    output_field=models.FloatField(),
                ),
                needs_review_percent=Case(
                    When(
                        needs_review_raw_percent__gte=99,
                        needs_review_raw_percent__lt=100,
                        then=Value(99),
                    ),
                    default=Round(F("needs_review_raw_percent")),
                    output_field=models.FloatField(),
                ),
            )
        )

    def listed(self):
        """
        Return queryset filtered to objects with ``unlisted=False``.
        """
        return self.filter(unlisted=False)

    def unlisted(self):
        """
        Return queryset filtered to objects with ``unlisted=True``.
        """
        return self.filter(unlisted=True)

    def active(self):
        """
        Return queryset filtered to ``status == Campaign.Status.ACTIVE``.
        """
        return self.filter(status=Campaign.Status.ACTIVE)

    def completed(self):
        """
        Return queryset filtered to ``status == Campaign.Status.COMPLETED``.
        """
        return self.filter(status=Campaign.Status.COMPLETED)

    def retired(self):
        """
        Return queryset filtered to ``status == Campaign.Status.RETIRED``.
        """
        return self.filter(status=Campaign.Status.RETIRED)

    def get_next_transcription_campaigns(self):
        """
        Return objects flagged with ``next_transcription_campaign=True``.
        """
        return self.filter(next_transcription_campaign=True)

    def get_next_review_campaigns(self):
        """
        Return objects flagged with ``next_review_campaign=True``.
        """
        return self.filter(next_review_campaign=True)


class Card(models.Model):
    """
    A single card with a title, optional image and body text.

    Cards are grouped into a :class:`CardFamily` through ``TutorialCard``.
    Instances are ordered by ``title`` by default.
    """

    image_alt_text = models.TextField(blank=True)
    image = models.ImageField(upload_to="card_images", blank=True, null=True)
    title = models.CharField(max_length=80)
    body_text = models.TextField(blank=True)
    # Timestamps maintained automatically on insert / on every save.
    created_on = models.DateTimeField(editable=False, auto_now_add=True)
    updated_on = models.DateTimeField(editable=False, auto_now=True, null=True)
    display_heading = models.CharField(max_length=80, blank=True, null=True)

    def __str__(self):
        return self.title

    class Meta:
        ordering = ("title",)


class CardFamily(models.Model):
    """
    A named group of :class:`Card` objects (a tutorial), identified by slug.

    At most one family is meant to have ``default=True``; the ``post_save``
    handler ``on_cardfamily_save`` clears the flag on all other families when
    a family is saved with it set.
    """

    slug = models.SlugField(max_length=80, unique=True, allow_unicode=True)
    default = models.BooleanField(default=False)
    cards = models.ManyToManyField(Card, through="TutorialCard")

    class Meta:
        verbose_name_plural = "card families"

    def __str__(self):
        return self.slug


def on_cardfamily_save(sender, instance, **kwargs):
    """
    Keep a single default ``CardFamily`` after one is saved.

    When the saved family has ``default`` set, the flag is cleared on every
    other family that currently has it. Nothing happens when the saved
    family is not the default.
    """
    if not instance.default:
        return

    # Only one tutorial / list of cards may be marked as "default", so unset
    # the flag everywhere except on the family that was just saved.
    other_defaults = CardFamily.objects.filter(default=True).exclude(pk=instance.pk)
    other_defaults.update(default=False)


post_save.connect(on_cardfamily_save, sender=CardFamily)


class ResearchCenter(models.Model):
    """
    A research center, identified only by its title.

    Campaigns reference research centers through
    ``Campaign.research_centers``.
    """

    title = models.CharField(max_length=80)

    def __str__(self):
        return self.title


class Campaign(MetricsModelMixin("campaign"), models.Model):
    """
    Top-level container for projects.

    ``published`` and ``unlisted`` are independent flags, each exposed
    through filters on the default manager. ``status`` holds one of the
    :class:`Campaign.Status` values.
    """

    class Status(models.IntegerChoices):
        ACTIVE = 1
        COMPLETED = 2
        RETIRED = 3

    objects = UnlistedPublicationQuerySet.as_manager()

    published = models.BooleanField(default=False, blank=True, db_index=True)
    unlisted = models.BooleanField(default=False, blank=True, db_index=True)
    status = models.IntegerField(choices=Status.choices, default=Status.ACTIVE)
    # Flags read by ``get_next_transcription_campaigns`` and
    # ``get_next_review_campaigns`` on the manager.
    next_transcription_campaign = models.BooleanField(
        default=False, blank=True, db_index=True, verbose_name="Next-tran."
    )
    next_review_campaign = models.BooleanField(
        default=False, blank=True, db_index=True, verbose_name="Next-rev."
    )

    ordering = models.IntegerField(
        default=0, help_text="Sort order override: lower values will be listed first"
    )
    display_on_homepage = models.BooleanField(default=True, verbose_name="Homepage")

    title = models.CharField(max_length=80)
    slug = models.SlugField(max_length=80, unique=True, allow_unicode=True)

    card_family = models.ForeignKey(
        CardFamily, on_delete=models.CASCADE, blank=True, null=True
    )
    thumbnail_image = models.ImageField(
        upload_to="campaign-thumbnails", blank=True, null=True
    )
    image_alt_text = models.TextField(blank=True, null=True)

    launch_date = models.DateField(null=True, blank=True)
    completed_date = models.DateField(null=True, blank=True)

    description = models.TextField(blank=True)
    short_description = models.TextField(blank=True)

    metadata = JSONField(default=metadata_default, blank=True, null=True)

    # Checked by ``Project.turn_off_ocr`` in addition to the project's own flag.
    disable_ocr = models.BooleanField(
        default=False, help_text="Turn OCR off for all assets of this campaign"
    )

    research_centers = models.ManyToManyField(ResearchCenter, blank=True)

    class Meta:
        indexes = [
            models.Index(fields=["published", "unlisted"]),
        ]
        permissions = [
            ("retire_campaign", "Can retire campaign"),
        ]

    def __str__(self):
        return self.title

    def get_absolute_url(self):
        """
        Return the URL of the campaign detail page for this campaign's slug.
        """
        return reverse("transcriptions:campaign-detail", args=(self.slug,))


class Topic(models.Model):
    """
    A topic that projects can be associated with (see ``Project.topics``).

    Shares the ``published``/``unlisted`` flags and manager with ``Campaign``.
    Unlike ``Campaign.slug``, the slug here is not declared unique.
    """

    objects = UnlistedPublicationQuerySet.as_manager()

    published = models.BooleanField(default=False, blank=True, db_index=True)
    unlisted = models.BooleanField(default=False, blank=True, db_index=True)

    ordering = models.IntegerField(
        default=0, help_text="Sort order override: lower values will be listed first"
    )
    title = models.CharField(blank=False, max_length=255)
    slug = models.SlugField(blank=False, allow_unicode=True, max_length=80)
    description = models.TextField(blank=True)
    thumbnail_image = models.ImageField(
        upload_to="topic-thumbnails", blank=True, null=True
    )
    short_description = models.TextField(blank=True)

    class Meta:
        indexes = [
            models.Index(fields=["published", "unlisted"]),
        ]

    def __str__(self):
        return self.title

    def get_absolute_url(self):
        """
        Return the URL of the topic detail page for this topic's slug.
        """
        return reverse("topic-detail", kwargs={"slug": self.slug})


class HelpfulLinkTypeQuerySet(models.QuerySet):
    """
    QuerySet helpers that filter ``HelpfulLink`` rows by ``link_type``.
    """

    def related_links(self):
        """
        Return links whose type is ``RELATED_LINK``.
        """
        return self.filter(link_type=HelpfulLink.HelpfulLinkType.RELATED_LINK)

    def completed_transcription_links(self):
        """
        Return links whose type is ``COMPLETED_TRANSCRIPTION_LINK``.
        """
        return self.filter(
            link_type=HelpfulLink.HelpfulLinkType.COMPLETED_TRANSCRIPTION_LINK
        )


class HelpfulLink(MetricsModelMixin("resource"), models.Model):
    """
    A titled URL that can be attached to a campaign and/or a topic.

    This model was previously known as `Resource`. It was renamed to avoid
    conflict with the same name being used on loc.gov.

    The original table and column names have been maintained (see
    ``Meta.db_table`` and the ``db_column`` arguments below). Instances are
    ordered by ``sequence`` by default.
    """

    class HelpfulLinkType(models.IntegerChoices):
        RELATED_LINK = 1
        COMPLETED_TRANSCRIPTION_LINK = 2

    objects = HelpfulLinkTypeQuerySet.as_manager()

    sequence = models.PositiveIntegerField(default=1)
    title = models.CharField(blank=False, max_length=255)
    # Stored in the pre-rename column "resource_type".
    link_type = models.IntegerField(
        choices=HelpfulLinkType.choices,
        default=HelpfulLinkType.RELATED_LINK,
        db_column="resource_type",
    )
    # Stored in the pre-rename column "resource_url".
    link_url = models.URLField(db_column="resource_url")

    # Both owners are optional.
    campaign = models.ForeignKey(
        Campaign, on_delete=models.CASCADE, blank=True, null=True
    )
    topic = models.ForeignKey(Topic, on_delete=models.CASCADE, blank=True, null=True)

    class Meta:
        ordering = ("sequence",)
        db_table = "concordia_resource"

    def __str__(self):
        return self.title


class ConcordiaFile(models.Model):
    """
    A named uploaded file.

    This model was previously known as `ResourceFile`. It was renamed to avoid
    conflict with the same name being used on loc.gov.

    The original table and column names have been maintained (see
    ``Meta.db_table`` and the ``db_column`` argument below).
    """

    name = models.CharField(blank=False, max_length=255)
    # Storage path recorded on first save. ``resource_file_upload_path``
    # returns it for later uploads so the file keeps the same location.
    path = models.CharField(blank=True, default="", max_length=255)
    # Stored in the pre-rename column "resource".
    uploaded_file = models.FileField(
        upload_to=resource_file_upload_path, db_column="resource"
    )
    updated_on = models.DateTimeField(auto_now=True)

    class Meta:
        ordering = ["name"]
        db_table = "concordia_resourcefile"

    def __str__(self):
        return self.name

    def save(self, *args, **kwargs):
        """
        Save the instance and record the stored file name in ``path``.

        After the normal save, if the row has an id and ``path`` is still
        empty, ``path`` is set to ``uploaded_file.name`` and the instance is
        saved a second time. The second save is issued without the
        caller's positional and keyword arguments.
        """
        super().save(*args, **kwargs)
        if self.id and not self.path:
            self.path = self.uploaded_file.name
            self.save()

    def delete(self, *args, **kwargs):
        """
        Delete the stored file, if the storage reports it exists, and then
        delete the database row.
        """
        storage = self.uploaded_file.storage

        if storage.exists(self.uploaded_file.name):
            # save=False: the row is removed right below, so the cleared
            # field does not need to be written back.
            self.uploaded_file.delete(save=False)

        super().delete(*args, **kwargs)


class Project(MetricsModelMixin("project"), models.Model):
    """
    A project within a campaign.

    Slugs are unique per campaign, and OCR can be disabled either on the
    project itself or on its campaign.
    """

    objects = PublicationQuerySet.as_manager()

    campaign = models.ForeignKey(Campaign, on_delete=models.CASCADE)

    published = models.BooleanField(default=False, blank=True, db_index=True)
    ordering = models.IntegerField(
        default=0, help_text="Sort order override: lower values will be listed first"
    )
    title = models.CharField(max_length=80)
    slug = models.SlugField(max_length=80, allow_unicode=True)
    thumbnail_image = models.ImageField(
        upload_to="project-thumbnails", blank=True, null=True
    )

    description = models.TextField(blank=True)
    metadata = JSONField(default=metadata_default, blank=True, null=True)

    topics = models.ManyToManyField("Topic", through="ProjectTopic")

    disable_ocr = models.BooleanField(
        default=False, help_text="Turn OCR off for all assets of this project"
    )

    class Meta:
        unique_together = (("slug", "campaign"),)
        ordering = ["title"]
        indexes = [
            models.Index(fields=["id", "campaign", "published"]),
            models.Index(fields=["published", "campaign", "title"]),
        ]

    def __str__(self):
        """Return the project title as its display string."""
        return self.title

    def get_absolute_url(self):
        """Return the URL of this project's detail page."""
        url_kwargs = {"campaign_slug": self.campaign.slug, "slug": self.slug}
        return reverse("transcriptions:project-detail", kwargs=url_kwargs)

    def turn_off_ocr(self):
        """Return a truthy value when OCR is disabled here or on the campaign."""
        own_flag = self.disable_ocr
        return own_flag if own_flag else self.campaign.disable_ocr


class Item(MetricsModelMixin("item"), models.Model):
    """
    An item within a project, identified by an upstream-assigned ``item_id``.

    ``item_id`` is unique per project. OCR can be disabled on the item itself
    or inherited from its project.
    """

    objects = PublicationQuerySet.as_manager()

    project = models.ForeignKey(Project, on_delete=models.CASCADE)

    published = models.BooleanField(default=False, blank=True)

    title = models.CharField(max_length=1000)
    item_url = models.URLField(max_length=255)
    item_id = models.CharField(
        max_length=100, help_text="Unique item ID assigned by the upstream source"
    )
    description = models.TextField(blank=True)
    metadata = JSONField(
        default=metadata_default,
        blank=True,
        null=True,
        help_text="Raw metadata returned by the remote API",
    )
    thumbnail_url = models.URLField(max_length=255, blank=True, null=True)
    thumbnail_image = models.ImageField(
        upload_to="item-thumbnails", blank=True, null=True
    )

    disable_ocr = models.BooleanField(
        default=False, help_text="Turn OCR off for all assets of this item"
    )

    class Meta:
        unique_together = (("item_id", "project"),)
        indexes = [models.Index(fields=["project", "published"])]

    def __str__(self):
        """Return ``"<item_id>: <title>"`` as the display string."""
        return f"{self.item_id}: {self.title}"

    def get_absolute_url(self):
        """Return the URL of this item's detail page."""
        parent = self.project
        url_kwargs = {
            "campaign_slug": parent.campaign.slug,
            "project_slug": parent.slug,
            "item_id": self.item_id,
        }
        return reverse("transcriptions:item-detail", kwargs=url_kwargs)

    @property
    def thumbnail_link(self) -> str | None:
        """
        Pick the thumbnail URL to display for this item.

        The URL of ``thumbnail_image`` wins when an image is set and its URL
        can be produced; otherwise ``thumbnail_url`` is used. ``None`` is
        returned when neither yields a value.

        TODO: Remove this when removing thumbnail_url and switch template
        to use thumbnail_image directly (transcriptions/project_detail.html)
        """
        image = self.thumbnail_image
        if image:
            try:
                return image.url
            except ValueError:
                # The image URL could not be produced; thumbnail_url is
                # still available as a fallback for now.
                pass
        return self.thumbnail_url or None

    def turn_off_ocr(self):
        """Return a truthy value when OCR is disabled here or further up."""
        own_flag = self.disable_ocr
        return own_flag if own_flag else self.project.turn_off_ocr()


class AssetQuerySet(PublicationQuerySet):
    """Publication queryset with extra contribution-count annotations."""

    def add_contribution_counts(self):
        """
        Annotate each row with distinct contribution counts.

        Adds ``transcription_count``, ``transcriber_count`` and
        ``reviewer_count``, each computed with ``Count(..., distinct=True)``.
        """
        count_annotations = {
            "transcription_count": Count("transcription", distinct=True),
            "transcriber_count": Count("transcription__user", distinct=True),
            "reviewer_count": Count("transcription__reviewed_by", distinct=True),
        }
        return self.annotate(**count_annotations)


class Asset(MetricsModelMixin("asset"), models.Model):
    def get_storage_path(self, filename):
        """
        Build the storage path for an uploaded image from its file name.

        Only the extension of ``filename`` is used: it is lower-cased, its
        leading dot is removed and ``jpeg`` is normalized to ``jpg`` before
        being handed to ``get_asset_image_filename``.
        """
        _, dotted_suffix = os.path.splitext(filename)
        suffix = dotted_suffix.lstrip(".").lower()
        return self.get_asset_image_filename("jpg" if suffix == "jpeg" else suffix)

    objects = AssetQuerySet.as_manager()

    item = models.ForeignKey(Item, on_delete=models.CASCADE)
    # Direct campaign reference; save() fills it in from
    # item.project.campaign when it has not been set.
    campaign = models.ForeignKey(Campaign, on_delete=models.CASCADE)

    published = models.BooleanField(default=False, blank=True, db_index=True)

    title = models.CharField(max_length=100)
    # Unique per item (see Meta.unique_together)
    slug = models.SlugField(max_length=100, allow_unicode=True)

    description = models.TextField(blank=True)
    media_type = models.CharField(
        max_length=4, choices=MediaType.CHOICES, db_index=True
    )
    # Also used as the base name of the stored image file
    # (see get_asset_image_filename)
    sequence = models.PositiveIntegerField(default=1)
    year = models.CharField(blank=True, max_length=50)

    # The original ID of the image resource on loc.gov
    resource_url = models.URLField(max_length=255, blank=True, null=True)
    # The URL used to download this image from loc.gov
    download_url = models.CharField(max_length=255, blank=True, null=True)

    metadata = JSONField(default=metadata_default, blank=True, null=True)

    # This is computed from the Transcription records and should never
    # be directly modified except by the Transcription signal handler:
    transcription_status = models.CharField(
        editable=False,
        max_length=20,
        default=TranscriptionStatus.NOT_STARTED,
        choices=TranscriptionStatus.CHOICES,
        db_index=True,
    )

    difficulty = models.PositiveIntegerField(default=0, blank=True, null=True)

    # The upload path is produced by get_storage_path, defined at the top of
    # the class so that it already exists when this field is declared.
    storage_image = models.ImageField(
        upload_to=get_storage_path, storage=ASSET_STORAGE, max_length=255
    )

    disable_ocr = models.BooleanField(
        default=False, help_text="Turn OCR off for this asset"
    )

    class Meta:
        unique_together = (("slug", "item"),)
        indexes = [
            models.Index(
                fields=["item", "published", "transcription_status", "sequence"]
            ),
            models.Index(
                fields=["published", "transcription_status", "item", "sequence"]
            ),
            models.Index(fields=["published", "transcription_status"]),
            models.Index(fields=["item", "sequence"]),
            models.Index(fields=["campaign", "sequence"]),
        ]
        # Custom permission in addition to Django's default model permissions
        permissions = [
            ("reopen_asset", "Can reopen asset"),
        ]

    def __str__(self):
        """Return the asset title as its display string."""
        return self.title

    def save(self, *args, **kwargs):
        """
        Validate and save the asset, filling in ``campaign`` when it is unset.

        ``full_clean()`` runs on every save so that 'required' fields really
        are required even for objects created programmatically; in
        particular this keeps an asset from being stored with an empty
        ``storage_image``.
        """
        try:
            # Touch the relation purely to find out whether it is set.
            _ = self.campaign
        except ObjectDoesNotExist:
            self.campaign = self.item.project.campaign
        self.full_clean()
        super().save(*args, **kwargs)

    def get_absolute_url(self):
        """Return the URL of this asset's detail page."""
        parent_item = self.item
        parent_project = parent_item.project
        url_kwargs = {
            "campaign_slug": parent_project.campaign.slug,
            "project_slug": parent_project.slug,
            "item_id": parent_item.item_id,
            "slug": self.slug,
        }
        return reverse("transcriptions:asset-detail", kwargs=url_kwargs)

    @cached_property
    def logger(self):
        """Return ``structured_logger`` bound to this asset (cached per instance)."""
        return structured_logger.bind(asset=self)

    def latest_transcription(self):
        """Return the transcription with the highest pk, or None if there is none."""
        newest_first = self.transcription_set.order_by("-pk")
        return newest_first.first()

    @staticmethod
    def get_asset_image_path(item):
        return os.path.join(item.project.campaign.slug, item.project.slug, item.item_id)

    def get_asset_image_filename(self, extension="jpg"):
        """Return the image path for this asset: ``<item path>/<sequence>.<extension>``."""
        directory = self.get_asset_image_path(self.item)
        basename = f"{self.sequence}.{extension}"
        return os.path.join(directory, basename)

    def get_existing_storage_image_filename(self):
        """Return only the file-name part of the stored image's name."""
        stored_name = self.storage_image.name
        return os.path.basename(stored_name)

    def get_ocr_transcript(self, language=None):
        """
        Run OCR over this asset's stored image and return the text.

        Args:
            language: Optional language value passed to pytesseract as
                ``lang``. A value that is not listed in
                ``settings.PYTESSERACT_ALLOWED_LANGUAGES`` is logged as a
                warning and replaced with ``None``.

        Returns:
            The result of ``pytesseract.image_to_string`` for the image.
        """
        if language:
            permitted = settings.PYTESSERACT_ALLOWED_LANGUAGES
            if language not in permitted:
                logger.warning(
                    "OCR language '%s' not in "
                    "settings.PYTESSERACT_ALLOWED_LANGUAGES. "
                    "Allowed languages: %s",
                    language,
                    permitted,
                )
                structured_logger.warning(
                    "OCR language not allowed; falling back to default.",
                    event_code="ocr_language_not_allowed",
                    reason="The requested OCR language is not in the allowed list.",
                    reason_code="ocr_language_not_permitted",
                    language=language,
                    allowed_languages=permitted,
                )
                # Drop the rejected value so OCR runs without a language.
                language = None

        structured_logger.info(
            "Running OCR on asset image.",
            event_code="ocr_run_started",
            asset=self,
            language=language,
        )
        image = Image.open(self.storage_image)
        return pytesseract.image_to_string(image, lang=language)

    def get_contributor_count(self):
        """
        Count the distinct users who transcribed or reviewed this asset.

        A user who did both is counted once.
        """
        asset_transcriptions = Transcription.objects.filter(asset=self)
        reviewers = set(
            asset_transcriptions.exclude(reviewed_by__isnull=True)
            .values_list("reviewed_by", flat=True)
            .distinct()
        )
        transcribers = set(
            asset_transcriptions.values_list("user", flat=True).distinct()
        )
        return len(reviewers | transcribers)

    def turn_off_ocr(self):
        """Return a truthy value when OCR is disabled here or further up."""
        own_flag = self.disable_ocr
        return own_flag if own_flag else self.item.turn_off_ocr()

    def can_rollback(
        self,
    ) -> Tuple[bool, Union[str, "Transcription"], Optional["Transcription"]]:
        """
        Check whether the latest transcription on this asset can be rolled back.

        The check starts from the newest transcription and follows its
        ``source`` links back to the transcription it is ultimately based
        on. It then looks for the newest transcription older than that one
        which is neither a rollforward nor the source of a rollforward.

        Nothing is modified; this only reports whether a rollback target
        exists.

        Returns:
            A three-item tuple:

            - ``(False, reason_string, None)`` when the asset has no
              transcriptions.
            - ``(False, reason_string, None)`` when no eligible earlier
              transcription exists.
            - ``(True, target_transcription, latest_transcription)`` when a
              rollback is possible; ``latest_transcription`` is the actual
              newest transcription, not the resolved source.
        """
        newest = self.latest_transcription()
        if newest is None:
            self.logger.debug(
                "No transcriptions exist for this asset.",
                event_code="rollback_check_failed",
                reason_code="no_transcriptions",
                reason="This asset has no transcriptions, so rollback is not possible.",
            )
            return (
                False,
                "Can not rollback transcription on an asset with no transcriptions",
                None,
            )

        # A transcription with a source is itself the product of a rollback
        # or rollforward, so resolve it to the transcription at the start of
        # the source chain.
        effective_latest = newest
        while effective_latest.source:
            effective_latest = effective_latest.source

        if newest.source:
            self.logger.debug(
                "Using source transcription as effective latest transcription "
                "for rollback.",
                event_code="rollback_resolve_source",
                original_transcription_id=newest.id,
                resolved_transcription_id=effective_latest.id,
            )

        # Candidates are strictly older than the resolved transcription and
        # are neither rollforwards nor sources of rollforwards.
        candidates = (
            self.transcription_set.exclude(rolled_forward=True)
            .exclude(source_of__rolled_forward=True)
            .exclude(pk__gte=effective_latest.pk)
        )
        rollback_target = candidates.order_by("-pk").first()

        if rollback_target is not None:
            self.logger.debug(
                "Eligible rollback target found.",
                event_code="rollback_check_passed",
                reason_code="rollback_target_identified",
                reason="Found older transcription not marked as rollforward.",
                target_transcription_id=rollback_target.id,
                latest_transcription_id=newest.id,
            )
            return True, rollback_target, newest

        # Nothing eligible: every earlier transcription is a rollforward or
        # the source of one, or there is no earlier transcription at all.
        self.logger.debug(
            "No eligible transcription found for rollback.",
            event_code="rollback_check_failed",
            reason_code="no_eligible_transcription",
            reason=(
                "There are no earlier transcriptions that can be rolled back to. "
                "All earlier transcriptions are rollforwards or sources of "
                "rollforwards."
            ),
            latest_transcription_id=newest.id,
        )
        return (
            False,
            (
                "Can not rollback transcription on an asset "
                "with no non-rollforward older transcriptions"
            ),
            None,
        )

    def rollback_transcription(self, user: User) -> "Transcription":
        """
        Roll this asset back by creating a new rollback transcription.

        ``can_rollback`` chooses the transcription to restore. When it
        reports that no rollback is possible, a warning is logged and its
        reason is raised as a ``ValueError``.

        The new transcription:
            - copies the text of the transcription being restored,
            - has ``rolled_back=True``,
            - has ``source`` set to the transcription being restored,
            - has ``supersedes`` set to the current latest transcription.

        Args:
            user (User): The user performing the rollback.

        Returns:
            Transcription: The newly created rollback transcription.

        Raises:
            ValueError: If ``can_rollback`` reports that rollback is not
                possible.
        """
        check = self.can_rollback()
        allowed, detail = check[0], check[1]
        if allowed is not True:
            self.logger.warning(
                "Rollback attempt failed: no valid rollback target.",
                event_code="rollback_attempt_failed",
                reason_code="no_valid_target",
                reason=detail,
                user=user,
            )
            raise ValueError(detail)

        # On success the second item is the transcription to restore and the
        # third is the transcription currently at the head of the history.
        restore_from = detail
        superseded = check[2]

        self.logger.debug(
            "Preparing rollback transcription.",
            event_code="rollback_prepare",
            user=user,
            source_transcription_id=restore_from.id,
            superseded_transcription_id=superseded.id,
        )

        rollback = Transcription(
            asset=self,
            user=user,
            supersedes=superseded,
            text=restore_from.text,
            rolled_back=True,
            source=restore_from,
        )
        rollback.full_clean()
        rollback.save()

        self.logger.info(
            "Rollback successfully performed.",
            event_code="rollback_success",
            user=user,
            new_transcription_id=rollback.id,
            rolled_back_from_id=superseded.id,
            rolled_back_to_id=restore_from.id,
        )
        return rollback

    def can_rollforward(
        self,
    ) -> Tuple[bool, Union[str, "Transcription"], Optional["Transcription"]]:
        """
        Determine whether a previous rollback on this asset can be rolled forward.

        This checks whether the most recent transcription is a rollback transcription
        and whether the transcription it replaced (its ``supersedes``) can be
        restored.

        This method handles cases where multiple rollforwards were applied,
        walking backward through the transcription chain to find the appropriate
        rollback origin.

        A rollforward is only possible if:
        - The latest transcription is a rollback.
        - The rollback's superseded transcription still exists and can be
          restored.

        This method does not perform the rollforward, only checks feasibility.

        Returns:
            result (tuple): A (bool, value, latest) tuple describing rollforward
                possibility.

        Return Behavior:
            - If no transcriptions exist: returns (False, reason_string, None).
            - If rollforward is not possible: returns (False, reason_string, None).
            - If rollforward is possible: returns
              (True, transcription_to_rollforward, latest_transcription), where
              latest_transcription is the actual newest transcription on the
              asset.
        """
        # original_latest_transcription holds the actual latest transcription
        # latest_transcription starts by holding the actual latest transcription,
        # but if it is a rolled forward transcription, we use it to find the most
        # recent non-rolled-forward transcription and store that in
        # latest_transcription
        original_latest_transcription = latest_transcription = (
            self.latest_transcription()
        )

        if original_latest_transcription is None:
            self.logger.debug(
                "No transcriptions exist for this asset.",
                event_code="rollforward_check_failed",
                reason_code="no_transcriptions",
                reason=(
                    "This asset has no transcriptions, "
                    "so rollforward is not possible."
                ),
            )
            return (
                False,
                (
                    "Can not rollforward transcription on an asset "
                    "with no transcriptions"
                ),
                None,
            )

        # Rollforwards can be chained through multiple rollback/forward cycles,
        # so we may need to walk back the supersedes chain to find the original.
        if latest_transcription.rolled_forward:
            # We need to find the latest transcription that was not rolled forward
            rolled_forward_count = 0
            try:
                # If a rolled-forward transcription has no ``supersedes``,
                # latest_transcription becomes None and the next loop test
                # raises AttributeError, which is handled below.
                while latest_transcription.rolled_forward:
                    latest_transcription = latest_transcription.supersedes
                    rolled_forward_count += 1
                self.logger.debug(
                    "Walking back through rolled_forward transcriptions.",
                    event_code="rollforward_resolve_chain",
                    reason_code="resolve_rolled_forward_chain",
                    reason=(
                        f"Resolved {rolled_forward_count} rolled_forward "
                        "transcription(s) before identifying rollback target."
                    ),
                    rolled_forward_count=rolled_forward_count,
                )
            except AttributeError:
                self.logger.warning(
                    (
                        "Rollforward failed: unable to resolve chain of "
                        "rolled_forward transcriptions."
                    ),
                    event_code="rollforward_check_failed",
                    reason_code="unresolvable_rolled_forward_chain",
                    reason=(
                        "Could not walk back through rolled_forward transcriptions "
                        "to find a valid rollback base. Possibly malformed "
                        "transcription history (missing supersedes)."
                    ),
                )
                return (
                    False,
                    (
                        "Can not rollforward transcription on an asset with no "
                        "non-rollforward transcriptions"
                    ),
                    None,
                )
            # latest_transcription is now the most recent non-rolled-forward
            # transcription, but we need to go back further based on the number
            # of rolled-forward transcriptions we have seen to get to the actual
            # rollback transcription we need to rollforward from
            try:
                # One extra step back along ``supersedes`` per rollforward
                # counted above.
                while rolled_forward_count >= 1:
                    latest_transcription = latest_transcription.supersedes
                    if not latest_transcription:
                        # We do this here to handle the error rather than letting
                        # it be raised below when we try to process this
                        # non-existent transcription
                        raise AttributeError
                    rolled_forward_count -= 1
            except AttributeError:
                # This error is raised manually if latest_transcription ends up
                # being None at the end of the loop or automatically if it is None
                # when the loop continues
                # In either case, this should only happen if the transcription
                # history was manually edited.
                self.logger.warning(
                    (
                        "Corrupt transcription state: too "
                        "many rollforwards without originals."
                    ),
                    event_code="rollforward_check_failed",
                    reason_code="corrupt_state",
                    reason=(
                        "More rollforward transcriptions exist than "
                        "non-rollforward ones. This suggests a manually "
                        "corrupted transcription history."
                    ),
                    latest_transcription_id=original_latest_transcription.id,
                )
                return (
                    False,
                    (
                        "More rollforward transcription exist than non-roll-forward "
                        "transcriptions, which shouldn't be possible. Possibly "
                        "incorrectly modified transcriptions for this asset."
                    ),
                    None,
                )

        # If the latest_transcription we end up with is a rollback transcription,
        # we want to rollforward to the transcription it replaced. If not,
        # nothing can be rolled forward
        if latest_transcription.rolled_back:
            transcription_to_rollforward = latest_transcription.supersedes
        else:
            self.logger.debug(
                "Rollforward failed: latest transcription is not a rollback.",
                event_code="rollforward_check_failed",
                reason_code="not_a_rollback",
                reason=(
                    "Can not rollforward transcription on an asset if the latest "
                    "non-rollforward transcription is not a rollback transcription."
                ),
            )
            return (
                False,
                (
                    "Can not rollforward transcription on an asset if the latest "
                    "non-rollforward transcription is not a rollback transcription"
                ),
                None,
            )

        # If that replaced transcription does not exist, we cannot do anything
        # This should not be possible normally, but if a transcription history
        # is manually edited, you could end up in this state.
        if not transcription_to_rollforward:
            self.logger.debug(
                "Rollforward failed: rollback transcription has no superseded value.",
                event_code="rollforward_check_failed",
                reason_code="no_superseded_transcription",
                reason=(
                    "Can not rollforward transcription on an asset if the latest "
                    "rollback transcription did not supersede a previous "
                    "transcription."
                ),
            )
            return (
                False,
                (
                    "Can not rollforward transcription on an asset if the latest "
                    "rollback transcription did not supersede a previous "
                    "transcription"
                ),
                None,
            )

        self.logger.debug(
            "Eligible rollforward target found.",
            event_code="rollforward_check_passed",
            target_transcription_id=transcription_to_rollforward.id,
            latest_transcription_id=original_latest_transcription.id,
        )

        return True, transcription_to_rollforward, original_latest_transcription

    def rollforward_transcription(self, user: User) -> "Transcription":
        """
        Roll this asset forward by creating a new rollforward transcription.

        ``can_rollforward`` chooses the transcription to restore. When it
        reports that no rollforward is possible, a warning is logged and its
        reason is raised as a ``ValueError``.

        The new transcription:
            - copies the text of the transcription being restored,
            - has ``rolled_forward=True``,
            - has ``source`` set to the transcription being restored,
            - has ``supersedes`` set to the current latest transcription.

        Args:
            user (User): The user initiating the rollforward.

        Returns:
            Transcription: The newly created rollforward transcription.

        Raises:
            ValueError: If ``can_rollforward`` reports that rollforward is
                not possible, such as when no rollback exists or the history
                is malformed.
        """
        check = self.can_rollforward()
        allowed, detail = check[0], check[1]
        if allowed is not True:
            self.logger.warning(
                "Rollforward attempt failed: no valid rollforward target.",
                event_code="rollforward_attempt_failed",
                reason_code="no_valid_target",
                reason=detail,
                user=user,
            )
            raise ValueError(detail)

        # On success the second item is the transcription to restore and the
        # third is the transcription currently at the head of the history.
        restore_from = detail
        superseded = check[2]

        self.logger.debug(
            "Preparing rollforward transcription.",
            event_code="rollforward_prepare",
            user=user,
            source_transcription_id=restore_from.id,
            superseded_transcription_id=superseded.id,
        )

        rollforward = Transcription(
            asset=self,
            user=user,
            supersedes=superseded,
            text=restore_from.text,
            rolled_forward=True,
            source=restore_from,
        )
        rollforward.full_clean()
        rollforward.save()

        self.logger.info(
            "Rollforward successfully performed.",
            event_code="rollforward_success",
            user=user,
            new_transcription_id=rollforward.id,
            rolled_forward_from_id=superseded.id,
            rolled_forward_to_id=restore_from.id,
        )
        return rollforward


class Tag(MetricsModelMixin("tag"), models.Model):
    """A tag value that can be attached to assets through tag collections."""

    # Accepts 1-50 characters drawn from hyphen, space, underscore, the
    # À-ž character range, apostrophe and anything matched by ``\w``.
    TAG_VALIDATOR = RegexValidator(r"^[- _À-ž'\w]{1,50}$")
    value = models.CharField(max_length=50, validators=[TAG_VALIDATOR])

    def __str__(self):
        """Return the tag's value as its display string."""
        return self.value


class UserAssetTagCollection(
    MetricsModelMixin("user_asset_tag_collection"), models.Model
):
    """The set of tags a particular user has attached to a particular asset."""

    asset = models.ForeignKey(Asset, on_delete=models.CASCADE)

    user = models.ForeignKey(settings.AUTH_USER_MODEL, on_delete=models.CASCADE)

    tags = models.ManyToManyField(Tag, blank=True)
    created_on = models.DateTimeField(auto_now_add=True)
    updated_on = models.DateTimeField(auto_now=True)

    def __str__(self):
        """Return ``"<asset> - <user>"`` as the display string."""
        return f"{self.asset} - {self.user}"


class TranscriptionManager(models.Manager):
    """
    Manager with helpers for review activity and per-user incident reports.

    NOTE(review): several methods default ``start`` to the module-level
    ``ONE_DAY_AGO``. Default values are evaluated once, when the class is
    defined, so confirm that constant is not a timestamp computed at import
    time; if it is, callers should pass ``start`` explicitly.
    """

    def review_actions(self, start, end=None):
        """
        Return transcriptions accepted or rejected at or after ``start``.

        When ``end`` is given, the accept/reject timestamp must also be at or
        before ``end``.
        """
        accepted_in_window = Q(accepted__gte=start)
        rejected_in_window = Q(rejected__gte=start)
        if end is not None:
            accepted_in_window = accepted_in_window & Q(accepted__lte=end)
            rejected_in_window = rejected_in_window & Q(rejected__lte=end)
        return self.filter(accepted_in_window | rejected_in_window)

    def recent_review_actions(self, days=1):
        """Return review actions from the last ``days`` days."""
        cutoff = timezone.now() - datetime.timedelta(days=days)
        return self.review_actions(cutoff)

    def review_incidents(self, start=ONE_DAY_AGO):
        """
        Report non-staff, non-superuser reviewers with review incidents.

        Only transcriptions accepted at or after ``start`` are considered.
        The incident count comes from ``ConcordiaUser.review_incidents``.

        Returns:
            A list of ``(user id, username, incident count, accept count)``
            tuples, one per reviewer whose incident count is above zero. The
            accept count covers all of that reviewer's accepted
            transcriptions, not just the recent ones.
        """
        accepts = self.filter(
            accepted__gte=start,
            reviewed_by__is_superuser=False,
            reviewed_by__is_staff=False,
        )
        reviewer_ids = set(
            accepts.order_by("reviewed_by").values_list("reviewed_by", flat=True)
        )

        report = []
        for reviewer_id in reviewer_ids:
            reviewer = ConcordiaUser.objects.get(id=reviewer_id)
            incidents = reviewer.review_incidents(accepts)
            if incidents > 0:
                total_accepts = Transcription.objects.filter(
                    reviewed_by=reviewer, accepted__isnull=False
                ).count()
                report.append(
                    (reviewer.id, reviewer.username, incidents, total_accepts)
                )

        return report

    def recent_transcriptions(self, start=ONE_DAY_AGO):
        """
        Return transcriptions submitted at or after ``start`` by regular users.

        Transcriptions whose user is staff or a superuser are excluded.
        """
        regular_users_only = {"user__is_superuser": False, "user__is_staff": False}
        return self.get_queryset().filter(submitted__gte=start, **regular_users_only)

    def transcribe_incidents(self, start=ONE_DAY_AGO):
        """
        Report regular users with transcribe incidents since ``start``.

        The incident count comes from ``ConcordiaUser.transcribe_incidents``.

        Returns:
            A list of ``(user id, username, incident count, transcription
            count)`` tuples, one per user whose incident count is above zero.
            The transcription count covers all of that user's
            transcriptions.
        """
        recent = self.recent_transcriptions(start)
        transcriber_ids = (
            recent.order_by("user").distinct("user").values_list("user", flat=True)
        )

        report = []
        for transcriber_id in transcriber_ids:
            transcriber = ConcordiaUser.objects.get(id=transcriber_id)
            incidents = transcriber.transcribe_incidents(recent)
            if incidents > 0:
                total_transcriptions = Transcription.objects.filter(
                    user=transcriber
                ).count()
                report.append(
                    (
                        transcriber.id,
                        transcriber.username,
                        incidents,
                        total_transcriptions,
                    )
                )

        return report


class Transcription(MetricsModelMixin("transcription"), models.Model):
    """
    A single saved version of the transcription text for an asset.

    Each row records who wrote it, the optional submission and review
    timestamps, and links to the record it supersedes or was rolled
    back/forward from.
    """

    asset = models.ForeignKey(Asset, on_delete=models.CASCADE)

    # Author of this transcription version.
    user = models.ForeignKey(settings.AUTH_USER_MODEL, on_delete=models.CASCADE)

    created_on = models.DateTimeField(auto_now_add=True)
    updated_on = models.DateTimeField(auto_now=True)

    supersedes = models.ForeignKey(
        "self",
        blank=True,
        null=True,
        on_delete=models.CASCADE,
        help_text="A previous transcription record which is replaced by this one",
        related_name="superseded_by",
    )

    submitted = models.DateTimeField(
        blank=True,
        null=True,
        help_text="Timestamp when the creator submitted this for review",
    )

    # Review tracking: at most one of accepted/rejected may be set (see clean()).
    accepted = models.DateTimeField(blank=True, null=True)
    rejected = models.DateTimeField(blank=True, null=True)
    reviewed_by = models.ForeignKey(
        settings.AUTH_USER_MODEL,
        blank=True,
        null=True,
        on_delete=models.SET_NULL,
        related_name="transcription_reviewers",
    )

    text = models.TextField(blank=True)

    # OCR tracking
    ocr_generated = models.BooleanField(
        default=False,
        help_text="Flags transcription as generated directly by OCR",
    )
    ocr_originated = models.BooleanField(
        default=False,
        help_text="Flags transcription as originated from an OCR transcription",
    )

    # Rollback / rollforward tracking
    rolled_back = models.BooleanField(
        default=False,
        help_text="Flags transcription as being the result of a rollback (undo)",
    )
    rolled_forward = models.BooleanField(
        default=False,
        help_text="Flags transcription as being the result of a rollforward (redo)",
    )
    source = models.ForeignKey(
        "self",
        blank=True,
        null=True,
        on_delete=models.CASCADE,
        help_text="The transcription source for the roll back or roll forward",
        related_name="source_of",
    )

    objects = TranscriptionManager()

    class Meta:
        indexes = [
            models.Index(fields=["asset", "user"]),
        ]

    def __str__(self):
        return f"Transcription #{self.pk}"

    def campaign_slug(self):
        """Return the slug of the campaign that owns this transcription's asset."""
        project = self.asset.item.project
        return project.campaign.slug

    def clean(self):
        """
        Validate review state.

        Raises:
            ValidationError: If the transcription is accepted by its own
                author, or if it is marked both accepted and rejected.
        """
        reviewed_by_author = (
            self.user and self.reviewed_by and self.user == self.reviewed_by
        )
        if reviewed_by_author and self.accepted:
            raise ValidationError("Transcriptions cannot be self-accepted")

        both_outcomes_set = self.accepted and self.rejected
        if both_outcomes_set:
            raise ValidationError("Transcriptions cannot be both accepted and rejected")

        return super().clean()

    @property
    def status(self):
        """
        Human-readable status label derived from the review timestamps.

        Accepted wins; otherwise a submitted, non-rejected transcription is
        "submitted"; everything else is "in progress".
        """
        if self.accepted:
            status_key = TranscriptionStatus.COMPLETED
        elif self.submitted and not self.rejected:
            status_key = TranscriptionStatus.SUBMITTED
        else:
            status_key = TranscriptionStatus.IN_PROGRESS
        return TranscriptionStatus.CHOICE_MAP[status_key]


def update_userprofileactivity_table(user, campaign_id, field, increment=1):
    """
    Bump a per-campaign and a global activity counter for ``user``.

    The ``UserProfileActivity`` row for ``(user, campaign_id)`` is fetched or
    created, its ``field`` counter is adjusted by ``increment``, and its
    ``asset_count`` is recomputed as the number of distinct assets in the
    campaign that the user has transcribed or reviewed. The same ``field`` is
    then adjusted on the user's ``UserProfile``, which is created if the user
    does not have one yet.

    Args:
        user: The Django user whose activity should be updated.
        campaign_id: Primary key of the campaign to update activity for.
        field: Name of the integer field to increment (for example,
            ``"transcribe_count"`` or ``"review_count"``).
        increment: Amount to add to the chosen field. Defaults to ``1``.

    """
    structured_logger.info(
        "Updating user profile activity table.",
        event_code="userprofileactivity_update_start",
        user=user,
        campaign_id=campaign_id,
        activity_field=field,
        increment=increment,
    )

    # --- Per-campaign activity row ---
    activity, is_new_activity = UserProfileActivity.objects.get_or_create(
        user=user,
        campaign_id=campaign_id,
    )
    if is_new_activity:
        structured_logger.info(
            "Created new UserProfileActivity object",
            event_code="userprofileactivity_created",
            user=user,
            campaign_id=campaign_id,
        )
    # A fresh row starts at the increment itself; an existing row is updated
    # with an F() expression so the addition happens in the database.
    activity_value = increment if is_new_activity else F(field) + increment
    setattr(activity, field, activity_value)

    contributed = Q(transcription__user=user) | Q(transcription__reviewed_by=user)
    campaign_assets = Asset.objects.filter(contributed).filter(
        item__project__campaign=campaign_id
    )
    activity.asset_count = campaign_assets.distinct().count()
    activity.save()
    structured_logger.info(
        "Saved UserProfileActivity.",
        event_code="userprofileactivity_saved",
        user=user,
        campaign_id=campaign_id,
        updated_field=field,
    )

    # --- Global profile counters ---
    if not hasattr(user, "profile"):
        profile = UserProfile.objects.create(user=user)
        profile_value = increment
        structured_logger.info(
            "Created new UserProfile OBJECT",
            event_code="userprofile_created",
            user=user,
        )
    else:
        profile = user.profile
        profile_value = F(field) + increment

    setattr(profile, field, profile_value)
    profile.save()
    structured_logger.info(
        "Saved UserProfile",
        event_code="userprofile_saved",
        user=user,
        updated_field=field,
    )


def _update_useractivity_cache(user_id, campaign_id, attr_name):
    """
    Increment a user's cached activity counter for one campaign.

    Each campaign has a single cache entry holding a mapping of ``user_id``
    to ``(transcribe_count, review_count)``. This helper reads that mapping,
    adds one to the requested counter for ``user_id`` and writes the whole
    mapping back with no expiry.

    Args:
        user_id: ID of the user whose cached counters should be updated.
        campaign_id: ID of the related campaign.
        attr_name: ``"transcribe"`` bumps the transcribe counter; any other
            value bumps the review counter.
    """
    cache_key = f"userprofileactivity_{campaign_id}"
    per_user_counts = cache.get(cache_key, {})
    transcribes, reviews = per_user_counts.get(user_id, (0, 0))

    if attr_name != "transcribe":
        reviews += 1
    else:
        transcribes += 1

    per_user_counts[user_id] = (transcribes, reviews)
    cache.set(cache_key, per_user_counts, timeout=None)

    structured_logger.info(
        "Updated user activity cache",
        event_code="useractivity_cache_updated",
        user_id=user_id,
        campaign_id=campaign_id,
        updated_field=attr_name,
        new_transcribe_count=transcribes,
        new_review_count=reviews,
    )


class AssetTranscriptionReservation(models.Model):
    """
    A reservation held against an asset while it is being transcribed.

    ``reservation_token`` packs two values into one string: the first 44
    characters are the reservation identifier and everything after that is
    the user portion. ``get_token`` and ``get_user`` return each part.
    """

    asset = models.ForeignKey(Asset, on_delete=models.CASCADE)
    reservation_token = models.CharField(max_length=50)

    created_on = models.DateTimeField(editable=False, auto_now_add=True)
    updated_on = models.DateTimeField(auto_now=True)
    tombstoned = models.BooleanField(default=False, blank=True, null=True)

    def get_token(self):
        """Return the reservation identifier (first 44 characters)."""
        packed = self.reservation_token
        identifier_part = slice(None, 44)
        return packed[identifier_part]

    def get_user(self):
        """Return the user portion (everything after character 44)."""
        packed = self.reservation_token
        user_part = slice(44, None)
        return packed[user_part]


class SimplePage(models.Model):
    """
    Lightweight content page stored in the database and keyed by URL path.

    The path must start and end with a slash and contain at least one
    character in between; this is enforced by the field's regex validator.
    """

    created_on = models.DateTimeField(editable=False, auto_now_add=True)
    updated_on = models.DateTimeField(editable=False, auto_now=True)

    # Validated against ^/.+/$ so "/" alone is rejected.
    path = models.CharField(
        validators=[RegexValidator(r"^/.+/$")],
        help_text="URL path where this page will be accessible from",
        max_length=255,
    )

    title = models.CharField(max_length=200)

    body = models.TextField(
        blank=True,
        null=True,
    )

    def __str__(self):
        return f"SimplePage: {self.path}"


class Banner(models.Model):
    """
    Site-wide banner for alerts or announcements.

    Banners can link out to supporting pages and use a limited set of
    alert-style color classes. The stored ``alert_status`` value is lowercased
    to build CSS class names (for example ``"WARNING"`` becomes
    ``alert-warning`` / ``btn-warning``).
    """

    created_on = models.DateTimeField(editable=False, auto_now_add=True)
    updated_on = models.DateTimeField(editable=False, auto_now=True)

    slug = models.SlugField(max_length=80, unique=True, allow_unicode=True)
    text = models.CharField(max_length=255)
    link = models.CharField(max_length=255, blank=True, null=True)
    open_in_new_window_tab = models.BooleanField(default=True, blank=True)
    active = models.BooleanField(default=False, blank=True)

    # Stored values for ``alert_status``. ``WARN`` must equal the value used in
    # ALERT_STATUS_CHOICES ("WARNING"); otherwise assigning ``Banner.WARN``
    # would store a value that fails choice validation.
    DANGER = "DANGER"
    INFO = "INFO"
    SUCCESS = "SUCCESS"
    WARN = "WARNING"
    # Built from the constants above so the two can never drift apart. The
    # resulting values are unchanged, so no schema migration is implied.
    ALERT_STATUS_CHOICES = [
        (DANGER, "Red"),
        (INFO, "Blue"),
        (SUCCESS, "Green"),
        (WARN, "Grey"),
    ]
    alert_status = models.CharField(
        max_length=7,  # longest values ("SUCCESS", "WARNING") are 7 characters
        choices=ALERT_STATUS_CHOICES,
        default=SUCCESS,
        verbose_name="Color",
    )

    def __str__(self):
        return f"Banner: {self.slug}"

    def alert_class(self):
        """Return the alert CSS class, e.g. ``alert-success``."""
        return "alert-" + self.alert_status.lower()

    def btn_class(self):
        """Return the button CSS class, e.g. ``btn-success``."""
        return "btn-" + self.alert_status.lower()


class CarouselSlide(models.Model):
    """
    One slide of the homepage carousel.

    A slide carries a headline, optional body text and image, an overlay
    position, and a call-to-action URL. ``ordering`` controls position and
    ``published`` controls visibility.
    """

    objects = PublicationQuerySet.as_manager()

    created_on = models.DateTimeField(editable=False, auto_now_add=True)
    updated_on = models.DateTimeField(editable=False, auto_now=True)

    ordering = models.IntegerField(
        default=0,
        help_text="Sort order: lower values will be listed first",
    )
    published = models.BooleanField(default=False, blank=True)

    overlay_position = models.CharField(
        max_length=5,
        choices=OverlayPosition.CHOICES,
    )

    # Slide content
    headline = models.CharField(max_length=255, blank=False)
    body = models.TextField(blank=True)
    image_alt_text = models.TextField(blank=True)

    carousel_image = models.ImageField(
        upload_to="carousel-slides",
        blank=True,
        null=True,
    )

    # Call-to-action target
    lets_go_url = models.CharField(max_length=255)

    def __str__(self):
        return f"CarouselSlide: {self.headline}"


class SiteReportManager(models.Manager):
    """
    Manager with helpers that operate on one SiteReport "series" at a time.

    A series is the set of SiteReport rows belonging to the same logical
    reporting stream:

      - Site-wide TOTAL:          report_name=TOTAL, campaign=None, topic=None
      - Site-wide RETIRED_TOTAL:  report_name=RETIRED_TOTAL
      - Per-campaign:             campaign=<campaign>, topic=None
      - Per-topic:                topic=<topic>, campaign=None

    Centralizing the series selection here keeps tasks from re-implementing
    the same filters.
    """

    def _series_filter(
        self,
        *,
        report_name: Optional[str] = None,
        campaign: Optional["Campaign"] = None,
        topic: Optional["Topic"] = None,
    ) -> Q:
        """
        Translate series selectors into a Q object.

        Selectors are checked in priority order: campaign, then topic, then
        the site-wide report name.

        Args:
            report_name: One of the SiteReport.ReportName values for site-wide
                series (TOTAL, RETIRED_TOTAL). Ignored for per-campaign/topic.
            campaign: Campaign instance for per-campaign series.
            topic: Topic instance for per-topic series.

        Returns:
            Q: A Django Q object representing the series filter. If nothing
            matches, the Q selects no rows.
        """
        if campaign is not None:
            return Q(campaign=campaign, topic__isnull=True)

        if topic is not None:
            return Q(topic=topic, campaign__isnull=True)

        names = SiteReport.ReportName
        if report_name == names.TOTAL:
            return Q(
                report_name=names.TOTAL,
                campaign__isnull=True,
                topic__isnull=True,
            )
        if report_name == names.RETIRED_TOTAL:
            return Q(report_name=names.RETIRED_TOTAL)

        # Fallback: no rows (prevents accidental wide queries)
        return Q(pk__in=[])  # pragma: no cover

    def previous_in_series(
        self,
        *,
        report_name: Optional[str] = None,
        campaign: Optional["Campaign"] = None,
        topic: Optional["Topic"] = None,
        before: Optional[datetime.datetime] = None,
    ) -> Optional["SiteReport"]:
        """
        Return the newest SiteReport in the series created strictly before
        ``before``.

        Args:
            report_name: Series selector for site-wide reports (TOTAL/RETIRED_TOTAL).
            campaign: Series selector for per-campaign reports.
            topic: Series selector for per-topic reports.
            before: A timezone-aware datetime; defaults to now() if omitted.

        Returns:
            SiteReport or None: The most recent prior report in the series.
        """
        cutoff = timezone.now() if before is None else before
        series = self._series_filter(
            report_name=report_name, campaign=campaign, topic=topic
        )
        earlier = self.filter(series, created_on__lt=cutoff)
        return earlier.order_by("-created_on", "-pk").first()

    def series_filter_for_instance(self, instance: "SiteReport") -> Q:
        """
        Build the Q filter selecting the same logical series as ``instance``
        (site-wide TOTAL, RETIRED_TOTAL, per-campaign, or per-topic).

        The instance's campaign takes priority over its topic, which takes
        priority over its report name.
        """
        if instance.campaign_id is not None:
            return self._series_filter(campaign=instance.campaign)
        if instance.topic_id is not None:
            return self._series_filter(topic=instance.topic)
        return self._series_filter(report_name=instance.report_name)

    def previous_for_instance(self, instance: "SiteReport") -> "SiteReport | None":
        """
        Return the closest earlier SiteReport in ``instance``'s series, or
        None when there is none.
        """
        series = self.series_filter_for_instance(instance)
        earlier = self.filter(series, created_on__lt=instance.created_on)
        return earlier.order_by("-created_on", "-pk").first()

    def next_for_instance(self, instance: "SiteReport") -> "SiteReport | None":
        """
        Return the closest later SiteReport in ``instance``'s series, or None
        when there is none.
        """
        series = self.series_filter_for_instance(instance)
        later = self.filter(series, created_on__gt=instance.created_on)
        return later.order_by("created_on", "pk").first()

    def last_on_or_before_date_for_series(
        self,
        *,
        report_name: Optional[str] = None,
        campaign: Optional["Campaign"] = None,
        topic: Optional["Topic"] = None,
        on_or_before_date: datetime.date,
    ) -> Optional["SiteReport"]:
        """
        Return the newest SiteReport in the series whose creation date is on
        or before ``on_or_before_date``.
        """
        series = self._series_filter(
            report_name=report_name, campaign=campaign, topic=topic
        )
        candidates = self.filter(series, created_on__date__lte=on_or_before_date)
        return candidates.order_by("-created_on", "-pk").first()

    def first_on_or_after_date_for_series(
        self,
        *,
        report_name: Optional[str] = None,
        campaign: Optional["Campaign"] = None,
        topic: Optional["Topic"] = None,
        on_or_after_date: datetime.date,
        on_or_before_date: Optional[datetime.date] = None,
    ) -> Optional["SiteReport"]:
        """
        Return the oldest SiteReport in the series whose creation date is on
        or after ``on_or_after_date`` and, when given, on or before
        ``on_or_before_date``.
        """
        series = self._series_filter(
            report_name=report_name, campaign=campaign, topic=topic
        )
        date_bounds = {"created_on__date__gte": on_or_after_date}
        if on_or_before_date is not None:
            date_bounds["created_on__date__lte"] = on_or_before_date
        candidates = self.filter(series, **date_bounds)
        return candidates.order_by("created_on", "pk").first()

    def sum_assets_started_for_series_between_dates(
        self,
        *,
        report_name: str,
        start_date: datetime.date,
        end_date: datetime.date,
    ) -> int:
        """
        Total ``assets_started`` over a site-wide series (TOTAL or
        RETIRED_TOTAL) for creation dates from ``start_date`` through
        ``end_date``, both inclusive.

        Only rows with no campaign and no topic are included. A missing
        aggregate (no rows, or only NULL values) is reported as 0.
        """
        in_range = self.filter(
            report_name=report_name,
            campaign__isnull=True,
            topic__isnull=True,
            created_on__date__gte=start_date,
            created_on__date__lte=end_date,
        )
        summed = in_range.aggregate(total=Sum("assets_started"))["total"]
        return int(summed or 0)


class SiteReport(models.Model):
    """
    Snapshot of site, campaign or topic counters taken at ``created_on``.

    A row is either site-wide (identified by ``report_name``), per-campaign,
    or per-topic. All counters are nullable integers.
    """

    class ReportName(models.TextChoices):
        TOTAL = "Active and completed campaigns", "Active and completed campaigns"
        RETIRED_TOTAL = "Retired campaigns", "Retired campaigns"

    created_on = models.DateTimeField(auto_now_add=True)
    report_name = models.CharField(
        max_length=80, blank=True, default="", choices=ReportName.choices
    )
    campaign = models.ForeignKey(
        Campaign, on_delete=models.SET_NULL, blank=True, null=True
    )
    topic = models.ForeignKey(Topic, on_delete=models.SET_NULL, blank=True, null=True)

    # Asset counters
    assets_total = models.IntegerField(blank=True, null=True)
    assets_published = models.IntegerField(blank=True, null=True)
    assets_not_started = models.IntegerField(blank=True, null=True)
    assets_in_progress = models.IntegerField(blank=True, null=True)
    assets_waiting_review = models.IntegerField(blank=True, null=True)
    assets_completed = models.IntegerField(blank=True, null=True)
    assets_unpublished = models.IntegerField(blank=True, null=True)
    assets_started = models.IntegerField(blank=True, null=True)
    # Item and project counters
    items_published = models.IntegerField(blank=True, null=True)
    items_unpublished = models.IntegerField(blank=True, null=True)
    projects_published = models.IntegerField(blank=True, null=True)
    projects_unpublished = models.IntegerField(blank=True, null=True)
    # Transcription, review and tag counters
    anonymous_transcriptions = models.IntegerField(blank=True, null=True)
    transcriptions_saved = models.IntegerField(blank=True, null=True)
    daily_review_actions = models.IntegerField(blank=True, null=True)
    distinct_tags = models.IntegerField(blank=True, null=True)
    tag_uses = models.IntegerField(blank=True, null=True)
    # Campaign and user counters
    campaigns_published = models.IntegerField(blank=True, null=True)
    campaigns_unpublished = models.IntegerField(blank=True, null=True)
    users_registered = models.IntegerField(blank=True, null=True)
    users_activated = models.IntegerField(blank=True, null=True)
    registered_contributors = models.IntegerField(blank=True, null=True)
    daily_active_users = models.IntegerField(blank=True, null=True)

    objects = SiteReportManager()

    class Meta:
        ordering = ("-created_on",)
        get_latest_by = "created_on"

    # We have several places where these are exported as CSV/Excel. By default
    # the ORM will be told to retrieve these fields & lookups:
    DEFAULT_EXPORT_FIELDNAMES = [
        "created_on",
        "report_name",
        "campaign__title",
        "topic__title",
        "assets_total",
        "assets_published",
        "assets_not_started",
        "assets_in_progress",
        "assets_waiting_review",
        "assets_completed",
        "assets_unpublished",
        "assets_started",
        "items_published",
        "items_unpublished",
        "projects_published",
        "projects_unpublished",
        "anonymous_transcriptions",
        "transcriptions_saved",
        "daily_review_actions",
        "distinct_tags",
        "tag_uses",
        "campaigns_published",
        "campaigns_unpublished",
        "users_registered",
        "users_activated",
        "registered_contributors",
        "daily_active_users",
    ]

    @staticmethod
    def calculate_assets_started(
        *,
        previous_assets_total: Optional[int],
        previous_assets_not_started: Optional[int],
        current_assets_total: Optional[int],
        current_assets_not_started: Optional[int],
    ) -> int:
        """
        Compute how many assets became "started" between two snapshots.

        For each snapshot, ``started = max(0, assets_total -
        assets_not_started)``. The result is
        ``max(0, started_current - started_previous)``.

        Because only the total and not-started counts are used, the published
        or unpublished split of the assets does not enter the calculation.

        ``None`` inputs count as zero. Both the per-snapshot values and the
        final difference are floored at zero, so the result is never negative
        (for example when started assets were deleted between snapshots).
        """

        def _count(value: Optional[int]) -> int:
            # None (and any other falsy value) is treated as zero.
            return int(value or 0)

        started_before = max(
            0, _count(previous_assets_total) - _count(previous_assets_not_started)
        )
        started_now = max(
            0, _count(current_assets_total) - _count(current_assets_not_started)
        )
        return max(0, started_now - started_before)

    def previous_in_series(self) -> "SiteReport | None":
        """
        Return the report immediately preceding this one in its series, if any.
        """
        manager = SiteReport.objects
        return manager.previous_for_instance(self)

    def next_in_series(self) -> "SiteReport | None":
        """
        Return the report immediately following this one in its series, if any.
        """
        manager = SiteReport.objects
        return manager.next_for_instance(self)

    def to_debug_dict(self) -> dict:
        """
        Build a dictionary describing this report for copy/paste debugging.

        The result holds ``id``, ``created_on`` and ``report_name``, an
        optional ``campaign`` / ``topic`` sub-dict when the corresponding
        foreign key is set, and a ``counters`` dict with every numeric field.

        Related sub-dicts always include ``id`` and add ``title``, ``slug``
        (and ``status`` for campaigns) only when the attribute exists and is
        not None.
        """

        def _summarize(related, related_id, attr_names):
            # Copy the listed attributes that are present and not None.
            summary = {"id": related_id}
            for attr_name in attr_names:
                found = getattr(related, attr_name, None)
                if found is not None:
                    summary[attr_name] = found
            return summary

        payload: dict = {
            "id": self.id,
            "created_on": self.created_on,
            "report_name": self.report_name,
        }

        if self.campaign_id:
            payload["campaign"] = _summarize(
                self.campaign, self.campaign_id, ("title", "slug", "status")
            )

        if self.topic_id:
            payload["topic"] = _summarize(
                self.topic, self.topic_id, ("title", "slug")
            )

        # Numeric counters (explicit list to keep ordering predictable)
        counter_names = (
            "assets_total",
            "assets_published",
            "assets_not_started",
            "assets_in_progress",
            "assets_waiting_review",
            "assets_completed",
            "assets_unpublished",
            "assets_started",
            "items_published",
            "items_unpublished",
            "projects_published",
            "projects_unpublished",
            "anonymous_transcriptions",
            "transcriptions_saved",
            "daily_review_actions",
            "distinct_tags",
            "tag_uses",
            "campaigns_published",
            "campaigns_unpublished",
            "users_registered",
            "users_activated",
            "registered_contributors",
            "daily_active_users",
        )
        payload["counters"] = {name: getattr(self, name) for name in counter_names}
        return payload

    def to_debug_json(self) -> str:
        """
        Serialize ``to_debug_dict()`` as indented JSON with sorted keys, using
        DjangoJSONEncoder so datetimes are encoded.
        """
        debug_payload = self.to_debug_dict()
        return json.dumps(
            debug_payload, cls=DjangoJSONEncoder, indent=2, sort_keys=True
        )


class KeyMetricsReport(models.Model):
    """
    Site-wide Key Metrics report persisted for three period types:

    - MONTHLY: per calendar month (with special handling for the very first
      month)
    - QUARTERLY: fiscal quarter rollup (Q1=Oct-Dec, Q2=Jan-Mar, Q3=Apr-Jun,
      Q4=Jul-Sep)
    - FISCAL_YEAR: fiscal year rollup (Oct 1 - Sep 30)

    Monthly numbers are computed from SiteReport as follows:

    - For cumulative counters (for example, assets_published, assets_completed,
      transcriptions_saved, users_activated, anonymous_transcriptions,
      tag_uses): the monthly value is the non-negative difference between the
      combined site-wide TOTAL + RETIRED_TOTAL values at the end of the month
      and the baseline snapshot. Baseline is the latest snapshot strictly
      before the first day of the month; if none exists, baseline is the first
      snapshot within the month (yielding the delta within that month).
    - For assets_started: the monthly value is the sum of the daily
      ``assets_started`` field across the month for the TOTAL and
      RETIRED_TOTAL site-wide series.

    Quarterly and fiscal-year numbers are rollups from the monthly rows:

    - For count metrics: sum of the months in the period.
    - For avg_visit_seconds: arithmetic mean of the months that have a value.
      If no month has a value, the rollup does not touch the stored value, so
      it stays NULL unless it was entered manually on the rollup row.

    Manual fields are stored here too so CMs can edit them in the admin and
    have them included when exporting CSVs. If unset they remain NULL and are
    rendered as empty strings in exports. A manual field on a rollup row is
    only overwritten when at least one of the rolled-up monthly rows has a
    non-NULL value for it; otherwise the value already stored on the "higher"
    (quarterly or fiscal-year) row is kept. This allows manual values to be
    set only in quarterly and/or yearly reports instead of every month.
    """

    class PeriodType(models.TextChoices):
        # Stored value, human-readable label.
        MONTHLY = "MONTHLY", "Monthly"
        QUARTERLY = "QUARTERLY", "Quarterly"
        FISCAL_YEAR = "FISCAL_YEAR", "Fiscal year"

    # Bookkeeping timestamps maintained automatically by Django.
    created_on = models.DateTimeField(auto_now_add=True)
    updated_on = models.DateTimeField(auto_now=True)

    # The period this row covers; both bounds are calendar dates.
    period_type = models.CharField(max_length=20, choices=PeriodType.choices)
    period_start = models.DateField()  # inclusive
    period_end = models.DateField()  # inclusive

    # Fiscal year label: October-December belong to the fiscal year named
    # after the following calendar year (see get_fiscal_year_for_date).
    fiscal_year = models.IntegerField()
    fiscal_quarter = models.IntegerField(blank=True, null=True)  # 1..4 for quarters
    # Calendar month number; the rollup upserts reset it to NULL.
    month = models.IntegerField(blank=True, null=True)  # 1..12 for monthly

    # Derived from SiteReport metrics
    assets_published = models.IntegerField(blank=True, null=True)
    assets_started = models.IntegerField(blank=True, null=True)
    assets_completed = models.IntegerField(blank=True, null=True)
    users_activated = models.IntegerField(blank=True, null=True)
    anonymous_transcriptions = models.IntegerField(blank=True, null=True)
    transcriptions_saved = models.IntegerField(blank=True, null=True)
    tag_uses = models.IntegerField(blank=True, null=True)

    # Manual metrics (entered by hand; never computed from SiteReport)
    crowd_emails_and_libanswers_sent = models.IntegerField(blank=True, null=True)
    crowd_visits = models.IntegerField(blank=True, null=True)
    crowd_page_views = models.IntegerField(blank=True, null=True)
    crowd_unique_visitors = models.IntegerField(blank=True, null=True)
    # The only non-integer metric: an average, so rollups take a mean of it
    # rather than a sum.
    avg_visit_seconds = models.DecimalField(
        max_digits=8, decimal_places=2, blank=True, null=True
    )
    transcriptions_added_to_loc_gov = models.IntegerField(blank=True, null=True)
    datasets_added_to_loc_gov = models.IntegerField(blank=True, null=True)

    class Meta:
        # Indexes mirror the lookups used by the upsert and CSV helpers:
        # by exact period, by fiscal year, by quarter and by month.
        indexes = [
            models.Index(fields=["period_type", "period_start", "period_end"]),
            models.Index(fields=["period_type", "fiscal_year"]),
            models.Index(fields=["period_type", "fiscal_year", "fiscal_quarter"]),
            models.Index(fields=["period_type", "fiscal_year", "month"]),
        ]
        # At most one row per (type, start, end); the upsert helpers rely on
        # this triple as the get_or_create lookup key.
        unique_together = (("period_type", "period_start", "period_end"),)
        ordering = ("period_start", "period_end", "period_type")

    # (field name, CSV row label) pairs, in the order rows are exported.
    CSV_METRIC_COLUMNS: tuple[tuple[str, str], ...] = (
        # Derived metrics (from SiteReport)
        ("assets_published", "Assets published"),
        ("assets_started", "Assets started"),
        ("assets_completed", "Assets completed"),
        ("users_activated", "User accounts activated"),
        ("anonymous_transcriptions", "Anonymous transcriptions"),
        ("transcriptions_saved", "Transcriptions saved"),
        ("tag_uses", "Tag uses"),
        # Manual metrics
        ("crowd_emails_and_libanswers_sent", "Crowd emails & LibAnswers sent"),
        ("crowd_visits", "Crowd.loc.gov visits"),
        ("crowd_page_views", "Crowd.loc.gov page views"),
        ("crowd_unique_visitors", "Crowd.loc.gov unique visitors"),
        ("avg_visit_seconds", "Avg. crowd.loc.gov visit (in seconds)"),
        ("transcriptions_added_to_loc_gov", "Transcriptions added to loc.gov"),
        ("datasets_added_to_loc_gov", "Datasets added to loc.gov"),
    )

    # Manually entered fields: NULL is exported as an empty string.
    MANUAL_FIELDS: tuple[str, ...] = (
        "crowd_emails_and_libanswers_sent",
        "crowd_visits",
        "crowd_page_views",
        "crowd_unique_visitors",
        "avg_visit_seconds",
        "transcriptions_added_to_loc_gov",
        "datasets_added_to_loc_gov",
    )

    # Fields computed from SiteReport: NULL is exported as 0.
    CALCULATED_FIELDS: tuple[str, ...] = (
        "assets_published",
        "assets_started",
        "assets_completed",
        "users_activated",
        "anonymous_transcriptions",
        "transcriptions_saved",
        "tag_uses",
    )

    def __str__(self) -> str:
        """
        Return a human-friendly name for the report.

        Formats:
        - Fiscal year: ``"FY2024 Report"``
        - Quarter: ``"FY2023 Q2 Report"``
        - Monthly: ``"FY2022M06 Report (June 2022)"``
        """
        if self.period_type == self.PeriodType.FISCAL_YEAR:
            return f"FY{self.fiscal_year} Report"

        if self.period_type == self.PeriodType.QUARTERLY and self.fiscal_quarter:
            return f"FY{self.fiscal_year} Q{self.fiscal_quarter} Report"

        if self.period_type == self.PeriodType.MONTHLY and self.month:
            # Calendar year for this month within the fiscal year
            calendar_year = (
                self.fiscal_year - 1 if self.month >= 10 else self.fiscal_year
            )
            month_name = calendar.month_name[self.month]
            return (
                f"FY{self.fiscal_year}M{self.month:02d} Report "
                f"({month_name} {calendar_year})"
            )

        # Fallback if fields are incomplete
        return (
            "KeyMetricsReport "
            f"{self.period_type} {self.period_start}-{self.period_end}"
        )

    @staticmethod
    def get_fiscal_year_for_date(d: datetime.date) -> int:
        """Return the fiscal year for a date (Oct 1-Sep 30)."""
        return d.year + 1 if d.month >= 10 else d.year

    @staticmethod
    def get_fiscal_quarter_for_date(d: datetime.date) -> int:
        """Return the fiscal quarter for a date (Q1=Oct-Dec, ..., Q4=Jul-Sep)."""
        if 10 <= d.month <= 12:
            return 1
        if 1 <= d.month <= 3:
            return 2
        if 4 <= d.month <= 6:
            return 3
        return 4

    @staticmethod
    def month_bounds(d: datetime.date) -> tuple[datetime.date, datetime.date]:
        """Return (first_day, last_day) for the month containing d, in local time."""
        first = d.replace(day=1)
        if first.month == 12:
            next_month_first = first.replace(year=first.year + 1, month=1, day=1)
        else:
            next_month_first = first.replace(month=first.month + 1, day=1)
        last = next_month_first - datetime.timedelta(days=1)
        return first, last

    @classmethod
    def _monthly_from_sitereports(
        cls, *, month_start: datetime.date, month_end: datetime.date
    ) -> dict[str, int | Decimal | None]:
        """
        Derive one month of site-wide metrics from SiteReport snapshots.

        The month spans [month_start, month_end]. Two site-wide series are
        combined throughout: TOTAL and RETIRED_TOTAL.

        Snapshot-delta metrics are ``max(0, closing - opening)`` where

        - closing is the sum over both series of the latest snapshot on or
          before month_end, and
        - opening is the sum over both series of the baseline snapshot: the
          latest one strictly before month_start, or, when a series has no
          such snapshot but does have a closing one, its first snapshot
          inside the month.

        ``assets_started`` is instead the sum of the daily ``assets_started``
        values across the month for both series.

        Returns an empty dict when neither series has a snapshot on or before
        month_end; otherwise a dict of integer metrics keyed by field name.
        """
        series_names = (
            SiteReport.ReportName.TOTAL,
            SiteReport.ReportName.RETIRED_TOTAL,
        )

        # End-of-month snapshot for each series (TOTAL first, then RETIRED_TOTAL).
        closing = [
            SiteReport.objects.last_on_or_before_date_for_series(
                report_name=series,
                on_or_before_date=month_end,
            )
            for series in series_names
        ]

        # With no snapshot at all by month_end there is nothing to report.
        if all(snapshot is None for snapshot in closing):
            return {}

        # Midnight at the start of the month in the current time zone; the
        # baseline must be strictly earlier than this instant.
        month_start_dt = datetime.datetime.combine(
            month_start, datetime.time.min, tzinfo=timezone.get_current_timezone()
        )

        opening = []
        for series, closing_snapshot in zip(series_names, closing):
            baseline = SiteReport.objects.previous_in_series(
                report_name=series,
                before=month_start_dt,
            )
            if baseline is None and closing_snapshot is not None:
                # No history before this month: measure from the first
                # snapshot inside the month instead.
                baseline = SiteReport.objects.first_on_or_after_date_for_series(
                    report_name=series,
                    on_or_after_date=month_start,
                    on_or_before_date=month_end,
                )
            opening.append(baseline)

        def combined(snapshots: list, field: str) -> int:
            """Sum a field over the snapshots; missing/empty counts as zero."""
            return sum(
                int(getattr(snapshot, field, 0) or 0)
                for snapshot in snapshots
                if snapshot is not None
            )

        def growth(field: str) -> int:
            """Non-negative increase of a cumulative counter over the month."""
            return max(0, combined(closing, field) - combined(opening, field))

        delta_fields = (
            "assets_published",
            "assets_completed",
            "users_activated",
            "anonymous_transcriptions",
            "transcriptions_saved",
            "tag_uses",
        )
        deltas = {field: growth(field) for field in delta_fields}

        # assets_started is a daily figure, so it is summed over the month
        # rather than differenced between two snapshots.
        total_started, retired_started = (
            SiteReport.objects.sum_assets_started_for_series_between_dates(
                report_name=series,
                start_date=month_start,
                end_date=month_end,
            )
            for series in series_names
        )
        assets_started = int(total_started + retired_started)

        return {
            "assets_published": deltas["assets_published"],
            "assets_started": assets_started,
            "assets_completed": deltas["assets_completed"],
            "users_activated": deltas["users_activated"],
            "anonymous_transcriptions": deltas["anonymous_transcriptions"],
            "transcriptions_saved": deltas["transcriptions_saved"],
            "tag_uses": deltas["tag_uses"],
        }

    @classmethod
    def upsert_month(cls, *, year: int, month: int) -> Optional["KeyMetricsReport"]:
        """
        Create or refresh the MONTHLY report for calendar ``(year, month)``.

        Derived metrics are recomputed from SiteReport and overwritten on the
        row; manual fields are left exactly as stored. The fiscal year,
        fiscal quarter and month columns are always rewritten.

        Returns the saved row, or None when the month has no usable
        end-of-month snapshot in either series.
        """
        first_day = datetime.date(year, month, 1)
        last_day = cls.month_bounds(first_day)[1]

        derived = cls._monthly_from_sitereports(
            month_start=first_day, month_end=last_day
        )
        if not derived:
            # Nothing computable for this month.
            return None

        period_fields = {
            "fiscal_year": cls.get_fiscal_year_for_date(last_day),
            "fiscal_quarter": cls.get_fiscal_quarter_for_date(last_day),
            "month": month,
        }
        report, _created = cls.objects.get_or_create(
            period_type=cls.PeriodType.MONTHLY,
            period_start=first_day,
            period_end=last_day,
            defaults=dict(period_fields),
        )

        # Derived values first, then the period columns, so an existing row
        # is brought fully up to date; manual fields are never touched here.
        for name, value in {**derived, **period_fields}.items():
            setattr(report, name, value)
        report.save()
        return report

    @classmethod
    def upsert_quarter(
        cls, *, fiscal_year: int, fiscal_quarter: int
    ) -> Optional["KeyMetricsReport"]:
        """
        Create or refresh the QUARTERLY report from the stored monthly rows.

        Every MONTHLY row found for the quarter is included, so a partial
        quarter (for example, at the very beginning of history) still
        produces a report. Returns None when the quarter has no monthly rows.

        Derived fields are always overwritten with the monthly sum (0 when
        the sum is NULL). Manual count fields and ``avg_visit_seconds`` are
        only overwritten when the monthly rows yield a non-NULL sum or mean,
        so values entered directly on the quarterly row survive.

        Raises:
            ValueError: if ``fiscal_quarter`` is not 1, 2, 3 or 4.
        """
        if fiscal_quarter not in (1, 2, 3, 4):
            raise ValueError("fiscal_quarter must be 1..4")

        # Q1 (Oct-Dec) lies in the calendar year before the fiscal year
        # label; Q2-Q4 lie in the labelled year.
        opening_month = {1: 10, 2: 1, 3: 4, 4: 7}[fiscal_quarter]
        calendar_year = fiscal_year - 1 if fiscal_quarter == 1 else fiscal_year
        quarter_months = [opening_month + offset for offset in range(3)]

        months = cls.objects.filter(
            period_type=cls.PeriodType.MONTHLY,
            fiscal_year=fiscal_year,
            month__in=quarter_months,
        )
        if not months.exists():
            return None

        # avg_visit_seconds is averaged, not summed, so it is handled apart
        # from the other manual fields.
        summed_manual = tuple(
            name for name in cls.MANUAL_FIELDS if name != "avg_visit_seconds"
        )
        totals = months.aggregate(
            **{name: Sum(name) for name in (*cls.CALCULATED_FIELDS, *summed_manual)}
        )
        mean_visit_seconds = months.exclude(avg_visit_seconds__isnull=True).aggregate(
            avg=Avg("avg_visit_seconds")
        )["avg"]

        # The stored period always spans the full quarter, even when only
        # some of its months have rows.
        period_start = datetime.date(calendar_year, quarter_months[0], 1)
        period_end = cls.month_bounds(
            datetime.date(calendar_year, quarter_months[-1], 1)
        )[1]

        report, _created = cls.objects.get_or_create(
            period_type=cls.PeriodType.QUARTERLY,
            period_start=period_start,
            period_end=period_end,
            defaults={
                "fiscal_year": fiscal_year,
                "fiscal_quarter": fiscal_quarter,
            },
        )

        for name in cls.CALCULATED_FIELDS:
            setattr(report, name, int(totals[name] or 0))

        for name in summed_manual:
            rolled_up = totals[name]
            if rolled_up is not None:
                setattr(report, name, int(rolled_up))

        if mean_visit_seconds is not None:
            report.avg_visit_seconds = mean_visit_seconds

        report.fiscal_year = fiscal_year
        report.fiscal_quarter = fiscal_quarter
        report.month = None
        report.save()
        return report

    @classmethod
    def upsert_fiscal_year(cls, *, fiscal_year: int) -> Optional["KeyMetricsReport"]:
        """
        Create or refresh the FISCAL_YEAR report from the stored monthly rows.

        Returns None when the fiscal year has no MONTHLY rows.

        Derived fields are always overwritten with the monthly sum (0 when
        the sum is NULL). Manual count fields and ``avg_visit_seconds`` are
        only overwritten when the monthly rows yield a non-NULL sum or mean,
        so values entered directly on the fiscal-year row survive.
        """
        months = cls.objects.filter(
            period_type=cls.PeriodType.MONTHLY, fiscal_year=fiscal_year
        )
        if not months.exists():
            return None

        # avg_visit_seconds is averaged, not summed, so it is handled apart
        # from the other manual fields.
        summed_manual = tuple(
            name for name in cls.MANUAL_FIELDS if name != "avg_visit_seconds"
        )
        totals = months.aggregate(
            **{name: Sum(name) for name in (*cls.CALCULATED_FIELDS, *summed_manual)}
        )
        mean_visit_seconds = months.exclude(avg_visit_seconds__isnull=True).aggregate(
            avg=Avg("avg_visit_seconds")
        )["avg"]

        # A fiscal year runs from Oct 1 of the previous calendar year
        # through Sep 30 of the labelled year.
        report, _created = cls.objects.get_or_create(
            period_type=cls.PeriodType.FISCAL_YEAR,
            period_start=datetime.date(fiscal_year - 1, 10, 1),
            period_end=datetime.date(fiscal_year, 9, 30),
            defaults={"fiscal_year": fiscal_year},
        )

        for name in cls.CALCULATED_FIELDS:
            setattr(report, name, int(totals[name] or 0))

        for name in summed_manual:
            rolled_up = totals[name]
            if rolled_up is not None:
                setattr(report, name, int(rolled_up))

        if mean_visit_seconds is not None:
            report.avg_visit_seconds = mean_visit_seconds

        report.fiscal_year = fiscal_year
        report.fiscal_quarter = None
        report.month = None
        report.save()
        return report

    def csv_filename(self) -> str:
        """
        Build a descriptive filename for this report CSV.
        """
        if self.period_type == self.PeriodType.MONTHLY:
            return (
                f"key_metrics_monthly_fy{self.fiscal_year}_"
                f"m{self.month:02d}_{self.period_start}_{self.period_end}.csv"
            )
        if self.period_type == self.PeriodType.QUARTERLY:
            return (
                f"key_metrics_quarterly_fy{self.fiscal_year}_"
                f"q{self.fiscal_quarter}_{self.period_start}_{self.period_end}.csv"
            )
        # FISCAL_YEAR
        return (
            f"key_metrics_fiscal_year_fy{self.fiscal_year}_"
            f"{self.period_start}_{self.period_end}.csv"
        )

    def _format_value_for_csv(self, field_name: str, value) -> str | int | float:
        """
        Convert model values to CSV-friendly outputs.

        Rules:
        - Calculated numeric fields: default to 0 if NULL.
        - Manual fields: default to empty string if NULL.
        - avg_visit_seconds (Decimal) renders as a string with up to 2 decimals;
          empty string if NULL.
        """
        if field_name in self.MANUAL_FIELDS:
            if value is None:
                return ""
            if field_name == "avg_visit_seconds":
                if isinstance(value, Decimal):
                    quantized = value.quantize(Decimal("0.01"))
                    return f"{quantized}"
                return f"{value}"
            return int(value)
        if field_name in self.CALCULATED_FIELDS:
            return int(value or 0)
        # Should not be reached (we only export metrics), but be safe.
        return "" if value is None else value

    def _calendar_year_for_month_in_fy(self, month: int, fiscal_year: int) -> int:
        """
        Return the calendar year for a month number interpreted in FY context.
        """
        return fiscal_year - 1 if 10 <= month <= 12 else fiscal_year

    def _fy_abbrev(self, fiscal_year: int) -> str:
        """
        Return an "FY##" abbreviation for a fiscal year number.

        Example:
            2024 -> "FY24".
        """
        return f"FY{fiscal_year % 100:02d}"

    def _month_label(self, fiscal_year: int, month: int) -> str:
        """
        Return the month name label (for example, "June").
        """
        return calendar.month_name[month]

    def _format_cell(self, field_name: str, value):
        """
        Format a single cell for CSV using the existing per-field rules.
        """
        return self._format_value_for_csv(field_name, value)

    def _csv_matrix_monthly(self) -> tuple[list[str], list[list[str | int | float]]]:
        """
        Build the CSV header and rows for a MONTHLY report.

        MONTHLY CSV:
        - Headers: ``["Metric", "<Month>"]`` (month name only)
        - Rows: one per metric.
        """
        headers = ["Metric", self._month_label(self.fiscal_year, int(self.month))]

        rows: list[list[str | int | float]] = []
        for field_name, label in self.CSV_METRIC_COLUMNS:
            value = getattr(self, field_name)
            rows.append([label, self._format_cell(field_name, value)])
        return headers, rows

    def _quarter_month_specs(self) -> list[tuple[int, int]]:
        """
        Return [(year, month), ...] for months in this object's quarter.

        Months are interpreted in the fiscal-year (FY) context.
        """
        fy = int(self.fiscal_year)
        fq = int(self.fiscal_quarter)
        if fq == 1:
            return [(fy - 1, 10), (fy - 1, 11), (fy - 1, 12)]
        if fq == 2:
            return [(fy, 1), (fy, 2), (fy, 3)]
        if fq == 3:
            return [(fy, 4), (fy, 5), (fy, 6)]
        return [(fy, 7), (fy, 8), (fy, 9)]

    def _csv_matrix_quarterly(self) -> tuple[list[str], list[list[str | int | float]]]:
        """
        Build the CSV header and rows for a QUARTERLY report.

        QUARTERLY CSV:

        Headers:
            ["Metric", "<M1>", "<M2>", "<M3>", "FY## Q# totals",
             "FY## Lifetime totals"]

        - Month columns include only months that have MONTHLY rows.
        - Month labels are month names only ("June", "September", ...).

        Quarter totals are computed from the MONTHLY rows shown in the month
        columns.

        Lifetime for a quarter:
            all prior fiscal-year reports + quarters in the current FY with
            quarter < current quarter.
            NOTE(review): the current quarter itself is not part of the
            lifetime figure - confirm this is intended.

        How the two total columns are aggregated:
        - Calculated fields: sum, with NULL counted as 0.
        - Manual count fields: sum of the non-NULL inputs; blank if all
          inputs are blank.
        - avg_visit_seconds: unweighted arithmetic mean of the non-NULL
          inputs, formatted like the month cells; blank if all inputs are
          blank. It is an average, so adding the inputs together (and
          truncating each to an int) would not produce a meaningful value.
        """
        metric_fields = [name for name, _label in self.CSV_METRIC_COLUMNS]

        def total_cell(field_name: str, values: list) -> str | int:
            """Collapse the per-period values of one metric into one cell."""
            if field_name in self.CALCULATED_FIELDS:
                return sum(int(value or 0) for value in values)
            present = [value for value in values if value is not None]
            if not present:
                return ""
            if field_name == "avg_visit_seconds":
                return self._format_cell(field_name, sum(present) / len(present))
            return sum(int(value) for value in present)

        # Which months exist for this quarter?
        months_in_quarter = [m for (_y, m) in self._quarter_month_specs()]
        monthly_rows = (
            KeyMetricsReport.objects.filter(
                period_type=self.PeriodType.MONTHLY,
                fiscal_year=self.fiscal_year,
                month__in=months_in_quarter,
            )
            .only("fiscal_year", "month", *metric_fields)
            .order_by("month")
        )
        month_map: dict[int, KeyMetricsReport] = {r.month: r for r in monthly_rows}
        # Keep fiscal order (for example Oct, Nov, Dec) rather than the
        # numeric order used by the query.
        present_months = [m for m in months_in_quarter if m in month_map]
        month_headers = [self._month_label(self.fiscal_year, m) for m in present_months]

        fy_abbrev = self._fy_abbrev(self.fiscal_year)
        headers = [
            "Metric",
            *month_headers,
            f"{fy_abbrev} Q{int(self.fiscal_quarter)} totals",
            f"{fy_abbrev} Lifetime totals",
        ]

        # Lifetime inputs: prior FY rows, then prior quarters in this FY.
        # Both querysets are evaluated once, up front.
        prior_fy_rows = KeyMetricsReport.objects.filter(
            period_type=self.PeriodType.FISCAL_YEAR,
            fiscal_year__lt=self.fiscal_year,
        ).only(*metric_fields)
        prior_quarter_rows = KeyMetricsReport.objects.filter(
            period_type=self.PeriodType.QUARTERLY,
            fiscal_year=self.fiscal_year,
            fiscal_quarter__lt=self.fiscal_quarter,
        ).only(*metric_fields)
        lifetime_rows = [*prior_fy_rows, *prior_quarter_rows]

        rows: list[list[str | int | float]] = []
        for field_name, label in self.CSV_METRIC_COLUMNS:
            month_values = [
                getattr(month_map[m], field_name, None) for m in present_months
            ]
            month_cells = [self._format_cell(field_name, v) for v in month_values]
            lifetime_values = [getattr(r, field_name, None) for r in lifetime_rows]

            rows.append(
                [
                    label,
                    *month_cells,
                    total_cell(field_name, month_values),
                    total_cell(field_name, lifetime_values),
                ]
            )

        return headers, rows

    def _csv_matrix_fiscal_year(
        self,
    ) -> tuple[list[str], list[list[str | int | float]]]:
        """
        Build the CSV header and rows for a FISCAL_YEAR report.

        Headers:

        - "Metric"
        - "FY## Q1 totals" (if Q1 present)
        - "Q2 totals" (if present)
        - "Q3 totals" (if present)
        - "Q4 totals" (if present)
        - "FY## totals"
        - "FY## Lifetime totals"

        The FY totals column is computed from the QUARTERLY rows shown in
        the quarter columns.

        Lifetime for a fiscal year:
            all FISCAL_YEAR rows up to and including this FY.

        How the two total columns are aggregated:
        - Calculated fields: sum, with NULL counted as 0.
        - Manual count fields: sum of the non-NULL inputs; blank if all
          inputs are blank.
        - avg_visit_seconds: unweighted arithmetic mean of the non-NULL
          inputs, formatted like the quarter cells; blank if all inputs are
          blank. It is an average, so adding the inputs together (and
          truncating each to an int) would not produce a meaningful value.
        """
        metric_fields = [name for name, _label in self.CSV_METRIC_COLUMNS]

        def total_cell(field_name: str, values: list) -> str | int:
            """Collapse the per-period values of one metric into one cell."""
            if field_name in self.CALCULATED_FIELDS:
                return sum(int(value or 0) for value in values)
            present = [value for value in values if value is not None]
            if not present:
                return ""
            if field_name == "avg_visit_seconds":
                return self._format_cell(field_name, sum(present) / len(present))
            return sum(int(value) for value in present)

        # Quarter rows present in this FY
        quarter_rows = (
            KeyMetricsReport.objects.filter(
                period_type=self.PeriodType.QUARTERLY,
                fiscal_year=self.fiscal_year,
            )
            .only("fiscal_quarter", *metric_fields)
            .order_by("fiscal_quarter")
        )
        quarter_map: dict[int, KeyMetricsReport] = {
            r.fiscal_quarter: r for r in quarter_rows
        }
        # Already in header order: Q1 (if any) first, then Q2..Q4.
        present_quarters = [q for q in (1, 2, 3, 4) if q in quarter_map]

        # Only the Q1 column carries the "FY##" prefix.
        fiscal_year_abbrev = self._fy_abbrev(self.fiscal_year)
        headers = ["Metric"]
        for quarter_number in present_quarters:
            prefix = f"{fiscal_year_abbrev} " if quarter_number == 1 else ""
            headers.append(f"{prefix}Q{quarter_number} totals")
        headers.extend(
            [f"{fiscal_year_abbrev} totals", f"{fiscal_year_abbrev} Lifetime totals"]
        )

        # Lifetime basis: all FY rows <= this FY, evaluated once up front.
        lifetime_fy_rows = list(
            KeyMetricsReport.objects.filter(
                period_type=self.PeriodType.FISCAL_YEAR,
                fiscal_year__lte=self.fiscal_year,
            ).only(*metric_fields)
        )

        rows: list[list[str | int | float]] = []
        for field_name, label in self.CSV_METRIC_COLUMNS:
            quarter_values = [
                getattr(quarter_map[q], field_name, None) for q in present_quarters
            ]
            quarter_cells = [self._format_cell(field_name, v) for v in quarter_values]
            lifetime_values = [getattr(r, field_name, None) for r in lifetime_fy_rows]

            rows.append(
                [
                    label,
                    *quarter_cells,
                    total_cell(field_name, quarter_values),
                    total_cell(field_name, lifetime_values),
                ]
            )

        return headers, rows

    def render_csv(self) -> bytes:
        """
        Render this report as a CSV pivot.

        Rows:
            Metrics in CSV_METRIC_COLUMNS order.

        Columns:
            - MONTHLY:     Metric | <Month>
            - QUARTERLY:   Metric | months present | FY## Q# totals |
                            FY## Lifetime totals
            - FISCAL_YEAR: Metric | ("FY## Q1 totals" if present) | Q2 totals |
                            Q3 totals | Q4 totals | FY## totals |
                            FY## Lifetime totals
        """
        if self.period_type == self.PeriodType.MONTHLY:
            headers, rows = self._csv_matrix_monthly()
        elif self.period_type == self.PeriodType.QUARTERLY:
            headers, rows = self._csv_matrix_quarterly()
        else:
            headers, rows = self._csv_matrix_fiscal_year()

        buffer = io.StringIO(newline="")
        writer = csv.writer(buffer)
        writer.writerow(headers)
        writer.writerows(rows)
        return buffer.getvalue().encode("utf-8")


class UserProfileActivity(models.Model):
    """
    Campaign-scoped activity counters for one user.

    Each row pairs a user with a campaign (the pair is unique) and holds the
    counters declared below, such as how many assets the user has touched and
    how many transcriptions or reviews they have performed.
    """

    user = models.ForeignKey(User, on_delete=models.CASCADE, verbose_name="User Id")
    campaign = models.ForeignKey(
        Campaign, on_delete=models.CASCADE, verbose_name="Campaign Id"
    )
    asset_count = models.IntegerField(default=0)
    asset_tag_count = models.IntegerField(default=0)
    transcribe_count = models.IntegerField(
        default=0, verbose_name="transcription save/submit count"
    )
    review_count = models.IntegerField(
        default=0, verbose_name="transcription review count"
    )

    class Meta:
        constraints = [
            models.UniqueConstraint(
                fields=["user", "campaign"], name="user_campaign_count"
            )
        ]
        verbose_name_plural = "User profile activities"

    def __str__(self):
        return f"{self.user} - {self.campaign}"

    def get_status(self):
        """
        Return a display label for the related campaign's status.

        ``campaign.status`` is used as an index into a fixed label table:
        0 maps to ``None``, 1 to "Active", 2 to "Completed" and 3 to
        "Retired".
        """
        status_labels = (None, "Active", "Completed", "Retired")
        return status_labels[self.campaign.status]

    def total_actions(self):
        """
        Return transcriptions plus reviews, treating unset counts as 0.
        """
        return (self.transcribe_count or 0) + (self.review_count or 0)


class CampaignRetirementProgress(models.Model):
    """
    Track progress while retiring a campaign and deleting related content.

    This model stores counts of projects, items, and assets processed for a
    retiring campaign, along with a log of removal operations.
    """

    # At most one progress row per campaign; deleted together with the campaign.
    campaign = models.OneToOneField(Campaign, on_delete=models.CASCADE)
    # Counter pairs, all starting at 0. Presumably *_total is the number of
    # objects to remove and *_removed the number already removed — confirm
    # against the code that updates these rows.
    project_total = models.IntegerField(default=0)
    projects_removed = models.IntegerField(default=0)
    item_total = models.IntegerField(default=0)
    items_removed = models.IntegerField(default=0)
    asset_total = models.IntegerField(default=0)
    assets_removed = models.IntegerField(default=0)
    complete = models.BooleanField(default=False)
    # Set automatically when the row is first created.
    started_on = models.DateTimeField(auto_now_add=True)
    # Stays NULL until a value is assigned explicitly.
    completed_on = models.DateTimeField(null=True)
    # JSON value that defaults to a fresh empty list for each new row.
    removal_log = models.JSONField(default=list)

    def __str__(self):
        return f"Removal progress for {self.campaign}"

    class Meta:
        verbose_name_plural = "campaign retirement progress"


class TutorialCard(models.Model):
    """
    Through model for ordering cards within a CardFamily tutorial.

    Each row links one Card to one CardFamily (``tutorial``) and carries an
    integer ``order`` value that defaults to 0.
    """

    # Both links cascade: deleting the card or the family deletes this row.
    card = models.ForeignKey(Card, on_delete=models.CASCADE)
    tutorial = models.ForeignKey(CardFamily, on_delete=models.CASCADE)
    order = models.IntegerField(default=0)

    class Meta:
        verbose_name_plural = "cards"


class Guide(models.Model):
    """
    Guide entry grouping SimplePage or link-based content.

    Guides back the sidebar and inline help sections that surface how-to
    documentation for contributors.
    """

    title = models.CharField(max_length=80)
    # Optional link to a SimplePage; set to NULL if that page is deleted.
    page = models.ForeignKey(
        SimplePage, on_delete=models.SET_NULL, blank=True, null=True
    )
    body = models.TextField(blank=True)
    order = models.IntegerField(default=1)
    # Optional link label and target; both may be blank or NULL.
    link_text = models.CharField(max_length=80, blank=True, null=True)
    link_url = models.CharField(max_length=255, blank=True, null=True)

    def __str__(self):
        return self.title


def validated_get_or_create(klass, **kwargs):
    """
    Fetch an object matching the lookup, or build, validate and save a new one.

    Mirrors ``QuerySet.get_or_create()``, except that a missing object is
    created by instantiating ``klass()`` with no arguments, assigning every
    lookup value and then every ``defaults`` value as a plain attribute, and
    calling ``full_clean()`` before ``save()``.

    That makes it suitable for models whose validation is not fully enforced
    at the database level, and for integrations such as
    django-model-translation where fields must be set through normal
    attribute access.

    Args:
        klass: The model class to query or create.
        **kwargs: Lookup fields, plus an optional ``defaults`` dict, as in
            ``get_or_create()``. When a name appears in both, the value from
            ``defaults`` is assigned last.

    Returns:
        tuple[Model, bool]: ``(obj, created)``, like ``get_or_create()``.
    """
    extra_values = kwargs.pop("defaults", {})

    try:
        existing = klass.objects.get(**kwargs)
    except klass.DoesNotExist:
        instance = klass()

        # Lookup values first, then defaults, so defaults win on a name clash.
        for attr_name, attr_value in kwargs.items():
            setattr(instance, attr_name, attr_value)
        for attr_name, attr_value in extra_values.items():
            setattr(instance, attr_name, attr_value)

        instance.full_clean()
        instance.save()
        return instance, True
    else:
        return existing, False


class NextAsset(models.Model):
    """
    Abstract base class for "next asset" queues.

    These lightweight records cache the next transcribable or reviewable
    assets selected for a campaign or topic, so they can be fetched quickly
    without recomputing complex queries.

    This base does not declare an ``asset`` field itself; the concrete queue
    models in this module add it.
    """

    # Random UUID primary key generated in Python rather than a serial id.
    id = models.UUIDField(  # noqa: A003
        primary_key=True, default=uuid.uuid4, editable=False
    )
    item = models.ForeignKey(Item, on_delete=models.CASCADE)
    # Presumably copies of values from the related item and project, kept on
    # the row to avoid joins — confirm against the code that fills the queue.
    item_item_id = models.CharField(max_length=100)
    project = models.ForeignKey(Project, on_delete=models.CASCADE)
    project_slug = models.SlugField(max_length=80, allow_unicode=True)
    sequence = models.PositiveIntegerField(default=1)
    # Set automatically on creation; the concrete queues order by this field.
    created_on = models.DateTimeField(editable=False, auto_now_add=True)

    class Meta:
        abstract = True

    def __str__(self):
        # Relies on the ``asset`` relation supplied by the concrete subclass.
        return self.asset.title


class NextTranscribableAsset(NextAsset):
    """
    Abstract base for cached transcribable asset queues.

    Adds an indexed, non-editable ``transcription_status`` column that
    defaults to ``TranscriptionStatus.NOT_STARTED``.
    """

    transcription_status = models.CharField(
        editable=False,
        max_length=20,
        default=TranscriptionStatus.NOT_STARTED,
        choices=TranscriptionStatus.CHOICES,
        db_index=True,
    )

    class Meta:
        abstract = True


class NextReviewableAsset(NextAsset):
    """
    Abstract base for cached reviewable asset queues.

    Stores the IDs of prior transcribers to help avoid assigning reviewers
    to assets they have already worked on.
    """

    # Array of integers; each new row starts with its own empty list.
    transcriber_ids = ArrayField(
        base_field=models.IntegerField(),
        blank=True,
        default=list,
    )

    class Meta:
        abstract = True


class NextCampaignAssetManager(models.Manager):
    """
    Shared manager logic for campaign-scoped "next asset" queues.

    A subclass sets ``target_count`` to the number of queue entries that
    should be prepopulated per campaign.
    """

    target_count = None  # Override in subclass

    def needed_for_campaign(self, campaign_id, target_count=None):
        """
        Compute how many more queue entries a campaign needs.

        Args:
            campaign_id: The campaign primary key.
            target_count: Optional per-call queue size. When omitted, the
                manager's own ``target_count`` is used.

        Returns:
            int: The shortfall between the target and the number of rows
            currently queued for the campaign; never negative.

        Raises:
            NotImplementedError: If no target is passed and the manager has
                not defined ``target_count``.
        """
        wanted = self.target_count if target_count is None else target_count
        if wanted is None:
            raise NotImplementedError(
                "You must define `target_count` in the subclass "
                "or pass `target_count` explicitly."
            )

        queued = self.filter(campaign_id=campaign_id).count()
        shortfall = wanted - queued
        return shortfall if shortfall > 0 else 0


class NextTopicAssetManager(models.Manager):
    """
    Shared manager logic for topic-scoped "next asset" queues.

    A subclass sets ``target_count`` to the number of queue entries that
    should be prepopulated per topic.
    """

    target_count = None  # Override in subclass

    def needed_for_topic(self, topic_id, target_count=None):
        """
        Compute how many more queue entries a topic needs.

        Args:
            topic_id: The topic primary key.
            target_count: Optional per-call queue size. When omitted, the
                manager's own ``target_count`` is used.

        Returns:
            int: The shortfall between the target and the number of rows
            currently queued for the topic; never negative.

        Raises:
            NotImplementedError: If no target is passed and the manager has
                not defined ``target_count``.
        """
        wanted = self.target_count if target_count is None else target_count
        if wanted is None:
            raise NotImplementedError(
                "You must define `target_count` in the subclass "
                "or pass `target_count` explicitly."
            )

        queued = self.filter(topic_id=topic_id).count()
        shortfall = wanted - queued
        return shortfall if shortfall > 0 else 0


class NextTranscribableCampaignAssetManager(NextCampaignAssetManager):
    """
    Campaign queue manager used by ``NextTranscribableCampaignAsset``.

    ``target_count`` is read once, when this class is defined, from
    ``settings.NEXT_TRANSCRIBABLE_ASSET_COUNT`` and falls back to 100.
    """

    target_count = getattr(settings, "NEXT_TRANSCRIBABLE_ASSET_COUNT", 100)


class NextTranscribableTopicAssetManager(NextTopicAssetManager):
    """
    Topic queue manager used by ``NextTranscribableTopicAsset``.

    ``target_count`` is read once, when this class is defined, from
    ``settings.NEXT_TRANSCRIBABLE_ASSET_COUNT`` and falls back to 100.
    """

    target_count = getattr(settings, "NEXT_TRANSCRIBABLE_ASSET_COUNT", 100)


class NextReviewableCampaignAssetManager(NextCampaignAssetManager):
    """
    Campaign queue manager used by ``NextReviewableCampaignAsset``.

    ``target_count`` is read once, when this class is defined, from
    ``settings.NEXT_REVIEWABLE_ASSET_COUNT`` and falls back to 100.
    """

    target_count = getattr(settings, "NEXT_REVIEWABLE_ASSET_COUNT", 100)


class NextReviewableTopicAssetManager(NextTopicAssetManager):
    """
    Topic queue manager used by ``NextReviewableTopicAsset``.

    ``target_count`` is read once, when this class is defined, from
    ``settings.NEXT_REVIEWABLE_ASSET_COUNT`` and falls back to 100.
    """

    target_count = getattr(settings, "NEXT_REVIEWABLE_ASSET_COUNT", 100)


class NextTranscribableCampaignAsset(NextTranscribableAsset):
    """
    Cached transcribable asset entry for a campaign-wide queue.

    Rows are ordered by ``created_on``, which is also the field used by
    ``latest()`` / ``earliest()``.
    """

    # One-to-one: an asset can have at most one row in this queue.
    asset = models.OneToOneField(Asset, on_delete=models.CASCADE)
    campaign = models.ForeignKey(Campaign, on_delete=models.CASCADE)

    objects = NextTranscribableCampaignAssetManager()

    class Meta:
        ordering = ("created_on",)
        get_latest_by = "created_on"


class NextTranscribableTopicAsset(NextTranscribableAsset):
    """
    Cached transcribable asset entry for a topic-scoped queue.

    Rows are ordered by ``created_on``, which is also the field used by
    ``latest()`` / ``earliest()``.
    """

    # Plain foreign key: the same asset may be queued under several topics,
    # but only once per topic (see unique_together below).
    asset = models.ForeignKey(Asset, on_delete=models.CASCADE)
    topic = models.ForeignKey(Topic, on_delete=models.CASCADE)

    objects = NextTranscribableTopicAssetManager()

    class Meta:
        ordering = ("created_on",)
        get_latest_by = "created_on"
        unique_together = ("asset", "topic")


class NextReviewableCampaignAsset(NextReviewableAsset):
    """
    Cached reviewable asset entry for a campaign-wide queue.

    Rows are ordered by ``created_on``, which is also the field used by
    ``latest()`` / ``earliest()``.
    """

    # One-to-one: an asset can have at most one row in this queue.
    asset = models.OneToOneField(Asset, on_delete=models.CASCADE)
    campaign = models.ForeignKey(Campaign, on_delete=models.CASCADE)

    objects = NextReviewableCampaignAssetManager()

    class Meta:
        ordering = ("created_on",)
        get_latest_by = "created_on"
        # GIN index on the inherited transcriber_ids array column.
        indexes = [
            GinIndex(fields=["transcriber_ids"]),
        ]


class NextReviewableTopicAsset(NextReviewableAsset):
    """
    Cached reviewable asset entry for a topic-scoped queue.

    Rows are ordered by ``created_on``, which is also the field used by
    ``latest()`` / ``earliest()``.
    """

    # Plain foreign key: the same asset may be queued under several topics,
    # but only once per topic (see unique_together below).
    asset = models.ForeignKey(Asset, on_delete=models.CASCADE)
    topic = models.ForeignKey(Topic, on_delete=models.CASCADE)

    objects = NextReviewableTopicAssetManager()

    class Meta:
        ordering = ("created_on",)
        get_latest_by = "created_on"
        unique_together = ("asset", "topic")
        # GIN index on the inherited transcriber_ids array column.
        indexes = [
            GinIndex(fields=["transcriber_ids"]),
        ]


class ProjectTopic(models.Model):
    """
    Link table connecting projects and topics with optional status filtering.

    url_filter can be used to restrict which asset transcription status is
    shown when browsing the project through a given topic.

    Each (project, topic) pair may appear only once, and rows are ordered by
    the ``ordering`` column by default.
    """

    # Referenced by name (strings) rather than by class object.
    project = models.ForeignKey("Project", on_delete=models.CASCADE)
    topic = models.ForeignKey("Topic", on_delete=models.CASCADE)

    # Optional; when set it must be one of TranscriptionStatus.CHOICES.
    url_filter = models.CharField(
        max_length=20,
        choices=TranscriptionStatus.CHOICES,
        blank=True,
        null=True,
        help_text="Optional filter on the status for this project-topic link",
    )
    ordering = models.IntegerField(
        default=0, help_text="Sort order override: lower values will be listed first"
    )

    class Meta:
        db_table = (
            "concordia_project_topics"  # pre-existing table, so we reuse the name
        )
        unique_together = ("project", "topic")
        ordering = ("ordering",)
        # Composite indexes, each led by the topic column.
        indexes = [
            models.Index(fields=["topic", "project"]),
            models.Index(fields=["topic", "ordering"]),
            models.Index(fields=["topic", "url_filter"]),
        ]


================================================
FILE: concordia/parser.py
================================================
import html
from html.parser import HTMLParser

import defusedxml.ElementTree as ET
import requests
from django.core.cache import cache

from concordia.logging import ConcordiaLogger

# Module-level logger used by the fetch helpers below to report failed requests.
structured_logger = ConcordiaLogger.get_logger(__name__)


class OGImageParser(HTMLParser):
    """
    HTML parser that records a page's Open Graph image URL.

    After ``feed()`` has processed a document, ``og_image`` holds the
    ``content`` value of the last ``<meta property="og:image" ...>`` tag that
    was seen, or ``None`` when the document contains no such tag.
    """

    def __init__(self):
        super().__init__()
        self.og_image = None

    def handle_starttag(self, tag, attrs):
        """
        Capture the ``content`` attribute of ``og:image`` meta tags.

        Args:
            tag: Name of the start tag being processed.
            attrs: List of ``(name, value)`` attribute pairs for the tag.
        """
        if tag.lower() != "meta":
            return

        # No debug output here: this runs for every <meta> tag of every page
        # fed to the parser.
        attr_dict = dict(attrs)
        if attr_dict.get("property") == "og:image" and "content" in attr_dict:
            self.og_image = attr_dict["content"]


def extract_og_image(url):
    """
    Download a page and return its Open Graph image URL.

    The response body is HTML-unescaped, run through ``OGImageParser`` and the
    parsed value (which may be ``None``) is stored in the cache under
    ``og_image:<url>`` for 24 hours. The response status code is not checked.

    Args:
        url: Address of the page to fetch.

    Returns:
        The ``og:image`` content value, or ``None`` when the page has no such
        tag or the request raises ``requests.RequestException`` (in which case
        a warning is logged and nothing is cached).
    """
    cache_key = f"og_image:{url}"
    one_day_in_seconds = 24 * 60 * 60

    try:
        page = requests.get(url, timeout=5)
        og_parser = OGImageParser()
        og_parser.feed(html.unescape(page.text))
        image_url = og_parser.og_image
        cache.set(cache_key, image_url, timeout=one_day_in_seconds)
    except requests.RequestException:
        # NOTE(review): the message contains "%s" but no value is supplied for
        # it here — confirm whether the URL was meant to be included.
        structured_logger.warning(
            "Failed to fetch image for blog post: %s",
            event_code="post_image_fetch_failed",
            reason=(
                "Failed to fetch Open Graph image from the "
                "given URL due to a network or HTTP error"
            ),
            reason_code="ogi_req_fail_fetch",
        )
        return None
    else:
        return image_url


def get_og_image(url):
    """
    Return the Open Graph image URL for a page, preferring the cache.

    The cache is consulted under ``og_image:<url>``. A cached ``None`` is
    indistinguishable from a miss, so in both cases the page is fetched again
    through ``extract_og_image()``.

    Args:
        url: Address of the page whose ``og:image`` value is wanted.

    Returns:
        The cached value when one is present, otherwise whatever
        ``extract_og_image(url)`` returns.
    """
    cached_image = cache.get(f"og_image:{url}")
    if cached_image is None:
        return extract_og_image(url)
    return cached_image


def fetch_blog_posts():
    """
    Fetch The Signal's RSS feed and return its ``<item>`` elements.

    Every failure mode is logged as a warning and reported to the caller as
    an empty list, so a broken or unreachable feed never raises from here.

    Returns:
        list: The ``<item>`` elements found under the feed's ``<channel>``
        element, or ``[]`` when the request fails, the response cannot be
        parsed as XML, or the document has no ``<channel>`` element.
    """
    try:
        response = requests.get(
            "https://blogs.loc.gov/thesignal/category/by-the-people-transcription-program/feed/",
            timeout=60,
        )
        response.raise_for_status()
        root = ET.fromstring(response.content)
    except requests.exceptions.HTTPError:
        structured_logger.warning(
            "HTTP error when fetching blog posts, but handled: %s",
            event_code="handled_post_fetch_http_error",
            reason="The RSS feed returned an HTTP error response (e.g. 4xx or 5xx)",
            reason_code="blog_http_error",
        )
        return []
    except requests.exceptions.ConnectionError:
        structured_logger.warning(
            "Connection error when fetching blog posts: %s",
            event_code="blog_post_fetch_connection_error",
            reason="Network connection failed while trying to reach the RSS feed.",
            reason_code="blog_conn_error",
        )
        return []
    except requests.exceptions.Timeout:
        structured_logger.warning(
            "Timeout when fetching blog posts: %s",
            event_code="blog_post_fetch_timeout",
            reason="The request to fetch RSS feed exceeded the timeout threshold.",
            reason_code="blog_timeout",
        )
        return []
    except requests.exceptions.RequestException:
        structured_logger.warning(
            "Request exception when fetching blog posts: %s",
            event_code="blog_post_fetch_request_exception",
            reason="General request failure when fetching or parsing RSS feed content.",
            reason_code="blog_req_error",
        )
        return []
    except (ET.ParseError, ValueError):
        # ParseError covers malformed XML. ValueError is the base class of the
        # exceptions defusedxml raises when it rejects a document (for example
        # one that declares entities). Listed after the requests handlers so
        # request errors keep their more specific log entries.
        structured_logger.warning(
            "Invalid XML when parsing blog posts",
            event_code="blog_post_parse_error",
            reason="The RSS feed response could not be parsed as XML.",
            reason_code="blog_parse_error",
        )
        return []

    channel = root.find("channel")
    if channel is None:
        # Well-formed XML that is not an RSS document: nothing to list.
        return []
    return channel.findall("item")


def paginate_blog_posts():
    """
    Build up to two pages of three blog post summaries each.

    The first six items returned by ``fetch_blog_posts()`` are turned into
    dicts with a ``title`` key, a ``link`` key when the item has a ``<link>``
    element, and an ``og_image`` key when ``get_og_image()`` finds an image
    for that link.

    Returns:
        list[list[dict]]: Always contains a first page (possibly empty); a
        second page is added only when there are more than three summaries.
    """
    summaries = []
    for post in fetch_blog_posts()[:6]:
        summary = {"title": post.find("title").text}
        link_element = post.find("link")
        if link_element is not None:
            link_url = link_element.text
            summary["link"] = link_url
            image_url = get_og_image(link_url)
            if image_url is not None:
                summary["og_image"] = image_url
        summaries.append(summary)

    first_page, second_page = summaries[:3], summaries[3:6]
    pages = [first_page]
    if second_page:
        pages.append(second_page)
    return pages


================================================
FILE: concordia/passwords/LICENSE
================================================
Copyright (c) 2014, Donald Stufft
All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:

* Redistributions of source code must retain the above copyright notice, this
  list of conditions and the following disclaimer.

* Redistributions in binary form must reproduce the above copyright notice,
  this list of conditions and the following disclaimer in the documentation
  and/or other materials provided with the distribution.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.


================================================
FILE: concordia/passwords/__init__.py
================================================


================================================
FILE: concordia/passwords/validators.py
================================================
"""
Password complexity validator.

This module provides a `ComplexityValidator` compatible with Django’s validation
pipeline. It checks a password against configurable complexity requirements,
counting unique characters of several categories and optionally unique words.

Settings:
    PASSWORD_COMPLEXITY (dict[str, int] | None):
        Mapping of requirement names to minimum counts. Any missing keys default
        to 0. If the setting is falsy or not provided, no complexity checks run.

        Supported keys:
            - 'UPPER'   : unique uppercase letters
            - 'LOWER'   : unique lowercase letters
            - 'LETTERS' : unique letters (upper or lower)
            - 'DIGITS'  : unique digits
            - 'SPECIAL' : unique characters that are not uppercase, lowercase,
                          digits or whitespace
            - 'WORDS'   : unique word tokens (\\b\\w+ with re.UNICODE)

Usage:
    In your Django settings:

        AUTH_PASSWORD_VALIDATORS = [
            {
                "NAME":
                "concordia.passwords.validators.ComplexityValidator",
                "OPTIONS": {
                    "complexities": {
                        "UPPER": 1,
                        "LOWER": 1,
                        "DIGITS": 1,
                        "SPECIAL": 1,
                        "LETTERS": 4,
                        "WORDS": 2,
                    }
                },
            },
        ]

"""

# Originally from
# https://github.com/dstufft/django-passwords/blob/master/passwords/validators.py
import re
from typing import Mapping, Set

from django.conf import settings
from django.core.exceptions import ValidationError
from django.utils.translation import gettext_lazy as _

# Settings
# Read once at import time; None when the setting is not defined.
# ComplexityValidator below takes its thresholds from its constructor argument
# and does not read this constant itself.
PASSWORD_COMPLEXITY = getattr(settings, "PASSWORD_COMPLEXITY", None)


class ComplexityValidator(object):
    """
    Callable validator enforcing minimum unique-character and word counts.

    Each character of the password is placed in exactly one bucket: uppercase,
    lowercase, digit, or "special" (every other non-whitespace character).
    Letters are the union of the uppercase and lowercase buckets. Unique words
    are counted separately. The size of each bucket is compared with the
    threshold configured for it.

    Attributes:
        message (str):
            Base error message template, interpolated with a comma-separated
            list of the requirements that were not met.
        code (str):
            Error code attached to the raised `ValidationError`.
        complexities (dict[str, int] | None):
            Thresholds keyed by 'UPPER', 'LOWER', 'LETTERS', 'DIGITS',
            'SPECIAL' and 'WORDS'. `None` disables the validator.
    """

    message = _("Must be more complex (%s)")
    code = "complexity"

    def __init__(self, complexities: Mapping[str, int] | None):
        """
        Store the thresholds to validate against.

        Args:
            complexities (Mapping[str, int] | None):
                Per-category minimum unique counts. `None` turns all checks
                off; keys that are absent are treated as 0.
        """
        self.complexities = complexities

    def __call__(self, value: str) -> None:
        """
        Check a candidate password against the configured thresholds.

        Args:
            value (str): The candidate password.

        Raises:
            ValidationError:
                When at least one threshold is not met. The message lists
                every failed requirement, in the fixed order upper, lower,
                letters, digits, special, words.
        """
        thresholds = self.complexities
        if thresholds is None:
            return

        upper_seen: Set[str] = set()
        lower_seen: Set[str] = set()
        digits_seen: Set[str] = set()
        special_seen: Set[str] = set()

        for char in value:
            if char.isupper():
                upper_seen.add(char)
            elif char.islower():
                lower_seen.add(char)
            elif char.isdigit():
                digits_seen.add(char)
            elif not char.isspace():
                special_seen.add(char)

        # A letter is anything that landed in either case bucket.
        letters_seen: Set[str] = upper_seen | lower_seen
        words_seen = set(re.findall(r"\b\w+", value, re.UNICODE))

        requirements = (
            (
                "UPPER",
                upper_seen,
                _("%(UPPER)s or more unique uppercase characters"),
            ),
            (
                "LOWER",
                lower_seen,
                _("%(LOWER)s or more unique lowercase characters"),
            ),
            ("LETTERS", letters_seen, _("%(LETTERS)s or more unique letters")),
            ("DIGITS", digits_seen, _("%(DIGITS)s or more unique digits")),
            (
                "SPECIAL",
                special_seen,
                _("%(SPECIAL)s or more non unique special characters"),
            ),
            ("WORDS", words_seen, _("%(WORDS)s or more unique words")),
        )

        # Templates are interpolated only for failed checks, so a threshold
        # key that is absent from the mapping is never looked up by "%".
        failures = [
            template % thresholds
            for key, found, template in requirements
            if len(found) < thresholds.get(key, 0)
        ]
        if not failures:
            return

        raise ValidationError(
            self.message % (_("must contain ") + ", ".join(failures),),
            code=self.code,
        )


================================================
FILE: concordia/routing.py
================================================
import os

from channels.auth import AuthMiddlewareStack
from channels.routing import ProtocolTypeRouter, URLRouter
from django.core.asgi import get_asgi_application
from django.urls import path

from . import consumers

# Make sure a settings module is selected before the Django ASGI app is built.
os.environ.setdefault("DJANGO_SETTINGS_MODULE", "concordia.settings")
django_asgi_app = get_asgi_application()

# Top-level ASGI entry point: plain HTTP goes to Django, websocket connections
# go through the auth middleware stack to the asset-updates consumer.
application = ProtocolTypeRouter(
    {
        "http": django_asgi_app,
        "websocket": AuthMiddlewareStack(
            URLRouter(
                # Channels 3+ routes to ASGI applications, so the consumer
                # class has to be wrapped with as_asgi() rather than passed
                # directly.
                [path("ws/asset/asset_updates/", consumers.AssetConsumer.as_asgi())]
            )
        ),
    }
)


================================================
FILE: concordia/secrets.py
================================================
import os

import boto3
from botocore.exceptions import ClientError

# Region used for Secrets Manager calls; read from the environment at import
# time and defaulting to us-east-1.
AWS_DEFAULT_REGION = os.getenv("AWS_DEFAULT_REGION", "us-east-1")


def get_secret(secret_name):
    """
    Fetch a secret value from AWS Secrets Manager.

    A client is created for the region in ``AWS_DEFAULT_REGION`` using the
    matching regional endpoint.

    Args:
        secret_name: Name or ARN passed as ``SecretId`` to
            ``get_secret_value``.

    Returns:
        The ``SecretString`` value when the response has one, otherwise the
        ``SecretBinary`` value.

    Raises:
        Exception: If Secrets Manager answers with a ``ClientError``. The
            message depends on the error code and the original error is
            chained as ``__cause__``.
    """
    endpoint_url = "https://secretsmanager.%s.amazonaws.com" % AWS_DEFAULT_REGION

    session = boto3.session.Session()
    client = session.client(
        service_name="secretsmanager",
        region_name=AWS_DEFAULT_REGION,
        endpoint_url=endpoint_url,
    )

    try:
        get_secret_value_response = client.get_secret_value(SecretId=secret_name)
    except ClientError as e:
        error_code = e.response["Error"]["Code"]
        if error_code == "ResourceNotFoundException":
            raise Exception(
                "The requested secret " + secret_name + " was not found"
            ) from e
        elif error_code == "InvalidRequestException":
            # A space follows the secret name so it does not run into the
            # rest of the message.
            raise Exception(
                "The request for " + secret_name + " was invalid due to:", e
            ) from e
        elif error_code == "InvalidParameterException":
            raise Exception(
                "The request for " + secret_name + " had invalid params:", e
            ) from e
        elif error_code == "DecryptionFailure":
            raise Exception(
                "The request failed to decrypt the value for " + secret_name + ":", e
            ) from e
        else:
            raise Exception("Unknown exception:", e) from e

    # Decrypted secret using the associated KMS CMK. Depending on whether the
    # secret was a string or binary, one of these fields will be populated.
    if "SecretString" in get_secret_value_response:
        return get_secret_value_response["SecretString"]
    return get_secret_value_response["SecretBinary"]


================================================
FILE: concordia/settings_dev.py
================================================
import os

from .settings_template import *  # NOQA ignore=F405
from .settings_template import DJANGO_VITE, INSTALLED_APPS, LOGGING, MIDDLEWARE

# Development logging: lower every handler listed here to DEBUG, then replace
# the logger table inherited from settings_template with the one below.
LOGGING["handlers"]["stream"]["level"] = "DEBUG"
LOGGING["handlers"]["file"]["level"] = "DEBUG"
LOGGING["handlers"]["celery"]["level"] = "DEBUG"
LOGGING["handlers"]["structlog"]["level"] = "DEBUG"
LOGGING["handlers"]["django_structlog"]["level"] = "DEBUG"
# NOTE(review): the structlog loggers below reference handlers named
# "structlog_file" and "structlog_console", which are not the "structlog" /
# "django_structlog" handlers adjusted above — confirm both sets exist in
# settings_template.
LOGGING["loggers"] = {
    "django": {"handlers": ["file", "stream"], "level": "DEBUG"},
    "celery": {"handlers": ["celery", "stream"], "level": "DEBUG"},
    "concordia": {"handlers": ["file", "stream"], "level": "DEBUG"},
    # These two are capped at INFO while everything else logs at DEBUG.
    "django.utils.autoreload": {"level": "INFO"},
    "django.template": {"level": "INFO"},
    "aws_xray_sdk": {
        "handlers": ["file", "stream"],
        "level": "DEBUG",
        "propagate": True,
    },
    "structlog": {
        "handlers": ["structlog_file", "structlog_console"],
        "level": "INFO",
    },
    "django_structlog": {
        "handlers": ["structlog_file", "structlog_console"],
        "level": "INFO",
    },
}

DEBUG = True

# Set the USE_VITE_DEV_SERVER environment variable to "true" (any letter case)
# only when you run 'npm run dev' - vite dev server.
# Otherwise, it will look for the manifest.json in /dist/
USE_VITE_DEV_SERVER = os.getenv("USE_VITE_DEV_SERVER", "false").lower() == "true"

DJANGO_VITE["default"]["dev_mode"] = USE_VITE_DEV_SERVER
DJANGO_VITE["default"]["dev_server_port"] = 5173

# The "*" entry accepts any Host header, so the other entries are redundant.
ALLOWED_HOSTS = ["127.0.0.1", "0.0.0.0", "*"]  # nosec

# Emails are handled by Django's console backend.
# NOTE(review): EMAIL_FILE_PATH looks like a file-based backend setting and
# is probably unused with the console backend — confirm.
EMAIL_BACKEND = "django.core.mail.backends.console.EmailBackend"
EMAIL_FILE_PATH = (
    "/tmp/concordia-messages"  # nosec — change this to a proper location for deployment
)
DEFAULT_FROM_EMAIL = os.environ.get("DEFAULT_FROM_EMAIL", "")
DEFAULT_TO_EMAIL = DEFAULT_FROM_EMAIL
CONCORDIA_DEVS = [
    "rsar@loc.gov",
]

INSTALLED_APPS += ["django_opensearch_dsl"]

# Globally disable auto-syncing: with this set to False the index is not
# updated automatically when a model is created / saved / deleted.
OPENSEARCH_DSL_AUTOSYNC = False

# Two connection aliases: a local default and an HTTPS "secure" connection
# whose admin password comes from OPENSEARCH_INITIAL_ADMIN_PASSWORD.
OPENSEARCH_DSL = {
    "default": {"hosts": "localhost:9200"},
    "secure": {
        "hosts": [{"scheme": "https", "host": "192.30.255.112", "port": 9201}],
        "http_auth": ("admin", os.environ.get("OPENSEARCH_INITIAL_ADMIN_PASSWORD", "")),
        "timeout": 120,
    },
}

REGISTRATION_SALT = "django_registration"  # doesn't need to be secret

# Django Debug Toolbar, shown only for requests from INTERNAL_IPS.
INSTALLED_APPS += ["debug_toolbar"]
MIDDLEWARE += ["debug_toolbar.middleware.DebugToolbarMiddleware"]
INTERNAL_IPS = ("127.0.0.1",)

# django-extensions; the names below are pre-imported by shell_plus.
INSTALLED_APPS += ("django_extensions",)
SHELL_PLUS_PRE_IMPORTS = [
    ("concordia.utils", "get_anonymous_user"),
    ("concordia.models", "TranscriptionStatus"),
]

# X-Ray configuration for local development
# Enabled only when AWS_XRAY_SDK_ENABLED is set to "true" (any letter case).
if os.environ.get("AWS_XRAY_SDK_ENABLED", "false").lower() == "true":
    import logging

    logger = logging.getLogger(__name__)

    logger.info("ECS X-Ray auto-instrumentation starting")

    # Add X-Ray to INSTALLED_APPS
    INSTALLED_APPS = INSTALLED_APPS + ["aws_xray_sdk.ext.django"]

    # Add middleware - MUST be first in the list
    MIDDLEWARE = ["aws_xray_sdk.ext.django.middleware.XRayMiddleware"] + MIDDLEWARE

    logger.info("ECS X-Ray auto-instrumentation completed")
    # The next two calls log the same value, MIDDLEWARE[0].
    logger.info("X-Ray middleware added at position 0: %s", MIDDLEWARE[0])
    logger.info("Current MIDDLEWARE[0]: %s", MIDDLEWARE[0])

    # Recorder settings; the daemon address, missing-context behaviour and
    # tracing name can each be overridden through an environment variable of
    # the same name.
    XRAY_RECORDER = {
        "AWS_XRAY_DAEMON_ADDRESS": os.environ.get(
            "AWS_XRAY_DAEMON_ADDRESS", "127.0.0.1:2000"
        ),
        "AUTO_INSTRUMENT": True,
        "AWS_XRAY_CONTEXT_MISSING": os.environ.get(
            "AWS_XRAY_CONTEXT_MISSING", "LOG_ERROR"
        ),
        "PLUGINS": (),
        # Falls back to CONCORDIA_ENVIRONMENT, then to "development".
        "AWS_XRAY_TRACING_NAME": os.environ.get(
            "AWS_XRAY_TRACING_NAME",
            os.environ.get("CONCORDIA_ENVIRONMENT", "development"),
        ),
        "PATCH_MODULES": ["boto3", "botocore", "requests", "httplib", "psycopg2"],
        "SAMPLING": False,
        # Regular expressions for module paths to leave out of tracing.
        "IGNORE_MODULE_PATTERNS": [
            r"^debug_toolbar\.",
            r"^django\.contrib\.admin\.views\.decorators\.cache",
            r"^django\.contrib\.admin\.options",
            r"^django\.contrib\.admin\.options\.ModelAdmin",
            r"^django\.contrib\.admin\.options\.InlineModelAdmin",
            r"^django\.contrib\.admin\.options\.BaseModelAdmin",
            r"^django\.contrib\.admin\.options\.ModelAdminMixin",
            r"^django\.contrib\.admin\.options\.InlineModelAdminMixin",
            r"^django\.contrib\.admin\.options\.ModelAdminBase",
            r"^django\.contrib\.admin\.options\.InlineModelAdminBase",
            r"^django\.contrib\.admin\.options\.ModelAdminMixinBase",
            r"^django\.contrib\.admin\.options\.InlineModelAdminMixinBase",
            r"^django\.contrib\.admin\.options\.ModelAdminDecorator",
            r"^django\.contrib\.admin\.options\.InlineModelAdminDecorator",
            r"^django\.contrib\.admin\.options\.ModelAdminDecoratorMixin",
            r"^django\.contrib\.admin\.options\.InlineModelAdminDecoratorMixin",
            r"^django\.contrib\.admin\.options\.ModelAdminDecoratorBase",
            r"^django\.contrib\.admin\.options\.InlineModelAdminDecoratorBase",
        ],
    }


================================================
FILE: concordia/settings_docker.py
================================================
import os

from .settings_template import *  # NOQA ignore=F405
from .settings_template import INSTALLED_APPS, STATIC_URL

# DEBUG is on only when the DEBUG environment variable is "true" (any case).
DEBUG = os.getenv("DEBUG", "").lower() == "true"

# Uses Django's dummy email backend.
EMAIL_BACKEND = "django.core.mail.backends.dummy.EmailBackend"

INSTALLED_APPS += ["django_opensearch_dsl"]


def whitenoise_immutable_file_test(static_url, url=None):
    """
    Determine if a static file is immutable based on its URL.

    Vite assets in the 'dist/' directory are hashed and safe to cache forever.

    WhiteNoise invokes the callable configured as
    ``WHITENOISE_IMMUTABLE_FILE_TEST`` with two positional arguments,
    ``(path, url)``. A one-parameter function raises ``TypeError`` when called
    that way, so a second, optional parameter is accepted. The original
    single-argument call form (URL only) keeps working.

    Args:
        static_url: The file's URL when called with a single argument; the
            file's filesystem path when ``url`` is also supplied.
        url: The file's URL when called in the two-argument ``(path, url)``
            form. Defaults to ``None`` (single-argument form).

    Returns:
        bool: True when the URL starts with ``STATIC_URL`` followed by
        ``dist/``.
    """
    # In the two-argument form the first positional value is a filesystem
    # path, which must not be compared against the URL prefix.
    candidate_url = static_url if url is None else url
    return candidate_url.startswith(f"{STATIC_URL}dist/")


WHITENOISE_IMMUTABLE_FILE_TEST = whitenoise_immutable_file_test

# Globally disable auto-syncing unless it is explicitly switched on.
# Environment variables are always strings, so the raw value is converted to a
# real boolean: an unset/empty variable, "false" or "0" (case-insensitive)
# disables auto-syncing and any other value enables it. Using the raw string
# would make OPENSEARCH_DSL_AUTOSYNC=false truthy.
OPENSEARCH_DSL_AUTOSYNC = os.getenv("OPENSEARCH_DSL_AUTOSYNC", "").lower() not in (
    "",
    "false",
    "0",
)

OPENSEARCH_DSL = {
    # Plain connection, taken verbatim from OPENSEARCH_ENDPOINT.
    "default": {"hosts": os.getenv("OPENSEARCH_ENDPOINT", "9200:9200")},
    # HTTPS connection on port 9201, authenticated as the "admin" user.
    "secure": {
        "hosts": [
            {"scheme": "https", "host": os.getenv("OPENSEARCH_ENDPOINT"), "port": 9201}
        ],
        "http_auth": ("admin", os.environ.get("OPENSEARCH_INITIAL_ADMIN_PASSWORD", "")),
        "timeout": 120,
    },
}

# X-Ray configuration for local development.
# Active only when AWS_XRAY_SDK_ENABLED is "true" (case-insensitive).
if os.environ.get("AWS_XRAY_SDK_ENABLED", "false").lower() == "true":
    import logging

    logger = logging.getLogger(__name__)

    logger.info("ECS X-Ray auto-instrumentation starting")

    # Add X-Ray to INSTALLED_APPS
    INSTALLED_APPS = INSTALLED_APPS + ["aws_xray_sdk.ext.django"]

    # Add middleware - MUST be first in the list
    MIDDLEWARE = [
        "aws_xray_sdk.ext.django.middleware.XRayMiddleware"
    ] + MIDDLEWARE  # noqa F405

    logger.info("ECS X-Ray auto-instrumentation completed")
    # Report the head of the middleware list once; a second log call that
    # printed the very same value has been dropped.
    logger.info("X-Ray middleware added at position 0: %s", MIDDLEWARE[0])

    XRAY_RECORDER = {
        # Daemon address, context-missing strategy and tracing name can each be
        # overridden through the environment variable of the same name.
        "AWS_XRAY_DAEMON_ADDRESS": os.environ.get(
            "AWS_XRAY_DAEMON_ADDRESS", "127.0.0.1:2000"
        ),
        "AUTO_INSTRUMENT": True,
        "AWS_XRAY_CONTEXT_MISSING": os.environ.get(
            "AWS_XRAY_CONTEXT_MISSING", "LOG_ERROR"
        ),
        "PLUGINS": (),
        # The tracing name falls back to the Concordia environment name.
        "AWS_XRAY_TRACING_NAME": os.environ.get(
            "AWS_XRAY_TRACING_NAME",
            os.environ.get("CONCORDIA_ENVIRONMENT", "development"),
        ),
        "PATCH_MODULES": ["boto3", "botocore", "requests", "httplib", "psycopg2"],
        "SAMPLING": False,
        # NOTE(review): every entry after the plain
        # `^django\.contrib\.admin\.options` pattern starts with that same
        # prefix; they look redundant if patterns are prefix-matched - confirm.
        "IGNORE_MODULE_PATTERNS": [
            r"^debug_toolbar\.",
            r"^django\.contrib\.admin\.views\.decorators\.cache",
            r"^django\.contrib\.admin\.options",
            r"^django\.contrib\.admin\.options\.ModelAdmin",
            r"^django\.contrib\.admin\.options\.InlineModelAdmin",
            r"^django\.contrib\.admin\.options\.BaseModelAdmin",
            r"^django\.contrib\.admin\.options\.ModelAdminMixin",
            r"^django\.contrib\.admin\.options\.InlineModelAdminMixin",
            r"^django\.contrib\.admin\.options\.ModelAdminBase",
            r"^django\.contrib\.admin\.options\.InlineModelAdminBase",
            r"^django\.contrib\.admin\.options\.ModelAdminMixinBase",
            r"^django\.contrib\.admin\.options\.InlineModelAdminMixinBase",
            r"^django\.contrib\.admin\.options\.ModelAdminDecorator",
            r"^django\.contrib\.admin\.options\.InlineModelAdminDecorator",
            r"^django\.contrib\.admin\.options\.ModelAdminDecoratorMixin",
            r"^django\.contrib\.admin\.options\.InlineModelAdminDecoratorMixin",
            r"^django\.contrib\.admin\.options\.ModelAdminDecoratorBase",
            r"^django\.contrib\.admin\.options\.InlineModelAdminDecoratorBase",
        ],
    }


# The HMAC activation flow provides a two-step registration process:
# the user signs up and then completes activation via emailed instructions.
#
# The salt is *not* a secret for the HMAC activation workflow — see:
# https://django-registration.readthedocs.io/en/2.0.4/hmac.html#security-considerations
REGISTRATION_SALT = "django_registration"

# Blocking stays on unless RATELIMIT_BLOCK is explicitly "false" or "0"
# (case-insensitive); an unset variable therefore leaves it enabled.
RATELIMIT_BLOCK = os.environ.get("RATELIMIT_BLOCK", "").lower() not in {"false", "0"}


================================================
FILE: concordia/settings_ecs.py
================================================
import json
import os

from .secrets import get_secret
from .settings_template import *  # NOQA ignore=F405
from .settings_template import (
    CONCORDIA_ENVIRONMENT,
    DATABASES,
    INSTALLED_APPS,
    MIDDLEWARE,
    STORAGES,
)

if os.getenv("AWS"):
    # On AWS the credentials are fetched with get_secret(); the per-environment
    # secrets are namespaced by ENV_NAME and each payload is a JSON document.
    ENV_NAME = os.getenv("ENV_NAME")

    django_secret = json.loads(get_secret(f"crowd/{ENV_NAME}/Django/SecretKey"))
    SECRET_KEY = django_secret["DjangoSecretKey"]

    postgres_secret = json.loads(get_secret(f"crowd/{ENV_NAME}/DB/MasterUserPassword"))
    DATABASES["default"]["PASSWORD"] = postgres_secret["password"]

    cf_turnstile_secret = json.loads(get_secret(f"crowd/{ENV_NAME}/Turnstile"))
    TURNSTILE_SITEKEY = cf_turnstile_secret["TurnstileSiteKey"]
    TURNSTILE_SECRET = cf_turnstile_secret["TurnstileSecret"]

    # The SMTP secret is shared: its name does not include ENV_NAME.
    smtp_secret = json.loads(get_secret("concordia/SMTP"))
    EMAIL_HOST = smtp_secret["Hostname"]
    EMAIL_HOST_USER = smtp_secret["Username"]
    EMAIL_HOST_PASSWORD = smtp_secret["Password"]

else:
    # Outside AWS only the SMTP details are read, straight from the environment.
    EMAIL_HOST = os.getenv("EMAIL_HOST", "localhost")
    EMAIL_HOST_USER = os.getenv("EMAIL_HOST_USER", "")
    EMAIL_HOST_PASSWORD = os.getenv("EMAIL_HOST_PASSWORD", "")

# Header/value pair that marks a proxied request as having arrived over HTTPS.
SECURE_PROXY_SSL_HEADER = ("HTTP_X_FORWARDED_PROTO", "https")

# Outgoing mail goes through SMTP with TLS on port 587.
EMAIL_BACKEND = "django.core.mail.backends.smtp.EmailBackend"
EMAIL_PORT = 587
EMAIL_USE_TLS = True
DEFAULT_FROM_EMAIL = os.getenv("DEFAULT_FROM_EMAIL", "crowd@loc.gov")
DEFAULT_TO_EMAIL = DEFAULT_FROM_EMAIL
CONCORDIA_DEVS = ["jkue@loc.gov", "jstegmaier@loc.gov", "rsar@loc.gov"]

CSRF_COOKIE_SECURE = True

# Celery stores its results in the same location it uses as broker.
CELERY_BROKER_URL = CELERY_RESULT_BACKEND = os.getenv("CELERY_BROKER_URL")

# Bucket names are supplied by the deployment environment (None when unset).
S3_BUCKET_NAME = os.getenv("S3_BUCKET_NAME")
EXPORT_S3_BUCKET_NAME = os.getenv("EXPORT_S3_BUCKET_NAME")

# The "default", "assets" and "visualizations" storages use S3-backed backends
# here; every other alias is inherited unchanged from the template's STORAGES.
STORAGES = dict(
    STORAGES,
    default={
        "BACKEND": "storages.backends.s3boto3.S3Boto3Storage",
    },
    assets={
        "BACKEND": "storages.backends.s3boto3.S3Boto3Storage",
        "OPTIONS": {
            "querystring_auth": False,
        },
    },
    # Visualizations are written to the export bucket rather than the
    # bucket named by AWS_STORAGE_BUCKET_NAME.
    visualizations={
        "BACKEND": "concordia.storage_backends.OverwriteS3Boto3Storage",
        "OPTIONS": {
            "querystring_auth": False,
            "bucket_name": EXPORT_S3_BUCKET_NAME,
        },
    },
)
AWS_STORAGE_BUCKET_NAME = S3_BUCKET_NAME
AWS_DEFAULT_ACL = None  # Don't set an ACL on the files, inherit the bucket ACLs

# Production serves media from a dedicated host; every other environment
# points straight at the bucket's S3 URL.
MEDIA_URL = (
    "https://crowd-media.loc.gov/"
    if CONCORDIA_ENVIRONMENT == "production"
    else f"https://{S3_BUCKET_NAME}.s3.amazonaws.com/"
)

INSTALLED_APPS.append("django_opensearch_dsl")

# Globally disable auto-syncing unless it is explicitly switched on.
# Environment variables are always strings, so the raw value is converted to a
# real boolean: an unset/empty variable, "false" or "0" (case-insensitive)
# disables auto-syncing and any other value enables it. Using the raw string
# would make OPENSEARCH_DSL_AUTOSYNC=false truthy.
OPENSEARCH_DSL_AUTOSYNC = os.getenv("OPENSEARCH_DSL_AUTOSYNC", "").lower() not in (
    "",
    "false",
    "0",
)

# Single connection whose host comes from OPENSEARCH_ENDPOINT.
OPENSEARCH_DSL = {
    "default": {"hosts": os.getenv("OPENSEARCH_ENDPOINT", "opensearch-node:9200")}
}

# The HMAC activation flow provides a two-step registration process:
# the user signs up and then completes activation via emailed instructions.

REGISTRATION_SALT = "django_registration"  # doesn't need to be secret

# Blocking stays on unless RATELIMIT_BLOCK is explicitly "false" or "0".
RATELIMIT_BLOCK = os.getenv("RATELIMIT_BLOCK", "").lower() not in ("false", "0")

# Opt in to 15-minute persistent database connections. The flag is parsed the
# same way as RATELIMIT_BLOCK: as raw strings "false" and "0" are non-empty and
# therefore truthy, which used to switch the feature on. An unset or empty
# variable keeps it off, and any other value still enables it.
if os.getenv("USE_PERSISTENT_DATABASE_CONNECTIONS", "").lower() not in (
    "",
    "false",
    "0",
):
    DATABASES["default"].update({"CONN_MAX_AGE": 15 * 60})

# ECS-specific X-Ray auto-instrumentation (minimal Django config).
# Active only when AWS_XRAY_SDK_ENABLED is "true" (case-insensitive).
if os.getenv("AWS_XRAY_SDK_ENABLED", "false").lower() == "true":
    import logging

    logger = logging.getLogger(__name__)
    logger.info("ECS X-Ray auto-instrumentation starting")

    # Register the X-Ray Django app and put its middleware at the head of the
    # middleware list; both names are rebound to new lists.
    INSTALLED_APPS = [*INSTALLED_APPS, "aws_xray_sdk.ext.django"]
    MIDDLEWARE = ["aws_xray_sdk.ext.django.middleware.XRayMiddleware", *MIDDLEWARE]

    logger.info("ECS X-Ray auto-instrumentation completed")
    logger.info("X-Ray middleware added at position 0: %s", MIDDLEWARE[0])
    logger.info("aws_xray_sdk.ext.django added to INSTALLED_APPS")
    logger.info("All X-Ray configuration handled via environment variables")


================================================
FILE: concordia/settings_loadtest.py
================================================
import os
import sys

from .settings_template import *  # NOQA ignore=F405
from .settings_template import DATABASES, LOGGING, STORAGES

# Load tests run with debugging and rate limiting both switched off.
DEBUG = RATELIMIT_ENABLE = False

# Load testing DB name standard. If you need a different DB name, create a
# personal settings file (eg settings_loadtest_<username>.py) and override it
# there.
DATABASES["default"].update(NAME="concordia_lt")

# Ensure Turnstile does not block Locust. Default to Cloudflare's test keys that
# always pass, but allow env vars to override.
TURNSTILE_SITEKEY = os.getenv(
    "TURNSTILE_SITEKEY", "1x00000000000000000000BB"  # always pass, invisible
)
TURNSTILE_SECRET = os.getenv(
    "TURNSTILE_SECRET", "1x0000000000000000000000000000000AA"  # always pass
)

# Handlers inherited from the template all log at INFO.
LOGGING["handlers"]["stream"].update(level="INFO")
LOGGING["handlers"]["file"].update(level="INFO")
LOGGING["handlers"]["celery"].update(level="INFO")
LOGGING["handlers"]["structlog_file"].update(level="INFO")
LOGGING["handlers"]["structlog_console"].update(level="INFO")

# Two extra handlers that write to stdout; only the Celery one sets a formatter.
LOGGING["handlers"].update(
    {
        "console": {
            "level": "INFO",
            "class": "logging.StreamHandler",
            "stream": sys.stdout,
        },
        "celery_console": {
            "level": "INFO",
            "class": "logging.StreamHandler",
            "stream": sys.stdout,
            "formatter": "long",
        },
    }
)

# Route each logger to its file handler(s) plus the matching console handler.
LOGGING["loggers"]["django"].update(handlers=["file", "stream", "console"])
LOGGING["loggers"]["celery"].update(handlers=["celery", "celery_console"])
LOGGING["loggers"]["concordia"].update(
    handlers=["file", "stream", "console"], level="INFO"
)
LOGGING["loggers"].update(
    {
        "django.utils.autoreload": {"level": "INFO"},
        "django.template": {"level": "INFO"},
    }
)
LOGGING["loggers"]["structlog"].update(
    handlers=["structlog_file", "structlog_console"]
)
LOGGING["loggers"]["django_structlog"].update(
    handlers=["structlog_file", "structlog_console"]
)

ALLOWED_HOSTS = ["127.0.0.1", "0.0.0.0", "*"]  # nosec

# Django reads the email backend from EMAIL_BACKEND. This was previously
# assigned to MAIL_BACKEND, which is not a Django setting, so the console
# backend was never selected and the template's backend stayed in effect.
EMAIL_BACKEND = "django.core.mail.backends.console.EmailBackend"
# Old, misspelled name kept as an alias so any existing reference still resolves.
MAIL_BACKEND = EMAIL_BACKEND
# NOTE(review): presumably only relevant to a file-based email backend - confirm.
EMAIL_FILE_PATH = "/tmp/concordia-messages"  # nosec
DEFAULT_FROM_EMAIL = os.environ.get("DEFAULT_FROM_EMAIL", "test@example.test")
DEFAULT_TO_EMAIL = DEFAULT_FROM_EMAIL

REGISTRATION_SALT = "django_registration"  # doesn't need to be secret

# Load tests read and write the staging buckets.
S3_BUCKET_NAME = "crowd-staging-content"
EXPORT_S3_BUCKET_NAME = "crowd-staging-export"

# The "default", "assets" and "visualizations" storages use S3-backed backends
# here; every other alias is inherited unchanged from the template's STORAGES.
# NOTE(review): unlike the ECS settings, "visualizations" is not given a
# "bucket_name" option here, so EXPORT_S3_BUCKET_NAME is unused by it - confirm
# that this is intended.
STORAGES = dict(
    STORAGES,
    default={
        "BACKEND": "storages.backends.s3boto3.S3Boto3Storage",
    },
    assets={
        "BACKEND": "storages.backends.s3boto3.S3Boto3Storage",
        "OPTIONS": {
            "querystring_auth": False,
        },
    },
    visualizations={
        "BACKEND": "concordia.storage_backends.OverwriteS3Boto3Storage",
        "OPTIONS": {
            "querystring_auth": False,
        },
    },
)

AWS_STORAGE_BUCKET_NAME = S3_BUCKET_NAME
AWS_DEFAULT_ACL = None  # Don't set an ACL on the files, inherit the bucket ACLs
MEDIA_URL = f"https://{S3_BUCKET_NAME}.s3.amazonaws.com/"

SECURE_CROSS_ORIGIN_OPENER_POLICY = None


================================================
FILE: concordia/settings_local_test.py
================================================
import logging
import os

import structlog

from .settings_template import *  # NOQA ignore=F405
from .settings_template import DATABASES

DEBUG = False

# Local test runs always use port 5432 for the database.
DATABASES["default"].update(PORT="5432")

# Channels uses the in-memory layer instead of the template's Redis-backed one.
CHANNEL_LAYERS = {"default": {"BACKEND": "channels.layers.InMemoryChannelLayer"}}

# Every cache alias uses local memory, each with its own LOCATION.
CACHES = {
    alias: {
        "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        "LOCATION": location,
    }
    for alias, location in (
        ("default", "default-location"),
        ("view_cache", "view-location"),
        ("configuration_cache", "configuration-location"),
        ("visualization_cache", "visualization-location"),
    )
}

# Re-configure structlog with no processors and a CRITICAL-level filter.
structlog.configure(
    logger_factory=structlog.stdlib.LoggerFactory(),
    context_class=dict,
    wrapper_class=structlog.make_filtering_bound_logger(logging.CRITICAL),
    processors=[],
)

# Celery runs tasks locally, synchronously and immediately, and lets their
# exceptions propagate.
CELERY_TASK_ALWAYS_EAGER = CELERY_TASK_EAGER_PROPAGATES = True

DEFAULT_TO_EMAIL = "rsar@loc.gov"
CONCORDIA_DEVS = ["rsar@loc.gov"]

ALLOWED_HOSTS = ["127.0.0.1", "0.0.0.0"]  # nosec

EMAIL_BACKEND = "django.core.mail.backends.dummy.EmailBackend"

# Sessions are kept in the cache rather than the database.
SESSION_ENGINE = "django.contrib.sessions.backends.cache"

RATELIMIT_ENABLE = False

# Turnstile settings: each value can be overridden from the environment; the
# default keys are the ones marked below as always passing.
TURNSTILE_JS_API_URL = os.getenv(
    "TURNSTILE_JS_API_URL", "https://challenges.cloudflare.com/turnstile/v0/api.js"
)
TURNSTILE_VERIFY_URL = os.getenv(
    "TURNSTILE_VERIFY_URL", "https://challenges.cloudflare.com/turnstile/v0/siteverify"
)
# Always pass, invisible
TURNSTILE_SITEKEY = os.getenv("TURNSTILE_SITEKEY", "1x00000000000000000000BB")
# Always pass
TURNSTILE_SECRET = os.getenv("TURNSTILE_SECRET", "1x0000000000000000000000000000000AA")


================================================
FILE: concordia/settings_template.py
================================================
import json
import os

import sentry_sdk
import structlog
from django.contrib import messages
from django.core.management.utils import get_random_secret_key
from sentry_sdk.integrations.django import DjangoIntegration

from concordia.version import get_concordia_version

# New in Django 3.2: if no field in a model is defined with primary_key=True,
# an implicit primary key is added, and its type is controlled by the value
# below. The 3.2 default is BigAutoField, but migrations do not support
# changing the PK type of M2M tables, so AutoField is kept.
DEFAULT_AUTO_FIELD = "django.db.models.AutoField"

# Build paths inside the project like this: os.path.join(SITE_ROOT_DIR, ...)
# CONCORDIA_APP_DIR is the directory containing this file; SITE_ROOT_DIR is
# its parent.
CONCORDIA_APP_DIR = os.path.abspath(os.path.dirname(__file__))
SITE_ROOT_DIR = os.path.dirname(CONCORDIA_APP_DIR)

# Falls back to a freshly generated random key when DJANGO_SECRET_KEY is unset,
# so in that case the key is different every time this module is imported.
SECRET_KEY = os.getenv("DJANGO_SECRET_KEY", get_random_secret_key())

CONCORDIA_ENVIRONMENT = os.environ.get("CONCORDIA_ENVIRONMENT", "development")
DATA_UPLOAD_MAX_MEMORY_SIZE = 10485760  # 10 * 1024 * 1024
# Optional SMTP authentication information for EMAIL_HOST.
EMAIL_HOST_USER = ""
EMAIL_HOST_PASSWORD = ""  # nosec
EMAIL_USE_TLS = False
DEFAULT_FROM_EMAIL = "crowd@loc.gov"

ALLOWED_HOSTS = ["*"]

DEBUG = False
CSRF_COOKIE_SECURE = False

# Placeholder only: AUTH_PASSWORD_VALIDATORS is reassigned with the real
# validator list further down in this module.
AUTH_PASSWORD_VALIDATORS = []
EMAIL_BACKEND = "django.core.mail.backends.filebased.EmailBackend"
EMAIL_HOST = "localhost"
EMAIL_PORT = 25
LANGUAGE_CODE = "en-us"
LOGIN_REDIRECT_URL = "/"
LOGOUT_REDIRECT_URL = "/"
ROOT_URLCONF = "concordia.urls"
STATIC_ROOT = "static-files"
STATIC_URL = "/static/"

# Static file discovery: filesystem directories first, then app directories,
# then files pulled from npm packages.
STATICFILES_FINDERS = [
    # We let the filesystem override the app directories so Gulp can pre-process
    # files if needed:
    "django.contrib.staticfiles.finders.FileSystemFinder",
    "django.contrib.staticfiles.finders.AppDirectoriesFinder",
    # See https://github.com/kevin1024/django-npm
    "npm.finders.NpmFinder",
]

# Directories searched by the FileSystemFinder, all relative to SITE_ROOT_DIR.
STATICFILES_DIRS = [
    # Vite's new home (JS/Manifest)
    os.path.join(SITE_ROOT_DIR, "concordia", "static", "dist"),
    # Gulp's home (where base.css lives), based on gulpfile .dest('static/')
    os.path.join(SITE_ROOT_DIR, "static"),
    # Standard Admin assets
    os.path.join(SITE_ROOT_DIR, "concordia", "static", "admin"),
]

# Maps an npm package name to the glob patterns of the files to collect from
# it (used by the npm finder listed in STATICFILES_FINDERS).
NPM_FILE_PATTERNS = {
    "redom": ["dist/*"],
    "split.js": ["dist/*"],
    "urijs": ["src/*"],
    "openseadragon": ["build/*"],
    "openseadragon-filters": ["dist/*", "index.js"],
    "codemirror": ["lib/*", "addon/*", "mode/*"],
    "prettier": ["*.js"],
    "remarkable": ["dist/*"],
    "jquery": ["dist/*"],
    "js-cookie": ["dist/*"],
    "@popperjs/core": ["dist/*"],
    "bootstrap": ["dist/*"],
    "screenfull": ["*"],
    "@duetds/date-picker/": ["dist/*"],
    "@fortawesome/fontawesome-free/": [
        "css/*",
        "js/*",
        "sprites/*",
        "svgs/*",
        "webfonts/*",
    ],
    "chart.js": ["auto/*", "dist/*"],
    "@kurkle/color": ["dist/*"],
    "chroma-js": ["dist/*"],
    "@sentry": ["*"],
    "@sentry-internal": ["*"],
}

TEMPLATE_DEBUG = False
TIME_ZONE = "America/New_York"
USE_I18N = True
USE_TZ = True
WSGI_APPLICATION = "concordia.wsgi.application"

# Single PostgreSQL database. Password, host and port come from the
# environment; the database name and user are fixed here.
DATABASES = {
    "default": {
        "ENGINE": "django.db.backends.postgresql",
        "NAME": "concordia",
        "USER": "concordia",
        "PASSWORD": os.getenv("POSTGRESQL_PW"),
        "HOST": os.getenv("POSTGRESQL_HOST", "localhost"),
        "PORT": os.getenv("POSTGRESQL_PORT", "5432"),
        # Change this back to 15 minutes (15*60) once celery regression
        # is fixed  see https://github.com/celery/celery/issues/4878
        "CONN_MAX_AGE": 0,  # currently 0; the intended value is 15 * 60
    }
}

# Base application list. It is a list (not a tuple) and the environment
# settings modules in this project extend it.
INSTALLED_APPS = [
    "concordia.apps.ConcordiaAdminConfig",  # Replaces 'django.contrib.admin'
    "django.contrib.auth",
    "django.contrib.contenttypes",
    "django.contrib.humanize",
    "django.contrib.sessions",
    "django.contrib.messages",
    "django.contrib.sites",
    # Replaces "django.contrib.staticfiles",
    "concordia.apps.ConcordiaStaticFilesConfig",
    "django_structlog",
    "django_bootstrap5",
    "maintenance_mode",
    "concordia.apps.ConcordiaAppConfig",
    "exporter",
    "importer",
    "configuration",
    "prometheus_metrics.apps.PrometheusMetricsConfig",
    "robots",
    "django_celery_beat",
    "flags",
    "channels",
    "django_admin_multiple_choice_list_filter",
    "tinymce",
    "django_vite",
]

# Middleware stack, listed in the order Django applies it to a request.
MIDDLEWARE = [
    "prometheus_metrics.middleware.PrometheusBeforeMiddleware",
    "django.middleware.security.SecurityMiddleware",
    # WhiteNoise serves static files efficiently:
    "whitenoise.middleware.WhiteNoiseMiddleware",
    "django.contrib.sessions.middleware.SessionMiddleware",
    "django.middleware.common.CommonMiddleware",
    "django.middleware.csrf.CsrfViewMiddleware",
    "django.contrib.auth.middleware.AuthenticationMiddleware",
    "django.contrib.messages.middleware.MessageMiddleware",
    "django.middleware.clickjacking.XFrameOptionsMiddleware",
    "django_structlog.middlewares.RequestMiddleware",
    "django_ratelimit.middleware.RatelimitMiddleware",
    "concordia.middleware.MaintenanceModeMiddleware",
]

# Dotted path of the view used for rate-limited requests; blocking is off by
# default in this template.
RATELIMIT_VIEW = "concordia.views.rate_limit.ratelimit_view"
RATELIMIT_BLOCK = False

# Single Django template engine. Templates are looked up in the site-level and
# app-level "templates" directories, then in installed apps.
TEMPLATES = [
    {
        "BACKEND": "django.template.backends.django.DjangoTemplates",
        "DIRS": [
            os.path.join(SITE_ROOT_DIR, "templates"),
            os.path.join(CONCORDIA_APP_DIR, "templates"),
        ],
        "OPTIONS": {
            "context_processors": [
                "django.template.context_processors.debug",
                "django.template.context_processors.request",
                "django.contrib.auth.context_processors.auth",
                "django.contrib.messages.context_processors.messages",
                "django.template.context_processors.media",
                "maintenance_mode.context_processors.maintenance_mode",
                # Concordia
                "concordia.context_processors.system_configuration",
                "concordia.context_processors.site_navigation",
                "concordia.context_processors.maintenance_mode_frontend_available",
                "concordia.context_processors.request_id_context",
                "concordia.turnstile.context_processors.turnstile_default_settings",
            ],
            # Tag libraries made loadable under the given names.
            "libraries": {
                "staticfiles": "django.templatetags.static",
                "django_vite": "django_vite.templatetags.django_vite",
            },
            "loaders": [
                "django.template.loaders.filesystem.Loader",
                "django.template.loaders.app_directories.Loader",
            ],
            # Tag modules available in every template without {% load %}.
            "builtins": [
                "configuration.templatetags.configuration_tags",
                "concordia.templatetags.reject_filter",
            ],
        },
    }
]

# NOTE(review): no haystack app appears in INSTALLED_APPS in this module, so
# this setting may be unused - confirm before relying on it.
HAYSTACK_CONNECTIONS = {
    "default": {
        "ENGINE": "haystack.backends.whoosh_backend.WhooshEngine",
        "PATH": os.path.join(os.path.dirname(__file__), "whoosh_index"),
    }
}

# Redis connection details come from the environment. A missing or
# non-numeric REDIS_PORT falls back to 6379.
REDIS_ADDRESS = os.getenv("REDIS_ADDRESS", "localhost")
REDIS_PORT = os.getenv("REDIS_PORT", "")
REDIS_PORT = int(REDIS_PORT) if REDIS_PORT.isdigit() else 6379

if REDIS_ADDRESS and REDIS_PORT:
    # One Redis database per cache alias, numbered 1 through 4 in the order
    # listed (database 0 is used for Celery below).
    CACHES = {
        alias: {
            "BACKEND": "django_redis.cache.RedisCache",
            "LOCATION": f"redis://{REDIS_ADDRESS}:{REDIS_PORT}/{database}",
            "OPTIONS": {
                "CLIENT_CLASS": "django_redis.client.DefaultClient",
            },
        }
        for database, alias in enumerate(
            ("default", "view_cache", "configuration_cache", "visualization_cache"),
            start=1,
        )
    }
else:
    # Without a Redis address/port every alias is a local-memory cache.
    CACHES = {
        alias: {"BACKEND": "django.core.cache.backends.locmem.LocMemCache"}
        for alias in (
            "default",
            "view_cache",
            "configuration_cache",
            "visualization_cache",
        )
    }

SESSION_ENGINE = "django.contrib.sessions.backends.db"

# Celery uses Redis database 0 as both broker and result backend.
CELERY_BROKER_URL = CELERY_RESULT_BACKEND = f"redis://{REDIS_ADDRESS}:{REDIS_PORT}/0"

# Tasks are serialized as JSON and only JSON content is accepted.
CELERY_TASK_SERIALIZER = "json"
CELERY_ACCEPT_CONTENT = ["json"]
CELERY_IMPORTS = ("importer.tasks",)

# Broker connection behaviour: heartbeat set to 0, with connection retries
# enabled (also at startup) and bounded by the transport options below.
CELERY_BROKER_HEARTBEAT = 0
CELERY_BROKER_CONNECTION_RETRY = True
CELERY_BROKER_CONNECTION_RETRY_ON_STARTUP = True
CELERY_BROKER_TRANSPORT_OPTIONS = dict(
    confirm_publish=True,
    max_retries=3,
    interval_start=0,
    interval_step=0.2,
    interval_max=0.5,
)

# Logging configuration (dictConfig schema, version 1). Plain-text logs go to
# rotating files under SITE_ROOT_DIR/logs; structlog events are rendered as
# JSON into a separate file. Environment settings modules in this project
# adjust the handlers and loggers defined here.
LOGGING = {
    "version": 1,
    "disable_existing_loggers": False,
    "formatters": {
        # "long" and "short" use str.format-style ("{") placeholders.
        "long": {
            "format": "[{asctime} {levelname} {name}:{lineno}] {message}",
            "datefmt": "%Y-%m-%dT%H:%M:%S",
            "style": "{",
        },
        "short": {
            "format": "[{levelname} {name}] {message}",
            "datefmt": "%Y-%m-%dT%H:%M:%S",
            "style": "{",
        },
        # structlog formatters: JSON for files, console renderer for terminals.
        "structlog_json": {
            "()": structlog.stdlib.ProcessorFormatter,
            "processor": structlog.processors.JSONRenderer(),
        },
        "structlog_console": {
            "()": structlog.stdlib.ProcessorFormatter,
            "processor": structlog.dev.ConsoleRenderer(),
        },
    },
    "handlers": {
        "stream": {
            "class": "logging.StreamHandler",
            "level": "INFO",
            "formatter": "long",
        },
        "null": {"level": "INFO", "class": "logging.NullHandler"},
        # Rotates every 3 hours and keeps 16 backups.
        "file": {
            "class": "logging.handlers.TimedRotatingFileHandler",
            "level": "INFO",
            "formatter": "long",
            "filename": f"{SITE_ROOT_DIR}/logs/concordia.log",
            "when": "H",
            "interval": 3,
            "backupCount": 16,
        },
        "celery": {
            "level": "INFO",
            "class": "logging.handlers.RotatingFileHandler",
            "filename": f"{SITE_ROOT_DIR}/logs/celery.log",
            "formatter": "long",
            "maxBytes": 1024 * 1024 * 100,  # 100 mb
        },
        # Same rotation schedule as "file", but JSON-formatted.
        "structlog_file": {
            "class": "logging.handlers.TimedRotatingFileHandler",
            "level": "INFO",
            "formatter": "structlog_json",
            "filename": f"{SITE_ROOT_DIR}/logs/concordia-json.log",
            "when": "H",
            "interval": 3,
            "backupCount": 16,
        },
        "structlog_console": {
            "class": "logging.StreamHandler",
            "level": "INFO",
            "formatter": "structlog_console",
        },
    },
    "loggers": {
        "django": {"handlers": ["file"], "level": "INFO"},
        "celery": {"handlers": ["celery"], "level": "INFO"},
        "concordia": {"handlers": ["file"], "level": "INFO"},
        "aws_xray_sdk": {"handlers": ["file"], "level": "INFO", "propagate": True},
        "structlog": {
            "handlers": ["structlog_file"],
            "level": "INFO",
            "propagate": True,
        },
        "django_structlog": {
            "handlers": ["structlog_file"],
            "level": "INFO",
            "propagate": False,
        },
    },
}

# structlog processor chain. The final processor hands the event to the
# stdlib ProcessorFormatter configured in LOGGING["formatters"] above.
structlog.configure(
    processors=[
        structlog.contextvars.merge_contextvars,
        structlog.stdlib.filter_by_level,
        structlog.processors.TimeStamper(fmt="iso"),
        structlog.stdlib.add_logger_name,
        structlog.stdlib.add_log_level,
        structlog.stdlib.PositionalArgumentsFormatter(),
        structlog.processors.StackInfoRenderer(),
        structlog.processors.format_exc_info,
        structlog.processors.UnicodeDecoder(),
        structlog.stdlib.ProcessorFormatter.wrap_for_formatter,
    ],
    logger_factory=structlog.stdlib.LoggerFactory(),
    cache_logger_on_first_use=True,
)


################################################################################
# Django-specific settings above
################################################################################

# Uploaded media is served from /media/ and stored under SITE_ROOT_DIR/media.
MEDIA_URL = "/media/"
MEDIA_ROOT = os.path.join(SITE_ROOT_DIR, "media")

# Name of the login URL pattern.
LOGIN_URL = "login"

# Held in its own name, presumably to keep the long dotted path on one line.
PASSWORD_VALIDATOR = (
    "django.contrib.auth.password_validation.UserAttributeSimilarityValidator"  # nosec
)

# Effective validator list; this replaces the empty list assigned earlier in
# this module.
AUTH_PASSWORD_VALIDATORS = [
    {"NAME": PASSWORD_VALIDATOR},
    {
        "NAME": "django.contrib.auth.password_validation.MinimumLengthValidator",
        "OPTIONS": {"min_length": 8},
    },
    {"NAME": "django.contrib.auth.password_validation.CommonPasswordValidator"},
    {"NAME": "django.contrib.auth.password_validation.NumericPasswordValidator"},
    {"NAME": "concordia.validators.DjangoPasswordsValidator"},
]

# See https://github.com/dstufft/django-passwords#settings
# Minimum count required for each character class.
PASSWORD_COMPLEXITY = {
    "UPPER": 1,
    "LOWER": 1,
    "LETTERS": 1,
    "DIGITS": 1,
    "SPECIAL": 1,
    "WORDS": 1,
}

# Custom backend; judging by its name it accepts an email address or a username.
AUTHENTICATION_BACKENDS = [
    "concordia.authentication_backends.EmailOrUsernameModelBackend"
]

# Turnstile settings
#
# Every value can be overridden from the environment. Environment variables
# are always strings, so the settings whose defaults are a number or a dict
# are converted below; otherwise an override would silently change the
# setting's type.
TURNSTILE_JS_API_URL = os.environ.get(
    "TURNSTILE_JS_API_URL", "https://challenges.cloudflare.com/turnstile/v0/api.js"
)
TURNSTILE_VERIFY_URL = os.environ.get(
    "TURNSTILE_VERIFY_URL", "https://challenges.cloudflare.com/turnstile/v0/siteverify"
)
TURNSTILE_SITEKEY = os.environ.get("TURNSTILE_SITEKEY", "")
TURNSTILE_SECRET = os.environ.get("TURNSTILE_SECRET", "")
# Numeric timeout (presumably seconds - confirm against the code that uses it).
# Fractional values such as "2.5" are accepted.
TURNSTILE_TIMEOUT = float(os.environ.get("TURNSTILE_TIMEOUT", 5))
# Mapping settings: an override must be a JSON object; an unset or empty
# variable keeps the default.
TURNSTILE_DEFAULT_CONFIG = json.loads(
    os.environ.get("TURNSTILE_DEFAULT_CONFIG") or '{"appearance": "interaction-only"}'
)
TURNSTILE_PROXIES = json.loads(os.environ.get("TURNSTILE_PROXIES") or "{}")
# 86400 = 24 * 60 * 60 (presumably seconds, i.e. one day - confirm).
ANONYMOUS_USER_VALIDATION_INTERVAL = 86400

# Storage aliases. By default everything except static files uses the local
# filesystem; the environment settings modules in this project override
# "default", "assets" and "visualizations".
STORAGES = {
    "default": {
        "BACKEND": "django.core.files.storage.FileSystemStorage",
    },
    "staticfiles": {
        # Use the basic Compressed backend because Vite handled hashing and compression.
        "BACKEND": "whitenoise.storage.CompressedStaticFilesStorage",
    },
    "assets": {
        "BACKEND": "django.core.files.storage.FileSystemStorage",
    },
    "visualizations": {
        "BACKEND": "django.core.files.storage.FileSystemStorage",
    },
}

# NOTE(review): "dev_mode" captures the DEBUG value defined in this module at
# import time (False). A settings module that reassigns DEBUG afterwards does
# not change this dict unless it also redefines DJANGO_VITE - confirm that this
# is intended.
DJANGO_VITE = {
    "default": {
        "dev_mode": DEBUG,
        "manifest_path": os.path.join(
            SITE_ROOT_DIR, "concordia", "static", "dist", "manifest.json"
        ),
        "static_url_prefix": "",
    }
}

PASSWORD_RESET_TIMEOUT = 604800  # 7 * 24 * 60 * 60
ACCOUNT_ACTIVATION_DAYS = 7
REGISTRATION_OPEN = True  # set to false to temporarily disable registrations

# Email reconfirmation: the key template is filled with an id, and the timeout
# is EMAIL_RECONFIRMATION_DAYS expressed in seconds.
REQUIRE_EMAIL_RECONFIRMATION = True
EMAIL_RECONFIRMATION_KEY = "EMAIL_CONFIRMATION_{id}"
EMAIL_RECONFIRMATION_DAYS = 7
EMAIL_RECONFIRMATION_TIMEOUT = 60 * 60 * 24 * EMAIL_RECONFIRMATION_DAYS

MESSAGE_STORAGE = "django.contrib.messages.storage.session.SessionStorage"

# Error messages get the "danger" tag (the Bootstrap alert class name).
MESSAGE_TAGS = {messages.ERROR: "danger"}

# Separate Sentry DSNs for backend and frontend; both default to empty.
SENTRY_BACKEND_DSN = os.environ.get("SENTRY_BACKEND_DSN", "")
SENTRY_FRONTEND_DSN = os.environ.get("SENTRY_FRONTEND_DSN", "")

APPLICATION_VERSION = get_concordia_version()

# Sentry is initialised at import time of this settings module, tagged with
# the environment name and application version.
sentry_sdk.init(
    dsn=SENTRY_BACKEND_DSN,
    environment=CONCORDIA_ENVIRONMENT,
    release=APPLICATION_VERSION,
    integrations=[DjangoIntegration()],
)

# Names of special django.auth Groups
COMMUNITY_MANAGER_GROUP_NAME = "Community Managers"
NEWSLETTER_GROUP_NAME = "Newsletter"

# Django sites framework setting
SITE_ID = 1
ROBOTS_USE_SITEMAP = False
ROBOTS_USE_HOST = False

# django-bootstrap4 customization:
# NOTE(review): INSTALLED_APPS in this module lists "django_bootstrap5", not
# django-bootstrap4, so this BOOTSTRAP4 setting may no longer be read - confirm.
BOOTSTRAP4 = {"required_css_class": "form-group-required", "set_placeholder": False}

# Transcription-related settings

#: Number of seconds an asset reservation is valid for
TRANSCRIPTION_RESERVATION_SECONDS = 15 * 60

#: Number of hours until an asset reservation is tombstoned
TRANSCRIPTION_RESERVATION_TOMBSTONE_HOURS = 24

#: Number of hours until a tombstoned reservation is deleted
TRANSCRIPTION_RESERVATION_TOMBSTONE_LENGTH_HOURS = 24

#: Web cache policy settings
DEFAULT_PAGE_TTL = 5 * 60

# Feature flags
# Each flag is declared with an empty list of conditions.
FLAGS = {
    "ADVERTISE_ACTIVITY_UI": [],
    "CAROUSEL_CMS": [],
    "SEND_WELCOME_EMAIL": [],
    "SHOW_BANNER": [],
    "DISPLAY_ITEM_DESCRIPTION": [],
    "IMPORT_IMAGE_CHECKSUM": [],
}

ASGI_APPLICATION = "concordia.routing.application"

# Channels layer on the same Redis host and port as the caches and Celery.
CHANNEL_LAYERS = {
    "default": {
        "BACKEND": "channels_redis.core.RedisChannelLayer",
        "CONFIG": {
            "hosts": [(REDIS_ADDRESS, REDIS_PORT)],
            "capacity": 1500,
            "expiry": 10,
        },
    }
}

SECURE_REFERRER_POLICY = "origin"

# TinyMCE rich-text editor: no compressor, dark skin, a small plugin set and a
# single toolbar row, attached to textareas with the "tinymce" class.
TINYMCE_COMPRESSOR = False
TINYMCE_DEFAULT_CONFIG = {
    "selector": "textarea.tinymce",
    "referrer_policy": "origin",
    "skin": "oxide-dark",
    "content_css": "dark",
    "plugins": "link lists searchreplace wordcount",
    "browser_spellcheck": "true",
    "newline_behavior": "linebreak",
    "toolbar1": "bold italic | numlist bullist | link | searchreplace wordcount",
    "width": 624,
}
# The editor script is loaded from the Tiny Cloud CDN.
TINYMCE_JS_URL = "https://cdn.tiny.cloud/1/rf486i5f1ww9m8191oolczn7f0ry61mzdtfwbu7maiiiv2kv/tinymce/6/tinymce.min.js"

# Maps a language code to its display name. The keys double as the list of
# languages allowed for pytesseract (see PYTESSERACT_ALLOWED_LANGUAGES below).
# "eng" is listed first as the default; the rest are roughly alphabetical by
# display name.
LANGUAGE_CODES = {
    "eng": "English (default)",
    "afr": "Afrikaans",
    "sqi": "Albanian",
    "amh": "Amharic",
    "ara": "Arabic",
    "asm": "Assamese",
    "aze": "Azerbaijani",
    "aze_cyrl": "Azerbaijani - Cyrillic",
    "eus": "Basque",
    "bel": "Belarusian",
    "ben": "Bengali",
    "bos": "Bosnian",
    "bul": "Bulgarian",
    "mya": "Burmese",
    "cat": "Catalan; Valencian",
    "ceb": "Cebuano",
    "khm": "Central Khmer",
    "chr": "Cherokee",
    "chi_sim": "Chinese - Simplified",
    "chi_tra": "Chinese - Traditional",
    "hrv": "Croatian",
    "ces": "Czech",
    "dan": "Danish",
    "nld": "Dutch; Flemish",
    "dzo": "Dzongkha",
    "enm": "English, Middle (1100-1500)",
    "epo": "Esperanto",
    "est": "Estonian",
    "kat": "Georgian",
    "kat_old": "Georgian - Old",
    "deu": "German",
    "ell": "Greek, Modern (1453-)",
    "fin": "Finnish",
    "fra": "French",
    "frm": "French, Middle (ca. 1400-1600)",
    "glg": "Galician",
    "frk": "German Fraktur",
    "grc": "Greek, Ancient (-1453)",
    "guj": "Gujarati",
    "hat": "Haitian; Haitian Creole",
    "heb": "Hebrew",
    "hin": "Hindi",
    "hun": "Hungarian",
    "isl": "Icelandic",
    "ind": "Indonesian",
    "iku": "Inuktitut",
    "gle": "Irish",
    "ita": "Italian",
    "ita_old": "Italian - Old",
    "jpn": "Japanese",
    "jav": "Javanese",
    "kan": "Kannada",
    "kaz": "Kazakh",
    "kir": "Kirghiz; Kyrgyz",
    "kor": "Korean",
    "kur": "Kurdish",
    "lao": "Lao",
    "lat": "Latin",
    "lav": "Latvian",
    "lit": "Lithuanian",
    "mkd": "Macedonian",
    "mal": "Malayalam",
    "mar": "Marathi",
    "msa": "Malay",
    "mlt": "Maltese",
    "nep": "Nepali",
    "nor": "Norwegian",
    "ori": "Oriya",
    "pan": "Panjabi; Punjabi",
    "fas": "Persian",
    "pol": "Polish",
    "por": "Portuguese",
    "pus": "Pushto; Pashto",
    "ron": "Romanian; Moldavian; Moldovan",
    "rus": "Russian",
    "san": "Sanskrit",
    "srp": "Serbian",
    "srp_latn": "Serbian - Latin",
    "sin": "Sinhala; Sinhalese",
    "slk": "Slovak",
    "slv": "Slovenian",
    "spa": "Spanish; Castilian",
    "spa_old": "Spanish; Castilian - Old",
    "swa": "Swahili",
    "swe": "Swedish",
    "syr": "Syriac",
    "tgl": "Tagalog",
    "tgk": "Tajik",
    "tam": "Tamil",
    "tel": "Telugu",
    "tha": "Thai",
    "bod": "Tibetan",
    "tir": "Tigrinya",
    "tur": "Turkish",
    "uig": "Uighur; Uyghur",
    "ukr": "Ukrainian",
    "urd": "Urdu",
    "uzb": "Uzbek",
    "uzb_cyrl": "Uzbek - Cyrillic",
    "vie": "Vietnamese",
    "cym": "Welsh",
    "yid": "Yiddish",
}
# A live dict-keys view of LANGUAGE_CODES (not a copied list).
PYTESSERACT_ALLOWED_LANGUAGES = LANGUAGE_CODES.keys()

# Path of the Pylenium configuration file at the repository root.
PYLENIUM_CONFIG = os.path.join(SITE_ROOT_DIR, "pylenium.json")

# Maintenance mode state is stored in the cache. The admin site and the
# health-check, metrics and maintenance-mode URLs are exempt from it.
MAINTENANCE_MODE_STATE_BACKEND = "maintenance_mode.backends.CacheBackend"
MAINTENANCE_MODE_IGNORE_ADMIN_SITE = True
MAINTENANCE_MODE_IGNORE_URLS = ("/healthz*", "/metrics*", "/maintenance-mode*")

# Path of the axe-core script inside node_modules.
DEFAULT_AXE_SCRIPT = os.path.join(
    SITE_ROOT_DIR, "node_modules", "axe-core", "axe.min.js"
)

# Used for tracking accepts for the review rate limit
TRANSCRIPTION_ACCEPTED_TRACKING_KEY = "TRANSCRIPTION_ACCEPTED_{user_id}"

CONFIGURATION_CACHE_TIMEOUT = 3600  # One hour

# The number of assets to store for next_transcribabe/next_reviewable, per campaign
# ("TRANSCRIBABE" is the spelling used by the setting name itself.)
NEXT_TRANSCRIBABE_ASSET_COUNT = 100
NEXT_REVIEWABLE_ASSET_COUNT = NEXT_TRANSCRIBABE_ASSET_COUNT


================================================
FILE: concordia/settings_test.py
================================================
import logging
import os

import structlog

from .settings_template import *  # NOQA ignore=F405
from .settings_template import DATABASES

# Settings overrides used when running the test suite. Everything not set here
# comes from settings_template via the star import above.
DEBUG = False

# Connect to the test database as the default "postgres" user with no password.
DATABASES["default"].update({"PASSWORD": "", "USER": "postgres"})

# Keep channel traffic in-process so tests do not need an external broker.
CHANNEL_LAYERS = {
    "default": {
        "BACKEND": "channels.layers.InMemoryChannelLayer",
    }
}

# Every named cache is an independent in-memory cache; the distinct LOCATION
# values keep their contents separate from one another.
CACHES = {
    "default": {
        "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        "LOCATION": "default-location",
    },
    "view_cache": {
        "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        "LOCATION": "view-location",
    },
    "configuration_cache": {
        "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        "LOCATION": "configuration-location",
    },
    "visualization_cache": {
        "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        "LOCATION": "visualization-location",
    },
}

# Silence structured logging during tests: no processors, and only CRITICAL
# messages make it past the filtering bound logger.
structlog.configure(
    processors=[],
    wrapper_class=structlog.make_filtering_bound_logger(logging.CRITICAL),
    context_class=dict,
    logger_factory=structlog.stdlib.LoggerFactory(),
)

# These cause Celery to run tasks locally, synchronously and immediately
CELERY_TASK_ALWAYS_EAGER = True
CELERY_TASK_EAGER_PROPAGATES = True

DEFAULT_TO_EMAIL = "rsar@loc.gov"

# This file previously assigned CONCORDIA_DEVS twice (first to a one-address
# list, then to an empty list at the bottom). Only the final assignment ever
# took effect, so the effective value -- an empty list -- is kept here as the
# single definition.
CONCORDIA_DEVS = []

ALLOWED_HOSTS = ["127.0.0.1", "0.0.0.0"]  # nosec

# Discard outgoing mail instead of sending it.
EMAIL_BACKEND = "django.core.mail.backends.dummy.EmailBackend"

SESSION_ENGINE = "django.contrib.sessions.backends.cache"

RATELIMIT_ENABLE = False

# Turnstile settings
TURNSTILE_JS_API_URL = os.environ.get(
    "TURNSTILE_JS_API_URL", "https://challenges.cloudflare.com/turnstile/v0/api.js"
)
TURNSTILE_VERIFY_URL = os.environ.get(
    "TURNSTILE_VERIFY_URL", "https://challenges.cloudflare.com/turnstile/v0/siteverify"
)
TURNSTILE_SITEKEY = os.environ.get(
    "TURNSTILE_SITEKEY", "1x00000000000000000000BB"
)  # Always pass, invisible
TURNSTILE_SECRET = os.environ.get(
    "TURNSTILE_SECRET", "1x0000000000000000000000000000000AA"
)  # Always pass


================================================
FILE: concordia/signals/__init__.py
================================================


================================================
FILE: concordia/signals/handlers.py
================================================
import logging
from time import time
from typing import Any

import structlog
from asgiref.sync import AsyncToSync
from channels.layers import get_channel_layer
from django.conf import settings
from django.contrib.auth import login as auth_login
from django.contrib.auth.models import Group, User
from django.contrib.auth.signals import user_logged_in, user_login_failed
from django.core.mail import EmailMultiAlternatives
from django.db.models.signals import post_delete, post_save
from django.dispatch import receiver
from django.http import HttpRequest
from django.http.response import HttpResponseBase
from django.template import loader
from django_registration.signals import user_activated, user_registered
from django_structlog import signals
from flags.state import flag_enabled

from concordia.logging import ConcordiaLogger
from concordia.models import (
    Asset,
    Transcription,
    TranscriptionStatus,
    UserProfile,
)
from concordia.tasks.assets import calculate_difficulty_values
from concordia.tasks.useractivity import update_useractivity_cache
from concordia.utils.next_asset import remove_next_asset_objects

from .signals import reservation_obtained, reservation_released

ASSET_CHANNEL_LAYER = get_channel_layer()

logger = logging.getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@receiver(user_logged_in)
def clear_reservation_token(
    sender: type[User],
    user: User,
    request: HttpRequest,
    **kwargs: Any,
) -> None:
    """
    Drop any leftover reservation token from the session when a user logs in.

    Behavior:
        When the session holds a "reservation_token" entry, the entry is
        deleted and the session is saved, and the removal is reported through
        both the standard and the structured logger. When no such entry
        exists, a structured debug message records that fact instead. In
        either case a "successful login" message is logged at the end.

    Args:
        sender (type[User]): The User model class that sent the signal.
        user (User): The user who just authenticated.
        request (HttpRequest): The request whose session is inspected.
        **kwargs: Additional signal data (ignored).

    Returns:
        None
    """
    session = request.session
    try:
        # A missing key raises KeyError here, which routes to the "absent"
        # branch below.
        stale_token = session["reservation_token"]
        del session["reservation_token"]
        session.save()
        logger.info(
            "Clearing reservation token %s for %s on login", stale_token, user
        )
        structured_logger.info(
            "Reservation token cleared on login.",
            event_code="reservation_token_cleared",
            reservation_token=stale_token,
            user=user,
        )
    except KeyError:
        structured_logger.debug(
            "No reservation token found to clear on login.",
            event_code="reservation_token_absent_on_login",
            user=user,
        )

    logger.info("Successful user login with username %s", user)


@receiver(user_login_failed)
def handle_user_login_failed(
    sender: type[User],
    credentials: dict[str, Any],
    request: HttpRequest | None,
    **kwargs: Any,
) -> None:
    """
    Log a warning when a user login attempt fails.

    Behavior:
        Logs the attempted username. When the submitted credentials carry no
        "username" entry, the placeholder "<unknown>" is logged instead of
        raising, so a logging receiver can never turn a failed login into a
        server error.

    Args:
        sender (type[User]): The User model class that sent the signal.
        credentials (dict[str, Any]): Submitted credential data.
        request (HttpRequest | None): The current request if available.
        **kwargs: Additional signal data (ignored).

    Returns:
        None
    """
    # The credentials dict mirrors whatever keyword arguments were handed to
    # authenticate(), so a "username" key is not guaranteed (for example when
    # a backend authenticates by another identifier).
    attempted_username = credentials.get("username", "<unknown>")
    logger.warning("Failed user login with username %s", attempted_username)


@receiver(user_activated)
def user_successfully_activated(
    sender: type[User],
    user: User,
    request: HttpRequest | None,
    **kwargs: Any,
) -> None:
    """
    Run follow-up work once a user account has been activated.

    Behavior:
        Logs the activation, logs the user in when a request accompanies the
        signal and, if the "SEND_WELCOME_EMAIL" flag is enabled, sends a
        welcome email with both plain-text and HTML bodies.

    Args:
        sender (type[User]): The User model class that sent the signal.
        user (User): The activated user.
        request (HttpRequest | None): The current request, or None when the
            activation came from a password reset.
        **kwargs: Additional signal data (ignored).

    Returns:
        None
    """
    logger.info("Received user activation signal for %s", user.username)

    # The password reset form activates and logs the user in by itself and
    # sends None for the request. A regular activation does carry a request,
    # and should end with the user logged in just the same.
    if request:
        auth_login(request, user)

    if not flag_enabled("SEND_WELCOME_EMAIL"):
        return

    # Render the three email parts from their templates (no context needed).
    plain_body = loader.get_template("emails/welcome_email_body.txt").render()
    rich_body = loader.get_template("emails/welcome_email_body.html").render()
    subject_line = loader.get_template("emails/welcome_email_subject.txt").render()

    welcome_email = EmailMultiAlternatives(
        # Trailing whitespace/newlines from the template are stripped.
        subject=subject_line.rstrip(),
        body=plain_body,
        from_email=settings.DEFAULT_FROM_EMAIL,
        to=[user.email],
        reply_to=[settings.DEFAULT_FROM_EMAIL],
    )
    welcome_email.attach_alternative(rich_body, "text/html")
    welcome_email.send()


@receiver(user_registered)
def add_user_to_newsletter(
    sender: type[User],
    user: User,
    request: HttpRequest,
    **kwargs: Any,
) -> None:
    """
    Put a freshly registered user in the newsletter group when they opted in.

    Behavior:
        The user is added only when the registration form data contains a
        truthy "newsletterOptIn" value. The group is looked up by
        ``settings.NEWSLETTER_GROUP_NAME``.

    Args:
        sender (type[User]): The User model class that sent the signal.
        user (User): The newly registered user.
        request (HttpRequest): The registration request containing form data.
        **kwargs: Additional signal data (ignored).

    Returns:
        None
    """
    form_data = request.POST

    # Bail out unless the newsletter checkbox was submitted with a value.
    if (
        not form_data
        or "newsletterOptIn" not in form_data
        or not form_data["newsletterOptIn"]
    ):
        return

    group = Group.objects.get(name=settings.NEWSLETTER_GROUP_NAME)
    group.user_set.add(user)
    group.save()


@receiver(post_save, sender=Transcription)
def update_asset_status(
    sender: type[Transcription],
    *,
    instance: Transcription,
    **kwargs: Any,
) -> None:
    """
    Keep an asset's transcription status in step with its latest transcription.

    Behavior:
        Works out the status implied by the saved transcription (rejected
        takes precedence, then accepted, then submitted; anything else is
        in progress). If the saved transcription is not the asset's latest
        one, the situation is logged as a warning and nothing is changed.
        Otherwise the asset is validated and saved with the new status.

    Side Effects:
        - Saves the `Asset` with an updated `transcription_status`.
        - Calls `remove_next_asset_objects` with the asset's id.
        - Calls `calculate_difficulty_values` for the saved asset.

    Args:
        sender (type[Transcription]): The Transcription model class.
        instance (Transcription): The saved transcription instance.
        **kwargs: Additional signal data (ignored).

    Returns:
        None
    """
    logger.info("update_asset_status for %s", instance.id)

    asset = instance.asset

    # Rejected transcriptions (and those with no flag at all) leave the asset
    # in progress; acceptance outranks submission.
    derived_status = TranscriptionStatus.IN_PROGRESS
    if not instance.rejected:
        if instance.accepted:
            derived_status = TranscriptionStatus.COMPLETED
        elif instance.submitted:
            derived_status = TranscriptionStatus.SUBMITTED

    # Only the asset's newest transcription may drive its status.
    newest_transcription = asset.latest_transcription()
    if instance != newest_transcription:
        # An older entry in the asset's history was touched. That should only
        # happen in extraordinary circumstances and has no logical bearing on
        # the asset's status, so record it and stop here.
        logger.warning(
            "An older transcription (%s) was updated for asset %s (%s). This "
            "would have updated the status to %s, but this was prevented and "
            "the status remained %s. The current latest_transcription is %s. "
            "The sender was %s.",
            instance.id,
            asset,
            asset.id,
            derived_status,
            asset.transcription_status,
            newest_transcription,
            sender,
        )
        return

    logger.info(
        "Updating asset status for %s (%s) from %s to %s",
        asset,
        asset.id,
        asset.transcription_status,
        derived_status,
    )

    asset.transcription_status = derived_status
    asset.full_clean()
    asset.save()

    logger.info("Status for %s (%s) updated", asset, asset.id)

    remove_next_asset_objects(asset.id)

    single_asset_queryset = Asset.objects.filter(pk=asset.pk)
    calculate_difficulty_values(single_asset_queryset)


@receiver(post_save, sender=Asset)
def send_asset_update(
    *,
    instance: Asset,
    **kwargs: Any,
) -> None:
    """
    Publish the saved asset's state to the "asset_updates" channel group.

    Behavior:
        The message carries the asset's primary key, transcription status and
        difficulty, plus the text, id and submitting user's id of the
        transcription with the highest primary key (or None when the asset
        has no transcriptions).

    Args:
        instance (Asset): The saved asset.
        **kwargs: Additional signal data (ignored).

    Returns:
        None
    """
    newest = instance.transcription_set.order_by("-pk").first()
    transcription_payload = (
        {
            "text": newest.text,
            "id": newest.pk,
            "submitted_by": newest.user.pk,
        }
        if newest
        else None
    )

    # group_send is a coroutine function; wrap it so it can be called from
    # this synchronous signal handler.
    broadcast = AsyncToSync(ASSET_CHANNEL_LAYER.group_send)
    broadcast(
        "asset_updates",
        {
            "type": "asset_update",
            "asset_pk": instance.pk,
            "status": instance.transcription_status,
            "difficulty": instance.difficulty,
            "latest_transcription": transcription_payload,
        },
    )


@receiver(reservation_obtained)
def send_asset_reservation_obtained(sender: Any, **kwargs: Any) -> None:
    """
    Log a newly obtained asset reservation and broadcast it to listeners.

    Args:
        sender (Any): The caller that obtained the reservation.
        **kwargs: Must contain "asset_pk" and "reservation_token"; a missing
            key raises KeyError before anything is logged or sent.

    Returns:
        None
    """
    asset_pk = kwargs["asset_pk"]
    token = kwargs["reservation_token"]

    logger.info(
        "Reservation obtained by %s for asset %s with token %s",
        sender,
        asset_pk,
        token,
    )

    structured_logger.info(
        "Asset reservation obtained.",
        event_code="asset_reservation_obtained",
        asset_pk=asset_pk,
        reservation_token=token,
        sender=sender,
    )

    send_asset_reservation_message(
        sender=sender,
        message_type="asset_reservation_obtained",
        asset_pk=asset_pk,
        reservation_token=token,
    )


@receiver(reservation_released)
def send_asset_reservation_released(sender: Any, **kwargs: Any) -> None:
    """
    Log a released asset reservation and broadcast it to listeners.

    Args:
        sender (Any): The caller that released the reservation.
        **kwargs: Must contain "asset_pk" and "reservation_token"; a missing
            key raises KeyError before anything is logged or sent.

    Returns:
        None
    """
    asset_pk = kwargs["asset_pk"]
    token = kwargs["reservation_token"]

    logger.info(
        "Reservation released by %s for asset %s with token %s",
        sender,
        asset_pk,
        token,
    )
    structured_logger.info(
        "Asset reservation released.",
        event_code="asset_reservation_released",
        asset_pk=asset_pk,
        reservation_token=token,
        sender=sender,
    )
    send_asset_reservation_message(
        sender=sender,
        message_type="asset_reservation_released",
        asset_pk=asset_pk,
        reservation_token=token,
    )


def send_asset_reservation_message(
    *,
    sender: Any,
    message_type: str,
    asset_pk: int,
    reservation_token: str,
) -> None:
    """
    Emit a reservation event on the "asset_updates" channel group.

    Behavior:
        Writes a structured debug log entry, then sends a message containing
        the message type, asset primary key, reservation token and the
        current timestamp (``time()``) under the "sent" key.

    Args:
        sender (Any): The caller dispatching the message (logged only).
        message_type (str): The channel message type to emit.
        asset_pk (int): The asset primary key.
        reservation_token (str): The reservation token value.

    Returns:
        None
    """
    structured_logger.debug(
        "Dispatching reservation message to channel layer.",
        event_code="asset_reservation_channel_dispatch",
        message_type=message_type,
        asset_pk=asset_pk,
        reservation_token=reservation_token,
        sender=sender,
    )

    # group_send is a coroutine function; wrap it for synchronous use.
    dispatch = AsyncToSync(ASSET_CHANNEL_LAYER.group_send)
    payload = {
        "type": message_type,
        "asset_pk": asset_pk,
        "reservation_token": reservation_token,
        "sent": time(),
    }
    dispatch("asset_updates", payload)


@receiver(post_delete, sender=Asset)
def remove_file_from_s3(
    sender: type[Asset],
    instance: Asset,
    using: str,
    **kwargs: Any,
) -> None:
    """
    Delete the asset's stored image file after the asset itself is removed.

    Behavior:
        Calls ``delete(save=False)`` on the asset's ``storage_image`` field
        file. ``save=False`` keeps the field from re-saving the model
        instance, which has already been deleted when this signal fires.

    Note:
        The function name refers to S3, but the code only goes through the
        ``storage_image`` field; the file is removed from whichever storage
        that field uses (presumably S3 in deployed environments -- confirm
        against the storage configuration).

    Args:
        sender (type[Asset]): The Asset model class.
        instance (Asset): The asset being deleted.
        using (str): The database alias used for the operation (unused).
        **kwargs: Additional signal data (ignored).

    Returns:
        None
    """
    instance.storage_image.delete(save=False)


@receiver(post_save, sender=settings.AUTH_USER_MODEL)
def create_user_profile(
    sender: Any,
    instance: Any,
    *args: Any,
    **kwargs: Any,
) -> None:
    """
    Make sure every saved user has an accompanying UserProfile.

    Behavior:
        Runs on every save of the user model. When the instance already
        exposes a ``profile`` attribute nothing happens; otherwise a new
        `UserProfile` is created for it.

    Args:
        sender (Any): The user model class.
        instance (Any): The saved user instance.
        *args: Unused positional signal arguments.
        **kwargs: Unused keyword signal arguments.

    Returns:
        None
    """
    profile_exists = hasattr(instance, "profile")
    if profile_exists:
        return

    UserProfile.objects.create(user=instance)


@receiver(post_save, sender=Transcription)
def on_transcription_save(
    sender: type[Transcription],
    instance: Transcription,
    **kwargs: Any,
) -> None:
    """
    Record user activity whenever a transcription is created or reviewed.

    Behavior:
        - A newly created transcription counts as a "transcribe" action by
          the transcription's user.
        - Otherwise, a transcription with a reviewer counts as a "review"
          action by that reviewer.
        - Anything else, and any activity by the "anonymous" user, is
          ignored.
        - Qualifying activity is logged and handed to
          `update_useractivity_cache` via ``.delay()``.

    Args:
        sender (type[Transcription]): The Transcription model class.
        instance (Transcription): The saved transcription.
        **kwargs: Signal kwargs; "created" indicates a newly created instance.

    Returns:
        None
    """
    if kwargs.get("created", False):
        actor, activity = instance.user, "transcribe"
    elif instance.reviewed_by:
        actor, activity = instance.reviewed_by, "review"
    else:
        # Neither a creation nor a review: nothing to record.
        return

    if actor is None or actor.username == "anonymous":
        return

    campaign = instance.asset.item.project.campaign

    structured_logger.info(
        "Transcription saved; updating user activity cache.",
        event_code="transcription_useractivity_triggered",
        transcription=instance,
        user=actor,
        activity_type=activity,
        campaign=campaign,
    )
    update_useractivity_cache.delay(
        actor.id,
        campaign.id,
        activity,
    )


@receiver(signals.update_failure_response)
@receiver(signals.bind_extra_request_finished_metadata)
def add_request_id_to_response(
    response: HttpResponseBase,
    logger: ConcordiaLogger,
    **kwargs: Any,
) -> None:
    """
    Attach an `X-Request-ID` header to responses that will not be cached.

    Behavior:
        The response's `Cache-Control` header is inspected case-insensitively.
        A response counts as cacheable when it mentions "public" or "max-age"
        and none of "private", "no-store" or "no-cache". Cacheable responses
        are left alone so a cache never stores one request's identifier and
        replays it for another. For every other response the request
        identifier is read from the logger's merged structlog context and
        written to the header.

    Args:
        response (HttpResponseBase): The response object to modify.
        logger (ConcordiaLogger): A logger object with bound context.
        **kwargs: Additional data (unused).

    Returns:
        None
    """
    cache_control = response.get("Cache-Control", "").lower()

    public_markers = ("public", "max-age")
    private_markers = ("private", "no-store", "no-cache")

    looks_public = any(marker in cache_control for marker in public_markers)
    looks_private = any(marker in cache_control for marker in private_markers)

    if looks_private or not looks_public:
        merged_context = structlog.contextvars.get_merged_contextvars(logger)
        response["X-Request-ID"] = merged_context["request_id"]


================================================
FILE: concordia/signals/signals.py
================================================
"""
Signals emitted by Concordia to announce reservation lifecycle events.

Signals:
    reservation_obtained (Signal): Emitted when an asset reservation is created.
        Sender:
            The actor that initiated the reservation (for example, a view).
        Keyword arguments:
            asset_pk (int): Primary key of the reserved asset.
            reservation_token (str): Reservation token.

    reservation_released (Signal): Emitted when an asset reservation is released.
        Sender:
            The actor that released the reservation.
        Keyword arguments:
            asset_pk (int): Primary key of the asset whose reservation was released.
            reservation_token (str): The reservation token that was released.
"""

from django.dispatch import Signal

# Sent when an asset reservation is created. Receivers are given ``asset_pk``
# and ``reservation_token`` keyword arguments.
reservation_obtained: Signal = Signal()

# Sent when an asset reservation is released. Receivers are given ``asset_pk``
# and ``reservation_token`` keyword arguments.
reservation_released: Signal = Signal()


================================================
FILE: concordia/static/admin/custom-inline.js
================================================
/* global jQuery */

(function ($) {
    /**
     * Locate the form field that opened a related-lookup popup.
     *
     * The popup window's name is tried as an element id first. If that finds
     * nothing, a trailing "__<number>" suffix is stripped and the lookup is
     * retried.
     * NOTE(review): the fallback assumes the admin appends a popup index of
     * that shape to the window name -- confirm against the
     * RelatedObjectLookups.js shipped with the installed Django version.
     *
     * @param {Window} win - The popup window being dismissed.
     * @returns {HTMLElement|null} The matching field, or null if none exists.
     */
    function findLookupField(win) {
        var name = String(win.name || '');
        return (
            document.getElementById(name) ||
            document.getElementById(name.replace(/__\d+$/, ''))
        );
    }

    /**
     * After a Card is picked in a related-lookup popup, fetch its title and
     * show it as a link next to the field that opened the popup.
     *
     * @param {Window} win - The popup window; its name identifies the field.
     * @param {string|number} chosenId - Primary key of the chosen Card.
     */
    function triggerChangeOnField(win, chosenId) {
        var element = findLookupField(win);

        // Without a field (or a parent to attach the label to) there is
        // nothing to update, so skip the request instead of failing inside
        // the success callback.
        if (!element || !element.parentNode) {
            return;
        }

        $.ajax({
            url: '/admin/serialized_object/',
            data: {
                model_name: 'Card',
                object_id: chosenId,
                field_name: 'title',
            },
            dataType: 'json',
            success: function (data) {
                // Build <strong><a href="...">title</a></strong>; the title
                // goes in as a text node so it is never parsed as HTML.
                const newContent = document.createTextNode(data.title);
                var a = document.createElement('a');
                a.href = '/admin/card/' + chosenId + '/change/';
                a.append(newContent);
                var newStrong = document.createElement('strong');
                newStrong.append(a);

                // Replace an existing label if there is one, else add it.
                var strong = element.parentNode.querySelector('strong');
                if (strong) {
                    strong.replaceWith(newStrong);
                } else {
                    element.parentNode.append(newStrong);
                }
            },
        });
    }

    // Vite
    window.triggerChangeOnField = triggerChangeOnField;

    $(document).ready(function () {
        // Wrap the admin's popup-dismissal hook so the label is refreshed
        // after the stock behaviour runs.
        // https://stackoverflow.com/a/33937138/10320488
        window.ORIGINAL_dismissRelatedLookupPopup =
            window.dismissRelatedLookupPopup;
        window.dismissRelatedLookupPopup = function (win, chosenId) {
            window.ORIGINAL_dismissRelatedLookupPopup(win, chosenId);
            triggerChangeOnField(win, chosenId);
        };
    });
})(jQuery);


================================================
FILE: concordia/static/admin/editor-preview.js
================================================
/* global CodeMirror prettier prettierPlugins django */

(function ($) {
    /**
     * Initializes CodeMirror with a side-by-side preview pane and Prettier support.
     *
     * The textarea is replaced by a CodeMirror editor, an <iframe> preview is
     * inserted after it and a "Run Prettier" button is added to the form row.
     *
     * @param {HTMLTextAreaElement} textarea - The textarea to enhance.
     * @param {string} flavor - 'html' or 'markdown'. Any other value throws.
     */
    var setupCodeMirror = function (textarea, flavor) {
        // Turns editor content into the HTML shown in the preview.
        var converter;
        switch (flavor) {
            case 'html': {
                converter = (input) => input;
                break;
            }
            case 'markdown': {
                var md = new window.remarkable.Remarkable({html: true});
                converter = (input) => md.render(input);
                break;
            }
            default: {
                throw 'Unknown code flavor: ' + flavor;
            }
        }

        var $formRow = $(textarea).parents('.form-row').first();
        $formRow.addClass('codemirror-with-preview');

        var preview = $('<iframe>')
            // Firefox and, reportedly, Safari have a quirk where the <iframe> body
            // is not correctly available until it “loads” the blank page:
            .on('load', function () {
                var frameDocument = this.contentDocument;
                frameDocument.open();
                frameDocument.write(
                    '<html><body><main>Loading…</main></body></html>',
                );
                frameDocument.close();

                // Copy the page's preview <head> template (styles etc.) into
                // the frame so the preview is rendered with it.
                var previewTemplate = document.querySelector(
                    'template#preview-head',
                ).content;

                for (const node of previewTemplate.childNodes) {
                    frameDocument.head.append(
                        frameDocument.importNode(node, true),
                    );
                }

                queueUpdate();
            })
            .insertAfter(textarea)
            .get(0);

        // Re-render the editor content into the preview's <main> element.
        function updatePreview() {
            var main = preview.contentDocument.body.querySelector('main');
            if (main) {
                main.innerHTML = converter(editor.getValue());
            }
        }

        var editorMode = flavor;
        if (flavor == 'html') {
            // CodeMirror actually treats HTML as a subset of XML:
            editorMode = {
                name: 'xml',
                htmlMode: true,
            };
        }

        var editor = CodeMirror.fromTextArea(textarea, {
            mode: editorMode,
            lineNumbers: true,
            highlightFormatting: true,
            indentUnit: 4,
            lineWrapping: true,
        });

        // Line widgets currently showing Prettier errors in the editor.
        var editorLineWidgets = [];

        var queuedUpdate;

        editor.on('change', queueUpdate);

        // Coalesce bursts of changes into one preview update per frame.
        function queueUpdate() {
            if (queuedUpdate) {
                window.cancelAnimationFrame(queuedUpdate);
            }
            queuedUpdate = window.requestAnimationFrame(updatePreview);
        }

        $('<button class="button">Run Prettier</button>')
            .prependTo($formRow)
            .on('click', function (event) {
                event.preventDefault();

                // Clear the feedback left by any previous run.
                $formRow.find('.errornote').remove();

                for (const widget of editorLineWidgets) {
                    editor.removeLineWidget(widget);
                }
                // Forget the removed widgets so the list does not grow with
                // every failed run.
                editorLineWidgets.length = 0;

                try {
                    var pretty = prettier.format(editor.getValue(), {
                        parser: flavor,
                        plugins: prettierPlugins,
                        printWidth: 120,
                        tabWidth: 4,
                    });

                    editor.setValue(pretty);
                    queueUpdate();
                } catch (error) {
                    var message =
                        error && error.message ? error.message : String(error);

                    $('<p class="errornote">')
                        .text(String(error))
                        .appendTo($formRow);

                    // Only errors that carry a source position can be pinned
                    // to an editor line; others are reported by the note
                    // above alone.
                    var hasLocation =
                        error &&
                        error.loc &&
                        error.loc.start &&
                        typeof error.loc.start.line === 'number';
                    if (!hasLocation) {
                        return;
                    }

                    var lineWarning = document.createElement('div');
                    lineWarning.style.whiteSpace = 'nowrap';
                    lineWarning.style.overflow = 'hidden';

                    // append() returns undefined, so the icon must be built
                    // and styled before it is added to the warning.
                    var icon = document.createElement('span');
                    icon.style.marginRight = '1rem';
                    icon.textContent = '⚠️';
                    lineWarning.append(icon, document.createTextNode(message));

                    editorLineWidgets.push(
                        editor.addLineWidget(
                            // Reported lines are 1-based, editor lines 0-based.
                            error.loc.start.line - 1,
                            lineWarning,
                            {coverGutter: false, noHScroll: true},
                        ),
                    );
                }
            });
    };

    // Auto-initialize specifically for the SimplePage 'body' field: once the
    // DOM is ready, enhance the #id_body textarea as a markdown editor.
    $(document).ready(function () {
        var textArea = document.getElementById('id_body');

        if (textArea) {
            setupCodeMirror(textArea, 'markdown');
        } else {
            // The message names the id that was actually looked up.
            console.warn(
                'CodeMirror: Element #id_body not found on this page.',
            );
        }
    });
})(django.jQuery);


================================================
FILE: concordia/static/js/src/about-accordions.js
================================================
import $ from 'jquery';

$(function () {
    // Each pair is [toggle control selector, selector of the content that
    // the control shows or hides].
    const accordions = [
        ['.toggle-blog-posts', '.blog-content'],
        ['.toggle-publications', '.publications-content'],
        ['.toggle-press', '.press-content'],
        ['.toggle-program-history', '.program-history'],
    ];

    for (const [toggleSelector, contentSelector] of accordions) {
        $(toggleSelector).click(function (event) {
            // Flip the plus/minus icon inside the control that was clicked,
            // then show or hide the matching content.
            $('.accordion-icon', event.delegateTarget).toggleClass(
                'fa-plus-square fa-minus-square',
            );
            $(contentSelector).toggle();
        });
    }
});


================================================
FILE: concordia/static/js/src/asset-reservation.js
================================================
import $ from 'jquery';
import {Modal} from 'bootstrap';
import {buildErrorMessage, displayHtmlMessage, displayMessage} from './base.js';
import * as Sentry from '@sentry/browser';

// Reservation settings are read from the data-* attributes of the
// #asset-reservation-data element. Pages without that element get an empty
// object, so every lookup on assetReservationData is simply undefined there.
const assetReservationElement = document.getElementById(
    'asset-reservation-data',
);
const assetReservationData = assetReservationElement
    ? assetReservationElement.dataset
    : {};

/**
 * Try to reserve an asset, and keep renewing the reservation while it holds.
 *
 * On success the editor is marked as holding the reservation and another
 * attempt is scheduled 60 seconds later. On failure the outcome depends on
 * the HTTP status: 409 and 408 mean the page cannot be reserved right now,
 * anything else is reported as a generic error.
 *
 * @param {string} reservationURL - Endpoint that receives the POST.
 * @param {string} findANewPageURL - Link offered to reviewers on a 409.
 * @param {string} actionType - 'transcribe' selects the modal on a 409.
 */
function attemptToReserveAsset(reservationURL, findANewPageURL, actionType) {
    const $editor = $('#transcription-editor');

    // Bootstrap 5 does not initialise a modal just because something tries to
    // show it; until a Modal instance exists the markup is ordinary HTML and
    // the Bootstrap controls do nothing. Reuse the instance when there is
    // one, otherwise create it.
    const modalElement = document.getElementById(
        'asset-reservation-failure-modal',
    );
    const failureModal =
        Modal.getInstance(modalElement) || new Modal(modalElement);

    // Record on the editor whether the reservation is held and let the UI
    // react to the change.
    const setReservationState = function (isHeld) {
        $editor.data('hasReservation', isHeld).trigger('update-ui-state');
    };

    // Send the failure to Sentry under a transaction name ending in the URL.
    const reportToSentry = function (error, description) {
        Sentry.captureException(error, function (scope) {
            scope.setTransactionName(description + reservationURL);
        });
    };

    const onReserved = function () {
        setReservationState(true);

        // If the asset was successfully reserved, continue reserving it
        window.setTimeout(
            attemptToReserveAsset,
            60_000,
            reservationURL,
            findANewPageURL,
            actionType,
        );
    };

    const onFailure = function (jqXHR, textStatus, errorThrown) {
        const status = jqXHR.status;

        if (status == 409 && actionType == 'transcribe') {
            setReservationState(false);
            failureModal.show();
            return;
        }

        if (status == 409) {
            displayHtmlMessage(
                'warning',
                `There are other reviewers on this page. <a href="${findANewPageURL}">Find a new page to review</a>`,
                'transcription-reservation',
            );
            reportToSentry(
                errorThrown,
                '409 error when attempting to reserve asset at ',
            );
            return;
        }

        if (status == 408) {
            setReservationState(false);
            failureModal.show();
            reportToSentry(
                errorThrown,
                '408 error when attempting to reserve asset at ',
            );
            return;
        }

        displayMessage(
            'error',
            'Unable to reserve this page: ' +
                buildErrorMessage(jqXHR, textStatus, errorThrown),
            'transcription-reservation',
        );
        reportToSentry(
            errorThrown,
            'Error when attempting to reserve asset at ',
        );
    };

    $.ajax({
        url: reservationURL,
        type: 'POST',
        dataType: 'json',
    })
        .done(onReserved)
        .fail(onFailure);
}

// Register the unload handler once per window; the flag on `window` prevents
// a second registration if this module is evaluated again.
if (!window._assetReservationUnloadBound) {
    // Tell the server to release the reservation as the page goes away.
    const releaseReservation = function () {
        const releaseUrl = assetReservationData.reserveAssetUrl;
        if (!releaseUrl) {
            return;
        }

        const payload = {
            release: true,
            csrfmiddlewaretoken: $('input[name="csrfmiddlewaretoken"]').val(),
        };

        // Beacon is the reliable way to send data during unload; browsers
        // without it (IE11) fall back to a regular AJAX POST.
        if ('sendBeacon' in navigator) {
            const formBody = new Blob([$.param(payload)], {
                type: 'application/x-www-form-urlencoded',
            });
            navigator.sendBeacon(releaseUrl, formBody);
            return;
        }

        $.ajax({
            url: releaseUrl,
            type: 'POST',
            data: payload,
        });
    };

    window.addEventListener('beforeunload', releaseReservation);
    window._assetReservationUnloadBound = true;
}

function reserveAssetForEditing() {
    /*
        Attempt a 'transcribe' reservation against the configured reservation
        URL. Does nothing when assetReservationData has no reserveAssetUrl.
    */
    const reservationUrl = assetReservationData.reserveAssetUrl;
    if (!reservationUrl) {
        return;
    }
    attemptToReserveAsset(reservationUrl, '', 'transcribe');
}

// Once the DOM is ready, reserve the asset immediately when the page
// configuration sets reserveForEditing.
$(() => {
    if (!assetReservationData.reserveForEditing) {
        return;
    }
    reserveAssetForEditing();
});

export {reserveAssetForEditing};


================================================
FILE: concordia/static/js/src/banner.js
================================================
// Dismissed banners are remembered in localStorage under the banner element's
// id. On load, every stored key beginning with "banner-" is treated as an
// element id and the matching alert is hidden again.
var storage;
var storageAvailable;
try {
    // Merely reading window.localStorage can throw (for example when storage
    // access is blocked), so the lookup itself has to live inside the try.
    storage = window.localStorage;
    const x = '__storage_test__';
    storage.setItem(x, x);
    storage.removeItem(x);
    storageAvailable = true;
} catch {
    storageAvailable = false;
}
if (storageAvailable) {
    for (var key in storage) {
        if (key.startsWith('banner-')) {
            const banner = document.getElementById(key);
            if (banner && banner.classList.contains('alert')) {
                banner.setAttribute('hidden', 'hidden');
            }
        }
    }
}
const noInterfaceBanner = document.getElementById('no-interface-banner');
if (noInterfaceBanner) {
    noInterfaceBanner.addEventListener('click', (event) => {
        // The element that carries the id is two levels above the click target
        const parent = event.target.parentElement;
        var banner = parent && parent.parentElement;
        if (banner && banner.hasAttribute('id')) {
            if (storageAvailable) {
                try {
                    storage.setItem(banner.id, 'true');
                } catch {
                    // Persisting the dismissal is best-effort (e.g. quota
                    // exceeded); the banner is still hidden for this page view.
                }
            }
            banner.classList.remove('d-flex');
            banner.setAttribute('hidden', 'hidden');
        }
    });
}


================================================
FILE: concordia/static/js/src/base.js
================================================
import 'bootstrap';
import Cookies from 'js-cookie';
import $ from 'jquery';
import screenfull from 'screenfull';
import {Popover} from 'bootstrap';
import * as Sentry from '@sentry/browser';

(function () {
    /*
        Configure jQuery to use CSRF tokens automatically — see
        https://docs.djangoproject.com/en/2.1/ref/csrf/#setting-the-token-on-the-ajax-request

        The cookie is read once, when this module is evaluated; if it is
        missing no global AJAX hook is installed at all.
    */
    const csrfToken = Cookies.get('csrftoken');
    if (!csrfToken) {
        return;
    }

    // these HTTP methods do not require CSRF protection
    const safeMethodPattern = /^(GET|HEAD|OPTIONS|TRACE)$/;

    $.ajaxSetup({
        // A regular function is required: `this` is read for crossDomain
        beforeSend: function (xhr, settings) {
            if (safeMethodPattern.test(settings.type) || this.crossDomain) {
                return;
            }
            xhr.setRequestHeader('X-CSRFToken', csrfToken);
        },
    });
})();

// After the document has been parsed, create a Popover instance for every
// element that carries data-bs-toggle="popover".
document.addEventListener('DOMContentLoaded', () => {
    document
        .querySelectorAll('[data-bs-toggle="popover"]')
        .forEach((triggerElement) => {
            new Popover(triggerElement);
        });
});

// eslint-disable-next-line no-unused-vars
export function buildErrorMessage(jqXHR, textStatus, errorThrown) {
    /*
        Construct a nice error message using optional JSON response context.

        Returns jqXHR.responseJSON.error when the response carries a truthy
        "error" value; otherwise returns textStatus and errorThrown joined by
        a single space.
    */
    const serverError = jqXHR.responseJSON && jqXHR.responseJSON.error;
    if (serverError) {
        return serverError;
    }
    return textStatus + ' ' + errorThrown;
}

export function displayHtmlMessage(level, message, uniqueId) {
    /*
        Display a dismissable message at a level which will match one of the
        Bootstrap alert classes
        (https://getbootstrap.com/docs/5.3/components/alerts/)

        message is either an HTML string, which is rendered as markup, or a
        DOM Text node, whose content is inserted as literal text and is never
        parsed as HTML.

        If provided, uniqueId will be used to remove any existing elements which
        have that ID, allowing old messages to be replaced automatically.

        Returns the jQuery object for the alert that was added.
    */
    let $messages = $('#messages');
    $messages.removeAttr('hidden');

    let $newMessage = $messages
        .find('#message-template .alert')
        .clone()
        .removeAttr('hidden')
        .removeAttr('id');

    if (level == 'error') {
        // Class for red background
        level = 'danger';
    }

    $newMessage.addClass('alert-' + level);

    if (uniqueId) {
        $('#' + uniqueId).remove();
        $newMessage.attr('id', uniqueId);
    }

    // Add a span to the message to ensure justified
    // styles don't end up splitting the text
    const $content = $('<span>');
    if (message instanceof Text) {
        // A Text node means the caller wants plain text. Concatenating its
        // content into markup would let "<" and "&" in (possibly
        // server-supplied) messages be interpreted as HTML.
        $content.text(message.textContent);
    } else {
        $content.html(String(message));
    }
    $newMessage.prepend($content);

    $messages.append($newMessage);

    return $newMessage;
}

export function displayMessage(level, message, uniqueId) {
    /*
        Wrap message in a DOM Text node and hand it to displayHtmlMessage with
        the same level and uniqueId. Returns whatever displayHtmlMessage
        returns.
    */
    const textNode = document.createTextNode(message);
    return displayHtmlMessage(level, textNode, uniqueId);
}

function isOutdatedBrowser() {
    /*
        See https://caniuse.com/#feat=css-supports-api for the full matrix but
        by now this is effectively the same as testing for IE11 vs. all of the
        evergreen browsers.

        Returns true when the global CSS object is missing or has no truthy
        `supports` member.
    */
    const hasSupportsApi = typeof CSS != 'undefined' && CSS.supports;
    return !hasSupportsApi;
}

function loadLegacyPolyfill(scriptUrl, callback) {
    /*
        Append a <script> element for scriptUrl to document.body, with
        callback installed as its onload handler. The properties are assigned
        in the order listed, so src is set last.
    */
    const scriptElement = Object.assign(document.createElement('script'), {
        type: 'text/javascript',
        async: false,
        onload: callback,
        src: scriptUrl,
    });
    document.body.append(scriptElement);
}

// Warn visitors on outdated browsers (at most once every seven days after the
// warning has been dismissed) and load the CSS variables ponyfill for them.
// The event name must be 'DOMContentLoaded'; no 'DOMContent' event exists, so
// a listener registered under that name would never run.
document.addEventListener('DOMContentLoaded', () => {
    if (isOutdatedBrowser()) {
        var theMessage =
            'You are using an outdated browser. This website fully supports the current ' +
            'version of every major browser ' +
            '(Microsoft Edge, Google Chrome, Mozilla Firefox, and Apple Safari). See ' +
            'our <a href="/help-center/#browserSupport">browser support policy</a> ' +
            'for more information.';

        var warningCookie = 'outdated-browser-message-hidden';
        var warningLastShown = 0;
        try {
            var cookie = Cookies.get(warningCookie);
            if (cookie) {
                var parsedTimestamp = Number.parseInt(cookie, 10);
                // A malformed cookie parses to NaN, which would make the
                // comparison below false forever; treat it as "never shown".
                if (!Number.isNaN(parsedTimestamp)) {
                    warningLastShown = parsedTimestamp;
                }
            }
        } catch (error) {
            Sentry.captureException(error);
        }

        // Date.now() and the stored cookie value are in milliseconds, so the
        // seven-day interval has to be expressed in milliseconds as well.
        var warningIntervalMs = 7 * 86_400_000;

        if (Date.now() - warningLastShown > warningIntervalMs) {
            displayHtmlMessage('danger', theMessage).on(
                'closed.bs.alert',
                function () {
                    // Remember when the visitor dismissed the warning
                    Cookies.set(warningCookie, Date.now());
                },
            );
        }

        /*
            CSS variables are supported by everything except IE11:
            https://caniuse.com/#feat=css-variables
        */
        loadLegacyPolyfill(
            'https://cdn.jsdelivr.net/npm/css-vars-ponyfill@2.0.2/dist/css-vars-ponyfill.min.js',
            function () {
                /* global cssVars */
                cssVars({
                    legacyOnly: true,
                    preserveStatic: true,
                    include: 'link[rel="stylesheet"][href^="/static/"]',
                });
            },
        );
    }
});

// Reveal the fullscreen button only when screenfull reports that fullscreen
// is enabled; clicking it toggles fullscreen for the element whose id is
// given by the button's data-bs-target attribute.
if (screenfull.isEnabled) {
    const $fullscreenButton = $('#go-fullscreen');
    $fullscreenButton.removeAttr('hidden');
    // A regular function is required: `this` is the clicked button
    $fullscreenButton.on('click', function (event) {
        event.preventDefault();

        if (screenfull.isFullscreen) {
            screenfull.exit();
            return;
        }
        screenfull.request(document.getElementById(this.dataset.bsTarget));
    });
}

function appendAccountItem(link, $menu) {
    /*
        Add one entry to the account dropdown menu.

        Links whose type is not 'post' become plain anchors. 'post' links
        become a submit button bound to a hidden form appended to
        document.body, carrying the CSRF token plus any extra link.fields.
    */
    const isPostLink = link.type === 'post';

    if (!isPostLink) {
        const $anchor = $('<a>');
        $anchor.addClass('dropdown-item');
        $anchor.attr('href', link.url);
        $anchor.text(link.title);
        $anchor.appendTo($menu);
        return;
    }

    const csrfToken = Cookies.get('csrftoken');
    // Derive the form id from the lowercased title, with every run of
    // characters outside 0-9/a-z collapsed to a single dash
    const slug = link.title.toLowerCase().replaceAll(/[^\da-z]+/g, '-');
    const formId = 'nav-post-' + slug;

    const $form = $('<form>');
    $form.attr({id: formId, method: 'post', action: link.url});
    $form.css('display', 'none');
    $form.appendTo(document.body);

    const appendHiddenInput = (name, value) => {
        $('<input>')
            .attr({type: 'hidden', name: name, value: value})
            .appendTo($form);
    };

    // Django expects the hidden field name "csrfmiddlewaretoken"
    appendHiddenInput('csrfmiddlewaretoken', csrfToken);

    if (link.fields) {
        Object.entries(link.fields).forEach(([name, value]) => {
            appendHiddenInput(name, value);
        });
    }

    // The button sits in the menu but submits the hidden form via `form`
    const $button = $('<button>');
    $button.addClass('dropdown-item');
    $button.attr({type: 'submit', form: formId});
    $button.text(link.title);
    $button.appendTo($menu);
}

// Fetch the account status and switch the navigation between its anonymous
// and authenticated variants, filling in the account dropdown when the
// response contains a username.
$.ajax({
    url: '/account/ajax-status/',
    method: 'GET',
    dataType: 'json',
    cache: true,
}).done(function (data) {
    const $anonymousOnly = $('.anonymous-only');
    const $authenticatedOnly = $('.authenticated-only');

    if (!data.username) {
        $anonymousOnly.removeClass('d-none').addClass('d-lg-flex');
        $authenticatedOnly.addClass('d-none');
        return;
    }

    $anonymousOnly.addClass('d-none').removeClass('d-lg-flex');
    $authenticatedOnly.removeClass('d-none');

    // data.username is known to be truthy from here on
    const $toggle = $('#topnav-account-dropdown-toggle');
    $toggle.empty().text(data.username + ' ');
    $('<span>').addClass('fa fa-chevron-down text-primary').appendTo($toggle);

    const $accountDropdownMenu = $('#topnav-account-dropdown-menu');
    if (!data.links || $accountDropdownMenu.length === 0) {
        return;
    }

    $accountDropdownMenu.empty();
    for (const link of data.links) {
        appendAccountItem(link, $accountDropdownMenu);
    }
});

// Fetch pending messages and show each one through displayMessage.
$.ajax({
    url: '/account/ajax-messages/',
    method: 'GET',
    dataType: 'json',
}).done(function (data) {
    if (!data.messages) {
        return;
    }
    for (const {level, message} of data.messages) {
        displayMessage(level, message);
    }
});

// eslint-disable-next-line no-unused-vars
export function debounce(function_, timeout = 300) {
    // Based on https://www.freecodecamp.org/news/javascript-debounce-example/
    //
    // Returns a wrapper that delays calling function_ until `timeout`
    // milliseconds have passed without another call to the wrapper; every new
    // call cancels the one still pending. The wrapper itself returns nothing.
    let pendingTimer;
    return (...callArguments) => {
        clearTimeout(pendingTimer);
        pendingTimer = setTimeout(
            () => function_.apply(this, callArguments),
            timeout,
        );
    };
}

/* Social share stuff */

// Build a zero-argument callback that hides the tooltip of the given
// jQuery-wrapped button when invoked.
var hideTooltip = function (tooltipButton) {
    const hideNow = () => {
        tooltipButton.tooltip('hide');
    };
    return hideNow;
};

// Event handler: `this` is the element whose tooltip was shown, so this must
// stay a regular function rather than an arrow function.
var hideTooltipCallback = function () {
    // wait a couple seconds and then hide the tooltip.
    const $shownOn = $(this);
    const hideLater = hideTooltip($shownOn);
    setTimeout(hideLater, 3000);
};

function trackShareInteraction($element, interactionType) {
    // Adobe analytics user interaction tracking
    // Reports a 'Share Tool' / 'click' event labelled with interactionType;
    // does nothing when window has no loc_ux_tracking property.
    if (!('loc_ux_tracking' in window)) {
        return;
    }
    const tracker = window['loc_ux_tracking'];
    tracker.trackUserInteractionEvent(
        $element,
        'Share Tool',
        'click',
        interactionType,
    );
}

var $copyUrlButton = $('.copy-url-button');
var $facebookShareButton = $('.facebook-share-button');
var $twitterShareButton = $('.twitter-share-button');

// Copy the share link's href to the clipboard when the copy button is
// clicked, reporting the outcome in a tooltip on the button.
const copyUrlButton = document.querySelector('.copy-url-button');
if (copyUrlButton) {
    copyUrlButton.addEventListener('click', function (event) {
        event.preventDefault();

        // The asynchronous Clipboard API is not supported by Microsoft Edge or Internet Explorer:
        // https://developer.mozilla.org/en-US/docs/Web/API/Clipboard/writeText#Browser_compatibility
        // We'll use the older document.execCommand("copy") interface which requires a text input:
        var $clipboardInput = $('<input type="text">')
            .val($copyUrlButton.attr('href'))
            .insertAfter($copyUrlButton);
        $clipboardInput.get(0).select();

        var tooltipMessage = '';

        trackShareInteraction($copyUrlButton, 'Link copy');

        try {
            document.execCommand('copy');
            // Show the tooltip with a success message
            tooltipMessage = 'This link has been copied to your clipboard';
            $copyUrlButton
                .tooltip('dispose')
                .tooltip({title: tooltipMessage})
                .tooltip('show')
                // .one() instead of .on(): the handler is attached on every
                // click, so .on() would pile up one more auto-hide handler
                // (and timer) per click.
                .one('shown.bs.tooltip', hideTooltipCallback);
        } catch (error) {
            // `typeof` is needed here: comparing the Sentry binding itself to
            // the string 'undefined' is always true.
            if (typeof Sentry !== 'undefined') {
                Sentry.captureException(error);
            }

            // Display an error message in the tooltip
            tooltipMessage =
                '<p>Could not access your clipboard.</p><button class="btn btn-light btn-sm" id="dismiss-tooltip-button">Close</button>';
            $copyUrlButton
                .tooltip('dispose')
                .tooltip({title: tooltipMessage, html: true})
                .tooltip('show');
            // Guard the lookup so a missing button does not raise a second
            // error from inside the error handler.
            const dismissButton = document.querySelector(
                '#dismiss-tooltip-button',
            );
            if (dismissButton) {
                dismissButton.addEventListener('click', function () {
                    $copyUrlButton.tooltip('hide');
                });
            }
        } finally {
            // The temporary input only exists to give execCommand a selection
            $clipboardInput.remove();
        }

        return false;
    });
}

// Report clicks on the Facebook share button. The listener has to be bound to
// '.facebook-share-button'; binding it to the copy-url button would report a
// Facebook share for every link copy and never for an actual Facebook click.
const fbShareButton = document.querySelector('.facebook-share-button');
if (fbShareButton) {
    fbShareButton.addEventListener('click', function () {
        trackShareInteraction($facebookShareButton, 'Facebook Share');
        return true;
    });
}

// Report clicks on the Twitter share button.
const xShareButton = document.querySelector('.twitter-share-button');
if (xShareButton) {
    const reportTwitterShare = function () {
        trackShareInteraction($twitterShareButton, 'Twitter Share');
        return true;
    };
    xShareButton.addEventListener('click', reportTwitterShare);
}

// eslint-disable-next-line no-unused-vars
export function trackUIInteraction(element, category, action, label) {
    /*
        Forward a user interaction to window.loc_ux_tracking, passing the four
        arguments through unchanged. Does nothing when window has no
        loc_ux_tracking property.
    */
    if (!('loc_ux_tracking' in window)) {
        return;
    }
    const tracker = window['loc_ux_tracking'];
    tracker.trackUserInteractionEvent(element, category, action, label);
}


================================================
FILE: concordia/static/js/src/campaign-selection.js
================================================
import $ from 'jquery';

$(function () {
    const urlParameters = new URLSearchParams(window.location.search);
    const selectedCampaign = urlParameters.get('campaign_slug');

    // Embolden the campaign cell whose id matches the campaign_slug query
    // parameter and reset every other row to normal weight.
    $('#tblTranscription tbody tr').each(function () {
        var $campaign = $(this).find('.campaign');
        var rowID = $campaign.attr('id');

        // font-weight is a CSS property, so it has to be set through .css();
        // .attr() would only add a meaningless "font-weight" HTML attribute.
        $campaign.css(
            'font-weight',
            rowID == selectedCampaign ? 'bold' : 'normal',
        );
    });

    // Each checkbox toggles the elements whose class name equals its id
    $('input[type="checkbox"]').on('change', function () {
        if (this.checked) {
            $('.' + this.id).fadeIn('slow');
        } else {
            $('.' + this.id).fadeOut('slow');
        }
    });
});


================================================
FILE: concordia/static/js/src/contribute.js
================================================
import 'bootstrap/dist/css/bootstrap.min.css';
import {Modal} from 'bootstrap';
import {selectLanguage} from './ocr.js';
import {reserveAssetForEditing} from './asset-reservation.js';
import $ from 'jquery';
import {buildErrorMessage, displayMessage} from './base.js';

function lockControls($container) {
    // Locks all of the controls in the provided jQuery element; a falsy
    // $container is ignored.
    if (!$container) {
        return;
    }

    // [selector, attribute] pairs, applied in order; each attribute is set to
    // its own name. The #open-guide button is left out of the button selector.
    const lockedAttributes = [
        ['input, textarea', 'readonly'],
        ['input:checkbox', 'disabled'],
        ['button:not(#open-guide)', 'disabled'],
    ];
    for (const [selector, attribute] of lockedAttributes) {
        $container.find(selector).attr(attribute, attribute);
    }
}

function unlockControls($container) {
    // Unlocks all of the controls except buttons in the provided jQuery
    // element; a falsy $container is ignored.
    if (!$container) {
        return;
    }

    $container.find('input, textarea').removeAttr('readonly');
    $container.find('input:checkbox').removeAttr('disabled');

    // Though we lock all buttons in lockControls, we don't automatically
    // unlock most of them. Which buttons should be locked or unlocked
    // is more complicated logic handled by the update-ui-state
    // listener on the transcription form and the form
    // results handlers.
    // The only buttons unlocked here are ones that should always be unlocked.
    const alwaysUnlockedButtons = [
        'button#open-guide',
        'button#ocr-transcription-button',
        'button#close-guide',
        'button#new-tag-button',
    ];
    for (const buttonSelector of alwaysUnlockedButtons) {
        $container.find(buttonSelector).removeAttr('disabled');
    }
}

$(document).on('keydown', function (event) {
    /*
        Global keyboard event handlers

        * F1 and ? open help
        * Control-I focuses on the image viewer
        * Control-T focuses on the transcription text field

        n.b. jQuery interferes with setting the focus so our handlers use the
        DOM directly

        Each handled shortcut returns false; any other key falls through
        without a return value.
    */
    const keyCode = event.which;
    const isHelpKey = keyCode == 112 || keyCode == 191;

    // The target's tag name is only inspected for the help keys
    if (
        isHelpKey &&
        !event.target.tagName.match(/(INPUT|TEXTAREA)/i) // eslint-disable-line  unicorn/prefer-regexp-test, unicorn/better-regex
    ) {
        // Either the F1 or ? keys were pressed outside of a text field so we'll show help:
        const helpModalElement = document.getElementById('keyboard-help-modal');
        Modal.getOrCreateInstance(helpModalElement).show();
        return false;
    }

    // The remaining shortcuts all require the Control key
    if (!event.ctrlKey) {
        return;
    }

    if (keyCode == 73) {
        // Control-I == switch to the image viewer
        document.querySelector('#asset-image .openseadragon-canvas').focus();
        return false;
    }

    if (keyCode == 84) {
        // Control-T == switch to the transcription field
        document.getElementById('transcription-input').focus();
        return false;
    }
});

function resetTurnstile() {
    // Reset the '.cf-turnstile' widget through window.turnstile; does nothing
    // when window.turnstile is not set.
    if (!window.turnstile) {
        return;
    }
    window.turnstile.reset('.cf-turnstile');
}

function setupPage() {
    $('form.ajax-submission').each(function (index, formElement) {
        /*
        Generic AJAX submission logic which takes a form and POSTs its data to the
        configured action URL, locking the controls until it gets a response either
        way.

        If the AJAX request is successful, the form-submit-success custom event will
        be triggered. On failures, form-submit-failure will be triggered after
        unlocking the controls.

        Because there's no standard way to get the value of the submit button
        clicked, and forms may be submitted without using a button at all, the
        <form> element may have optional data-submit-name and data-submit-value
        attributes for the default values and a click handler will be used to
        update those values based on user interaction.

        The optional data-lock-element attribute can be set to lock additional
        elements in the same way the form is locked once its submitted.
        */

        var $form = $(formElement);

        $form.on('submit', function (event) {
            event.preventDefault();

            var eventData = $form.data();

            lockControls($form);
            if (eventData.lockElement) {
                lockControls($(eventData.lockElement));
            }

            var formData = $form.serializeArray();

            $.ajax({
                url: $form.attr('action'),
                method: 'POST',
                dataType: 'json',
                data: $.param(formData),
            })
                .done(function (data, textStatus) {
                    $form.trigger('form-submit-success', {
                        textStatus: textStatus,
                        requestData: formData,
                        responseData: data,
                        $form: $form,
                    });
                    unlockControls($form);
                    if (eventData.lockElement) {
                        unlockControls($(eventData.lockElement));
                    }
                })
                .fail(function (jqXHR, textStatus, errorThrown) {
                    $form.trigger('form-submit-failure', {
                        textStatus: textStatus,
                        errorThrown: errorThrown,
                        requestData: formData,
                        $form: $form,
                        jqXHR: jqXHR,
                    });
                    unlockControls($form);
                    if (eventData.lockElement) {
                        unlockControls($(eventData.lockElement));
                    }
                });

            return false;
        });
    });

    var $transcriptionEditor = $('#transcription-editor');
    var $saveButton = $transcriptionEditor
        .find('#save-transcription-button')
        .first();
    var $submitButton = $transcriptionEditor
        .find('#submit-transcription-button')
        .first();
    var $nothingToTranscribeCheckbox = $transcriptionEditor
        .find('#nothing-to-transcribe')
        .on('change', function () {
            var $textarea = $transcriptionEditor.find('textarea');
            if (this.checked) {
                const nothingToTranscribeElement = document.getElementById(
                    'nothing-to-transcribe-modal',
                );
                if (nothingToTranscribeElement) {
                    const nothingToTranscribeModal =
                        Modal.getInstance(nothingToTranscribeElement) ||
                        new Modal(nothingToTranscribeElement);
                    var nothingToTranscribeTitle =
                        nothingToTranscribeElement.querySelector(
                            '.modal-title',
                        );
                    var nothingToTranscribeBody =
                        nothingToTranscribeElement.querySelector('.modal-body');
                    if ($textarea.val()) {
                        nothingToTranscribeTitle.textContent =
                            'Text will be deleted';
                        nothingToTranscribeBody.innerHTML =
                            '<p>Text in the transcription box is removed when “Nothing to transcribe” is checked. Do you want to discard that text?</p>';
                    } else {
                        nothingToTranscribeTitle.textContent =
                            'Nothing to transcribe';
                        nothingToTranscribeBody.innerHTML =
                            '<p>Are you sure?</p>';
                    }
                    nothingToTranscribeModal.show();

                    const okButton = document.getElementById('confirmDiscard');
                    okButton.addEventListener('click', function () {
                        $textarea.val('');
                        nothingToTranscribeModal.hide();
                    });
                    const cancelButton =
                        document.getElementById('cancelDiscard');
                    cancelButton.addEventListener('click', function () {
                        $('#nothing-to-transcribe').prop('checked', false);
                        nothingToTranscribeModal.hide();
                    });
                }
            }
            $transcriptionEditor.trigger('update-ui-state');
        });
    var $ocrSection = $('#ocr-section');
    var $ocrForm = $('#ocr-transcription-form');
    var $ocrModal = $('#ocr-transcription-modal');
    var languageModalElement = document.getElementById(
        'language-selection-modal',
    );
    var languageModal;
    if (languageModalElement) {
        languageModal = Modal.getOrCreateInstance(languageModalElement);
    }
    var $ocrLoading = $('#ocr-loading');
    var rollbackButton = document.getElementById(
        'rollback-transcription-button',
    );
    var rollforwardButton = document.getElementById(
        'rollforward-transcription-button',
    );
    // We need to do this because BS5 does not automatically initialize modals when you
    // try to show them; without new boostrap.Modal, it doesn't recognize it as a modal
    // at all (it's treated as ordinary HTML), so BS controls do not work
    // We try to get Modal.getInstance in case the modal is already initialized
    var errorModalElement = document.getElementById('error-modal');
    if (errorModalElement) {
        var errorModal =
            Modal.getInstance(errorModalElement) ||
            new Modal(errorModalElement);
    }
    var submissionModalElement = document.getElementById(
        'successful-submission-modal',
    );
    if (submissionModalElement) {
        var submissionModal =
            Modal.getInstance(submissionModalElement) ||
            new Modal(submissionModalElement);
    }
    var reviewModalElement = document.getElementById('review-accepted-modal');
    if (reviewModalElement) {
        var reviewModal =
            Modal.getInstance(reviewModalElement) ||
            new Modal(reviewModalElement);
    }

    let firstEditorUpdate = true;
    let editorPlaceholderText = $transcriptionEditor
        .find('textarea')
        .attr('placeholder');
    let editorNothingToTranscribePlaceholderText = 'Nothing to transcribe';

    $transcriptionEditor
        .on('update-ui-state', function () {
            /*
             * All controls are locked when the user does not have the write lock
             *
             * The Save button is enabled when the user has changed the text from
             * what it was when the page was loaded or last saved
             *
             * The Submit button is enabled when the user has either made no changes
             * or has saved the transcription and not changed the text
             */

            var data = $transcriptionEditor.data();

            if (
                !data.hasReservation ||
                (data.transcriptionStatus != 'in_progress' &&
                    data.transcriptionStatus != 'not_started' &&
                    data.transcriptionStatus != 'submitted')
            ) {
                // If the status is completed OR if the user doesn't have the reservation
                lockControls($transcriptionEditor);
                lockControls($ocrSection);
                lockControls($ocrForm);
            } else {
                // Either in transcribe or review mode OR the user has the reservation
                if (data.hasReservation) {
                    unlockControls($ocrSection);
                    unlockControls($ocrForm);
                }
                var $textarea = $transcriptionEditor.find('textarea');

                if (
                    $nothingToTranscribeCheckbox.prop('checked') ||
                    data.transcriptionStatus == 'submitted'
                ) {
                    $textarea.attr('readonly', 'readonly');
                    if ($nothingToTranscribeCheckbox.prop('checked')) {
                        $textarea.attr(
                            'placeholder',
                            editorNothingToTranscribePlaceholderText,
                        );
                    }
                } else {
                    $textarea.removeAttr('readonly');
                    $textarea.attr('placeholder', editorPlaceholderText);
                }

                if (data.transcriptionId && !data.unsavedChanges) {
                    // We have a transcription ID and it's not stale,
                    // so we can submit the transcription for review and disable the save button:
                    $saveButton.attr('disabled', 'disabled');
                    $submitButton.removeAttr('disabled');
                    // We only want to do this the first time the editor ui is updated (i.e., on first load)
                    // because otherwise it's impossible to uncheck the 'Nothing to transcribe' checkbox
                    // since this code would just immediately mark it checked again.
                    if (!$textarea.val() && firstEditorUpdate) {
                        $nothingToTranscribeCheckbox.prop('checked', true);
                        $textarea.attr('readonly', 'readonly');
                        $textarea.attr(
                            'placeholder',
                            editorNothingToTranscribePlaceholderText,
                        );
                    }
                } else {
                    // Unsaved changes are in the textarea and we're in transcribe mode
                    $submitButton.attr('disabled', 'disabled');

                    if (
                        $textarea.val() ||
                        $nothingToTranscribeCheckbox.prop('checked')
                    ) {
                        $saveButton.removeAttr('disabled');
                    } else {
                        $saveButton.attr('disabled', 'disabled');
                    }
                }
            }

            if (
                !data.hasReservation &&
                (data.transcriptionStatus == 'in_progress' ||
                    data.transcriptionStatus == 'not_started')
            ) {
                // If we're in transcribe mode and we don't have the reservation
                $('.transcription-status-display')
                    .children()
                    .attr('hidden', 'hidden')
                    .filter('#display-conflict')
                    .removeAttr('hidden');
            }
            firstEditorUpdate = false;
        })
        .on('form-submit-success', function (event, extra) {
            let responseData = extra.responseData;
            displayMessage(
                'info',
                "Successfully saved your work. Submit it for review when you're done",
                'transcription-save-result',
            );
            $transcriptionEditor.data({
                transcriptionId: responseData.id,
                unsavedChanges: false,
            });
            $transcriptionEditor
                .find('input[name="supersedes"]')
                .val(responseData.id);
            $transcriptionEditor
                .find('textarea[name="text"]')
                .val(responseData.text);
            $transcriptionEditor.data('submitUrl', responseData.submissionUrl);
            $ocrForm.find('input[name="supersedes"]').val(responseData.id);
            $('#transcription-status-display')
                .children()
                .attr('hidden', 'hidden')
                .filter('#display-inprogress')
                .removeAttr('hidden');
            if (responseData.undo_available) {
                $('#rollback-transcription-button').removeAttr('disabled');
            }
            if (responseData.redo_available) {
                $('#rollforward-transcription-button').removeAttr('disabled');
            }
            resetTurnstile();
            let messageChildren = $('#transcription-status-message').children();
            messageChildren
                .attr('hidden', 'hidden')
                .filter('#message-inprogress')
                .removeAttr('hidden');
            $('#transcription-status-display').removeAttr('hidden');
            $('#message-contributors')
                .removeAttr('hidden')
                .find('#message-contributors-num')
                .html(responseData.asset.contributors);
            $transcriptionEditor.trigger('update-ui-state');
        })
        .on('form-submit-failure', function (event, info) {
            displayMessage(
                'error',
                'Unable to save your work: ' +
                    buildErrorMessage(
                        info.jqXHR,
                        info.textStatus,
                        info.errorThrown,
                    ),
                'transcription-save-result',
            );
            resetTurnstile();
            $transcriptionEditor.trigger('update-ui-state');
        });

    // Submit the current transcription for review. On success the status
    // panel is switched to its "submitted" state and a confirmation modal is
    // shown; the page is reloaded once that modal has been hidden.
    $submitButton.on('click', function (event) {
        event.preventDefault();

        $.ajax({
            url: $transcriptionEditor.data('submitUrl'),
            method: 'POST',
            dataType: 'json',
        })
            .done(function (data) {
                // Status badge: hide every state, then reveal "submitted".
                $('#transcription-status-display')
                    .children()
                    .attr('hidden', 'hidden');
                $('#display-submitted').removeAttr('hidden');

                // Status message: the #message-* elements are looked up under
                // #transcription-status-message, as the save, review and OCR
                // handlers do. Previously the children of
                // #transcription-status-display were filtered here, so the
                // #message-* filters never matched anything.
                let messageChildren = $(
                    '#transcription-status-message',
                ).children();
                messageChildren
                    .attr('hidden', 'hidden')
                    .filter('#message-submitted')
                    .removeAttr('hidden');
                messageChildren
                    .filter('#message-contributors')
                    .removeAttr('hidden')
                    .find('#message-contributors-num')
                    .html(data.asset.contributors);

                submissionModal.show();
                submissionModalElement.addEventListener(
                    'hidden.bs.modal',
                    function () {
                        window.location.reload(true);
                    },
                );
            })
            .fail(function (jqXHR, textStatus, errorThrown) {
                displayMessage(
                    'error',
                    'Unable to save your work: ' +
                        buildErrorMessage(jqXHR, textStatus, errorThrown),
                    'transcription-submit-result',
                );
            });
    });

    $transcriptionEditor
        .find('textarea')
        .each(function (index, textarea) {
            textarea.value = $.trim(textarea.value);
        })
        .on('change input', function () {
            $transcriptionEditor.data('unsavedChanges', true);
            $transcriptionEditor.trigger('update-ui-state');
        });

    /**
     * Send a review decision for the current transcription and update the page.
     *
     * POSTs `action: status` to the editor's `reviewUrl`.
     * - On 'reject', the current page is re-fetched and the editor, OCR, help
     *   and OCR-modal sections are replaced with the fresh markup, after which
     *   the asset is reserved again and `setupPage()` re-binds the handlers.
     * - Otherwise the status panel is switched to "completed" and the review
     *   modal is shown; the page reloads once that modal has been hidden.
     * On failure an error message is displayed and, if the JSON response
     * carries `popupError`, the error modal is shown as well.
     *
     * @param {string} status - Review action; callers in this file pass
     *   'accept' or 'reject'.
     */
    function submitReview(status) {
        var reviewUrl = $transcriptionEditor.data('reviewUrl');
        $.ajax({
            url: reviewUrl,
            method: 'POST',
            dataType: 'json',
            data: {
                action: status,
            },
        })
            .done(function (data) {
                if (status === 'reject') {
                    $.ajax({
                        url: window.location,
                        method: 'GET',
                        dataType: 'html',
                    })
                        .done(function (pageHtml) {
                            // Parse the fetched document once and reuse it for
                            // every section instead of re-parsing per lookup.
                            var $freshPage = $(pageHtml);
                            $('#editor-column').html(
                                $freshPage.find('#editor-column').html(),
                            );
                            $('#ocr-section').html(
                                $freshPage.find('#ocr-section').html(),
                            );
                            $('#help-container').html(
                                $freshPage.find('#help-container').html(),
                            );
                            $ocrModal.html(
                                $freshPage
                                    .find('#ocr-transcription-modal')
                                    .html(),
                            );
                            // The button was replaced along with its section,
                            // so its click handler has to be attached again.
                            $('#select-language-button').on(
                                'click',
                                selectLanguage,
                            );
                            reserveAssetForEditing();
                            setupPage();
                        })
                        .fail(function (jqXHR, textStatus, errorThrown) {
                            displayMessage(
                                'error',
                                'Unable to save your review: ' +
                                    buildErrorMessage(
                                        jqXHR,
                                        textStatus,
                                        errorThrown,
                                    ),
                                'transcription-review-result',
                            );
                        });
                } else {
                    // Status badge: hide every state, then reveal "completed".
                    $('#transcription-status-display')
                        .children()
                        .attr('hidden', 'hidden');
                    $('#display-completed').removeAttr('hidden');
                    let messageChildren = $(
                        '#transcription-status-message',
                    ).children();
                    messageChildren
                        .attr('hidden', 'hidden')
                        .filter('#message-completed')
                        .removeAttr('hidden');
                    $('#transcription-status-display').removeAttr('hidden');
                    messageChildren
                        .filter('#message-contributors')
                        .removeAttr('hidden')
                        .find('#message-contributors-num')
                        .html(data.asset.contributors);
                    reviewModal.show();
                    reviewModalElement.addEventListener(
                        'hidden.bs.modal',
                        function () {
                            window.location.reload(true);
                        },
                    );
                }
            })
            .fail(function (jqXHR, textStatus, errorThrown) {
                displayMessage(
                    'error',
                    'Unable to save your review: ' +
                        buildErrorMessage(jqXHR, textStatus, errorThrown),
                    'transcription-review-result',
                );
                if (jqXHR.responseJSON && jqXHR.responseJSON.popupError) {
                    let popupErrorMessage = jqXHR.responseJSON.popupError;
                    let popupTitle =
                        jqXHR.responseJSON.popupTitle ||
                        'An error occurred with your review';
                    // NOTE(review): both values are inserted as HTML; confirm
                    // the server only sends trusted/escaped markup here.
                    $('#error-modal')
                        .find('#error-modal-title')
                        .first()
                        .html(popupTitle);
                    $('#error-modal')
                        .find('#error-modal-message')
                        .first()
                        .html(popupErrorMessage);
                    errorModal.show();
                }
            });
    }

    $('#accept-transcription-button')
        .removeAttr('disabled')
        .on('click', function (event) {
            event.preventDefault();
            submitReview('accept');
        });

    $('#reject-transcription-button')
        .removeAttr('disabled')
        .on('click', function (event) {
            event.preventDefault();
            submitReview('reject');
        });

    /**
     * Roll the transcription back or forward by POSTing to `url`.
     *
     * The editor controls are locked for the duration of the request. On
     * success the editor state (transcription id, supersedes fields, submit
     * URL, text) and the status panel are refreshed from the JSON response;
     * on failure an error message is displayed. In both cases the controls
     * are unlocked and 'update-ui-state' is triggered on the editor.
     *
     * @param {string} url - Endpoint to POST to; the rollback/rollforward
     *   buttons pass their `data-url` value.
     */
    function rollTranscription(url) {
        lockControls($transcriptionEditor);
        $.ajax({
            url: url,
            method: 'POST',
            dataType: 'json',
            data: {
                'cf-turnstile-response': $transcriptionEditor
                    .find('input[name="cf-turnstile-response"]')
                    .val(),
            },
        })
            .done(function (responseData) {
                displayMessage(
                    'info',
                    responseData.message,
                    'transcription-save-result',
                );
                $transcriptionEditor.data({
                    transcriptionId: responseData.id,
                    unsavedChanges: false,
                });
                $transcriptionEditor
                    .find('input[name="supersedes"]')
                    .val(responseData.id);
                $transcriptionEditor.data(
                    'submitUrl',
                    responseData.submissionUrl,
                );
                $ocrForm.find('input[name="supersedes"]').val(responseData.id);
                $transcriptionEditor
                    .find('textarea[name="text"]')
                    .val(responseData.text);

                // Status badge: hide every state, then reveal "in progress".
                $('#transcription-status-display')
                    .children()
                    .attr('hidden', 'hidden')
                    .filter('#display-inprogress')
                    .removeAttr('hidden');
                if (responseData.undo_available) {
                    $('#rollback-transcription-button').removeAttr('disabled');
                }
                if (responseData.redo_available) {
                    $('#rollforward-transcription-button').removeAttr(
                        'disabled',
                    );
                }

                // Status message: the #message-* elements are looked up under
                // #transcription-status-message, as the save, review and OCR
                // handlers do. Previously the badge children were processed a
                // second time here, so neither the in-progress message nor
                // the contributor count was updated.
                let messageChildren = $(
                    '#transcription-status-message',
                ).children();
                messageChildren
                    .attr('hidden', 'hidden')
                    .filter('#message-inprogress')
                    .removeAttr('hidden');
                messageChildren
                    .filter('#message-contributors')
                    .removeAttr('hidden')
                    .find('#message-contributors-num')
                    .html(responseData.asset.contributors);
                unlockControls($transcriptionEditor);
                $transcriptionEditor.trigger('update-ui-state');
            })
            .fail(function (jqXHR, textStatus, errorThrown) {
                displayMessage(
                    'error',
                    'Unable to save your work: ' +
                        buildErrorMessage(jqXHR, textStatus, errorThrown),
                    'transcription-save-result',
                );
                unlockControls($transcriptionEditor);
                $transcriptionEditor.trigger('update-ui-state');
            });
    }

    if (rollbackButton) {
        rollbackButton.addEventListener('click', function () {
            rollTranscription(this.dataset.url);
        });
    }

    if (rollforwardButton) {
        rollforwardButton.addEventListener('click', function () {
            rollTranscription(this.dataset.url);
        });
    }

    var $tagEditor = $('#tag-editor'),
        $tagForm = $('#tag-form'),
        $currentTagList = $tagEditor.find('#current-tags'),
        $newTagInput = $('#new-tag-input');

    const characterError =
        'Tags must be between 1-50 characters and may contain only letters, numbers, dashes, underscores, apostrophes, and spaces';
    const duplicateError =
        'That tag has already been added. Each tag can only be added once.';

    /**
     * Validate the text in the new-tag input and, if acceptable, append it to
     * the current tag list and submit the tag form.
     *
     * Curly apostrophes are normalised to straight ones before validation.
     * If the input fails its validity check, or the tag already exists
     * (compared case-insensitively), the matching error text is written to
     * the form's `.invalid-feedback` element and nothing is added.
     */
    function addNewTag() {
        $newTagInput.get(0).setCustomValidity(''); // Resets custom validation
        const $form = $newTagInput.closest('form');
        $form.removeClass('was-validated');
        // A string pattern passed to replace() only replaces the first match,
        // so a global regex is used to normalise every curly apostrophe.
        $newTagInput.val($newTagInput.val().replace(/[‘’]/g, "'"));
        if (!$newTagInput.get(0).checkValidity()) {
            $form.find('.invalid-feedback').html(characterError);
            $form.addClass('was-validated');
            return;
        }

        var value = $.trim($newTagInput.val());
        if (value) {
            // Prevent adding tags which are already present:
            var lowered = value.toLocaleLowerCase();
            var dupeCount = $currentTagList
                .find('input[name="tags"]')
                .filter(function (index, input) {
                    return input.value.toLocaleLowerCase() == lowered;
                }).length;

            if (dupeCount == 0) {
                // The markup is built without the user's text; the value is
                // applied through attr() below so it can never be parsed as
                // HTML, regardless of what the input's validation allows.
                // NOTE(review): each tag carries two hidden "tags" inputs
                // (one inside the label, one beside it), as before - confirm
                // that the duplicate is intentional.
                var $newTag = $(
                    '\
                            <li class="btn btn-outline-dark btn-sm"> \
                                <label class="m-0"> \
                                    <input type="hidden" name="tags" value="" /> \
                                </label> \
                                <input type="hidden" name="tags" value="" /> \
                                <a class="close" data-bs-dismiss="alert" aria-label="Remove previous tag"> \
                                    <span aria-hidden="true" class="fas fa-times"></span> \
                                </a> \
                            </li> \
                ',
                );
                $newTag.find('input[name="tags"]').attr('value', value);
                $newTag.find('label').append(document.createTextNode(value));
                $currentTagList.append($newTag);
                $newTagInput.val('');
                $tagForm.submit();
            } else {
                $newTagInput.get(0).setCustomValidity(duplicateError);
                $form.find('.invalid-feedback').html(duplicateError);
                $newTagInput.closest('form').addClass('was-validated');
                return;
            }
        }
    }

    $tagEditor.find('#new-tag-button').on('click', addNewTag);
    $newTagInput.on('change', addNewTag);
    $newTagInput.on('keydown', function (event) {
        // See https://github.com/LibraryOfCongress/concordia/issues/159 for the source of these values:
        if (event.which == '13' || event.which == '188') {
            // Either the enter or comma keys will add the tag and reset the input field:
            event.preventDefault();
            addNewTag();
        }
    });

    $currentTagList.on('click', '.close', function () {
        $(this).parents('li').remove();
        $tagForm.submit();
    });

    $tagEditor
        .on('form-submit-success', function (event, info) {
            $('#tag-count').html(info.responseData['all_tags'].length);
            unlockControls($tagEditor);
            displayMessage(
                'info',
                'Your tags have been saved',
                'tags-save-result',
            );
        })
        .on('form-submit-failure', function (event, info) {
            unlockControls($tagEditor);

            var message = 'Unable to save your tags: ';
            message += buildErrorMessage(
                info.jqXHR,
                info.textStatus,
                info.errorThrown,
            );

            displayMessage('error', message, 'tags-save-result');
        });

    if ($ocrForm) {
        $ocrForm
            .on('submit', function () {
                languageModal.hide();
                $ocrLoading.removeAttr('hidden');
            })
            .on('form-submit-success', function (event, extra) {
                let responseData = extra.responseData;
                $transcriptionEditor.data({
                    transcriptionId: responseData.id,
                    unsavedChanges: false,
                });
                $transcriptionEditor
                    .find('input[name="supersedes"]')
                    .val(responseData.id);
                $transcriptionEditor.data(
                    'submitUrl',
                    responseData.submissionUrl,
                );
                $transcriptionEditor
                    .find('textarea[name="text"]')
                    .val(responseData.text);
                $ocrLoading.attr('hidden', 'hidden');
                $('#transcription-status-display')
                    .children()
                    .attr('hidden', 'hidden');
                $('#display-inprogress').removeAttr('hidden');
                let messageChildren = $(
                    '#transcription-status-message',
                ).children();
                if (responseData.undo_available) {
                    $('#rollback-transcription-button').removeAttr('disabled');
                }
                if (responseData.redo_available) {
                    $('#rollforward-transcription-button').removeAttr(
                        'disabled',
                    );
                }
                messageChildren
                    .attr('hidden', 'hidden')
                    .filter('#message-inprogress')
                    .removeAttr('hidden');
                messageChildren
                    .filter('#message-contributors')
                    .removeAttr('hidden')
                    .find('#message-contributors-num')
                    .html(responseData.asset.contributors);
                $('#transcription-status-display').removeAttr('hidden');
                $transcriptionEditor.trigger('update-ui-state');
                $ocrForm.find('input[name="supersedes"]').val(responseData.id);
            })
            .on('form-submit-failure', function (event, info) {
                let errorMessage;
                if (info.jqXHR.status == 429) {
                    errorMessage =
                        'OCR is only available once per minute. Please try again later and review all OCR text closely before submitting.';
                } else {
                    errorMessage = buildErrorMessage(
                        info.jqXHR,
                        info.textStatus,
                        info.errorThrown,
                    );
                }
                displayMessage(
                    'error',
                    'Unable to save your work: ' + errorMessage,
                    'transcription-save-result',
                );
                $ocrLoading.attr('hidden', 'hidden');
                $transcriptionEditor.trigger('update-ui-state');
            });
    }
}

// Module-level "unsaved changes" guard: remember whether the transcription
// form has been edited since it was last submitted, and warn before the page
// is unloaded if so.
let transcriptionForm = document.getElementById('transcription-editor');
let ocrForm = document.getElementById('ocr-transcription-form');

// True after a 'change' event on the transcription form; reset to false when
// either the transcription form or the OCR form is submitted.
let formChanged = false;
if (transcriptionForm) {
    transcriptionForm.addEventListener('change', function () {
        formChanged = true;
    });
    transcriptionForm.addEventListener('submit', function () {
        formChanged = false;
    });
}
if (ocrForm) {
    ocrForm.addEventListener('submit', function () {
        formChanged = false;
    });
}
window.addEventListener('beforeunload', function (event) {
    if (formChanged) {
        // Some browsers ignore this value and always display a built-in message instead
        return (event.returnValue =
            "The transcription you've started has not been saved.");
    }
});
// A click on the reservation-failure modal replaces the transcription input's
// placeholder with an explanation of why the page cannot be edited.
$('#asset-reservation-failure-modal').click(function () {
    document.getElementById('transcription-input').placeholder =
        "Someone else is already transcribing this page.\n\nYou can help by transcribing a new page, adding tags to this page, or coming back later to review this page's transcription.";
});

// Bind all editor handlers for the initial page load.
setupPage();


================================================
FILE: concordia/static/js/src/filter-assets.js
================================================
/**
 * Uncheck the opposite radio button and navigate to `url`.
 *
 * @param {boolean} doFilter - When true the 'show-all' radio is unchecked,
 *   otherwise the 'filter-assets' radio is.
 * @param {string} url - Location to navigate to.
 */
function filterAssets(doFilter, url) {
    const button = document.getElementById(
        doFilter ? 'show-all' : 'filter-assets',
    );

    // A missing radio button must not prevent the navigation itself.
    if (button) {
        button.checked = false;
    }
    window.location = url;
}

// Once the DOM is ready, listen for change events at the document level and
// hand any event from a control named 'radioButtons' to filterAssets, using
// the control's data-filter / data-url attributes as arguments.
document.addEventListener('DOMContentLoaded', () => {
    document.addEventListener('change', ({target}) => {
        if (target.name !== 'radioButtons') {
            return;
        }
        const wantsFilter = target.dataset.filter === 'true';
        filterAssets(wantsFilter, target.dataset.url);
    });
});

// Also expose the function on window.
window.filterAssets = filterAssets;


================================================
FILE: concordia/static/js/src/guide.js
================================================
/* global */

import $ from 'jquery';
import {Carousel} from 'bootstrap';
import {trackUIInteraction} from './base.js';

/**
 * Keydown handler that closes the guide when Escape is pressed.
 *
 * Kept as a single named function so that registering it repeatedly is a
 * no-op and so that closeOffcanvas can remove it again.
 */
function closeGuideOnEscape(event) {
    if (event.key == 'Escape') {
        closeOffcanvas();
    }
}

/**
 * Toggle the guide sidebar: slide it in when it is off screen, otherwise
 * close it. Does nothing when the sidebar element is absent.
 */
function openOffcanvas() {
    let guide = document.getElementById('guide-sidebar');
    if (!guide) {
        return;
    }
    if (guide.classList.contains('offscreen')) {
        guide.classList.remove('offscreen');
        guide.style.borderWidth = '0 0 thick thick';
        guide.style.borderStyle = 'solid';
        guide.style.borderColor = '#0076ad';
        // Previously a fresh anonymous listener was added on every open and
        // never removed, so listeners accumulated on the document.
        document.addEventListener('keydown', closeGuideOnEscape);

        let openGuide = document.getElementById('open-guide');
        if (openGuide) {
            openGuide.style.background = '#002347';
        }
    } else {
        closeOffcanvas();
    }
}

/**
 * Move the guide sidebar off screen, drop its border, restore the open
 * button's background and stop listening for Escape.
 */
function closeOffcanvas() {
    document.removeEventListener('keydown', closeGuideOnEscape);

    let guide = document.getElementById('guide-sidebar');
    if (guide) {
        guide.classList.add('offscreen');
        guide.style.border = 'none';
    }

    let openGuide = document.getElementById('open-guide');
    if (openGuide) {
        openGuide.style.background = '#0076AD';
    }
}

// Wire the open/close buttons to the sidebar toggles; either button may be
// absent from the page.
const openGuideButton = document.getElementById('open-guide');
openGuideButton?.addEventListener('click', openOffcanvas);

const closeGuideButton = document.getElementById('close-guide');
closeGuideButton?.addEventListener('click', closeOffcanvas);

// When the DOM is ready, initialise the guide carousel (no auto-advance, no
// wrap-around) and hide the bars column whenever the carousel is sliding to
// its first item.
document.addEventListener('DOMContentLoaded', () => {
    const guideCarouselElement = document.getElementById('guide-carousel');
    if (!guideCarouselElement) {
        return;
    }

    new Carousel(guideCarouselElement, {
        interval: false,
        wrap: false,
    });

    guideCarouselElement.addEventListener('slide.bs.carousel', (event) => {
        const barsCol = document.getElementById('guide-bars-col');
        if (barsCol) {
            barsCol.classList.toggle('d-none', event.to === 0);
        }
    });
});

// The "previous" control starts hidden.
$('#previous-card').hide();

// After each slide, hide "previous" on the first card and "next" on the last
// card; show both controls everywhere else. The first-card check wins when
// both would match.
$('#card-carousel').on('slid.bs.carousel', function () {
    const onFirstCard = $('#card-carousel .carousel-item:first').hasClass(
        'active',
    );
    const onLastCard =
        !onFirstCard &&
        $('#card-carousel .carousel-item:last').hasClass('active');

    $('#previous-card').toggle(!onFirstCard);
    $('#next-card').toggle(!onLastCard);
});

/**
 * Report a click in the How To Guide through trackUIInteraction.
 *
 * @param {jQuery} element - The clicked element, wrapped in jQuery.
 * @param {string} label - Label identifying which control was used.
 */
function trackHowToInteraction(element, label) {
    trackUIInteraction(element, 'How To Guide', 'click', label);
}

// Fixed-label controls: [selector, tracking label]. Binding through jQuery
// is a no-op for selectors that match nothing on the current page.
[
    ['#open-guide', 'Open'],
    ['#close-guide', 'Close'],
    ['#previous-guide', 'Back'],
    ['#next-guide', 'Next'],
    ['#guide-bars', 'Hamburger Menu'],
].forEach(function ([selector, label]) {
    $(selector).on('click', function () {
        trackHowToInteraction($(this), label);
    });
});

// Sidebar navigation links are tracked under their own trimmed text.
$('#guide-sidebar .nav-link').on('click', function () {
    const $link = $(this);
    trackHowToInteraction($link, $link.text().trim());
});

export {openOffcanvas, closeOffcanvas};


================================================
FILE: concordia/static/js/src/homepage-carousel.js
================================================
import $ from 'jquery';
import {Carousel} from 'bootstrap';

// Homepage carousel: 5s auto-advance with a play/pause button and
// pause-while-hovering behaviour.
document.addEventListener('DOMContentLoaded', () => {
    const carouselElement = document.getElementById('homepage-carousel');
    if (!carouselElement) {
        // Not on the homepage.
        return;
    }

    // getOrCreateInstance avoids initialising the same element twice.
    const carousel = Carousel.getOrCreateInstance(carouselElement, {
        interval: 5000,
        pause: false,
        ride: 'carousel',
    });

    const playPauseButton = document.getElementById('play-pause-button');
    if (!playPauseButton) {
        return;
    }

    const $playPause = $(playPauseButton);
    const userPaused = () => $playPause.hasClass('paused');

    // The 'paused' class on the button records the user's choice; the icon
    // flips between pause and play on every click.
    playPauseButton.addEventListener('click', () => {
        if (userPaused()) {
            carousel.cycle();
        } else {
            carousel.pause();
        }
        $playPause.children('.fa').toggleClass('fa-pause fa-play');
        $playPause.toggleClass('paused');
    });

    // Hovering always pauses; leaving resumes only if the user has not
    // paused the carousel through the button.
    carouselElement.addEventListener('mouseover', () => carousel.pause());

    carouselElement.addEventListener('mouseleave', () => {
        if (userPaused()) {
            return;
        }
        carousel.cycle();
    });
});


================================================
FILE: concordia/static/js/src/modules/accessible-colors.js
================================================
import chroma from 'chroma-js';

/**
 * Shift a color's HSL lightness until its contrast against `background`
 * reaches `minContrast`, or until the step limit is hit.
 * @param {string} colorString - Input color, passed to chroma() (e.g. '#f66' or 'rgb(255,0,0)')
 * @param {string} [background='#fff'] - Background color to contrast against
 * @param {number} [minContrast=4.5] - Minimum contrast ratio to aim for
 * @returns {string} Hex string of the adjusted color
 */
export function adjustColorForContrast(
    colorString,
    background = '#fff',
    minContrast = 4.5,
) {
    // 20 steps of 0.05 span the whole 0..1 lightness range, so the loop is
    // guaranteed to terminate even when the target contrast is unreachable.
    const maxSteps = 20;

    let adjusted = chroma(colorString);

    // Darken against a light background, brighten against a dark one.
    const backgroundIsLight = chroma(background).luminance() > 0.5;
    const lightnessDelta = backgroundIsLight ? -0.05 : 0.05;

    let stepsTaken = 0;
    while (
        stepsTaken < maxSteps &&
        chroma.contrast(adjusted, background) < minContrast
    ) {
        const lightness = adjusted.get('hsl.l');
        adjusted = adjusted.set('hsl.l', lightness + lightnessDelta);
        stepsTaken += 1;
    }
    return adjusted.hex();
}

/**
 * Build a palette of `count` colors, each adjusted for contrast against
 * `background` via adjustColorForContrast.
 * The base palette comes from a chroma.js scale interpolated in LCh mode.
 * @param {number} count - Number of colors to generate
 * @param {string} [background='#fff'] - Background color to contrast against
 * @param {number} [minContrast=4.5] - Minimum contrast ratio to aim for
 * @param {string} [scaleName='Spectral'] - Scale name passed to chroma.scale()
 * @returns {string[]} Array of adjusted color strings
 */
export function generateAccessibleColors(
    count,
    background = '#fff',
    minContrast = 4.5,
    scaleName = 'Spectral',
) {
    const basePalette = chroma.scale(scaleName).mode('lch').colors(count);

    const accessiblePalette = [];
    for (const baseColor of basePalette) {
        accessiblePalette.push(
            adjustColorForContrast(baseColor, background, minContrast),
        );
    }
    return accessiblePalette;
}


================================================
FILE: concordia/static/js/src/modules/chroma-esm.js
================================================
// This is a shim to allow chroma-js to be used as an ES module
// TODO Consider removing the shim and vite config alias and input
//      concordia-visualizations directly
import 'chroma-js'; // Vite resolves this to node_modules/chroma-js - loads the UMD build onto window.chroma
export default window.chroma; // re-export as the module’s default


================================================
FILE: concordia/static/js/src/modules/concordia-visualization.js
================================================
import Chart from 'chart.js/auto';
import {renderEmptyChart, renderErrorOverlay} from './visualization-errors.js';
import {generateAccessibleColors} from './accessible-colors.js';

// CSS aspect-ratio strings keyed by chart type. Per the constructor docs
// below, these supply the default when no `aspectRatio` is configured.
const defaultAspectRatios = {
    pie: '1 / 1',
    doughnut: '1 / 1',
    radar: '1 / 1',
    bar: '2 / 1',
    line: '2 / 1',
};

export class ConcordiaVisualization {
    /**
     * @param {Object} config
     * @param {string} config.name
     *   The slug used to fetch `/api/visualization/<name>/`.
     * @param {string} config.canvasId
     *   The ID of the <canvas> element where the chart will be drawn.
     * @param {string} [config.chartType="bar"]
     *   The Chart.js chart type (e.g. "bar", "line", "pie", etc.).
     * @param {string} config.title
     *   The title to show on top of the chart (used both for real data and error case).
     * @param {string} [config.xLabel]
     *   The x-axis title (optional; if omitted, no x-axis label is shown).
     * @param {string} [config.yLabel]
     *   The y-axis title (optional; if omitted, no y-axis label is shown).
     * @param {Function} config.buildDataset
     *   A callback `(payload) => { data, [options] }` which receives the raw JSON payload
     *   and must return an object containing:
     *     - `data`: a valid Chart.js `data` object (`{ labels: [...], datasets: [...] }`), and
     *     - (optionally) `options`: partial Chart.js `options` you want to merge on top of the default.
     * @param {Object} [config.chartOptions]
     *   Any additional Chart.js options to merge into the final `options` object
     *   (will be deep-merged after `buildDataset(...).options`).
     * @param {string} [config.pageBackgroundColor="#fff"]
     *   The color of the page's background. Used to create contrasting colors
     * @param {number} [config.minContrast=4.5] - Minimum contrast between colors on the chart
     * @param {string} [config.aspectRatio]
     *   CSS aspect ratio. Default is based on chartType, as defined in defaultAspectRatios
     * @throws {Error} If name, canvasId, title or buildDataset is missing/invalid.
     */
    constructor({
        name,
        canvasId,
        chartType = 'bar',
        title,
        xLabel = '',
        yLabel = '',
        buildDataset,
        chartOptions = {},
        pageBackgroundColor = '#fff',
        minContrast = 4.5,
        aspectRatio,
    }) {
        if (
            !name ||
            !canvasId ||
            !title ||
            typeof buildDataset !== 'function'
        ) {
            throw new Error(
                'ConcordiaVisualization requires: name, canvasId, title, and buildDataset()',
            );
        }

        this.name = name;
        this.canvasId = canvasId;
        this.chartType = chartType;
        this.title = title;
        this.xLabel = xLabel;
        this.yLabel = yLabel;
        this.buildDataset = buildDataset;
        this.chartOptions = chartOptions;
        this.pageBackgroundColor = pageBackgroundColor;
        this.minContrast = minContrast;

        // Bookkeeping so that calling render() more than once on the same
        // instance does not stack listeners or duplicate DOM nodes.
        this._keyboardBinding = undefined;
        this._csvLink = undefined;

        if (aspectRatio) {
            this._cssAspectRatio = aspectRatio;
        } else {
            // Use the per-chart-type default, or fall back to 2-to-1
            this._cssAspectRatio =
                defaultAspectRatios[this.chartType] ?? '2 / 1';
        }
    }

    /**
     * Fetches `/api/visualization/<name>/`, handles errors, and renders the chart.
     * Call this once the DOM is ready. May be called again to re-render; the
     * previous chart and this instance's keyboard listeners are replaced.
     */
    async render() {
        const canvas = document.getElementById(this.canvasId);
        if (!canvas) {
            console.error(
                `ConcordiaVisualization: Canvas ID '${this.canvasId}' not found.`,
            );
            return;
        }

        // Listeners from an earlier render() point at a chart that is about
        // to be destroyed; drop them before doing anything else.
        this._unbindKeyboardNavigation();

        // Set accessibility attributes
        canvas.tabIndex = 0;
        canvas.setAttribute('role', 'img');
        canvas.setAttribute('aria-label', this.title);

        // Set aspectRatio on wrapper and make sure canvas fills it
        const wrapper = canvas.parentNode;
        wrapper.style.aspectRatio = this._cssAspectRatio;
        canvas.style.width = '100%';
        canvas.style.height = '100%';

        const context = canvas.getContext('2d');

        let resp;
        try {
            resp = await fetch(`/api/visualization/${this.name}/`);
        } catch (error) {
            console.error(
                `ConcordiaVisualization: Network error fetching '${this.name}':`,
                error,
            );
            this._handleError(context, 'No data available');
            return;
        }

        if (!resp.ok) {
            console.error(
                `ConcordiaVisualization: HTTP ${resp.status} for '${this.name}'.`,
            );
            this._handleError(context, 'No data available');
            return;
        }

        // If a chart already exists on this canvas, destroy it
        Chart.getChart(canvas)?.destroy();

        let payload;
        try {
            payload = await resp.json();
        } catch (error) {
            console.error(
                `ConcordiaVisualization: Failed to parse JSON for '${this.name}':`,
                error,
            );
            this._handleError(context, 'No data available');
            return;
        }

        let data,
            userOptions = {};
        try {
            // Let user-supplied buildDataset transform payload into { data, [options] }
            const result = this.buildDataset(payload);
            data = result.data;
            userOptions = result.options || {};
        } catch (error) {
            console.error(
                `ConcordiaVisualization: buildDataset threw for '${this.name}':`,
                error,
            );
            this._handleError(context, 'No data available');
            return;
        }

        if (!data || typeof data !== 'object') {
            console.error(
                `ConcordiaVisualization: buildDataset must return an object with a 'data' property for '${this.name}'.`,
            );
            this._handleError(context, 'No data available');
            return;
        }

        // Auto-generate accessible colors only if none provided
        this._applyAccessibleColors(data);

        // Merge options: default -> userOptions -> this.chartOptions
        const finalOptions = ConcordiaVisualization._deepMerge(
            {},
            ConcordiaVisualization._defaultOptions(
                this.title,
                this.xLabel,
                this.yLabel,
            ),
            userOptions,
            this.chartOptions,
        );

        // Create the Chart.js chart
        const chart = new Chart(context, {
            type: this.chartType,
            data: data,
            options: finalOptions,
        });

        // If CSV URL exists in payload, create a link below the canvas
        this._renderCsvLink(wrapper, payload?.csv_url);

        // Hidden live region for announcing the current slice/bar
        const live = this._ensureLiveRegion(canvas);

        // Wire up keyboard navigation
        this._bindKeyboardNavigation(canvas, chart, live);
    }

    /**
     * Instance-private helper: assign generated, contrast-checked colors to
     * `data.datasets` when no dataset specifies `backgroundColor` or
     * `borderColor` itself. Mutates `data` in place.
     *
     * With several datasets each dataset gets one color; with a single
     * dataset each label gets its own color.
     */
    _applyAccessibleColors(data) {
        const originalDatasets = data.datasets || [];
        if (originalDatasets.length === 0) {
            return;
        }

        const hasExplicit = originalDatasets.some(
            (ds) =>
                ds.backgroundColor !== undefined ||
                ds.borderColor !== undefined,
        );
        if (hasExplicit) {
            return;
        }

        if (originalDatasets.length > 1) {
            const colors = generateAccessibleColors(
                originalDatasets.length,
                this.pageBackgroundColor,
                this.minContrast,
            );
            data.datasets = originalDatasets.map((ds, index) => ({
                ...ds,
                backgroundColor: colors[index],
                borderColor: colors[index],
                borderWidth: ds.borderWidth ?? 1,
            }));
            return;
        }

        const count = data.labels?.length || 0;
        const colors = generateAccessibleColors(
            count,
            this.pageBackgroundColor,
            this.minContrast,
        );
        data.datasets = [
            {
                ...originalDatasets[0],
                backgroundColor: colors,
                borderColor: colors,
                borderWidth: originalDatasets[0].borderWidth ?? 1,
            },
        ];
    }

    /**
     * Instance-private helper: append a "Download data as CSV" link to the
     * wrapper's parent. If this instance already inserted a link that is
     * still in the document, only its href is refreshed.
     */
    _renderCsvLink(wrapper, csvUrl) {
        if (!csvUrl) {
            return;
        }

        if (this._csvLink && this._csvLink.isConnected) {
            this._csvLink.href = csvUrl;
            return;
        }

        // wrapper is the <section>, container is the <div>
        // Insert link after the wrapper, but within the outer container
        const container = wrapper.parentNode;
        const link = document.createElement('a');
        link.href = csvUrl;
        link.textContent = 'Download data as CSV';
        link.classList.add('visualization-data-link');
        link.setAttribute('target', '_blank');
        link.setAttribute('rel', 'noopener noreferrer');
        container.append(link);
        this._csvLink = link;
    }

    /**
     * Instance-private helper: return the `aria-live` region for this canvas,
     * creating it right after the canvas on first use. Reusing the element
     * avoids duplicate IDs when render() runs more than once.
     */
    _ensureLiveRegion(canvas) {
        const liveId = `${this.canvasId}-live`;
        const existing = document.getElementById(liveId);
        if (existing) {
            existing.textContent = '';
            return existing;
        }

        const live = document.createElement('div');
        live.id = liveId;
        live.setAttribute('aria-live', 'polite');
        Object.assign(live.style, {
            position: 'absolute',
            width: '1px',
            height: '1px',
            margin: '-1px',
            padding: 0,
            border: 0,
            clip: 'rect(0 0 0 0)',
        });
        canvas.parentNode.insertBefore(live, canvas.nextSibling);
        return live;
    }

    /**
     * Instance-private helper: attach focus / arrow-key handlers that step
     * through the chart's data indices, activating the tooltip and updating
     * the live region for each step.
     */
    _bindKeyboardNavigation(canvas, chart, live) {
        const meta = chart.getDatasetMeta(0).data; // first dataset's elements
        let elementIndex = 0;

        // helper to update tooltip and live text
        const highlight = (index) => {
            // build an array of every datasetIndex at this index
            const elements = chart.data.datasets
                .map((_unusedValue, datasetIndex) => ({datasetIndex, index}))
                .filter(({datasetIndex}) => {
                    // skip if that dataset doesn't actually have a bar at this index
                    return !!chart.getDatasetMeta(datasetIndex).data[index];
                });

            // Nothing to highlight (e.g. the payload contained no data points)
            if (elements.length === 0) {
                return;
            }

            // get a tooltip-friendly position from one of the elements
            const {x, y} = chart
                .getDatasetMeta(elements[0].datasetIndex)
                .data[index].tooltipPosition();

            // activate them all
            chart.setActiveElements(elements);
            chart.tooltip.setActiveElements(elements, {x, y});
            chart.update();

            // update the live region:
            live.textContent =
                `${chart.data.labels?.[index] ?? ''} - ` +
                elements
                    .map(({datasetIndex}) => {
                        const ds = chart.data.datasets[datasetIndex];
                        return `${ds.label}: ${ds.data[index]}`;
                    })
                    .join(', ');
        };

        // initialize on focus
        const onFocus = () => {
            elementIndex = 0;
            highlight(elementIndex);
        };

        // arrow-key handling
        const onKeydown = (event) => {
            const forward =
                event.key === 'ArrowRight' || event.key === 'ArrowDown';
            const backward =
                event.key === 'ArrowLeft' || event.key === 'ArrowUp';
            if (!forward && !backward) {
                return; // ignore other keys
            }
            if (meta.length === 0) {
                return; // empty chart: avoid `% 0` (NaN) and leave the key alone
            }

            elementIndex = forward
                ? (elementIndex + 1) % meta.length
                : (elementIndex - 1 + meta.length) % meta.length;
            event.preventDefault();
            highlight(elementIndex);
        };

        canvas.addEventListener('focus', onFocus);
        canvas.addEventListener('keydown', onKeydown);
        this._keyboardBinding = {canvas, onFocus, onKeydown};
    }

    /**
     * Instance-private helper: remove the listeners installed by the last
     * `_bindKeyboardNavigation` call on this instance, if any.
     */
    _unbindKeyboardNavigation() {
        const binding = this._keyboardBinding;
        if (!binding) {
            return;
        }
        binding.canvas.removeEventListener('focus', binding.onFocus);
        binding.canvas.removeEventListener('keydown', binding.onKeydown);
        this._keyboardBinding = undefined;
    }

    /**
     * Instance-private helper: destroy any existing chart on this canvas,
     * draw a blank chart with title + axes, and overlay an error message.
     */
    _handleError(context, message) {
        renderEmptyChart(context, {
            title: this.title,
            xLabel: this.xLabel,
            yLabel: this.yLabel,
            chartType: this.chartType,
        });
        renderErrorOverlay(context, message);

        // Insert a visually hidden `role="alert"` element after the canvas so
        // that UAs which can't read the canvas (such as screen readers) still
        // get the error message.
        const canvas = context.canvas;
        const container = canvas.parentNode;
        const alert = document.createElement('div');
        alert.setAttribute('role', 'alert');
        alert.classList.add('visually-hidden');
        alert.textContent = message;
        container.insertBefore(alert, canvas.nextSibling);
    }

    /**
     * Default Chart.js options (title + axes) for a "real" chart.
     * Individual visualizations can override or extend these via userOptions.
     */
    static _defaultOptions(title, xLabel, yLabel) {
        return {
            responsive: true,
            maintainAspectRatio: false,
            plugins: {
                title: {
                    display: true,
                    text: title,
                },
                tooltip: {
                    mode: 'index',
                    intersect: false,
                },
                legend: {
                    position: 'top',
                    labels: {
                        boxWidth: 12,
                        padding: 8,
                    },
                },
            },
            interaction: {
                mode: 'index',
                intersect: false,
            },
            scales: {
                x: {
                    title: {
                        display: !!xLabel,
                        text: xLabel,
                    },
                },
                y: {
                    beginAtZero: true,
                    title: {
                        display: !!yLabel,
                        text: yLabel,
                    },
                },
            },
        };
    }

    /**
     * Simple deep-merge of multiple objects into `target`.
     * Later sources overwrite earlier keys. Plain nested objects are merged
     * recursively; arrays, DOM elements and primitives are assigned as-is.
     *
     * @param {Object} target - object that receives the merged keys (mutated)
     * @param {...Object} sources - objects to merge, in order
     * @returns {Object} `target`
     */
    static _deepMerge(target, ...sources) {
        // HTMLElement only exists in browsers; guard so the merge also works
        // where there is no DOM (tests, server-side tooling).
        const hasDom = typeof HTMLElement !== 'undefined';

        for (const source of sources) {
            if (source && typeof source === 'object') {
                for (const [key, value] of Object.entries(source)) {
                    // Skip keys that could be used to tamper with prototypes
                    if (
                        key === '__proto__' ||
                        key === 'constructor' ||
                        key === 'prototype'
                    ) {
                        continue;
                    }

                    const isDomElement = hasDom && value instanceof HTMLElement;
                    if (
                        value &&
                        typeof value === 'object' &&
                        !Array.isArray(value) &&
                        !isDomElement
                    ) {
                        if (!target[key] || typeof target[key] !== 'object') {
                            target[key] = {};
                        }
                        ConcordiaVisualization._deepMerge(target[key], value);
                    } else {
                        target[key] = value;
                    }
                }
            }
        }
        return target;
    }
}


================================================
FILE: concordia/static/js/src/modules/quick-tips.js
================================================
import $ from 'jquery';
import {Modal} from 'bootstrap';

// Remove every localStorage entry whose key starts with "campaign-"
function clearCache() {
    Object.keys(localStorage)
        .filter((storedKey) => storedKey.startsWith('campaign-'))
        .forEach((storedKey) => {
            localStorage.removeItem(storedKey);
        });
}

/**
 * Show the tutorial popup the first time a visitor opens a campaign.
 *
 * Reads the campaign slug and the `userAuthenticated` / `hasAsset` flags from
 * the `#campaign-data` element's data attributes. A `campaign-<slug>` key in
 * localStorage records that the campaign has been seen. For unauthenticated
 * visitors the stored `campaign-*` keys are cleared when the current campaign
 * has not been seen, or when the page has no campaign slug.
 */
function initCampaignTutorial() {
    const campaignData = document.getElementById('campaign-data');
    if (!campaignData) {
        return;
    }
    if (typeof Storage === 'undefined') return;

    const campaignSlug = campaignData.dataset.campaignSlug;
    const isAuthenticated = campaignData.dataset.userAuthenticated === 'true';
    const hasAsset = campaignData.dataset.hasAsset === 'true';

    if (!campaignSlug) {
        if (!isAuthenticated) {
            clearCache();
        }
        return;
    }

    const keyName = `campaign-${campaignSlug}`;
    if (localStorage.getItem(keyName)) {
        return; // already seen
    }

    if (!isAuthenticated) {
        clearCache();
    }

    if (!hasAsset) {
        return;
    }

    if (typeof window.setTutorialHeight === 'function') {
        window.setTutorialHeight();
    }

    $(function () {
        const modalElement = document.getElementById('tutorial-popup');
        if (!modalElement) {
            // No popup markup on this page; constructing a Modal without an
            // element would fail, so there is nothing to show.
            return;
        }
        const modal = new Modal(modalElement);
        modal.show();
    });

    localStorage.setItem(keyName, 'true');
}

// Run the tutorial check once the document has been parsed, since
// initCampaignTutorial looks up #campaign-data in the DOM.
document.addEventListener('DOMContentLoaded', initCampaignTutorial);

/**
 * Give every slide in `#card-carousel` the height of the tallest slide.
 *
 * A slide that reports no height is estimated from its first child element's
 * offsetHeight plus 48px; if it has no child element, a fixed fallback height
 * is used.
 */
function setTutorialHeight() {
    const $carouselItems = $('#card-carousel .carousel-item');
    const heights = $carouselItems
        .map(function () {
            let height = $(this).height();
            if (height <= 0) {
                // `this` is the DOM element. jQuery's `.children` is a method,
                // so indexing it (`$(this).children[0]`) is always undefined;
                // read the first child element from the DOM node instead.
                const firstChild = this.firstElementChild;
                if (firstChild) {
                    height = firstChild.offsetHeight + 48;
                } else {
                    return 517.195;
                }
            }
            return height;
        })
        .get();

    if (heights.length === 0) {
        return; // no carousel items on this page
    }

    $carouselItems.height(Math.max(...heights));
}

export {setTutorialHeight};

// Expose globally so inline HTML can see it
window.setTutorialHeight = setTutorialHeight;


================================================
FILE: concordia/static/js/src/modules/turnstile.js
================================================
/* global turnstile */

/**
 * Reset a Turnstile widget through the global `turnstile` API.
 *
 * @param {string} [widgetId] - forwarded to `turnstile.reset`; may be omitted
 */
function resetTurnstile(widgetId) {
    // The global may be missing entirely, so probe it with typeof first
    const api = typeof turnstile === 'undefined' ? null : turnstile;

    if (api === null || typeof api.reset !== 'function') {
        console.error(
            'Unable to reset turnstile. Turnstile.reset is not a function.',
        );
        return;
    }

    api.reset(widgetId);
}

export {resetTurnstile};


================================================
FILE: concordia/static/js/src/modules/visualization-errors.js
================================================
import Chart from 'chart.js/auto';

/**
 * Replace whatever chart is attached to the context's canvas with a chart
 * that has no labels and no datasets, so only the title and axes are drawn.
 *
 * @param {CanvasRenderingContext2D} context
 * @param {Object} options
 * @param {string} options.title - the chart's title text
 * @param {string} options.xLabel - x-axis title
 * @param {string} options.yLabel - y-axis title
 * @param {string} [options.chartType] - Chart.js type (default: 'bar')
 * @returns {Chart} the newly created (empty) Chart instance
 */
export function renderEmptyChart(
    context,
    {title, xLabel, yLabel, chartType = 'bar'},
) {
    // Only one chart may own a canvas; get rid of a previous one first
    Chart.getChart(context.canvas)?.destroy();

    // An axis title is displayed only when a label was supplied
    const axisTitle = (label) => ({
        display: Boolean(label),
        text: label,
    });

    const plugins = {
        title: {display: true, text: title},
        tooltip: {enabled: false},
        legend: {display: false},
    };

    const scales = {
        x: {title: axisTitle(xLabel)},
        y: {beginAtZero: true, title: axisTitle(yLabel)},
    };

    return new Chart(context, {
        type: chartType,
        data: {labels: [], datasets: []},
        options: {responsive: true, plugins, scales},
    });
}

/**
 * Draws a centered error message overlay on top of whatever's already been
 * rendered on the chart canvas. This does *not* destroy or modify the chart;
 * it simply paints a translucent rectangle and places text in the middle.
 *
 * The canvas' `width`/`height` are backing-store (device) pixels, whereas a
 * context that has been scaled for a high-DPI display (Chart.js applies the
 * device pixel ratio as a transform) draws in CSS pixels. The canvas size is
 * therefore divided by the context's current scale so the overlay stays
 * centered on such displays.
 *
 * @param {CanvasRenderingContext2D} context
 * @param {string} message
 * @param {Object} [options]
 * @param {string} [options.backgroundColor] - CSS color for overlay (default: "rgba(255, 255, 255, 0.6)")
 * @param {string} [options.textColor] - CSS color for text (default: "#a00")
 * @param {string} [options.font] - CSS font for text (default: "bold 16px sans-serif")
 */
export function renderErrorOverlay(
    context,
    message,
    {
        backgroundColor = 'rgba(255, 255, 255, 0.6)',
        textColor = '#a00',
        font = 'bold 16px sans-serif',
    } = {},
) {
    // Work out how much the context is scaled relative to the backing store
    let scaleX = 1;
    let scaleY = 1;
    if (typeof context.getTransform === 'function') {
        const transform = context.getTransform();
        scaleX = Math.abs(transform.a) || 1;
        scaleY = Math.abs(transform.d) || 1;
    }

    // Canvas size expressed in the context's own coordinate units
    const width = context.canvas.width / scaleX;
    const height = context.canvas.height / scaleY;

    // Draw a semi-transparent rectangle
    context.save();
    context.fillStyle = backgroundColor;
    context.fillRect(0, 0, width, height);
    context.restore();

    // Draw the error text centered
    context.save();
    context.fillStyle = textColor;
    context.font = font;
    context.textAlign = 'center';
    context.textBaseline = 'middle';
    context.fillText(message, width / 2, height / 2);
    context.restore();
}


================================================
FILE: concordia/static/js/src/ocr.js
================================================
import 'bootstrap/dist/css/bootstrap.min.css';
import {Modal} from 'bootstrap';

// Once the DOM is parsed, configure the "Transcribe with OCR" link according
// to its data-authenticated attribute: either wire it to the OCR modal or
// mark it disabled and point it at the login page.
document.addEventListener('DOMContentLoaded', () => {
    const ocrLink = document.getElementById('ocr-transcription-link');
    if (!ocrLink) {
        return;
    }

    if (ocrLink.dataset.authenticated !== 'true') {
        const loginUrl =
            '/accounts/login/?next=' +
            encodeURIComponent(window.location.pathname);

        ocrLink.classList.add('disabled');
        ocrLink.setAttribute('aria-disabled', 'true');
        ocrLink.setAttribute('href', loginUrl);
        ocrLink.setAttribute('title', 'Log in to use "Transcribe with OCR"');

        // Make sure the link cannot open the modal
        ocrLink.removeAttribute('data-bs-toggle');
        ocrLink.removeAttribute('data-bs-target');
        return;
    }

    // Authenticated: enable the link and let it open the OCR modal
    ocrLink.classList.remove('disabled');
    for (const attribute of ['aria-disabled', 'tabindex']) {
        ocrLink.removeAttribute(attribute);
    }
    ocrLink.setAttribute('data-bs-toggle', 'modal');
    ocrLink.setAttribute('data-bs-target', '#ocr-transcription-modal');
    ocrLink.setAttribute('title', 'Transcribe with OCR');
});

// Swap dialogs: hide the OCR transcription modal and show the language
// selection modal.
function selectLanguage() {
    const [ocrModal, langModal] = [
        'ocr-transcription-modal',
        'language-selection-modal',
    ]
        .map((elementId) => document.getElementById(elementId))
        .map((modalElement) => Modal.getOrCreateInstance(modalElement));

    ocrModal.hide();
    langModal.show();
}

// Clicking the "select language" button (when the page has one) switches
// from the OCR modal to the language selection modal.
const selectLanguageButton = document.getElementById('select-language-button');
selectLanguageButton?.addEventListener('click', selectLanguage);

export {selectLanguage};


================================================
FILE: concordia/static/js/src/password-validation.js
================================================
import $ from 'jquery';

// On DOM ready: render the password requirement checklist next to the
// password field and keep it, plus the field's validity, in sync as the user
// types.
$(function () {
    // Each requirement has the id of its <li>, the text shown to the user and
    // a predicate that receives the current password value.
    var requirements = [
        {
            id: 'pw-length',
            text: 'At least 8 characters long',
            test: function (value) {
                return value.length >= 8;
            },
        },
        {
            id: 'pw-uppercase',
            text: '1 or more uppercase characters',
            test: function (value) {
                return /[A-Z]/.test(value);
            },
        },
        {
            id: 'pw-digits',
            text: '1 or more digits',
            test: function (value) {
                return /\d/.test(value);
            },
        },
        {
            id: 'pw-special',
            text: '1 or more special characters',
            test: function (value) {
                // anything that is not a digit, whitespace or an ASCII letter
                return /[^\d\sa-z]/i.test(value);
            },
        },
    ];
    var $password1 = $('#id_password1,#id_new_password1').removeAttr('title');
    var $requirementsList = $password1
        .siblings('.form-text')
        .find('ul')
        .addClass('list-unstyled')
        .empty();

    for (const requirement of requirements) {
        $('<li>')
            .attr('id', requirement.id)
            .text(requirement.text)
            .appendTo($requirementsList);
    }

    $password1.on('input change', function () {
        var currentValue = this.value;
        var validity = true;

        for (const requirement of requirements) {
            var passed = requirement.test(currentValue);
            // The <li> only exists if the help-text list was found above;
            // validation must still work when it was not.
            var li = document.getElementById(requirement.id);

            if (li) {
                li.className = passed ? 'text-success' : 'text-warning';
            }
            if (!passed) {
                validity = false;
            }
        }

        if (validity) {
            this.removeAttribute('aria-invalid');
            this.setCustomValidity('');
        } else {
            this.setAttribute('aria-invalid', 'true');
            this.setCustomValidity(
                'Your password does not meet the requirements',
            );
        }
    });
});


================================================
FILE: concordia/static/js/src/profile-fields.js
================================================
import $ from 'jquery';
import {getPages} from './recent-pages.js';

// Reload the recent pages list using the current query string with its
// `order_by` parameter replaced by the given value.
function reloadRecentPagesOrderedBy(orderBy) {
    const query = new URLSearchParams(window.location.search);
    query.set('order_by', orderBy);
    getPages(`?${query.toString()}`);
}

// Exposed on window so they can be called from outside this module
window.sortDateAscending = function () {
    reloadRecentPagesOrderedBy('date-ascending');
};
window.sortDateDescending = function () {
    reloadRecentPagesOrderedBy('date-descending');
};

// Guarded by a window-level flag so the setup below runs only once
if (!window._profileFieldsInitialized) {
    window._profileFieldsInitialized = true;

    // Load the recent pages right away when that tab is the active one
    $(document).ready(() => {
        const profilePage = document.getElementById('profile-page');
        const recentTabActive =
            profilePage?.dataset.activeTab === 'recent' ||
            window.location.hash === '#recent';
        if (recentTabActive) {
            getPages();
        }
    });

    // Disable form submissions, if there are invalid fields
    window.addEventListener('load', () => {
        // Every form that opts in to custom Bootstrap validation styles
        document.querySelectorAll('.needs-validation').forEach((form) => {
            form.addEventListener('submit', (submitEvent) => {
                $('#validation-confirmation').hide();
                const isValid = form.checkValidity();
                if (!isValid) {
                    submitEvent.preventDefault();
                    submitEvent.stopPropagation();
                }
                form.classList.add('was-validated');
            });
        });
    });
}


================================================
FILE: concordia/static/js/src/quick-tips-setup.js
================================================
import $ from 'jquery';

import {setTutorialHeight} from './modules/quick-tips.js';
import {trackUIInteraction} from './base.js';

// Recompute the carousel height once the popup is actually visible
$('#tutorial-popup').on('shown.bs.modal', function () {
    setTutorialHeight();
});

// Report a Quick Tips click with the given label
function trackQuickTipsInteraction(element, label) {
    trackUIInteraction(element, 'Quick Tips', 'click', label);
}

$('#quick-tips').on('click', function () {
    trackQuickTipsInteraction($(this), 'Open');
});

$('#previous-card').on('click', function () {
    trackQuickTipsInteraction($(this), 'Back');
});

$('#next-card').on('click', function () {
    trackQuickTipsInteraction($(this), 'Next');
});

$('.carousel-indicators li').on('click', function () {
    // Position of the clicked indicator among its siblings
    let index = [...this.parentElement.children].indexOf(this);
    trackQuickTipsInteraction($(this), `Carousel ${index}`);
});

$('#tutorial-popup').on('hidden.bs.modal', function () {
    // We're tracking whenever the popup closes, so we don't separately track the close button being clicked
    trackUIInteraction($(this), 'Quick Tips', 'click', 'Close');
});

$('#tutorial-popup').on('shown-on-load', function () {
    // Capture the popup now: inside a plain `function` timer callback `this`
    // is no longer the element the handler was bound to.
    const $popup = $(this);
    // We set a timeout to make sure the analytics code is loaded before trying to track
    setTimeout(() => {
        trackUIInteraction($popup, 'Quick Tips', 'load', 'Open');
    }, 1000);
});


================================================
FILE: concordia/static/js/src/recent-pages.js
================================================
import $ from 'jquery';

// The in-flight "recent pages" request, if any, so it can be cancelled when a
// newer one starts.
let currentRequest;

/**
 * Load the recent pages fragment from `/account/get_pages` and render it into
 * `#recent-pages`. A request that is still in flight is aborted first.
 *
 * @param {string} [queryString=window.location.search]
 *   Query string (including the leading "?") appended to the request URL.
 */
export function getPages(queryString = window.location.search) {
    // Show indicator
    $('#recent-pages').html(
        '<p class="text-center py-3"><span class="spinner-border spinner-border-sm"></span>Loading...</p>',
    );

    if (currentRequest) {
        // Cancel previous before starting a new one
        currentRequest.abort();
    }
    currentRequest = $.ajax({
        type: 'GET',
        url: '/account/get_pages' + queryString,
        dataType: 'json',
        success: function (data) {
            // Clean up old elements
            // NOTE(review): this relies on a `_bs_dropdown` property being
            // present on the toggle element; confirm that the Bootstrap
            // version in use actually exposes dropdown instances that way.
            const dropdownElements = document.querySelectorAll(
                '[data-bs-toggle="dropdown"]',
            );
            for (const dropdownElement of dropdownElements) {
                const instance = dropdownElement._bs_dropdown;
                if (instance && typeof instance.dispose === 'function') {
                    instance.dispose();
                }
            }

            var recentPages = document.createElement('div');
            recentPages.className = 'col-md';
            recentPages.innerHTML = data.content; // render data into the DOM
            $('#recent-pages').fadeOut(100, function () {
                $(this).html(recentPages).fadeIn(150);
            });
        },
        error: function (jqXHR, textStatus) {
            // abort() reports through this callback as well. That is the
            // request we cancelled on purpose, so keep the loading indicator
            // for its replacement instead of showing a failure.
            if (textStatus === 'abort') {
                return;
            }
            $('#recent-pages').html('<p>Failed to load pages.</p>');
        },
        complete: function (jqXHR) {
            // clear the reference, but only if it still points at this request
            if (currentRequest === jqXHR) {
                currentRequest = undefined;
            }
        },
    });
}

// Delegated handlers for the "recent pages" tab. A window-level flag keeps
// them from being registered more than once.
if (!window._recentPagesHandlersInitialized) {
    window._recentPagesHandlersInitialized = true;

    const $document = $(document);

    // First click on the tab loads its content
    $document.on('click', '#recent-tab', function () {
        if (this.dataset.loaded) {
            return;
        }
        this.dataset.loaded = 'true';
        getPages(window.location.search);
    });

    // Date filter form: submit via AJAX with the form's fields as the query
    $document.on('submit', '.date-filter', function (submitEvent) {
        submitEvent.preventDefault();

        const formQuery = new URLSearchParams(new FormData(this));
        getPages(`?${formQuery.toString()}`);
    });

    // Links in the current-filters area carry the query to load
    $document.on('click', '#current-filters a', function (clickEvent) {
        clickEvent.preventDefault();

        // e.g. "?tab=recent"
        getPages($(this).attr('href'));
    });

    // Filter links: apply the link's parameters on top of the current query.
    // A "delete:<name>" parameter removes <name> instead of setting it.
    $document.on('click', '.dropdown-menu a.filter-link', function (clickEvent) {
        clickEvent.preventDefault();

        const deletePrefix = 'delete:';
        const target = $(this).attr('href') || '';
        const linkQuery = new URLSearchParams(
            target.startsWith('?') ? target.slice(1) : target,
        );
        const mergedQuery = new URLSearchParams(window.location.search);

        linkQuery.forEach((value, key) => {
            if (key.startsWith(deletePrefix)) {
                mergedQuery.delete(key.slice(deletePrefix.length));
            } else {
                mergedQuery.set(key, value);
            }
        });
        finalizePageUpdate(mergedQuery);
    });

    // Intercept clicks and load via AJAX instead of full page reload
    $document.on('click', '.pagination a.page-link', function (clickEvent) {
        clickEvent.preventDefault();

        let pageQuery = $(this).attr('href') || '';
        if (!pageQuery.startsWith('?')) {
            pageQuery = '?' + pageQuery;
        }

        getPages(pageQuery);

        // Update the URL in the address bar
        history.replaceState(undefined, '', pageQuery + window.location.hash);
    });

    // Page jump form: go to the selected page, keeping the other filters
    $document.on(
        'submit',
        'nav[aria-label="Page Jump"] form',
        function (submitEvent) {
            submitEvent.preventDefault();

            const $form = $(this);
            const jumpQuery = new URLSearchParams(window.location.search);

            jumpQuery.set('page', $form.find('select[name="page"]').val());

            // Preserve other filters
            for (const hiddenInput of $form
                .find('input[type="hidden"]')
                .get()) {
                jumpQuery.set(hiddenInput.name, hiddenInput.value);
            }
            finalizePageUpdate(jumpQuery);
        },
    );
}

/**
 * Apply a set of query parameters to the page list.
 *
 * When no `tab` parameter is present it is set to `recent`. The list is then
 * reloaded through `getPages` and the address bar is rewritten with
 * `history.replaceState` (keeping the current hash), so no navigation occurs.
 *
 * @param {URLSearchParams} currentParameters - Parameters to apply; mutated
 *     in place when `tab` is missing.
 */
function finalizePageUpdate(currentParameters) {
    const hasTab = currentParameters.has('tab');
    if (!hasTab) {
        currentParameters.set('tab', 'recent');
    }

    const queryString = `?${currentParameters.toString()}`;

    // Load the matching pages via AJAX.
    getPages(queryString);

    // Mirror the new query in the address bar without reloading.
    const updatedUrl = queryString + window.location.hash;
    history.replaceState(undefined, '', updatedUrl);
}


================================================
FILE: concordia/static/js/src/viewer-split.js
================================================
import {seadragonViewer} from './viewer.js';
import Split from 'split.js';

// Active Split.js instance; assigned once a layout has been created.
let pageSplit;
let contributeContainer = document.getElementById('contribute-container');
let ocrSection = document.getElementById('ocr-section');
let editorColumn = document.getElementById('editor-column');
let viewerColumn = document.getElementById('viewer-column');
// Selectors handed to Split.js, in display order.
let layoutColumns = ['#viewer-column', '#editor-column'];
// localStorage keys holding the pane sizes for each orientation.
let verticalKey = 'transcription-split-sizes-vertical';
let horizontalKey = 'transcription-split-sizes-horizontal';

/**
 * Read a JSON-encoded preference from localStorage.
 *
 * @param {string} key - localStorage key to read.
 * @param {*} fallback - Value returned when nothing usable is stored.
 * @returns {*} The parsed value, or `fallback` when the key is missing or
 *     empty, the stored text is not valid JSON, or storage access throws.
 */
function readStoredPreference(key, fallback) {
    try {
        const raw = localStorage.getItem(key);
        return raw ? JSON.parse(raw) : fallback;
    } catch {
        // A corrupt entry (or blocked storage) must not prevent the
        // transcription layout from initializing; use the default instead.
        return fallback;
    }
}

let sizesVertical = readStoredPreference(verticalKey, [50, 50]);

let sizesHorizontal = readStoredPreference(horizontalKey, [50, 50]);

// 'h' or 'v'; 'h' is the default when nothing has been saved.
let splitDirection = readStoredPreference('transcription-split-direction', 'h');

/**
 * Remember the pane sizes for whichever orientation is currently active.
 *
 * Updates the matching in-memory variable (`sizesHorizontal` or
 * `sizesVertical`) and writes the sizes to localStorage as JSON under the
 * corresponding key.
 *
 * @param {Array} sizes - Pane sizes as reported by the split instance.
 */
function saveSizes(sizes) {
    const isHorizontal = splitDirection == 'h';

    if (isHorizontal) {
        sizesHorizontal = sizes;
    } else {
        sizesVertical = sizes;
    }

    const storageKey = isHorizontal ? horizontalKey : verticalKey;
    localStorage.setItem(storageKey, JSON.stringify(sizes));
}

/**
 * Persist the chosen split orientation to localStorage as JSON.
 *
 * @param {string} direction - Orientation marker to store (callers in this
 *     file pass 'h' or 'v').
 */
function saveDirection(direction) {
    const serialized = JSON.stringify(direction);
    localStorage.setItem('transcription-split-direction', serialized);
}

/**
 * Switch the transcription page to the vertical (stacked) layout.
 *
 * Records 'v' as the active direction, turns the contribute container into a
 * flex column, removes `h-100` from the viewer column, moves the OCR section
 * (when there is one) to the top of the editor column, and creates the split
 * using the saved vertical sizes.
 *
 * @returns {*} Whatever `Split` returns for the two layout columns.
 */
function verticalSplit() {
    splitDirection = 'v';
    saveDirection(splitDirection);

    if (contributeContainer) {
        const containerClasses = contributeContainer.classList;
        containerClasses.remove('flex-row');
        containerClasses.add('flex-column');
    }

    viewerColumn.classList.remove('h-100');

    if (ocrSection != undefined) {
        editorColumn.prepend(ocrSection);
    }

    // Panes and gutter are sized through flex-basis rather than width/height.
    const splitOptions = {
        sizes: sizesVertical,
        minSize: 100,
        gutterSize: 8,
        direction: 'vertical',
        elementStyle: (dimension, size, gutterSize) => ({
            'flex-basis': `calc(${size}% - ${gutterSize}px)`,
        }),
        gutterStyle: (dimension, gutterSize) => ({
            'flex-basis': `${gutterSize}px`,
        }),
        onDragEnd: saveSizes,
    };

    return Split(layoutColumns, splitOptions);
}
/**
 * Switch the transcription page to the horizontal (side-by-side) layout.
 *
 * Records 'h' as the active direction, turns the contribute container into a
 * flex row, adds `h-100` to the viewer column, moves the OCR section (when
 * there is one) to the end of the viewer column, and creates the split using
 * the saved horizontal sizes. No `direction` option is passed to `Split`.
 *
 * @returns {*} Whatever `Split` returns for the two layout columns.
 */
function horizontalSplit() {
    splitDirection = 'h';
    saveDirection(splitDirection);

    if (contributeContainer) {
        const containerClasses = contributeContainer.classList;
        containerClasses.remove('flex-column');
        containerClasses.add('flex-row');
    }

    viewerColumn.classList.add('h-100');

    if (ocrSection != undefined) {
        viewerColumn.append(ocrSection);
    }

    // Panes and gutter are sized through flex-basis rather than width/height.
    const splitOptions = {
        sizes: sizesHorizontal,
        minSize: 100,
        gutterSize: 8,
        elementStyle: (dimension, size, gutterSize) => ({
            'flex-basis': `calc(${size}% - ${gutterSize}px)`,
        }),
        gutterStyle: (dimension, gutterSize) => ({
            'flex-basis': `${gutterSize}px`,
        }),
        onDragEnd: saveSizes,
    };

    return Split(layoutColumns, splitOptions);
}

/**
 * Attach the click handler for one layout toggle button.
 *
 * Clicking the button while a different orientation is active destroys the
 * current split, builds the requested one and then resets the viewer zoom.
 * Clicking it while its own orientation is already active does nothing.
 *
 * @param {string} buttonId - Id of the toggle button element.
 * @param {string} direction - Orientation this button selects ('h' or 'v').
 * @param {Function} createSplit - Builds and returns the new split instance.
 */
function bindLayoutToggle(buttonId, direction, createSplit) {
    const button = document.getElementById(buttonId);
    if (!button) {
        // Without the button there is nothing to bind; the initial split
        // created below keeps working.
        return;
    }

    button.addEventListener('click', function () {
        if (splitDirection == direction) {
            return;
        }
        if (pageSplit != undefined) {
            pageSplit.destroy();
        }
        pageSplit = createSplit();
        setTimeout(function () {
            // Some quirk in the viewer makes this sometimes not work,
            // depending on the rotation, unless it is delayed; less than
            // 10ms did not work reliably.
            // Passing `true` as the third argument makes the zoom happen
            // immediately so it doesn't conflict with the CSS flexbox
            // resizing of the container.
            seadragonViewer.viewport.zoomTo(1, undefined, true);
        }, 10);
    });
}

// The split layout only applies on pages that have both the contribute
// container and an initialized viewer.
if (contributeContainer && seadragonViewer) {
    pageSplit = splitDirection == 'v' ? verticalSplit() : horizontalSplit();

    bindLayoutToggle('viewer-layout-horizontal', 'h', horizontalSplit);
    bindLayoutToggle('viewer-layout-vertical', 'v', verticalSplit);
}


================================================
FILE: concordia/static/js/src/viewer.js
================================================
import {debounce, displayHtmlMessage} from './base.js';
import screenfull from 'screenfull';
import OpenSeadragon from 'openseadragon';
import {
    initializeFiltering,
    GAMMA,
    INVERT,
    THRESHOLDING,
} from 'openseadragon-filters';

// Element whose data-* attributes carry the viewer configuration. When it is
// absent, none of the viewer setup below runs.
const viewerElement = document.getElementById('viewer-data');

// Assigned only when viewerElement exists; otherwise they remain undefined.
let viewerData;
let seadragonViewer;
let filterPlugin;

if (viewerElement) {
    viewerData = viewerElement.dataset;

    // Create the viewer inside #asset-image. The toolbar and the individual
    // control buttons are referenced by element id, and the image URL and
    // prefix URL come from the data attributes read above.
    seadragonViewer = OpenSeadragon({
        id: 'asset-image',
        prefixUrl: viewerData.prefixUrl,
        tileSources: {
            type: 'image',
            url: viewerData.tileSourceUrl,
        },
        gestureSettingsTouch: {
            pinchRotate: true,
        },
        showNavigator: true,
        showRotationControl: true,
        showFlipControl: true,
        toolbar: 'viewer-controls',
        zoomInButton: 'viewer-zoom-in',
        zoomOutButton: 'viewer-zoom-out',
        homeButton: 'viewer-home',
        rotateLeftButton: 'viewer-rotate-left',
        rotateRightButton: 'viewer-rotate-right',
        flipButton: 'viewer-flip',
        crossOriginPolicy: 'Anonymous',
        drawer: 'canvas',
        defaultZoomLevel: 0,
        homeFillsView: false,
    });

    // Initialize the filtering plugin; updateFilters() later calls
    // setFilterOptions on the returned instance.
    filterPlugin = initializeFiltering(seadragonViewer);

    // We need to define our own fullscreen function rather than using OpenSeadragon's
    // because the built-in fullscreen function overwrites the DOM with the viewer,
    // breaking our extra controls, such as the image filters.
    if (screenfull.isEnabled) {
        let fullscreenButton = document.querySelector('#viewer-fullscreen');
        // Toggle fullscreen for the element named by the button's
        // data-target selector.
        fullscreenButton.addEventListener('click', function (event) {
            event.preventDefault();
            let targetElement = document.querySelector(
                fullscreenButton.dataset.target,
            );
            if (screenfull.isFullscreen) {
                screenfull.exit();
            } else {
                screenfull.request(targetElement);
            }
        });
        // Listen for fullscreen changes for proper flex container alignment
        screenfull.on('change', () => {
            let targetElement = document.querySelector(
                fullscreenButton.dataset.target,
            );
            if (screenfull.isFullscreen) {
                // Ensure the flex container takes full width of the screen
                targetElement.style.width = '100vw';
                targetElement.style.display = 'flex';
            } else {
                // Clear the inline overrides applied while fullscreen
                targetElement.style.width = '';
                targetElement.style.display = '';
            }
        });
    }

    // The buttons configured as controls for the viewer don't properly get focus
    // when clicked. This mostly isn't a problem, but causes odd-looking behavior
    // when one of the extra buttons in the control bar is clicked (and therefore
    // focused) first--clicking the control button leaves the focus on the extra
    // button.
    // TODO: Attempting to add focus to the clicked button here doesn't consistently
    // work for unknown reasons, so it just removes focus from the extra buttons
    // for now
    let viewerControlButtons = document.querySelectorAll(
        '.viewer-control-button',
    );
    for (const node of viewerControlButtons) {
        node.addEventListener('click', function () {
            let focusedButton = document.querySelector(
                '.extra-control-button:focus',
            );
            if (focusedButton) {
                focusedButton.blur();
            }
        });
    }
}

/*
 * Image filter handling
 */

// Descriptors for the image filters offered in the viewer. Each entry names
// the form and input that control the filter and provides getFilter(), which
// returns a filter processor for the current input state, or undefined when
// the filter should not be applied.
//
// Input values are strings, so they are parsed to numbers *before* the NaN
// check: Number.isNaN() never reports a string as NaN, and an empty string
// would otherwise coerce to 0 in the range comparisons.
let availableFilters = [
    {
        formId: 'gamma-form',
        inputId: 'gamma',
        // Gamma applies for values in [0, 5] other than 1.
        getFilter: function () {
            const gamma = Number.parseFloat(
                document.getElementById(this.inputId).value,
            );
            if (
                !Number.isNaN(gamma) &&
                gamma !== 1 &&
                gamma >= 0 &&
                gamma <= 5
            ) {
                return GAMMA(gamma);
            }
        },
    },
    {
        formId: 'invert-form',
        inputId: 'invert',
        // Invert applies whenever the checkbox is checked.
        getFilter: function () {
            const checked = document.getElementById(this.inputId).checked;
            if (checked) {
                return INVERT();
            }
        },
    },
    {
        formId: 'threshold-form',
        inputId: 'threshold',
        // Thresholding applies for values in (0, 255]; the fractional part
        // is dropped before the value is handed to the filter.
        getFilter: function () {
            const threshold = Number.parseFloat(
                document.getElementById(this.inputId).value,
            );
            if (
                !Number.isNaN(threshold) &&
                threshold > 0 &&
                threshold <= 255
            ) {
                return THRESHOLDING(Math.trunc(threshold));
            }
        },
    },
];

/**
 * Recompute the active image filters and hand them to the filtering plugin.
 *
 * Every entry in `availableFilters` is asked for its filter; entries that
 * return nothing are left out. The call is skipped when no plugin instance
 * exists.
 */
function updateFilters() {
    const processors = availableFilters
        .map((filterData) => filterData.getFilter())
        .filter(Boolean);

    // setFilterOptions lives on the plugin instance, not on the viewer.
    if (!filterPlugin) {
        return;
    }

    filterPlugin.setFilterOptions({
        filters: {processors: processors},
    });
}

// Hook every filter's form and input up to updateFilters. Forms or inputs
// that are not present on the page are skipped.
if (viewerElement) {
    for (const {formId, inputId} of availableFilters) {
        const filterForm = document.getElementById(formId);
        if (filterForm) {
            filterForm.addEventListener('change', updateFilters);
            filterForm.addEventListener('reset', () => {
                // The reset event fires before the fields are actually
                // cleared, so defer updateFilters to the next event cycle
                // to read the post-reset values.
                setTimeout(updateFilters);
            });
        }

        const filterInput = document.getElementById(inputId);
        if (filterInput) {
            // Debounced so updateFilters runs once, after the user stops
            // typing or scrolling with the mouse wheel. Each event type
            // gets its own debounced wrapper.
            for (const eventName of ['keyup', 'wheel']) {
                filterInput.addEventListener(
                    eventName,
                    debounce(() => updateFilters()),
                );
            }
        }
    }
}

/*
 * Image filter form handling
 */
/**
 * Increment the input with the given id by one step and announce the change.
 *
 * Dispatches bubbling `input` and `change` events, in that order, after
 * calling the element's own `stepUp()`.
 *
 * @param {string} id - Id of the input element to step.
 * @returns {boolean} Always `false`.
 */
function stepUp(id) {
    const field = document.getElementById(id);
    field.stepUp();

    for (const eventType of ['input', 'change']) {
        field.dispatchEvent(new Event(eventType, {bubbles: true}));
    }

    return false;
}

/**
 * Decrement the input with the given id by one step and announce the change.
 *
 * Dispatches bubbling `input` and `change` events, in that order, after
 * calling the element's own `stepDown()`.
 *
 * @param {string} id - Id of the input element to step.
 * @returns {boolean} Always `false`.
 */
function stepDown(id) {
    const field = document.getElementById(id);
    field.stepDown();

    for (const eventType of ['input', 'change']) {
        field.dispatchEvent(new Event(eventType, {bubbles: true}));
    }

    return false;
}

/**
 * Reset every image filter form listed in `availableFilters`.
 *
 * Forms that are not present in the document are skipped, matching the
 * event-wiring code in this file, which also treats each filter form as
 * optional.
 */
function resetImageFilterForms() {
    for (const filterData of availableFilters) {
        const form = document.getElementById(filterData.formId);
        if (form) {
            form.reset();
        }
    }
}

if (seadragonViewer) {
    // Each numeric filter has a number field, a range slider and a pair of
    // step buttons. The number field and slider mirror each other's value,
    // and the buttons step the number field.
    const steppedControls = [
        {
            numberId: 'gamma',
            rangeId: 'gamma-range',
            upId: 'gamma-up',
            downId: 'gamma-down',
        },
        {
            numberId: 'threshold',
            rangeId: 'threshold-range',
            upId: 'threshold-up',
            downId: 'threshold-down',
        },
    ];

    for (const {numberId, rangeId, upId, downId} of steppedControls) {
        const numberField = document.getElementById(numberId);
        const rangeField = document.getElementById(rangeId);

        numberField.addEventListener('input', () => {
            rangeField.value = numberField.value;
        });

        rangeField.addEventListener('input', () => {
            numberField.value = rangeField.value;
        });

        const upButton = document.getElementById(upId);
        upButton.addEventListener('click', () => {
            stepUp(numberId);
        });

        const downButton = document.getElementById(downId);
        downButton.addEventListener('click', () => {
            stepDown(numberId);
        });
    }

    const resetButton = document.getElementById('viewer-reset');
    resetButton.addEventListener('click', resetImageFilterForms);

    // Once the viewer has opened, go to the home view so that the entire
    // image is displayed. (Workaround for a change in behavior introduced
    // during the upgrade to OpenSeadragon 5.0.1.)
    seadragonViewer.addHandler('open', () => {
        // Deferred with setTimeout so everything is fully loaded and the
        // viewport can calculate the bounds and zoom correctly.
        setTimeout(() => {
            seadragonViewer.viewport.goHome(true);
        }, 0);
    });

    seadragonViewer.addHandler('open-failed', () => {
        // The event data and error message are deliberately not used:
        // they contain the image URL, which we don't want to display.
        const contactUs = `<strong><a class="alert-link" href="${viewerData.contactUrl}" target="_blank">Contact us</a></strong>`;
        displayHtmlMessage(
            'error',
            'Unable to display image - ' + contactUs,
            'openseadragon-open-failed',
        );
    });
}

export {seadragonViewer};


================================================
FILE: concordia/static/js/src/visualizations/asset-status-by-campaign.js
================================================
import {ConcordiaVisualization} from 'concordia-visualization';

// One fill color per status series, applied by series index.
const colors = ['#FFFFFF', '#002347', '#E0F6FF', '#257DB1'];

/**
 * Build the stacked bar chart configuration from the visualization payload.
 *
 * The payload is read for `campaign_names`, `per_campaign_counts` (one entry
 * per status) and `status_labels`; series labels are matched to the count
 * entries by position.
 *
 * @param {Object} payload - Data supplied to `buildDataset`.
 * @returns {{data: Object, options: Object}} Chart data and options.
 */
function buildCampaignStatusDataset(payload) {
    const fullNames = payload.campaign_names;

    // Axis labels are cut to 20 characters plus an ellipsis.
    const shortLabels = fullNames.map((name) => {
        if (name.length > 20) {
            return name.slice(0, 20) + '…';
        }
        return name;
    });

    const countsByStatus = payload.per_campaign_counts;
    const statusLabels = payload.status_labels;

    const datasets = Object.keys(countsByStatus).map((statusKey, position) => {
        return {
            label: statusLabels[position],
            data: countsByStatus[statusKey],
            backgroundColor: colors[position],
            borderColor: 'black',
            borderWidth: 2,
        };
    });

    // Tooltips show the untruncated campaign name and "status: value".
    const tooltipCallbacks = {
        title: (tooltipItems) => fullNames[tooltipItems[0].dataIndex],
        label: (tooltipItem) =>
            `${tooltipItem.dataset.label}: ${tooltipItem.parsed.y}`,
    };

    return {
        data: {
            labels: shortLabels,
            datasets: datasets,
        },
        options: {
            scales: {
                x: {stacked: true},
                y: {stacked: true, beginAtZero: true},
            },
            plugins: {
                tooltip: {
                    callbacks: tooltipCallbacks,
                },
            },
        },
    };
}

document.addEventListener('DOMContentLoaded', () => {
    const assetStatusByCampaignChart = new ConcordiaVisualization({
        name: 'asset-status-by-campaign',
        canvasId: 'asset-status-by-campaign',
        chartType: 'bar',
        title: 'Page Status by Campaign (Active Campaigns)',
        xLabel: 'Campaign',
        yLabel: 'Page Count',
        buildDataset: buildCampaignStatusDataset,
    });

    assetStatusByCampaignChart.render();
});


================================================
FILE: concordia/static/js/src/visualizations/asset-status-overview.js
================================================
import {ConcordiaVisualization} from '../modules/concordia-visualization.js';

// Fill colors for the pie slices, in slice order.
const colors = ['#FFFFFF', '#002347', '#E0F6FF', '#257DB1'];

/**
 * Build the pie chart configuration from the visualization payload.
 *
 * Slice labels come from `payload.status_labels` and slice values from
 * `payload.total_counts`.
 *
 * @param {Object} payload - Data supplied to `buildDataset`.
 * @returns {{data: Object, options: Object}} Chart data and options.
 */
function buildStatusOverviewDataset(payload) {
    const statusSlices = {
        data: payload.total_counts,
        backgroundColor: colors,
        borderColor: 'black',
        borderWidth: 2,
    };

    // Axes are hidden: scales make no sense on a pie chart.
    const hiddenAxis = {display: false};

    return {
        data: {
            labels: payload.status_labels,
            datasets: [statusSlices],
        },
        options: {
            scales: {
                x: {...hiddenAxis},
                y: {...hiddenAxis},
            },
        },
    };
}

document.addEventListener('DOMContentLoaded', () => {
    const assetStatusOverviewChart = new ConcordiaVisualization({
        name: 'asset-status-overview',
        canvasId: 'asset-status-overview',
        chartType: 'pie',
        title: 'Page Status (Active Campaigns)',
        xLabel: '',
        yLabel: '',
        buildDataset: buildStatusOverviewDataset,
    });

    assetStatusOverviewChart.render();
});


================================================
FILE: concordia/static/js/src/visualizations/daily-activity.js
================================================
import {ConcordiaVisualization} from '../modules/concordia-visualization.js';

/**
 * Tick formatter for the date axis: labels every 4th tick starting at index 3
 * (i.e., the 4th day) and leaves the others blank.
 *
 * Must stay a regular function: it reads the tick label through `this`.
 *
 * @param {*} value - Tick value (unused).
 * @param {number} index - Position of the tick on the axis.
 * @returns {string} The label for the tick, or an empty string.
 */
function everyFourthDayLabel(value, index) {
    if ((index - 3) % 4 === 0) {
        return this.getLabelForValue(index);
    }
    return '';
}

/**
 * Build the stacked bar chart configuration from the visualization payload.
 *
 * Each entry of `payload.transcription_datasets` is copied and given a fill
 * color by position plus a border; `payload.labels` supplies the axis labels.
 *
 * @param {Object} payload - Data supplied to `buildDataset`.
 * @returns {{data: Object, options: Object}} Chart data and options.
 */
function buildDailyActivityDataset(payload) {
    const seriesColors = ['#911C42', '#BFBBDD'];

    const datasets = payload.transcription_datasets.map((series, position) => {
        return {
            ...series,
            backgroundColor: seriesColors[position],
            borderColor: '#000',
            borderWidth: 1.5,
        };
    });

    const xAxis = {
        stacked: true,
        ticks: {
            callback: everyFourthDayLabel,
            autoSkip: false,
        },
    };

    return {
        data: {
            labels: payload.labels,
            datasets: datasets,
        },
        options: {
            scales: {
                x: xAxis,
                y: {
                    stacked: true,
                },
            },
            plugins: {
                legend: {
                    display: false,
                },
            },
        },
    };
}

document.addEventListener('DOMContentLoaded', () => {
    const dailyActivityChart = new ConcordiaVisualization({
        name: 'daily-transcription-activity-last-28-days',
        canvasId: 'daily-activity',
        chartType: 'bar',
        title: 'Daily Transcription Activity (Last 28 Days)',
        xLabel: 'Date',
        yLabel: 'Transcriptions + Reviews',
        buildDataset: buildDailyActivityDataset,
    });

    dailyActivityChart.render();
});


================================================
FILE: concordia/static/scss/_variables.scss
================================================
// global variables
//
// NOTE(review): this partial reads $gray-200/300/600/900, $white,
// $font-size-base and $line-height-lg, and calls map.get / color.adjust, but
// defines or loads none of them itself. Presumably the stylesheet that pulls
// this file in provides those variables and the sass:map / sass:color
// modules -- confirm before using this file on its own.
$blue: #00618e;
$blue-light: #beeaff;
$orange: #f05129;
$accent: $orange;
$default: $gray-300;
$primary: $blue;

// Theme colors by name; the 'primary' entry is read back below for links.
$theme-colors: (
    'accent': $orange,
    'default': $gray-300,
    'primary': $primary,
);

// Links use the 'primary' theme color; the hover color is the same color with
// its lightness adjusted by 15%.
$link-color: map.get($theme-colors, 'primary');
$link-hover-color: color.adjust($link-color, $lightness: 15%);

// <kbd> styling
$kbd-color: $gray-900;
$kbd-bg: $gray-200;

$headings-font-weight: 700;

// additional percentage sizes
$sizes: (
    60: 60%,
    65: 65%,
);

// typography (sizes are multiples of $font-size-base)
$concordia-app-font-size-xxs: $font-size-base * 0.75;
$concordia-app-font-size-xs: $font-size-base * 0.8125;
$concordia-app-font-size-xl: $font-size-base * 1.5;
$concordia-app-line-height-xs: 1.4;
$concordia-app-line-height-xxs: 1.3;

// toolbar
$concordia-app-toolbar-border: $gray-600;
$concordia-app-toolbar-background: $gray-300;
$concordia-app-active-color: $white;

// thumbnail
$concordia-app-asset-list-thumbnail-width: 140px;
$concordia-app-asset-list-thumbnail-gap: 10px;
$concordia-app-asset-list-text-padding: 8px;

// asset unavailable (padding reuses the asset list text padding)
$concordia-app-asset-unavailable-background: $blue-light;
$concordia-app-asset-unavailable-padding-x: $concordia-app-asset-list-text-padding;
$concordia-app-asset-unavailable-padding-y: $concordia-app-asset-list-text-padding;
$concordia-app-asset-unavailable-icon-width: 24px;

// footer
$concordia-app-footer-height: $line-height-lg * 1rem;


================================================
FILE: concordia/static/scss/base.scss
================================================
@use 'sass:math';

// Variables in this section are declared before Bootstrap's functions and
// variables are imported further down in this file.
// NOTE(review): presumably they act as overrides for Bootstrap's defaults of
// the same name -- confirm against the Bootstrap version in use.

// Gray scale. Only five distinct values are used: 300, 500 and 900 alias
// their neighbors 200, 400 and 800.
$gray-100: #f6f6f6;
$gray-200: #efefef;
$gray-300: $gray-200;
$gray-400: #bfbfbf;
$gray-500: $gray-400;
$gray-600: #808080;
$gray-700: #545454;
$gray-800: #242424;
$gray-900: $gray-800;

// Base palette
$blue: #0076ad;
$orange: #f05129;
$green: #218739;
$red: #d1332e;
$navy: #002347;
$white: #fff;

// Semantic aliases onto the palette above
$dark: $gray-900;
$accent: $orange;
$error: $red;
$light: $gray-100;
$secondary: $gray-700;

// Note that 'warning' maps to the dark gray $secondary, not to a yellow.
$theme-colors: (
    'accent': $orange,
    'error': $red,
    'info': $blue,
    'warning': $secondary,
);

// <mark> highlight background
$mark-bg: #caeea4;

// additional sizes
$sizes: (
    1: 1%,
    30: 30%,
    35: 35%,
    40: 40%,
    60: 60%,
    65: 65%,
);

// typography
$font-family-sans-serif: 'Open Sans', arial, helvetica, sans-serif;
$font-family-serif: 'Roboto Slab', arial, helvetica, serif;
$headings-font-weight: 700;

// Breadcrumbs
$breadcrumb-padding-y: 7px;
$breadcrumb-padding-x: 0;
$breadcrumb-item-padding: 0.25rem;
$breadcrumb-margin-bottom: 0;
$breadcrumb-bg: transparent;
$breadcrumb-active-color: $dark;

// carousel
$carousel-control-color: black;
$carousel-control-width: 8%;
$carousel-control-opacity: 1;
$carousel-indicator-width: 12px;
$carousel-indicator-height: 12px;
$carousel-control-icon-height: 3.5rem;
$carousel-control-icon-width: 3.5rem;

// dropdown
$dropdown-padding-y: 0.4rem;
$dropdown-item-padding-y: 3px;
$dropdown-item-padding-x: 1rem;
$dropdown-divider-margin-y: 5px;

// small font size
$small-font-size: 87.5%;

// inline list
$list-inline-padding: 12px;

// variables that are placed below dependent on bootstrap variables
@import '../../../node_modules/bootstrap/scss/functions';
@import '../../../node_modules/bootstrap/scss/variables';
@import '../../../node_modules/bootstrap/scss/mixins';
@import '../../../node_modules/bootstrap/scss/maps';
@import '../../../node_modules/bootstrap/scss/utilities';
@import '../../../node_modules/bootstrap/scss/utilities/api';

// The variables below are declared after Bootstrap's variables have been
// imported because several of them read values that this file does not define
// itself ($black, $font-weight-bold, $font-size-base).
// NOTE(review): presumably those come from Bootstrap's variables -- confirm.

// navbar
$navbar-toggler-font-size: 32px;
$navbar-toggler-padding-y: 0;
$navbar-toggler-padding-x: 0;
$navbar-light-color: $dark;
$navbar-light-active-color: $dark;
$navbar-light-disabled-color: rgba($black, 0.55);

// forms
$input-border-color: $gray-500;
$label-margin-bottom: 0.4rem;
$form-group-margin-bottom: 1.5rem;

// buttons
$btn-font-weight: $font-weight-bold;
$btn-border-radius: 0.375rem;

// headings (multiples of $font-size-base; h5 and h6 share the base size)
$h1-font-size: $font-size-base * 2.5;
$h2-font-size: $font-size-base * 1.75;
$h3-font-size: $font-size-base * 1.25;
$h4-font-size: $font-size-base * 1.125;
$h5-font-size: $font-size-base;
$h6-font-size: $font-size-base;

// border
$border-color: $gray-500;
$hr-border-color: $gray-500;

// alert
$alert-bg-level: 0;
$alert-border-level: 0;
$alert-color-level: -12;
$alert-padding-y: 9px;
$alert-padding-x: 1rem;

@import '../../../node_modules/bootstrap/scss/root';
@import '../../../node_modules/bootstrap/scss/reboot';
@import '../../../node_modules/bootstrap/scss/type';
@import '../../../node_modules/bootstrap/scss/containers';
@import '../../../node_modules/bootstrap/scss/grid';
@import '../../../node_modules/bootstrap/scss/forms';
@import '../../../node_modules/bootstrap/scss/buttons';
@import '../../../node_modules/bootstrap/scss/dropdown';
@import '../../../node_modules/bootstrap/scss/button-group';
@import '../../../node_modules/bootstrap/scss/nav';
@import '../../../node_modules/bootstrap/scss/navbar';
@import '../../../node_modules/bootstrap/scss/breadcrumb';
@import '../../../node_modules/bootstrap/scss/alert';
@import '../../../node_modules/bootstrap/scss/close';
@import '../../../node_modules/bootstrap/scss/carousel';

// progress
// Fill colors for the four transcription status classes (.bg-completed,
// .bg-submitted, .bg-in-progress, .bg-not-started) defined later in this file.
$bg-completed: $blue;
$bg-submitted: #e0f6ff;
// NOTE(review): the stylelint directive below precedes a plain variable
// reference with no function call, so it may no longer be needed -- confirm.
/* stylelint-disable-next-line scss/no-global-function-names */
$bg-in-progress: $navy;
$bg-not-started: #fff;

// shadow
/* stylelint-disable-next-line color-function-notation */
$shadow-color: rgba(51, 51, 51, 80%); /* #333333 */

// Page shell: white background, dark text, no horizontal scrolling.
html,
#contribute-main-content {
    background-color: $white;
    color: $dark;
    overflow-x: hidden;
}

// The body is a full-height flex column with an accent-colored top border;
// together with `main { flex: 1 1 0% }` below, main takes up the remaining
// vertical space.
body {
    color: $dark;
    border-top: 4px solid $accent;
    display: flex;
    flex-direction: column;
    min-height: 100vh;
}

// Same font stack as $font-family-sans-serif, written out literally.
#body {
    font-family: 'Open Sans', arial, helvetica, sans-serif;
}

main {
    flex: 1 1 0%;
}

// Default links: blue, not underlined, darker on hover.
body a {
    color: $blue;
    text-decoration: none;
}

body a:hover {
    color: #004261;
}

// NOTE(review): this declaration is repeated later in this file in the
// `p a, .simple-page a` rule.
.simple-page a {
    text-decoration: underline;
}

// Fixed 15px gutters: the padding here is matched by the -15px margins on
// div.row below.
body .container,
.col-md-2,
.col-md-3,
.row .col-12,
.row .col-lg,
.row .col-lg-auto {
    padding-left: 15px;
    padding-right: 15px;
}

div.row {
    margin-left: -15px;
    margin-right: -15px;
}

small {
    font-weight: 400;
}

// !important so the border color wins over other border-bottom declarations.
header.border-bottom {
    border-bottom: 1px solid $border-color !important;
}

.close {
    opacity: 1;
}

// Alerts: white text on a solid, variant-specific background. The light
// variant is the exception and uses dark text and links.
.alert {
    color: #fff;

    &.alert-danger {
        background-color: $red;
        color: #fff;

        .alert-link {
            color: #fff;
            font-weight: bolder;
        }
    }

    // Same values as $alert-padding-y / $alert-padding-x.
    &.alert-dismissible {
        padding: 9px 1rem;
    }

    &.alert-info {
        background-color: $blue;
        color: #fff;
    }

    // Links inside alerts are underlined and take the alert's white text color.
    .alert-link {
        color: #fff;
        text-decoration: underline;
    }

    &.alert-light {
        color: $dark;

        .alert-link {
            color: $dark;
        }
    }

    &.alert-success {
        background-color: $green;
    }

    // The warning variant uses dark gray ($gray-700).
    &.alert-warning {
        background-color: $gray-700;
    }
}

// Pressed (:active) state for buttons; the :not(.btn-check) selectors leave
// out buttons that directly follow a .btn-check element.
div .btn:first-child:active,
a:not(.btn-check) + .btn:active,
div :not(.btn-check) + .btn:active {
    background-color: #005c87;
    border-color: #005c87;
}

// Anchors with type='button' inside an alert inherit the alert's text color.
.alert a[type='button'] {
    color: inherit;
    font-size: 1.5rem;
}

// Typography: h1 uses the serif family; h2-h6 use the heading sizes and
// weight defined by the variables earlier in this file.
.font-serif {
    font-family: $font-family-serif;
}

body h1,
.h1 {
    font-family: $font-family-serif;
    font-weight: bold;
}

body h2 {
    font-size: $h2-font-size;
    font-weight: $headings-font-weight;
}

body .h3,
body h3 {
    font-size: $h3-font-size;
    font-weight: $headings-font-weight;
}

body h4 {
    font-size: $h4-font-size;
    font-weight: $headings-font-weight;
}

body h5 {
    font-size: $h5-font-size;
    font-weight: $headings-font-weight;
}

div h6 {
    font-weight: $headings-font-weight;
}

// Link underlining: links in list items are underlined only on hover, while
// links in paragraphs and .simple-page are underlined except on hover.
li a {
    text-decoration: none;
}

li a:hover {
    text-decoration: underline;
}

.text-dark {
    color: $gray-800;
}

p a,
.simple-page a {
    text-decoration: underline;
}

p a:hover,
.simple-page a:hover,
.btn:hover {
    text-decoration: none;
}

// Direct children of a row get no horizontal padding from this rule; the
// column selectors earlier in this file add 15px back for specific columns.
.row > * {
    padding-left: 0;
    padding-right: 0;
}

// Input groups: styles for the .input-group-prepend / .input-group-append
// wrappers. The -1px margins pull the add-on over the adjacent edge.
.input-group-prepend {
    margin-right: -1px;
}

.input-group-append {
    margin-left: -1px;
}

body .btn {
    font-weight: $btn-font-weight;
}

// Full-width button
.btn-block {
    width: 100%;
}

.input-group-sm > .input-group-prepend > .input-group-text {
    font-size: 0.875rem;
}

.input-group-prepend .input-group-text {
    color: $gray-700;
}

.input-group-sm > .input-group-append > .btn {
    font-size: 87.5%;
    padding: 0.25rem 0.5rem;
}

// Square off the left corners of a button appended to an input.
.input-group > .input-group-append > .btn {
    border-top-left-radius: 0;
    border-bottom-left-radius: 0;
}

// Small selects inside input groups
body .input-group-sm > .form-select {
    padding-right: 1.75rem;
}

body .input-group-sm > .form-select,
body .input-group > .form-select-sm {
    padding-top: 0.25rem;
    padding-bottom: 0.25rem;
    padding-left: 0.5rem;
    font-size: 0.875rem;
}

// Close button drawn as an inline SVG "x". The fill in the data URL is the
// URL-encoded #0076ad, the same value as $blue.
button.btn-close-blue {
    background: transparent
        url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' viewBox='0 0 16 16' fill='%230076ad'%3e%3cpath d='M.293.293a1 1 0 011.414 0L8 6.586 14.293.293a1 1 0 111.414 1.414L9.414 8l6.293 6.293a1 1 0 01-1.414 1.414L8 9.414l-6.293 6.293a1 1 0 01-1.414-1.414L6.586 8 .293 1.707a1 1 0 010-1.414z'/%3e%3c/svg%3e")
        center/1em auto no-repeat;
    opacity: 1;
}

// Button and nav link colors. $blue is the resting color throughout; two
// hard-coded darker blues are used for hover states (#004261 and #005c87).
body .btn-link,
li .nav-link {
    color: $blue;
}

body .btn-link:hover,
body .nav-link:hover {
    color: #004261;
}

body .btn-primary:hover {
    background-color: #004261;
}

body .btn:disabled,
body .btn-primary.disabled,
body .btn-primary {
    border-color: $blue;
}

body .btn-primary.disabled {
    background-color: $blue;
}

body .btn-primary:disabled,
body .btn-primary {
    background-color: $blue;
    color: #fff;
}

// Disabled outline buttons are shown faded (opacity 0.2) rather than filled.
body .btn-outline-primary:disabled {
    background-color: transparent;
    color: $blue;
    opacity: 0.2;
}

a.btn-info:hover {
    background-color: #005c87;
    border-color: #005c87;
    color: $white;
}

// NOTE(review): `body .btn-primary:hover` above sets #004261 for the same
// state; which rule applies to a <button> depends on the cascade -- confirm
// the intended hover color.
button.btn-primary:hover {
    background-color: #005c87;
}

// Variant fills: the warning variant uses dark gray ($gray-700).
.btn {
    &.btn-danger {
        background-color: $red;
        color: #fff;
    }

    &.btn-info {
        background-color: $blue;
        border-color: $blue;
        color: #fff;
    }

    &.btn-warning {
        background-color: $gray-700;
        border-color: $gray-700;
    }
}

a.btn-dark {
    color: #fff;
}

// Outline-dark links: dark text at rest, white text when active or hovered.
a.btn-outline-dark {
    color: $gray-800;

    .transcription-status-key-lg {
        border: 1px solid $white;
    }
}

a.btn-outline-dark.active {
    color: #fff;
}

a.btn-outline-dark:hover {
    color: #fff;
}

.btn-light {
    color: $gray-800;
}

// Checkboxes / radios: dark border, and labels of disabled inputs stay fully
// opaque.
body .form-check-input {
    border-color: $gray-800;
}

.form-check .form-check-input:disabled ~ .form-check-label,
.form-check-input[disabled] ~ .form-check-label {
    opacity: 1;
}

// Image viewer "invert" filter control
#invert-form div {
    margin-left: 10px;
    margin-right: 0;
}

#invert:checked {
    background-color: $blue;
    border-color: $blue;
}

.flex-1 {
    flex: 1;
}

// Campaign titles and hero links turn dark and underlined on hover.
a .campaign-title:hover,
.hero-text a:hover {
    color: $dark;
    text-decoration: underline;
}

p.hero-secondary {
    font-family: $font-family-sans-serif;
    font-size: 1.125rem;
    color: $dark;
}

// Same font family and size as p.hero-secondary above; only the color
// differs (white instead of $dark).
p.hero-secondary.offwhite-text {
    font-family: $font-family-sans-serif;
    font-size: 1.125rem;
    color: #fff;
}

// Force the "primary" text and background utilities to this file's $blue.
body .text-primary {
    color: $blue !important;
}

body .bg-primary {
    background-color: $blue !important;
}

.row .bg-completed {
    background-color: $bg-completed;
}

.row .bg-submitted {
    background-color: $bg-submitted;
    border: 1px solid $dark;
}

/* stylelint-disable-next-line selector-class-pattern */
.row .bg-in_progress,
.row .bg-in-progress {
    background-color: $bg-in-progress;
}

/* stylelint-disable-next-line selector-class-pattern */
.row .bg-not_started,
.row .bg-not-started {
    background-color: $bg-not-started;
    background-image: repeating-linear-gradient(
        45deg,
        #242424 0,
        #242424 1px,
        #fff 0,
        #fff 50%
    );
    background-size: 10px 10px;
    border: 1px solid $dark;
    opacity: 0.8;
}

.completed-bar {
    background-color: $navy;
    color: $white;
}

.completed-text {
    padding: 0.3em;
}

.retired-bar {
    background-color: $light;
    color: $blue;
    border: 2px solid $blue;
}

.retired-text {
    padding: 0.3em;
}

input {
    color: $dark;
    background-color: #fff;
}

hr {
    color: $secondary;
}

.row .campaign-thumbnail {
    flex: 0 0 auto;

    @include media-breakpoint-up(lg) {
        width: 16.6667%;
    }

    @include media-breakpoint-down(lg) {
        width: 25%;
    }

    @include media-breakpoint-down(md) {
        width: 33.3333%;
    }
}

.row .campaign-text {
    flex: 0 0 auto;

    @include media-breakpoint-up(lg) {
        width: 83.3333%;
    }

    @include media-breakpoint-down(lg) {
        width: 75%;
    }

    @include media-breakpoint-down(md) {
        width: 66.6667%;
    }
}

.navbar-brand {
    @include media-breakpoint-down(lg) {
        max-width: 350px;
    }

    @include media-breakpoint-down(sm) {
        max-width: 250px;
    }
}

ul.nav-secondary {
    margin: 0 -10px;

    .nav-link {
        padding: 0 10px;
    }

    li {
        line-height: 1;

        &:first-of-type {
            border-right: 1px solid $border-color;
        }
    }
}

.flex-initial {
    flex: initial !important;
}

#transcription-input-container {
    width: 99% !important;
}

/*
 * vertical and horizontal dividers
 */

.navbar-brand .vl {
    height: 6rem;
    background-color: $secondary;
    width: 0.0675rem;
}

.border-login-register {
    border-left: solid 0.0675rem $dark;
}

.border-left-home-contribute {
    border-left: solid 0.0675rem $gray-100;
}

.navbar-nav {
    margin-right: -0.5rem;

    @include media-breakpoint-down(lg) {
        margin: 0;
        padding: 0.5rem 1rem;
        background-color: $light;
    }
}

.navbar-nav .nav-link {
    text-align: left;
    padding-top: 5px;
    padding-bottom: 5px;

    @include media-breakpoint-up(lg) {
        padding-top: 0;
        padding-bottom: 0;
    }

    &.active {
        font-weight: bold;
    }
}

.navbar-light .navbar-nav .nav-link {
    color: $gray-800;
}

.navbar-light .navbar-nav #topnav-account-dropdown-toggle {
    color: $blue;
    cursor: pointer;
}

.logo-loc {
    border-right: 1px solid $border-color;
    margin: 0 15px 0 0 !important;
    padding-right: 15px;
}

.landing-divider {
    margin: 0.25em;
}

/* Forms */

.form-group-required label {
    font-weight: bold;
}

/* Cards */

$card-img-height: 14.8rem;
$card-btn-height: 31px;
$card-progress-height: 12px;

.card-header {
    min-height: 65px;
}

.card-body {
    padding: 1rem 0.5rem;
}

.card-img-campaign {
    object-position: center top;
    object-fit: cover;
    height: $card-img-height;
}

.card-img-overlay {
    left: 0;
    right: 0;
    bottom: 0;
    margin-bottom: 3.0675rem;
    padding: 0.5rem 1.25rem;
}

.card-img-overlay.img-campaign {
    padding: 0;
}

.card-title {
    margin-bottom: 0.5rem;
}

a.card-title {
    color: $blue;
}

a.card-title.text-dark {
    color: $gray-800;
}

.img-project {
    min-height: 13.125rem;
}

.round-corners-bottom {
    border-radius: 0 0 0.5rem 0.5rem;
}

.img-fluid.rounded-circle {
    max-height: 15rem;
    width: auto;
}

.shadow-regular {
    box-shadow: 0 0 0.25rem $shadow-color;
}

/*
 * Common navigational elements
 */

.breadcrumb-wrapper {
    font-size: 13px;
}

.breadcrumb-wrapper .breadcrumb {
    margin-bottom: 0;
    padding: 7px 0;
}

.breadcrumb-item {
    max-width: 20em;
    white-space: nowrap;
    text-overflow: ellipsis;
    overflow: hidden;
}

li.breadcrumb-item.active {
    color: $gray-800;
}

.breadcrumb .breadcrumb-item + .breadcrumb-item {
    padding-left: 0.25rem;
}

.breadcrumb .breadcrumb-item + .breadcrumb-item::before {
    padding-right: 0.25rem;
}

.section-link {
    text-decoration: underline;
    padding-top: 1em;
    padding-bottom: 0.25em;
}

.underline-link {
    text-decoration: underline;
}

.underline-link:hover {
    color: $blue;
}

/*
 * List-like displays for items and assets
 */

.concordia-object-card-row {
    margin: 0 -6px;
}

.row .concordia-object-card-container {
    width: 90%;
}

.concordia-object-card-container {
    display: flex;
    flex-wrap: wrap;
    padding-top: 0.25em;
}

.concordia-object-card-col {
    padding: 6px;

    @include media-breakpoint-up(lg) {
        flex: 0 0 25%;
        max-width: 25%;
    }
}

.concordia-object-card {
    background-color: $gray-100;
    overflow: hidden;
}

.concordia-object-card-title {
    padding: 12px 10px;
}

.concordia-object-card .card-title,
.concordia-object-card .card-actions {
    position: absolute;
    left: 0;
    right: 0;
}

.concordia-object-card[data-transcription-status='completed']:not(:hover)
    .card-img {
    opacity: 0.4;
}

.concordia-object-card .card-img {
    transition: 0.3s ease-in-out;
    border-bottom-right-radius: 0;
    border-bottom-left-radius: 0;
}

.concordia-object-card:hover .card-img,
.concordia-object-card:focus .card-img {
    transform: scale(1.05);
}

// Title strip of an object card. The combined `.card-title` / `.card-actions`
// rule earlier in this file positions both absolutely; this rule puts the
// title back into normal flow and sets its typography.
.concordia-object-card .card-title {
    bottom: 0;
    padding: 2px;
    margin-bottom: 0;
    font-weight: bold;
    font-size: 0.875rem;
    // Overrides the `position: absolute` from the combined rule above.
    position: static;
}

.concordia-object-card .card-actions {
    top: calc(
        #{$card-img-height} - #{$card-btn-height - $card-progress-height}
    );
    z-index: 3;

    /* stylelint-disable selector-class-pattern */
    .view-transcriptions--item-detail &,
    .view-transcriptions--filtered-item-detail & {
        top: 0;
    }
    /* stylelint-enable selector-class-pattern */
}

.concordia-object-card .card-actions .btn {
    height: $card-btn-height;
    border-radius: 0;
}

// Default action buttons that are not hovered: filled and bordered with the
// shadow color, with white text.
.concordia-object-card .card-actions .btn-default:not(:hover) {
    background-color: $shadow-color;
    border-color: $shadow-color;
    color: #fff;
}

.concordia-object-card .card-img-container {
    display: block;
    height: 100%;
    overflow: hidden;
    width: 100%;
}

.card.concordia-object-card .progress {
    height: $card-progress-height;
    border-radius: 0;
    position: relative;
    z-index: 2;
}

.progress {
    background-color: #e5f7ff;

    &::after {
        content: '';
        background-color: #fff;
        background-size: 10px 10px;
        flex: 1 1 0%;
        opacity: 0.8;
    }

    &.campaign-progress::after,
    &.w-100::after {
        background-image: repeating-linear-gradient(
            45deg,
            #242424 0,
            #242424 1px,
            #fff 0,
            #fff 50%
        );
        border: 1px solid $dark;
    }
}

body .campaign-page-progress {
    height: 2.5rem;
}

.campaign-page-progress .progress-bar:last-child {
    border-top-right-radius: 0.375rem;
    border-bottom-right-radius: 0.375rem;
}

div.campaign-progress {
    height: 35px;
    margin-top: 20px;
}

#campaign-list li h3 {
    margin-left: -3.5px;
}

.page-link:hover {
    text-decoration: none;
}

a.page-link {
    color: $blue;
}

body .disabled > .page-link {
    background-color: #fff;
}

.page-item.disabled .page-link {
    color: black;
}

.page-item.active .page-link {
    background-color: #fff;
    border-color: #efefef;
    color: $gray-800;
}

/*
 * Progress displays
 */

#progress-bar {
    height: 1rem;
    border-radius: 0;
}

.progress-bar-label {
    font-size: 14px;
    margin-top: 5px;
    margin-right: 5px;
}

.progress-bar-label span:nth-child(2) {
    margin-left: 5px;
}

#progress-stats {
    font-size: smaller;
}

#progress-stats th {
    font-size: inherit;
    font-weight: inherit;
}

.progress-bar-labels li {
    float: left;
}

.progress-bar-labels li + li::before {
    content: '|';
    padding: 0 0.5em;
}

.transcription-status-key-lg {
    display: inline-block;
    height: 1em;
    width: 1em;
    vertical-align: top;
    margin: 0.25rem !important;
}

.transcription-status-key {
    display: inline-block;
    height: 0.6em;
    width: 0.6em;
    vertical-align: baseline;
}

#transcription-status-message {
    max-width: 270px;
}

// Campaign small blocks

.small-campaign-title {
    min-height: 6ex;
}

.small-campaign-description {
    display: -webkit-box;
    overflow: hidden;
    -webkit-box-orient: vertical;
    -webkit-line-clamp: 4;
}

/*
 * Homepage customizations
 */

.play-pause-button {
    position: absolute;
    top: 5px;
    right: 20px;
    height: 40px;
    width: 40px;
    z-index: 2;

    i {
        color: $white;
    }
}

.carousel-item {
    img {
        background-color: $light;
    }
}

.carousel-overlay {
    padding: 10px 3rem 1rem;

    @include media-breakpoint-up(md) {
        padding: 25px;
        background-color: white;
        position: absolute;
        top: 50px;
        left: 100px;
        width: 420px;

        [data-overlay-position='top-right'] & {
            left: auto;
            right: 100px;
        }
    }

    @include media-breakpoint-down(md) {
        position: absolute;
        top: 19px;
    }

    .title {
        font-size: 2.25rem;
    }
}

// Carousel overrides: custom arrow artwork for the prev/next controls and
// round, outlined indicator buttons.
.carousel {
    .carousel-control-next-icon {
        background-image: url('/static/img/slick-right-arrow.svg');
    }

    .carousel-control-prev-icon {
        background-image: url('/static/img/slick-left-arrow.svg');
    }

    .carousel-control-next-icon,
    .carousel-control-prev-icon {
        height: $carousel-control-icon-height;
        width: $carousel-control-icon-width;
    }

    .carousel-indicators {
        // Plain declarations are kept ahead of the nested rule: Sass
        // deprecates declarations that follow nested rules ("mixed-decls").
        // The compiled CSS is the same as before.
        // 60% wide strip, centered via left: 50% and a -30% left margin.
        left: 50%;
        width: 60%;
        margin-left: -30%;
        text-align: center;

        > button {
            border-radius: 50%;
            border: 1px solid $blue;
            height: 12px;
            opacity: 1;
            width: 12px;

            &.active {
                background-color: $blue;
                border-color: $blue;
            }
        }
    }
}

#card-carousel .carousel-indicators > button {
    border: 1px solid $gray-800;
    border-radius: 100%;
    height: 14px;
    width: 14px;
}

#previous-guide,
#next-guide {
    cursor: pointer;
}

#campaign-options {
    margin-left: 1px;

    label {
        font-size: 14px;
    }

    select {
        background-color: $white;
        border-color: $blue;
        font-size: 14px;
        height: 2.155rem;
        padding: 0.3rem;
    }

    .btn {
        border-radius: 0;
        font-size: 14px;
        height: 2.155rem;
    }
}

// Fixed-aspect-ratio wrapper using the padding-top technique: zero height
// plus a percentage top padding (relative to the element's width) reserves
// the box; content is expected to be absolutely positioned inside it.
.aspect-ratio-box {
    height: 0;
    overflow: hidden;
    // 9 / 16 = 56.25%. Uses the module-scoped math.percentage() rather than
    // the deprecated global percentage() function.
    padding-top: math.percentage(math.div(9, 16));
    position: relative;

    @include media-breakpoint-up(sm) {
        // 240 / 320 = 75%
        padding-top: math.percentage(math.div(240, 320));
    }
}

.list-view li {
    padding-top: 24px;
}

.list-view .aspect-ratio-box {
    height: 150px;
    padding-top: 0;
    width: 150px;
}

.aspect-ratio-box-inner-wrapper {
    position: absolute;
    top: 0;
    left: 0;
    width: 100%;
    height: 100%;

    img {
        height: 100%;
        width: 100%;
        object-fit: cover;
    }
}

#banner-inner {
    margin-right: 0.75rem;
}

#no-interface-banner {
    margin-left: 0.75rem;
}

#homepage-contribute-activities {
    img {
        @include media-breakpoint-down(sm) {
            max-width: 100px;
        }
    }
}

#homepage-carousel {
    @include media-breakpoint-up(xl) {
        max-width: 1140px;
    }
}

#homepage-next-transcribable-links {
    position: relative;

    &::before {
        content: '';
        width: calc(100% - 2rem);
        position: absolute;
        border-top: 1px solid #000;

        @include media-breakpoint-up(md) {
            width: 725px;
            left: 50%;
            -webkit-transform: translateX(-50%);
            transform: translateX(-50%);
        }
    }
}

/*
 * Asset detail page
 *
 * This page wants to display as much as possible and so the entire page is a flex column
 */

#contribute-main-content {
    overflow: hidden;
    position: relative;
}

#contribute-main-content h2 {
    font-size: inherit;
}

#asset-navigation {
    margin: 0 -0.25rem;
    padding-top: 3px;
    padding-bottom: 3px;
}

#contribute-container {
    @include media-breakpoint-up(md) {
        height: calc(100vh - 53px);
    }
}

@include media-breakpoint-down(sm) {
    #contribute-container {
        flex-direction: column !important;
    }

    #asset-image {
        height: 50vh !important;
    }

    #transcription-editor textarea {
        height: 30vh;
    }

    .gutter.gutter-horizontal {
        display: none !important;
    }

    .gutter.gutter-vertical {
        display: none !important;
    }
}

#viewer-controls .btn-dark {
    &:hover,
    &:focus {
        border-color: $light;
    }
}

.gutter.gutter-horizontal {
    display: block;
    position: relative;
    cursor: ew-resize;
    background-color: $gray-400;
}

.gutter.gutter-horizontal::after {
    display: block;
    position: absolute;
    top: calc(50% - 40px);
    left: -4px;
    content: '';
    height: 40px;
    width: 16px;
    background: url('../img/handle.svg') no-repeat;
}

.gutter.gutter-vertical {
    display: block;
    position: relative;
    cursor: ns-resize;
    background-color: $gray-400;
    width: 100%;
}

.gutter.gutter-vertical::after {
    display: block;
    position: absolute;
    top: -4px;
    left: calc(50% - 60px);
    content: '';
    height: 16px;
    width: 60px;
    background: url('../img/handle-vertical.svg') no-repeat;
}

#transcription-editor textarea {
    resize: none;
}

a.btn-outline-primary,
button.btn-outline-primary {
    border-color: $blue;
    color: $blue;
}

a.btn-outline-primary:hover,
button.btn-outline-primary:hover {
    background-color: $blue;
    border-color: $blue;
}

.btn-outline-primary.disabled,
.btn-outline-primary:disabled {
    opacity: 0.2;
}

/* Help Center */

.help-center-card {
    color: #fff;
    height: 225px;
    background-color: $accent;
    margin-bottom: 1rem;
}

.help-center-card a {
    color: #fff;
}

.help-center .nav-link {
    padding: 0.5rem;
}

.help-center a.nav-link {
    color: #0076ad;
    font-weight: bold;
}

.help-center a.nav-link.active {
    color: #242424;
}

/*
 * Image filter controls
*/

#image-filters .btn-dark {
    color: $light;
    text-decoration: underline;
    border-radius: 0;

    &:hover,
    &:focus,
    &.active {
        color: $dark;
        background-color: $light;
        text-decoration: none;
        font-weight: 400;
        border-color: $light;
        outline: none;
        box-shadow: none;
    }
}

#filter-tabs {
    background-color: $light;
    height: 3em;

    & .custom-control-label::before {
        height: 1.5rem;
        width: 2.75rem;
        border-radius: 4rem;
    }

    & .custom-control-label::after {
        width: calc(1.5rem - 4px);
        height: calc(1.5rem - 4px);
        border-radius: 1.25rem;
    }

    & .custom-control-input:checked ~ .custom-control-label::after {
        transform: translateX(1.25rem);
    }

    & .custom-control-input ~ .custom-control-label::before {
        border-color: $dark !important;
    }

    & .custom-control-input ~ .custom-control-label::after {
        background-color: $white !important;
        border: solid 1px $dark !important;
        left: calc(-2.25rem + 4px);
    }

    & .custom-control-input:focus ~ .custom-control-label::before {
        border-color: $dark !important;
    }

    & .custom-control-input:checked ~ .custom-control-label::before {
        border-color: $dark !important;
        background-color: $dark !important;
    }

    & .custom-control-input:active ~ .custom-control-label::before {
        background-color: $dark !important;
        border-color: $dark !important;
    }

    &
        .custom-control-input:focus:not(:checked)
        ~ .custom-control-label::before {
        border-color: $dark !important;
    }
}

#viewer-reset {
    background-color: $primary;
    border-color: $primary;
    color: $white;
    border-radius: 0;

    &.btn {
        border-radius: $btn-border-radius;
    }
}

.filter-slider {
    appearance: none;
    border: solid 1px $dark;
    height: 0.5em;
    background: $white;
}

.filter-slider::-webkit-slider-thumb {
    -webkit-appearance: none;
    appearance: none;
    width: 1.1em;
    height: 1.5em;
    background: $primary;
    cursor: pointer;
    border-radius: 20%;
}

.filter-slider::-moz-range-thumb {
    appearance: none;
    width: 1.1em;
    height: 1.5em;
    background: $primary;
    cursor: pointer;
    border-radius: 20%;
}

// Numeric input with custom arrow buttons: the native spinner controls are
// hidden and the input is rendered as a plain text field inside a bordered box.
.number-input {
    border: solid 1px $primary;
    background-color: $white;

    & input[type='number'] {
        border: none;
        // Vendor-prefixed properties first so the standard property is the
        // last one declared.
        -webkit-appearance: textfield;
        -moz-appearance: textfield;
        appearance: textfield;
        height: 100%;
        width: 100%;
    }

    // Hide the native WebKit spinner buttons; the `.arrow-button` elements
    // styled below are used instead.
    & input[type='number']::-webkit-inner-spin-button,
    & input[type='number']::-webkit-outer-spin-button {
        -webkit-appearance: none;
        appearance: none;
    }

    & input[type='number']:focus {
        outline: none;
    }

    & .arrow-button {
        background-color: $primary;
        color: $white;
        font-size: 0.8em;
        width: 100%;
        border: none;
        padding: 0;
    }
}

.row > .filter-buttons {
    width: 1.8rem;
}

#ocr-transcription-link {
    pointer-events: auto;
}

#ocr-transcription-link.disabled {
    cursor: default;
}

#ocr-transcription-modal .modal-dialog {
    max-width: 419px;
}

#language-selection-modal .modal-header a,
#ocr-transcription-modal .modal-header a {
    cursor: pointer;
    font-size: 1.5rem;
}

#language-selection-modal {
    display: none;
    margin-left: 40px;
}

#language-selection-modal .modal-dialog {
    max-width: 428px;
}

#language-selection-modal .modal-footer {
    justify-content: center;
}

/*
 * Tag input on the asset detail page
 */
#tag-label {
    [data-toggle='collapse'][aria-expanded='true'] .fas::before {
        content: '\f146';
    }

    [data-toggle='collapse'].collapsed .fas::before {
        content: '\f0fe';
    }
}

#current-tags {
    margin: 5px -2px 0;

    > li {
        margin: 2px;

        > button {
            color: inherit;
            font-size: inherit;
            padding: 0;
            margin: 0 0 0 5px;
            float: none;
            line-height: inherit;
            opacity: 1;
            text-shadow: none;
        }
    }
}

/*
 * Tutorial popup and cards navigation
 */
#tutorial-popup .modal-header {
    padding-bottom: 0.25rem;
}

#tutorial-popup .modal-body {
    padding-top: 0.25rem;
}

#close-tutorial a {
    position: absolute;
    right: 1rem;
    top: 0.375rem;
    color: $blue;
    cursor: pointer;
    font-size: 1.5rem;
    font-weight: 700;
}

#card-carousel .carousel-item img {
    background-color: #fff;
    border-top: 1px solid #efefef;
    padding-bottom: 1rem;
}

#card-carousel .carousel-item h5 {
    margin-bottom: 0;
}

#card-carousel .carousel-item p {
    margin-bottom: 0.75rem;
}

#card-carousel ul {
    padding-left: 1.5rem;
}

#card-carousel .carousel-indicators .active {
    background-color: $blue;
    border-color: $blue;
}

#previous-card {
    position: absolute;
    bottom: 10px;
    left: 0;
}

#next-card {
    position: absolute;
    bottom: 10px;
    right: 0;
}

/* How to Guide */
@media (width >= 965px) {
    #instruction-buttons {
        justify-content: flex-end;
    }
}

#open-guide {
    border-radius: $btn-border-radius;
    margin: 0 5px 0 9px;
    max-width: 137px;
    white-space: nowrap;
}

#close-guide {
    position: absolute;
    right: -8px;
    color: #fff;
    cursor: pointer;
    font-size: 0.875rem;
    height: 30.5px;
    margin: 0 1rem -1rem auto;
}

.sidebar {
    max-height: calc(100vh - 107px);
    width: 450px;
    position: absolute; /* Stay in place */
    z-index: 1; /* Stay on top */
    right: 0;
    overflow: hidden auto; /* Disable horizontal scrolling */
    transition: 0.3s;
    background-color: $white;
}

.sidebar.offscreen {
    transform: translateX(100%);
}

.sidebar h3 {
    padding-top: 0.5rem;
}

.sidebar li {
    border-bottom: thin solid $gray-400;
}

.sidebar .nav-item a {
    font-size: $font-size-base * 1.25;
    text-decoration: underline;
}

.guide-body {
    max-height: calc(100vh - 249px);
    overflow-x: hidden;
}

div.row.guide-header {
    justify-content: center;
    margin-right: -4px;
    margin-bottom: 1rem;
    padding-bottom: 0.25rem;
    padding-top: 0.25rem;
}

.guide-body h3 {
    font-size: 1rem;
    font-weight: bold;
}

#title-bar {
    font-weight: 700;
}

.toc-title {
    font-weight: 600;
}

#guide-bars {
    color: #fff;
    padding-top: 0.25rem;
}

.sidebar .close {
    font-size: $font-size-base * 0.875;
}

#guide-carousel .container {
    padding-right: 0;
}

/*
 * Campaign Helpful Links Panel
 */

div.related-links {
    background-color: #ddd;
    border: #000 1px solid;
}

.list-inline .list-inline-item:not(:last-child) {
    margin-right: $list-inline-padding;
}

.related-links .list-group-item {
    background-color: #ddd;
    border: 0;
    padding-left: unset;
}

/*
* Footer
*/

.footer {
    background-color: $gray-100;
    margin-top: 1.5rem;

    .footer-links {
        border-top: 1px solid $border-color;
        border-bottom: 1px solid $border-color;
        padding-top: 1rem;
        padding-bottom: 1rem;
        margin-top: 1rem;
        margin-bottom: 1rem;

        @include media-breakpoint-up(lg) {
            border-top: none;
            border-bottom: none;
            border-left: 1px solid $border-color;
            border-right: 1px solid $border-color;
            padding-top: 0;
            padding-bottom: 0;
            margin-top: 0;
            margin-bottom: 0;

            > ul > li {
                display: block;
            }
        }
    }

    .intersites-link-congress a {
        display: block;
        width: 121px;
        height: 24px;
        background: url('../img/congress-gov.svg') no-repeat;
        background-size: 121px 24px;
    }

    .intersites-link-copyright a {
        display: block;
        width: 176px;
        height: 24px;
        background: url('../img/copyright-gov.svg') no-repeat;
        background-size: 176px 24px;
    }
}

.bitmap-icon {
    display: inline-block;
    width: 24px;
    height: 24px;
    vertical-align: text-top;
    background-image: url('../img/social-icons-sprite.png');
    background-position: -200px 0;
    background-repeat: no-repeat;

    &.github-icon {
        background-position: 0 0;
    }

    &.twitter-icon {
        background-position: -40px 0;
    }

    &.email-icon {
        background-position: -80px 0;
    }

    &.facebook-icon {
        background-position: -40px -36px;
    }

    &.copy-link-icon {
        background-position: -80px -36px;
    }
}

/* Registration page */
#registration-form-container > .col-md-6 {
    max-width: 30rem;
}

/* This is here to fix
    https://github.com/LibraryOfCongress/concordia/issues/1127
    until https://github.com/twbs/bootstrap/issues/29439 is fixed */

#registration-form-container .invalid-feedback {
    display: block;
}

/* Profile page */
.contribution-highlight {
    background-color: #f6f6f6;
    border: 1px solid black;
    flex: 1;
    margin: 0.5rem;
    padding-bottom: 10px;
    padding-top: 10px;
    text-align: center;
}

.contribution-highlight .value {
    color: $blue;
    font-size: xxx-large;
    font-weight: bold;
}

.contribution-highlight .label {
    font-size: large;
    font-weight: bold;
    margin-bottom: 0;
}

.contribution-table a {
    text-decoration: underline;
}

.recent-page a {
    text-decoration: underline;
}

.all-campaigns {
    text-decoration: underline;
}

/* stylelint-disable-next-line selector-class-pattern */
input.duet-date__input {
    border-radius: 0;
}

table.table thead.border-y {
    th,
    td {
        border-bottom: 1px solid #000;
        border-top: 1px solid #000;
    }
}

#current-filters {
    margin-bottom: 0.75rem;
    padding: 0.375rem 0;
}

#current-filters ul {
    padding-left: 0.5rem;
}

#current-filters .btn {
    border-color: $blue;
    color: $blue;
}

#current-filters li {
    background-color: $white;
}

#current-filters label {
    padding-left: 5px;
    padding-top: 1px;
}

.btn-xs {
    font-size: 12px;
    padding: 0 0.12rem;
}

.btn-xs .btn {
    font-size: 14px;
    padding: 0 0.12rem;
}

.btn-group-sm > .btn {
    border-radius: $btn-border-radius;
}

#contact-us {
    border-top-left-radius: $btn-border-radius;
    border-bottom-left-radius: $btn-border-radius;
}

#current-filters li .btn {
    border: none;
    padding-right: 4px;
}

/* stylelint-disable-next-line selector-id-pattern */
#nav-tabContent .dropdown-menu a:hover {
    background-color: $navy;
    color: $light;
}

.dropdown-menu .dropdown-item:active {
    background-color: $blue;
}

.change-options {
    background-color: $gray-200;
}

.tab-pane th {
    cursor: pointer;
}

.tab-pane th.date-header {
    cursor: default;
}

.user-fields {
    margin-bottom: ($spacer * 1.5) !important;
    max-width: 450px;
}

#validation-confirmation {
    font-size: 87.5%;
}

/* print */
@media print {
    @page {
        margin: 0.75in;
    }

    body {
        border-style: none;
        background-color: transparent;
        font-size: 14pt;
    }

    header .navbar {
        padding: 0;
        background-color: transparent;
    }

    #navigation-container {
        border-style: none;
        padding: 0;
    }

    #contribute-container {
        border-style: none;
    }

    .print-transcription-image {
        page-break-before: always;
    }

    #contribute-container .gutter-horizontal {
        display: none;
    }

    #contribute-container .gutter-vertical {
        display: none;
    }

    #contribute-container #editor-column .tx-status-display {
        font-size: 24px;
        margin: 2rem 0;
    }

    #contribute-container #editor-column .print-transcription-text {
        display: block !important;
        white-space: pre-wrap;
        color: #000;
    }

    #current-tags {
        max-height: none;
    }

    #current-tags li {
        background-color: transparent;
        color: #000;
        display: inline-block;
    }
}

/* Profile page */
.view-user-profile .nav-tabs,
.view-email-reconfirmation .nav-tabs {
    border-bottom: 1px solid #000;
}

.view-user-profile .nav-tabs .nav-link.active,
.view-user-profile .nav-tabs .nav-item.show .nav-link,
.view-email-reconfirmation .nav-tabs .nav-link.active,
.view-email-reconfirmation .nav-tabs .nav-item.show .nav-link {
    border-color: #000 #000 #fff;
}

/* Accessibility */
.visually-hidden {
    position: absolute !important;
    width: 1px !important;
    height: 1px !important;
    padding: 0 !important;
    margin: -1px !important;
    overflow: hidden !important;
    clip: rect(0, 0, 0, 0) !important;
    white-space: nowrap !important;
    border: 0 !important;
}

/* Error pages */
figure.error-figure {
    img {
        max-width: 75%;
    }

    figcaption {
        padding-top: 5px;
        font-size: 12px;
    }
}

/*
 * About page
 */

#blog-carousel .carousel-control-prev {
    top: 2rem;
    left: 9rem;
    opacity: 1;
}

#blog-carousel .carousel-control-next {
    top: 2rem;
    right: 7rem;
    opacity: 1;
}

// Blog carousel arrows are drawn by masking a solid $blue box with the arrow
// SVG (the mask image is set per direction in the `.prev` / `.next` rules).
#blog-carousel .carousel-control-icon {
    background-color: $blue;
    -webkit-mask-repeat: no-repeat;
    mask-repeat: no-repeat;
    // Prefixed twin added so engines that only honour -webkit-mask-* size the
    // mask the same way as engines using the standard property.
    -webkit-mask-size: 25% 50%;
    mask-size: 25% 50%;
    height: 3.5rem;
    width: 3.5rem;
}

#blog-carousel .carousel-control-icon.prev {
    -webkit-mask-image: url('/static/img/slick-left-arrow.svg');
    mask-image: url('/static/img/slick-left-arrow.svg');
}

#blog-carousel .carousel-control-icon.next {
    -webkit-mask-image: url('/static/img/slick-right-arrow.svg');
    mask-image: url('/static/img/slick-right-arrow.svg');
}

.blog-chunk {
    width: 684px;
}

.blog-chunk a {
    text-decoration: none;
}

.blog-chunk h5 {
    min-height: 115.2px;
}

#blog-carousel .card {
    border-width: 0;
}

.about-accordion {
    background-color: $gray-100;
    padding-top: 12px;
    padding-left: 28px;
    padding-bottom: 8px;
    margin-top: 5px;
    margin-bottom: 5px;
}

.accordion-icon {
    color: $blue;
    font-style: normal;
}

.icon-plus-square::before {
    content: '\f0fe';
}

.icon-minus-square::before {
    content: '\f146';
}

.blog-content,
.press-content,
.publications-content,
.program-history {
    display: none;
}

// Full-width wrapper for visualization sections.
// The previous `display: flex-basis` declaration was removed: `flex-basis` is
// not a valid value for `display`, so browsers discarded it and the element
// has always rendered with its default display type.
.visualization-container {
    width: 100%;
}

.visualization-container section {
    width: 100%;
}

.visualization-data-link {
    display: block;
    margin-top: 0.25rem;
    font-size: 0.5rem;
}


================================================
FILE: concordia/static/vendor/jquery.cookie.js
================================================
/*!
 * jQuery Cookie Plugin v1.4.1
 * https://github.com/carhartl/jquery-cookie
 *
 * Copyright 2013 Klaus Hartl
 * Released under the MIT license
 */
// Local modifications to the vendored v1.4.1 source:
//   * $.isFunction (deprecated in jQuery 3.3, removed in jQuery 4.0) is
//     replaced by a private typeof-based helper.
//   * Cookies whose *name* is not valid percent-encoding are skipped when
//     reading instead of letting decodeURIComponent throw a URIError.
(function (factory) {
	if (typeof define === 'function' && define.amd) {
		// AMD
		define(['jquery'], factory);
	} else if (typeof exports === 'object') {
		// CommonJS
		factory(require('jquery'));
	} else {
		// Browser globals
		factory(jQuery);
	}
}(function ($) {

	var pluses = /\+/g;

	// Stand-in for the removed $.isFunction.
	function isFunction(value) {
		return typeof value === 'function';
	}

	// URI-encode a cookie name/value unless config.raw is set.
	function encode(s) {
		return config.raw ? s : encodeURIComponent(s);
	}

	// URI-decode a cookie name unless config.raw is set.
	// May throw URIError on malformed input; callers handle that.
	function decode(s) {
		return config.raw ? s : decodeURIComponent(s);
	}

	// Serialize a value for writing: JSON when config.json is set, otherwise String().
	function stringifyCookieValue(value) {
		return encode(config.json ? JSON.stringify(value) : String(value));
	}

	// Decode a stored cookie value. Returns undefined when the value cannot
	// be decoded or (with config.json) parsed.
	function parseCookieValue(s) {
		if (s.indexOf('"') === 0) {
			// This is a quoted cookie as according to RFC2068, unescape...
			s = s.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, '\\');
		}

		try {
			// Replace server-side written pluses with spaces.
			// If we can't decode the cookie, ignore it, it's unusable.
			// If we can't parse the cookie, ignore it, it's unusable.
			s = decodeURIComponent(s.replace(pluses, ' '));
			return config.json ? JSON.parse(s) : s;
		} catch(e) {}
	}

	// Read one raw cookie value and optionally pass it through a converter function.
	function read(s, converter) {
		var value = config.raw ? s : parseCookieValue(s);
		return isFunction(converter) ? converter(value) : value;
	}

	// $.cookie(key, value, options) writes a cookie and returns the cookie string.
	// $.cookie(key[, converter]) returns that cookie's value, or undefined.
	// $.cookie() returns an object of all readable cookies.
	var config = $.cookie = function (key, value, options) {

		// Write

		if (value !== undefined && !isFunction(value)) {
			options = $.extend({}, config.defaults, options);

			if (typeof options.expires === 'number') {
				// A numeric `expires` is a number of days from now (864e+5 ms per day).
				var days = options.expires, t = options.expires = new Date();
				t.setTime(+t + days * 864e+5);
			}

			return (document.cookie = [
				encode(key), '=', stringifyCookieValue(value),
				options.expires ? '; expires=' + options.expires.toUTCString() : '', // use expires attribute, max-age is not supported by IE
				options.path    ? '; path=' + options.path : '',
				options.domain  ? '; domain=' + options.domain : '',
				options.secure  ? '; secure' : ''
			].join(''));
		}

		// Read

		var result = key ? undefined : {};

		// To prevent the for loop in the first place assign an empty array
		// in case there are no cookies at all. Also prevents odd result when
		// calling $.cookie().
		var cookies = document.cookie ? document.cookie.split('; ') : [];

		for (var i = 0, l = cookies.length; i < l; i++) {
			var parts = cookies[i].split('=');
			var name;

			try {
				name = decode(parts.shift());
			} catch (e) {
				// The name is not valid percent-encoding, so it cannot be
				// one this plugin wrote. Skip it rather than abort every read.
				continue;
			}

			// Re-join so values that themselves contain '=' stay intact.
			var cookie = parts.join('=');

			if (key && key === name) {
				// If second argument (value) is a function it's a converter...
				result = read(cookie, value);
				break;
			}

			// Prevent storing a cookie that we couldn't decode.
			if (!key && (cookie = read(cookie)) !== undefined) {
				result[name] = cookie;
			}
		}

		return result;
	};

	config.defaults = {};

	// Remove a cookie by rewriting it with an expiry in the past.
	// Returns false when the cookie did not exist, otherwise whether it is gone afterwards.
	$.removeCookie = function (key, options) {
		if ($.cookie(key) === undefined) {
			return false;
		}

		// Must not alter options, thus extending a fresh object...
		$.cookie(key, '', $.extend({}, options, { expires: -1 }));
		return !$.cookie(key);
	};

}));


================================================
FILE: concordia/storage.py
================================================
from django.core.files.storage import storages
from django.utils.functional import LazyObject


class LazyAssetStorage(LazyObject):
    """
    Lazy proxy for the storage registered under the ``"assets"`` alias.

    The lookup in Django's ``storages`` handler happens in ``_setup`` rather
    than at import time.
    """

    def _setup(self):
        # Resolve the configured backend and make it the proxied object.
        self._wrapped = storages["assets"]


class LazyVisualizationStorage(LazyObject):
    """
    Lazy proxy for the storage registered under the ``"visualizations"`` alias.

    The lookup in Django's ``storages`` handler happens in ``_setup`` rather
    than at import time.
    """

    def _setup(self):
        # Resolve the configured backend and make it the proxied object.
        self._wrapped = storages["visualizations"]


# These module-level names are intentional aliases: code imports them instead
# of looking up a storage directly, so the backing storage can be changed in
# one place if storage ever needs to be split across multiple buckets.
# They are LazyObject instances so the storage is not resolved when this module
# is loaded, which is what allows tests to override the storage settings.

ASSET_STORAGE = LazyAssetStorage()

VISUALIZATION_STORAGE = LazyVisualizationStorage()


================================================
FILE: concordia/storage_backends.py
================================================
from storages.backends.s3boto3 import S3Boto3Storage


class OverwriteS3Boto3Storage(S3Boto3Storage):
    """
    S3 storage backend that never renames files to avoid name collisions.

    ``get_available_name`` returns the requested name unchanged, so saving to
    an existing name targets that same name instead of a generated alternative.
    """

    def get_available_name(self, name, max_length=None):
        # ``max_length`` is accepted for interface compatibility but not used.
        return name  # Forces overwriting by always returning the given name


================================================
FILE: concordia/tasks/__init__.py
================================================


================================================
FILE: concordia/tasks/assets.py
================================================
import os.path
from logging import getLogger
from tempfile import NamedTemporaryFile

import requests
from more_itertools.more import chunked

from concordia.logging import ConcordiaLogger
from concordia.models import Asset
from concordia.storage import ASSET_STORAGE

from ..celery import app as celery_app

# Module-level loggers, both named after this module: a standard-library
# logger and one obtained from the project's ConcordiaLogger.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task
def calculate_difficulty_values(asset_qs=None):
    """
    Recompute asset difficulty scores and persist the ones that changed.

    The score for an asset is its transcription count multiplied by the sum
    of its transcriber and reviewer counts. Assets are streamed in batches of
    500 and only rows whose score differs from the stored value are written.

    Args:
        asset_qs: Optional queryset of Asset instances to process. When it is
            None, Asset.objects.published() is used.

    Returns:
        int: How many Asset rows had their difficulty field updated.
    """

    queryset = Asset.objects.published() if asset_qs is None else asset_qs
    queryset = queryset.add_contribution_counts()

    total_updated = 0

    # Stream the rows with iterator() so processed assets are not kept in
    # memory, and collect per batch only the assets whose score changed so
    # they can be written with a single bulk_update() call.
    for batch in chunked(queryset.iterator(), 500):
        pending = []

        for asset in batch:
            contributor_count = asset.transcriber_count + asset.reviewer_count
            new_difficulty = asset.transcription_count * contributor_count
            if new_difficulty == asset.difficulty:
                continue
            asset.difficulty = new_difficulty
            pending.append(asset)

        if not pending:
            continue

        # Only the difficulty column is written, both for performance and so
        # that stale values of other fields can never be saved by this task.
        Asset.objects.bulk_update(pending, ["difficulty"])
        total_updated += len(pending)

    return total_updated


def _year_from_item_metadata(metadata):
    """
    Return the year key found in an item's ``metadata["item"]["dates"]``.

    ``dates`` is expected to be a list of single-key mappings. The first key
    of the last non-empty mapping is returned. ``None`` is returned when the
    metadata is missing, is not shaped as expected, or contains no dates.
    """
    try:
        dates = metadata["item"]["dates"]
    except (KeyError, TypeError):
        # No metadata at all, or no item/dates section in it.
        return None

    year = None
    for date_outer in dates or ():
        if not isinstance(date_outer, dict):
            continue
        # We don't support multiple values: only the first key is used, and
        # an empty mapping leaves the previously found year untouched.
        year = next(iter(date_outer), year)
    return year


@celery_app.task
def populate_asset_years():
    """
    Populate the Asset.year field using dates from related Item metadata.

    This Celery task streams assets in 500-row chunks, inspects each asset's
    Item.metadata["item"]["dates"] structure, and assigns the final year key
    encountered to the Asset.year field. Items whose metadata is missing or
    has no dates yield a year of None instead of aborting the whole run. Only
    assets whose year value changes are persisted with bulk_update().

    Returns:
        int: The number of Asset records whose year field was updated.
    """

    asset_qs = Asset.objects.prefetch_related("item")

    updated_count = 0

    # iterator() keeps the queryset from caching every Asset row in memory;
    # passing chunk_size is what allows prefetch_related() to keep working.
    for asset_chunk in chunked(asset_qs.iterator(chunk_size=500), 500):
        changed_assets = []

        for asset in asset_chunk:
            year = _year_from_item_metadata(asset.item.metadata)

            if asset.year != year:
                asset.year = year
                changed_assets.append(asset)

        if changed_assets:
            Asset.objects.bulk_update(changed_assets, ["year"])
            updated_count += len(changed_assets)

    return updated_count


@celery_app.task(ignore_result=True)
def fix_storage_images(campaign_slug=None, asset_start_id=None):
    """
    Ensure that each Asset has a backing file in the asset storage backend.

    For each matching asset, this Celery task checks whether the file referenced
    by Asset.storage_image exists in that field's storage. If it is missing, the
    task downloads the image from Asset.download_url and saves it into
    ASSET_STORAGE using the campaign/project/item/sequence-based filename.

    Args:
        campaign_slug: Optional campaign slug used to restrict the assets that
            are checked. If omitted, all assets are examined.
        asset_start_id: Optional numeric Asset primary key. If provided, only
            assets with id >= this value are processed.

    Raises:
        requests.RequestException: Propagated if the remote download fails.
        Exception: Any other exception encountered during download or save is
            logged and re-raised.
    """

    if campaign_slug:
        from concordia.models import Campaign

        campaign = Campaign.objects.get(slug=campaign_slug)
        asset_queryset = Asset.objects.filter(item__project__campaign=campaign)
    else:
        asset_queryset = Asset.objects.all()

    if asset_start_id:
        asset_queryset = asset_queryset.filter(id__gte=asset_start_id)

    count = 0
    full_count = asset_queryset.count()
    logger.debug("Checking storage image on %s assets", full_count)
    for asset in asset_queryset.order_by("id"):
        count += 1
        if asset.storage_image and not asset.storage_image.storage.exists(
            asset.storage_image.name
        ):
            logger.info("Storage image does not exist for %s (%s)", asset, asset.id)
            item = asset.item
            download_url = asset.download_url
            asset_filename = os.path.join(
                item.project.campaign.slug,
                item.project.slug,
                item.item_id,
                "%d.jpg" % asset.sequence,
            )
            try:
                with NamedTemporaryFile(mode="x+b") as temp_file:
                    resp = requests.get(download_url, stream=True, timeout=30)
                    try:
                        resp.raise_for_status()

                        for chunk in resp.iter_content(chunk_size=256 * 1024):
                            temp_file.write(chunk)
                    finally:
                        # A streamed response holds its connection until the
                        # body is fully read or the response is closed, so
                        # close it explicitly even when the download fails.
                        resp.close()

                    # Flush buffered writes and rewind the tempfile back to
                    # the first byte so the storage backend reads the whole
                    # file.
                    temp_file.flush()
                    temp_file.seek(0)

                    ASSET_STORAGE.save(asset_filename, temp_file)

            except Exception:
                logger.exception(
                    "Unable to download %s to %s", download_url, asset_filename
                )
                raise
            logger.info("Storage image downloaded for  %s (%s)", asset, asset.id)
        logger.debug("Storage image checked for %s (%s)", asset, asset.id)
        # full_count was taken before iteration started; guard against it being
        # zero if rows were added in between.
        percent = count / full_count * 100 if full_count else 100.0
        logger.debug("%s / %s (%s%%)", count, full_count, str(percent))


================================================
FILE: concordia/tasks/blog.py
================================================
from logging import getLogger

from concordia.logging import ConcordiaLogger
from concordia.parser import extract_og_image, fetch_blog_posts

from ..celery import app as celery_app

# Module-level loggers, both named after this module: a standard-library
# logger and one obtained from the project's ConcordiaLogger.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(bind=True, ignore_result=True)
def fetch_and_cache_blog_images(self):
    """
    Warm the Open Graph image cache for the current blog posts.

    Every entry yielded by ``fetch_blog_posts()`` is searched for a ``link``
    child element. Entries without one are skipped; for the others the
    element's text is handed to ``extract_og_image()``.
    """
    for post in fetch_blog_posts():
        link_element = post.find("link")
        if link_element is None:
            continue
        extract_og_image(link_element.text)


================================================
FILE: concordia/tasks/housekeeping.py
================================================
from logging import getLogger

from django.core.management import call_command

from concordia.logging import ConcordiaLogger

from ..celery import app as celery_app

# Module-level loggers, both named after this module: a standard-library
# logger and one obtained from the project's ConcordiaLogger.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(ignore_result=True)
def clear_sessions():
    """
    Clear expired Django session records.

    This Celery task runs Django's ``clearsessions`` management command to
    remove expired rows from the session store. It is typically invoked on a
    schedule to prevent the session table from growing without bounds.

    The task takes no arguments and its result is not stored
    (``ignore_result=True``).
    """
    # Delegate to the management command rather than touching the session
    # store directly.
    call_command("clearsessions")


================================================
FILE: concordia/tasks/next_asset/__init__.py
================================================


================================================
FILE: concordia/tasks/next_asset/renew.py
================================================
from logging import getLogger

from concordia.decorators import locked_task
from concordia.logging import ConcordiaLogger
from concordia.models import Campaign, Topic

from ...celery import app as celery_app
from .reviewable import (
    clean_next_reviewable_for_campaign,
    clean_next_reviewable_for_topic,
)
from .transcribable import (
    clean_next_transcribable_for_campaign,
    clean_next_transcribable_for_topic,
)

# Module-level loggers, both named after this module: a standard-library
# logger and one obtained from the project's ConcordiaLogger.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def renew_next_asset_cache(self):
    """
    Queue next-asset cache cleaning for every active campaign and published topic.

    For each campaign returned by ``Campaign.objects.active()`` and each topic
    returned by ``Topic.objects.published()``, the transcribable cleaning task
    is queued first and the reviewable cleaning task second. The cleaning
    tasks themselves take care of removing invalid cache entries and
    repopulating the cache.
    """

    active_campaigns = Campaign.objects.active()
    for campaign in active_campaigns:
        logger.info("Spawning clean_next_transcribable_for_campaign for %s", campaign)
        clean_next_transcribable_for_campaign.delay(campaign_id=campaign.id)

        logger.info("Spawning clean_next_reviewable_for_campaign for %s", campaign)
        clean_next_reviewable_for_campaign.delay(campaign_id=campaign.id)

    published_topics = Topic.objects.published()
    for topic in published_topics:
        logger.info("Spawning clean_next_transcribable_for_topic for %s", topic)
        clean_next_transcribable_for_topic.delay(topic_id=topic.id)

        logger.info("Spawning clean_next_reviewable_for_topic for %s", topic)
        clean_next_reviewable_for_topic.delay(topic_id=topic.id)


================================================
FILE: concordia/tasks/next_asset/reviewable.py
================================================
from itertools import chain
from logging import getLogger

from concordia.decorators import locked_task
from concordia.logging import ConcordiaLogger
from concordia.models import (
    Campaign,
    NextReviewableCampaignAsset,
    NextReviewableTopicAsset,
    Topic,
)
from concordia.utils import get_anonymous_user
from concordia.utils.next_asset import (
    find_invalid_next_reviewable_campaign_assets,
    find_invalid_next_reviewable_topic_assets,
    find_new_reviewable_campaign_assets,
    find_new_reviewable_topic_assets,
)

from ...celery import app as celery_app

# Module-level loggers, both named after this module: a standard-library
# logger and one obtained from the project's ConcordiaLogger.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def populate_next_reviewable_for_campaign(self, campaign_id):
    """
    Populate the next reviewable cache for a campaign.

    This task checks how many reviewable assets are still needed for the
    campaign, finds eligible assets and inserts them into the
    NextReviewableCampaignAsset table up to the target count.

    The task prefers assets whose transcribers are not already represented in
    the cache to avoid review bottlenecks.

    Only a single instance of this task runs at a time for a given campaign,
    using the cache locking system to avoid duplication. This can be
    overridden with the ``force`` keyword argument, which is stripped by the
    decorator and not passed to the task itself. See the ``locked_task``
    documentation for details.

    Args:
        campaign_id: Primary key of the campaign to process.
    """
    try:
        campaign = Campaign.objects.get(id=campaign_id)
    except Campaign.DoesNotExist:
        logger.error("Campaign %s not found", campaign_id)
        return
    anonymous_user = get_anonymous_user()
    excluded_user_ids = (
        NextReviewableCampaignAsset.objects.filter(campaign=campaign)
        .exclude(transcriber_ids__contains=[anonymous_user.id])
        .values_list("transcriber_ids", flat=True)
        .distinct()
    )
    # Flatten the list and deduplicate
    excluded_user_ids = set(chain.from_iterable(excluded_user_ids))

    needed_asset_count = NextReviewableCampaignAsset.objects.needed_for_campaign(
        campaign_id
    )
    if not needed_asset_count:
        logger.info(
            "Campaign %s already has %s next reviewable assets",
            campaign,
            NextReviewableCampaignAsset.objects.target_count,
        )
        return

    # "sequence" is listed because it is read for every asset below; leaving
    # it deferred would cost one extra query per asset.
    assets_qs = find_new_reviewable_campaign_assets(campaign).only(
        "id",
        "item_id",
        "item__project_id",
        "item__project__slug",
        "campaign_id",
        "sequence",
        "transcription__user",
    )
    # We prefer to not use transcribers that already exist, to avoid
    # the situation where all possible reviewable assets have the same
    # transcriber (since that would mean that user would miss the cache
    # table when they try to review).
    # If that's impossible, we just take whatever assets we can; that means
    # only these transcribers have reviewable assets in the campaign
    excluded_assets_qs = assets_qs.exclude(
        transcription__user_id__in=excluded_user_ids
    )
    if excluded_assets_qs.exists():
        assets_qs = excluded_assets_qs
    assets = assets_qs[:needed_asset_count]

    if assets:
        objs = NextReviewableCampaignAsset.objects.bulk_create(
            [
                NextReviewableCampaignAsset(
                    asset_id=asset.id,
                    item_id=asset.item_id,
                    item_item_id=asset.item.item_id,
                    project_id=asset.item.project_id,
                    project_slug=asset.item.project.slug,
                    campaign_id=asset.campaign_id,
                    # The anonymous user is never recorded as a transcriber.
                    transcriber_ids=list(
                        asset.transcription_set.exclude(user=anonymous_user)
                        .values_list("user_id", flat=True)
                        .distinct()
                    ),
                    sequence=asset.sequence,
                )
                for asset in assets
            ]
        )
        logger.info(
            "Added %d next reviewable assets for campaign %s", len(objs), campaign
        )
    else:
        logger.info("No reviewable assets found in campaign %s", campaign)

@celery_app.task(bind=True, ignore_result=True)
@locked_task
def populate_next_reviewable_for_topic(self, topic_id):
    """
    Populate the next reviewable cache for a topic.

    This task checks how many reviewable assets are still needed for the topic,
    finds eligible assets and inserts them into the NextReviewableTopicAsset
    table up to the target count.

    The task prefers assets whose transcribers are not already represented in
    the cache to avoid review bottlenecks.

    Only a single instance of this task runs at a time for a given topic,
    using the cache locking system to avoid duplication. This can be
    overridden with the ``force`` keyword argument, which is stripped by the
    decorator and not passed to the task itself. See the ``locked_task``
    documentation for details.

    Args:
        topic_id: Primary key of the topic to process.
    """
    try:
        topic = Topic.objects.get(id=topic_id)
    except Topic.DoesNotExist:
        logger.error("Topic %s not found", topic_id)
        return
    anonymous_user = get_anonymous_user()
    excluded_user_ids = (
        NextReviewableTopicAsset.objects.filter(topic=topic)
        .exclude(transcriber_ids__contains=[anonymous_user.id])
        .values_list("transcriber_ids", flat=True)
        .distinct()
    )
    # Flatten the list and deduplicate
    excluded_user_ids = set(chain.from_iterable(excluded_user_ids))

    needed_asset_count = NextReviewableTopicAsset.objects.needed_for_topic(topic_id)
    if not needed_asset_count:
        logger.info(
            "Topic %s already has %s next reviewable assets",
            topic,
            NextReviewableTopicAsset.objects.target_count,
        )
        return

    # "sequence" is listed because it is read for every asset below; leaving
    # it deferred would cost one extra query per asset.
    assets_qs = find_new_reviewable_topic_assets(topic).only(
        "id",
        "item_id",
        "item__project_id",
        "item__project__slug",
        "sequence",
        "transcription__user",
    )
    # We prefer to not use transcribers that already exist, to avoid
    # the situation where all possible reviewable assets have the same
    # transcriber (since that would mean that user would miss the cache
    # table when they try to review).
    # If that's impossible, we just take whatever assets we can; that means
    # only these transcribers have reviewable assets in the topic
    excluded_assets_qs = assets_qs.exclude(
        transcription__user_id__in=excluded_user_ids
    )
    if excluded_assets_qs.exists():
        assets_qs = excluded_assets_qs
    assets = assets_qs[:needed_asset_count]

    if assets:
        objs = NextReviewableTopicAsset.objects.bulk_create(
            [
                NextReviewableTopicAsset(
                    asset_id=asset.id,
                    item_id=asset.item_id,
                    item_item_id=asset.item.item_id,
                    project_id=asset.item.project_id,
                    project_slug=asset.item.project.slug,
                    topic_id=topic.id,
                    # The anonymous user is never recorded as a transcriber.
                    transcriber_ids=list(
                        asset.transcription_set.exclude(user=anonymous_user)
                        .values_list("user_id", flat=True)
                        .distinct()
                    ),
                    sequence=asset.sequence,
                )
                for asset in assets
            ]
        )
        logger.info("Added %d next reviewable assets for topic %s", len(objs), topic)
    else:
        logger.info("No reviewable assets found in topic %s", topic)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def clean_next_reviewable_for_campaign(self, campaign_id):
    """
    Clean cached reviewable assets for a campaign then repopulate the cache.

    Invalid entries are those whose assets no longer have transcription status
    ``SUBMITTED`` and are no longer eligible for review. After cleaning, the
    corresponding populate task is queued to restore the cache to the target
    count.

    A failure to delete one entry is logged and does not stop the remaining
    entries from being processed.

    Args:
        campaign_id: Primary key of the campaign to clean.
    """

    for next_asset in find_invalid_next_reviewable_campaign_assets(campaign_id):
        try:
            next_asset.delete()
        except Exception:
            logger.exception("Error deleting cached asset %s", next_asset.id)
    logger.info(
        "Spawning populate_next_reviewable_for_campaign for campaign %s",
        campaign_id,
    )
    populate_next_reviewable_for_campaign.delay(campaign_id)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def clean_next_reviewable_for_topic(self, topic_id):
    """
    Drop invalid next-reviewable cache entries for a topic and queue a refill.

    The entries to remove are whatever
    ``find_invalid_next_reviewable_topic_assets`` returns for the topic
    (entries whose assets are no longer ``SUBMITTED`` and so no longer
    eligible for review). A failed deletion is logged and skipped. The
    populate task is then queued so the cache is brought back to its target
    count.

    Args:
        topic_id: Primary key of the topic to clean.
    """

    stale_entries = find_invalid_next_reviewable_topic_assets(topic_id)
    for stale_entry in stale_entries:
        try:
            stale_entry.delete()
        except Exception:
            logger.exception("Error deleting cached asset %s", stale_entry.id)

    logger.info("Spawning populate_next_reviewable_for_topic for topic %s", topic_id)
    populate_next_reviewable_for_topic.delay(topic_id)


================================================
FILE: concordia/tasks/next_asset/transcribable.py
================================================
from logging import getLogger

from concordia.decorators import locked_task
from concordia.logging import ConcordiaLogger
from concordia.models import (
    Campaign,
    NextTranscribableCampaignAsset,
    NextTranscribableTopicAsset,
    Topic,
)
from concordia.utils.next_asset import (
    find_invalid_next_transcribable_campaign_assets,
    find_invalid_next_transcribable_topic_assets,
    find_new_transcribable_campaign_assets,
    find_new_transcribable_topic_assets,
)

from ...celery import app as celery_app

# Module-level loggers, both named after this module: a standard-library
# logger and one obtained from the project's ConcordiaLogger.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def populate_next_transcribable_for_campaign(self, campaign_id):
    """
    Populate the cache of next transcribable assets for a campaign.

    This task checks how many transcribable assets are still needed for the
    campaign, finds eligible assets and inserts them into the
    NextTranscribableCampaignAsset table up to the target count.

    Only a single instance of the task runs at a time for a particular
    campaign_id by using the cache locking system to avoid duplication. This
    can be overridden with the `force` kwarg, which is stripped out by the
    decorator and not passed to the task itself. See the `locked_task`
    documentation for more information.

    Args:
        campaign_id: Primary key of the campaign to process.
    """
    try:
        campaign = Campaign.objects.get(id=campaign_id)
    except Campaign.DoesNotExist:
        logger.error("Campaign %s not found", campaign_id)
        return

    needed_asset_count = NextTranscribableCampaignAsset.objects.needed_for_campaign(
        campaign_id
    )
    if not needed_asset_count:
        logger.info(
            "Campaign %s already has %s next transcribable assets",
            campaign,
            NextTranscribableCampaignAsset.objects.target_count,
        )
        return

    # "sequence" is listed because it is read for every asset below; leaving
    # it deferred would cost one extra query per asset.
    assets_qs = find_new_transcribable_campaign_assets(campaign).only(
        "id",
        "item_id",
        "item__project_id",
        "item__project__slug",
        "campaign_id",
        "sequence",
        "transcription_status",
    )
    assets = assets_qs[:needed_asset_count]

    if assets:
        objs = NextTranscribableCampaignAsset.objects.bulk_create(
            [
                NextTranscribableCampaignAsset(
                    asset_id=asset.id,
                    item_id=asset.item_id,
                    item_item_id=asset.item.item_id,
                    project_id=asset.item.project_id,
                    project_slug=asset.item.project.slug,
                    campaign_id=asset.campaign_id,
                    transcription_status=asset.transcription_status,
                    sequence=asset.sequence,
                )
                for asset in assets
            ]
        )
        logger.info(
            "Added %d next transcribable assets for campaign %s", len(objs), campaign
        )
    else:
        logger.info("No transcribable assets found in campaign %s", campaign)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def populate_next_transcribable_for_topic(self, topic_id):
    """
    Populate the cache of next transcribable assets for a topic.

    This task checks how many transcribable assets are still needed for the
    topic, finds eligible assets and inserts them into the
    NextTranscribableTopicAsset table up to the target count.

    Only a single instance of the task runs at a time for a particular topic_id
    by using the cache locking system to avoid duplication. This can be
    overridden with the `force` kwarg, which is stripped out by the decorator
    and not passed to the task itself. See the `locked_task` documentation for
    more information.

    Args:
        topic_id: Primary key of the topic to process.
    """
    try:
        topic = Topic.objects.get(id=topic_id)
    except Topic.DoesNotExist:
        logger.error("Topic %s not found", topic_id)
        return

    needed_asset_count = NextTranscribableTopicAsset.objects.needed_for_topic(topic_id)
    if not needed_asset_count:
        logger.info(
            "Topic %s already has %s next transcribable assets",
            topic,
            NextTranscribableTopicAsset.objects.target_count,
        )
        return

    # "sequence" is listed because it is read for every asset below; leaving
    # it deferred would cost one extra query per asset.
    assets_qs = find_new_transcribable_topic_assets(topic).only(
        "id",
        "item_id",
        "item__project_id",
        "item__project__slug",
        "sequence",
        "transcription_status",
    )
    assets = assets_qs[:needed_asset_count]

    if assets:
        objs = NextTranscribableTopicAsset.objects.bulk_create(
            [
                NextTranscribableTopicAsset(
                    asset_id=asset.id,
                    item_id=asset.item_id,
                    item_item_id=asset.item.item_id,
                    project_id=asset.item.project_id,
                    project_slug=asset.item.project.slug,
                    topic_id=topic.id,
                    transcription_status=asset.transcription_status,
                    sequence=asset.sequence,
                )
                for asset in assets
            ]
        )
        logger.info("Added %d next transcribable assets for topic %s", len(objs), topic)
    else:
        logger.info("No transcribable assets found in topic %s", topic)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def clean_next_transcribable_for_campaign(self, campaign_id):
    """
    Remove invalid cached transcribable assets for a campaign then repopulate
    the cache.

    Invalid assets include those that are reserved or no longer eligible for
    transcription based on their transcription status. After cleaning, the
    corresponding populate task is queued to restore the cache to the target
    count.

    A failure to delete one entry is logged and does not stop the remaining
    entries from being processed.

    Args:
        campaign_id: Primary key of the campaign to clean.
    """

    for next_asset in find_invalid_next_transcribable_campaign_assets(campaign_id):
        try:
            next_asset.delete()
        except Exception:
            logger.exception("Error deleting cached asset %s", next_asset.id)
    logger.info(
        "Spawning populate_next_transcribable_for_campaign for campaign %s",
        campaign_id,
    )
    populate_next_transcribable_for_campaign.delay(campaign_id)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def clean_next_transcribable_for_topic(self, topic_id):
    """
    Drop invalid next-transcribable cache entries for a topic and queue a
    refill.

    The entries to remove are whatever
    ``find_invalid_next_transcribable_topic_assets`` returns for the topic
    (assets that are reserved or no longer eligible for transcription based
    on their transcription status). A failed deletion is logged and skipped.
    The populate task is then queued so the cache is brought back to its
    target count.

    Args:
        topic_id: Primary key of the topic to clean.
    """

    stale_entries = find_invalid_next_transcribable_topic_assets(topic_id)
    for stale_entry in stale_entries:
        try:
            stale_entry.delete()
        except Exception:
            logger.exception("Error deleting cached asset %s", stale_entry.id)

    logger.info("Spawning populate_next_transcribable_for_topic for topic %s", topic_id)
    populate_next_transcribable_for_topic.delay(topic_id)


================================================
FILE: concordia/tasks/reports/__init__.py
================================================


================================================
FILE: concordia/tasks/reports/backfill.py
================================================
import datetime
import time
from logging import getLogger
from typing import Iterable, Optional

from django.db.models import Sum

from concordia.decorators import locked_task
from concordia.logging import ConcordiaLogger
from concordia.models import SiteReport

from ...celery import app as celery_app

# Heartbeat / streaming tuning
# NOTE(review): the code that reads these values is outside this excerpt. The
# names suggest a progress heartbeat emitted every N rows or every N seconds,
# and the chunk size used when streaming rows -- confirm against their usage.
HEARTBEAT_EVERY_ROWS = 1000
HEARTBEAT_EVERY_SECONDS = 10.0
ITERATOR_CHUNK_SIZE = 2000

# Matching window (in hours) for associating campaign reports with a site-wide
# TOTAL snapshot. Reports in a single daily run are created within minutes of
# one another, but we use a wider band to make backfill resilient.
TOTAL_ROLLUP_WINDOW_HOURS = 6

# Module-level loggers, both named after this module: a standard-library
# logger and one obtained from the project's ConcordiaLogger.
logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(bind=True, ignore_result=True)
@locked_task(lock_by_args=False)
def backfill_assets_started_for_site_reports(self, skip_existing: bool = True) -> int:
    """
    Backfill the ``assets_started`` field for existing site-report series.

    This one-off task computes and persists ``assets_started`` values for all
    relevant ``SiteReport`` rows. It should be removed after it has been run in
    production and the backfill is no longer needed.

    Series processed (in this order, so that per-campaign values exist before
    the site-wide TOTAL rollup reads them):

    * Per-campaign (``campaign`` is not null)
    * Per-topic (``topic`` is not null)
    * Site-wide TOTAL (``report_name=TOTAL``)
    * Site-wide RETIRED_TOTAL (``report_name=RETIRED_TOTAL``)

    Rules:

    * The first snapshot in each series assumes ``assets_started = 0``. This
      represents the launch of the site or the time before the first report
      when no earlier data is available.
    * Per-campaign and per-topic values are derived from ``assets_total`` and
      ``assets_not_started``; publish/unpublish changes alone do not affect
      ``assets_started`` as long as the total and not-started counts remain
      consistent.
    * The site-wide TOTAL series is backfilled by rolling up per-campaign
      ``assets_started`` values from the same daily reporting run. This avoids
      undercounting caused by retirements changing site-wide totals between
      snapshots.
    * For rollup series whose membership can change over time (for example,
      ``RETIRED_TOTAL``), the delta-based ``assets_started`` calculation is not
      meaningful. We backfill a consistent zero value.
    * All results are floored at 0, since negative values indicate data
      removal and should not be treated as negative activity.

    Resumability:

    * By default, rows that already have a non-null ``assets_started`` value
      are skipped (``skip_existing=True``), so the task can be re-run to
      resume where it left off. In this mode, only series that still contain
      at least one snapshot with ``assets_started`` set to ``NULL`` are
      processed, and no value is computed for rows that are skipped.
    * To recompute all rows, for example after changing the formula, call the
      task with ``skip_existing=False``. In this mode, any series that has at
      least one snapshot is processed, even if all snapshots already have
      non-null ``assets_started`` values.

    Args:
        skip_existing: If true, skip rows where ``assets_started`` is already
            populated.

    Returns:
        The number of ``SiteReport`` rows updated across all series.
    """
    task_id = getattr(self.request, "id", None)
    structured_logger.info(
        "Starting backfill for assets_started across all series.",
        event_code="assets_started_backfill_start",
        skip_existing=skip_existing,
        task_id=task_id,
    )

    updated_count = 0

    def process_series_queryset(
        qs: Iterable[SiteReport],
        *,
        series_label: str,
        force_zero_assets_started: bool = False,
        rollup_total_from_campaigns: bool = False,
    ) -> int:
        """
        Process a single series in chronological order and backfill values.

        This helper walks one site-report series and computes
        ``assets_started`` for each row that needs it. It saves updated rows
        and logs progress, including periodic heartbeat messages for
        monitoring long-running scans.

        For rollup series whose membership can change over time (for example,
        ``RETIRED_TOTAL``), the delta-based ``assets_started`` calculation is
        not meaningful. In those cases, callers should set
        ``force_zero_assets_started=True`` to backfill a consistent zero value.

        For the site-wide TOTAL series, callers should set
        ``rollup_total_from_campaigns=True`` to derive values by summing
        per-campaign ``assets_started`` from the same daily reporting run.

        Args:
            qs: Queryset of ``SiteReport`` objects ordered by ``created_on``
                and primary key. It must be a queryset (not an arbitrary
                iterable) because it is streamed with ``.iterator()``.
            series_label: Short label for logging, such as ``"TOTAL"`` or
                ``"CAMPAIGN:<id>"``.
            force_zero_assets_started: If True, set ``assets_started`` to 0 for
                every row in the series instead of computing deltas between
                snapshots.
            rollup_total_from_campaigns: If True, compute ``assets_started`` for
                each row by rolling up per-campaign values within a time window
                around the row's ``created_on``.

        Returns:
            The number of rows in the series that were updated.
        """
        changed = 0
        scanned = 0
        previous: Optional[SiteReport] = None

        series_start_t = time.monotonic()
        last_hb_t = series_start_t
        last_hb_rows = 0

        structured_logger.info(
            "Starting series scan.",
            event_code="assets_started_backfill_series_start",
            series=series_label,
        )

        window = datetime.timedelta(hours=TOTAL_ROLLUP_WINDOW_HOURS)

        def compute_assets_started(
            current: SiteReport, previous: Optional[SiteReport]
        ) -> int:
            """Return the ``assets_started`` value ``current`` should hold."""
            if force_zero_assets_started:
                return 0
            if rollup_total_from_campaigns:
                # Sum every per-campaign value created within +/- window of
                # this snapshot; an empty match aggregates to NULL -> 0.
                agg = SiteReport.objects.filter(
                    campaign__isnull=False,
                    created_on__gte=current.created_on - window,
                    created_on__lte=current.created_on + window,
                ).aggregate(total=Sum("assets_started"))
                return int(agg["total"] or 0)
            if previous is None:
                # First snapshot of the series: nothing to diff against.
                return 0
            return SiteReport.calculate_assets_started(
                previous_assets_total=previous.assets_total,
                previous_assets_not_started=previous.assets_not_started,
                current_assets_total=current.assets_total,
                current_assets_not_started=current.assets_not_started,
            )

        for current in qs.iterator(chunk_size=ITERATOR_CHUNK_SIZE):
            scanned += 1

            # Resume behavior: optionally skip already-populated rows. The
            # check comes first so no value (and, in rollup mode, no aggregate
            # query) is computed for rows that will not be written.
            already_populated = skip_existing and current.assets_started is not None
            if not already_populated:
                calculated = compute_assets_started(current, previous)
                if current.assets_started != calculated:
                    current.assets_started = calculated
                    current.save(update_fields=["assets_started"])
                    changed += 1

                    structured_logger.info(
                        "Backfilled assets_started for SiteReport.",
                        event_code="assets_started_backfill_row",
                        site_report_id=current.id,
                        created_on=current.created_on.isoformat(),
                        series=series_label,
                        assets_started=calculated,
                        previous_site_report_id=(previous.id if previous else None),
                        campaign_id=current.campaign_id,
                        topic_id=current.topic_id,
                    )

            # Skipped rows still become the baseline for the next delta.
            previous = current

            # Heartbeat: emitted for skipped and processed rows alike.
            now_t = time.monotonic()
            if (
                scanned - last_hb_rows >= HEARTBEAT_EVERY_ROWS
                or (now_t - last_hb_t) >= HEARTBEAT_EVERY_SECONDS
            ):
                structured_logger.info(
                    "Scanning series...",
                    event_code="assets_started_backfill_series_heartbeat",
                    series=series_label,
                    scanned_rows=scanned,
                    updated_rows=changed,
                    last_seen_site_report_id=current.id,
                )
                last_hb_rows = scanned
                last_hb_t = now_t

        structured_logger.info(
            "Finished series scan.",
            event_code="assets_started_backfill_series_done",
            series=series_label,
            scanned_rows=scanned,
            updated_rows=changed,
            elapsed_seconds=round(time.monotonic() - series_start_t, 3),
        )
        return changed

    # Per-campaign (includes retired campaigns; their historical reports remain)
    campaign_base_qs = SiteReport.objects.filter(campaign__isnull=False)
    if skip_existing:
        campaign_ids_source = campaign_base_qs.filter(assets_started__isnull=True)
    else:
        campaign_ids_source = campaign_base_qs

    # order_by() clears any default model ordering so DISTINCT is applied to
    # campaign_id alone; ordering columns would otherwise join the SELECT and
    # the same id could be yielded (and its series rescanned) repeatedly.
    campaign_ids = (
        campaign_ids_source.order_by().values_list("campaign_id", flat=True).distinct()
    )
    for campaign_id in campaign_ids.iterator():
        campaign_series = campaign_base_qs.filter(campaign_id=campaign_id).order_by(
            "created_on", "pk"
        )
        updated_count += process_series_queryset(
            campaign_series, series_label=f"CAMPAIGN:{campaign_id}"
        )

    # Per-topic
    topic_base_qs = SiteReport.objects.filter(topic__isnull=False)
    if skip_existing:
        topic_ids_source = topic_base_qs.filter(assets_started__isnull=True)
    else:
        topic_ids_source = topic_base_qs

    # Same ordering reset as for campaigns, for the same reason.
    topic_ids = (
        topic_ids_source.order_by().values_list("topic_id", flat=True).distinct()
    )
    for topic_id in topic_ids.iterator():
        topic_series = topic_base_qs.filter(topic_id=topic_id).order_by(
            "created_on", "pk"
        )
        updated_count += process_series_queryset(
            topic_series, series_label=f"TOPIC:{topic_id}"
        )

    # Site-wide TOTAL (roll up per-campaign assets_started). This runs after
    # the per-campaign pass so the values being summed are already populated.
    total_base_qs = SiteReport.objects.filter(
        report_name=SiteReport.ReportName.TOTAL,
        campaign__isnull=True,
        topic__isnull=True,
    )
    total_exists_qs = total_base_qs
    if skip_existing:
        total_exists_qs = total_exists_qs.filter(assets_started__isnull=True)

    if total_exists_qs.exists():
        total_qs = total_base_qs.order_by("created_on", "pk")
        updated_count += process_series_queryset(
            total_qs,
            series_label="TOTAL",
            rollup_total_from_campaigns=True,
        )

    # Site-wide RETIRED_TOTAL
    retired_base_qs = SiteReport.objects.filter(
        report_name=SiteReport.ReportName.RETIRED_TOTAL
    )
    retired_exists_qs = retired_base_qs
    if skip_existing:
        retired_exists_qs = retired_exists_qs.filter(assets_started__isnull=True)

    if retired_exists_qs.exists():
        retired_total_qs = retired_base_qs.order_by("created_on", "pk")
        updated_count += process_series_queryset(
            retired_total_qs,
            series_label="RETIRED_TOTAL",
            force_zero_assets_started=True,
        )

    structured_logger.info(
        "Completed backfill for assets_started.",
        event_code="assets_started_backfill_complete",
        updated_rows=updated_count,
        task_id=task_id,
    )
    return updated_count


================================================
FILE: concordia/tasks/reports/key_metrics.py
================================================
import datetime
from logging import getLogger

from django.db.models import Max
from django.utils import timezone

from concordia.decorators import locked_task
from concordia.logging import ConcordiaLogger
from concordia.models import KeyMetricsReport, SiteReport

from ...celery import app as celery_app

# Standard-library logger for this module.
logger = getLogger(__name__)
# Structured logger; calls pass ``event_code`` plus keyword context fields.
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(bind=True, ignore_result=True)
@locked_task(lock_by_args=False)
def build_key_metrics_reports(self, recompute_all: bool = False) -> int:
    """
    Build or refresh KeyMetricsReport rows (monthly, quarterly and fiscal year).

    The task operates in two modes, controlled by ``recompute_all``:

    - If ``recompute_all`` is True:
        - Recompute every monthly period that can be derived from
          SiteReport data.
        - Recompute all quarters that have at least one monthly row.
        - Recompute all fiscal years that have at least one quarterly
          row.
    - If ``recompute_all`` is False (incremental mode):
        - Create any missing monthly rows.
        - Refresh a monthly row if any SiteReport in that month has
          ``created_on`` later than the row's ``updated_on`` value.
        - Create any missing quarter rows that have at least one
          monthly row.
        - Refresh a quarter row if any of its monthly inputs have
          ``updated_on`` later than the quarter's ``updated_on`` value.
        - Create any missing fiscal year rows that have at least one
          quarter row.
        - Refresh a fiscal year row if any of its quarterly inputs have
          ``updated_on`` later than the fiscal year's ``updated_on``
          value.

    If there are no SiteReport rows at all, or no month in range has a
    snapshot, nothing is built and 0 is returned.

    Args:
        recompute_all: If True, recompute all monthly, quarterly and
            fiscal-year rows from scratch based on SiteReport data. If
            False, only create missing rows and refresh rows that are
            stale.

    Returns:
        int: Count of KeyMetricsReport rows created or updated.
    """
    task_id = getattr(self.request, "id", None)
    structured_logger.info(
        "Starting KeyMetricsReport build.",
        event_code="key_metrics_build_start",
        task_id=task_id,
        recompute_all=recompute_all,
    )

    rows_changed = 0

    def step_back_one_month(month_start: datetime.date) -> datetime.date:
        """Return the first day of the month preceding ``month_start``."""
        if month_start.month == 1:
            return month_start.replace(year=month_start.year - 1, month=12, day=1)
        return month_start.replace(month=month_start.month - 1, day=1)

    def step_forward_one_month(month_start: datetime.date) -> datetime.date:
        """Return the first day of the month following ``month_start``."""
        if month_start.month == 12:
            return month_start.replace(year=month_start.year + 1, month=1, day=1)
        return month_start.replace(month=month_start.month + 1, day=1)

    def has_any_snapshot_by_end_of_month(month_start: datetime.date) -> bool:
        """Return True if any SiteReport exists on or before the month's end."""
        _, end_of_month = KeyMetricsReport.month_bounds(month_start)
        return SiteReport.objects.filter(created_on__date__lte=end_of_month).exists()

    # Determine month range we can evaluate
    earliest_site_report = SiteReport.objects.order_by("created_on", "pk").first()
    if earliest_site_report is None:
        # No SiteReport rows exist yet (e.g. a fresh deployment); .first()
        # returns None and there is nothing to derive periods from.
        structured_logger.info(
            "No computable monthly periods found.",
            event_code="key_metrics_build_no_months",
            task_id=task_id,
        )
        return 0

    # NOTE(review): .date() uses the datetime's own tzinfo, while the upper
    # bound below uses the local date -- confirm this asymmetry is intended.
    earliest_date = earliest_site_report.created_on.date()
    first_month_start = earliest_date.replace(day=1)

    # Use local date for boundary logic
    today_local = timezone.localdate()
    # Evaluate up to the month containing "yesterday"
    # so we never rely on future EOM snapshots
    yesterday_local = today_local - datetime.timedelta(days=1)
    _, latest_evaluated_end_of_month = KeyMetricsReport.month_bounds(yesterday_local)

    last_month_start = latest_evaluated_end_of_month.replace(day=1)
    # Step back if the very latest month has no SiteReport by its EOM
    while (
        last_month_start >= first_month_start
        and not has_any_snapshot_by_end_of_month(last_month_start)
    ):
        last_month_start = step_back_one_month(last_month_start)

    if last_month_start < first_month_start:
        structured_logger.info(
            "No computable monthly periods found.",
            event_code="key_metrics_build_no_months",
            task_id=task_id,
        )
        return 0

    # Monthly

    current_month_start = first_month_start
    while current_month_start <= last_month_start:
        year = current_month_start.year
        month = current_month_start.month
        _, current_month_end = KeyMetricsReport.month_bounds(current_month_start)

        # Decide whether this month must be (re)built. ``log_entry`` holds the
        # (message, event_code) to log on success, or None to leave it alone.
        log_entry = None
        if recompute_all:
            log_entry = (
                "Upserted monthly KeyMetricsReport.",
                "key_metrics_month_upserted",
            )
        else:
            # Incremental mode: create missing, or refresh if stale
            existing_monthly_report = KeyMetricsReport.objects.filter(
                period_type=KeyMetricsReport.PeriodType.MONTHLY,
                fiscal_year=KeyMetricsReport.get_fiscal_year_for_date(
                    current_month_start
                ),
                month=month,
            ).first()

            if existing_monthly_report is None:
                log_entry = (
                    "Created missing monthly KeyMetricsReport.",
                    "key_metrics_month_created",
                )
            else:
                # Refresh if any SiteReport within this month (TOTAL
                # or RETIRED_TOTAL, site-wide) has been created after
                # the monthly report was last updated.
                site_report_newer_exists = SiteReport.objects.filter(
                    report_name__in=(
                        SiteReport.ReportName.TOTAL,
                        SiteReport.ReportName.RETIRED_TOTAL,
                    ),
                    campaign__isnull=True,
                    topic__isnull=True,
                    created_on__date__gte=current_month_start,
                    created_on__date__lte=current_month_end,
                    created_on__gt=existing_monthly_report.updated_on,
                ).exists()
                if site_report_newer_exists:
                    log_entry = (
                        "Refreshed monthly KeyMetricsReport "
                        "due to newer SiteReports.",
                        "key_metrics_month_refreshed",
                    )

        if log_entry is not None:
            report = KeyMetricsReport.upsert_month(year=year, month=month)
            # Only a non-None result is counted and logged.
            if report is not None:
                rows_changed += 1
                message, event_code = log_entry
                structured_logger.info(
                    message,
                    event_code=event_code,
                    year=year,
                    month=month,
                    period_start=str(report.period_start),
                    period_end=str(report.period_end),
                    task_id=task_id,
                )

        # Next month
        current_month_start = step_forward_one_month(current_month_start)

    # Quarterly

    # Calendar months that make up each fiscal quarter. All three months of a
    # quarter are looked up under the same fiscal_year value as the quarter.
    fiscal_quarter_months = {
        1: (10, 11, 12),
        2: (1, 2, 3),
        3: (4, 5, 6),
        4: (7, 8, 9),
    }

    # Ensure we know which quarters exist (or should exist) given MONTHLY rows
    monthly_rows = (
        KeyMetricsReport.objects.filter(period_type=KeyMetricsReport.PeriodType.MONTHLY)
        .values("fiscal_year")
        .annotate(max_month=Max("month"))
    )
    # We will iterate over all fiscal_years that have at least one monthly row
    fiscal_years_with_monthlies = {row["fiscal_year"] for row in monthly_rows}

    # Create missing quarters and refresh stale ones
    for fiscal_year in sorted(fiscal_years_with_monthlies):
        for fiscal_quarter in (1, 2, 3, 4):
            log_entry = None
            if recompute_all:
                log_entry = (
                    "Upserted quarterly KeyMetricsReport.",
                    "key_metrics_quarter_upserted",
                )
            else:
                # Incremental mode: the existing row only matters here, so it
                # is not queried at all when recomputing everything.
                existing_quarter_report = KeyMetricsReport.objects.filter(
                    period_type=KeyMetricsReport.PeriodType.QUARTERLY,
                    fiscal_year=fiscal_year,
                    fiscal_quarter=fiscal_quarter,
                ).first()

                if existing_quarter_report is None:
                    log_entry = (
                        "Created missing quarterly KeyMetricsReport.",
                        "key_metrics_quarter_created",
                    )
                else:
                    # Refresh if any constituent MONTHLY rows are newer than
                    # the quarter row
                    monthly_newer_exists = KeyMetricsReport.objects.filter(
                        period_type=KeyMetricsReport.PeriodType.MONTHLY,
                        fiscal_year=fiscal_year,
                        month__in=fiscal_quarter_months[fiscal_quarter],
                        updated_on__gt=existing_quarter_report.updated_on,
                    ).exists()
                    if monthly_newer_exists:
                        log_entry = (
                            "Refreshed quarterly KeyMetricsReport "
                            "due to newer monthly inputs.",
                            "key_metrics_quarter_refreshed",
                        )

            if log_entry is not None:
                quarter_report = KeyMetricsReport.upsert_quarter(
                    fiscal_year=fiscal_year, fiscal_quarter=fiscal_quarter
                )
                if quarter_report is not None:
                    rows_changed += 1
                    message, event_code = log_entry
                    structured_logger.info(
                        message,
                        event_code=event_code,
                        fiscal_year=fiscal_year,
                        fiscal_quarter=fiscal_quarter,
                        period_start=str(quarter_report.period_start),
                        period_end=str(quarter_report.period_end),
                        task_id=task_id,
                    )

    # Fiscal year

    # Any fiscal year that has at least one quarter row should have a FY rollup
    fiscal_years_with_quarters = set(
        KeyMetricsReport.objects.filter(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY
        ).values_list("fiscal_year", flat=True)
    )

    for fiscal_year in sorted(fiscal_years_with_quarters):
        log_entry = None
        if recompute_all:
            log_entry = (
                "Upserted fiscal-year KeyMetricsReport.",
                "key_metrics_year_upserted",
            )
        else:
            existing_year_report = KeyMetricsReport.objects.filter(
                period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
                fiscal_year=fiscal_year,
            ).first()

            if existing_year_report is None:
                log_entry = (
                    "Created missing fiscal-year KeyMetricsReport.",
                    "key_metrics_year_created",
                )
            else:
                # Refresh if any constituent QUARTER rows are newer than the
                # FY row
                quarter_newer_exists = KeyMetricsReport.objects.filter(
                    period_type=KeyMetricsReport.PeriodType.QUARTERLY,
                    fiscal_year=fiscal_year,
                    updated_on__gt=existing_year_report.updated_on,
                ).exists()
                if quarter_newer_exists:
                    log_entry = (
                        "Refreshed fiscal-year KeyMetricsReport "
                        "due to newer quarterly inputs.",
                        "key_metrics_year_refreshed",
                    )

        if log_entry is not None:
            year_report = KeyMetricsReport.upsert_fiscal_year(fiscal_year=fiscal_year)
            if year_report is not None:
                rows_changed += 1
                message, event_code = log_entry
                structured_logger.info(
                    message,
                    event_code=event_code,
                    fiscal_year=fiscal_year,
                    period_start=str(year_report.period_start),
                    period_end=str(year_report.period_end),
                    task_id=task_id,
                )

    structured_logger.info(
        "Completed KeyMetricsReport build.",
        event_code="key_metrics_build_complete",
        rows_changed=rows_changed,
        task_id=task_id,
        recompute_all=recompute_all,
    )
    return rows_changed


================================================
FILE: concordia/tasks/reports/sitereport.py
================================================
from logging import getLogger

from django.contrib.auth.models import User
from django.db.models import Count, Q, QuerySet
from django.utils import timezone

from concordia.logging import ConcordiaLogger
from concordia.models import (
    ONE_DAY_AGO,
    Asset,
    Campaign,
    Item,
    Project,
    SiteReport,
    Tag,
    Topic,
    Transcription,
    UserAssetTagCollection,
)
from concordia.utils import get_anonymous_user

from ...celery import app as celery_app

# Standard-library logger for this module.
logger = getLogger(__name__)
# Structured logger; calls pass ``event_code`` plus keyword context fields.
structured_logger = ConcordiaLogger.get_logger(__name__)


def _recent_transcriptions() -> QuerySet[Transcription]:
    """
    Build the queryset of transcriptions touched since ``ONE_DAY_AGO``.

    A transcription qualifies when at least one of its ``accepted``,
    ``created_on``, ``rejected``, ``submitted`` or ``updated_on`` timestamps
    is greater than or equal to ``ONE_DAY_AGO``. The size of the resulting
    queryset is logged before it is returned; daily activity and DAU
    calculations build on this queryset.

    Returns:
        QuerySet[Transcription]: Django queryset of recent transcriptions.
    """
    first_field, *remaining_fields = (
        "accepted",
        "created_on",
        "rejected",
        "submitted",
        "updated_on",
    )

    # OR the per-timestamp conditions together, in the order listed above.
    recent_activity = Q(**{f"{first_field}__gte": ONE_DAY_AGO})
    for field_name in remaining_fields:
        recent_activity |= Q(**{f"{field_name}__gte": ONE_DAY_AGO})

    recent = Transcription.objects.filter(recent_activity)
    structured_logger.info(
        "Fetched recent transcriptions for DAU calculation.",
        event_code="recent_transcriptions_fetched",
        transcription_count=recent.count(),
    )
    return recent


def _daily_active_users() -> int:
    """
    Count the distinct users behind the last day's transcription activity.

    Both roles are considered: the ``user`` recorded on each recent
    transcription and, where one is set, its ``reviewed_by`` account. An
    account that appears in both roles is counted once. The per-role counts
    and the combined figure are logged.

    Returns:
        int: The number of unique users who were active in the last day.
    """
    recent = _recent_transcriptions()

    transcriber_ids = recent.values_list("user", flat=True).distinct()
    reviewed = recent.exclude(reviewed_by__isnull=True)
    reviewer_ids = reviewed.values_list("reviewed_by", flat=True).distinct()

    transcriber_count = transcriber_ids.count()
    reviewer_count = reviewer_ids.count()

    # Merge both id lists (reviewers first, then transcribers) and dedupe.
    active_ids = set(reviewer_ids)
    active_ids.update(transcriber_ids)
    daily_active_users = len(active_ids)

    structured_logger.info(
        "Calculated daily active users from recent transcriptions.",
        event_code="daily_active_users_calculated",
        transcriber_count=transcriber_count,
        reviewer_count=reviewer_count,
        daily_active_users=daily_active_users,
    )
    return daily_active_users


@celery_app.task
def site_report() -> None:
    """
    Snapshot site-wide, per-campaign, per-topic and retired-rollup SiteReports.

    The task first stores a site-wide TOTAL row holding current counts for
    assets, items, projects, campaigns, tags, users and transcription
    activity. It then generates one report per non-retired campaign, one per
    topic, and finally the RETIRED_TOTAL rollup.

    The TOTAL row is initially saved with ``assets_started`` set to zero.
    Once the per-campaign reports exist, their ``assets_started`` values are
    summed and, if the sum differs from the stored value, written back to the
    TOTAL row. Rolling the value up from the campaign reports produced in the
    same run keeps campaign retirements from distorting the site-wide series.

    Per-campaign and per-topic ``assets_started`` values are computed by
    ``campaign_report`` and ``topic_report``; the RETIRED_TOTAL rollup is
    produced by ``retired_total_report``.
    """
    structured_logger.debug(
        "Starting site report generation task.",
        event_code="site_report_task_start",
    )

    # Seed every expected status bucket so a status with no assets reports 0.
    status_counts = dict.fromkeys(
        (
            "assets_not_started",
            "assets_in_progress",
            "assets_submitted",
            "assets_completed",
        ),
        0,
    )
    status_rows = Asset.objects.values_list("transcription_status").annotate(
        Count("transcription_status")
    )
    for transcription_status, asset_count in status_rows:
        logger.debug("Assets %s: %d", transcription_status, asset_count)
        status_counts[f"assets_{transcription_status}"] = asset_count

    assets_total = Asset.objects.count()
    assets_published = Asset.objects.published().count()
    assets_unpublished = Asset.objects.unpublished().count()

    items_published = Item.objects.published().count()
    items_unpublished = Item.objects.unpublished().count()

    projects_published = Project.objects.published().count()
    projects_unpublished = Project.objects.unpublished().count()

    campaigns_published = Campaign.objects.published().count()
    campaigns_unpublished = Campaign.objects.unpublished().count()

    users_registered = User.objects.all().count()
    users_activated = User.objects.filter(is_active=True).count()

    anonymous_transcriptions = Transcription.objects.filter(
        user=get_anonymous_user()
    ).count()
    transcriptions_saved = Transcription.objects.all().count()

    daily_review_actions = Transcription.objects.recent_review_actions().count()

    tag_count = UserAssetTagCollection.objects.aggregate(Count("tags"))["tags__count"]
    distinct_tag_count = Tag.objects.all().count()

    total_report = SiteReport()
    total_report.report_name = SiteReport.ReportName.TOTAL

    # Values that are both stored on the report and echoed in the debug log.
    # Key order matches the order in which they are logged.
    logged_counts = {
        "assets_total": assets_total,
        "assets_published": assets_published,
        "assets_unpublished": assets_unpublished,
        # Placeholder; replaced by the per-campaign rollup further down.
        "assets_started": 0,
        "items_published": items_published,
        "items_unpublished": items_unpublished,
        "projects_published": projects_published,
        "projects_unpublished": projects_unpublished,
        "campaigns_published": campaigns_published,
        "campaigns_unpublished": campaigns_unpublished,
        "users_registered": users_registered,
        "users_activated": users_activated,
        "anonymous_transcriptions": anonymous_transcriptions,
        "transcriptions_saved": transcriptions_saved,
        "daily_review_actions": daily_review_actions,
        "distinct_tags": distinct_tag_count,
        "tag_uses": tag_count,
        "daily_active_users": _daily_active_users(),
    }
    # Per-status asset counts are stored but not part of the debug log. The
    # "submitted" status is stored as assets_waiting_review.
    status_fields = {
        "assets_not_started": status_counts["assets_not_started"],
        "assets_in_progress": status_counts["assets_in_progress"],
        "assets_waiting_review": status_counts["assets_submitted"],
        "assets_completed": status_counts["assets_completed"],
    }
    for field_name, value in {**logged_counts, **status_fields}.items():
        setattr(total_report, field_name, value)

    structured_logger.debug(
        "Site-wide counts calculated for report generation.",
        event_code="site_report_counts_calculated",
        **logged_counts,
    )

    total_report.save()

    structured_logger.debug(
        "Site-wide report saved successfully.",
        event_code="site_report_saved",
        site_report_id=total_report.id,
        created_on=total_report.created_on.isoformat(),
    )

    active_campaigns = Campaign.objects.exclude(status=Campaign.Status.RETIRED)
    structured_logger.debug(
        "Generating campaign reports.",
        event_code="campaign_reports_generation_start",
        campaign_count=active_campaigns.count(),
    )
    campaign_reports = [campaign_report(campaign) for campaign in active_campaigns]
    structured_logger.debug(
        "Campaign reports generation completed.",
        event_code="campaign_reports_generation_complete",
    )

    # Roll the per-campaign starts up into the site-wide figure, skipping any
    # missing report and treating a null assets_started as zero.
    total_assets_started = 0
    for per_campaign_report in campaign_reports:
        if per_campaign_report is not None:
            total_assets_started += per_campaign_report.assets_started or 0

    if total_report.assets_started != total_assets_started:
        total_report.assets_started = total_assets_started
        total_report.save(update_fields=["assets_started"])

        structured_logger.debug(
            "Site-wide assets_started rolled up from campaign reports.",
            event_code="site_report_assets_started_rolled_up",
            site_report_id=total_report.id,
            created_on=total_report.created_on.isoformat(),
            assets_started=total_assets_started,
            campaign_report_count=len(campaign_reports),
        )

    all_topics = Topic.objects.all()
    structured_logger.debug(
        "Generating topic reports.",
        event_code="topic_reports_generation_start",
        topic_count=all_topics.count(),
    )
    for topic in all_topics:
        topic_report(topic)
    structured_logger.debug(
        "Topic reports generation completed.",
        event_code="topic_reports_generation_complete",
    )

    retired_total_report()
    structured_logger.debug(
        "Retired total report generation completed.",
        event_code="retired_total_report_complete",
    )

    structured_logger.debug(
        "Site report generation task completed successfully.",
        event_code="site_report_task_complete",
    )


def topic_report(topic: Topic) -> None:
    """
    Generate and save a SiteReport snapshot for a single topic.

    The report aggregates asset, item, project, transcription, tag, and
    review activity counts for everything reachable from the topic through
    its projects and stores them as a new SiteReport row.

    ``assets_started`` is computed by ``SiteReport.calculate_assets_started``
    from this run's ``assets_total`` / ``assets_not_started`` and the values
    on the previous report in the topic's series; when no previous report is
    found, both previous values default to zero.

    Args:
        topic: Topic instance to generate a report for.
    """
    structured_logger.debug(
        "Starting topic report generation.",
        event_code="topic_report_generation_start",
        # Pass the topic under the same key as every other log call in this
        # function rather than handing the model instance to ``topic_slug``.
        topic=topic,
    )
    # Pre-seed the expected statuses so a status with no assets reports zero.
    report = {
        "assets_not_started": 0,
        "assets_in_progress": 0,
        "assets_submitted": 0,
        "assets_completed": 0,
    }

    asset_count_qs = (
        Asset.objects.filter(item__project__topics=topic)
        .values_list("transcription_status")
        .annotate(Count("transcription_status"))
    )

    for status, count in asset_count_qs:
        logger.debug("Topic %s assets %s: %d", topic.slug, status, count)
        report[f"assets_{status}"] = count

    assets_total = Asset.objects.filter(item__project__topics=topic).count()
    if assets_total == 0:
        structured_logger.warning(
            "Topic report generated with zero total assets.",
            event_code="topic_report_zero_assets",
            reason="Topic has no associated assets",
            reason_code="no_assets",
            topic=topic,
        )
    assets_published = (
        Asset.objects.published().filter(item__project__topics=topic).count()
    )
    assets_unpublished = (
        Asset.objects.unpublished().filter(item__project__topics=topic).count()
    )

    items_published = Item.objects.published().filter(project__topics=topic).count()
    items_unpublished = Item.objects.unpublished().filter(project__topics=topic).count()

    projects_published = Project.objects.published().filter(topics=topic).count()
    projects_unpublished = Project.objects.unpublished().filter(topics=topic).count()

    anonymous_transcriptions = Transcription.objects.filter(
        asset__item__project__topics=topic, user=get_anonymous_user()
    ).count()
    transcriptions_saved = Transcription.objects.filter(
        asset__item__project__topics=topic
    ).count()

    daily_review_actions = (
        Transcription.objects.recent_review_actions()
        .filter(asset__item__project__topics__in=(topic,))
        .count()
    )

    asset_tag_collections = UserAssetTagCollection.objects.filter(
        asset__item__project__topics=topic
    )

    stats = asset_tag_collections.order_by().aggregate(tag_count=Count("tags"))
    tag_count = stats["tag_count"]

    # Collect the distinct tag ids in a single query instead of issuing one
    # query per tag collection. Collections without tags yield a null id from
    # the join, which is discarded.
    distinct_tag_ids = {
        tag_id
        for tag_id in asset_tag_collections.order_by()
        .values_list("tags", flat=True)
        .distinct()
        if tag_id is not None
    }
    distinct_tag_count = len(distinct_tag_ids)

    previous = SiteReport.objects.previous_in_series(topic=topic, before=timezone.now())
    # getattr with a default covers the case where ``previous`` is None.
    assets_started = SiteReport.calculate_assets_started(
        previous_assets_total=getattr(previous, "assets_total", 0),
        previous_assets_not_started=getattr(previous, "assets_not_started", 0),
        current_assets_total=assets_total,
        current_assets_not_started=report["assets_not_started"],
    )

    structured_logger.debug(
        "Topic counts calculated for report generation.",
        event_code="topic_report_counts_calculated",
        topic=topic,
        assets_total=assets_total,
        assets_published=assets_published,
        assets_unpublished=assets_unpublished,
        assets_started=assets_started,
        items_published=items_published,
        items_unpublished=items_unpublished,
        projects_published=projects_published,
        projects_unpublished=projects_unpublished,
        anonymous_transcriptions=anonymous_transcriptions,
        transcriptions_saved=transcriptions_saved,
        daily_review_actions=daily_review_actions,
        distinct_tags=distinct_tag_count,
        tag_uses=tag_count,
    )
    site_report = SiteReport()
    site_report.topic = topic
    site_report.assets_total = assets_total
    site_report.assets_published = assets_published
    site_report.assets_not_started = report["assets_not_started"]
    site_report.assets_in_progress = report["assets_in_progress"]
    # The "submitted" transcription status is stored as "waiting review".
    site_report.assets_waiting_review = report["assets_submitted"]
    site_report.assets_completed = report["assets_completed"]
    site_report.assets_unpublished = assets_unpublished
    site_report.items_published = items_published
    site_report.items_unpublished = items_unpublished
    site_report.projects_published = projects_published
    site_report.projects_unpublished = projects_unpublished
    site_report.anonymous_transcriptions = anonymous_transcriptions
    site_report.transcriptions_saved = transcriptions_saved
    site_report.daily_review_actions = daily_review_actions
    site_report.distinct_tags = distinct_tag_count
    site_report.tag_uses = tag_count
    site_report.assets_started = assets_started
    site_report.save()
    structured_logger.debug(
        "Topic report saved successfully.",
        event_code="topic_report_saved",
        topic=topic,
        site_report_id=site_report.id,
        created_on=site_report.created_on.isoformat(),
    )


def campaign_report(campaign: Campaign) -> SiteReport:
    """
    Generate and save a SiteReport snapshot for a single campaign.

    The report aggregates asset, item, project, transcription, contributor,
    tag, and review counts for the campaign and stores them as a new
    SiteReport row.

    ``assets_started`` is computed by ``SiteReport.calculate_assets_started``
    from this run's ``assets_total`` / ``assets_not_started`` and the values
    on the previous report in the campaign's series; when no previous report
    is found, both previous values default to zero. Because only totals and
    not-started counts feed the calculation, publish/unpublish changes alone
    do not affect it as long as those counts remain consistent.

    ``registered_contributors`` counts the distinct non-empty ``user_id`` and
    ``reviewed_by`` values across transcriptions on assets that are published
    and whose item and project are also published.

    Args:
        campaign: Campaign instance to generate a report for.

    Returns:
        SiteReport: The newly created campaign SiteReport.
    """
    structured_logger.debug(
        "Starting campaign report generation.",
        event_code="campaign_report_generation_start",
        campaign=campaign,
    )
    # Pre-seed the expected statuses so a status with no assets reports zero.
    report = {
        "assets_not_started": 0,
        "assets_in_progress": 0,
        "assets_submitted": 0,
        "assets_completed": 0,
    }

    asset_count_qs = (
        Asset.objects.filter(item__project__campaign=campaign)
        .values_list("transcription_status")
        .annotate(Count("transcription_status"))
    )

    for status, count in asset_count_qs:
        logger.debug("Campaign %s assets %s: %d", campaign.slug, status, count)
        report[f"assets_{status}"] = count

    assets_total = Asset.objects.filter(item__project__campaign=campaign).count()
    if assets_total == 0:
        structured_logger.warning(
            "Campaign report generated with zero total assets.",
            event_code="campaign_report_zero_assets",
            reason="Campaign has no associated assets",
            reason_code="no_assets",
            campaign=campaign,
        )
    assets_published = (
        Asset.objects.published().filter(item__project__campaign=campaign).count()
    )
    assets_unpublished = (
        Asset.objects.unpublished().filter(item__project__campaign=campaign).count()
    )

    items_published = (
        Item.objects.published().filter(project__campaign=campaign).count()
    )
    items_unpublished = (
        Item.objects.unpublished().filter(project__campaign=campaign).count()
    )

    projects_published = Project.objects.published().filter(campaign=campaign).count()
    projects_unpublished = (
        Project.objects.unpublished().filter(campaign=campaign).count()
    )

    anonymous_transcriptions = Transcription.objects.filter(
        asset__item__project__campaign=campaign, user=get_anonymous_user()
    ).count()
    transcriptions_saved = Transcription.objects.filter(
        asset__item__project__campaign=campaign
    ).count()

    daily_review_actions = (
        Transcription.objects.recent_review_actions()
        .filter(asset__item__project__campaign=campaign)
        .count()
    )

    asset_tag_collections = UserAssetTagCollection.objects.filter(
        asset__item__project__campaign=campaign
    )

    stats = asset_tag_collections.order_by().aggregate(tag_count=Count("tags"))
    tag_count = stats["tag_count"]

    # Collect the distinct tag ids in a single query instead of issuing one
    # query per tag collection. Collections without tags yield a null id from
    # the join, which is discarded.
    distinct_tag_ids = {
        tag_id
        for tag_id in asset_tag_collections.order_by()
        .values_list("tags", flat=True)
        .distinct()
        if tag_id is not None
    }
    distinct_tag_count = len(distinct_tag_ids)

    # Contributors are only counted on fully published assets.
    campaign_assets = Asset.objects.filter(
        item__project__campaign=campaign,
        item__project__published=True,
        item__published=True,
        published=True,
    )
    asset_transcriptions = Transcription.objects.filter(
        asset__in=campaign_assets
    ).values_list("user_id", "reviewed_by")
    # Each row is a (user_id, reviewed_by) pair; flatten both columns into one
    # set and drop empty values (for example, unreviewed transcriptions).
    user_ids = {
        user_id
        for transcription in asset_transcriptions
        for user_id in transcription
        if user_id
    }
    registered_contributor_count = len(user_ids)

    previous = SiteReport.objects.previous_in_series(
        campaign=campaign, before=timezone.now()
    )
    # getattr with a default covers the case where ``previous`` is None.
    assets_started = SiteReport.calculate_assets_started(
        previous_assets_total=getattr(previous, "assets_total", 0),
        previous_assets_not_started=getattr(previous, "assets_not_started", 0),
        current_assets_total=assets_total,
        current_assets_not_started=report["assets_not_started"],
    )

    structured_logger.debug(
        "Campaign counts calculated for report generation.",
        event_code="campaign_report_counts_calculated",
        campaign=campaign,
        assets_total=assets_total,
        assets_published=assets_published,
        assets_unpublished=assets_unpublished,
        assets_started=assets_started,
        items_published=items_published,
        items_unpublished=items_unpublished,
        projects_published=projects_published,
        projects_unpublished=projects_unpublished,
        anonymous_transcriptions=anonymous_transcriptions,
        transcriptions_saved=transcriptions_saved,
        daily_review_actions=daily_review_actions,
        distinct_tags=distinct_tag_count,
        tag_uses=tag_count,
        registered_contributors=registered_contributor_count,
    )
    site_report = SiteReport()
    site_report.campaign = campaign
    site_report.assets_total = assets_total
    site_report.assets_published = assets_published
    site_report.assets_not_started = report["assets_not_started"]
    site_report.assets_in_progress = report["assets_in_progress"]
    # The "submitted" transcription status is stored as "waiting review".
    site_report.assets_waiting_review = report["assets_submitted"]
    site_report.assets_completed = report["assets_completed"]
    site_report.assets_unpublished = assets_unpublished
    site_report.items_published = items_published
    site_report.items_unpublished = items_unpublished
    site_report.projects_published = projects_published
    site_report.projects_unpublished = projects_unpublished
    site_report.anonymous_transcriptions = anonymous_transcriptions
    site_report.transcriptions_saved = transcriptions_saved
    site_report.daily_review_actions = daily_review_actions
    site_report.distinct_tags = distinct_tag_count
    site_report.tag_uses = tag_count
    site_report.registered_contributors = registered_contributor_count
    site_report.assets_started = assets_started
    site_report.save()
    structured_logger.debug(
        "Campaign report saved successfully.",
        event_code="campaign_report_saved",
        campaign=campaign,
        site_report_id=site_report.id,
        created_on=site_report.created_on.isoformat(),
    )
    return site_report


def retired_total_report() -> None:
    """
    Build and store the RETIRED_TOTAL SiteReport rollup.

    The newest SiteReport of every retired campaign is selected and the
    listed count fields are summed into a single rollup row; null values are
    treated as zero.

    ``assets_started`` is a daily-delta metric and is not meaningful for this
    rollup: its membership changes whenever a campaign retires, which would
    cause every asset in a newly retired campaign to be counted as having
    started on the day of the retirement. It is therefore stored as zero.
    """
    structured_logger.debug(
        "Starting retired total report generation.",
        event_code="retired_total_report_generation_start",
    )

    # One row per retired campaign: ordering by campaign and then newest
    # first lets DISTINCT ON campaign_id keep the most recent report.
    latest_per_campaign = (
        SiteReport.objects.filter(campaign__status=Campaign.Status.RETIRED)
        .order_by("campaign_id", "-created_on")
        .distinct("campaign_id")
    )

    summed_fields = (
        "assets_total",
        "assets_published",
        "assets_not_started",
        "assets_in_progress",
        "assets_waiting_review",
        "assets_completed",
        "assets_unpublished",
        "items_published",
        "items_unpublished",
        "projects_published",
        "projects_unpublished",
        "anonymous_transcriptions",
        "transcriptions_saved",
        "daily_review_actions",
        "distinct_tags",
        "tag_uses",
        "registered_contributors",
    )

    rollup = SiteReport()
    rollup.report_name = SiteReport.ReportName.RETIRED_TOTAL

    for field_name in summed_fields:
        field_total = 0
        for campaign_snapshot in latest_per_campaign:
            field_total += getattr(campaign_snapshot, field_name) or 0
        setattr(rollup, field_name, field_total)

    # No asset can be started once its campaign is retired, so the rollup's
    # assets_started is always zero. Deriving it the way other reports do
    # would count every asset of a newly retired campaign as started.
    rollup.assets_started = 0

    rollup.save()
    structured_logger.debug(
        "Retired total report saved successfully.",
        event_code="retired_total_report_saved",
        site_report_id=rollup.id,
        created_on=rollup.created_on.isoformat(),
    )


================================================
FILE: concordia/tasks/reservations.py
================================================
import datetime
from logging import getLogger

from django.conf import settings
from django.utils import timezone

from concordia.logging import ConcordiaLogger
from concordia.models import AssetTranscriptionReservation
from concordia.signals.signals import reservation_released

from ..celery import app as celery_app

logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task
def expire_inactive_asset_reservations():
    """
    Release and delete stale asset transcription reservations.

    This task identifies reservations which have not been updated within a grace
    period defined as twice ``TRANSCRIPTION_RESERVATION_SECONDS`` and which are
    not tombstoned, and for each one:

    * Emits the ``reservation_released`` signal with the asset primary key and
      reservation token so any listeners can react.
    * Deletes the expired reservation record from the database.

    Reservations whose ``tombstoned`` value is either ``False`` or NULL are
    both treated as active.

    This is intended to be run periodically (for example via Celery beat) to
    ensure that abandoned reservations do not block other users from working on
    assets.
    """
    timestamp = timezone.now()

    # Clear old reservations, with a grace period:
    cutoff = timestamp - (
        datetime.timedelta(seconds=2 * settings.TRANSCRIPTION_RESERVATION_SECONDS)
    )

    logger.debug("Clearing reservations with last reserve time older than %s", cutoff)
    # Exclude tombstoned rows rather than matching ``tombstoned IN (NULL,
    # False)``: SQL ``IN`` never matches NULL, so that form silently skipped
    # reservations whose tombstoned column is NULL.
    expired_reservations = AssetTranscriptionReservation.objects.filter(
        updated_on__lt=cutoff
    ).exclude(tombstoned=True)

    for reservation in expired_reservations:
        logger.debug("Expired reservation with token %s", reservation.reservation_token)
        reservation_released.send(
            sender="reserve_asset",
            asset_pk=reservation.asset.pk,
            reservation_token=reservation.reservation_token,
        )
        reservation.delete()


@celery_app.task
def tombstone_old_active_asset_reservations():
    """
    Mark very old active reservations as tombstoned.

    This task finds asset transcription reservations whose ``created_on`` is
    older than ``TRANSCRIPTION_RESERVATION_TOMBSTONE_HOURS`` and that are not
    already tombstoned (``tombstoned`` is ``False`` or NULL). Each matching
    reservation is marked with ``tombstoned=True`` and saved.

    Tombstoning is a soft-deactivation step that prevents further use of
    obsolete reservations while still retaining a short history for debugging
    or analytics before final deletion.
    """
    timestamp = timezone.now()

    cutoff = timestamp - (
        datetime.timedelta(hours=settings.TRANSCRIPTION_RESERVATION_TOMBSTONE_HOURS)
    )

    # Exclude tombstoned rows rather than matching ``tombstoned IN (NULL,
    # False)``: SQL ``IN`` never matches NULL, so that form silently skipped
    # reservations whose tombstoned column is NULL.
    old_reservations = AssetTranscriptionReservation.objects.filter(
        created_on__lt=cutoff
    ).exclude(tombstoned=True)
    for reservation in old_reservations:
        logger.debug("Tombstoning reservation %s ", reservation.reservation_token)
        reservation.tombstoned = True
        # NOTE(review): a full save() is kept deliberately; the tombstone
        # cleanup task filters on ``updated_on``, which presumably is
        # refreshed by save() - confirm before narrowing to update_fields.
        reservation.save()


@celery_app.task
def delete_old_tombstoned_reservations():
    """
    Purge tombstoned reservations once their retention window has passed.

    A reservation is removed when both of the following hold:

    * ``tombstoned`` is ``True``.
    * ``updated_on`` is older than now minus
      ``TRANSCRIPTION_RESERVATION_TOMBSTONE_LENGTH_HOURS`` hours.

    Matching rows are deleted one at a time, with a debug log entry for
    each, so tombstoned reservation records do not linger indefinitely.
    """
    retention_hours = settings.TRANSCRIPTION_RESERVATION_TOMBSTONE_LENGTH_HOURS
    cutoff = timezone.now() - datetime.timedelta(hours=retention_hours)

    stale_tombstones = AssetTranscriptionReservation.objects.filter(
        updated_on__lt=cutoff, tombstoned__exact=True
    )
    for tombstone in stale_tombstones:
        token = tombstone.reservation_token
        logger.debug("Deleting old tombstoned reservation %s", token)
        tombstone.delete()


================================================
FILE: concordia/tasks/retirement.py
================================================
from logging import getLogger

from celery import chord
from django.db import transaction
from django.db.models import F
from django.utils import timezone

from concordia.logging import ConcordiaLogger
from concordia.models import Asset, Campaign, CampaignRetirementProgress, Item, Project

from ..celery import app as celery_app

logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(ignore_result=True)
def retire_campaign(campaign_id):
    """
    Start the retirement workflow for a campaign.

    This task:

    * Loads the `Campaign` for ``campaign_id``.
    * Creates or retrieves the related `CampaignRetirementProgress` row.
    * For a new progress row, calculates and stores total counts of projects,
      items and assets.
    * Marks the campaign status as ``RETIRED`` if it is not already.
    * Enqueues `remove_next_project` to begin cascading removal of projects,
      items and assets.

    Args:
        campaign_id: Primary key of the `Campaign` to retire.

    Returns:
        CampaignRetirementProgress: The progress object tracking this
            retirement run. The task is declared with ``ignore_result=True``,
            so the value is only visible to direct (non-Celery) callers.

    Raises:
        Campaign.DoesNotExist: If no campaign matches ``campaign_id``.
    """
    # Entry point to the retirement process
    campaign = Campaign.objects.get(id=campaign_id)
    logger.debug("Retiring %s (%s)", campaign, campaign.id)
    progress, created = CampaignRetirementProgress.objects.get_or_create(
        campaign=campaign
    )
    if created:
        # We want to set totals on a newly created progress object
        # but not on one that already exists. This allows us to keep proper
        # track of the full progress if the process is stopped and resumed
        project_ids = campaign.project_set.values_list("id", flat=True)
        item_ids = Item.objects.filter(project__id__in=project_ids).values_list(
            "id", flat=True
        )
        # Count in the database instead of loading every id into memory just
        # to measure the list; the asset total in particular can be large.
        progress.project_total = project_ids.count()
        progress.item_total = item_ids.count()
        progress.asset_total = Asset.objects.filter(item__id__in=item_ids).count()
        progress.save()
    if campaign.status != Campaign.Status.RETIRED:
        logger.debug("Setting campaign status to retired")
        # We want to make sure the status is set to Retired before
        # we start removing information so the front-end is pulling
        # from archived data rather than live
        campaign.status = Campaign.Status.RETIRED
        campaign.save()
    remove_next_project.delay(campaign.id)
    return progress


@celery_app.task(ignore_result=True)
def project_removal_success(project_id, campaign_id):
    """
    Note a deleted project on the retirement progress row and continue.

    Inside a transaction, the campaign's `CampaignRetirementProgress` row is
    fetched with a row lock and then:

    * ``projects_removed`` is incremented by one using a database-side
      expression.
    * A ``{"type": "project", "id": project_id}`` entry is appended to
      ``removal_log``.

    After the transaction, `remove_next_project` is enqueued so the campaign
    retirement keeps going.

    Args:
        project_id: Primary key of the project that was just deleted.
        campaign_id: Primary key of the parent `Campaign`.
    """
    logger.debug("Updating progress for campaign %s", campaign_id)
    logger.debug("Project id %s", project_id)

    log_entry = {"type": "project", "id": project_id}
    with transaction.atomic():
        locked_rows = CampaignRetirementProgress.objects.select_for_update()
        retirement = locked_rows.get(campaign__id=campaign_id)
        retirement.removal_log.append(log_entry)
        # F() makes the increment happen in the database on save.
        retirement.projects_removed = F("projects_removed") + 1
        retirement.save()
        logger.debug("Progress updated for %s", campaign_id)

    remove_next_project.delay(campaign_id)


@celery_app.task(ignore_result=True)
def remove_next_project(campaign_id):
    """
    Queue removal of a campaign's next project, or finish the retirement.

    The first project still attached to the campaign is looked up. When one
    exists, `remove_next_item` is enqueued for it. When none remain, the
    campaign's `CampaignRetirementProgress` row is locked inside a
    transaction, flagged as ``complete`` and stamped with ``completed_on``.

    Args:
        campaign_id: Primary key of the `Campaign` whose projects are being
            retired.
    """
    campaign = Campaign.objects.get(id=campaign_id)
    logger.debug("Removing projects for %s (%s)", campaign, campaign.id)

    remaining_projects = campaign.project_set.all()
    try:
        next_project = remaining_projects[0]
        remove_next_item.delay(next_project.id)
    except IndexError:
        # Indexing an empty result raises IndexError: every project has been
        # deleted, so the campaign is fully retired.
        logger.debug("Updating progress for campaign %s", campaign_id)
        logger.debug("Retirement complete for campaign %s", campaign_id)
        with transaction.atomic():
            locked_rows = CampaignRetirementProgress.objects.select_for_update()
            retirement = locked_rows.get(campaign__id=campaign_id)
            retirement.complete = True
            retirement.completed_on = timezone.now()
            retirement.save()
        logger.debug("Progress updated for %s", campaign_id)


@celery_app.task(ignore_result=True)
def item_removal_success(item_id, campaign_id, project_id):
    """
    Note a deleted item on the retirement progress row and continue.

    Inside a transaction, the campaign's `CampaignRetirementProgress` row is
    fetched with a row lock and then:

    * ``items_removed`` is incremented by one using a database-side
      expression.
    * A ``{"type": "item", "id": item_id}`` entry is appended to
      ``removal_log``.

    After the transaction, `remove_next_item` is enqueued for the parent
    project so its remaining items keep being removed.

    Args:
        item_id: Primary key of the item that was just deleted.
        campaign_id: Primary key of the parent `Campaign`.
        project_id: Primary key of the parent `Project`.
    """
    logger.debug("Updating progress for campaign %s", campaign_id)
    logger.debug("Item id %s", item_id)

    log_entry = {"type": "item", "id": item_id}
    with transaction.atomic():
        locked_rows = CampaignRetirementProgress.objects.select_for_update()
        retirement = locked_rows.get(campaign__id=campaign_id)
        retirement.removal_log.append(log_entry)
        # F() makes the increment happen in the database on save.
        retirement.items_removed = F("items_removed") + 1
        retirement.save()
    logger.debug("Progress updated for %s", campaign_id)

    remove_next_item.delay(project_id)


@celery_app.task(ignore_result=True)
def remove_next_item(project_id):
    """
    Remove the next item in a project or delete the project if empty.

    This task attempts to fetch the first remaining item for the given
    project. If an item exists, it enqueues `remove_next_assets` to delete
    that item's assets. If no items remain, it deletes the project and
    enqueues `project_removal_success`.

    Args:
        project_id: Primary key of the `Project` whose items are being
            removed.

    Raises:
        Project.DoesNotExist: If no project matches ``project_id``.
    """
    project = Project.objects.get(id=project_id)
    logger.debug("Removing items for %s (%s)", project, project.id)
    try:
        item = project.item_set.all()[0]
        remove_next_assets.delay(item.id)
    except IndexError:
        # No more items remain for this project, so we can now delete
        # the project
        logger.debug("All items removed for %s (%s)", project, project.id)
        # Read both ids before delete(); they are needed for the follow-up
        # task once the project instance is gone.
        campaign_id = project.campaign.id
        project_id = project.id
        project.delete()
        project_removal_success.delay(project_id, campaign_id)


@celery_app.task(ignore_result=True)
def assets_removal_success(asset_ids, campaign_id, item_id):
    """
    Log a deleted batch of assets against the campaign's retirement progress.

    Inside a single transaction the `CampaignRetirementProgress` row for the
    campaign is fetched with ``select_for_update()``, ``assets_removed`` is
    raised by ``len(asset_ids)`` through an ``F()`` expression and one
    ``{"type": "asset", "id": ...}`` entry per asset is added to
    ``removal_log``. Afterwards `remove_next_assets` is enqueued for the
    item.

    Args:
        asset_ids: Primary keys of the assets that were just deleted.
        campaign_id: Primary key of the parent `Campaign`.
        item_id: Primary key of the parent `Item`.
    """
    logger.debug("Updating progress for campaign %s", campaign_id)
    logger.debug("Asset ids %s", asset_ids)
    with transaction.atomic():
        locked_rows = CampaignRetirementProgress.objects.select_for_update()
        retirement = locked_rows.get(campaign__id=campaign_id)
        retirement.assets_removed = F("assets_removed") + len(asset_ids)
        new_entries = [
            {
                "type": "asset",
                "id": removed_id,
            }
            for removed_id in asset_ids
        ]
        retirement.removal_log.extend(new_entries)
        retirement.save()
    logger.debug("Progress updated for %s", campaign_id)
    # Continue with whatever assets are left on the item
    remove_next_assets.delay(item_id)


@celery_app.task(ignore_result=True)
def remove_next_assets(item_id):
    """
    Remove assets for an item in small batches or delete the item.

    This task fetches the primary keys of up to ten remaining assets for the
    given item. If none remain, it deletes the item and enqueues
    `item_removal_success`. Otherwise it runs a Celery chord of
    `delete_asset` tasks for that batch, using `assets_removal_success` as
    the callback.

    Args:
        item_id: Primary key of the `Item` whose assets are being removed.
    """
    item = Item.objects.get(id=item_id)
    campaign_id = item.project.campaign.id
    logger.debug("Removing assets for %s (%s)", item, item.id)

    # Only the ids of the next batch are needed; slicing before evaluation
    # avoids loading every asset row of a large item just to test for
    # emptiness and take the first ten.
    batch_ids = list(item.asset_set.values_list("id", flat=True)[:10])

    if not batch_ids:
        # No assets remain for this item, so we can safely delete it
        logger.debug("All assets removed for %s (%s)", item, item.id)
        # Capture the identifiers before deleting the item instance
        removed_item_id = item.id
        project_id = item.project.id
        item.delete()
        item_removal_success.delay(removed_item_id, campaign_id, project_id)
    else:
        # We delete assets in chunks of 10 in order to not lock up the database
        # for a long period of time.
        chord(delete_asset.s(asset_id) for asset_id in batch_ids)(
            assets_removal_success.s(campaign_id, item.id)
        )


@celery_app.task
def delete_asset(asset_id):
    """
    Delete one asset together with its stored image file.

    The `Asset` is looked up by primary key, its ``storage_image`` file is
    deleted (without saving the model) and then the asset row itself is
    deleted. The primary key is returned so that a chord callback can record
    which assets were removed.

    Args:
        asset_id: Primary key of the `Asset` to delete.

    Returns:
        The primary key of the deleted asset.
    """
    asset = Asset.objects.get(id=asset_id)
    # Remember the key now; it is still needed after the row is gone
    removed_id = asset.id
    logger.debug("Deleting asset %s (%s)", asset, removed_id)
    # The image file is removed explicitly, even though deleting the asset
    # should take care of it as well
    asset.storage_image.delete(save=False)
    asset.delete()
    logger.debug("Asset %s (%s) deleted", asset, removed_id)

    return removed_id


================================================
FILE: concordia/tasks/search_index.py
================================================
from logging import getLogger

from django.core.management import call_command

from concordia.logging import ConcordiaLogger

from ..celery import app as celery_app

logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task
def create_opensearch_indices():
    """
    Run the ``opensearch index create`` management command.

    The command is called with ``verbosity=2``, ``force=True`` and
    ``ignore_error=True``.
    """
    command_options = {"verbosity": 2, "force": True, "ignore_error": True}
    call_command("opensearch", "index", "create", **command_options)


@celery_app.task
def delete_opensearch_indices():
    """
    Run the ``opensearch index delete`` management command.

    The command is called with ``force=True`` and ``ignore_error=True``.
    """
    command_options = {"force": True, "ignore_error": True}
    call_command("opensearch", "index", "delete", **command_options)


@celery_app.task
def rebuild_opensearch_indices():
    """
    Run the ``opensearch index rebuild`` management command.

    The command is called with ``verbosity=2``, ``force=True`` and
    ``ignore_error=True``.
    """
    command_options = {"verbosity": 2, "force": True, "ignore_error": True}
    call_command("opensearch", "index", "rebuild", **command_options)


@celery_app.task
def populate_opensearch_users_indices():
    """
    Index documents into the ``users`` OpenSearch index.

    Runs the ``opensearch document index`` management command restricted to
    ``--indices users`` and passes the ``--force`` and ``--parallel`` flags.
    """
    command_args = (
        "opensearch",
        "document",
        "index",
        "--indices",
        "users",
        "--force",
        "--parallel",
    )
    call_command(*command_args)


@celery_app.task
def populate_opensearch_assets_indices():
    """
    Index documents into the ``assets`` OpenSearch index.

    Runs the ``opensearch document index`` management command restricted to
    ``--indices assets`` and passes the ``--force`` and ``--parallel`` flags.
    """
    index_selection = ("--indices", "assets")
    flags = ("--force", "--parallel")
    call_command("opensearch", "document", "index", *index_selection, *flags)


@celery_app.task
def populate_opensearch_indices():
    """
    Index documents into every OpenSearch document index.

    Runs the ``opensearch document index`` management command with the
    ``--force`` and ``--parallel`` flags and no index restriction.
    """
    flags = ("--force", "--parallel")
    call_command("opensearch", "document", "index", *flags)


================================================
FILE: concordia/tasks/thumbnails.py
================================================
from logging import getLogger
from typing import Optional

import requests
from celery import group
from django.db import transaction
from django.db.models import Q

from concordia.logging import ConcordiaLogger
from concordia.models import Item

from ..celery import app as celery_app

logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)

# TODO: remove download_item_thumbnail_task once `item.thumbnail_url` is removed


@celery_app.task(
    bind=True,
    autoretry_for=(requests.RequestException,),
    retry_backoff=5,
    retry_kwargs={"max_retries": 5, "countdown": 5},
)
def download_item_thumbnail_task(
    self,
    item_id: int,
    force: bool = False,
) -> str:
    """
    Download the thumbnail for one item from its ``thumbnail_url``.

    The item is loaded with a row lock and a restricted field list. When it
    has no ``thumbnail_url`` the task logs that fact and returns a short
    message instead of downloading anything. Otherwise the work is handed to
    ``download_and_set_item_thumbnail`` and its result is returned.

    Args:
        item_id: Primary key of the item to process.
        force: Passed through to ``download_and_set_item_thumbnail``.

    Returns:
        The value returned by ``download_and_set_item_thumbnail``, or the
        skip message when the item has no thumbnail URL.

    Raises:
        requests.RequestException: Listed in ``autoretry_for``, so Celery
            retries the task when it is raised.
    """
    # Imported here rather than at module level, as in the original code
    from importer.tasks.items import download_and_set_item_thumbnail

    # NOTE(review): the row lock only lasts for this atomic block; it has
    # been released by the time the download below runs - confirm intended.
    with transaction.atomic():
        locked_items = Item.objects.select_for_update(of=("self",))
        narrowed_items = locked_items.only(
            "id", "thumbnail_url", "thumbnail_image", "item_id"
        )
        item = narrowed_items.get(pk=item_id)

    source_url = item.thumbnail_url
    if source_url:
        return download_and_set_item_thumbnail(item, source_url, force=force)

    skip_message = "No thumbnail URL available."
    logger.info("download_item_thumbnail_task: %s item_id=%s", skip_message, item_id)
    return skip_message


# TODO: remove download_missing_thumbnails_task once `item.thumbnail_url` is removed


@celery_app.task(bind=True)
def download_missing_thumbnails_task(
    self,
    project_id: Optional[int] = None,
    batch_size: int = 10,
    limit: Optional[int] = None,
    force: bool = False,
) -> int:
    """
    Spawn per-item download tasks for items missing thumbnails in chunks.

    This finds items that have a non-empty ``thumbnail_url`` but no stored
    ``thumbnail_image``. It then executes per-item tasks in chunks of
    ``batch_size``, waiting for each chunk to finish before starting the next.

    Args:
        project_id: Optional project filter.
        batch_size: Number of parallel tasks per wave. Must be at least 1.
        limit: Optional cap on total items processed.
        force: Overwrite existing thumbnails if true.

    Returns:
        Count of items scheduled or processed.

    Raises:
        ValueError: If ``batch_size`` is smaller than 1.
    """
    # A zero step makes ``range`` fail with an unrelated message and a
    # negative step yields no chunks at all, which would let the task report
    # items as processed without scheduling anything. Reject both up front.
    if batch_size < 1:
        raise ValueError(f"batch_size must be at least 1, got {batch_size!r}")

    qs = Item.objects.all()

    if project_id is not None:
        qs = qs.filter(project_id=project_id)

    # Items with a usable source URL but no stored thumbnail image
    qs = qs.filter(
        Q(thumbnail_url__isnull=False)
        & ~Q(thumbnail_url="")
        & (Q(thumbnail_image__isnull=True) | Q(thumbnail_image=""))
    ).order_by("pk")

    if limit is not None:
        qs = qs[:limit]

    ids = list(qs.values_list("pk", flat=True))
    total = len(ids)
    if total == 0:
        logger.info("download_missing_thumbnails_task: nothing to do.")
        return 0

    # Process in waves of `batch_size`, waiting between waves.
    for i in range(0, total, batch_size):
        chunk = ids[i : i + batch_size]
        task_group = group(
            download_item_thumbnail_task.s(item_id, force=force) for item_id in chunk
        )
        result = task_group.apply_async()
        # Block this task until the chunk finishes; then schedule next.
        result.get(disable_sync_subtasks=False)

    logger.info(
        "download_missing_thumbnails_task: processed %s items in chunks of %s",
        total,
        batch_size,
    )
    return total


================================================
FILE: concordia/tasks/unusualactivity.py
================================================
import datetime
from logging import getLogger

from django.conf import settings
from django.contrib.sites.models import Site
from django.core.mail import EmailMultiAlternatives
from django.template import loader
from django.utils import timezone

from concordia.logging import ConcordiaLogger
from concordia.models import Transcription

from ..celery import app as celery_app

logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)

ENV_MAPPING = {"development": "DEV", "test": "TEST", "staging": "STAGE"}


@celery_app.task(ignore_result=True)
def unusual_activity(ignore_env: bool = False) -> None:
    """
    Send an email report about suspect transcription or review activity.

    By default this task runs only when ``CONCORDIA_ENVIRONMENT`` is
    set to ``"production"``. Setting ``ignore_env`` to true forces the
    report to be generated in other environments and, outside production,
    adds an environment tag to the subject line. The tag comes from
    ``ENV_MAPPING``; an environment without a mapping entry is tagged with
    its upper-cased name.

    The report includes:

    * Transcriptions returned by ``transcribe_incidents`` for the past day
    * Reviews returned by ``review_incidents`` for the past day

    Both plain text and HTML versions of the report are rendered from
    templates and emailed.

    Args:
        ignore_env: Generate and send the report even if the current
            environment is not production.

    Returns:
        None
    """
    environment = settings.CONCORDIA_ENVIRONMENT
    in_production = environment == "production"

    # Don't bother running unless we're in the prod env
    if not (in_production or ignore_env):
        return

    site = Site.objects.get_current()
    display_time = timezone.localtime().strftime("%b %d %Y, %I:%M %p")
    one_day_ago = timezone.now() - datetime.timedelta(days=1)
    title = "Unusual User Activity Report for " + display_time
    if ignore_env and not in_production:
        # ENV_MAPPING has no "production" entry and may lack others, so a
        # plain subscript would raise KeyError and abort the report.
        title += " [%s]" % ENV_MAPPING.get(environment, str(environment).upper())
    context = {
        "title": title,
        "domain": "https://" + site.domain,
        "transcriptions": Transcription.objects.transcribe_incidents(one_day_ago),
        "reviews": Transcription.objects.review_incidents(one_day_ago),
    }

    text_body_template = loader.get_template("emails/unusual_activity.txt")
    text_body_message = text_body_template.render(context)

    html_body_template = loader.get_template("emails/unusual_activity.html")
    html_body_message = html_body_template.render(context)

    to_email = ["rsar@loc.gov"]
    if settings.DEFAULT_TO_EMAIL:
        to_email.append(settings.DEFAULT_TO_EMAIL)
    message = EmailMultiAlternatives(
        subject=context["title"],
        body=text_body_message,
        from_email=settings.DEFAULT_FROM_EMAIL,
        to=to_email,
        reply_to=[settings.DEFAULT_FROM_EMAIL],
    )
    message.attach_alternative(html_body_message, "text/html")
    message.send()


================================================
FILE: concordia/tasks/useractivity.py
================================================
from logging import getLogger
from typing import Iterable

from django.conf import settings
from django.contrib.auth.models import User
from django.core.cache import cache
from django.core.mail import send_mail
from django.db.models import Q

from concordia.decorators import locked_task
from concordia.exceptions import CacheLockedError
from concordia.logging import ConcordiaLogger
from concordia.models import (
    Asset,
    Campaign,
    Tag,
    Transcription,
    UserAssetTagCollection,
    UserProfileActivity,
    _update_useractivity_cache,
    update_userprofileactivity_table,
)
from concordia.utils import get_anonymous_user

from ..celery import app as celery_app

logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


def _populate_activity_table(campaigns: Iterable[Campaign]) -> None:
    """
    Create UserProfileActivity rows for each of the given campaigns.

    Per campaign, the users referenced as ``user`` or ``reviewed_by`` on its
    transcriptions (other than the anonymous user) each get a new row holding
    their asset, tag, transcription and review counts; these rows are written
    with a single ``bulk_create``. The anonymous user's row is obtained with
    ``get_or_create`` and then overwritten with the same four counts.

    Args:
        campaigns: Iterable of Campaign instances to process.
    """
    anonymous_user = get_anonymous_user()
    for campaign in campaigns:
        # Base querysets scoped to this campaign
        campaign_transcriptions = Transcription.objects.filter(
            asset__item__project__campaign=campaign
        )
        campaign_assets = Asset.objects.filter(item__project__campaign=campaign)
        campaign_tag_collections = UserAssetTagCollection.objects.filter(
            asset__item__project__campaign=campaign
        )

        reviewer_ids = (
            campaign_transcriptions.exclude(reviewed_by=anonymous_user)
            .values_list("reviewed_by", flat=True)
            .distinct()
        )
        transcriber_ids = (
            campaign_transcriptions.exclude(user=anonymous_user)
            .values_list("user", flat=True)
            .distinct()
        )
        # De-duplicate users who both transcribed and reviewed
        user_ids = list({*reviewer_ids, *transcriber_ids})

        new_rows = []
        for user in User.objects.filter(id__in=user_ids):
            involvement = Q(transcription__reviewed_by=user) | Q(
                transcription__user=user
            )
            user_tags = Tag.objects.filter(
                userassettagcollection__in=campaign_tag_collections.filter(user=user)
            )
            new_rows.append(
                UserProfileActivity(
                    user=user,
                    campaign=campaign,
                    asset_count=campaign_assets.filter(involvement).distinct().count(),
                    asset_tag_count=user_tags.distinct().count(),
                    transcribe_count=campaign_transcriptions.filter(user=user)
                    .distinct()
                    .count(),
                    review_count=campaign_transcriptions.filter(reviewed_by=user)
                    .distinct()
                    .count(),
                )
            )
        UserProfileActivity.objects.bulk_create(new_rows)

        # The anonymous user's row is fetched or created, then refreshed
        anonymous_involvement = Q(transcription__reviewed_by=anonymous_user) | Q(
            transcription__user=anonymous_user
        )
        anonymous_row, _created = UserProfileActivity.objects.get_or_create(
            user=anonymous_user,
            campaign=campaign,
        )
        anonymous_row.asset_count = (
            campaign_assets.filter(anonymous_involvement).distinct().count()
        )
        anonymous_tags = Tag.objects.filter(
            userassettagcollection__in=campaign_tag_collections.filter(
                user=anonymous_user
            )
        )
        anonymous_row.asset_tag_count = anonymous_tags.distinct().count()
        anonymous_row.transcribe_count = (
            campaign_transcriptions.filter(user=anonymous_user).distinct().count()
        )
        anonymous_row.review_count = (
            campaign_transcriptions.filter(reviewed_by=anonymous_user)
            .distinct()
            .count()
        )
        anonymous_row.save()


@celery_app.task
def populate_completed_campaign_counts() -> None:
    """
    Build UserProfileActivity rows for every campaign that is not active.

    All campaigns whose status is anything other than ACTIVE are handed to
    ``_populate_activity_table``.
    """
    # Intended as a one-off: run it once after the UserProfileActivity table
    # has first been created. It covers campaigns that are completed or have
    # status == RETIRED (but have not yet actually been retired).
    # The original author reported a runtime of ~10 minutes in a local env.
    _populate_activity_table(Campaign.objects.exclude(status=Campaign.Status.ACTIVE))


@celery_app.task
def populate_active_campaign_counts() -> None:
    """
    Build UserProfileActivity rows for every active campaign.

    All campaigns whose status is ACTIVE are handed to
    ``_populate_activity_table``.
    """
    _populate_activity_table(Campaign.objects.filter(status=Campaign.Status.ACTIVE))


@celery_app.task(
    bind=True,
    autoretry_for=(Exception,),
    retry_backoff=5,
    retry_kwargs={"max_retries": 5, "countdown": 5},
)
def update_useractivity_cache(
    self,
    user_id: int,
    campaign_id: int,
    attr_name: str,
    *args,
    **kwargs,
) -> None:
    """
    Update cached user activity counts for a single metric.

    This Celery task takes a cache based lock (``cache.add`` with a ten
    second timeout) so only one update runs at a time. While holding the lock
    it calls ``_update_useractivity_cache`` and logs a completion event; the
    lock is always released afterwards. Any exception is re-raised so that
    Celery's ``autoretry_for`` handling can retry the task. Once
    ``self.request.retries`` has reached ``self.max_retries`` the failure is
    also logged and emailed to ``settings.CONCORDIA_DEVS``, and the report
    states whether the lock or the update itself failed.

    Args:
        user_id: Primary key of the user to update.
        campaign_id: Primary key of the campaign whose cache is updated.
        attr_name: Name of the activity attribute being incremented,
            for example ``"transcribe_count"`` or ``"review_count"``.

    Raises:
        CacheLockedError: If the cache lock cannot be acquired.
        Exception: Anything raised by ``_update_useractivity_cache``.
    """
    structured_logger.info(
        "Running update_useractivity_cache task",
        event_code="useractivity_cache_task_start",
        user_id=user_id,
        campaign_id=campaign_id,
        activity_type=attr_name,
        attempt=self.request.retries + 1,
    )
    lock_key = "userprofileactivity_cache_lock"
    try:
        # attempt to acquire
        if not cache.add(lock_key, "locked", timeout=10):
            raise CacheLockedError(f"Could not acquire lock for {lock_key}")

        try:
            _update_useractivity_cache(user_id, campaign_id, attr_name)
            structured_logger.info(
                "Successfully updated user activity cache",
                event_code="useractivity_cache_task_complete",
                user_id=user_id,
                campaign_id=campaign_id,
                activity_type=attr_name,
            )
        finally:
            # release
            cache.delete(lock_key)

    except Exception as e:
        # NOTE(review): the decorator passes max_retries only through
        # retry_kwargs; confirm self.max_retries matches that limit, otherwise
        # this branch can run on attempts that will still be retried.
        if self.request.retries >= self.max_retries:
            # Only blame the lock when the lock was actually the problem;
            # errors raised by the update itself are reported as such.
            if isinstance(e, CacheLockedError):
                structured_logger.warning(
                    "Could not acquire cache lock",
                    event_code="useractivity_cache_lock_failed",
                    reason="Another task is holding the lock",
                    reason_code="lock_unavailable",
                    user_id=user_id,
                    campaign_id=campaign_id,
                    activity_type=attr_name,
                )
                failure_reason = "Max retries reached while trying to acquire lock."
                subject = "Task update_useractivity_cache failed: cache is locked."
            else:
                failure_reason = "Max retries reached while updating the cache."
                subject = "Task update_useractivity_cache failed."
            structured_logger.exception(
                "Failed to update user activity cache after retries.",
                event_code="useractivity_cache_task_failed",
                reason=failure_reason,
                reason_code="max_retries_exceeded",
                user_id=user_id,
                campaign_id=campaign_id,
                activity_type=attr_name,
            )
            message_body = """%s
                            user: %s
                            campaign: %s
                            attribute: %s
                          """ % (
                e,
                user_id,
                campaign_id,
                attr_name,
            )
            logger.error("%s %s Retrying...", subject, message_body)
            send_mail(
                subject,
                message_body,
                settings.DEFAULT_FROM_EMAIL,
                settings.CONCORDIA_DEVS,
            )
        # Let celery handle retries; a bare raise keeps the original traceback
        raise


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def update_userprofileactivity_from_cache(self) -> None:
    """
    Flush per campaign activity deltas from cache to the database.

    This task is wrapped by the ``locked_task`` decorator. For each campaign
    it reads the cached payload stored under ``userprofileactivity_<pk>``,
    deletes that cache entry and then, for every user id in the payload,
    passes element ``0`` to ``update_userprofileactivity_table`` as
    ``"transcribe_count"`` and element ``1`` as ``"review_count"``.

    A cached user id that no longer matches a ``User`` row is logged and
    skipped so the remaining users in the payload are still written; the
    cache entry has already been deleted by then, so aborting would discard
    their counts.
    """
    structured_logger.info(
        "Starting update_userprofileactivity_from_cache task",
        event_code="starting_update_userprofileactivity_from_cache_task",
    )
    for campaign in Campaign.objects.all():
        key = f"userprofileactivity_{campaign.pk}"
        structured_logger.debug(
            "Read key",
            event_code="update_userprofileactivity_from_cache_key_read",
            key=key,
        )
        updates_by_user = cache.get(key)
        if updates_by_user is None:
            structured_logger.debug(
                "Cache contained no updates for key. Skipping",
                event_code="update_userprofileactivity_from_cache_no_updates",
                key=key,
            )
            continue

        cache.delete(key)
        for user_id in updates_by_user:
            try:
                user = User.objects.get(id=user_id)
            except User.DoesNotExist:
                structured_logger.warning(
                    "Skipping cached activity counts for missing user",
                    event_code="update_userprofileactivity_from_cache_user_missing",
                    reason="No user exists for the cached user id",
                    reason_code="user_not_found",
                    user_id=user_id,
                    key=key,
                )
                continue
            user_updates = updates_by_user[user_id]
            update_userprofileactivity_table(
                user,
                campaign.id,
                "transcribe_count",
                user_updates[0],
            )
            update_userprofileactivity_table(
                user,
                campaign.id,
                "review_count",
                user_updates[1],
            )
            structured_logger.debug(
                "Updated activity counts for user",
                event_code=("update_userprofileactivity_from_cache_database_write"),
                user=user_id,
            )


================================================
FILE: concordia/tasks/visualizations.py
================================================
import csv
from datetime import timedelta
from io import StringIO
from logging import getLogger

from django.core.cache import caches
from django.core.files.base import ContentFile
from django.db.models import Count
from django.utils import timezone

from concordia.decorators import locked_task
from concordia.logging import ConcordiaLogger
from concordia.models import Asset, Campaign, SiteReport, TranscriptionStatus
from concordia.storage import VISUALIZATION_STORAGE

from ..celery import app as celery_app

logger = getLogger(__name__)
structured_logger = ConcordiaLogger.get_logger(__name__)


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def populate_asset_status_visualization_cache(self) -> None:
    """
    Refresh the cached asset status overview and its CSV export.

    Assets belonging to campaigns returned by
    ``Campaign.objects.published().listed().active()`` are counted per
    ``transcription_status``, in the order of ``TranscriptionStatus.CHOICES``.
    When the counts equal those already cached, nothing else happens.
    Otherwise a two column CSV (``Status``, ``Count``) is saved to
    ``VISUALIZATION_STORAGE`` and the ``"asset-status-overview"`` entry of the
    ``"visualization_cache"`` cache is replaced with a dict holding:

        - `status_labels`: labels from ``TranscriptionStatus.CHOICE_MAP``
        - `total_counts`: one count per label, same order
        - `csv_url`: URL of the CSV export

    If saving the CSV fails, the previously cached ``csv_url`` is reused; when
    there is no previous URL the exception is re-raised.
    """
    cache_key = "asset-status-overview"
    csv_path = "visualization_exports/page-status-active-campaigns.csv"
    visualization_cache = caches["visualization_cache"]

    structured_logger.debug(
        "Starting asset status visualization task.",
        event_code="asset_status_vis_start",
    )

    active_campaigns = Campaign.objects.published().listed().active()
    campaign_ids = list(active_campaigns.values_list("id", flat=True))

    status_keys = []
    status_labels = []
    for status_key, _unused in TranscriptionStatus.CHOICES:
        status_keys.append(status_key)
        status_labels.append(TranscriptionStatus.CHOICE_MAP[status_key])

    # One grouped query covering every active campaign
    grouped_rows = (
        Asset.objects.filter(campaign_id__in=campaign_ids)
        .values("transcription_status")
        .annotate(cnt=Count("id"))
    )
    counts_by_status = {}
    for grouped_row in grouped_rows:
        counts_by_status[grouped_row["transcription_status"]] = grouped_row["cnt"]
    # Statuses without any assets are reported as zero
    total_counts = [counts_by_status.get(status_key, 0) for status_key in status_keys]

    structured_logger.debug(
        "Aggregated asset counts by status.",
        event_code="asset_status_vis_counts",
        active_campaign_count=len(campaign_ids),
        total_counts=total_counts,
    )

    # Nothing to do when the cached counts already match
    cached_value = visualization_cache.get(cache_key)
    previous_payload = cached_value if isinstance(cached_value, dict) else None
    if (
        previous_payload is not None
        and previous_payload.get("total_counts") == total_counts
    ):
        structured_logger.info(
            "Asset status data unchanged; skipping CSV and cache update.",
            event_code="asset_status_vis_unchanged",
            total_counts=total_counts,
        )
        return

    # Keep the old URL around as a fallback should the upload fail
    if previous_payload is not None:
        overview_csv_url = previous_payload.get("csv_url")
    else:
        overview_csv_url = None

    csv_buffer = StringIO(newline="")
    csv_writer = csv.writer(csv_buffer)
    csv_writer.writerow(["Status", "Count"])
    csv_writer.writerows(
        [label, count] for label, count in zip(status_labels, total_counts, strict=True)
    )
    overview_csv_content = csv_buffer.getvalue()

    try:
        VISUALIZATION_STORAGE.save(csv_path, ContentFile(overview_csv_content))
        overview_csv_url = VISUALIZATION_STORAGE.url(csv_path)
        structured_logger.debug(
            "CSV saved for asset status visualization.",
            event_code="asset_status_vis_csv_saved",
            csv_path=csv_path,
            byte_length=len(overview_csv_content.encode("utf-8")),
            csv_url=overview_csv_url,
        )
    except Exception:
        if overview_csv_url is not None:
            # An earlier URL exists, so log the failure and carry on with it
            structured_logger.exception(
                "CSV upload failed for asset status visualization.",
                event_code="asset_status_vis_csv_error",
                csv_path=csv_path,
            )
        else:
            structured_logger.exception(
                (
                    "CSV upload failed for asset status visualization and "
                    "no existing CSV URL could be determined"
                ),
                event_code="asset_status_vis_csv_missing_url_error",
                csv_path=csv_path,
            )
            raise

    # Store the fresh payload; the timeout argument is None
    visualization_cache.set(
        cache_key,
        {
            "status_labels": status_labels,
            "total_counts": total_counts,
            "csv_url": overview_csv_url,
        },
        None,
    )

    structured_logger.debug(
        "Asset status visualization cache updated.",
        event_code="asset_status_vis_cache_set",
        cache_key=cache_key,
        total_counts=total_counts,
    )

    structured_logger.debug(
        "Asset status visualization task completed successfully.",
        event_code="asset_status_vis_complete",
    )


@celery_app.task(bind=True, ignore_result=True)
@locked_task
def populate_daily_activity_visualization_cache(self) -> None:
    """
    Build and cache a 28 day time series of transcription activity.

    This task queries ``SiteReport`` rows with
    ``report_name=SiteReport.ReportName.TOTAL`` for the last 28 days
    (excluding today) and derives per day counts of saved transcriptions and
    review actions. It writes a CSV export to ``VISUALIZATION_STORAGE`` and
    stores the following payload in the ``"visualization_cache"`` under the
    ``"daily-transcription-activity-last-28-days"`` key.

    The dataset contains:

        - `labels`: [ "YYYY-MM-DD", ..., ] (28 dates)
        - `transcription_datasets`: [
              {
                  "label": "Transcriptions",
                  "data": [ daily_total, daily_total, ... ],
              },
              {
                  "label": "Reviews",
                  "data": [ daily_total, daily_total, ... ],
              },
          ]
        - `csv_url`: URL to download a CSV of the data

    Daily transcription counts are the difference between consecutive
    cumulative ``transcriptions_saved`` values, clamped at zero. Days with no
    report contribute zero for both series and do not move the baseline.

    The CSV and cache are left untouched when the cached payload already
    holds the same labels and the same two series.

    Returns:
        None. Results are written to storage and to the cache.

    Raises:
        Exception: Re-raised from the storage backend when the CSV upload
            fails and no previously cached ``csv_url`` is available. When a
            previous URL exists the failure is logged and the cache is still
            updated using that URL.
    """
    visualization_cache = caches["visualization_cache"]
    cache_key = "daily-transcription-activity-last-28-days"
    csv_path = "visualization_exports/daily-transcription-activity-last-28-days.csv"

    structured_logger.debug(
        "Starting daily activity visualization task.",
        event_code="daily_activity_vis_start",
    )

    yesterday = timezone.localdate() - timedelta(days=1)
    start_date = yesterday - timedelta(days=27)
    date_range = [start_date + timedelta(days=i) for i in range(28)]
    date_strings = [d.strftime("%Y-%m-%d") for d in date_range]

    reports = SiteReport.objects.filter(
        report_name=SiteReport.ReportName.TOTAL,
        created_on__date__in=date_range,
    )

    # Index the window's reports by their local calendar date
    report_lookup = {
        timezone.localtime(report.created_on).date(): report for report in reports
    }

    # Find the most recent SiteReport BEFORE the first of our dates, if any
    prev_report = (
        SiteReport.objects.filter(
            report_name=SiteReport.ReportName.TOTAL,
            created_on__date__lt=start_date,
        )
        .order_by("-created_on")
        .first()
    )
    # The loop below already treats transcriptions_saved as possibly None, so
    # apply the same guard to the baseline; otherwise the first subtraction
    # would raise TypeError.
    running_prev = (prev_report.transcriptions_saved or 0) if prev_report else 0

    transcriptions = []
    reviews = []

    for report_date in date_range:
        sitereport = report_lookup.get(report_date)
        if sitereport:
            cumulative = sitereport.transcriptions_saved or 0
            # A cumulative total lower than the baseline is reported as zero
            # activity rather than a negative count.
            daily_saved = max(cumulative - running_prev, 0)
            running_prev = cumulative
            daily_review = sitereport.daily_review_actions or 0
        else:
            daily_saved = 0
            daily_review = 0

        transcriptions.append(daily_saved)
        reviews.append(daily_review)

    structured_logger.debug(
        "Compiled daily activity series.",
        event_code="daily_activity_vis_series_compiled",
        start_date=start_date.isoformat(),
        end_date=yesterday.isoformat(),
        transcriptions_total=sum(transcriptions),
        reviews_total=sum(reviews),
    )

    # If data unchanged, skip CSV + cache update
    existing = visualization_cache.get(cache_key)
    csv_url = None
    if isinstance(existing, dict):
        prev_series = existing.get("transcription_datasets") or []
        prev_transcriptions = next(
            (
                ds.get("data")
                for ds in prev_series
                if ds.get("label") == "Transcriptions"
            ),
            None,
        )
        prev_reviews = next(
            (ds.get("data") for ds in prev_series if ds.get("label") == "Reviews"),
            None,
        )
        # The window slides every day, so identical values under different
        # dates are NOT the same dataset; the labels must match as well or the
        # cached labels and CSV would go stale.
        if (
            existing.get("labels") == date_strings
            and prev_transcriptions == transcriptions
            and prev_reviews == reviews
        ):
            structured_logger.info(
                "Daily activity data unchanged; skipping CSV and cache update.",
                event_code="daily_activity_vis_unchanged",
            )
            return
        # Keep the previous URL as a fallback in case the upload below fails
        csv_url = existing.get("csv_url")

    data = {
        "labels": date_strings,
        "transcription_datasets": [
            {"label": "Transcriptions", "data": transcriptions},
            {"label": "Reviews", "data": reviews},
        ],
    }

    csv_output = StringIO(newline="")
    writer = csv.writer(csv_output)
    writer.writerow(["Date", "Transcriptions", "Reviews"])
    writer.writerows(zip(date_strings, transcriptions, reviews, strict=True))
    csv_content = csv_output.getvalue()

    try:
        VISUALIZATION_STORAGE.save(csv_path, ContentFile(csv_content))
        csv_url = VISUALIZATION_STORAGE.url(csv_path)
        structured_logger.debug(
            "CSV saved for daily activity visualization.",
            event_code="daily_activity_vis_csv_saved",
            csv_path=csv_path,
            byte_length=len(csv_content.encode("utf-8")),
            csv_url=csv_url,
        )
    except Exception:
        if csv_url is None:
            # No earlier URL to fall back on, so the payload would be unusable
            structured_logger.exception(
                (
                    "CSV upload failed for daily activity visualization and "
                    "no existing CSV URL could be determined"
                ),
                event_code="daily_activity_vis_csv_missing_url_error",
                csv_path=csv_path,
            )
            raise
        structured_logger.exception(
            "CSV upload failed for daily activity visualization.",
            event_code="daily_activity_vis_csv_error",
            csv_path=csv_path,
        )

    data["csv_url"] = csv_url
    visualization_cache.set(cache_key, data, None)

    structured_logger.debug(
        "Daily activity visualization cache updated.",
        event_code="daily_activity_vis_cache_set",
        cache_key=cache_key,
    )

    structured_logger.debug(
        "Daily activity visualization task completed successfully.",
        event_code="daily_activity_vis_complete",
    )


================================================
FILE: concordia/templates/404.html
================================================
{% extends "error.html" %}

{# HTTP 404 page: overrides the full_title and error_message blocks of error.html. #}

{% block full_title %}404 Error{% endblock full_title %}

{% block error_message %}
    <h1>HTTP 404 Error</h1>

    <p>
        The requested page was not found.
    </p>

    <nav>
        <ul class="nav justify-content-center">
            {# Only offer "Go Back" when a Referer header is present; otherwise the link would render with an empty href. #}
            {% if request and request.META.HTTP_REFERER %}
                <li class="nav-item">
                    <a class="nav-link" href="{{ request.META.HTTP_REFERER }}">
                        &laquo; Go Back
                    </a>
                </li>
            {% endif %}
            <li class="nav-item">
                <a class="nav-link" href="/">Go Home &raquo;</a>
            </li>
        </ul>
    </nav>
{% endblock error_message %}


================================================
FILE: concordia/templates/429.html
================================================
{% extends "error.html" %}

{# HTTP 429 page: overrides the full_title and error_message blocks of error.html. #}

{% block full_title %}429 Error{% endblock full_title %}

{% block error_message %}
    <h1>HTTP 429: Too Many Requests</h1>

    <p>
        {# Prefer the exception text when one is in the context; otherwise show `error`, falling back to a generic message. #}
        {% if exception %}
            {{ exception }}
        {% else %}
            {{ error|default:'Please wait a bit, then try again.' }}
        {% endif %}

    </p>
    <p>
        Seeing this page a lot? <a href="{% url 'contact' %}">Contact Us</a>
    </p>
{% endblock error_message %}


================================================
FILE: concordia/templates/500.html
================================================
{% extends "error.html" %}

{# HTTP 500 page: overrides the full_title and error_message blocks of error.html. #}

{% block full_title %}500 Error{% endblock full_title %}

{% block error_message %}
    <h1>HTTP 500 Error</h1>
    <p>
        The server encountered an unexpected condition which prevented
        it from fulfilling the request. Our staff have been notified
        about the failure.
    </p>
    <nav>
        <ul class="nav justify-content-center">
            {# The request may be absent from the context, and even when present it may carry no Referer; require both so the link never has an empty href. #}
            {% if request and request.META.HTTP_REFERER %}
                <li class="nav-item">
                    <a
                        class="nav-link"
                        href="{{ request.META.HTTP_REFERER }}"
                    >
                        &laquo; Go Back
                    </a>
                </li>
            {% endif %}
            <li class="nav-item">
                <a class="nav-link" href="/">Go Home &raquo;</a>
            </li>
        </ul>
    </nav>
{% endblock error_message %}


================================================
FILE: concordia/templates/503.html
================================================
{% extends "error.html" %}

{% load staticfiles %}

{# HTTP 503 page: overrides the full_title and error_message blocks of error.html. #}

{% block full_title %}503 Error{% endblock full_title %}

{% block error_message %}
    <h1>We're experiencing technical difficulties.</h1>
    <p>
        But we're working on it and we should be back soon. Please try again later.
    </p>
    <figure class="error-figure">
        {# The alt text gives assistive technology a short description; the full citation is in the figcaption. #}
        <img src="{% static 'img/503.jpg' %}" alt="A woman operating a hand drill while working on a dive bomber" />
        <figcaption>
            <strong>Operating a hand drill at Vultee-Nashville, woman is working on a "Vengeance" dive bomber, Tennessee, February 1943.</strong><br />
            Palmer, Alfred T., photographer. <a target="_blank" href="http://hdl.loc.gov/loc.pnp/fsac.1a35371" rel="noopener">http://hdl.loc.gov/loc.pnp/fsac.1a35371</a></figcaption>
    </figure>

    <nav>
        <ul class="nav justify-content-center">
            {# Only offer "Go Back" when a Referer header is available to link to. #}
            {% if request and request.META.HTTP_REFERER %}
                <li class="nav-item">
                    <a
                        class="nav-link"
                        href="{{ request.META.HTTP_REFERER }}"
                    >
                        &laquo; Go Back
                    </a>
                </li>
            {% endif %}
            <li class="nav-item">
                <a class="nav-link" href="/">Go Home &raquo;</a>
            </li>
        </ul>
    </nav>
{% endblock error_message %}


================================================
FILE: concordia/templates/account/account_deletion.html
================================================
{% extends "base.html" %}

{% load django_bootstrap5 %}

{# Account deletion confirmation page: shows a warning and a form that POSTs to the account-deletion URL. #}

{% block main_content %}
    <div class="container">
        {# Tab bar whose entries are plain links to the user-profile page; "Account Settings" is the one marked active here. #}
        <ul class="nav nav-tabs mb-4" id="nav-tab" role="tablist">
            <li class="nav-item">
                <a class="nav-link fw-bold" aria-selected="false" id="contributions-tab" type="button" role="tab" href="{% url 'user-profile' %}">My Contributions</a>
            </li>
            <li class="nav-item">
                <a class="nav-link fw-bold" aria-selected="false" id="recent-tab" type="button" role="tab" aria-controls="recent" href="{% url 'user-profile' %}#recent">Recent Pages Worked On</a>
            </li>
            <li class="nav-item">
                <a class="nav-link fw-bold active" aria-selected="true" id="account-tab" type="button" role="tab" href="{% url 'user-profile' %}#account">Account Settings</a>
            </li>
        </ul>
        {# NOTE(review): this row is empty in the template; presumably a spacer or leftover placeholder - confirm before removing. #}
        <div class="row">
            <div class="col-md-8 mx-auto p-3">


            </div>
        </div>
        <div class="col-12 col-md-10 py-3 mt-4 change-options">
            <div class="d-flex">
                <h2>Delete your account?</h2>
            </div>
            <div class="d-flex">
                <p>By clicking the button below, all of your account information will be permanently removed from our system. This cannot be undone!</p>
            </div>
            {# The submit button is named submit_delete; the form carries the CSRF token required for POST. #}
            <form class="form" action="{% url 'account-deletion' %}" method="POST" enctype="multipart/form-data">
                {% csrf_token %}
                <div class="input-group-append">
                    {% bootstrap_button "Delete Account" button_type="submit" button_class="btn btn-primary rounded-0" name="submit_delete" %}
                </div>
            </form>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/account/email_reconfirmation_failed.html
================================================
{% extends "base.html" %}

{# Shown when email reconfirmation fails: renders reconfirmation_error.message and a link back to the profile. #}

{% block main_content %}
    <div class="container">
        {# Tab bar whose entries are plain links to the user-profile page; "Account Settings" is the one marked active here. #}
        <ul class="nav nav-tabs mb-4" id="nav-tab" role="tablist">
            <li class="nav-item">
                <a class="nav-link fw-bold" aria-selected="false" id="contributions-tab" type="button" role="tab" href="{% url 'user-profile' %}">My Contributions</a>
            </li>
            <li class="nav-item">
                <a class="nav-link fw-bold" aria-selected="false" id="recent-tab" type="button" role="tab" aria-controls="recent" href="{% url 'user-profile' %}#recent">Recent Pages Worked On</a>
            </li>
            <li class="nav-item">
                <a class="nav-link fw-bold active" aria-selected="true" id="account-tab" type="button" role="tab" href="{% url 'user-profile' %}#account">Account Settings</a>
            </li>
        </ul>
        <div class="row">
            <div class="col-md-8 mx-auto p-3">
                <h2>Email Reconfirmation</h2>
                {# The error code is appended to the CSS class name so each failure type gets its own class. #}
                <p class="reconfirmation-error-{{ reconfirmation_error.code }}">
                    {{ reconfirmation_error.message }}
                </p>
                <p><a href="{% url 'user-profile' %}">&#8810; Return to User Profile</a></p>
            </div>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/account/profile.html
================================================
{% extends "base.html" %}

{# User profile page with three tabs: contributions, recent pages and account settings. #}

{% load humanize %}
{% load staticfiles django_vite %}
{% load django_bootstrap5 %}

{# Stylesheet for the Duet date picker (v1.4.0), loaded from the jsDelivr CDN; the matching scripts are in body_scripts. #}
{% block prefetch %}
    <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/@duetds/date-picker@1.4.0/dist/duet/themes/default.css" />
{% endblock prefetch %}

{% block title %}User Profile{% endblock title %}

{% block breadcrumbs %}
    <li class="breadcrumb-item active" aria-current="page">Account</li>
{% endblock breadcrumbs %}

{% block main_content %}
    {# The active tab name is exposed as data-active-tab on the container and also drives the active/show classes below. #}
    <div class="container bg-main profile-page" data-active-tab="{{ active_tab }}">
        <ul class="nav nav-tabs mb-4" id="nav-tab" role="tablist">
            {# Each tab closes its class attribute outside the conditional so the markup is well-formed whether or not the tab is active. #}
            <li class="nav-item">
                <a class="nav-link fw-bold{% if active_tab == 'contributions' %} active{% endif %}" aria-selected="{% if active_tab == 'contributions' %}true{% else %}false{% endif %}" id="contributions-tab" data-bs-toggle="tab" data-bs-target="#contributions" type="button" role="tab">My Contributions</a>
            </li>
            <li class="nav-item">
                <a class="nav-link fw-bold{% if active_tab == 'recent' %} active{% endif %}" aria-selected="{% if active_tab == 'recent' %}true{% else %}false{% endif %}" id="recent-tab" data-bs-toggle="tab" data-bs-target="#recent" type="button" role="tab" aria-controls="recent" href="#recent">Recent Pages Worked On</a>
            </li>
            <li class="nav-item">
                <a class="nav-link fw-bold{% if active_tab == 'account' %} active{% endif %}" aria-selected="{% if active_tab == 'account' %}true{% else %}false{% endif %}" id="account-tab" data-bs-toggle="tab" data-bs-target="#account" type="button" role="tab" href="#account">Account Settings</a>
            </li>
        </ul>
        <div class="tab-content" id="nav-tabContent">
            {# Account settings pane: username, email change, password change, name change and account deletion. #}
            <div class="tab-pane fade{% if active_tab == 'account' %} show active{% endif %}" id="account" role="tabpanel" aria-labelledby="account-tab">
                <div class="row justify-content-start">
                    <div class="col-12 col-md-10">
                        <h2>Account Settings</h2>
                        <div class="mb-2">
                            <span class="fw-bold">Username</span>: {{ user.username }}
                        </div>
                    </div>
                    <div class="col-12 col-md-10 py-3 change-options">
                        <div class="mt-1 mb-3">
                            <span class="fw-bold">Email address</span>: {{ user.email }}
                        </div>
                        {% if unconfirmed_email %}
                            <div class="mt-1 mb-3">
                                <span class="fw-bold">Unconfirmed email address</span>: {{ unconfirmed_email }}
                            </div>
                        {% endif %}
                        {# Email change form; the submit button is named submit_email. #}
                        <form class="form needs-validation" action="{% url 'user-profile' %}" method="POST" enctype="multipart/form-data" novalidate>
                            {% csrf_token %}

                            <div class="input-group mb-3 user-fields">
                                <label for="id_email"><span class="visually-hidden">Email</span></label>
                                <input type="email" name="email" placeholder="Change your email address" class="form-control fst-italic" title="" id="id_email" required>
                                <div class="input-group-append">
                                    {% bootstrap_button "Save Change" button_type="submit" button_class="btn btn-primary rounded-0" name="submit_email" %}
                                </div>
                                {# `valid` is three-state: True shows the success note, False forces the error visible, anything else leaves it hidden. #}
                                {% if valid is True %}
                                    <div class="mt-1 text-success w-100" id="validation-confirmation"><i class="fa fa-check-circle"></i> Email changed successfully; <strong>Check email to confirm address</strong></div>
                                {% else %}
                                    <div class="invalid-feedback" {% if valid is False %}style="display: block;" aria-hidden="false"{% endif %}>
                                        <i class="fa fa-exclamation-circle"></i> Error in email change
                                    </div>
                                {% endif %}
                            </div>
                        </form>
                    </div>
                    <div class="col-12 col-md-10 py-3 mt-4 change-options">
                        <div class="row justify-content-start">
                            <div class="btn-row col-md-10">
                                <a class="btn btn-primary rounded-0" href="{% url 'password_change' %}">Change Password</a>
                            </div>
                        </div>
                    </div>
                    <div class="col-12 col-md-10 py-3 mt-4 change-options">
                        <div class="mb-2">Optional: If you want a name to appear on your service letter, enter first and last name and click "Save". To remove name data click "Save" without entering any text.</div>
                        {# Name change form; the submit button is named submit_name. #}
                        <form class="form" action="{% url 'user-profile' %}" method="POST" enctype="multipart/form-data">
                            {% csrf_token %}
                            <div class="mb-3 user-fields">
                                <label class="d-flex mb-2">
                                    <span class="fw-bold">First Name</span>: {{ user.first_name }}
                                </label>
                                <input name="first_name" placeholder="Enter your first name" class="form-control fst-italic">
                                <label class="mt-2">
                                    <span class="fw-bold">Last Name</span>: {{ user.last_name }}
                                </label>
                                <input name="last_name" placeholder="Enter your last name" class="form-control fst-italic">
                            </div>
                            <div class="input-group-append">
                                {% bootstrap_button "Save Changes" button_type="submit" button_class="btn btn-primary rounded-0" name="submit_name" %}
                            </div>
                        </form>
                    </div>
                    <div class="col-12 col-md-10 py-3 mt-4 change-options">
                        <div class="row justify-content-start">
                            <div class="btn-row col-md-10">
                                <a class="btn btn-primary rounded-0" href="{% url 'account-deletion' %}">Delete Account</a>
                            </div>
                        </div>
                    </div>
                </div>
            </div>
            {# Contributions pane: summary figures, a per-campaign table and download links. Its body is rendered only when user_profile_activity is non-empty. #}
            <div class="row tab-pane fade{% if active_tab == 'contributions' %} show active{% endif %}" id="contributions" role="tabpanel" aria-labelledby="contributions-tab">
                {% if user_profile_activity %}
                    <div class="d-flex justify-content-start">
                        <div class="col-md">
                            <div class="d-flex">
                                <h2>My Contributions</h2>
                            </div>
                            <div>
                                <label><b>Account created: </b></label> {{ user.date_joined|date:"SHORT_DATE_FORMAT" }}
                            </div>
                            <div class="d-lg-flex" style="margin-right: -0.5rem; margin-left: -0.5rem;">
                                <div class="contribution-highlight">
                                    <div class="value">{{ user_profile_activity.count|intcomma }}</div>
                                    <p class="label">Campaigns</p>
                                    <p>Projects you've worked on</p>
                                </div>
                                <div class="contribution-highlight">
                                    <div class="value">{{ pages_worked_on|intcomma }}</div>
                                    <p class="label">Pages</p>
                                    <p>Pages you've worked on</p>
                                </div>
                                <div class="contribution-highlight">
                                    <div class="value">{{ totalCount|intcomma }}</div>
                                    <p class="label">Actions</p>
                                    <p>Your saves, submits, and reviews</p>
                                </div>
                            </div>
                            <div class="d-flex mt-4">
                                <table id="tblTranscription" class="table table-striped table-sm table-responsive-sm contribution-table">
                                    <thead class="border-y">
                                        <tr>
                                            <td></td>
                                            <th>Campaign</th>
                                            <th>
                                                <abbr title="Total number of times you saved or submitted a transcription" class="text-decoration-none">Saves &amp; Submits</abbr>
                                            </th>
                                            <th>
                                                <abbr title="Total number of times you reviewed a transcription" class="text-decoration-none">Reviews</abbr>
                                            </th>
                                            <th><abbr title="Total number of times you saved, submitted, or reviewed a transcription" class="text-decoration-none">Total Actions</abbr></th>
                                        </tr>
                                    </thead>
                                    <tbody>
                                        {# Totals row across all campaigns; it uses the id "-1" where the per-campaign rows use the campaign id. #}
                                        <tr>
                                            <td class="py-2"></td>
                                            <td class="campaign all-campaigns py-2" id="-1">
                                                <b><a href="{% url 'campaign-topic-list' %}">All Campaigns</a></b>
                                            </td>
                                            <td class="py-2"><b>{{ totalTranscriptions|intcomma }}</b></td>
                                            <td class="py-2"><b>{{ totalReviews|intcomma }}</b></td>
                                            <td class="py-2"><b>{{ totalCount|intcomma }}</b></td>
                                        </tr>
                                        {% for user_campaign in user_profile_activity %}
                                            <tr>
                                                <td></td>
                                                <td>
                                                    <a class="campaign py-2" id="{{ user_campaign.campaign.id }}" href="{% url 'transcriptions:campaign-detail' user_campaign.campaign.slug %}">
                                                        {{ user_campaign.campaign.title }}
                                                    </a>
                                                </td>
                                                <td class="py-2">{{ user_campaign.transcribe_count|intcomma }}</td>
                                                <td class="py-2">{{ user_campaign.review_count|intcomma }}</td>
                                                <td class="py-2">{{ user_campaign.total_actions|intcomma }}</td>
                                            </tr>
                                        {% endfor %}
                                    </tbody>
                                </table>
                            </div>
                            <div class="d-flex justify-content-start bg-light">
                                <div class="col-12 py-3">
                                    <h3>Service Letter</h3>
                                    <div class="mb-3">Download a letter verifying your volunteer contributions, including a list of your transcription and review activity over the past six months.</div>
                                    <div class="row justify-content-start">
                                        <div class="btn-row col-md-10">
                                            <a class="btn btn-primary rounded-0" href="/letter">Download Letter</a>
                                        </div>
                                    </div>
                                </div>
                            </div>
                            <div class="d-flex justify-content-start bg-light mt-4">
                                <div class="col-12 py-3">
                                    <h3>Volunteer Hours Spreadsheet</h3>
                                    <div class="mb-3">The <em>By the People</em> website doesn't track the number of hours you spend volunteering. Download a spreadsheet template that makes it easy to keep your own record.</div>
                                    <div class="row justify-content-start">
                                        <div class="btn-row col-md-10">
                                            <a class="btn btn-primary rounded-0" href="https://crowd-content.s3.amazonaws.com/cm-uploads/resources/2023/btp_volunteer_hours_log_sheet.xlsx">Download Spreadsheet</a>
                                        </div>
                                    </div>
                                </div>
                            </div>
                        </div>
                    </div>
                {% endif %}
            </div>

            {# Recent pages pane: rendered as an empty container in this template. #}
            <div class="tab-pane fade{% if active_tab == 'recent' %} show active{% endif %}" id="recent" role="tabpanel" aria-labelledby="recent-tab">
                <div class="row justify-content-start" id="recent-pages"></div>
            </div>
        </div>
    </div>
{% endblock main_content %}

{# Loads the Duet date picker (ES module build plus a nomodule fallback) before the parent block's scripts, then the profile bundle via Vite. #}
{% block body_scripts %}
    <script type="module" src="https://cdn.jsdelivr.net/npm/@duetds/date-picker@1.4.0/dist/duet/duet.esm.js"></script>
    <script nomodule src="https://cdn.jsdelivr.net/npm/@duetds/date-picker@1.4.0/dist/duet/duet.js"></script>
    {{ block.super }}
    {% vite_asset 'src/profile.js' %}
{% endblock body_scripts %}


================================================
FILE: concordia/templates/admin/auth/user/change_form.html
================================================
{% extends "admin/change_form.html" %}

{% load i18n admin_urls humanize %}

{# Adds two object-tool links to the user change form: the transcription changelist filtered by author and by reviewer. #}
{% block object-tools-items %}
    {# Links are shown only when `original` has a primary key. #}
    {% if original.pk %}
        <li>
            <a class="view-related-objects" href="{% url 'admin:concordia_transcription_changelist' %}?user__id__exact={{ original.pk }}">
                Transcriptions
            </a>
        </li>
        <li>
            <a class="view-related-objects" href="{% url 'admin:concordia_transcription_changelist' %}?reviewed_by__id__exact={{ original.pk }}">
                Reviews
            </a>
        </li>
    {% endif %}
    {{ block.super }}
{% endblock object-tools-items %}


================================================
FILE: concordia/templates/admin/base_site.html
================================================
{% extends "admin/base.html" %}

{# Admin base template: sets the title and branding, adds shared CSS and customizes how messages are rendered. #}

{% block title %}{{ title }} | {{ site_title|default:_('Django site admin') }}{% endblock %}

{% block branding %}
    <h1 id="site-name"><a href="{% url 'admin:index' %}">{{ site_header|default:_('Django administration') }}</a></h1>
{% endblock %}

{% block nav-global %}{% endblock %}

{% block extrahead %}
    <style>
        .view-parent-object::after {
            content: " ⤴️";
        }

        .view-related-objects::after {
            content: " 🔎";
        }
        .long-name-filter li {
            list-style-type: circle !important;
            list-style-position: inside !important;
        }
        .long-name-filter a {
            display: inline !important;
            margin-left: -0.5em;
        }
    </style>
{% endblock %}

{% block messages %}
    {% if messages %}
        <ul class="messagelist">
            {% for message in messages %}
                {# Remove mark-safe from tags since that's for controlling template behavior #}
                {% with message.tags|reject:"mark-safe"|join:" " as cleaned_tags %}
                    {# The closing bracket sits outside the conditional so the list item is well-formed even when no tags remain. #}
                    <li{% if cleaned_tags %} class="{{ cleaned_tags }}"{% endif %}>
                        {# NOTE(review): the filter above rejects "mark-safe" but this test looks for "marked-safe"; confirm which tag callers actually set. #}
                        {% if "marked-safe" in message.tags %}
                            {{ message|safe|capfirst }}
                        {% else %}
                            {{ message|capfirst }}
                        {% endif %}
                    </li>
                {% endwith %}
            {% endfor %}
        </ul>
    {% endif %}
{% endblock messages %}


================================================
FILE: concordia/templates/admin/bulk_change.html
================================================
{% extends "admin/base_site.html" %}

{# Admin page for bulk status changes from an uploaded spreadsheet: shows instructions, the upload form and any resulting messages. #}

{% block messages %}
    {% comment %} This is displayed elsewhere {% endcomment %}
{% endblock messages %}

{% block extrahead %}
    {{ block.super }}
    <style>
        .message-error, .message-warning {
            font-weight: bold;
        }

        .message-error {
            color: #dc3545;
        }

        .message-warning {
            color: #ffc107;
        }
    </style>
{% endblock %}

{% block content %}
    <div id="content" class="colM">
        <div>
            <ol>
                <li>The spreadsheet should be in xlsx (not xls or csv) format.</li>
                <li>The spreadsheet should have a header row. One of the column headers should be "asset__slug", and another should be "New Status".</li>
                <li>If the "user" column is set, that value will be used as the submitting user. Otherwise, the anonymous user will be used.</li>
            </ol>
            <form method="post" enctype="multipart/form-data">
                {% csrf_token %}
                {{ form.as_table }}
                <div class="submit-row">
                    <input type="submit" value="import!" class="default" />
                </div>
            </form>
        </div>

        {# Messages are listed here rather than in the messages block, which is emptied above. #}
        {% if messages %}
            <h4>Messages</h4>
            <ul>
                {% for message in messages %}
                    {# Errors and warnings get their own class; lower levels use only the base "message" class. #}
                    <li class="message {% if message.level >= DEFAULT_MESSAGE_LEVELS.ERROR %}message-error{% elif message.level >= DEFAULT_MESSAGE_LEVELS.WARNING %}message-warning{% endif %}">{{ message }}</li>
                {% endfor %}
            </ul>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/admin/bulk_import.html
================================================
{% extends "admin/base.html" %}

{% block messages %}
    {% comment %} Intentionally empty: messages are listed at the end of this template's content block instead. {% endcomment %}
{% endblock messages %}

{% block extrahead %}
    {{ block.super }}
    <style>
        /* Emphasis for the message list rendered in the content block. */
        .message-error {
            color: #dc3545;
            font-weight: bold;
        }

        .message-warning {
            color: #ffc107;
            font-weight: bold;
        }
    </style>
{% endblock extrahead %}

{% block content %}
    <div id="content-main">
        {% if import_jobs %}
            {# When import_jobs is set, list each job with a link to its admin change page. #}
            <h2>Import Tasks</h2>
            <ul>
                {% for import_job in import_jobs %}
                    <li>
                        <a target="_blank" rel="noopener" href="{% url 'admin:importer_importjob_change' object_id=import_job.pk %}">{{ import_job }}</a>
                    </li>
                {% endfor %}
            </ul>
        {% else %}
            {# Otherwise show the spreadsheet conventions and the upload form. #}
            {# The list is a sibling of the paragraph because <ol> is not permitted inside <p>. #}
            <p>The spreadsheet must follow this convention:</p>
            <ol>
                <li>A header row must include the columns Campaign, Campaign Short Description, Campaign Long Description, Campaign Slug, Project Slug, Project, Project Description, and Import URLs</li>
                <li>The header names are case sensitive but may occur in any order and other columns will be ignored</li>
                <li>Project titles (in the Project column) must be 80 characters or less.</li>
                <li>The Campaign, Project, and Import URLs columns must have values or the row will be skipped</li>
                <li>
                    The Import URLs column may contain one or more URLs
                    separated by spaces or newlines. Do not include commas or
                    semicolons as those are valid URL characters and will be
                    treated as part of the URL.
                </li>
                <li>
                    Campaigns and Projects will be created if they do not
                    exist but existing records will not be modified. If you
                    want to recreate them, delete the old records before
                    running the importer.
                </li>
                <li>
                    Items will be added to projects but items which have
                    already been imported into that project will be skipped.
                    (Unless the redownload option is checked below.)
                    This means that you can add multiple items to a project
                    both by having the “Import URLs” cell contain multiple
                    URLs or by duplicating the row with new “Import URLs”
                    values.
                </li>
            </ol>

            <div>
                {# multipart/form-data is required because the form uploads a file. #}
                <form method="post" enctype="multipart/form-data">
                    {% csrf_token %}
                    {{ form.as_p }}
                    <div class="submit-row">
                        <button type="submit">Import!</button>
                    </div>
                </form>
            </div>
        {% endif %}


        {# The messages block is overridden to be empty, so messages are listed here. #}
        {% if messages %}
            <h4>Messages</h4>
            <ul>
                {% for message in messages %}
                    <li class="message {% if message.level >= DEFAULT_MESSAGE_LEVELS.ERROR %}message-error{% elif message.level >= DEFAULT_MESSAGE_LEVELS.WARNING %}message-warning{% endif %}">{{ message }}</li>
                {% endfor %}
            </ul>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/admin/bulk_review.html
================================================
{% extends "admin/base.html" %}

{% block messages %}
    {% comment %} Intentionally empty: messages are listed at the end of this template's content block instead. {% endcomment %}
{% endblock messages %}

{% block extrahead %}
    {{ block.super }}
    <style>
        /* Emphasis for the message list rendered in the content block. */
        .message-error {
            color: #dc3545;
            font-weight: bold;
        }

        .message-warning {
            color: #ffc107;
            font-weight: bold;
        }
    </style>
{% endblock extrahead %}

{% block content %}
    <div id="content-main">
        {% if import_jobs %}
            {# When import_jobs is set, list each job with a link to its admin change page. #}
            <h2>Import Tasks</h2>
            <ul>
                {% for import_job in import_jobs %}
                    <li>
                        <a target="_blank" rel="noopener" href="{% url 'admin:importer_importjob_change' object_id=import_job.pk %}">{{ import_job }}</a>
                    </li>
                {% endfor %}
            </ul>
        {% else %}
            {# Otherwise show the spreadsheet conventions and the upload form. #}
            {# The list is a sibling of the paragraph because <ol> is not permitted inside <p>. #}
            <p>The spreadsheet must follow this convention:</p>
            <ol>
                <li>A header row must include the columns Campaign, Campaign Short Description, Campaign Long Description, Campaign Slug, Project Slug, Project, Project Description, and Import URLs</li>
                <li>The header names are case sensitive but may occur in any order and other columns will be ignored</li>
                <li>Project titles (in the Project column) must be 80 characters or less.</li>
                <li>The Campaign, Project, and Import URLs columns must have values or the row will be skipped</li>
                <li>
                    The Import URLs column may contain one or more URLs
                    separated by spaces or newlines. Do not include commas or
                    semicolons as those are valid URL characters and will be
                    treated as part of the URL.
                </li>
                <li>
                    Campaigns and Projects will be created if they do not
                    exist but existing records will not be modified. If you
                    want to recreate them, delete the old records before
                    running the importer.
                </li>
                <li>
                    Items will be added to projects but items which have
                    already been imported into that project will be skipped.
                    This means that you can add multiple items to a project
                    both by having the “Import URLs” cell contain multiple
                    URLs or by duplicating the row with new “Import URLs”
                    values.
                </li>
            </ol>

            <div>
                {# multipart/form-data is required because the form uploads a file. #}
                <form method="post" enctype="multipart/form-data">
                    {% csrf_token %}
                    {{ form.as_p }}
                    <div class="submit-row">
                        <button type="submit">Review!</button>
                    </div>
                </form>
            </div>
        {% endif %}


        {# The messages block is overridden to be empty, so messages are listed here. #}
        {% if messages %}
            <h4>Messages</h4>
            <ul>
                {% for message in messages %}
                    <li class="message {% if message.level >= DEFAULT_MESSAGE_LEVELS.ERROR %}message-error{% elif message.level >= DEFAULT_MESSAGE_LEVELS.WARNING %}message-warning{% endif %}">{{ message }}</li>
                {% endfor %}
            </ul>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/admin/celery_task.html
================================================
{% extends "admin/base.html" %}

{% block messages %}
    {% comment %} Intentionally empty: messages are listed at the end of this template's content block instead. {% endcomment %}
{% endblock messages %}

{% block extrahead %}
    {{ block.super }}
    <style>
        /* Emphasis for the message list rendered in the content block. */
        .message-error {
            color: #dc3545;
            font-weight: bold;
        }

        .message-warning {
            color: #ffc107;
            font-weight: bold;
        }
    </style>
{% endblock extrahead %}

{% block content %}
    <div id="content-main">
        {% if campaigns %}
            {# Campaign overview: each row links back to this page with ?id=<campaign id>. #}
            <h2>Importer Progress</h2>
            {# The table is a direct child of the container; a <ul> may only contain <li> elements. #}
            <table>
                <thead>
                    <tr>
                        <th>Campaign Title</th>
                        <th></th>
                    </tr>
                </thead>
                <tbody>
                    {% for campaign in campaigns %}
                        <tr>
                            <td>{{ campaign.title }}</td>
                            <td><a href="?id={{ campaign.id }}">Check Progress</a></td>
                        </tr>
                    {% endfor %}
                </tbody>
            </table>

        {% elif projects %}
            {# Per-project counts; the three count columns link to filtered import-asset admin lists. #}
            <span><a href="{% url 'admin:celery-review' %}">All Campaigns</a></span>
            <h2>Projects</h2>
            <table>
                <thead>
                    <tr>
                        <th>Project Title</th>
                        <th>Successful</th>
                        <th>Started-Incomplete</th>
                        <th>Started-Failed</th>
                        <th>Unstarted</th>
                    </tr>
                </thead>
                <tbody>
                    {# NOTE(review): the changelist path below is hard-coded; consider reversing it with the url tag once the admin URL name is confirmed. #}
                    {% for project in projects %}
                        <tr>
                            <td>{{ project.title }}</td>
                            <td>{{ project.successful }}</td>
                            <td><a href="/admin/importer/importitemasset/?completed=null&amp;import_item__job__project__campaign__id__exact={{ project.campaign_id }}&amp;import_item__job__project__in={{ project.id }}&amp;last_started=not-null">{{ project.incomplete }}</a></td>
                            <td><a href="/admin/importer/importitemasset/?failed=not-null&amp;import_item__job__project__campaign__id__exact={{ project.campaign_id }}&amp;import_item__job__project__in={{ project.id }}&amp;last_started=not-null">{{ project.failure }}</a></td>
                            <td><a href="/admin/importer/importitemasset/?import_item__job__project__campaign__id__exact={{ project.campaign_id }}&amp;import_item__job__project__in={{ project.id }}&amp;last_started=null">{{ project.unstarted }}</a></td>
                        </tr>
                    {% endfor %}
                </tbody>
            </table>

            <span>Total Assets: {{ totalassets }}</span>

        {% endif %}
        {# The messages block is overridden to be empty, so messages are listed here. #}
        {% if messages %}
            <h4>Messages</h4>
            <ul>
                {% for message in messages %}
                    <li
                        class="message {% if message.level >= DEFAULT_MESSAGE_LEVELS.ERROR %}message-error{% elif message.level >= DEFAULT_MESSAGE_LEVELS.WARNING %}message-warning{% endif %}">
                        {{ message }}</li>
                {% endfor %}
            </ul>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/admin/clear_cache.html
================================================
{% extends "admin/base.html" %}

{% block extrahead %}
    {{ block.super }}
    <style>
        /* Message emphasis styles. */
        /* NOTE(review): nothing in this template's content block uses these classes; confirm they are still needed. */
        .message-error {
            color: #dc3545;
            font-weight: bold;
        }

        .message-warning {
            color: #ffc107;
            font-weight: bold;
        }
    </style>
{% endblock extrahead %}

{% block content %}
    {# Warning shown twice (plain, then bold) above the cache-clearing form. #}
    <div id="content-main">
        <p>Don't do this if you don't know what you're doing.</p>
        <p>
            <strong>Don't do this if you don't know what you're doing.</strong>
        </p>
        <div>
            <form method="post">
                {% csrf_token %}
                {{ form.as_p }}
                <div class="submit-row">
                    <button type="submit">Clear Cache</button>
                </div>
            </form>
        </div>
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/admin/concordia/asset/change_form.html
================================================
{% extends "admin/change_form.html" %}

{% load i18n admin_urls humanize %}

{% block object-tools-items %}
    {# Extra toolbar links for a saved asset: its campaign, project, item, and transcriptions. #}
    {% if original.pk %}
        {% with item=original.item %}
            <li>
                <a href="{% url 'admin:concordia_campaign_change' item.project.campaign_id %}" class="view-parent-object">
                    Campaign
                </a>
            </li>
            <li>
                <a href="{% url 'admin:concordia_project_change' item.project_id %}" class="view-parent-object">
                    Project
                </a>
            </li>
        {% endwith %}
        <li>
            <a href="{% url 'admin:concordia_item_change' original.item_id %}" class="view-parent-object">
                Item
            </a>
        </li>
        <li>
            <a href="{% url 'admin:concordia_transcription_changelist' %}?asset__id__exact={{ original.pk }}" class="view-related-objects">
                Transcriptions
            </a>
        </li>
    {% endif %}
    {# The default object tools follow the custom links. #}
    {{ block.super }}
{% endblock object-tools-items %}

{% block content %}
    {# Status-change form and status headings are shown only when an existing asset is being edited. #}
    {% if original %}
        {# Posts to the asset changelist with this asset's PK as the single selected row. #}
        <form action="{% url 'admin:concordia_asset_changelist' %}" method="post" style="display:inline;">
            {% csrf_token %}

            {# Manually create the hidden PK field #}
            <input type="hidden" name="_selected_action" value="{{ original.pk }}">

            {# We use this to send the user back to this page instead of leaving them on the changelist #}
            <input type="hidden" name="next" value="{% url 'admin:concordia_asset_change' original.pk %}">

            {{ status_action_form.action }}
            <button type="submit" class="button">Change status</button>
        </form>

        {# Display label for the status field. #}
        <h4>Current status: {{ original.get_transcription_status_display }}</h4>
    {% endif %}

    {{ block.super }}

    {% if original %}
        {# Field value as stored, repeated below the standard change form. #}
        <h4>Current status: {{ original.transcription_status }}</h4>
    {% endif %}

    {% if transcriptions %}
        <table>
            <caption>Transcription History</caption>
            <thead>
                <tr>
                    <th>ID</th>
                    <th>Creator</th>
                    <th>Created</th>
                    <th>Updated</th>
                    <th>Submitted</th>
                    <th>Review Status</th>
                </tr>
            </thead>
            <tbody>
                {% for t in transcriptions %}
                    <tr>
                        {# The ID cell is the row header; every other cell is plain data. #}
                        <th><a href="{% url 'admin:concordia_transcription_change' t.id %}">{{ t.id }}</a></th>
                        <td>{{ t.user }}</td>
                        <td>{{ t.created_on|naturaltime }}</td>
                        <td>{{ t.updated_on|naturaltime }}</td>
                        <td>{{ t.submitted|naturaltime|default:'' }}</td>
                        <td>
                            {# Rendered as "<Rejected|Accepted> by <reviewer> <relative time>"; rejection takes precedence. #}
                            {% if t.rejected %}
                                Rejected
                            {% elif t.accepted %}
                                Accepted
                            {% endif %}
                            {% if t.rejected or t.accepted %}
                                by {{ t.reviewed_by }}
                            {% endif %}
                            {% if t.rejected %}
                                {{ t.rejected|naturaltime }}
                            {% elif t.accepted %}
                                {{ t.accepted|naturaltime }}
                            {% endif %}
                        </td>
                    </tr>
                {% endfor %}
            </tbody>
        </table>
    {% endif %}
{% endblock content %}


================================================
FILE: concordia/templates/admin/concordia/asset/change_list.html
================================================
{% extends "admin/change_list.html" %}

{% block result_list %}
    {% comment %}
        The pagination block is re-declared inside result_list, ahead of the
        default result list output.
        NOTE(review): this presumably makes the paginator render above the
        results as well as in its usual place in the parent template; confirm
        against the admin/change_list.html shipped with the Django version in use.
    {% endcomment %}
    {% block pagination %} {{ block.super }} {% endblock %}
    {{ block.super }}
{% endblock %}


================================================
FILE: concordia/templates/admin/concordia/campaign/change_form.html
================================================
{% extends "admin/change_form.html" %}

{% load i18n admin_urls static %}

{% block object-tools-items %}
    {# Extra toolbar links for a saved campaign: exports, report, retire, and related-object lists. #}
    {% if original.pk %}
        <li>
            <a class="viewsitelink" href="{% url 'admin:concordia_campaign_export-csv' original.slug %}">
                Export CSV
            </a>
        </li>
        <li>
            <a class="viewsitelink" href="{% url 'admin:concordia_campaign_export-bagit' original.slug %}">
                Export BagIt
            </a>
        </li>
        <li>
            <a class="viewsitelink" href="{% url 'admin:concordia_campaign_report' original.slug %}">
                Report
            </a>
        </li>
        {# Hide if campaign is active #}
        {% if perms.concordia.retire_campaign and original.status != 1 %}
            <li>
                <a class="viewsitelink" href="{% url 'admin:concordia_campaign_retire' original.slug %}">
                    Retire
                </a>
            </li>
        {% endif %}
        <li>
            <a href="{% url 'admin:concordia_project_changelist' %}?campaign__id__exact={{ original.pk }}" class="view-related-objects">
                Projects
            </a>
        </li>
        <li>
            <a href="{% url 'admin:concordia_item_changelist' %}?project__campaign__id__exact={{ original.pk }}" class="view-related-objects">
                Items
            </a>
        </li>
        <li>
            <a href="{% url 'admin:concordia_asset_changelist' %}?item__project__campaign__id__exact={{ original.pk }}" class="view-related-objects">
                Assets
            </a>
        </li>
    {% endif %}
    {# The default object tools follow the custom links. #}
    {{ block.super }}
{% endblock object-tools-items %}


================================================
FILE: concordia/templates/admin/concordia/campaign/retire.html
================================================
{% extends "admin/base_site.html" %}
{% load i18n admin_urls static %}

{% block extrahead %}
    {{ block.super }}
    {{ media }}
    {# NOTE(review): cancel.js presumably handles the .cancel-link button in the content block; confirm. #}
    <script async src="{% static 'admin/js/cancel.js' %}"></script>
{% endblock extrahead %}

{% block bodyclass %}{{ block.super }} app-{{ opts.app_label }} model-{{ opts.model_name }} delete-confirmation{% endblock bodyclass %}

{% block breadcrumbs %}
    {# Trail: Home › app › model changelist › this object › Retire #}
    <div class="breadcrumbs">
        <a href="{% url 'admin:index' %}">Home</a>
        &rsaquo;
        <a href="{% url 'admin:app_list' app_label=opts.app_label %}">{{ opts.app_config.verbose_name }}</a>
        &rsaquo;
        <a href="{% url opts|admin_urlname:'changelist' %}">{{ opts.verbose_name_plural|capfirst }}</a>
        &rsaquo;
        <a href="{% url opts|admin_urlname:'change' object.pk|admin_urlquote %}">{{ object|truncatewords:"18" }}</a>
        &rsaquo;
        Retire
    </div>
{% endblock breadcrumbs %}

{% block content %}
    {# Confirmation step: a summary of what will be deleted, then a POST form carrying post=yes. #}
    {% block delete_confirm %}
        <p>Are you sure you want to retire the {{ object_name }} "{{ object }}"? All of the following related items will be deleted:</p>
        {% include "admin/includes/object_delete_summary.html" %}
        <form method="post">
            {% csrf_token %}
            <div>
                <input name="post" type="hidden" value="yes">
                <input value="Yes, I’m sure" type="submit">
                <a class="button cancel-link" href="#">No, take me back</a>
            </div>
        </form>
    {% endblock delete_confirm %}
{% endblock content %}


================================================
FILE: concordia/templates/admin/concordia/item/change_form.html
================================================
{% extends "admin/change_form.html" %}

{% load i18n admin_urls static %}

{% block object-tools-items %}
    {# Extra toolbar links for a saved item: BagIt export, parent campaign and project, and its assets. #}
    {% if original.pk %}
        {% with project=original.project %}
            <li>
                <a class="viewsitelink" href="{% url 'transcriptions:item-export-bagit' project.campaign.slug project.slug original.item_id %}">
                    Export BagIt
                </a>
            </li>
            <li>
                <a href="{% url 'admin:concordia_campaign_change' project.campaign_id %}" class="view-parent-object">
                    Campaign
                </a>
            </li>
        {% endwith %}
        <li>
            <a href="{% url 'admin:concordia_project_change' original.project_id %}" class="view-parent-object">
                Project
            </a>
        </li>

        <li>
            <a href="{% url 'admin:concordia_asset_changelist' %}?item__id__exact={{ original.pk }}" class="view-related-objects">
                Assets
            </a>
        </li>

    {% endif %}
    {# The default object tools follow the custom links. #}
    {{ block.super }}
{% endblock object-tools-items %}


================================================
FILE: concordia/templates/admin/concordia/project/change_form.html
================================================
{% extends "admin/change_form.html" %}

{% load i18n admin_urls static %}

{% block object-tools-items %}
    {# Extra toolbar links for a saved project: exports, item import, parent campaign, and related-object lists. #}
    {% if original.pk %}
        {% with campaign_slug=original.campaign.slug %}
            <li>
                <a class="viewsitelink" href="{% url 'admin:concordia_project_export-csv' campaign_slug original.slug %}">
                    Export CSV
                </a>
            </li>
            <li>
                <a class="viewsitelink" href="{% url 'transcriptions:project-export-bagit' campaign_slug original.slug %}">
                    Export BagIt
                </a>
            </li>
        {% endwith %}
        <li>
            <a class="viewsitelink" href="{% url 'admin:concordia_project_item-import' original.pk %}">
                Import Items
            </a>
        </li>

        <li>
            <a href="{% url 'admin:concordia_campaign_change' original.campaign_id %}" class="view-parent-object">
                Campaign
            </a>
        </li>

        <li>
            <a href="{% url 'admin:concordia_item_changelist' %}?project__id__exact={{ original.pk }}" class="view-related-objects">
                Items
            </a>
        </li>

        <li>
            <a href="{% url 'admin:concordia_asset_changelist' %}?item__project__id__exact={{ original.pk }}" class="view-related-objects">
                Assets
            </a>
        </li>
    {% endif %}
    {# The default object tools follow the custom links. #}
    {{ block.super }}
{% endblock object-tools-items %}


================================================
FILE: concordia/templates/admin/concordia/project/item_import.html
================================================
{% extends "admin/change_form.html" %}

{% load i18n admin_urls %}


{% block content %}
    <div id="content-main">
        {% if import_job %}
            {# An import job exists: link to it and to the project's item and asset lists. #}
            <p>
                Task ID <a target="_blank" rel="noopener" href="{% url 'admin:importer_importjob_change' object_id=import_job.pk %}">{{ import_job }}</a>
                created to import <a target="_blank" rel="noopener" href="{{ form.cleaned_data.import_url }}">{{ form.cleaned_data.import_url }}</a>
            </p>
            {# Filter lookups match the ones used by the project change form's Items and Assets links. #}
            <ul>
                <li>
                    <a target="_blank" rel="noopener" href="{% url 'admin:concordia_item_changelist' %}?project__id__exact={{ object_id }}">
                        View Project Items
                    </a>
                </li>
                <li>
                    <a target="_blank" rel="noopener" href="{% url 'admin:concordia_asset_changelist' %}?item__project__id__exact={{ object_id }}">
                        View Project Assets
                    </a>
                </li>
            </ul>
        {% else %}
            {# No job yet: show the import-URL form. #}
            <form id="import-items" method="post">
                {% csrf_token %}

                <input type="hidden" name="project-id" value="{{ object_id }}">

                {{ form.non_field_errors }}

                {% if form.errors %}
                    <p>Please fix the errors below:</p>
                {% endif %}

                <div class="row">
                    <div class="fieldBox field-import_url">
                        <label for="{{ form.import_url.id_for_label }}">{{ form.import_url.label }}</label>
                        {{ form.import_url }}

                        <ul class="error">
                            {% for error in form.import_url.errors %}
                                <li>{{ error }}</li>
                            {% endfor %}
                        </ul>

                        {# Example URLs; clicking one copies it into the import URL field. #}
                        <ul>
                            <li onclick="document.getElementById('{{ form.import_url.id_for_label }}').value = 'https://www.loc.gov/item/mss859430231'">https://www.loc.gov/item/mss859430231</li>
                            <li onclick="document.getElementById('{{ form.import_url.id_for_label }}').value = 'https://www.loc.gov/collections/branch-rickey-papers/'">https://www.loc.gov/collections/branch-rickey-papers/</li>
                            <li onclick="document.getElementById('{{ form.import_url.id_for_label }}').value = 'https://www.loc.gov/search/?q=group%3Amal&amp;fa=online-format!%3Aonline+text'">https://www.loc.gov/search/?q=group%3Amal&amp;fa=online-format!%3Aonline+text</li>
                        </ul>
                    </div>
                </div>

                <div class="submit-row">
                    <input type="submit" value="Import" class="default">
                </div>
            </form>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/admin/concordia/simplepage/change_form.html
================================================
{% extends "admin/change_form.html" %}

{% block extrahead %}
    {{ block.super }}

    {# Pull the CodeMirror fragment into the page head. #}
    {% include "fragments/codemirror.html" %}
{% endblock extrahead %}

{% block content %}
    {# Pass-through: renders the parent template's content unchanged. #}
    {{ block.super }}
{% endblock content %}


================================================
FILE: concordia/templates/admin/concordia/transcription/change_form.html
================================================
{% extends "admin/change_form.html" %}

{% load i18n admin_urls humanize %}

{% block object-tools-items %}
    {# Extra toolbar links for a saved transcription: its parent objects and adjacent versions. #}
    {% if original.pk %}
        {% with asset=original.asset %}
            <li>
                <a href="{% url 'admin:concordia_campaign_change' asset.item.project.campaign_id %}" class="view-parent-object">
                    Campaign
                </a>
            </li>
            <li>
                <a href="{% url 'admin:concordia_project_change' asset.item.project_id %}" class="view-parent-object">
                    Project
                </a>
            </li>
            <li>
                <a href="{% url 'admin:concordia_item_change' asset.item_id %}" class="view-parent-object">
                    Item
                </a>
            </li>
            <li>
                <a href="{% url 'admin:concordia_asset_change' asset.pk %}" class="view-parent-object">
                    Asset
                </a>
            </li>
        {% endwith %}
        {# Link to the transcription this one supersedes, when there is one. #}
        {% if original.supersedes_id %}
            <li>
                <a href="{% url 'admin:concordia_transcription_change' original.supersedes_id %}" class="view-related-object">
                    Previous Version
                </a>
            </li>
        {% endif %}
        {# Link to the first transcription that supersedes this one, when there is one. #}
        {% with superseded_by=original.superseded_by.first %}
            {% if superseded_by %}
                <li>
                    <a href="{% url 'admin:concordia_transcription_change' superseded_by.pk %}" class="view-related-object">
                        Next Version
                    </a>
                </li>
            {% endif %}
        {% endwith %}
    {% endif %}
    {# The default object tools follow the custom links. #}
    {{ block.super }}
{% endblock object-tools-items %}


================================================
FILE: concordia/templates/admin/index.html
================================================
{% extends 'admin/index.html' %}

{% load static i18n %}

{% block sidebar %}
    {# Sidebar with three modules: site operations, the user's recent admin actions, and the application version. #}
    <div id="content-related">
        <div id="custom-actions" class="module">
            <h2>Site Operations</h2>
            <ul>
                <li><a href="{% url 'admin:bulk-import' %}">Bulk Import Items</a></li>
                <li><a href="{% url 'admin:celery-review' %}">Importer Progress</a></li>
                <li><a href="{% url 'admin:site-report' %}">Site Report</a></li>
                <li><a href="{% url 'admin:retired-site-report' %}">Retired Site Report</a></li>
                <li><a href="{% url 'admin:project-level-export' %}">Project Level Export</a></li>
                {# The remaining operations are shown to superusers only. #}
                {% if user.is_superuser %}
                    {# Each toggle links to the action that flips the current state. #}
                    {% if not maintenance_mode %}
                        <li><a href="{% url 'maintenance_mode_on' %}">Enable Maintenance Mode</a></li>
                    {% else %}
                        <li><a href="{% url 'maintenance_mode_off' %}">Disable Maintenance Mode</a></li>
                    {% endif %}
                    {% if not maintenance_mode_frontend_available %}
                        <li><a href="{% url 'maintenance_mode_frontend_available' %}">Enable Front-end During Maintenance Mode</a></li>
                    {% else %}
                        <li><a href="{% url 'maintenance_mode_frontend_unavailable' %}">Disable Front-end During Maintenance Mode</a></li>
                    {% endif %}
                    <li><a href="{% url 'admin:clear-cache' %}">Clear Caches</a></li>
                    <li><a href="{% url 'admin:bulk-change' %}">Bulk Change Status of Assets</a></li>
                {% endif %}
            </ul>
        </div>
        <div id="recent-actions-module" class="module">
            <h2>{% trans 'Recent actions' %}</h2>
            <h3>{% trans 'My actions' %}</h3>
            {% load log %}
            {# Up to 10 admin log entries for the current user. #}
            {% get_admin_log 10 as admin_log for_user user %}
            {% if admin_log %}
                <ul class="actionlist">
                    {% for entry in admin_log %}
                        <li class="{% if entry.is_addition %}addlink{% endif %}{% if entry.is_change %}changelink{% endif %}{% if entry.is_deletion %}deletelink{% endif %}">
                            {# Link to the object unless it was deleted or has no admin URL. #}
                            {% if not entry.is_deletion and entry.get_admin_url %}
                                <a href="{{ entry.get_admin_url }}">{{ entry.object_repr }}</a>
                            {% else %}
                                {{ entry.object_repr }}
                            {% endif %}
                            <br>
                            {% if entry.content_type %}
                                <span class="mini quiet">{% filter capfirst %}{{ entry.content_type }}{% endfilter %}</span>
                            {% else %}
                                <span class="mini quiet">{% trans 'Unknown content' %}</span>
                            {% endif %}
                        </li>
                    {% endfor %}
                </ul>
            {% else %}
                <p>{% trans 'None available' %}</p>
            {% endif %}
        </div>
        <div id="version-module" class="module">
            <h2>Application Version</h2>
            <p><small>{{ APPLICATION_VERSION }}</small></p>
        </div>
    </div>
{% endblock sidebar %}


================================================
FILE: concordia/templates/admin/long_name_filter.html
================================================
{% load i18n %}
{# Filter fragment: a "By <title>" heading followed by one link per choice; the selected choice gets class="selected". #}
<h3>{% blocktranslate with filter_title=title %} By {{ filter_title }} {% endblocktranslate %}</h3>
<ul class="long-name-filter">
    {% for choice in choices %}
        <li{% if choice.selected %} class="selected"{% endif %}>
            <a href="{{ choice.query_string|iriencode }}">{{ choice.display }}</a>
        </li>
    {% endfor %}
</ul>


================================================
FILE: concordia/templates/admin/process_bagit.html
================================================
{% extends "admin/base.html" %}

{% block messages %}
    {% comment %} Intentionally empty: messages are listed at the end of this template's content block instead. {% endcomment %}
{% endblock messages %}

{% block extrahead %}
    {{ block.super }}
    <style>
        .message-error, .message-warning {
            font-weight: bold;
        }

        .message-error {
            color: #dc3545;
        }

        .message-warning {
            color: #ffc107;
        }
    </style>
{% endblock %}

{% block content %}
    <div id="content-main">

        <p><strong>
            This feature will accept a zip file, process and convert to Loc.gov structure and re-zip it back
        </strong>
        </p>
        <div>
            <form method="post" enctype="multipart/form-data">
                {% csrf_token %}
                {{ form.as_p }}
                <div class="submit-row">
                    <button type="submit">Process Bagit</button>
                </div>
            </form>
        </div>


        {% if messages %}
            <h4>Messages</h4>
            <ul>
                {% for message in messages %}
                    <li class="message {% if message.level >= DEFAULT_MESSAGE_LEVELS.ERROR %}message-error{% elif message.level >= DEFAULT_MESSAGE_LEVELS.WARNING %}message-warning{% endif %}">{{ message }}</li>
                {% endfor %}
            </ul>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/admin/project_level_export.html
================================================
{% extends "admin/base.html" %}
{# Admin export page; messages are listed at the bottom of the content block rather than in the parent's messages block. #}

{% block messages %}
    {% comment %} Intentionally empty: messages are rendered at the bottom of the content block instead. {% endcomment %}
{% endblock messages %}

{% block extrahead %}
    {{ block.super }}
    <style>
        .message-error,
        .message-warning {
            font-weight: bold;
        }

        .message-error {
            color: #dc3545;
        }

        .message-warning {
            color: #ffc107;
        }
    </style>
{% endblock %}

{% block content %}
    {# Export picker: lists campaigns when `campaigns` is set; otherwise, when `projects` is set, shows a checkbox form for choosing projects to submit. #}
    <div id="content-main">
        {% if campaigns %}
            <h2>Campaigns</h2>
            {# The table is a direct child of the container (a <table> is not valid content for <ul>); "&amp;" keeps the query-string separator valid inside the href attribute. #}
            <table>
                <thead>
                    <tr>
                        <th>Campaign Title</th>
                        <th></th>
                    </tr>
                </thead>
                <tbody>
                    {% for campaign in campaigns %}
                        <tr>
                            <td>{{ campaign.title }}</td>
                            <td><a href="?id={{ campaign.id }}&amp;slug={{ campaign.slug }}">List Projects</a></td>
                        </tr>
                    {% endfor %}
                </tbody>
            </table>

        {% else %}

            {% if projects %}
                <span><a href="/admin/project-level-export">All Campaigns</a></span>
                <h2>Projects</h2>
                {# NOTE(review): the form id/class look copied from the registration form; kept unchanged in case scripts or styles target them. #}
                <form method="post" id="registration-form" class="form-register">
                    {% csrf_token %}
                    {# Header cells match the two cells rendered per row (checkbox, title). #}
                    <table>
                        <thead>
                            <tr>
                                <th></th>
                                <th>Project Title</th>
                            </tr>
                        </thead>
                        <tbody>
                            {% for project in projects %}
                                <tr>
                                    <td><input type="checkbox" id="{{project.id}}" name="project_name" value="{{project.id}}"></td>
                                    <td>{{ project.title }}</td>
                                </tr>
                            {% endfor %}
                        </tbody>
                    </table>
                    <input type="submit" value="Submit">
                </form>

            {% endif %}
        {% endif %}
        {# Messages at ERROR level or above get .message-error; otherwise those at WARNING level or above get .message-warning. #}
        {% if messages %}
            <h4>Messages</h4>
            <ul>
                {% for message in messages %}
                    <li
                        class="message {% if message.level >= DEFAULT_MESSAGE_LEVELS.ERROR %}message-error{% elif message.level >= DEFAULT_MESSAGE_LEVELS.WARNING %}message-warning{% endif %}">
                        {{ message }}</li>
                {% endfor %}
            </ul>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: concordia/templates/base.html
================================================
{% spaceless %}
    {% load static django_vite %}
{% endspaceless %}<!DOCTYPE html>
<html lang="{{ language_code|default:'en'}}">
    <head>
        <meta charset="UTF-8">
        <meta name="viewport" content="width=device-width, initial-scale=1,
                                       shrink-to-fit=no">
        <title>
            {% block full_title %}By the People
                {% block title %}
                    {% if title %}
                        {{ title }}{% else %}Untitled
                    {% endif %}
                {% endblock title %}
            {% endblock full_title %}
        </title>
        <meta name="description" content="Crowdsourcing project By the People invites
                                          anyone to become a Library of Congress virtual volunteer. Explore, transcribe, review,
                                          and tag digital collections to improve search and readability and open new avenues of
                                          research.">
        <link rel="shortcut icon" href="{% static 'favicon.ico' %}">
        {% include "fragments/common-stylesheets.html" %}
        {% block prefetch %}
            <link href="https://fonts.gstatic.com" rel="preconnect dns-prefetch"
                  crossorigin>
            {% if CONCORDIA_ENVIRONMENT == "production" %}
                <link href="https://crowd-media.loc.gov" rel="preconnect dns-prefetch"
                      crossorigin>
            {% endif %}
            <link href="https://thelibraryofcongress.tt.omtrdc.net" rel="preconnect
                                                                         dns-prefetch" crossorigin>
            <link href="https://smon.loc.gov" rel="preconnect dns-prefetch" crossorigin>
        {% endblock prefetch %}
        <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.3/dist/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-QWTKZyjpPEjISv5WaRU9OFeRpok6YctnYmDr5pNlyT2bRjXh0JMhjY6hW+ALEwIH" crossorigin="anonymous">
        {% block head_content %}
            {% vite_hmr_client %}
        {% endblock head_content %}
        {% block extra_scripts %}{% endblock %}
        {% comment %}
            Adobe's tag manager requires this script to be placed at the top (inside
            <head>) even though it's bad for performance.
            NOTE(review): both branches below currently load the same launch script URL,
            so the environment check has no effect on which script is served.
        {% endcomment %}
        {% if CONCORDIA_ENVIRONMENT == "production" %}
            <script
                src="https://assets.adobedtm.com/f94f5647937d/624e2240e90d/launch-0610ec681aff.min.js" async></script>
        {% else %}
            <script
                src="https://assets.adobedtm.com/f94f5647937d/624e2240e90d/launch-0610ec681aff.min.js" async></script>
        {% endif %}
    </head>
    <body id="body"
          class="{% block body_classes %}view-{{ VIEW_NAME_FOR_CSS }}
                     section-{{ PATH_LEVEL_1|default:'homepage' }}
                     environment-{{ CONCORDIA_ENVIRONMENT }}
                     {% block extra_body_classes %}{% endblock %}
                     d-print-block
                 {% endblock body_classes %}">
        {% block site-header %}
            <header class="border-bottom" role="banner" aria-label="site navigation">
                <nav class="container navbar navbar-light navbar-expand-lg
                            align-items-lg-end p-3 d-print-block">
                    <div class="navbar-brand d-flex align-items-center">
                        <a class="logo-loc" href="https://www.loc.gov" title="Library of
                                                                              Congress">
                            <img class="img-fluid" src="{% static 'img/LoC-logo.svg' %}"
                                 width="170" height="97" alt="Library of Congress logo">
                        </a>
                        <h1 class="logo-by-the-people m-0 -d-flex -align-items-center">
                            <a class="d-flex" href="/" title="By the People">
                                <img class="img-fluid" src="{% static 'img/logo-by-the-people.svg' %}" width="260" height="27" alt="" aria-hidden="true">
                                <span class="visually-hidden">By The People</span>
                            </a>
                        </h1>
                    </div>
                    <button class="navbar-toggler navbar-light border-0 d-print-none"
                            type="button" data-bs-toggle="collapse" data-bs-target="#nav-menu" aria-controls="nav-menu"
                            aria-expanded="false" aria-label="Toggle navigation">
                        <i class="fas fa-bars"></i>
                        <span class="visually-hidden">Menu</span>
                    </button>
                    <div class="collapse navbar-collapse text-center d-print-none"
                         id="nav-menu">
                        <ul class="navbar-nav ms-auto d-print-none small">
                            <li class="nav-item">
                                <a class="nav-link {% if PATH_LEVEL_1 == 'about'%}active{% endif %}" href="{% url 'about' %}">About</a>
                            </li>
                            <li class="nav-item dropdown nav-dropdown">
                                <a id="topnav-campaigns-dropdown-toggle" class="nav-link
                                                                                {% if 'campaigns' in PATH_LEVEL_1 %}active{% endif %}" href="{% url 'campaign-topic-list' %}" data-bs-toggle="dropdown" aria-haspopup="true"
                                   aria-expanded="false">Campaigns&nbsp;<span class="fa fa-chevron-down text-primary"></span></a>
                                <div class="dropdown-menu" aria-labelledby="topnav-campaigns-dropdown-toggle">
                                    <a class="dropdown-item" href="{% url 'campaign-topic-list' %}">All Campaigns</a>
                                    <a class="dropdown-item" href="{% url 'transcriptions:completed-campaign-list' %}">Completed Campaigns</a>
                                </div>
                            </li>
                            <li id="topnav-help-dropdown" class="nav-item dropdown
                                                                 nav-dropdown">
                                <a id="topnav-help-dropdown-toggle" class="nav-link
                                                                           {% if PATH_LEVEL_1 == 'help-center' or 'get-started' in PATH_LEVEL_1 %}active{% endif %}"
                                   href="{% url 'help-center' %}" rel="nofollow" data-bs-toggle="dropdown" aria-haspopup="true"
                                   aria-expanded="false">How-To&nbsp;<span class="fa fa-chevron-down text-primary"></span></a>
                                <div class="dropdown-menu"
                                     aria-labelledby="topnav-help-dropdown-toggle">
                                    <a class="dropdown-item" href="{% url 'welcome-guide' %}"
                                       rel="nofollow">Get Started</a>
                                    <a class="dropdown-item" href="{% url 'transcription-basic-rules' %}" rel="nofollow">Transcribe</a>
                                    <a class="dropdown-item" href="{% url 'how-to-review' %}"
                                       rel="nofollow">Review</a>
                                    <a class="dropdown-item" href="{% url 'how-to-tag' %}"
                                       rel="nofollow">Tag</a>
                                </div>
                            </li>
                            <li id="resources-dropdown" class="nav-item dropdown nav-dropdown">
                                {# The toggle needs its own unique id, and it must match the menu's aria-labelledby below so the menu has an accessible name. #}
                                <a id="topnav-resources-dropdown-toggle" class="nav-link {% if PATH_LEVEL_1 == 'resources' %}active{% endif %}"
                                   href="{% url 'resources' %}" rel="nofollow" data-bs-toggle="dropdown" aria-haspopup="true"
                                   aria-expanded="false">Resources <span class="fa fa-chevron-down text-primary"></span></a>
                                <div class="dropdown-menu"
                                     aria-labelledby="topnav-resources-dropdown-toggle">
                                    <a class="dropdown-item" href="{% url 'guidelines' %}"
                                       rel="nofollow">Community Guidelines</a>
                                    <a class="dropdown-item" href="{% url 'programs' %}"
                                       rel="nofollow">Programs</a>
                                    <a class="dropdown-item" href="{% url 'for-educators' %}"
                                       rel="nofollow">For Educators</a>
                                    <a class="dropdown-item" href="{% url 'service' %}"
                                       rel="nofollow">Documenting Service</a>
                                </div>
                            </li>
                            <li class="nav-item">
                                <a class="nav-link"
                                   href="https://forum.crowd.loc.gov" target="_blank">Discuss</a>
                            </li>
                            <li id="topnav-account-dropdown" class="nav-item dropdown
                                                                    nav-dropdown authenticated-only">
                                <a id="topnav-account-dropdown-toggle" class="nav-link fw-bold" href="#" data-bs-toggle="dropdown" aria-haspopup="true" aria-expanded="false" aria-label="{{ user.username }} account menu">
                                    {{ user.username }}<span class="fa fa-chevron-down text-primary"></span>
                                </a>
                                <div id="topnav-account-dropdown-menu" class="dropdown-menu" aria-labelledby="topnav-account-dropdown-toggle"></div>
                            </li>
                        </ul>

                        <ul class="nav-secondary anonymous-only list-unstyled d-none d-lg-flex
                                   d-print-none small ms-4 ps-3">
                            <li class="nav-item">
                                <a class="nav-link nav-secondary nav-link-login fw-bold"
                                   href="{% url 'login' %}?next={{ request.path|urlencode }}" rel="nofollow">Login</a>
                            </li>
                            <li class="nav-item">
                                <a class="nav-link nav-secondary nav-link-register fw-bold"
                                   href="{% url 'registration_register' %}" rel="nofollow">Register</a>
                            </li>
                        </ul>
                    </div>
                </nav>
            </header>
        {% endblock site-header %}

        {% block breadcrumbs-container %}
            <nav class="container breadcrumb-wrapper" aria-label="breadcrumb">
                <ol class="breadcrumb">
                    <li class="breadcrumb-item"><a href="/">Home</a></li>
                    {% block breadcrumbs %}{% endblock breadcrumbs %}
                </ol>
            </nav>
        {% endblock breadcrumbs-container %}

        {% block site-main %}
            <main class="{% block extra_main_classes %}{% endblock %} d-print-block">

                {% block messages-container %}
                    <div id="messages" hidden>
                        <div hidden id="message-template">
                            {% comment %} This is a hidden <div> rather than <template>
because it's not worth dealing with IE11 compatibility {% endcomment %}
                            <div class="alert alert-dismissible mx-3 my-2 d-flex justify-content-between align-items-center" role="alert">
                                <a type="button" data-bs-dismiss="alert"
                                   aria-label="Close">
                                    <!--span aria-hidden="true">&times;</span-->
                                    <span aria-hidden="true" class="fas fa-times"></span>
                                </a>
                            </div>
                        </div>
                    </div>
                {% endblock messages-container %}

                {% if maintenance_mode %}
                    <div class="alert mx-3 my-2 text-center" role="alert" style="background-color: red;">
                        <h2>Maintenance mode is active!</h2>
                    </div>
                {% endif %}

                {% block main_content %}{% endblock main_content %}
            </main>
        {% endblock site-main %}
        {% block site-footer %}
            <footer class="footer border-top py-4 d-print-none">
                <div class="container">
                    <div class="row">
                        <div class="col-lg-auto px-3">

                            <h2 class="h3 fw-normal text-center text-lg-start">Follow
                                Us</h2>
                            <ul class="list-unstyled list-inline mb-0 text-center
                                       text-lg-start">
                                <li class="list-inline-item link-github">
                                    <a href="https://github.com/LibraryOfCongress/concordia"
                                       title="GitHub" target="_blank">
                                        <span class="bitmap-icon github-icon"></span>
                                    </a>
                                </li>
                                <li class="list-inline-item link-twitter">
                                    <a href="https://www.twitter.com/Crowd_LOC"
                                       title="Twitter" target="_blank">
                                        <span class="bitmap-icon twitter-icon"></span>
                                    </a>
                                </li>
                                <li class="list-inline-item link-email">
                                    <a
                                        href="https://updates.loc.gov/accounts/USLOC/subscriber/new?topic_id=USLOC_175"
                                        title="Newsletter" target="_blank">
                                        <span class="bitmap-icon email-icon"></span>
                                    </a>
                                </li>
                            </ul>
                        </div>
                        <div class="footer-links col-lg">
                            <ul class="list-unstyled list-inline small fw-bold mb-0
                                       text-center text-lg-start">
                                <li class="list-inline-item mb-1"><a
                                    href="/for-educators/" target="_blank">For Educators</a></li>
                                <li class="list-inline-item mb-1"><a
                                    href="https://forum.crowd.loc.gov" target="_blank">Discuss</a></li>
                                <li class="list-inline-item mb-1"><a href="https://ask.loc.gov/crowd" target="_blank" rel=noopener>Contact
                                    Us</a></li>
                                <li class="list-inline-item"><a
                                    href="{% url 'welcome-guide' %}" target="_blank">Help</a></li>
                            </ul>
                        </div>
                        <div class="col-lg-auto align-self-center">
                            <ul class="list-unstyled list-inline small text-center
                                       text-lg-start">
                                <li class="list-inline-item"><a
                                    href="https://www.loc.gov/accessibility/">Accessibility</a></li>
                                <li class="list-inline-item"><a
                                    href="https://www.loc.gov/legal/">Legal</a></li>
                                <li class="list-inline-item"><a
                                    href="https://www.loc.gov/about/office-of-the-inspector-general/">Inspector
                                    General</a></li>
                                <li class="list-inline-item"><a
                                    href="https://www.loc.gov/legal/standard-disclaimer-for-external-links/">External Link
                                    Disclaimer</a></li>
                            </ul>
                            <ul class="list-unstyled list-inline mb-0 text-center
                                       text-lg-start">
                                <li class="list-inline-item intersites-link-congress"><a
                                    href="https://www.congress.gov/"><span class="visually-hidden">Congress.gov</span></a></li>
                                <li class="list-inline-item intersites-link-copyright"><a
                                    href="https://copyright.gov"><span class="visually-hidden">Copyright.gov</span></a></li>
                            </ul>
                        </div>
                    </div>
                </div>
            </footer>
        {% endblock site-footer %}

        {% if SENTRY_FRONTEND_DSN %}
            <script src="https://browser.sentry-cdn.com/5.0.8/bundle.min.js"
                    integrity="sha384-PKOJCSVL6suo2Qz9Hs4hkrZqX7S6iLwadxXxBEa0h0ycsuoDNZCiAcHlPGHYxU6l"
                    crossorigin="anonymous"></script>
            <script>
                // Don't load Sentry if this is the "always online" version of the page,
                // which is the version CloudFlare serves if the actual site is down
                if (navigator.userAgent.indexOf("CloudFlare-AlwaysOnline") < 0) {
                    Sentry.init({
                        'dsn': '{{ SENTRY_FRONTEND_DSN }}',
                        'release': '{{ APPLICATION_VERSION }}',
                        'environment': '{{ CONCORDIA_ENVIRONMENT }}',
                        'blacklistUrls': [
                            /^moz-extension/
                        ],
                        // Turnstile 300xxx and 600xxx errors indicate the user failed validation. We don't want those in Sentry
                        'ignoreErrors': ["[Cloudflare Turnstile] Error: 600", "[Cloudflare Turnstile] Error: 300"]
                    });
                }
            </script>
        {% endif %}

        <script>
            window.STATIC_URL = "{% get_static_prefix %}";
        </script>

        {% vite_asset 'src/main.js' %}

        {% block body_scripts %}{% endblock body_scripts %}

        <script type="text/javascript">
            if (typeof _satellite == "undefined") {
                if (typeof Sentry != "undefined") {
                    Sentry.captureMessage("Adobe Analytics did not load");
                }
            } else {
                _satellite.pageBottom();
            }
        </script>
        <div id="tutorial-data" aria-hidden="true" hidden data-campaign-slug="{{ campaign.slug }}" data-user-authenticated="{{ user.is_authenticated|yesno:"true,false" }}" data-has-asset="{{ asset|yesno:"true,false" }}">
        </div>
    </body>
</html>


================================================
FILE: concordia/templates/django_registration/activation_complete.html
================================================
{% extends "base.html" %}
{# Confirmation page with the "Account Activation Complete" heading. NOTE(review): the "jump right in" link hard-codes the topic slug 'suffrage-women-fight-for-the-vote'; confirm that topic still exists. #}
{% block title %}Account Activation{% endblock title %}
{% block extra_main_classes %}container{% endblock %}
{% block main_content %}
    <div class="row">
        <div class="col-md-8 mx-auto p-3">
            <h2>Account Activation Complete</h2>
            <p>
                Welcome back! Your registration is now complete and you are logged in.
            </p>
            <p>
                Visit the <a href="{% url 'welcome-guide' %}">By the People Welcome Guide</a> for instructions and help getting started.
                Or, <a href="{% url 'redirect-to-next-transcribable-topic-asset' 'suffrage-women-fight-for-the-vote' %}">jump right in</a> to a page that needs your help!
            </p>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/django_registration/activation_email_body.txt
================================================
{% load custom_math %}
Thank you for registering as a Library of Congress virtual volunteer with By the People!

To complete your activation, please verify your email address in the next {{ expiration_days }} days by clicking the link below:

https://{{ site }}{% url "django_registration_activate" activation_key %}

Once your email is verified, your account will be active! As a registered user you can complete pages by reviewing other volunteers' transcriptions, tag pages, and see a history of your activity on your account page.

Check out our Get Started guide and other instructions by visiting https://crowd.loc.gov/get-started/.

Happy transcribing,
-- The By the People team


================================================
FILE: concordia/templates/django_registration/activation_email_subject.txt
================================================
Start transcribing! Activate your By the People account at {{ site }}


================================================
FILE: concordia/templates/django_registration/activation_failed.html
================================================
{% extends "base.html" %}
{# Displays `activation_error.message`; `activation_error.code` is exposed as a CSS class suffix (activation-error-<code>) on the paragraph. #}

{% block main_content %}
    <div class="container">
        <div class="row">
            <div class="col-md-8 mx-auto p-3">
                <h2>Account Activation</h2>
                <p class="activation-error-{{ activation_error.code }}">
                    {{ activation_error.message }}
                </p>
            </div>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/django_registration/registration_closed.html
================================================
{% extends "base.html" %}
{# Static "registration closed" notice; head_content prepends a robots "noindex" meta tag ahead of the parent block's content. #}

{% block title %}Registration is closed{% endblock title %}

{% block head_content %}
    <meta name="robots" content="noindex">
    {{ block.super }}
{% endblock head_content %}

{% block main_content %}
    <div class="container">
        <div class="row">
            <div class="col-md-8 mx-auto p-3">
                <h2>Registration Closed</h2>
                <p>
                    Registration is closed at the moment.
                </p>
            </div>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/django_registration/registration_complete.html
================================================
{% extends "base.html" %}
{# Post-registration notice. NOTE(review): "within 7 days" below is hard-coded, while the activation email body takes its window from `expiration_days`; confirm the two stay in sync. #}

{% block main_content %}
    <div class="container">
        <div class="row">
            <div class="col-md-8 mx-auto p-3">
                <h2>Thank you for joining By the People!</h2>
                <p>
                    We are excited for you to get started! First, complete your registration by checking your email inbox for an activation link. Click the link in the email within 7 days to activate your account.
                </p>
                <p>
                    Activated and ready to jump in? <a href="{% url 'welcome-guide' %}">Read our Welcome Guide</a>.
                </p>
            </div>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/django_registration/registration_form.html
================================================
{% extends "base.html" %}
{# Registration page: renders `form` with django_bootstrap5 and appends the password-validation script (loaded through django_vite) to the parent's body_scripts. #}

{% load static %}
{% load django_bootstrap5 %}

{% block title %}Registration{% endblock title %}

{% block main_content %}
    <div class="container-fluid">
        <div id="registration-form-container" class="row flex-md-row justify-content-center">
            <div class="col-md-6 p-3">
                <h2 class="mb-3 text-center">Registration</h2>
                <p>
                    Register for an account to track your work, add tags and review transcriptions.
                </p>
                <p> To sign up, please provide a username, email address and a strong password.
                    Once you click register, we will send you an email to confirm your address. We may use this email address to communicate with you about account activity,
                    website updates, and, occasionally, to ask for your feedback.
                </p>
                <p>
                    Learn more about why we ask you to register in the <a href="{% url 'about' %}">FAQ</a>.
                </p>
                <hr />
                <form method="post" id="registration-form" class="form-register">
                    {% csrf_token %}

                    {% bootstrap_form form %}

                    {% bootstrap_button "Register" button_type="submit" button_class="btn-primary" extra_classes="btn justify-content-center" %}
                    <div class="d-flex col mx-auto">
                        <a href="{% url 'login' %}" class="text-center blue-text">I already have an account</a>
                    </div>
                </form>
            </div>
        </div>
    </div>
{% endblock main_content %}

{% block body_scripts %}
    {{ block.super }}
    {% load django_vite %}
    {% vite_asset 'concordia/static/js/src/password-validation.js' %}
{% endblock body_scripts %}


================================================
FILE: concordia/templates/documents/service_letter.html
================================================
{% load static staticfiles %}
{% load humanize %}
<html lang="en-US">
    <head>
        <style>
            @page {
                size: A4;
                margin: 1.1cm;
                @bottom-right {
                    content: "Page " counter(page) " of " counter(pages);
                    font-family: Arial;
                    font-size: 11pt;
                    line-height: 1.4;
                }
            }
            a { text-decoration: none; color: black; }
            p { font-family: Arial; font-size: 11pt; line-height: 1.4;}
            img { width: 35%; height: auto; }
            h1 { font-size: 1.75rem; }
            h2 { font-size: 1.2rem;}
            tr { page-break-inside: avoid; page-break-after: auto; }
            thead { display: table-header-group; }
            tfoot { display: table-footer-group; }
            .text-right { text-align: right !important; }
            .text-left {text-align: left !important; }
            /* Base table styling; uses the same Arial face as the paragraph and page-footer rules. */
            table {
                width: 100%;
                margin-bottom: 1rem;
                color: #242424;
                border-collapse: collapse;
                font-family: Arial;
                font-size: 11pt;
                line-height: 1.4;
                page-break-inside: auto;
            }
            table thead th {
                vertical-align: bottom;
                border-bottom: 2px solid #efefef;
            }
            table th, table td {
                padding: 0.75rem;
                vertical-align: top;
                border-top: 1px solid #efefef;
            }
            table thead th, table thead td {
                border-bottom: 1px solid #000;
                border-top: 1px solid #000;
            }
            table tbody tr:nth-of-type(odd) {
                background-color: rgba(0, 0, 0, 0.05);
            }
        </style>
        <title>Service Letter</title>
        <meta name=author content="By the People" />
        <meta name=generator content="Concordia" />
        <meta name=description content="BTP Service Letter" />
        <meta name=keywords content="SL" />
        <meta name=keywords content="Concordia" />
        <meta name=keywords content="BTP" />
        <meta name=dcterms.created content="{% now 'c' %}" />
        <meta name=dcterms.modified content="{% now 'c' %}" />
    </head>
    <body>
        <p><img src="{{ image_url }}" alt="Library Logo" /><br /><br /><br /></p>
        <p>
            Library of Congress<br />
            101 Independence Avenue SE<br />
            Washington, DC 20540<br />
        </p>
        <p>
            {% now "m/d/Y" %}<br /><br />
        </p>
        <p>To whom it may concern,</p>
        <p>I am writing to confirm {% if user.first_name %}{{ user.first_name }}{% if user.last_name %} {{ user.last_name }}{% endif %}{% else %}this volunteer{% endif %}'s participation in the Library of Congress virtual volunteering program <a href="https://crowd.loc.gov"><em>By the People</em> (https://crowd.loc.gov)</a>. The project invites anyone to help the Library by transcribing, tagging, and reviewing transcriptions of digitized historical documents from the Library's collections. Transcriptions make the content of handwritten and other documents keyword searchable on the <a href="https://www.loc.gov">Library's main website (https://loc.gov)</a>, open new avenues of digital research, and improve accessibility, including for people with visual or cognitive disabilities.</p>
        <p>They registered as a <em>By the People</em> volunteer on {{ join_date|date:"m/d/Y" }} as {{ user.username }}. They made {{ total_transcriptions|intcomma }} edits to transcriptions on the site and reviewed {{ total_reviews|intcomma }} transcriptions by other volunteers. You can find further details on their virtual volunteer activity in the following pages.</p>
        <p>The <em>By the People</em> site does not track the time that volunteers spend transcribing but volunteers may track their own hours. The following activity pages have time stamps that may also be useful.</p>
        <p>Best,<br /><br /></p>
        <p>Lauren Algee</p>
        <p>
            Community Manager, <em>By the People</em><br />
            Library of Congress<br />
            crowd@ask.loc.gov
        </p>
        <div style="page-break-after: always;"></div>
        <h1>Recent Pages Worked On</h1>
        <h2>All the pages contributed to in the last 6 months</h2>
        <table>
            <thead>
                <tr class="text-start">
                    <th>Row</th>
                    <th>Date</th>
                    <th>Page</th>
                    <th>Campaign Items</th>
                    <th>Your Contribution</th>
                    <th>Current Status</th>
                </tr>
            </thead>
            <tbody>
                {% for asset in asset_list %}
                    <tr>
                        <td>{{ forloop.counter }}</td>
                        <td class="col-md-3">{{ asset.latest_activity }}</td>
                        <td class="text-end"><a href="{{ asset.get_absolute_url }}">{{ asset.sequence }}</a></td>
                        <td>{{ asset.item.title }}</td>
                        <td>{% if asset.last_reviewed %}Reviewed{% else %}Transcribed{% endif %}</td>
                        <td>{{ asset.get_transcription_status_display }}</td>
                    </tr>
                {% endfor %}
            </tbody>
        </table>
    </body>
</html>


================================================
FILE: concordia/templates/emails/delete_account_body.txt
================================================
This email is to confirm deletion of your By the People user account. We have permanently removed all of your account information from the system.

Thank you for all of your contributions to the Library of Congress. Come back any time!

Sorry to see you go,
-- The By the People team


================================================
FILE: concordia/templates/emails/delete_account_subject.txt
================================================
Your By the People account has been deleted


================================================
FILE: concordia/templates/emails/email_reconfirmation_body.txt
================================================
{% load custom_math %}
To complete your email change, please verify your email address in the next {{ expiration_days }} days by clicking the link below:

https://{{ site }}{% url "email-reconfirmation" confirmation_key %}

Once it's verified, your email will be active on your account, and your previous email address will no longer be used.

Happy transcribing,
-- The By the People team


================================================
FILE: concordia/templates/emails/email_reconfirmation_subject.txt
================================================
Confirm your email change for your By the People account at {{ site }}


================================================
FILE: concordia/templates/emails/unusual_activity.html
================================================
<style type="text/css">

    table, td { border: 1px solid black; border-collapse: collapse; }
    th, td { padding: 7px; }

</style>
<h4>{{ title }}</h4>
Transcription Incidents: 2 or more transcriptions submitted in 1 minute.
{# One row per entry in `transcriptions`; row.0 feeds the admin "user" filter, row.1-row.3 fill the three columns. #}
<table>
    <tr>
        <th>User</th>
        <th>Incidents</th>
        <th>User transcriptions</th>
    </tr>
    {% for row in transcriptions %}
        <tr>
            <td>
                <a href="{{ domain }}{% url 'admin:concordia_transcription_changelist' %}?user={{ row.0 }}">
                    {{ row.1 }}
                </a>
            </td>
            <td>{{ row.2 }}</td>
            <td>{{ row.3 }}</td>
        </tr>
    {% empty %}
        {# Span all three columns so the bordered table stays rectangular. #}
        <tr><td colspan="3">No transcriptions fell within the window.</td></tr>
    {% endfor %}
</table>
<br/>
Review Incidents: 2 or more transcriptions accepted in 1 minute.
{# One row per entry in `reviews`; row.0 feeds the admin "reviewed_by" filter, row.1-row.3 fill the three columns. #}
<table>
    <tr>
        <th>User</th>
        <th>Incidents</th>
        <th>User accepts</th>
    </tr>
    {% for row in reviews %}
        <tr>
            <td>
                {# Ampersands inside an HTML attribute are written as &amp; so the query string is parsed unambiguously. #}
                <a href="{{ domain }}{% url 'admin:concordia_transcription_changelist' %}?accepted=not-null&amp;o=-7&amp;reviewed_by__id__exact={{ row.0 }}">
                    {{ row.1 }}
                </a>
            </td>
            <td>{{ row.2 }}</td>
            <td>{{ row.3 }}</td>
        </tr>
    {% empty %}
        {# Span all three columns so the bordered table stays rectangular. #}
        <tr><td colspan="3">No reviews fell within the window.</td></tr>
    {% endfor %}
</table>


================================================
FILE: concordia/templates/emails/unusual_activity.txt
================================================
{{ title }}
Transcription Incidents: 2 or more transcriptions submitted in 1 minute.
{% for row in transcriptions %}{# row.1 | row.2 | row.3 are the same three values the HTML version shows as table columns #}
    * {{ row.1 }} | {{ row.2 }} | {{ row.3 }}
{% empty %}
    No transcriptions fell within the window.
{% endfor %}
Review Incidents: 2 or more transcriptions accepted in 1 minute.
{% for row in reviews %}{# same bullet and separator format as the transcription rows above #}
    * {{ row.1 }} | {{ row.2 }} | {{ row.3 }}
{% empty %}
    No reviews fell within the window.
{% endfor %}


================================================
FILE: concordia/templates/emails/welcome_email_body.html
================================================
<p>
    Thank you for becoming a By the People virtual volunteer for the Library of Congress!
</p>
<p>
    To help you get started, we recommend reading the <a href="https://crowd.loc.gov/help-center/welcome-guide/">Welcome Guide</a>. It includes instructions on transcribing, tagging, and reviewing transcriptions by other volunteers. Reviewing is an area where we especially need your help in completing transcriptions and moving them over the finish line!
</p>
<p>
    Once you have a handle on the transcription guidelines, explore the different collections available under <a href="https://crowd.loc.gov/campaigns-topics/">“Campaigns”</a> using the top navigation on any page.
</p>
<p>
    Let us know what you find once you dig in! Share your experience or questions with the community managers and other volunteers on our <a href="https://forum.crowd.loc.gov">discussion space on Discourse</a>.
</p>
<p>
    Happy transcribing!<br/>
    The By the People team
</p>


================================================
FILE: concordia/templates/emails/welcome_email_body.txt
================================================
Thank you for becoming a By the People virtual volunteer for the Library of Congress!

To help you get started, we recommend reading the Welcome Guide <https://crowd.loc.gov/help-center/welcome-guide/>. It includes instructions on transcribing, tagging, and reviewing transcriptions by other volunteers. Reviewing is an area where we especially need your help in completing transcriptions and moving them over the finish line!

Once you have a handle on the transcription guidelines, explore the different collections available under “Campaigns” <https://crowd.loc.gov/campaigns-topics/> using the top navigation on any page.

Let us know what you find once you dig in! Share your experience or questions with the community managers and other volunteers on our discussion space on Discourse <https://forum.crowd.loc.gov>.

Happy transcribing!
The By the People team


================================================
FILE: concordia/templates/emails/welcome_email_subject.txt
================================================
Welcome to By The People


================================================
FILE: concordia/templates/error.html
================================================
{% extends "base.html" %}
{% load staticfiles %}

{% block head_content %}
    <style>
        body {
            height: 100vh;
            width: 100vw;
            margin: 0;
            padding: 0;
        }

        #error-message {
            max-width: 50%;
        }
    </style>
{% endblock head_content %}

{% block body_classes %}d-flex justify-content-center align-items-center text-center{% endblock body_classes %}

{% block site-header %}{% endblock site-header %}

{% block breadcrumbs-container %}{% endblock breadcrumbs-container %}

{% block site-main %}
    <div id="error-message">
        {% block error_message %}{% endblock error_message %}
    </div>
{% endblock site-main %}

{% block site-footer %} {% endblock site-footer %}


================================================
FILE: concordia/templates/forms/widgets/email.html
================================================
{# Email <input> widget. A fixed placeholder is emitted whenever widget.value is not None; the value itself is never written into the markup. #}
{# Extra attributes come from widget.attrs: False values are skipped, True values render as a bare attribute name, anything else renders as name="value". #}
<input
    type="{{ widget.type }}"
    name="{{ widget.name }}"
    {% if widget.value != None %}
        placeholder="Change your email address"
    {% endif %}
    class="form-control fst-italic"
    {% for name, value in widget.attrs.items %}
        {% if value is not False %}
            {{ name }}
            {% if value is not True %}
                ="{{ value|stringformat:'s' }}"
            {% endif %}
        {% endif %}
    {% endfor %}
>


================================================
FILE: concordia/templates/forms/widgets/turnstile_widget.html
================================================
<div class="cf-turnstile" {% include "django/forms/widgets/attrs.html" %}></div>


================================================
FILE: concordia/templates/fragments/_filter-buttons.html
================================================
{# Radio pair shown only to signed-in users. Each input carries its target in data-url (all_url / filtered_url, plus sublevel_qs when set); do_filter decides which one is checked. #}
{% if user.is_authenticated %}
    <div>
        <input name="radioButtons" type="radio" id="show-all" {% if not do_filter %}checked{% endif %} data-url="{{ all_url }}{% if sublevel_qs %}?{{ sublevel_qs }}{% endif %}">
        <label for="show-all">Show all</label>
        {# ms-1 is the Bootstrap 5 spelling of the former ml-1 margin utility, matching the me-*/fw-* utilities used elsewhere in these templates. #}
        <input name="radioButtons" type="radio" id="filter-assets" {% if do_filter %}checked{% endif %} class="ms-1" data-url="{{ filtered_url }}{% if sublevel_qs %}?{{ sublevel_qs }}{% endif %}">
        <label for="filter-assets">Show pages I can review</label>
    </div>
{% endif %}


================================================
FILE: concordia/templates/fragments/_modal_footer.html
================================================
{# Modal footer with two call-to-action links; the targets are taken from the next_open_asset_url and next_review_asset_url context variables. #}
<div class="modal-footer d-flex justify-content-around">
    <p>
        <a class="btn btn-primary" href="{{ next_open_asset_url }}">
            Transcribe a new page
        </a>
    </p>
    <p>
        <a class="btn btn-primary" href="{{ next_review_asset_url }}">
            Review a new page
        </a>
    </p>
</div>


================================================
FILE: concordia/templates/fragments/activity-filter-sort.html
================================================
{% load concordia_querystring %}
<div class="col-sm">
    <ul>
        <li><a href="/transcribe">Transcribe</a></li>
        <li><a href="/review">Review</a></li>
    </ul>
</div>
<div class="col-sm">
    Filter by campaign:
    <ul>
        {% for c in campaigns %}
            <li><a href="?{% qs_alter request.GET campaign_filter=c.pk %}">{{ c.title }}</a></li>
        {% endfor %}
    </ul>
</div>
<div class="col-sm">
    Sort by:
    <ul>
        <li><a href="?{% qs_alter request.GET order_by="pk" %}">None</a></li>
        <li><a href="?{% qs_alter request.GET order_by="-difficulty" %}">Hard to easy</a></li>
        <li><a href="?{% qs_alter request.GET order_by="difficulty" %}">Easy to hard</a></li>
    </ul>
</div>


================================================
FILE: concordia/templates/fragments/codemirror.html
================================================
{% load static django_vite %}

<link rel="stylesheet" href="{% static 'codemirror/lib/codemirror.css' %}">
<link rel="stylesheet" href="{% static 'codemirror/addon/lint/lint.css' %}">

<script src="{% static 'codemirror/lib/codemirror.js' %}"></script>
<script src="{% static 'codemirror/mode/xml/xml.js' %}"></script>
<script src="{% static 'codemirror/mode/markdown/markdown.js' %}"></script>
<script src="{% static 'codemirror/addon/lint/html-lint.js' %}"></script>

<script src="{% static 'prettier/standalone.js' %}"></script>
<script src="{% static 'prettier/parser-html.js' %}"></script>
<script src="{% static 'prettier/parser-markdown.js' %}"></script>

<script src="{% static 'remarkable/dist/remarkable.min.js' %}"></script>

{% vite_asset 'concordia/static/admin/editor-preview.js' %}

<style>
    .form-row.codemirror-with-preview > div {
        display: flex;
        width: 100%;
        flex-wrap: wrap;
    }

    .form-row.codemirror-with-preview > div > * {
        overflow-y: auto;
        box-sizing: border-box;
        min-height: 500px;
    }

    .form-row.codemirror-with-preview > div .CodeMirror {
        min-height: 500px;
    }

    .form-row.codemirror-with-preview > div > label {
        flex-basis: 100%;
        min-height: 0;
        font-weight: bold;
        color: #333;
    }

</style>

<template id="preview-head">{% spaceless %}
    {% include "fragments/common-stylesheets.html" %}
{% endspaceless %}</template>


================================================
FILE: concordia/templates/fragments/common-stylesheets.html
================================================
{% load static django_vite %}

<link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Open+Sans:400,600,700|Roboto+Slab:400,700" />
<link rel="stylesheet" href="{% vite_asset_url 'concordia/static/scss/base.scss' %}" />
<link rel="stylesheet" href="{% static '@fortawesome/fontawesome-free/css/all.min.css' %}" />


================================================
FILE: concordia/templates/fragments/featured_blog_posts.html
================================================
{% load group_list %}
<h3 class="mb-4">Featured blog posts</h3>
<div id="blog-carousel" class="carousel slide">
    <div class="carousel-inner" blog-post-count="{{ blog_posts|length }}" slice-count="{{ blog_posts|slice:':3'|length }}" batch-count="{{ blog_posts|slice:':3'|batch:3|length }}">
        {% for segment in blog_posts %}
            <div class="carousel-item mb-4{% if forloop.first %} active{% endif %}">
                <div class="row mx-auto blog-chunk">
                    {% for post in segment %}
                        <div class="col-md-4">
                            <div class="card h-100">
                                <div class="card-body p-0">
                                    <a href="{{ post.link }}">
                                        <img alt="{{ post.title }}" width="197" height="132" style="opacity: 1;" src="{{ post.og_image }}">
                                        <h5 class="pt-2">
                                            {{ post.title }}
                                        </h5>
                                    </a>
                                </div>
                            </div>
                        </div>
                    {% endfor %}
                </div>
            </div>
        {% endfor %}
    </div>
    {% if blog_posts|length > 1 %}
        <button class="carousel-control-prev" type="button" data-bs-target="#blog-carousel" data-bs-slide="prev">
            <span class="carousel-control-icon prev" aria-hidden="true"></span>
            <span class="visually-hidden">Previous</span>
        </button>
    {% endif %}
    <div class="carousel-indicators">
        {% for segment in blog_posts %}
            <button type="button" data-bs-target="#blog-carousel" data-bs-slide-to="{{ forloop.counter0 }}" {% if forloop.first %}class="active" aria-current="true"{% endif %}>
            </button>
        {% endfor %}
    </div>
    {% if blog_posts|length > 1 %}
        <button class="carousel-control-next" type="button" data-bs-target="#blog-carousel" data-bs-slide="next">
            <span class="carousel-control-icon next" aria-hidden="true"></span>
            <span class="visually-hidden">Next</span>
        </button>
    {% endif %}
</div>
<div class="text-center">
    <a class="btn btn-primary text-decoration-none" href="https://blogs.loc.gov/thesignal/category/by-the-people-transcription-program/" target="_blank">Read more</a>
</div>


================================================
FILE: concordia/templates/fragments/recent-pages.html
================================================
{% load concordia_querystring %}

<h2>Recent Pages Worked On</h2>
<div>View all the pages you contributed to in the last 6 months.</div>
<div class="row mt-4">
    {% include "fragments/standard-pagination.html" %}
</div>
<form class="container form date-filter pb-1 mb-2" method="get">
    <div class="d-flex flex-row">
        <span class="fw-bold me-1">Date: </span>Select Range
    </div>
    <div class="d-flex flex-row pb-1">
        <label for="id_start"><span class="visually-hidden">Start</span></label>
        <duet-date-picker name="start" identifier="id_start"></duet-date-picker>
        <div class="p-2">to</div>
        <label for="id_end"><span class="visually-hidden">End</span></label>
        <duet-date-picker name="end" identifier="id_end"></duet-date-picker>
        <button type="submit" class="btn btn-primary rounded-0 p-2">Go</button>
    </div>
    <div class="d-flex flex-row pt-1">
        <div>
            <input type="radio" name="flexRadioDefault" id="flexRadioDefault1" onclick="sortDateDescending();"{% if order_by != 'date-ascending' %} checked{% endif %}>
            <label class="form-check-label" for="flexRadioDefault1">Sort by Newest</label>
        </div>
        <div style="margin-left: 1.6rem;">
            <input type="radio" name="flexRadioDefault" id="flexRadioDefault2" onclick="sortDateAscending();"{% if order_by == 'date-ascending'%} checked{% endif %}>
            <label class="form-check-label" for="flexRadioDefault2">Sort by Oldest</label>
        </div>
    </div>
</form>
{% if campaign or activity or statuses or start or end %}
    <div class="bg-light flex-row" id="current-filters">
        <span class="align-middle d-inline fw-bold">Filtered by: </span>
        <ul class="d-inline">
            {% if campaign %}
                <li class="btn btn-xs font-size-sm rounded-pill">
                    <label class="m-0 fw-normal">
                        <input type="hidden" value="campaign">
                        campaign: {{ campaign.slug }}
                    </label>
                    <a href="?{% qs_alter request.GET tab='recent' delete:campaign %}" class="btn" role="button">
                        <span aria-hidden="true" class="fas fa-times"></span>
                    </a>
                </li>
            {% endif %}
            {% if activity %}
                <li class="btn btn-xs font-size-sm rounded-pill">
                    <label class="m-0 fw-normal">
                        <input type="hidden" value="activity">
                        contribution: {{ activity }}
                    </label>
                    <a href="?{% qs_alter request.GET tab='recent' delete:activity %}" class="btn" role="button">
                        <span aria-hidden="true" class="fas fa-times"></span>
                    </a>
                </li>
            {% endif %}
            {# One removable chip per active status filter; the link drops only this status value from the query string. #}
            {% for status in statuses %}
                <li class="btn btn-xs font-size-sm rounded-pill">
                    <label class="m-0 fw-normal">
                        {# Marker names the filter kind, in parallel with the campaign / activity / date chips. #}
                        <input type="hidden" value="status">
                        status: {% if status == 'submitted' %}needs review{% else %}{{ status }}{% endif %}
                    </label>
                    <a href="?{% qs_alter request.GET tab='recent' delete_value:"status",status %}" class="btn" role="button">
                        <span aria-hidden="true" class="fas fa-times"></span>
                    </a>
                </li>
            {% endfor %}
            {% if start or end %}
                <li class="btn btn-xs font-size-sm rounded-pill">
                    <label class="m-0 fw-normal">
                        <input type="hidden" value="date">
                        {% if start and end %}
                            date: {{ start }} to {{ end }}
                        {% else %}
                            date: {% if start %}{{ start }}{% else %}{{ end }}{% endif %}
                        {% endif %}
                    </label>
                    <a href="?{% qs_alter request.GET tab='recent' delete:start delete:end %}" class="btn" role="button">
                        <span aria-hidden="true" class="fas fa-times"></span>
                    </a>
                </li>
            {% endif %}
        </ul>
    </div>
{% endif %}
<table class="table table-striped table-responsive-sm">
    <thead class="border-y">
        <tr class="text-start">
            <th class="date-header">Date</th>
            <th>Page</th>
            <th>
                <div data-bs-toggle="dropdown" aria-haspopup="true" aria-expanded="false">Campaign/Item <span class="fa fa-chevron-down"></span></div>
                <div class="dropdown-menu border border-primary py-0 rounded-0">
                    {% if campaign %}
                        <a class="dropdown-item border-bottom border-primary filter-link" href="?{% qs_alter request.GET tab='recent' delete:campaign %}">Show All</a>
                    {% endif %}
                    {% for recent_campaign in recent_campaigns %}
                        <a class="dropdown-item{% if not forloop.first %} border-top border-primary{% endif %}{% if campaign.pk == recent_campaign.pk %} fw-bold{% endif %} filter-link" href="?{% qs_alter request.GET campaign=recent_campaign.pk delete:page %}">
                            {{ recent_campaign.title }}
                        </a>
                    {% endfor %}
                </div>
            </th>
            <th>
                <div data-bs-toggle="dropdown" aria-haspopup="true" aria-expanded="false">Your Contribution <span class="fa fa-chevron-down"></span></div>
                <div class="dropdown-menu border border-primary py-0 rounded-0">
                    {% if activity %}
                        <a class="dropdown-item border-bottom border-primary filter-link" href="?{% qs_alter request.GET tab='recent' delete:activity %}">Show All</a>
                    {% endif %}
                    <a class="dropdown-item border-bottom border-primary{% if activity == 'reviewed' %} fw-bold{% endif %} filter-link" href="?{% qs_alter request.GET activity='reviewed' delete:page %}">Reviewed</a>
                    <a class="dropdown-item{% if activity == 'transcribed' %} fw-bold{% endif %} filter-link" href="?{% qs_alter request.GET activity='transcribed' delete:page %}">Transcribed</a>
                </div>
            </th>
            <th>
                <div data-bs-toggle="dropdown" aria-haspopup="true" aria-expanded="false">Current Status <span class="fa fa-chevron-down"></span></div>
                <div class="dropdown-menu border border-primary py-0 rounded-0">
                    <a class="dropdown-item border-bottom border-primary{% if 'in_progress' in status_list %} fw-bold{% endif %} filter-link" href="?{% qs_alter request.GET status='in_progress' delete:page %}">In Progress</a>
                    <a class="dropdown-item border-bottom border-primary{% if 'submitted' in status_list %} fw-bold{% endif %} filter-link" href="?{% qs_alter request.GET status='submitted' delete:page %}">Needs Review</a>
                    <a class="dropdown-item{% if 'completed' in status_list %} fw-bold{% endif %} filter-link" href="?{% qs_alter request.GET status='completed' delete:page %}">Completed</a>
                </div>
            </th>
        </tr>
    </thead>
    <tbody>
        {% for asset in page_obj %}
            <tr class="{{ asset.item.project.campaign.id }} recent-page">
                <td class="col-md-3"><abbr title="{{ asset.latest_activity|date:'SHORT_DATE_FORMAT' }}">{{ asset.latest_activity }}</abbr></td>
                <td class="text-end"><a href="{{ asset.get_absolute_url }}">{{ asset.sequence }}</a></td>
                <td><a href="{{ asset.item.get_absolute_url }}">{{ asset.item.title }}</a></td>
                <td>{% if asset.last_reviewed %}Reviewed{% else %}Transcribed{% endif %}</td>
                <td>{{ asset.get_transcription_status_display }}</td>
            </tr>
        {% endfor %}
    </tbody>
</table>
<div class="row">
    {% include "fragments/standard-pagination.html" %}
</div>


================================================
FILE: concordia/templates/fragments/sharing-button-group.html
================================================
{# Share links for the page described by the `url` and `title` context variables. #}
{# The tweet text is rendered with autoescape off before urlencode runs: otherwise HTML entities produced by autoescaping (e.g. for an apostrophe or ampersand in the title) would be percent-encoded and show up literally in the tweet. The percent-encoded result is safe inside the attribute. #}
{# Every target="_blank" link carries rel="noopener", as the copy-link button already did. #}
<div class="concordia-share-button-group btn-group" role="navigation" aria-label="Links to share this page">
    <a class="facebook-share-button btn btn-link px-1 py-0" target="_blank" rel="noopener" role="button" title="Share this page on Facebook" href="https://www.facebook.com/share.php?u={{ url|urlencode:"" }}"><span class="bitmap-icon facebook-icon"></span></a>
    <a class="twitter-share-button btn btn-link px-1 py-0" target="_blank" rel="noopener" role="button" title="Share this page on Twitter" href="https://twitter.com/intent/tweet?text={% filter urlencode %}{% autoescape off %}”{{ title }}” {{ url }} #ByThePeople @Crowd_LOC{% endautoescape %}{% endfilter %}&amp;source=webclient"><span class="bitmap-icon twitter-icon"></span></a>
    <a class="copy-url-button btn btn-link px-1 py-0" target="_blank" rel=noopener role="button" data-bs-toggle="tooltip" data-bs-trigger="manual" data-bs-placement="bottom" aria-label="Copy this link to your clipboard" href="{{ url }}"><span class="bitmap-icon copy-link-icon"></span></a>
</div>


================================================
FILE: concordia/templates/fragments/standard-pagination.html
================================================
{% load concordia_querystring %}

{% comment %}
This template fragment assumes that you are using Bootstrap's default pagination
with a Django ListView CBV or equivalent which has the default is_paginated,
paginator, and page_obj variables defined.
{% endcomment %}

{% if is_paginated %}
    <nav class="w-100" aria-label="Pagination">
        <ul class="pagination mx-auto justify-content-center">
            {# "Previous" chevron: a real link when a previous page exists, otherwise a disabled placeholder hidden from assistive technology. #}
            {% if page_obj.has_previous %}
                <li class="page-item">
                    {# aria-label replaces the non-existent aria-title attribute. #}
                    <a class="page-link" href="?{% qs_alter request.GET page=page_obj.previous_page_number %}" aria-label="Previous Page">
                        <span class="fas fa-chevron-left"><span class="visually-hidden">Previous Page</span></span>
                    </a>
                </li>
            {% else %}
                <li class="page-item disabled" aria-hidden="true">
                    <span class="page-link">
                        <span class="fas fa-chevron-left"></span>
                    </span>
                </li>
            {% endif %}

            {% if page_obj.number > 1 %}
                <li class="page-item">
                    <a class="page-link" href="?{% qs_alter request.GET page=1 %}">1</a>
                </li>
            {% endif %}

            {% if page_obj.previous_page_number > 3 %}
                <li class="page-item disabled" aria-hidden="true"><span class="page-link">…</span></li>
            {% endif %}

            {% if page_obj.has_previous %}
                {% with page_obj.previous_page_number|add:-1 as second_previous_page %}
                    {% if second_previous_page > 1 %}
                        <li class="page-item">
                            <a class="page-link" href="?{% qs_alter request.GET page=second_previous_page %}">{{ second_previous_page }}</a>
                        </li>
                    {% endif %}
                {% endwith %}
            {% endif %}

            {% if page_obj.previous_page_number > 1 %}
                <li class="page-item">
                    <a class="page-link" href="?{% qs_alter request.GET page=page_obj.previous_page_number %}">{{ page_obj.previous_page_number }}</a>
                </li>
            {% endif %}

            <li class="page-item active">
                <a class="page-link" href="?{% qs_alter request.GET page=page_obj.number %}" aria-current="page">
                    {{ page_obj.number }}
                </a>
            </li>

            {% if page_obj.next_page_number < paginator.num_pages %}
                <li class="page-item">
                    <a class="page-link" href="?{% qs_alter request.GET page=page_obj.next_page_number %}">{{ page_obj.next_page_number }}</a>
                </li>
            {% endif %}

            {% if page_obj.has_next %}
                {% with page_obj.next_page_number|add:1 as second_next_page %}
                    {% if second_next_page < paginator.num_pages %}
                        <li class="page-item">
                            <a class="page-link" href="?{% qs_alter request.GET page=second_next_page %}">{{ second_next_page }}</a>
                        </li>
                    {% endif %}
                {% endwith %}
            {% endif %}

            {% if page_obj.next_page_number|add:2 < paginator.num_pages %}
                <li class="page-item disabled" aria-hidden="true"><span class="page-link">…</span></li>
            {% endif %}

            {% if page_obj.number < paginator.num_pages %}
                <li class="page-item">
                    <a class="page-link" href="?{% qs_alter request.GET page=paginator.num_pages %}">{{ paginator.num_pages }}</a>
                </li>
            {% endif %}

            {# "Next" chevron: a real link when a next page exists, otherwise a disabled placeholder hidden from assistive technology. #}
            {% if page_obj.has_next %}
                <li class="page-item">
                    {# aria-label replaces the non-existent aria-title attribute. #}
                    <a class="page-link" href="?{% qs_alter request.GET page=page_obj.next_page_number %}" aria-label="Next Page">
                        <span class="fas fa-chevron-right"><span class="visually-hidden">Next Page</span></span>
                    </a>
                </li>
            {% else %}
                <li class="page-item disabled" aria-hidden="true">
                    <span class="page-link">
                        <span class="fas fa-chevron-right"></span>
                    </span>
                </li>
            {% endif %}
        </ul>
    </nav>
    {# Page-jump form: a GET form whose select lists every page; submitting it reloads the listing at the chosen page #}
    <nav class="w-100" aria-label="Page Jump">
        <form method="get" class="d-flex justify-content-center mt-3" role="form">
            <div class="input-group input-group-sm" style="max-width: 240px;">
                <label class="input-group-text" for="page-jump">Jump to</label>
                <select class="form-select" id="page-jump" name="page">
                    {% for i in paginator.page_range %}
                        <option value="{{ i }}" {% if i == page_obj.number %}selected{% endif %}>
                            Page {{ i }}{% if i == page_obj.number %} of {{ paginator.num_pages }}{% endif %}
                        </option>
                    {% endfor %}
                </select>
                <button type="submit" class="btn btn-primary">Go</button>
            </div>

            {# Preserve other query parameters. QueryDict.lists is used instead of items so that a key repeated in the query string keeps every value rather than only its last one #}
            {% for key, values in request.GET.lists %}
                {% if key != 'page' %}
                    {% for value in values %}
                        <input type="hidden" name="{{ key }}" value="{{ value }}">
                    {% endfor %}
                {% endif %}
            {% endfor %}
        </form>
    </nav>
{% endif %}


================================================
FILE: concordia/templates/fragments/transcription-progress-bar.html
================================================
{% load humanize %}
{# Headline count of registered contributors #}
<div id="contributor-stats">
    {{ contributor_count|intcomma }} registered
    contributor{{contributor_count|pluralize}}
</div>

{# Stacked bar with one segment per status (completed, needs review, in progress); each segment's width is the matching *_percent context value #}
<div id="progress-bar" class="progress">
    <div
        title="Completed ({{ completed_count|intcomma }} page{{ completed_count|pluralize }})"
        class="progress-bar bg-completed"
        role="progressbar"
        style="width: {{ completed_percent }}%"
        aria-valuenow="{{ completed_percent }}"
        aria-valuemin="0"
        aria-valuemax="100"
    ></div>
    <div
        title="Needs Review ({{ submitted_count|intcomma }} page{{ submitted_count|pluralize }})"
        class="progress-bar bg-submitted"
        role="progressbar"
        style="width: {{ submitted_percent }}%"
        aria-valuenow="{{ submitted_percent }}"
        aria-valuemin="0"
        aria-valuemax="100"
    ></div>
    <div
        title="In Progress ({{ in_progress_count|intcomma }} page{{ in_progress_count|pluralize }})"
        class="progress-bar bg-in_progress"
        role="progressbar"
        style="width: {{ in_progress_percent }}%"
        aria-valuenow="{{ in_progress_percent }}"
        aria-valuemin="0"
        aria-valuemax="100"
    ></div>
</div>
{# Per-status page counts. Each row links to the listing filtered by that status, and the row matching the active transcription_status filter is highlighted #}
<div class="table-responsive-md">
    <table id="progress-stats" class="table table-sm fw-light">
        <tbody>
            {% for key, label, value in transcription_status_counts %}
                <tr
                    class="{% if filters.transcription_status == key %}table-secondary{% endif %}"
                >
                    <th class="text-nowrap">
                        <a href="?transcription_status={{ key|urlencode }}">
                            <span
                                class="transcription-status-key bg-{{ key }}"
                            ></span>
                            {{ label }}
                        </a>
                    </th>
                    <td class="text-end">
                        <a href="?transcription_status={{ key|urlencode }}">
                            {# Pluralize the tooltip so a count of one reads "1 page", matching the bar segment titles in this fragment #}
                            <abbr title="{{ value|intcomma }} page{{ value|pluralize }}"
                            >{{ value|intcomma }}</abbr
                            >
                        </a>
                    </td>
                </tr>
            {% endfor %}
        </tbody>
    </table>
</div>


================================================
FILE: concordia/templates/fragments/transcription-progress-row.html
================================================
{% load humanize %}

{# Stacked progress bar with four segments (completed, needs review, in progress, not started), each sized by its *_percent context value #}
<div class="row">
    <div class="col-12 col-lg pt-1 pb-1">
        <div class="progress campaign-page-progress">
            <div
                title="Completed ({{ completed_count|intcomma }} page{{ completed_count|pluralize }})"
                class="progress-bar bg-completed"
                role="progressbar"
                style="width: {{ completed_percent }}%"
                aria-valuenow="{{ completed_percent }}"
                aria-valuemin="0"
                aria-valuemax="100"
            ></div>
            <div
                title="Needs Review ({{ submitted_count|intcomma }} page{{ submitted_count|pluralize }})"
                class="progress-bar bg-submitted"
                role="progressbar"
                style="width: {{ submitted_percent }}%"
                aria-valuenow="{{ submitted_percent }}"
                aria-valuemin="0"
                aria-valuemax="100"
            ></div>
            {# The two segments below carry both the underscore and the hyphen spelling of their status class #}
            <div
                title="In Progress ({{ in_progress_count|intcomma }} page{{ in_progress_count|pluralize }})"
                class="progress-bar bg-in_progress bg-in-progress"
                role="progressbar"
                style="width: {{ in_progress_percent }}%"
                aria-valuenow="{{ in_progress_percent }}"
                aria-valuemin="0"
                aria-valuemax="100"
            ></div>
            <div
                title="Not Started ({{ not_started_count|intcomma }} page{{ not_started_count|pluralize }})"
                class="progress-bar bg-not_started bg-not-started"
                role="progressbar"
                style="width: {{ not_started_percent }}%"
                aria-valuenow="{{ not_started_percent }}"
                aria-valuemin="0"
                aria-valuemax="100"
            ></div>
        </div>
    </div>
</div>
{# Text legend of status percentages; an entry is rendered only when its percentage is truthy, so a numeric 0 hides it #}
<div class="row">
    <div class="col-12 col-lg pb-1">
        <ul class="progress-bar-labels list-unstyled m-0 p-1">
            {% if completed_percent %}
                <li>{{ completed_percent }}% Completed</li>
            {% endif %}
            {% if submitted_percent %}
                <li>{{ submitted_percent }}% Needs Review</li>
            {% endif %}
            {% if in_progress_percent %}
                <li>{{ in_progress_percent }}% In Progress</li>
            {% endif %}
            {% if not_started_percent %}
                <li>{{ not_started_percent }}% Not Started</li>
            {% endif %}
        </ul>
    </div>
</div>


================================================
FILE: concordia/templates/fragments/transcription-status-filters.html
================================================
{% load humanize %}

{# Button group of status filter links built from status_choices. size == "large" selects the wide button group, the large colour key and shows the per-status count #}
<div class="btn-group btn-group-toggle flex-wrap justify-content-center {% if size == "large" %}btn-group-xl w-100{% else %}btn-group-sm{% endif %}">
    {% for url, classes, key, label, count in status_choices %}
        <a class="btn btn-outline-dark {{ classes }}" href="{{ url|default:"?" }}">
            {# Colour key swatch; skipped for choices without a key #}
            {% if key %}
                <span class="bg-{{ key }} {% if size == "large" %}transcription-status-key-lg{% else %}transcription-status-key{% endif %}"></span>
            {% endif %}

            {{ label }} {% if size == "large" and count >= 0 %}({{ count|intcomma }}){% endif %}
        </a>
    {% endfor %}
</div>


================================================
FILE: concordia/templates/home.html
================================================
{% extends "base.html" %}
{% load staticfiles %}
{% load feature_flags %}

{% block title %}Home{% endblock title %}

{% block breadcrumbs-container %}{% endblock breadcrumbs-container %}

{% block extra_main_classes %}{% endblock %}

{% block main_content %}

    {% flag_enabled 'SHOW_BANNER' as SHOW_BANNER %}

    {# Optional dismissible banner, rendered only when the SHOW_BANNER flag is on and a banner object is in the context #}
    {# NOTE(review): this wrapper reuses the id "homepage-contribute-container" of the contribute section that follows, so the id occurs twice whenever the banner renders; confirm whether any styles depend on it before renaming #}
    {% if SHOW_BANNER and banner %}
        <div id="homepage-contribute-container" class="container my-4">
            <div class="px-default ms-md-3 mb-5">
                <div class="alert {{ banner.alert_class }} alert-dismissible w-100 d-flex" id="banner-{{ banner.slug }}" role="alert">
                    <div id="banner-inner" class="d-flex flex-1 justify-content-center">
                        {% if banner.link %}
                            {# rel="noopener" keeps the newly opened page from reaching back through window.opener #}
                            <a class="btn {{ banner.btn_class }}" href="{{ banner.link }}"{% if banner.open_in_new_window_tab %} target="_blank" rel="noopener"{% endif %}>
                                {{ banner.text }}
                            </a>
                        {% else %}
                            {# Explicit row: a td directly inside table is invalid markup that browsers silently repair into this same structure #}
                            <table class="{{ banner.btn_class }} fw-bold">
                                <tr>
                                    <td class="align-middle">{{ banner.text }}</td>
                                </tr>
                            </table>
                        {% endif %}
                        <button type="button" class="btn btn-dark" id="no-interface-banner">Don't display this again</button>
                    </div>
                    <div class="d-flex justify-content-end">
                        <a type="button" data-bs-dismiss="alert" aria-label="Close">
                            <span class="fas fa-times text-white"></span>
                        </a>
                    </div>
                </div>
            </div>
        </div>
    {% endif %}

    {# Intro blurb plus three call-to-action tiles linking to the welcome guide, the transcription rules and the review instructions #}
    <div id="homepage-contribute-container" class="container my-4">
        <div class="px-default ms-md-3 mb-5">
            <h2 class="text-center font-serif">Be a virtual volunteer!</h2>
            <p class="text-center px-md-5 mx-md-5">Help transcribe Library of Congress documents. Volunteers create and review transcriptions to improve search, access, and discovery of these pages from history.</p>
        </div>
        <ul id="homepage-contribute-activities" class="list-unstyled row text-center">
            <li class="col-sm px-4 mb-4">
                <a class="text-dark" href="{% url 'welcome-guide' %}">
                    <img class="img-fluid" src="{% static 'img/homepage-search.svg' %}" alt="" width="200" height="200" loading="lazy">
                    <h3 class="mt-3 text-uppercase">Get started</h3>
                    <p id="homepage-activity-tag-help" class="m-0">Learn how to volunteer. Anyone can contribute!</p>
                </a>
            </li>
            <li class="col-sm px-4 mb-4">
                <a class="text-dark" href="{% url 'transcription-basic-rules' %}">
                    <img class="img-fluid" src="{% static 'img/homepage-pencil.svg' %}" alt="" width="200" height="200" loading="lazy">
                    <h3 class="mt-3 text-uppercase">Transcribe</h3>
                    <p id="homepage-activity-transcribe-help" class="m-0">No account needed! Type what you see on the page.</p>
                </a>
            </li>
            <li class="col-sm px-4 mb-4">
                <a class="text-dark" href="{% url 'how-to-review' %}">
                    <img class="img-fluid" src="{% static 'img/homepage-checkmark.svg' %}" alt="" width="200" height="200" loading="lazy">
                    <h3 class="mt-3 text-uppercase">Review</h3>
                    <p id="homepage-activity-review-help" class="m-0">Review is the crucial final step! Register to edit and complete transcriptions.</p>
                </a>
            </li>
        </ul>
    </div>
    {# Feature flags selecting the carousel variant (CAROUSEL_CMS) and, for the legacy variant, which hard-coded slides are shown #}
    {% flag_enabled 'ADVERTISE_ACTIVITY_UI' as ADVERTISE_ACTIVITY_UI %}
    {% flag_enabled 'NEW_CAROUSEL_SLIDE' as NEW_CAROUSEL_SLIDE %}
    {% flag_enabled 'CAROUSEL_CMS' as CAROUSEL_CMS %}

    {# CAROUSEL_CMS on: indicators and slides are generated from the `slides` context variable, each slide carrying its own overlay #}
    {% if CAROUSEL_CMS %}
        <div id="homepage-carousel" class="carousel slide container">
            <button type="button" id="play-pause-button" class="btn btn-primary play-pause-button" aria-label="pause">
                <i class="fa fa-solid fa-pause"></i>
            </button>
            <div class="carousel-indicators d-none d-lg-flex">
                {% for slide in slides %}
                    <button type="button" data-bs-target="#homepage-carousel" data-bs-slide-to="{{ forloop.counter0 }}" {% if forloop.first %}class="active" aria-current="true" {% endif %}aria-label="Slide {{ forloop.counter }}"></button>
                {% endfor %}
            </div>

            <div class="carousel-inner">
                {% for slide in slides %}
                    <div class="carousel-item {% if forloop.first %} active {% endif %}" {% if slide.overlay_position == "right" %} data-overlay-position="top-right" {% endif %} data-bs-title="{{ slide.headline }}" data-hero-text="{{ slide.body }}" data-link-url="{{ slide.lets_go_url }}">
                        <img class="d-block img-fluid" src="{{ MEDIA_URL }}{{ slide.carousel_image }}" alt="{{ slide.image_alt_text }}" width="1200" height="480">
                        <div class="carousel-overlay text-center d-flex flex-column justify-content-around align-items-center">
                            <h2 class="h1 title mb-1 fw-bold">{{ slide.headline }}</h2>
                            <p class="hero-text mx-auto">{{ slide.body }}</p>
                            <a class="btn btn-primary px-4" href="{{ slide.lets_go_url }}">LET'S GO!</a>
                        </div>
                    </div>
                {% endfor %}
            </div>
            <a class="carousel-control-prev" href="#homepage-carousel" role="button" data-bs-slide="prev">
                <span class="carousel-control-prev-icon" aria-hidden="true"></span>
                <span class="visually-hidden">Previous</span>
            </a>
            <a class="carousel-control-next" href="#homepage-carousel" role="button" data-bs-slide="next">
                <span class="carousel-control-next-icon" aria-hidden="true"></span>
                <span class="visually-hidden">Next</span>
            </a>

        </div>
    {% else %}
        {# CAROUSEL_CMS off: legacy carousel whose slides are hard-coded in this template #}
        <div id="homepage-carousel" class="carousel slide container" data-bs-ride="carousel" data-bs-pause="hover">
            <ol class="carousel-indicators d-none d-lg-flex">
                <li data-bs-target="#homepage-carousel" data-bs-slide-to="0" class="active"></li>
                <li data-bs-target="#homepage-carousel" data-bs-slide-to="1"></li>
                <li data-bs-target="#homepage-carousel" data-bs-slide-to="2"></li>
                <li data-bs-target="#homepage-carousel" data-bs-slide-to="3"></li>
                {# Fifth indicator only when the activity UI slide is included #}
                {% if ADVERTISE_ACTIVITY_UI %}
                    <li data-bs-target="#homepage-carousel" data-bs-slide-to="4"></li>
                {% endif %}
            </ol>
            <div class="carousel-inner">
                {# NEW_CAROUSEL_SLIDE puts the suffrage slide first and leaves out the crowd-home slide; otherwise the Whitman slide leads #}
                {% if NEW_CAROUSEL_SLIDE %}
                    <div class="carousel-item active" data-bs-title="Join our cause!" data-hero-text="Women's suffrage review challenge August 12-19. Help complete pages and get to know the women who fought for change 100 years ago" data-link-url="{% url 'redirect-to-next-reviewable-topic-asset' 'suffrage-women-fight-for-the-vote' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/suffrage.jpg' %}" alt="Carrie Chapman Catt stands with protesters advocating for women's right to vote. Some protesters carry banners and shields with state names, including Wyoming, California, Kansas. Some women are dressed in white, wearing crowns and carrying musical instruments, and American flags.">
                    </div>
                    {% if ADVERTISE_ACTIVITY_UI %}
                        <div class="carousel-item" data-overlay-position="top-right" data-bs-title="Find your perfect page" data-hero-text="Log in or register to transcribe and review in our new way of browsing" data-link-url="{% url 'action-app' %}">
                            <img class="d-block w-100" src="{% static 'img/homepage-carousel/activity-ui.jpg' %}" alt="New crowdsourcing browse interface. Two rows of pages volunteers can choose from to review.">
                        </div>
                    {% endif %}
                    <div class="carousel-item" data-bs-title="Walt Whitman at 200" data-hero-text="Transcribe and review poetry, letters, and writings of Walt Whitman. Discover how he wrote and lived for yourself." data-link-url="{% url 'transcriptions:redirect-to-next-transcribable-campaign-asset' 'walt-whitman' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/whitman.jpg' %}" alt="Walt Whitman in his younger years, a black and white engraving. Whitman with his right hand on his hip and his left in his pocket wearing a black rimmed hat.">
                    </div>
                    <div class="carousel-item" data-overlay-position="top-right" data-bs-title="Review Now" data-hero-text="Approve or correct other volunteers' transcriptions to help them cross the finish line." data-link-url="{% url 'transcriptions:redirect-to-next-reviewable-campaign-asset' 'mary-church-terrell-advocate-for-african-americans-and-women' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/review.jpg' %}" alt="Close up of hand-written text of Mary Church Terrell's first speech to the NAACP">
                    </div>
                    <div class="carousel-item" data-bs-title="Where to start?" data-hero-text="Find instructions and help to get started in our Welcome Guide" data-link-url="{% url 'welcome-guide' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/welcome-guide.jpg' %}" alt="Collection of typed report pages by baseball scout Branch Rickey">
                    </div>
                {% else %}
                    <div class="carousel-item active" data-bs-title="Walt Whitman at 200" data-hero-text="Transcribe and review poetry, letters, and writings of Walt Whitman. Discover how he wrote and lived for yourself." data-link-url="{% url 'transcriptions:redirect-to-next-transcribable-campaign-asset' 'walt-whitman' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/whitman.jpg' %}" alt="Walt Whitman in his younger years, a black and white engraving. Whitman with his right hand on his hip and his left in his pocket wearing a black rimmed hat.">
                    </div>
                    {% if ADVERTISE_ACTIVITY_UI %}
                        <div class="carousel-item" data-overlay-position="top-right" data-bs-title="Find your perfect page" data-hero-text="Log in or register to transcribe and review in our new way of browsing" data-link-url="{% url 'action-app' %}">
                            <img class="d-block w-100" src="{% static 'img/homepage-carousel/activity-ui.jpg' %}" alt="New crowdsourcing browse interface. Two rows of pages volunteers can choose from to review.">
                        </div>
                    {% endif %}
                    <div class="carousel-item" data-overlay-position="top-right" data-bs-title="Review Now" data-hero-text="Approve or correct other volunteers' transcriptions to help them cross the finish line." data-link-url="{% url 'transcriptions:redirect-to-next-reviewable-campaign-asset' 'mary-church-terrell-advocate-for-african-americans-and-women' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/review.jpg' %}" alt="Close up of hand-written text of Mary Church Terrell's first speech to the NAACP">
                    </div>
                    <div class="carousel-item" data-bs-title="Where to start?" data-hero-text="Find instructions and help to get started in our Welcome Guide" data-link-url="{% url 'welcome-guide' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/welcome-guide.jpg' %}" alt="Collection of typed report pages by baseball scout Branch Rickey">
                    </div>
                    <div class="carousel-item" data-overlay-position="top-right" data-bs-title="Jump in!" data-hero-text="Transcription uncovers our shared history and makes documents more searchable for everyone." data-link-url="{% url 'transcriptions:redirect-to-next-transcribable-campaign-asset' 'mary-church-terrell-advocate-for-african-americans-and-women' %}">
                        <img class="d-block w-100" src="{% static 'img/homepage-carousel/crowd-home.jpg' %}" alt="A crowd of young women cheering and waving handkerchiefs">
                    </div>
                {% endif %}
            </div>
            <a class="carousel-control-prev" href="#homepage-carousel" role="button" data-bs-slide="prev">
                <span class="carousel-control-prev-icon" aria-hidden="true"></span>
                <span class="visually-hidden">Previous</span>
            </a>
            <a class="carousel-control-next" href="#homepage-carousel" role="button" data-bs-slide="next">
                <span class="carousel-control-next-icon" aria-hidden="true"></span>
                <span class="visually-hidden">Next</span>
            </a>
            {# Single shared overlay, pre-filled with the title, text and link of whichever slide starts out active #}
            {% if NEW_CAROUSEL_SLIDE %}
                <div class="carousel-overlay text-center d-flex flex-column justify-content-around align-items-center">
                    <h1 class="title">Join our cause!</h1>
                    <p class="hero-text mx-auto">Women's suffrage review challenge August 12-19. Help complete pages and get to know the women who fought for change 100 years ago</p>
                    <a class="btn btn-primary btn-lg" href="{% url 'redirect-to-next-reviewable-topic-asset' 'suffrage-women-fight-for-the-vote' %}">LET'S GO!</a>
                </div>
            {% else %}
                <div class="carousel-overlay text-center d-flex flex-column justify-content-around align-items-center">
                    <h1 class="title">Walt Whitman at 200</h1>
                    <p class="hero-text mx-auto">Transcribe and review poetry, letters, and writings of Walt Whitman. Discover how he wrote and lived for yourself.</p>
                    <a class="btn btn-primary btn-lg" href="{% url 'transcriptions:redirect-to-next-transcribable-campaign-asset' 'walt-whitman' %}">LET'S GO!</a>
                </div>
            {% endif %}
        </div>
    {% endif %}
    {# "Surprise me" shortcuts that link to the redirect views for the next transcribable and the next reviewable asset #}
    <div id="homepage-next-transcribable-links" class="container mt-5">
        <div class="row align-items-center justify-content-md-center">
            <h2 class="col-md-auto text-center text-nowrap px-5 py-3 m-0">Surprise me!</h2>
            <ul class="col-md-auto row list-unstyled m-0">
                <li class="col text-center text-bold px-5 py-3">
                    <a href="{% url 'redirect-to-next-transcribable-asset' %}"><span class="d-block text-dark fw-bold">Jump into</span> <span class="d-block text-nowrap h2">a transcription</span></a>
                </li>
                <li class="col text-center text-bold px-5 py-3">
                    <a href="{% url 'redirect-to-next-reviewable-asset' %}"><span class="d-block text-dark fw-bold">Jump into</span> <span class="d-block text-nowrap h2">a review</span></a>
                </li>
            </ul>
        </div>
    </div>
    {# Campaign teaser: thumbnails and titles for at most the first three entries of `campaigns`, followed by a link to the full list #}
    <div id="homepage-campaign-list" class="container pt-2 mt-5 mb-4">
        <h2 class="text-center font-serif mb-4">Campaigns: <small>Choose which collections to explore and transcribe</small></h2>
        <ul class="list-unstyled row text-center">
            {% for campaign in campaigns|slice:":3" %}
                <li class="col-sm mb-4">
                    {% url 'transcriptions:campaign-detail' campaign.slug as campaign_url %}
                    <a class="text-dark" href="{{ campaign_url }}">
                        <div class="aspect-ratio-box">
                            <div class="aspect-ratio-box-inner-wrapper">
                                <img src="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}" class="img-fluid" alt="{{ campaign.image_alt_text }}" loading="lazy">
                            </div>
                        </div>
                        <span class="d-block h4 mt-2">{{ campaign.title }}</span>
                    </a>
                </li>
            {% endfor %}
        </ul>
        <div class="text-center">
            <a class="btn btn-primary" href="{% url 'campaign-topic-list' %}" role="button">Browse All Campaigns</a>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/registration/activate.html
================================================
{% extends "base.html" %}
{% block main_content %}
    {# Static confirmation heading; this block reads no context variables #}
    <h2>Account Activation Complete</h2>
{% endblock main_content %}


================================================
FILE: concordia/templates/registration/login.html
================================================
{% extends "base.html" %}

{% load django_bootstrap5 %}

{% block head_content %}
    {# Keep the login page out of search indexes #}
    <meta name="robots" content="noindex">
    {{ block.super }}
    {# Turnstile API script. "module" is not a script attribute and was ignored, leaving a parser-blocking load; async defer is the loading form Cloudflare documents #}
    <script src="{{ TURNSTILE_JS_API_URL }}" async defer></script>
{% endblock head_content %}

{% block title %}Login{% endblock title %}

{% block main_content %}
    {# Login form posting to the 'login' URL, with the Turnstile challenge widget, the security notice and a password reset link #}
    <div class="container" role="dialog" aria-labelledby="dialog-title">
        <div class="row">
            <div class="col-8 col-md-6 col-lg-4 mx-auto my-3">
                <h2 id="dialog-title" class="text-center">Welcome back!</h2>

                <form id="login-form" method="post" action="{% url 'login' %}" class="col-10 my-3 mx-auto">
                    {% csrf_token %}

                    {# Carry the post-login redirect target through the POST when one was supplied #}
                    {% if next %}
                        <input type="hidden" name="next" value="{{ next }}" />
                    {% endif %}

                    {% bootstrap_form form %}
                    <div class="w-100 text-center mt-0 mb-3">{{ turnstile_form.turnstile }}</div>
                    <p>
                        By using this system, you agree to comply with
                        {# rel="noopener" keeps the page opened in the new tab from reaching back through window.opener #}
                        <a href="https://www.loc.gov/legal/" target="_blank" rel="noopener">the Library's
                            security requirements</a>
                    </p>
                    {% bootstrap_button "Login" button_type="submit" button_class="btn-primary" extra_classes="btn" id="login" %}
                </form>
            </div>
        </div>
        <div class="row">
            <div class="col-8 col-md-6 col-lg-4 mx-auto my-3 text-center">
                <a href="{% url 'password_reset' %}">Forgot my password</a>
            </div>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/registration/password_change_done.html
================================================
{% extends "base.html" %}

{% block main_content %}
    {# Confirmation shown after a password change, with links back to the account profile and the site root #}
    <div class="row flex-column align-items-center justify-content-center">
        <p>Your password was changed</p>

        <nav>
            <ul class="nav justify-content-center">
                <li class="nav-item">
                    <a class="nav-link" href="{% url 'user-profile' %}">
                        Return to your account profile
                    </a>
                </li>
                <li class="nav-item">
                    <a class="nav-link" href="/">Home</a>
                </li>
            </ul>
        </nav>

    </div>
{% endblock %}


================================================
FILE: concordia/templates/registration/password_change_form.html
================================================
{% extends "base.html" %}

{% load i18n staticfiles %}
{% load django_bootstrap5 %}

{% block head_content %}
    <meta name="robots" content="noindex">
    {{ block.super }}
{% endblock head_content %}

{% block main_content %}
    {# Password change form; the fields come from `form` via the bootstrap_form tag and the form posts back to the current URL #}
    <div class="container">
        <div class="row">
            <form method="post" class="col-md-6 mx-auto">
                {% csrf_token %}

                {% bootstrap_form form %}

                {% bootstrap_button "Save" button_type="submit" button_class="btn-primary" extra_classes="btn" %}
            </form>
        </div>
    </div>
{% endblock %}

{% block body_scripts %}
    {{ block.super }}
    <script src="{% static 'js/password-validation.js' %}"></script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/registration/password_reset_complete.html
================================================
{% extends "base.html" %}
{% load i18n %}

{% block title %}{{ title }}{% endblock %}
{% block content_title %}<h1>{{ title }}</h1>{% endblock %}

{% block main_content %}
    {# Confirmation shown once a password reset has completed, pointing new users to the welcome guide #}
    <div class="container p-3">
        <div class="row">
            <div class="col-md-6 mx-auto">
                <p>
                    Your password has been reset and you are now logged in. If your account was inactive, it has been activated.
                </p>
                <p>
                    New here? Visit the <a href="{% url 'welcome-guide' %}">By the People Welcome Guide</a> for instructions and help getting started.
                </p>
            </div>
        </div>
    </div>
{% endblock %}


================================================
FILE: concordia/templates/registration/password_reset_confirm.html
================================================
{% extends "base.html" %}
{% load i18n staticfiles %}
{% load django_bootstrap5 %}

{% block title %}{{ title }}{% endblock %}
{% block content_title %}<h1>{{ title }}</h1>{% endblock %}

{% block main_content %}
    {# Shows the new-password form when `validlink` is truthy; otherwise explains that the reset link is invalid and a new one must be requested #}
    <div class="container py-3">
        <div class="row">
            <div class="col-md-8 mx-auto my-3 p-3">
                {% if validlink %}
                    <form method="post" class="col-10 mx-auto">
                        {% csrf_token %}

                        {% bootstrap_form form %}

                        {% bootstrap_button "Change my password" button_type="submit" button_class="btn-primary" extra_classes="btn" %}
                    </form>
                {% else %}
                    <p>
                        {% trans "The password reset link was invalid, possibly because it has already been used. Please request a new password reset." %}
                    </p>
                {% endif %}
            </div>
        </div>
    </div>
{% endblock %}

{% block body_scripts %}
    {{ block.super }}
    <script src="{% static 'js/password-validation.js' %}"></script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/registration/password_reset_done.html
================================================
{% extends "base.html" %}
{% load i18n %}

{% block breadcrumbs %}
    <li class="breadcrumb-item active" aria-current="page">{% trans 'Password reset' %}</li>
{% endblock %}

{% block title %}{{ title }}{% endblock %}
{% block content_title %}<h1>{{ title }}</h1>{% endblock %}
{% block extra_main_classes %}container{% endblock %}
{% block main_content %}
    {# Notice shown after a reset request; the wording is the same whether or not an account exists for the entered email #}
    <div class="row">
        <div class="col-md-8 mx-auto p-3">
            <p role="alert">
                {% trans "We've emailed you instructions for setting your password, if an account exists with the email you entered. You should receive them shortly." %}
            </p>
            <p>
                {% trans "If you don't receive an email, please make sure you've entered the address you registered with, and check your spam folder." %}
            </p>
        </div>
    </div>
{% endblock %}


================================================
FILE: concordia/templates/registration/password_reset_email.html
================================================
{% load i18n %}{# Body of the password reset email. Autoescaping is off for the whole body, so site_name, domain and the username are emitted verbatim; the link scheme is fixed to https #}{% autoescape off %}
    {% blocktrans %}You're receiving this email because you requested a password reset for your user account at {{ site_name }}.{% endblocktrans %}

    {% trans "Please go to the following page and choose a new password:" %}
    {% block reset_link %}
        https://{{ domain }}{% url 'password_reset_confirm' uidb64=uid token=token %}
    {% endblock %}
    {% trans "Your username, in case you've forgotten:" %} {{ user.get_username }}

    {% trans "Thanks for using our site!" %}

    {% blocktrans %}The {{ site_name }} team{% endblocktrans %}

{% endautoescape %}


================================================
FILE: concordia/templates/registration/password_reset_form.html
================================================
{% extends "base.html" %}
{# Password reset request page: renders `form` with django_bootstrap5 and posts back to the current URL. #}

{% load i18n staticfiles %}
{% load django_bootstrap5 %}

{% block title %}{{ title }}{% endblock %}

{% block content_title %}<h1>{{ title }}</h1>{% endblock %}

{# Ask search engines not to index this page; block.super keeps the parent's head content. #}
{% block head_content %}
    <meta name="robots" content="noindex">
    {{ block.super }}
{% endblock head_content %}

{% block main_content %}
    <div class="container">
        <div class="row">
            {# NOTE(review): role="dialog" is applied to an inline column rather than a modal; confirm this is intended. #}
            <div class="col-6 mx-auto" role="dialog">
                <p>
                    {% trans "Forgotten your password? Enter your email address below, and we'll email instructions for setting a new one." %}
                </p>

                {# No action attribute: the form submits to the URL that rendered it. #}
                <form method="post">
                    {% csrf_token %}

                    {% bootstrap_form form %}

                    {% bootstrap_button "Reset my password" button_type="submit" button_class="btn-primary" extra_classes="btn"%}
                </form>
            </div>
        </div>
    </div>
{% endblock %}

{# Append password-validation.js after the scripts inherited from the parent template. #}
{% block body_scripts %}
    {{ block.super }}
    <script src="{% static 'js/password-validation.js' %}"></script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/registration/password_reset_subject.txt
================================================
{# Email subject line: plain text, so HTML autoescaping is disabled to keep characters such as & and ' literal. #}{% autoescape off %}{{ site_name }}{% endautoescape %}


================================================
FILE: concordia/templates/static-page.html
================================================
{% extends "base.html" %}
{% load staticfiles django_vite %}
{# Generic content page: renders `title` and the HTML in `body`, optionally beside a help-center navigation column. #}

{% block title %}{{ title }}{% endblock title %}

{# The about.js bundle is only loaded when the view sets `about_page`. #}
{% block extra_scripts %}
    {% if about_page %}
        {% vite_asset 'src/about.js' %}
    {% endif %}
{% endblock %}

{# `breadcrumbs` is iterated as (link, title) pairs; the last entry is the current page and is not linked. #}
{% block breadcrumbs %}
    {% for link, title in breadcrumbs %}
        {% if forloop.last %}
            <li class="breadcrumb-item active" aria-current="page" title="{{ title }}">{{ title }}</li>
        {% else %}
            <li class="breadcrumb-item"><a class="primary-text" href="{{ link }}" title="{{ title }}">{{ title }}</a></li>
        {% endif %}
    {% endfor %}
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container">
        <div class="row">
            <div class="col">
                <h1 class="my-3">{{ title }}</h1>

                <div class="simple-page">
                    {% if add_navigation %}
                        {# Two-column layout: guide links on the left, page body on the right. #}
                        <div class="row">
                            <div class="col-3">
                                <div class="nav flex-column help-center">
                                    <h4>Instructions</h4>
                                    {% for guide in guides %}
                                        {# The link whose path matches the current request is marked active. #}
                                        <a class="nav-link{% if guide.page.path == request.path %} active{% endif %}" href="{{ guide.page.path }}">
                                            {{ guide.title }}
                                        </a>
                                    {% endfor %}
                                    <span lang="es">
                                        <a class="nav-link" href="/help-center/how-to-transcribe-esp/">Instrucciones en español</a>
                                    </span>
                                </div>
                            </div>
                            <div class="p-3 col-9">
                                {# `body` is output unescaped, so it must already be trusted HTML. #}
                                {{ body|safe }}
                            </div>
                        </div>
                    {% else %}
                        {# `body` is output unescaped, so it must already be trusted HTML. #}
                        {{ body|safe }}
                    {% endif %}
                </div>
            </div>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/transcriptions/asset_detail/asset_reservation_failure_modal.html
================================================
{# Dialog content telling the user that someone else is already transcribing this page. #}
{# Only the inner .modal-dialog is defined here; the enclosing .modal container is presumably supplied by the including template (TODO confirm). #}
<div class="modal-dialog modal-dialog-centered" role="document">
    <div class="modal-content">
        <div class="modal-header">
            <h5 class="modal-title">Someone else is already transcribing this page</h5>
            <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
        </div>
        <div class="modal-body">
            <p>You can help by transcribing a new page, adding tags to this page, or coming back later to review this page's transcription.</p>
        </div>
        <div class="modal-footer">
            {# Links to `next_open_asset_url` from the template context. #}
            <a class="btn btn-primary" href="{{ next_open_asset_url }}">
                Find new page
            </a>
            <button type="button" class="btn btn-primary" data-bs-dismiss="modal">Close</button>
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/editor.html
================================================
{# Transcription editor for a single asset: status banner, text area and the action buttons for the current `transcription_status`. #}
<div class="flex-grow-1 d-flex d-print-block flex-column">
    {# The submit/review URLs and the transcription id are only emitted as data attributes when a transcription exists. #}
    <form id="transcription-editor" class="ajax-submission flex-grow-1 d-flex flex-column d-print-block" method="post" action="{% url 'save-transcription' asset_pk=asset.pk %}" data-transcription-status="{{ transcription_status }}" {% if transcription %}data-transcription-id="{{ transcription.pk|default:'' }}" {% if transcription.submitted %}data-unsaved-changes="true"{% endif %} data-submit-url="{% url 'submit-transcription' pk=transcription.pk %}" data-review-url="{% url 'review-transcription' pk=transcription.pk %}"{% endif %}>
        {% csrf_token %}
        <input type="hidden" name="supersedes" value="{{ transcription.pk|default:'' }}" />
        <div class="row justify-content-sm-between align-items-end mx-0">
            <div class="col ps-0">
                {# Every status heading is rendered; all but the one matching `transcription_status` start hidden. #}
                <div id="transcription-status-message">
                    <div id="transcription-status-display" class="row">
                        <h2 id="display-submitted" {% if transcription_status != 'submitted' %}hidden{% endif %}>
                            <span class="fas fa-list"></span>
                            Needs review
                        </h2>
                        <h2 id="display-completed" {% if transcription_status != 'completed' %}hidden{% endif %}>
                            <span class="fas fa-check"></span>
                            Completed
                        </h2>
                        <h2 id="display-notstarted" {% if transcription_status != "not_started" %}hidden{% endif %}>
                            <span class="fas fa-edit"></span>
                            Not started
                        </h2>
                        <h2 id="display-inprogress" {% if transcription_status != "in_progress" %}hidden{% endif %}>
                            <span class="fas fa-edit"></span>
                            In progress
                        </h2>
                        <span id="display-conflict" hidden>
                            <span class="fas fa-exclamation-triangle"></span>
                            Another user is transcribing this page
                        </span>
                    </div>
                </div>
                <div class="w-100">
                    <h2 id="message-contributors" {% if transcription_status == 'not_started' %}hidden{% endif %}>
                        Registered Contributors: <span id="message-contributors-num" class="fw-normal">{{ registered_contributors }}</span>
                    </h2>
                    <span id="message-notstarted" {% if transcription_status != 'not_started' %}hidden{% endif %}>
                        Transcribe this page.
                    </span>
                    <span id="message-inprogress" {% if transcription_status != 'in_progress' %}hidden{% endif %}>
                        Someone started this transcription. Can you finish it?
                    </span>
                    <span id="message-submitted" {% if transcription_status != 'submitted' %}hidden{% endif %}>
                        Check this transcription thoroughly. Accept if correct!
                    </span>
                    <span id="message-completed" {% if transcription_status != 'completed' %}hidden{% endif %}>
                        This transcription is finished! You can read and add tags.
                    </span>
                </div>
            </div>
            {% if cards %}
                <div id="instruction-buttons" class="d-flex align-items-end col pe-0">
                    <a class="fw-bold mt-3" id="quick-tips" data-bs-toggle="modal" data-bs-target="#tutorial-popup" role="button" href="#">
                        <u>Campaign Tips</u>
                    </a>
                    {% if guides %}
                        <div>
                            <button id="open-guide" class="btn btn-primary" type="button">How-To Guide</button>
                        </div>{% endif %}
                </div>
            {% endif %}
        </div>

        {% spaceless %}
            <div id="loading-container" class="pb-2">
                <div id="ocr-loading" class="spinner-border" role="status" aria-hidden="true" hidden>
                    <span class="visually-hidden">Loading...</span>
                </div>
            </div>
            <div class="d-flex flex-column flex-grow-1" id="transcription-input-container">
                {# Keep the variable tight against the textarea tags: spaceless only strips whitespace between tags, so any indentation around the text would become part of the field's value. #}
                <textarea readonly class="form-control rounded flex-grow-1 d-print-none" name="text" id="transcription-input" placeholder="{% if transcription_status == 'not_started' or transcription_status == 'in_progress' %}Go ahead, start typing. You got this!{% else %}Nothing to transcribe{% endif %}" aria-label="Transcription input">{{ transcription.text }}</textarea>
                {% if guides %}
                    {% include "transcriptions/asset_detail/guide.html" %}
                {% endif %}
            </div>

            <div class="print-transcription-text" aria-hidden="true" style="display: none;">{{ transcription.text }}</div>

            <div class="mt-3 mb-2 d-print-none d-flex flex-wrap justify-content-center align-items-center">
                {% if transcription_status == 'not_started' or transcription_status == 'in_progress' %}
                    <div class="form-check mt-0 mb-3 d-flex justify-content-center w-100">
                        <input id="nothing-to-transcribe" type="checkbox" class="form-check-input" />
                        <label class="form-check-label ms-1" for="nothing-to-transcribe">
                            Nothing to transcribe
                        </label>

                        <a tabindex="0" class="btn btn-link d-inline py-0" role="button" data-bs-toggle="popover" data-bs-placement="top" data-bs-trigger="focus click hover" title="Nothing to transcribe?" data-bs-html="true" data-bs-content="If there is no text to transcribe, check this box and click &quot;Submit&quot;. Learn more about what to transcribe and what to skip in &quot;How To.&quot;">
                            <span class="fas fa-question-circle" aria-label="Open Help"></span>
                        </a>
                    </div>

                    {# Save and Submit are rendered disabled; Undo/Redo are disabled unless `undo_available` / `redo_available` are set. #}
                    <div>
                        <button id="save-transcription-button" disabled type="submit" class="btn btn-primary mx-1 mb-2" title="Save the text you entered above">
                            Save
                        </button>
                        <button id="rollback-transcription-button" {% if not undo_available %}disabled{% endif %} type="button" class="btn btn-outline-primary mx-1 mb-2" title="Undo" data-url="{% url 'rollback-transcription' asset_pk=asset.pk %}">
                            <span class="fas fa-undo"></span> Undo
                        </button>
                        <button id="rollforward-transcription-button" {% if not redo_available %}disabled{% endif %} type="button" class="btn btn-outline-primary mx-1 mb-2" title="Redo" data-url="{% url 'rollforward-transcription' asset_pk=asset.pk %}">
                            Redo <span class="fas fa-redo"></span>
                        </button>
                        <button id="submit-transcription-button" disabled type="button" class="btn btn-primary mx-1 mb-2" title="Request another volunteer to review the text you entered above">
                            Submit for Review
                        </button>
                    </div>

                {% elif transcription_status == 'submitted' %}
                    {% if not user.is_authenticated %}
                        <p class="help-text">
                            <a href="{% url 'registration_register' %}">Register</a>
                            or
                            <a href="{% url 'login' %}?next={{ request.path|urlencode }}">login</a>
                            to help review
                        </p>
                    {% else %}
                        <button id="reject-transcription-button" disabled type="button" class="btn btn-primary mx-1" title="Correct errors you see in the text">Edit</button>
                        {# The Accept button is not offered to the user who submitted the transcription. #}
                        {% if transcription.user.pk == user.pk %}
                            <p class="help-text mt-2">You submitted this transcription. You can re-open it for editing if you wish to make changes before another volunteer reviews it.</p>
                        {% else %}
                            <button id="accept-transcription-button" disabled type="button" class="btn btn-primary mx-1" title="Confirm that the text is accurately transcribed">Accept</button>
                        {% endif %}
                    {% endif %}
                {% endif %}
                {# The Turnstile widget is only rendered while the page is editable and `anonymous_user_validation_required` is set. #}
                {% if anonymous_user_validation_required %}
                    {% if transcription_status == 'not_started' or transcription_status == 'in_progress' %}
                        <div class="w-100 text-center mt-1 mb-1">{{ turnstile_form.turnstile }}</div>
                    {% endif %}
                {% endif %}
            </div>
        {% endspaceless %}
    </form>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/error_modal.html
================================================
{# Generic error dialog content with a default title and message. #}
{# The title and body carry ids, presumably so client-side code can replace the default text (TODO confirm). #}
<div class="modal-dialog modal-dialog-centered" role="document">
    <div class="modal-content">
        <div class="modal-header">
            <h5 class="modal-title" id="error-modal-title">An error occurred</h5>
            <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
        </div>
        <div class="modal-body" id="error-modal-message">
            <p>An error occurred.</p>
        </div>
        <div class="modal-footer">
            <button type="button" class="btn btn-primary" data-bs-dismiss="modal">Close</button>
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/guide.html
================================================
{# How-To Guide sidebar: a carousel whose slide 0 is the table of contents, slide 1 is "About This Campaign", and slides 2+ are the entries of `guides`. #}
<div id="guide-sidebar" class="sidebar offscreen" tabindex="-1">
    <div id="title-bar" class="bg-primary px-2 py-1 row text-white">
        {# Jumps back to the table of contents (slide 0); the column starts hidden via d-none. #}
        <div id="guide-bars-col" class="col-1 d-none pt-2">
            <a id="guide-bars" data-bs-target="#guide-carousel" data-bs-slide-to="0" href="" aria-label="link">
                <i aria-hidden="true" class="fas fa-solid fa-bars ps-3 pb-2"></i>
            </a>
        </div>
        <div class="col-10">
            <h3 class="px-2 my-1 py-1">How-To Guide</h3>
        </div>
        <div class="col-1 pt-2">
            <a id="close-guide">
                <span aria-hidden="true" class="fas fa-times"></span>
            </a>
        </div>
    </div>
    <div id="guide-carousel" class="carousel carousel-fade" data-bs-interval="false">
        <div class="carousel-inner">
            <div class="carousel-item active" id="guide-nav">
                <ul class="nav flex-column">
                    <li class="nav-item toc-title">
                        <a class="nav-link" data-bs-target="#guide-carousel" data-bs-slide-to="1" href="#" tabindex="-1">About This Campaign</a>
                    </li>
                    {% for guide in guides %}
                        <li class="nav-item toc-title">
                            {# forloop.counter is 1-based and slides 0 and 1 are taken, hence counter + 1. #}
                            <a data-bs-target="#guide-carousel" data-bs-slide-to="{{ forloop.counter|add:1 }}" class="nav-link" href="#pane-{{ forloop.counter }}" tabindex="-1">
                                {{ guide.title }}
                            </a>
                        </li>
                    {% endfor %}
                </ul>
            </div>
            <div class="carousel-item container">
                <div class="border-bottom justify-content-end mb-3 py-1 d-flex">
                    <div class="col-7 justify-self-center me-4">
                        <h3>About This Campaign</h3>
                    </div>
                    <div class="col-1 pt-2">
                        {# NOTE(review): id="next-guide" is repeated on every pane's "next" link, so the id is not unique in the document. #}
                        <a class="fw-bold ms-3" id="next-guide" data-bs-target="#guide-carousel" data-bs-slide="next">&gt;</a>
                    </div>
                </div>
                <div class="guide-body">
                    {# The descriptions are output unescaped, so they must already be trusted HTML. #}
                    {% if campaign.description %}
                        <h4>About this campaign</h4>
                        <p>{{ campaign.description|safe }}</p>
                    {% endif %}
                    {% if asset.item.project.description %}
                        <h4>About this project</h4>
                        <p>{{ asset.item.project.description|safe }}</p>
                    {% endif %}
                    {% if campaign.helpfullink_set.related_links %}
                        <h5 class="pt-3">Helpful Links</h5>
                        {# The list is not wrapped in a <p>: a paragraph cannot contain a <ul>. #}
                        <ul>
                            {% for link in campaign.helpfullink_set.related_links %}
                                <li class="mb-3">
                                    <a href="{{ link.link_url }}" target="_blank" rel=noopener>
                                        {# Links whose URL does not contain loc.gov get an external-link icon. #}
                                        {{ link.title }}{% if 'loc.gov' not in link.link_url %} <i class="fa fa-external-link-alt"></i>{% endif %}
                                    </a>
                                </li>
                            {% endfor %}
                        </ul>
                    {% endif %}
                </div>
            </div>
            {% for guide in guides %}
                <div class="carousel-item container" id="pane-{{ forloop.counter }}">
                    <div class="border-bottom guide-header row">
                        <div class="col-1 pt-2 prev-guide">
                            <a class="fw-bold" id="previous-guide" data-bs-target="#guide-carousel" data-bs-slide="prev">&lt;</a>
                        </div>
                        <div class="col text-center ps-2">
                            <h3>{{ guide.title }}</h3>
                        </div>
                        <div class="col-1 pt-2 next-guide">
                            {# The last guide has no "next" link. #}
                            {% if not forloop.last %}
                                <a class="fw-bold" id="next-guide" data-bs-target="#guide-carousel" data-bs-slide="next">&gt;</a>
                            {% endif %}
                        </div>
                    </div>
                    <div class="guide-body">
                        {{ guide.body|safe }}
                    </div>
                </div>
            {% endfor %}
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/language_selection_modal.html
================================================
{# Language picker dialog: posts the chosen language to the generate-ocr-transcription URL for this asset. #}
<div class="modal-dialog modal-dialog-centered" role="document">
    <div class="modal-content">
        <div class="modal-header d-flex justify-content-end">
            <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
        </div>
        {# NOTE(review): this POST form has no csrf_token tag; presumably the AJAX submission code supplies the CSRF token. Confirm. #}
        <form id="ocr-transcription-form" class="ajax-submission" method="post" action="{% url 'generate-ocr-transcription' asset_pk=asset.pk %}" data-lock-element="#transcription-editor">
            <div class="modal-body">
                <div class="bg-light p-3">
                    <h5 class="modal-title mb-3">Select language</h5>
                    <p>Select the language the transcription is in from the list below.</p>
                    <div class="text-center pb-1">
                        <select id="language" name="language" size="7">
                            {# Each entry of `languages` is indexed as (value, label); "eng" is preselected. #}
                            {% for language in languages %}
                                <option value="{{ language.0 }}"{% if language.0 == "eng" %} selected="selected"{% endif %}>
                                    {{ language.1 }}
                                </option>
                            {% endfor %}
                        </select>
                    </div>
                </div>
            </div>
            <div class="modal-footer">
                <button type="button" class="btn btn-primary" data-bs-dismiss="modal">Cancel</button>
                {# The submit button and the supersedes field are omitted once the transcription is completed. #}
                {% if transcription_status != "completed" %}
                    <input type="hidden" name="supersedes" value="{{ transcription.pk|default:'' }}" />
                    <button id="ocr-transcription-button" class="btn btn-link underline-link fw-bold" disabled>Replace Text</button>
                {% endif %}
            </div>
        </form>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/navigation.html
================================================
{# Asset page navigation bar: page selector, previous/next buttons, fullscreen toggle and links to the source item and the next open page. #}
<nav id="asset-navigation" class="d-flex flex-wrap flex-grow-1 justify-content-sm-between align-items-center d-print-block" role="navigation">
    <div class="d-flex align-items-center">
        {# The form never submits to the server: the inline handler navigates to the selected option's URL and cancels the submit. #}
        <form class="p-1" onsubmit="document.location.href = encodeURI(document.getElementById('asset-selection').value); return false">
            <div class="input-group input-group-sm flex-nowrap">
                <div class="input-group-prepend">
                    <label class="input-group-text mt-1 p-0 pe-1 border-0" for="asset-selection">Page</label>
                </div>
                <select id="asset-selection" class="form-select form-select-sm">
                    {# `asset_navigation` is iterated as (sequence, slug) pairs; the current asset's sequence is preselected. #}
                    {% for sequence, slug in asset_navigation %}
                        <option {% if sequence == asset.sequence %}selected{% endif %} value="{% url 'transcriptions:asset-detail' campaign.slug project.slug item.item_id slug %}">{{ sequence }}</option>
                    {% endfor %}
                </select>
                <div class="input-group-append">
                    <button type="submit" class="btn btn-primary">Go</button>
                </div>
            </div>
        </form>

        {# Without a target URL the link is rendered disabled and has no href. #}
        <div class="btn-group btn-group-sm p-1">
            <a class="btn btn-primary {% if not previous_asset_url %}disabled{% endif %}" {% if previous_asset_url %}href="{{ previous_asset_url }}"{% else %}aria-disabled="true"{% endif %}>
                <span class="fas fa-chevron-left"></span>
                <span class="visually-hidden">Previous Page</span>
            </a>
            <a class="btn btn-primary {% if not next_asset_url %}disabled{% endif %}" {% if next_asset_url %}href="{{ next_asset_url }}"{% else %}aria-disabled="true"{% endif %}>
                <span class="fas fa-chevron-right"></span>
                <span class="visually-hidden">Next Page</span>
            </a>
        </div>

        <div class="btn-group btn-group-sm p-1">
            <button hidden id="go-fullscreen" class="btn btn-primary text-nowrap" data-bs-target="contribute-main-content">
                <span class="fas fa-arrows-alt"></span>
                Fullscreen
            </button>
        </div>
    </div>

    <div class="btn-group align-self-end" style="margin-right: -8px">
        {% if asset.resource_url %}
            <div class="btn-group-sm p-1" role="navigation" aria-label="Link to the original source for this item">
                {# Append sp=<sequence> unless the URL already carries it; use & instead of ? when the URL already has a query string. #}
                <a class="btn btn-outline-primary text-nowrap" target="_blank" rel=noopener title="View the original source for this item in a new tab" href="{{ asset.resource_url }}{% if 'sp=' not in asset.resource_url %}{% if '?' in asset.resource_url %}&amp;{% else %}?{% endif %}sp={{ asset.sequence }}{% endif %}">View on www.loc.gov <i class="fa fa-external-link-alt"></i></a>
            </div>
        {% endif %}

        <div class="btn-group-sm p-1" role="navigation" aria-label="Link to the next editable page">
            <a class="btn btn-outline-primary text-nowrap" title="Move to the next page in this item that needs help" href="{{ next_open_asset_url }}">Find a new page &rarr;</a>
        </div>
    </div>
</nav>


================================================
FILE: concordia/templates/transcriptions/asset_detail/nothing_to_transcribe_modal.html
================================================
{# Yes/Cancel confirmation dialog skeleton. The title and body are empty here; presumably client-side code fills them in before the dialog is shown (TODO confirm). #}
{# NOTE(review): id="error-modal-title" is also used by error_modal.html, so the id is duplicated if both fragments are on the same page. #}
<div class="modal-dialog modal-dialog-centered" role="document">
    <div class="modal-content">
        <div class="modal-header">
            <h5 class="modal-title" id="error-modal-title"></h5>
            <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
        </div>
        <div class="modal-body"></div>
        <div class="modal-footer d-flex justify-content-center gap-5">
            {# Neither link has an href; presumably script handlers are attached by id (TODO confirm). #}
            <a class="btn btn-primary" id="confirmDiscard">Yes</a>
            <a class="btn btn-primary" id="cancelDiscard">Cancel</a>
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/ocr_help_modal.html
================================================
{# Static help dialog explaining the "Transcribe with OCR" feature. #}
<div id="ocr-help-modal" class="modal" tabindex="-1" role="dialog">
    <div class="modal-dialog modal-dialog-centered" role="document">
        <div class="modal-content">
            <div class="modal-header">
                <h5 class="modal-title">About Transcribe with OCR</h5>
                <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
            </div>
            <div class="modal-body">
                <h6 class="modal-title">What is OCR?</h6>
                <p>OCR stands for Optical Character Recognition. OCR is a software tool that can extract print text from some documents.</p>
                <h6>When will OCR work well?</h6>
                <p>OCR does not work on handwriting. It only works for printed or typed text, meaning text created by a typewriter, printing press, or other mechanical means. OCR will do best on consistent and clear images of modern typefaces.</p>
                <h6>Do I still need to review pages started with OCR?</h6>
                <p>Yes! OCR is imperfect. It may not work well for some or all parts of a typed page, but it can be a great starting point. If you start a page with OCR, you should read the text closely before submitting. If you are reviewing an OCR-ed page, you also still need to review.</p>
                <h6>Who can use "Transcribe with OCR"?</h6>
                {# The current path is URL-encoded before being passed as the post-login redirect target. #}
                <p><a href="{% url 'registration_register' %}">Register for an account</a> and <a href="{% url 'registration_login' %}?next={{ request.path|urlencode }}">log in</a> to use this feature.</p>
                <h6>Why does <span class="fst-italic">By the People</span> have this feature?</h6>
                <p>We always want to use volunteer time effectively. When the Library of Congress digitizes a large group of printed pages, it will usually OCR them. The materials in By the People campaigns are not good candidates for applying OCR at scale, either because they are handwritten, a mixed collection of handwritten and print materials, or printed on paper or in a typeface that does not produce accurate OCR results. However, OCR can still be a useful starting point for some typed pages. Use it if you like it or skip it if you don’t!</p>
            </div>
            <div class="modal-footer justify-content-center">
                <button type="button" class="btn btn-primary" data-bs-dismiss="modal">Close</button>
            </div>
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/ocr_transcription_modal.html
================================================
{# "Are you sure?" dialog warning that OCR replaces the existing transcription text. #}
<div class="modal-dialog modal-dialog-centered" role="document">
    <div class="modal-content">
        <div class="modal-header d-flex justify-content-end">
            <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
        </div>
        <div class="modal-body">
            <div class="bg-light p-3">
                <h5 class="modal-title mb-3">Are you sure?</h5>
                <p>Clicking "Transcribe with OCR" will remove all existing transcription text and replace it with automatically generated text. Use the "Undo" button to restore previous text.</p>
            </div>
        </div>
        <div class="modal-footer">
            <button type="button" class="btn btn-primary" data-bs-dismiss="modal">Cancel</button>
            {# The continue control is only rendered while the page is still editable (not_started or in_progress). #}
            {% if transcription_status == "not_started" or transcription_status == "in_progress" %}
                {# NOTE(review): this hidden field is not inside a form in this fragment; confirm how its value is consumed. #}
                <input type="hidden" name="supersedes" value="{{ transcription.pk|default:'' }}" />
                <a tabindex="0" class="btn btn-link d-inline p-0" role="button" data-bs-placement="top" id="select-language-button">
                    <span class="underline-link fw-bold">Yes, Select Language</span>
                </a>
            {% endif %}
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/quick_tips_modal.html
================================================
{# Hidden element exposing the campaign slug, login state and whether an asset is present as data attributes. #}
<div id="campaign-data"
     aria-hidden="true"
     role="none"
     hidden
     data-campaign-slug="{{ campaign.slug|default:'' }}"
     data-user-authenticated="{{ user.is_authenticated|yesno:'true,false' }}"
     data-has-asset="{{ asset|yesno:'true,false' }}">
</div>
{# "Campaign Tips" dialog: one carousel slide per entry in `cards`, with Back/Next links and slide indicators. #}
<div id="tutorial-popup" class="modal" tabindex="-1" role="dialog">
    <div class="modal-dialog modal-dialog-centered" role="document">
        <div class="modal-content">
            <div class="modal-header border-bottom-0 row">
                <div class="col ps-3">
                    <h4>Campaign Tips</h4>
                </div>
                <div class="col-1" id="close-tutorial">
                    <a data-bs-dismiss="modal" aria-label="Close">
                        <span aria-hidden="true">x</span>
                    </a>
                </div>
            </div>
            <div class="modal-body">
                <div id="card-carousel" class="carousel slide" data-bs-interval="false">
                    <div class="carousel-inner">
                        {% for card in cards %}
                            <div class="carousel-item pb-4 {% if forloop.first %} active {% endif %}">
                                <div class="position-static d-flex flex-column justify-content-around">
                                    {% if card.image %}
                                        {# Always emit an alt attribute; it is empty when the card has no alt text. #}
                                        <img src="{{ card.image.url }}" alt="{{ card.image_alt_text|default:'' }}">
                                    {% endif %}
                                    {% if card.display_heading %}
                                        <h5>{{ card.display_heading }}</h5>
                                    {% endif %}
                                    {# The card body is output unescaped, so it must already be trusted HTML. #}
                                    <p>{{ card.body_text|safe }}</p>
                                </div>
                            </div>
                        {% endfor %}
                    </div>
                    <a id="previous-card" href="#card-carousel" role="button" data-bs-slide="prev">
                        <strong><u>&lt;&nbsp;Back</u></strong>
                    </a>
                    <div class="carousel-indicators d-none d-lg-flex">
                        {# One indicator per card; forloop.counter0 gives the zero-based slide index. #}
                        {% for card in cards %}
                            <button type="button" data-bs-target="#card-carousel" data-bs-slide-to="{{ forloop.counter0 }}" {% if forloop.first %}class="active" {% endif %}></button>
                        {% endfor %}
                    </div>
                    <a id="next-card" href="#card-carousel" data-bs-slide="next">
                        <strong><u>Next&nbsp;&gt;</u></strong>
                    </a>
                </div>
            </div>
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/review_accepted_modal.html
================================================
{# Dialog markup for the "review accepted" confirmation; the outer .modal wrapper is provided by the including template. #}
<div role="document" class="modal-dialog modal-dialog-centered">
    <div class="modal-content">
        <div class="modal-header">
            <h5 class="modal-title">Nice Job!</h5>
            <button
                type="button"
                class="btn-close"
                aria-label="Close"
                data-bs-dismiss="modal"
            ></button>
        </div>
        <div class="modal-body">
            <p>Thanks for helping complete this page!</p>
            <p>What would you like to do next?</p>
        </div>
        {# Shared footer fragment; its contents live in fragments/_modal_footer.html. #}
        {% include "fragments/_modal_footer.html" %}
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/successful_submission_modal.html
================================================
{# Dialog markup shown after a transcription is submitted; the outer .modal wrapper is provided by the including template. #}
<div role="document" class="modal-dialog modal-dialog-centered">
    <div class="modal-content">
        <div class="modal-header">
            <h5 class="modal-title">Submitted!</h5>
            <button
                type="button"
                class="btn-close"
                aria-label="Close"
                data-bs-dismiss="modal"
            ></button>
        </div>
        <div class="modal-body">
            <p>Thanks for helping complete this page!</p>
            {# The paragraph is always emitted; its login/register prompt is only filled in for anonymous visitors. #}
            <p>
                {% if not user.is_authenticated %}
                    <a href="{% url 'login' %}?next={{ request.path|urlencode }}">Login</a> or <a href="{% url 'registration_register' %}">Register</a> to review and track your progress.
                {% endif %}
            </p>
            <p>What would you like to do next?</p>
        </div>
        {# Shared footer fragment; its contents live in fragments/_modal_footer.html. #}
        {% include "fragments/_modal_footer.html" %}
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/tags.html
================================================
{# Tag editor: a collapsible form listing the asset's tags. The add-tag input is rendered only for authenticated users. #}
<div id="tag-editor" class="flex-shrink-1">
    {# Heading doubles as the collapse toggle for #tag-form and shows the current tag count. #}
    <h2 id="tag-label" class="border-top pt-3 pb-2"><a href="#tag-form" role="button" data-bs-toggle="collapse" aria-controls="tag-form" aria-expanded="false"><i class="fas fa-plus-square"></i> <span id="tag-count-text" class="text-dark">Tags (<span id="tag-count">{{ tags|length }}</span>)</span></a></h2>
    <form id="tag-form" method="post" action="{% url 'submit-tags' asset_pk=asset.pk %}" class="ajax-submission collapse">
        {% csrf_token %}
        <div class="d-print-none grid">
            {% if user.is_authenticated %}
                <div class="row">
                    <div class="col input-group">
                        {# The pattern attribute limits a tag to 1-50 of the characters described in the feedback text below. #}
                        <input
                            type="text"
                            id="new-tag-input"
                            class="form-control"
                            placeholder="Add a new tag…"
                            aria-label="Add a new tag"
                            pattern="[\- _À-ž'\w]{1,50}"
                        >
                        <div class="input-group-append">
                            <button type="button" id="new-tag-button" class="btn btn-outline-primary" title="Add tags to the page">Add</button>
                        </div>
                        <div class="invalid-feedback">
                            Tags must be between 1-50 characters and may contain only letters, numbers, dashes, underscores, apostrophes, and spaces
                        </div>
                    </div>
                </div>
            {% else %}
                {# Anonymous visitors get a register/login prompt instead of the input. #}
                <div class="d-flex justify-content-center w-100 py-2">
                    <p class="help-text anonymous-only text-center d-print-none mb-0">
                        Want to tag this page?

                        <a class="mx-1" href="{% url 'registration_register' %}">Register</a>
                        <span class="text-muted">or</span>
                        <a class="mx-1" href="{% url 'login' %}?next={{ request.path|urlencode }}">login</a>
                        to add tags.
                    </p>
                </div>
            {% endif %}
        </div>

        {# Existing tags; each one carries a hidden "tags" input so it is included when the form is submitted. #}
        <ul id="current-tags" class="d-flex flex-wrap list-unstyled mb-0 d-print-block">
            {% for tag in tags %}
                <li class="btn btn-outline-dark btn-sm">
                    <label class="m-0">
                        <input type="hidden" name="tags" value="{{ tag }}">
                        {{ tag }}
                    </label>
                    <a class="close authenticated-only" aria-label="Remove previous tag" data-bs-dismiss="alert" {% if not user.is_authenticated %}hidden{% endif %}>
                        <span class="fas fa-times" aria-hidden="true"></span>
                    </a>
                </li>
            {% endfor %}
        </ul>
    </form>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/viewer.html
================================================
{# Toolbar of image-viewer buttons; the whole bar is hidden when printing (d-print-none). #}
<div id="viewer-controls" class="m-1 text-center d-print-none">
    <div class="d-inline-flex justify-content-between">
        {# Layout orientation #}
        <div class="d-flex btn-group m-1">
            <button id="viewer-layout-vertical" title="Vertical Layout" class="btn btn-dark viewer-control-button">
                <span class="fas fa-grip-lines"></span>
            </button>
            <button id="viewer-layout-horizontal" title="Horizontal Layout" class="btn btn-dark">
                <span class="fas fa-grip-lines-vertical"></span>
            </button>
        </div>

        {# Fit to viewport #}
        <div class="d-flex btn-group m-1">
            <button type="button" id="viewer-home" title="Fit Image to Viewport" class="btn btn-dark viewer-control-button">
                <span class="fas fa-compress"></span>
            </button>
        </div>

        {# Zoom #}
        <div class="d-flex btn-group m-1">
            <button id="viewer-zoom-in" title="Zoom In" class="btn btn-dark viewer-control-button">
                <span class="fas fa-search-plus"></span>
            </button>
            <button id="viewer-zoom-out" title="Zoom Out" class="btn btn-dark">
                <span class="fas fa-search-minus"></span>
            </button>
        </div>

        {# Rotation #}
        <div class="d-flex btn-group m-1">
            <button id="viewer-rotate-left" title="Rotate Left" class="btn btn-dark viewer-control-button">
                <span class="fas fa-undo"></span>
            </button>
            <button id="viewer-rotate-right" title="Rotate Right" class="btn btn-dark viewer-control-button">
                <span class="fas fa-redo"></span>
            </button>
        </div>

        {# Flip #}
        <div class="d-flex btn-group m-1">
            <button id="viewer-flip" title="Flip" class="btn btn-dark viewer-control-button">
                <span class="fas fa-exchange-alt"></span>
            </button>
        </div>

        {# Toggles the collapsible #image-filters panel. #}
        <div class="d-flex btn-group m-1">
            <button
                type="button"
                class="btn btn-dark extra-control-button"
                title="Image Filters"
                data-bs-toggle="collapse"
                data-bs-target="#image-filters"
            >
                <span class="fas fa-sliders-h" aria-label="Image Filters"></span>
            </button>
        </div>

        {# Full screen; data-target names #viewer-column (presumably consumed by the viewer script — confirm). #}
        <div class="d-flex btn-group m-1">
            <button
                type="button"
                id="viewer-fullscreen"
                class="btn btn-dark extra-control-button"
                title="View Full Screen"
                data-target="#viewer-column"
            >
                <span class="fas fa-expand"></span>
            </button>
        </div>

        {# Opens the #keyboard-help-modal dialog. #}
        <div class="d-flex btn-group m-1">
            <button
                type="button"
                class="btn btn-dark extra-control-button"
                title="Viewer keyboard shortcuts"
                data-bs-toggle="modal"
                data-bs-target="#keyboard-help-modal"
            >
                <span class="fas fa-question-circle" aria-label="Viewer keyboard shortcuts"></span>
            </button>
        </div>
    </div>
</div>

{# Modal listing the viewer's keyboard shortcuts; opened by the help button that targets #keyboard-help-modal. #}
<div id="keyboard-help-modal" class="modal" tabindex="-1" role="dialog">
    <div class="modal-dialog modal-dialog-centered" role="document">
        <div class="modal-content">
            <div class="modal-header">
                <h5 class="modal-title">Keyboard Shortcuts</h5>
                <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close">

                </button>
            </div>
            <div class="modal-body">
                <h6>Viewer Shortcuts</h6>
                <table class="table table-compact table-responsive">
                    {# Panning #}
                    <tr>
                        <th><kbd>w</kbd>, up arrow</th>
                        <td>Scroll the viewport up</td>
                    </tr>
                    <tr>
                        <th><kbd>s</kbd>, down arrow</th>
                        <td>Scroll the viewport down</td>
                    </tr>
                    <tr>
                        <th><kbd>a</kbd>, left arrow</th>
                        <td>Scroll the viewport left</td>
                    </tr>
                    <tr>
                        <th><kbd>d</kbd>, right arrow</th>
                        <td>Scroll the viewport right</td>
                    </tr>
                    {# Fit and zoom #}
                    <tr>
                        <th><kbd>0</kbd></th>
                        <td>Fit the entire image to the viewport</td>
                    </tr>
                    <tr>
                        <th><kbd>-</kbd>, <kbd>_</kbd>, Shift+<kbd>W</kbd>, Shift+Up arrow</th>
                        <td>Zoom the viewport out</td>
                    </tr>
                    <tr>
                        <th><kbd>=</kbd>, <kbd>+</kbd>, Shift+<kbd>S</kbd>, Shift+Down arrow</th>
                        {# Counterpart of the "zoom out" row above; this previously read "Scroll the viewport in". #}
                        <td>Zoom the viewport in</td>
                    </tr>
                    {# Rotation and flip #}
                    <tr>
                        <th><kbd>r</kbd></th>
                        <td>Rotate the viewport clockwise</td>
                    </tr>
                    <tr>
                        <th><kbd>R</kbd></th>
                        <td>Rotate the viewport counterclockwise</td>
                    </tr>
                    <tr>
                        <th><kbd>f</kbd></th>
                        <td>Flip the viewport horizontally</td>
                    </tr>
                </table>
            </div>
            <div class="modal-footer">
                <button type="button" class="btn btn-primary" data-bs-dismiss="modal">Close</button>
            </div>
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail/viewer_filters.html
================================================
{# Collapsible image-filter panel: three tabs (gamma, invert, threshold) plus a "Reset All" button. #}
<div id="image-filters" class="m-1 text-center d-print-none collapse">
    <hr class="m-0" />
    {# Tab buttons; each data-bs-target points at a pane inside #filter-tabs. #}
    <ul class="d-inline-flex mt-1 btn-group nav nav-tabs" role="tablist">
        <li class="nav-item" role="presentation">
            <button id="viewer-gamma" class="btn btn-dark nav-link active" title="Adjust gamma" data-bs-toggle="tab" data-bs-target="#gamma-filter" role="tab">
                Brightness
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button id="viewer-invert" class="btn btn-dark nav-link" title="Invert colors" data-bs-toggle="tab" data-bs-target="#invert-filter" role="tab">
                Invert
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button id="viewer-threshold" class="btn btn-dark nav-link" title="Adjust threshold" data-bs-toggle="tab" data-bs-target="#threshold-filter" role="tab">
                Contrast
            </button>
        </li>
    </ul>
    <div class="btn-group m-1">
        <button id="viewer-reset" class="btn" title="Reset all filters">
            Reset All
        </button>
    </div>
    <div id="filter-tabs" class="tab-content">
        {# Gamma ("Brightness") pane: number input, step buttons and a range slider over 0-5 in 0.01 steps. #}
        <div id="gamma-filter" class="tab-pane pt-1 ps-3 show active" role="tabpanel">
            {# onsubmit returns false so the form never navigates. #}
            <form id="gamma-form" class="d-flex align-items-center" onsubmit="return false;">
                <div class="row ms-0 me-3 number-input">
                    <div class="col p-1">
                        <input
                            type="number"
                            id="gamma"
                            name="gamma"
                            min="0"
                            max="5"
                            step="0.01"
                            value="1.00"
                        />
                        <label class="visually-hidden" for="gamma">Gamma</label>
                    </div>
                    <div class="col p-0 filter-buttons">
                        <div class="row m-0">
                            <button id="gamma-up" type="button" class="arrow-button">
                                {# span is not a void element, so it needs an explicit end tag; "<span ... />" left it open around the label below. #}
                                <span class="fas fa-chevron-up"></span>
                                <span class="visually-hidden">Increase</span>
                            </button>
                        </div>
                        <div class="row m-0">
                            <button id="gamma-down" type="button" class="arrow-button">
                                <span class="fas fa-chevron-down"></span>
                                <span class="visually-hidden">Decrease</span>
                            </button>
                        </div>
                    </div>
                </div>
                <input
                    type="range"
                    id="gamma-range"
                    name="gamma-range"
                    min="0"
                    max="5"
                    step="0.01"
                    value="1.00"
                    class="filter-slider flex-grow-1"
                />
                <label class="visually-hidden" for="gamma-range">Gamma</label>
                <input type="reset" class="btn btn-link underline-link fw-bold" value="Reset filter" />
            </form>
        </div>
        {# Invert pane: a single on/off switch. #}
        <div id="invert-filter" class="tab-pane pt-2" role="tabpanel" style="background-color: white;">
            <form id="invert-form" onsubmit="return false;" class="d-flex justify-content-center">
                <label class="ms-2 align-middle">Off</label>
                <div class="form-check form-switch custom-control-inline">
                    <input type="checkbox" id="invert" name="invert" class="form-check-input" role="switch" />
                    <label class="form-check-label" for="invert"><span class="visually-hidden">Invert</span></label>
                </div>
                <label class="align-middle">On</label>
            </form>
        </div>
        {# Threshold ("Contrast") pane: number input, step buttons and a range slider over 0-255 in steps of 1. #}
        <div id="threshold-filter" class="tab-pane pt-1 ps-3" role="tabpanel">
            <form id="threshold-form" class="d-flex align-items-center" onsubmit="return false;">
                <div class="row ms-0 me-3 number-input">
                    <div class="col p-1">
                        <input
                            type="number"
                            id="threshold"
                            name="threshold"
                            min="0"
                            max="255"
                            step="1"
                            value="0"
                        />
                        <label class="visually-hidden" for="threshold">Threshold</label>
                    </div>
                    <div class="col p-0 filter-buttons">
                        <div class="row m-0">
                            <button id="threshold-up" type="button" class="arrow-button">
                                <span class="fas fa-chevron-up"></span>
                                <span class="visually-hidden">Increase</span>
                            </button>
                        </div>
                        <div class="row m-0">
                            <button id="threshold-down" type="button" class="arrow-button">
                                <span class="fas fa-chevron-down"></span>
                                <span class="visually-hidden">Decrease</span>
                            </button>
                        </div>
                    </div>
                </div>
                <input
                    type="range"
                    id="threshold-range"
                    name="threshold-range"
                    min="0"
                    max="255"
                    step="1"
                    value="0"
                    class="filter-slider flex-grow-1"
                />
                <label class="visually-hidden" for="threshold-range">Threshold</label>
                <input type="reset" class="btn btn-link underline-link fw-bold" value="Reset filter" />
            </form>
        </div>
    </div>
</div>


================================================
FILE: concordia/templates/transcriptions/asset_detail.html
================================================
{% extends "base.html" %}

{% load staticfiles %}

{% load feature_flags %}

{% load concordia_media_tags %}
{% load concordia_sharing_tags %}

{# Page title: the asset title followed by "(campaign title: project title)". #}
{% block title %}
    {{ asset.title }} ({{ asset.item.project.campaign.title }}: {{ asset.item.project.title }})
{% endblock title %}

{# Head additions for the asset page: canonical URL, Open Graph metadata, and empty script elements that carry data-* attributes. #}
{% block head_content %}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}">
    {# Open Graph property names use a colon separator ("og:url"), not a dot. #}
    <meta property="og:url" content="https://{{ request.get_host }}{{ request.path }}" />
    <meta property="og:title" content="{{ asset.item.title }}" />
    <meta property="og:description" content="{{ asset.item.project.description }}" />
    <meta property="og:type" content="website" />
    <meta property="og:image" content="{{ thumbnail_url }}" />

    {# data-reserve-for-editing is set when the asset is not started or in progress, or when the user is logged in. #}
    <script id="asset-reservation-data"
            data-reserve-asset-url="{% url 'reserve-asset' asset.pk %}"
            {% if transcription_status == "not_started" or transcription_status == "in_progress" or user.is_authenticated %}
                data-reserve-for-editing=1
            {% endif %}
    ></script>

    {# Viewer configuration: static image prefix, tile source URL for the asset, and the contact URL. #}
    <script id="viewer-data"
            data-prefix-url="{% static 'openseadragon/build/openseadragon/images/' %}"
            data-tile-source-url="{% asset_media_url asset %}?canvas"
            data-contact-url="https://ask.loc.gov/crowd"
    ></script>

    {# NOTE(review): "module" is not a standard script attribute; confirm whether type="module" or async/defer was intended. #}
    {% if anonymous_user_validation_required %}
        <script module src="{{ TURNSTILE_JS_API_URL }}"></script>
    {% endif %}

    {{ block.super }}
{% endblock head_content %}

{# Breadcrumb trail: campaign, project, item, then the current asset as the active (unlinked) crumb. #}
{% block breadcrumbs %}
    <li class="breadcrumb-item"><a class="primary-text text-truncate" href="{% url 'transcriptions:campaign-detail' slug=campaign.slug %}" title="{{ campaign.title }}">{{ campaign.title }}</a></li>
    <li class="breadcrumb-item"><a class="primary-text text-truncate" href="{% url 'transcriptions:project-detail' campaign_slug=campaign.slug slug=project.slug %}" title="{{ project.title }}">{{ project.title }}</a></li>
    <li class="breadcrumb-item"><a class="primary-text text-truncate" href="{% url 'transcriptions:item-detail' campaign_slug=campaign.slug project_slug=project.slug item_id=item.item_id %}" title="{{ item.title }}">{{ item.title }}</a></li>
    {# The span is closed with a proper end tag; aria-current marks this crumb as the current page. #}
    <li class="breadcrumb-item active" aria-current="page" title="{{ asset.title }}"><span class="text-truncate">{{ asset.title }}</span></li>
{% endblock breadcrumbs %}

{# Extra classes contributed to the base template's body and main blocks so the page lays out as a flex column. #}
{% block extra_body_classes %}d-flex flex-column{% endblock extra_body_classes %}
{% block extra_main_classes %}flex-grow-1 d-flex flex-column{% endblock extra_main_classes %}

{# Main body of the asset page: navigation row, viewer and editor columns, help row, and the page's modal dialogs. #}
{% block main_content %}
    {% flag_enabled 'ADVERTISE_ACTIVITY_UI' as ADVERTISE_ACTIVITY_UI %}
    <div id="unacceptable-characters-content"></div>

    <div id="contribute-main-content" class="container-fluid flex-grow-1 d-flex flex-column d-print-block">
        <div id="navigation-container" class="row p-1 px-3 d-print-none bg-light">
            {% include "transcriptions/asset_detail/navigation.html" %}
        </div>

        <div id="contribute-container" class="d-flex flex-grow-1 d-print-block border">
            {# Left column: viewer toolbar, filter panel, image container and the OCR controls. #}
            <div id="viewer-column" class="ps-0 d-flex align-items-stretch bg-dark d-print-block flex-column">
                {% include "transcriptions/asset_detail/viewer.html" %}
                {% include "transcriptions/asset_detail/ocr_help_modal.html" %}
                {% include "transcriptions/asset_detail/viewer_filters.html" %}
                <div id="asset-image" class="h-100 bg-dark d-print-none w-100"></div>
                {# NOTE(review): "print-none" is not one of the d-print-* utilities used elsewhere in this template; confirm a matching CSS rule exists. #}
                <div id="ocr-section" class="row ps-3 pb-4 bg-white print-none">
                    {% if not disable_ocr %}
                        <div class="d-flex flex-row align-items-center justify-content-end mt-1">
                            <a
                                role="button"
                                tabindex="0"
                                class="btn btn-link d-inline p-0"
                                title="When to use OCR"
                                data-bs-placement="top"
                                data-bs-trigger="focus click hover"
                                data-bs-toggle="modal"
                                data-bs-target="#ocr-help-modal"
                            >
                                <span class="underline-link fw-bold">What is OCR</span> <span class="fas fa-question-circle" aria-label="When to use OCR"></span>
                            </a>
                            <a
                                role="button"
                                id="ocr-transcription-link"
                                href="#"
                                tabindex="0"
                                class="btn btn-primary mx-1"
                                title="Transcribe with OCR"
                                aria-disabled="true"
                                data-bs-placement="top"
                                data-bs-trigger="click"
                                data-authenticated="{{ user.is_authenticated|yesno:'true,false' }}"
                            >Transcribe with OCR</a>
                        </div>
                    {% endif %}
                </div>
            </div>

            {# Right column: transcription editor above the tag editor. #}
            <div id="editor-column" class="d-flex justify-content-between p-3 d-print-block flex-column">
                {% include "transcriptions/asset_detail/editor.html" %}
                {% include "transcriptions/asset_detail/tags.html" %}
            </div>
        </div>

        {# Share buttons and the contact link. #}
        <div id="help-container" class="mt-1 d-print-none">
            <div class="row p-3 bg-light justify-content-sm-between">
                <div class="d-flex align-items-center ps-1 col">Share this item: {% share_buttons current_asset_url asset.item.title %}</div>
                <div class="btn-group align-items-center col">
                    <p class="ms-auto me-2 my-0">Need help?</p>

                    <div class="d-grid gap-2 d-md-block">
                        <a href="https://ask.loc.gov/crowd" class="btn btn-primary mx-1" target="_blank" rel=noopener>
                            Contact us
                        </a>
                    </div>
                </div>
            </div>
        </div>

        {# Modal wrappers; each included fragment supplies the .modal-dialog markup. #}
        <div id="asset-reservation-failure-modal" role="dialog" tabindex="-1" class="modal">
            {% include "transcriptions/asset_detail/asset_reservation_failure_modal.html" %}
        </div>
        <div id="successful-submission-modal" role="dialog" tabindex="-1" class="modal">
            {% include "transcriptions/asset_detail/successful_submission_modal.html" %}
        </div>
        <div id="review-accepted-modal" role="dialog" tabindex="-1" class="modal">
            {% include "transcriptions/asset_detail/review_accepted_modal.html" %}
        </div>
        <div id="ocr-transcription-modal" role="dialog" tabindex="-1" class="modal">
            {% include "transcriptions/asset_detail/ocr_transcription_modal.html" %}
        </div>
        <div id="language-selection-modal" role="dialog" tabindex="-1" class="modal">
            {% include "transcriptions/asset_detail/language_selection_modal.html" %}
        </div>
        <div id="error-modal" role="dialog" tabindex="-1" class="modal">
            {% include "transcriptions/asset_detail/error_modal.html" %}
        </div>
        <div id="nothing-to-transcribe-modal" role="dialog" tabindex="-1" class="modal">
            {% include "transcriptions/asset_detail/nothing_to_transcribe_modal.html" %}
        </div>
    </div>

    {# Print-only copy of the asset image (d-none on screen, d-print-block when printing). #}
    <div class="print-transcription-image d-none d-print-block"><img src="{% asset_media_url asset %}" alt="Scanned image of the current content page" class="img-fluid"></div>

    {# The quick-tips modal is included only when tip cards are present in the context. #}
    {% if cards %}
        {% include "transcriptions/asset_detail/quick_tips_modal.html" %}
    {% endif %}
{% endblock main_content %}


================================================
FILE: concordia/templates/transcriptions/campaign_detail.html
================================================
{% extends "base.html" %}

{% load static %}
{% load staticfiles %}
{% load humanize %}
{% load concordia_text_tags %}
{% load concordia_filtering_tags %}

{# Page title: the campaign's title. #}
{% block title %}{{ campaign.title }}{% endblock title %}

{# Head additions for the campaign page: canonical URL, description, and thumbnail / Open Graph image metadata. #}
{% block head_content %}
    <link
        rel="canonical"
        href="https://{{ request.get_host }}{{ request.path }}"
    >
    <meta
        name="description"
        content="{{ campaign.description|striptags|normalize_whitespace }}"
    >
    <meta
        name="thumbnail"
        content="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}"
    >
    <meta
        property="og:image"
        content="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}"
    >
    {{ block.super }}
{% endblock head_content %}

{# Breadcrumb trail: link to the campaign list, then the current campaign as the active crumb. #}
{% block breadcrumbs %}
    <li class="breadcrumb-item"><a href="{% url 'campaign-topic-list' %}" class="primary-text text-truncate">Campaigns</a></li>
    <li class="breadcrumb-item active" title="{{ campaign.title }}" aria-current="page"><span class="text-truncate">{{ campaign.title }}</span></li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        <div class="row">
            <div class="col-md-12">
                <h1>{{ campaign.title }}</h1>
            </div>
        </div>
        <div class="row">
            <div class="col-12 col-lg pt-1 pb-1">
                <div class="progress campaign-page-progress">
                    <div
                        title="Completed ({{ completed_count|intcomma }} page{{ completed_count|pluralize }})"
                        class="progress-bar bg-completed"
                        role="progressbar"
                        style="width: {{ completed_percent }}%"
                        aria-valuenow="{{ completed_percent }}"
                        aria-valuemin="0"
                        aria-valuemax="100"
                    ></div>
                    <div
                        title="Needs Review ({{ submitted_count|intcomma }} page{{ submitted_count|pluralize }})"
                        class="progress-bar bg-submitted"
                        role="progressbar"
                        style="width: {{ submitted_percent }}%"
                        aria-valuenow="{{ submitted_percent }}"
                        aria-valuemin="0"
                        aria-valuemax="100"
                    ></div>
                    <div
                        title="In Progress ({{ in_progress_count|intcomma }} page{{ in_progress_count|pluralize }})"
                        class="progress-bar bg-in_progress"
                        role="progressbar"
                        style="width: {{ in_progress_percent }}%"
                        aria-valuenow="{{ in_progress_percent }}"
                        aria-valuemin="0"
                        aria-valuemax="100"
                    ></div>
                    <div
                        title="Not Started ({{ not_started_count|intcomma }} page{{ not_started_count|pluralize }})"
                        class="progress-bar bg-not_started"
                        role="progressbar"
                        style="width: {{ not_started_percent }}%"
                        aria-valuenow="{{ not_started_percent }}"
                        aria-valuemin="0"
                        aria-valuemax="100"
                    ></div>
                </div>
            </div>
        </div>
        <div class="row">
            <div class="col-12 col-lg pb-1">
                <ul class="progress-bar-labels list-unstyled m-0 p-1">
                    {% if completed_percent %}
                        <li>{{ completed_percent }}% Completed</li>
                    {% endif %}
                    {% if submitted_percent %}
                        <li>{{ submitted_percent }}% Needs Review</li>
                    {% endif %}
                    {% if in_progress_percent %}
                        <li>{{ in_progress_percent }}% In Progress</li>
                    {% endif %}
                    {% if not_started_percent %}
                        <li>{{ not_started_percent }}% Not Started</li>
                    {% endif %}
                </ul>
            </div>
            <div class="row">
                <div class="col-md-12 pt-1 pb-1">
                    <hr class="landing-divider" />
                    <p class="mb-1"><strong>Completed Page{{ completed_count|pluralize }}:</strong> {{ completed_count|intcomma }}</p>
                    <p class="mb-1"><strong>Registered Contributor{{ contributor_count|pluralize }}:</strong> {{ contributor_count|intcomma }}</p>
                    {% if campaign.launch_date %}
                        <p class="mb-1"><strong>Launched {{ campaign.launch_date }}.</strong></p>
                    {% endif %}
                    <hr class="landing-divider" />
                </div>
            </div>
            <div class="row">
                <div class="col-md-9">
                    <div class="hero-text">{{ campaign.description|safe }}</div>
                </div>
                <div class="col-md-3">
                    {% if campaign.helpfullink_set.related_links %}
                        <aside class="mb-3 mt-4 mt-md-0 p-3 bg-light">
                            <h4 class="mb-3">Helpful Links</h4>
                            <ul class="list-unstyled m-0">
                                {% for link in campaign.helpfullink_set.related_links %}
                                    {% if 'loc.gov' in link.link_url   %}
                                        <li class="mb-3"><a href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }}</a></li>
                                    {%else%}
                                        <li class="mb-3"><a href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }} <i class="fa fa-external-link-alt"></i></a></li>
                                    {% endif %}
                                {% endfor %}
                            </ul>
                        </aside>
                    {% endif %}
                </div>
            </div>
            <div class="d-flex justify-content-between mt-4">
                <div>
                    <h3>Filter pages:</h3>
                </div>
                {% url 'transcriptions:campaign-detail' campaign.slug as all_assets %}
                {% url 'transcriptions:filtered-campaign-detail' campaign.slug as filtered_assets %}
                {% include "fragments/_filter-buttons.html" with do_filter=filter_assets all_url=all_assets filtered_url=filtered_assets sublevel_qs=sublevel_querystring %}
            </div>
            <div class="row">
                <div class="col-12 col-lg text-center">
                    {% transcription_status_filters transcription_status_counts transcription_status "large" True all_assets %}
                </div>
            </div>
            <div class="row justify-content-center concordia-object-card-row">
                <div class="concordia-object-card-container justify-content-center">
                    {% for project in projects %}
                        <div class="col-6 concordia-object-card-col">
                            <div class="h-100 concordia-object-card card border" data-transcription-status="{{ project.lowest_transcription_status }}">
                                {% if filter_assets %}
                                    {% url 'transcriptions:filtered-project-detail' campaign.slug project.slug as project_url %}
                                {% else %}
                                    {% url 'transcriptions:project-detail' campaign.slug project.slug as project_url %}
                                {% endif %}

                                <a href="{{ project_url }}?{{ sublevel_querystring }}" aria-hidden="true">
                                    <img class="card-img card-img-campaign" src="{{ MEDIA_URL }}{{ project.thumbnail_image }}" alt="{{ project.title }}">
                                </a>

                                <div class="progress w-100">
                                    <div title="Completed" class="progress-bar bg-completed" role="progressbar" style="width: {{ project.completed_percent }}%" aria-valuenow="{{ project.completed_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                                    <div title="Needs Review" class="progress-bar bg-submitted" role="progressbar" style="width: {{ project.submitted_percent }}%" aria-valuenow="{{ project.submitted_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                                    <div title="In Progress" class="progress-bar bg-in_progress" role="progressbar" style="width: {{ project.in_progress_percent }}%" aria-valuenow="{{ project.in_progress_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                                </div>

                                <h6 class="text-center primary-text m-0 concordia-object-card-title">
                                    <a{% if project.lowest_transcription_status == 'completed' %} class="text-dark"{% endif %} href="{{ project_url }}?{{ sublevel_querystring }}">{{ project.title }}</a>
                                </h6>

                                {% if project.lowest_transcription_status == 'completed' %}
                                    <div class="card-actions">
                                        <a class="btn btn-sm btn-block btn-dark" href="{{ project_url }}?{{ sublevel_querystring }}">
                                            <span class="fas fa-check tx-completed"></span>
                                            Complete
                                        </a>
                                    </div>
                                {% endif %}
                            </div>
                        </div>
                    {% empty %}
                        {% if filter_assets %}
                            <div class="pt-3">There are no pages you can review. Select "Show all" to see pages you can read or edit.</div>
                        {% endif %}
                    {% endfor %}
                </div>
            </div>
{% endblock main_content %}
{% block body_scripts %}
    {# Emit the parent template's body_scripts first, then load the asset-filter script. #}
    {{ block.super }}
    <script src="{% static 'js/filter-assets.js' %}"></script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/transcriptions/campaign_detail_completed.html
================================================
{% extends "base.html" %}

{% load staticfiles %}
{% load humanize %}
{% load concordia_text_tags %}

{% block title %}{{ campaign.title }}{% endblock title %}

{% block head_content %}
    {# Canonical URL is built from the current request's host and path, always with the https scheme. #}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}">
    {# Description is the campaign description with tags stripped, then passed through normalize_whitespace. #}
    <meta name="description" content="{{ campaign.description|striptags|normalize_whitespace }}">
    <meta name="thumbnail" content="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}">
    <meta property="og:image" content="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}">
    {# The parent template's head_content is emitted after the campaign-specific tags. #}
    {{ block.super }}
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item"><a class="primary-text text-truncate" href="{% url 'campaign-topic-list' %}">Campaigns</a></li>
    <li class="breadcrumb-item active" aria-current="page" title="{{ campaign.title }}"><span class="text-truncate">{{ campaign.title }}</span></li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        {# Campaign title, the "100% Complete" banner, and summary statistics. #}
        <div class="row">
            <div class="col-md-12">
                <h1>{{ campaign.title }}</h1>
                <div class="completed-bar"><h3 class="completed-text">100% Complete</h3></div>
                <hr class="landing-divider" />
                {# Each label is pluralized from the same count that is shown next to it. #}
                <span><strong>Completed Page{{ completed_count|pluralize }}:</strong> {{ completed_count|intcomma }}</span>
                <br />
                <span><strong>Registered Contributor{{ contributor_count|pluralize }}:</strong> {{ contributor_count|intcomma }}</span>
                {# The launch/completion sentence is only shown when both dates are set. #}
                {% if campaign.launch_date and campaign.completed_date %}
                    <br />
                    <span><strong>Launched {{ campaign.launch_date }} and completed {{ campaign.completed_date }}.</strong></span>
                {% endif %}
                <hr class="landing-divider" />
            </div>
        </div>
        {# "Use Completed Transcriptions" panel; the whole panel is omitted when the campaign has no such links. #}
        {% with links=campaign.helpfullink_set.completed_transcription_links %}
            {% if links %}
                <div class="row mt-2">
                    <div class="col-md-12">
                        <aside class="mb-3 mt-md-0 p-3 bg-light">
                            <h3 class="mb-3">Use Completed Transcriptions</h3>
                            <ul class="list-unstyled m-0">
                                {% for link in links %}
                                    {# Every item except the last one gets bottom spacing. #}
                                    <li{% if not forloop.last %} class="mb-3"{% endif %}>
                                        <a class="underline-link" href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }}</a>
                                        {# URLs that do not contain "loc.gov" get an external-link icon. #}
                                        {% if 'loc.gov' not in link.link_url %}
                                            <i class="fa fa-external-link-alt"></i>
                                        {% endif %}
                                    </li>
                                {% endfor %}
                            </ul>
                        </aside>
                    </div>
                </div>
            {% endif %}
        {% endwith %}
        {# Campaign description; the |safe filter outputs it without HTML auto-escaping. #}
        {# NOTE(review): presumably the description is staff-authored HTML - confirm it can never carry untrusted input. #}
        <div class="row">
            <div class="col-md-12">
                <div class="hero-text">{{ campaign.description|safe }}</div>
            </div>
        </div>
        {# One card per project. Every card is rendered as fully complete: a 100% progress bar and a "Complete" action. #}
        <div class="row justify-content-center concordia-object-card-row">
            <div class="concordia-object-card-container justify-content-center pt-3">
                {% for project in projects %}
                    <div class="col-6 col-md-4 col-lg-3 concordia-object-card-col">
                        <div class="h-100 concordia-object-card card border" data-transcription-status="complete">
                            {% url 'transcriptions:project-detail' campaign.slug project.slug as project_url %}

                            {# The thumbnail duplicates the title link below, so it is hidden from assistive technology. tabindex="-1" also removes it from the tab order: an aria-hidden element must not remain keyboard-focusable. #}
                            <a href="{{ project_url }}?{{ sublevel_querystring }}" aria-hidden="true" tabindex="-1">
                                <img class="card-img card-img-campaign" src="{{ MEDIA_URL }}{{ project.thumbnail_image }}" alt="{{ project.title }}">
                            </a>

                            <div class="progress w-100">
                                <div title="Completed" class="progress-bar bg-completed" role="progressbar" style="width: 100%" aria-valuenow="100" aria-valuemin="0" aria-valuemax="100"></div>
                            </div>

                            <h6 class="text-center primary-text m-0 concordia-object-card-title">
                                <a class="underline-link" href="{{ project_url }}?{{ sublevel_querystring }}">{{ project.title }}</a>
                            </h6>
                            <div class="card-actions">
                                <a class="btn btn-sm btn-block btn-dark" href="{{ project_url }}?{{ sublevel_querystring }}">
                                    <span class="fas fa-check tx-completed"></span>
                                    Complete
                                </a>
                            </div>
                        </div>
                    </div>
                {% endfor %}
            </div>
        </div>
        {# "Helpful Links" panel; the whole panel is omitted when the campaign has no related links. #}
        {% with links=campaign.helpfullink_set.related_links %}
            {% if links %}
                <div class="row mt-2">
                    <div class="col-md-12">
                        <aside class="mb-3 mt-md-0 p-3 bg-light">
                            <h3 class="mb-3">Helpful Links</h3>
                            <ul class="list-unstyled m-0">
                                {% for link in links %}
                                    {# Every item except the last one gets bottom spacing. #}
                                    <li{% if not forloop.last %} class="mb-3"{% endif %}>
                                        <a class="underline-link" href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }}</a>
                                        {# URLs that do not contain "loc.gov" get an external-link icon. #}
                                        {% if 'loc.gov' not in link.link_url %}
                                            <i class="fa fa-external-link-alt"></i>
                                        {% endif %}
                                    </li>
                                {% endfor %}
                            </ul>
                        </aside>
                    </div>
                </div>
            {% endif %}
        {% endwith %}
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/transcriptions/campaign_detail_retired.html
================================================
{% extends "base.html" %}

{% load staticfiles %}
{% load humanize %}
{% load concordia_text_tags %}

{% block title %}{{ campaign.title }}{% endblock title %}

{% block head_content %}
    {# Canonical URL is built from the current request's host and path, always with the https scheme. #}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}">
    {# Description is the campaign description with tags stripped, then passed through normalize_whitespace. #}
    <meta name="description" content="{{ campaign.description|striptags|normalize_whitespace }}">
    <meta name="thumbnail" content="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}">
    <meta property="og:image" content="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}">
    {# The parent template's head_content is emitted after the campaign-specific tags. #}
    {{ block.super }}
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item"><a class="primary-text text-truncate" href="{% url 'campaign-topic-list' %}">Campaigns</a></li>
    <li class="breadcrumb-item active" aria-current="page" title="{{ campaign.title }}"><span class="text-truncate">{{ campaign.title }}</span></li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        {# Campaign title, the "retired" banner, and summary statistics. #}
        <div class="row">
            <div class="col-md-12">
                <h1>{{ campaign.title }}</h1>
                <div class="retired-bar mb-2"><h3 class="p-2 mb-0">Campaign retired. All transcriptions available in LOC.gov</h3></div>
                <hr class="landing-divider" />
                {# Each label is pluralized from the same count that is shown next to it. #}
                <span><strong>Completed Page{{ completed_count|pluralize }}:</strong> {{ completed_count|intcomma }}</span>
                <br />
                <span><strong>Registered Contributor{{ contributor_count|pluralize }}:</strong> {{ contributor_count|intcomma }}</span>
                {# The launch/completion sentence is only shown when both dates are set. #}
                {% if campaign.launch_date and campaign.completed_date %}
                    <br />
                    <span><strong>Launched {{ campaign.launch_date }} and completed {{ campaign.completed_date }}.</strong></span>
                {% endif %}
                <hr class="landing-divider" />
            </div>
        </div>
        {# "Use Completed Transcriptions" panel; the whole panel is omitted when the campaign has no such links. #}
        {% with links=campaign.helpfullink_set.completed_transcription_links %}
            {% if links %}
                <div class="row mt-2">
                    <div class="col-md-12">
                        <aside class="mb-3 mt-md-0 p-3 bg-light">
                            <h3 class="mb-3">Use Completed Transcriptions</h3>
                            <ul class="list-unstyled m-0">
                                {% for link in links %}
                                    {# Every item except the last one gets bottom spacing. #}
                                    <li{% if not forloop.last %} class="mb-3"{% endif %}>
                                        <a class="underline-link" href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }}</a>
                                        {# URLs that do not contain "loc.gov" get an external-link icon. #}
                                        {% if 'loc.gov' not in link.link_url %}
                                            <i class="fa fa-external-link-alt"></i>
                                        {% endif %}
                                    </li>
                                {% endfor %}
                            </ul>
                        </aside>
                    </div>
                </div>
            {% endif %}
        {% endwith %}
        {# "About This Campaign" section; the |safe filter outputs the description without HTML auto-escaping. #}
        {# NOTE(review): presumably the description is staff-authored HTML - confirm it can never carry untrusted input. #}
        <div class="row mb-3">
            <div class="col-md-12">
                <h3>About This Campaign</h3>
                <div class="hero-text">{{ campaign.description|safe }}</div>
            </div>
        </div>
        {# "Helpful Links" panel; the whole panel is omitted when the campaign has no related links. #}
        {% with links=campaign.helpfullink_set.related_links %}
            {% if links %}
                <div class="row mt-2">
                    <div class="col-md-12">
                        <aside class="mb-3 mt-md-0 p-3 bg-light">
                            <h3 class="mb-3">Helpful Links</h3>
                            <ul class="list-unstyled m-0">
                                {% for link in links %}
                                    {# Every item except the last one gets bottom spacing. #}
                                    <li{% if not forloop.last %} class="mb-3"{% endif %}>
                                        <a class="underline-link" href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }}</a>
                                        {# URLs that do not contain "loc.gov" get an external-link icon. #}
                                        {% if 'loc.gov' not in link.link_url %}
                                            <i class="fa fa-external-link-alt"></i>
                                        {% endif %}
                                    </li>
                                {% endfor %}
                            </ul>
                        </aside>
                    </div>
                </div>
            {% endif %}
        {% endwith %}
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/transcriptions/campaign_list.html
================================================
{% extends "base.html" %}

{% load staticfiles %}

{% block title %}Active Campaigns{% endblock title %}

{% block head_content %}
    {# Canonical URL is built from the current request's host and path, always with the https scheme. #}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}">
    {# Keep the parent template's head content, as the other campaign templates do, instead of replacing it. #}
    {{ block.super }}
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item active" aria-current="page">Active Campaigns</li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        <h1>Active Campaigns</h1>
        {# Topic navigation: one link per topic; the heading and list are omitted entirely when there are no topics. #}
        {% if topics %}
            <h3>Explore by topic</h3>
            <ul class="topic-list">
                {% for topic in topics %}
                    <li class="page-item">
                        <a class="page-link" href="{% url 'topic-detail' topic.slug %}">
                            {{ topic.title }}
                        </a>
                    </li>
                {% endfor %}
            </ul>
        {% endif %}
        {# One entry per campaign: title, linked thumbnail, short description and a "View Projects" button. #}
        <ul class="list-unstyled">
            {% for campaign in campaigns %}
                <li class="p-4 mb-1 bg-light">
                    <h2 class="h1 mb-3">{{ campaign.title }}</h2>
                    <div class="row">
                        <a class="col-md-5 order-md-2" href="{% url 'transcriptions:campaign-detail' campaign.slug %}">
                            {# Prefer the campaign's own alt text; fall back to the generated "<title> image" when none is set. #}
                            <p class="mb-2 text-center"><img src="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}" class="img-fluid" alt="{% if campaign.image_alt_text %}{{ campaign.image_alt_text }}{% else %}{{ campaign.title }} image{% endif %}"></p>
                        </a>
                        <div class="col-md">
                            {# The |safe filter outputs the short description without HTML auto-escaping. #}
                            <p>{{ campaign.short_description|safe }}</p>
                            <a class="btn btn-primary" href="{% url 'transcriptions:campaign-detail' campaign.slug %}">View Projects</a>
                        </div>
                    </div>
                </li>
            {% endfor %}
        </ul>
        {% include "transcriptions/completed_campaigns_section.html" %}
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/transcriptions/campaign_list_small_blocks.html
================================================
{% extends "base.html" %}

{% load staticfiles truncation %}

{% block title %}Completed Campaigns{% endblock title %}

{% block head_content %}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}">
    {{ block.super }}
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item active" aria-current="page">Completed Campaigns</li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        <h1>Completed Campaigns</h1>
        {# Result count plus three selectors (view, campaign status, research center). Each "Go" button calls the matching toggle* handler from this template's inline script, which rewrites the query string and reloads the page. #}
        <div id="campaign-options" class="d-flex flex-wrap my-2">
            {# Pluralize the label so a single result reads "1 Campaign". #}
            <div class="d-flex align-items-center me-auto mt-2">Results: {{ result_count }} Campaign{{ result_count|pluralize }}</div>
            <div class="d-flex align-items-center ms-3 mt-2">
                <label for="view-options" class="pe-1">View</label>
                <select id="view-options">
                    {# Grid is the default: it is selected for any view value other than "list". #}
                    <option value="grid"{% if request.GET.view != 'list' %} selected{% endif %}>Grid</option>
                    <option value="list"{% if request.GET.view == 'list' %} selected{% endif %}>List</option>
                </select>
                {# A real button (not an href-less anchor) so the control is keyboard-focusable and operable. #}
                <button type="button" class="btn btn-primary" onclick="toggleCampaignView();">Go</button>
            </div>
            <div class="d-flex align-items-center ms-3 mt-2">
                <label for="campaign-type" class="pe-1">Campaign Status</label>
                <select id="campaign-type">
                    <option value="all"{% if 'type' not in request.GET %} selected{% endif %}>All</option>
                    <option value="completed"{% if request.GET.type == 'completed' %} selected{% endif %}>Completed</option>
                    <option value="retired"{% if request.GET.type == 'retired' %} selected{% endif %}>Retired</option>
                </select>
                <button type="button" class="btn btn-primary" onclick="toggleCampaignType();">Go</button>
            </div>
            <div class="d-flex align-items-center ms-3 mt-2">
                <label for="research-center" class="pe-1">Research Center</label>
                <select id="research-center">
                    <option value="all"{% if 'research_center' not in request.GET %} selected{% endif %}>All</option>
                    {% for research_center in research_centers %}
                        {# add:"0" turns the query-string value into an integer so it can be compared with the pk. #}
                        <option value="{{ research_center.pk }}"{% if request.GET.research_center|add:"0" == research_center.pk %} selected{% endif %}>
                            {{ research_center.title }}
                        </option>
                    {% endfor %}
                </select>
                <button type="button" class="btn btn-primary" onclick="toggleResearchCenter();">Go</button>
            </div>
        </div>
        {% if request.GET.view == 'list' %}
            {# List view: every campaign is rendered, but entries after the tenth start out hidden. #}
            <ul id="campaign-list" class="list-unstyled list-view">
                {% for campaign in campaigns %}
                    <li{% if forloop.counter > 10 %} hidden{% endif %}>
                        <div class="row">
                            <div class="campaign-thumbnail">
                                <div class="aspect-ratio-box">
                                    <div class="aspect-ratio-box-inner-wrapper">
                                        <a href="{% url 'transcriptions:campaign-detail' campaign.slug %}">
                                            {# This link contains only the image, so it always needs alt text: use the campaign's own, else fall back to "<title> image". #}
                                            <img src="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}" class="img-fluid" alt="{% if campaign.image_alt_text %}{{ campaign.image_alt_text }}{% else %}{{ campaign.title }} image{% endif %}" loading="lazy" width="150" height="150">
                                        </a>
                                    </div>
                                </div>
                            </div>
                            <div class="campaign-text">
                                <p class="mb-2">
                                    <a href="{% url 'transcriptions:campaign-detail' campaign.slug %}">
                                        <span class="d-block h4">
                                            {{ campaign.title }}
                                        </span>
                                    </a>
                                    {% if campaign.launch_date %}
                                        <span class="fw-bold">Started: </span>{{ campaign.launch_date|date:"Y-m-d" }}
                                        {# Line break only when a completion date follows. #}
                                        {% if campaign.completed_date %}<br>{% endif %}
                                    {% endif %}
                                    {% if campaign.completed_date %}
                                        <span class="fw-bold">Completed: </span>{{ campaign.completed_date|date:"Y-m-d" }}
                                    {% endif %}
                                </p>
                                <p class="mb-2">
                                    {{ campaign.short_description|striptags|truncatechars_on_word_break:160 }}
                                </p>
                            </div>
                        </div>
                    </li>
                {% endfor %}
            </ul>
            {# "Show more" control: only rendered when more than ten campaigns exist; the label shows how many are beyond the first ten. #}
            {% with campaigns|length as campaigns_count %}
                {% if campaigns_count > 10 %}
                    <div class="align-items-center justify-content-center d-flex">
                        {# A real button (not an href-less anchor) so the control is keyboard-focusable and operable. #}
                        <button type="button" id="show-more" class="btn btn-primary">Show More Campaigns ({{ campaigns_count|add:"-10" }})</button>
                    </div>
                {% endif %}
            {% endwith %}
        {% else %}
            {# Grid view: each campaign is rendered by the small-block partial, with show_description and show_start set to True for it. #}
            <ul class="list-unstyled row mt-4">
                {% with show_description=True show_start=True %}
                    {% for campaign in campaigns %}
                        {% include "transcriptions/campaign_small_block.html" %}
                    {% endfor %}
                {% endwith %}
            </ul>
        {% endif %}
    </div>
{% endblock main_content %}

{% block body_scripts %}
    <script>
        // Reload the page with the "view" query parameter set to the value of
        // the #view-options select. `form` is unused; it is kept so the
        // signature stays unchanged.
        var toggleCampaignView = function(form) {
            const url = new URL(window.location.href);
            const viewValue = document.getElementById('view-options').value;
            // URLSearchParams percent-encodes values itself when the URL is
            // serialized, so pre-encoding with encodeURIComponent would
            // double-encode any reserved character.
            url.searchParams.set("view", viewValue);
            window.location.href = url;
        };
        // When the "show more" control exists, clicking it un-hides every
        // child of #campaign-list and then hides the control's wrapper.
        let showMoreButton = document.getElementById("show-more");
        let campaignList = document.getElementById("campaign-list");
        if (showMoreButton) {
            showMoreButton.addEventListener("click", (event) => {
                Array.from(campaignList.children).forEach((item) => {
                    item.hidden = false;
                });
                const wrapper = showMoreButton.parentElement;
                // NOTE(review): d-flex is removed before hiding, presumably
                // because its display rule would override [hidden]; confirm
                // against the stylesheet.
                wrapper.classList.remove("d-flex");
                wrapper.hidden = true;
                event.preventDefault();
            });
        }

        // Reload the page filtered by the value of the #campaign-type select.
        // "all" removes the "type" query parameter; any other value sets it.
        // `form` is unused; it is kept so the signature stays unchanged.
        var toggleCampaignType = function(form) {
            const url = new URL(window.location.href);
            const typeValue = document.getElementById('campaign-type').value;
            if (typeValue === "all") {
                url.searchParams.delete("type");
            } else {
                // URLSearchParams encodes the value on serialization; calling
                // encodeURIComponent first would double-encode it.
                url.searchParams.set("type", typeValue);
            }
            window.location.href = url;
        };

        // Reload the page filtered by the value of the #research-center
        // select. "all" removes the "research_center" query parameter; any
        // other value sets it. `form` is unused; it is kept so the signature
        // stays unchanged.
        var toggleResearchCenter = function(form) {
            const url = new URL(window.location.href);
            const researchCenter = document.getElementById('research-center').value;
            if (researchCenter === "all") {
                url.searchParams.delete("research_center");
            } else {
                // URLSearchParams encodes the value on serialization; calling
                // encodeURIComponent first would double-encode it.
                url.searchParams.set("research_center", researchCenter);
            }
            window.location.href = url;
        };
    </script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/transcriptions/campaign_report.html
================================================
{% extends "base.html" %}

{% load humanize %}
{% load staticfiles %}

{% block title %}Campaign Report: {{ title }}{% endblock title %}

{% block main_content %}
    <div class="container">
        {# Campaign-wide totals: the image count from the context and the project count from the page's paginator. #}
        <div class="row">
            <h3>Campaign Summary: {{ title }}</h3>
            <table class="table table-bordered table-hover">
                <tbody>
                    <tr>
                        <th>Total Images:</th>
                        <td class="font-monospace text-end">{{ total_asset_count|intcomma }}</td>
                    </tr>
                    <tr>
                        <th>Total Projects:</th>
                        {# paginator.count is the total across all pages, not just the projects on this page. #}
                        <td class="font-monospace text-end">{{ projects.paginator.count|intcomma }} </td>
                    </tr>
                </tbody>
            </table>
        </div>
        <div class="row justify-content-center">
            {% for project in projects %}
                <div class="card-column col-lg-4 mb-1">
                    <div class="card h-100">
                        <div class="card-header">
                            <a class="card-title" href="{% url 'transcriptions:project-detail' campaign_slug=campaign_slug slug=project.slug %}">
                                {{ project.title }}
                            </a>
                        </div>
                        <div class="card-body">
                            <table class="table table-sm table-bordered table-striped">
                                <tbody>
                                    <tr>
                                        <th>Images in this Project</th>
                                        <td class="font-monospace text-end">{{ project.asset_count|intcomma }}</td>
                                    </tr>
                                    <tr>
                                        <th>Number of Transcribers</th>
                                        <td class="font-monospace text-end">{{ project.transcriber_count|intcomma }} </td>
                                    </tr>
                                    <tr>
                                        <th>Number of Reviewers</th>
                                        <td class="font-monospace text-end">{{ project.reviewer_count|intcomma }} </td>
                                    </tr>
                                    <tr>
                                        <th>Tags</th>
                                        <td class="font-monospace text-end">{{ project.tag_count|intcomma }} </td>
                                    </tr>
                                </tbody>
                            </table>

                            {# Per-status counts for this project; each entry of project.transcription_statuses unpacks into a (status, count) pair. #}
                            <table class="table table-sm table-bordered table-striped mb-0">
                                <caption style="caption-side: top">Transcription Statuses</caption>
                                <tbody>
                                    {% for status, count in project.transcription_statuses %}
                                        <tr>
                                            <th>{{ status }}</th>
                                            {# Formatted with intcomma like every other count in this report. #}
                                            <td class="font-monospace text-end">{{ count|intcomma }}</td>
                                        </tr>
                                    {% endfor %}
                                </tbody>
                            </table>
                        </div>
                    </div>
                </div>
            {% endfor %}
        </div>

        {# Pagination for the project list: Previous / numbered pages / Next. Disabled ends are rendered as plain, aria-hidden text. #}
        <div class="row mt-3">
            <nav class="w-100" aria-label="pagination">
                <ul class="pagination mx-auto justify-content-center">
                    {% if projects.has_previous %}
                        <li class="page-item">
                            <a class="page-link" href="?page={{ projects.previous_page_number }}">Previous</a>
                        </li>
                    {% else %}
                        <li class="page-item disabled" aria-hidden="true">
                            <span class="page-link">Previous</span>
                        </li>
                    {% endif %}

                    {# Read the page range from the page object's own paginator, the same one used for the project total, so this list does not depend on a separate "paginator" context variable. #}
                    {% for page_num in projects.paginator.page_range %}
                        <li class="page-item {% if page_num == projects.number %}active{% endif %}" {% if page_num == projects.number %}aria-current="page"{% endif %}>
                            <a class="page-link" href="?page={{ page_num }}">{{ page_num }}</a>
                        </li>
                    {% endfor %}

                    {% if projects.has_next %}
                        <li class="page-item">
                            <a class="page-link" href="?page={{ projects.next_page_number }}">Next</a>
                        </li>
                    {% else %}
                        <li class="page-item disabled" aria-hidden="true">
                            <span class="page-link">Next</span>
                        </li>
                    {% endif %}
                </ul>
            </nav>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/transcriptions/campaign_small_block.html
================================================
{% load truncation %}

{# Grid card for one campaign. Reads `campaign` plus the optional flags `show_start` and `show_description` from the including template's context. #}
<li class="col-sm-4 mb-4">
    <a href="{% url 'transcriptions:campaign-detail' campaign.slug %}">
        <div class="aspect-ratio-box">
            <div class="aspect-ratio-box-inner-wrapper">
                {# The link already contains the campaign title as text, so the alt text may be empty when none is set. #}
                <img src="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}" class="img-fluid" alt="{{ campaign.image_alt_text }}" loading="lazy">
            </div>
        </div>
        <span class="d-block h4 mt-2 small-campaign-title">{{ campaign.title }}</span>
    </a>
    {# The date paragraph is rendered only when at least one of its two lines will be shown. #}
    {% if campaign.completed_date or show_start and campaign.launch_date %}
        <p>
            {% if show_start and campaign.launch_date %}
                <span class="fw-bold">Started: </span>{{ campaign.launch_date|date:"Y-m-d" }}
                {# Line break only when a completion date follows. #}
                {% if campaign.completed_date %}<br>{% endif %}
            {% endif %}
            {% if campaign.completed_date %}
                <span class="fw-bold">Completed: </span>{{ campaign.completed_date|date:"Y-m-d" }}
            {% endif %}
        </p>
    {% endif %}
    {% if show_description %}
        <p class="small-campaign-description">{{ campaign.short_description|striptags|truncatechars_on_word_break:160 }}</p>
    {% endif %}
</li>


================================================
FILE: concordia/templates/transcriptions/campaign_topic_list.html
================================================
{% extends "base.html" %}

{% load staticfiles %}

{% block title %}Active Campaigns{% endblock title %}

{% block head_content %}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}">
    {{ block.super }}
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item active" aria-current="page">All Campaigns</li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        <h1>All Campaigns</h1>
        {% if topics %}
            <div>
                <h2 class="h5">Explore by topic</h2>
                <ul class="list-inline">
                    {% for topic in topics %}
                        <li class="list-inline-item my-1 ">
                            <a class="btn btn-outline-primary" href="{% url 'topic-detail' topic.slug %}">
                                {{ topic.title }}
                            </a>
                        </li>
                    {% endfor %}
                </ul>
            </div>
        {% endif %}
        <h2 class="p-2">Active Campaigns</h2>
        <ul id="campaign-list" class="list-unstyled">
            {% for campaign in campaigns %}
                <li class="p-4 mb-1 bg-light" {% if forloop.counter > 10 %}hidden{% endif %}>
                    <h3 class="mb-3"><a href="{{ campaign.get_absolute_url }}">{{ campaign.title }}</a></h3>
                    <div class="row">
                        <a class="col-md-5 order-md-2" href="{{ campaign.get_absolute_url }}">
                            <p class="mb-2 text-center"><img src="{{ MEDIA_URL }}{{ campaign.thumbnail_image }}" class="img-fluid" alt="{% if campaign.image_alt_text %}{{ campaign.image_alt_text }}{% else %}{{ campaign.title }} image{% endif %}"></p>
                        </a>
                        <div class="col-md">
                            <p>{{ campaign.short_description|safe }}</p>
                            <a class="btn btn-primary" href="{{ campaign.get_absolute_url }}">View Projects</a>
                            <div class="progress campaign-progress">
                                <div
                                    class="progress-bar bg-completed"
                                    role="progressbar"
                                    style="width: {{ campaign.completed_percent|floatformat:'0' }}%"
                                    aria-valuenow="{{ campaign.completed_percent|floatformat:'0' }}"
                                ></div>
                                <div
                                    class="progress-bar bg-submitted"
                                    role="progressbar"
                                    style="width: {{ campaign.needs_review_percent|floatformat:'0' }}%"
                                    aria-valuenow="{{ campaign.needs_review_percent|floatformat:'0' }}"
                                ></div>
                            </div>
                            <div class="progress-bar-label">
                                {% if campaign.completed_percent %}
                                    <span>{{ campaign.completed_percent|floatformat:'0' }}% Completed</span>
                                    {% if campaign.needs_review_percent %} | {%endif %}
                                {% endif %}
                                {% if campaign.needs_review_percent %}
                                    <span>{{ campaign.needs_review_percent|floatformat:'0' }}% Needs Review</span>
                                {% endif %}
                            </div>
                        </div>
                    </div>
                </li>
            {% endfor %}
        </ul>
        {% with campaigns|length as campaigns_count %}
            {% if campaigns_count > 10 %}
                <div class="align-items-center justify-content-center d-flex mt-3">
                    <button id="show-more" class="btn btn-primary" aria-expanded="false">Show More Campaigns ({{ campaigns_count|add:"-10" }})</button>
                </div>
            {% endif %}
        {% endwith %}
        {% include "transcriptions/completed_campaigns_section.html" %}
    </div>
{% endblock main_content %}

{% block body_scripts %}
    <script>
        // Progressive disclosure for the active campaign list: only the first
        // batch of campaigns is shown until the user asks for the rest.
        let showMoreButton = document.getElementById("show-more");
        let campaignList = document.getElementById("campaign-list");
        if (showMoreButton && campaignList){
            const batchSize = 10;
            const items = Array.from(campaignList.children);
            let expanded = false; // the list starts collapsed

            // Sync item visibility, the button label and aria-expanded with
            // the current value of `expanded`.
            function updateVisibility() {
                items.forEach((item, index) => {
                    // Collapsed: hide everything past the first batch.
                    // Expanded: nothing is hidden.
                    item.hidden = !expanded && index >= batchSize;
                });
                showMoreButton.textContent = expanded
                    ? "Show Fewer Campaigns"
                    : `Show More Campaigns (${items.length - batchSize})`;
                showMoreButton.setAttribute("aria-expanded", String(expanded));
            }

            // Apply the collapsed state once on load
            updateVisibility();

            showMoreButton.addEventListener("click", function(event){
                expanded = !expanded;
                updateVisibility();
                event.preventDefault();
            });
        }
    </script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/transcriptions/completed_campaigns_section.html
================================================
<h2 class="pt-2">Completed Campaigns</h2>
<h4 class="section-link"><a href="{% url 'transcriptions:completed-campaign-list' %}">See All {{ completed_campaigns|length }} Completed Campaigns &raquo;</a></h4>
<ul class="list-unstyled row">
    {% for campaign in completed_campaigns|slice:3 %}
        {% include "transcriptions/campaign_small_block.html" %}
    {% endfor %}
</ul>


================================================
FILE: concordia/templates/transcriptions/item_detail.html
================================================
{% extends "base.html" %}

{% load humanize %}
{% load static %}
{% load staticfiles %}
{% load concordia_filtering_tags %}
{% load concordia_media_tags %}
{% load feature_flags %}

{% block title %} {{ item.title }} ({{ campaign.title }}: {{ project.title }}) {% endblock title %}

{% block head_content %}
    {{ block.super }}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}" />
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item"><a class="primary-text" href="{% url 'campaign-topic-list' %}">Campaigns</a></li>
    <li class="breadcrumb-item"><a class="primary-text text-truncate" href="{% url 'transcriptions:campaign-detail' campaign.slug %}?{{ sublevel_querystring }}" title="{{ campaign.title }}">{{ campaign.title }}</a></li>
    <li class="breadcrumb-item"><a class="primary-text text-truncate" href="{% url 'transcriptions:project-detail' campaign.slug project.slug %}?{{ sublevel_querystring }}" title="{{ project.title }}">{{ project.title }}</a></li>
    <li class="breadcrumb-item active" aria-current="page" title="{{ item.title }}"><span class="text-truncate">{{ item.title }}</span></li>
{% endblock breadcrumbs%}

{% block main_content %}
    {% flag_enabled 'DISPLAY_ITEM_DESCRIPTION' as DISPLAY_ITEM_DESCRIPTION %}

    <div class="container py-3">
        <div class="row">
            <div class="col-md-10">
                <h1>{{ item.title }}</h1>
                {% if DISPLAY_ITEM_DESCRIPTION %}
                    <div class="m-3 hero-text">{{ item.description|safe }}</div>
                {% endif %}
            </div>
            <div class="col-md-2 align-bottom px-3">
                <div>
                    <a href="{{ item.item_url }}" class="btn btn-light" title="View the original source for this item in a new tab" target="_blank" rel=noopener>View this item on www.loc.gov<i class="fa fa-external-link-alt"></i></a>
                </div>
            </div>
        </div>
        {% include "fragments/transcription-progress-row.html" %}
        <div class="d-flex justify-content-between mt-4">
            <div>
                <h3>Filter pages:</h3>
            </div>
            {% url 'transcriptions:item-detail' campaign.slug project.slug item.item_id as all_assets %}
            {% url 'transcriptions:filtered-item-detail' campaign.slug project.slug item.item_id as filtered_assets %}
            {% include "fragments/_filter-buttons.html" with do_filter=filter_assets all_url=all_assets filtered_url=filtered_assets sublevel_qs=sublevel_querystring %}
        </div>
        <div class="row">
            <div class="col-12 col-lg text-center">
                {% transcription_status_filters transcription_status_counts transcription_status "large" True all_assets %}
            </div>
        </div>
        <div class="row justify-content-center concordia-object-card-row">
            {% for a in assets %}
                {% url 'transcriptions:asset-detail' a.item.project.campaign.slug a.item.project.slug a.item.item_id a.slug as asset_detail_url %}
                <div class="col-6 col-md-4 col-lg-3 concordia-object-card-col">
                    <div class="h-100 card concordia-object-card border" data-transcription-status="{{ a.transcription_status }}">
                        <a class="card-img-container" href="{{ asset_detail_url }}">
                            <img class="card-img" alt="{{ a.slug }}" src="{% asset_media_url a %}" />
                        </a>
                        <a class="card-title text-center{% if a.transcription_status == 'completed' %} text-dark{% endif %}" href="{{ asset_detail_url }}">
                            #{{ a.sequence }}
                        </a>
                        <div class="card-actions">
                            <div class="d-grid">
                                <a class="btn btn-sm btn-block {% if a.transcription_status != 'completed' %}btn-primary{% else %}btn-dark{% endif %}" href="{{ asset_detail_url }}">
                                    {% if a.transcription_status == 'submitted' %}
                                        <span class="fas fa-list tx-submitted"></span>
                                        Review
                                    {% elif a.transcription_status == 'completed' %}
                                        <span class="fas fa-check tx-completed"></span>
                                        Complete
                                    {% else %}
                                        <span class="fas fa-edit tx-edit"></span>
                                        Transcribe
                                    {% endif %}
                                </a>
                            </div>
                        </div>
                    </div>
                </div>
            {% empty %}
                {% if filter_assets %}
                    <div class="pt-3">There are no pages you can review. Select "Show all" to see pages you can read or edit.</div>
                {% endif %}
            {% endfor %}
        </div>
        <div class="row mt-4">
            {% include "fragments/standard-pagination.html" %}
        </div>
    </div>
{% endblock main_content %}
{% block body_scripts %}
    {{ block.super }}
    <script src="{% static 'js/filter-assets.js' %}"></script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/transcriptions/project_detail.html
================================================
{% extends "base.html" %}

{% load static %}
{% load staticfiles %}
{% load concordia_filtering_tags %}
{% load concordia_text_tags %}

{% block title %}{{ project.title }} ({{ campaign.title }}){% endblock title %}

{% block head_content %}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}" />
    <meta name="description" content="{{ project.description|striptags|normalize_whitespace }}" />
    <meta name="thumbnail" content="{{ MEDIA_URL }}{{ project.thumbnail_image }}" />
    <meta property="og:image" content="{{ MEDIA_URL }}{{ project.thumbnail_image }}" />
    {{ block.super }}
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item"><a class="primary-text" href="{% url 'campaign-topic-list' %}">Campaigns</a></li>
    <li class="breadcrumb-item">
        <a class="primary-text text-truncate" href="{% url 'transcriptions:campaign-detail' campaign.slug %}?{{ sublevel_querystring }}" title="{{ campaign.title }}">{{ campaign.title }}</a>
    </li>
    <li class="breadcrumb-item active" aria-current="page" title="{{ project.title }}"><span class="text-truncate">{{ project.title }}</span></li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        <div class="row">
            <div class="col-12">
                <h1>{{ project.title }}</h1>
            </div>
        </div>
        {% include "fragments/transcription-progress-row.html" %}
        <div class="row">
            <div class="col-12 mt-4">
                <div class="hero-text">{{ project.description|safe }}</div>
            </div>
        </div>
        <div class="d-flex justify-content-between mt-4">
            <div>
                <h3>Filter pages:</h3>
            </div>
            {% url 'transcriptions:project-detail' campaign.slug project.slug as all_assets %}
            {% url 'transcriptions:filtered-project-detail' campaign.slug project.slug as filtered_assets %}
            {% include "fragments/_filter-buttons.html" with do_filter=filter_assets all_url=all_assets filtered_url=filtered_assets sublevel_qs=sublevel_querystring %}
        </div>
        <div class="row">
            <div class="col-12 col-lg text-center">
                {% transcription_status_filters transcription_status_counts transcription_status "large" True all_assets %}
            </div>
        </div>
        <div class="row justify-content-center concordia-object-card-row">
            {% for item in items %}
                <div class="col-6 col-md-4 col-lg-3 concordia-object-card-col">
                    <div class="h-100 concordia-object-card card border" data-transcription-status="{{ item.lowest_transcription_status }}">
                        {% if filter_assets %}
                            {% url 'transcriptions:filtered-item-detail' campaign.slug project.slug item.item_id as item_url %}
                        {% else %}
                            {% url 'transcriptions:item-detail' campaign.slug project.slug item.item_id as item_url %}
                        {% endif %}

                        <a href="{{ item_url }}?{{ sublevel_querystring }}">
                            <img class="card-img card-img-campaign" alt="{{ item.title }}" src="{{ item.thumbnail_link }}" />
                        </a>

                        <div class="progress w-100">
                            <div title="Completed" class="progress-bar bg-completed" role="progressbar" style="width: {{ item.completed_percent }}%" aria-valuenow="{{ item.completed_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                            <div title="Needs Review" class="progress-bar bg-submitted" role="progressbar" style="width: {{ item.submitted_percent }}%" aria-valuenow="{{ item.submitted_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                            <div title="In Progress" class="progress-bar bg-in_progress" role="progressbar" style="width: {{ item.in_progress_percent }}%" aria-valuenow="{{ item.in_progress_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                        </div>

                        <h6 class="text-center primary-text m-0 concordia-object-card-title">
                            <a class="campaign-image-link{% if item.lowest_transcription_status == 'completed' %} text-dark{% endif %}" href="{{ item_url }}?{{ sublevel_querystring }}">
                                {{ item.title }}
                            </a>
                        </h6>

                        {% if item.lowest_transcription_status == 'completed' %}
                            <div class="card-actions">
                                <a class="btn btn-sm btn-block btn-dark" href="{{ item_url }}?{{ sublevel_querystring }}">
                                    <span class="fas fa-check tx-completed"></span>
                                    Complete
                                </a>
                            </div>
                        {% endif %}
                    </div>
                </div>
            {% empty %}
                {% if filter_assets %}
                    <div class="pt-3">There are no pages you can review. Select "Show all" to see pages you can read or edit.</div>
                {% endif %}
            {% endfor %}
        </div>
        <div class="row mt-4">
            {% include "fragments/standard-pagination.html" %}
        </div>
    </div>
{% endblock main_content %}
{% block body_scripts %}
    {{ block.super }}
    <script src="{% static 'js/filter-assets.js' %}"></script>
{% endblock body_scripts %}


================================================
FILE: concordia/templates/transcriptions/topic_detail.html
================================================
{% extends "base.html" %}

{% load staticfiles %}
{% load humanize %}
{% load concordia_text_tags %}
{% load concordia_querystring %}
{% load concordia_filtering_tags %}

{% block title %}{{ topic.title }}{% endblock title %}

{% block head_content %}
    <link rel="canonical" href="https://{{ request.get_host }}{{ request.path }}">
    <meta name="description" content="{{ topic.description|striptags|normalize_whitespace }}">
    <meta name="thumbnail" content="{{ MEDIA_URL }}{{ topic.thumbnail_image }}">
    <meta property="og:image" content="{{ MEDIA_URL }}{{ topic.thumbnail_image }}">
    {{ block.super }}
{% endblock head_content %}

{% block breadcrumbs %}
    <li class="breadcrumb-item"><a class="primary-text" href="{% url 'campaign-topic-list' %}">Campaigns</a></li>
    <li class="breadcrumb-item active" aria-current="page" title="{{ topic.title }}"><span class="text-truncate">{{ topic.title }}</span></li>
{% endblock breadcrumbs %}

{% block main_content %}
    <div class="container py-3">
        <div class="row">
            <div class="col-md-12">
                <h1>{{ topic.title }}</h1>
            </div>
        </div>
        {% include "fragments/transcription-progress-row.html" %}
        <div class="row mt-3">
            <div class="col-md-9">
                <div class="hero-text">{{ topic.description|safe }}</div>
            </div>
            <div class="col-md-3">
                {% if topic.helpfullink_set.all|length %}
                    <aside class="mb-3 mt-4 mt-md-0 p-3 bg-light border">
                        <h4 class="mb-3">Helpful Links</h4>
                        <ul class="list-unstyled m-0">
                            {% for link in topic.helpfullink_set.all %}
                                {% if 'loc.gov' in link.link_url   %}
                                    <li class="mb-3"><a href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }}</a></li>
                                {% else %}
                                    <li class="mb-3"><a href="{{ link.link_url }}" target="_blank" rel=noopener>{{ link.title }} <i class="fa fa-external-link-alt"></i></a></li>
                                {% endif %}
                            {% endfor %}
                        </ul>
                    </aside>
                {% endif %}
            </div>
            <div class="d-flex justify-content-between mt-4">
                <div>
                    <h3>Filter pages:</h3>
                </div>
                {% url 'transcriptions:topic-detail' topic.slug as all_assets %}
            </div>
            <div class="row">
                <div class="col-12 col-lg text-center">
                    {% transcription_status_filters transcription_status_counts transcription_status "large" True all_assets %}
                </div>
            </div>
            <div class="row justify-content-center concordia-object-card-row mt-3">
                {% for project in projects %}
                    <div class="col-6 col-md-4 col-lg-3 concordia-object-card-col">
                        <div class="h-100 concordia-object-card card border" data-transcription-status="{{ project.lowest_transcription_status }}">
                            {% url 'transcriptions:project-detail' project.campaign.slug project.slug as project_url %}
                            {% if sublevel_querystring %}
                            {# If a filter has been set, we want to always respect that #}
                            {# Essentially, this just assigns sublevel_querystring to the temp variable project_querystring for use below #}
                                {% qs_alter sublevel_querystring as project_querystring %}
                            {% elif project.topic_url_filter %}
                            {# No overriding filter has been set, so use the one assigned to the project, if any #}
                                {% qs_alter sublevel_querystring add_if_missing:transcription_status=project.topic_url_filter as project_querystring %}
                            {% else %}
                            {# Explicitly blank the querystring, since none are set; this is needed so the last project's querystring isn't used #}
                                {% qs_alter "" as project_querystring %}
                            {% endif %}

                            <a href="{{ project_url }}{% if project_querystring %}?{{ project_querystring }}{% endif %}" aria-hidden="true">
                                <img class="card-img card-img-campaign" src="{{ MEDIA_URL }}{{ project.thumbnail_image }}" alt="{{ project.title }}">
                            </a>

                            <div class="progress w-100">
                                <div title="Completed" class="progress-bar bg-completed" role="progressbar" style="width: {{ project.completed_percent }}%" aria-valuenow="{{ project.completed_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                                <div title="Needs Review" class="progress-bar bg-submitted" role="progressbar" style="width: {{ project.submitted_percent }}%" aria-valuenow="{{ project.submitted_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                                <div title="In Progress" class="progress-bar bg-in_progress" role="progressbar" style="width: {{ project.in_progress_percent }}%" aria-valuenow="{{ project.in_progress_percent }}" aria-valuemin="0" aria-valuemax="100"></div>
                            </div>

                            <h6 class="text-center primary-text m-0 concordia-object-card-title">
                                <a{% if project.lowest_transcription_status == 'completed' %} class="text-dark"{% endif %} href="{{ project_url }}{% if project_querystring %}?{{ project_querystring }}{% endif %}">{{ project.campaign.title }} - {{ project.title }}</a>
                            </h6>

                            {% if project.lowest_transcription_status == 'completed' %}
                                <div class="card-actions">
                                    <a class="btn btn-sm btn-block btn-dark" href="{{ project_url }}{% if project_querystring %}?{{ project_querystring }}{% endif %}">
                                        <span class="fas fa-check tx-completed"></span>
                                        Complete
                                    </a>
                                </div>
                            {% endif %}
                        </div>
                    </div>
                {% endfor %}
            </div>
        </div>
    </div>
{% endblock main_content %}


================================================
FILE: concordia/templates/transcriptions/transcription.html
================================================
{% extends "base.html" %}
{% load static %}

{% block head_content %}
    <script id="viewer-data"
            data-prefix-url="{% static 'openseadragon/build/openseadragon/images/' %}"
            data-contact-url="https://ask.loc.gov/crowd"
    ></script>
    {% include "fragments/import-map.html" %}
{% endblock %}

{% block title %}React Test Page{% endblock title %}

{% block main_content %}
    <div id="app" class="container-fluid flex-grow-1 d-flex flex-column d-print-block">
        <script type="module" src="{% static 'frontend/js/index.js' %}"></script>
    </div>
{% endblock %}


================================================
FILE: concordia/templatetags/__init__.py
================================================


================================================
FILE: concordia/templatetags/concordia_filtering_tags.py
================================================
from typing import Any, Dict, Iterable, List, Tuple
from urllib.parse import quote as urlquote

from django import template

from ..models import TranscriptionStatus

register = template.Library()


@register.inclusion_tag("fragments/transcription-status-filters.html")
def transcription_status_filters(
    status_counts: Iterable[Tuple[str, str, int]],
    active_value: str | None,
    size: str = "small",
    reversed_order: bool = False,
    url: str = "",
) -> Dict[str, Any]:
    """
    Build a context for the transcription status filter UI.

    Behavior:
        Produces the context expected by the
        `fragments/transcription-status-filters.html` template. The context
        includes a `status_choices` list of tuples used to render links and
        classes for each status, preceded by an entry representing "All."

        The "All" entry always carries the `flex-initial` class and gains
        `active` when no status is selected. Each status entry is marked
        `active` when its key equals `active_value`. The status order can be
        reversed, and `url` is prepended to every per-status link (the "All"
        entry uses an empty href).

    Usage:
        Basic usage with counts from the view:

            {% load concordia_filtering_tags %}
            {% transcription_status_filters status_counts active_value %}

        With optional parameters:

            {% transcription_status_filters status_counts active_value
               size="small" reversed_order=True url=request.path %}

        Where:
            - `status_counts` is an iterable of `(key, label, count)`.
            - `active_value` is the currently selected status key, or empty.
            - `size` controls sizing classes used by the fragment.
            - `reversed_order` reverses the order of `TranscriptionStatus.CHOICES`.
            - `url` is prefixed to each generated link.

    Args:
        status_counts: Iterable of three-tuples `(key, label, count)` used to
            display per-status counts.
        active_value: The currently active status key, or `None`/empty for All.
        size: Size hint passed through to the template.
        reversed_order: If True, reverse the status choice order.
        url: Base URL to which the query string is appended.

    Returns:
        dict: Template context with keys:
            - `size` (str)
            - `status_choices` (list[tuple[str, str, str, str, int | None]])
              Each tuple is `(href, css_classes, css_key, label, count)`.
    """
    # The conditional must be parenthesized: without the parentheses the
    # ternary binds looser than `+`, and the whole class string (including
    # "flex-initial") collapses to "" whenever a status filter is active.
    all_classes = "flex-initial" + (" active" if not active_value else "")

    status_choices: List[Tuple[str, str, str, str, int | None]] = [
        ("", all_classes, "", "All", None)
    ]

    # Map status key -> count; statuses without an entry render with None.
    counts = {entry[0]: entry[2] for entry in status_counts}

    statuses = TranscriptionStatus.CHOICES
    if reversed_order:
        statuses = reversed(statuses)

    for key, label in statuses:
        status_choices.append(
            (
                "%s?transcription_status=%s" % (url, urlquote(key)),
                "active" if active_value == key else "",
                # CSS class names use hyphens where status keys use underscores
                key.replace("_", "-"),
                label,
                counts.get(key),
            )
        )

    return {"size": size, "status_choices": status_choices}


================================================
FILE: concordia/templatetags/concordia_media_tags.py
================================================
from typing import Any

from django import template

register = template.Library()


@register.simple_tag()
def asset_media_url(asset: Any) -> str:
    """
    Look up the URL of the image stored for an asset.

    Behavior:
        Returns `asset.storage_image.url` unchanged. Nothing is validated
        here; if the object lacks `storage_image` (or that value lacks
        `url`) the resulting attribute error propagates to the caller.

    Usage:
        Directly inside an attribute:

            {% load concordia_media_tags %}
            <img src="{% asset_media_url asset %}" alt="">

        Or assigned to a template variable first:

            {% asset_media_url asset as image_url %}
            <img src="{{ image_url }}" alt="">

    Args:
        asset: Any object exposing `storage_image.url`.

    Returns:
        str: The value of `asset.storage_image.url`.
    """
    stored_image = asset.storage_image
    return stored_image.url


================================================
FILE: concordia/templatetags/concordia_querystring.py
================================================
"""
Query string manipulation template tag.

Originally from https://github.com/acdha/django-bittersweet
"""

from typing import Any, Optional

from django.http import QueryDict
from django.template import Library, Node, Variable
from django.template.base import Parser, Token
from django.utils.html import escape

register = Library()


class QueryStringAlterer(Node):
    """
    Template node that applies alterations to a query string.

    Behavior:
        Resolves a base query string from the template context (either a raw
        query string or a `QueryDict` such as `request.GET`) and applies a
        sequence of alterations provided as tag arguments.

        Supported alterations:
            - Assignment: `name=value`
            - Deletion by key: `delete:name`
            - Deletion by key and value (value from a literal or a variable):
              `delete_value:"name",value` or `delete_value:field_name,value`
            - Conditional add if missing: `add_if_missing:name=value`

        Each alteration is split on its first separator only, so a value may
        itself contain `=` (for example `foo="a=b"`).

        The result is URL-encoded and HTML-escaped. If the tag is used with an
        `as variable_name` clause, the encoded string is stored in the context
        under that name and an empty string is rendered. Otherwise, the encoded
        string is returned.

    Usage:
        The tag is registered as `qs_alter`. Provide a base query string
        (a `QueryDict` like `request.GET` or a string) followed by zero or
        more alterations.

        Query string provided as `QueryDict`:

            {% qs_alter request.GET foo=bar %}
            {% qs_alter request.GET foo=bar baaz=quux %}
            {% qs_alter request.GET foo=bar baaz=quux delete:corge %}

        Remove one facet from a list:

            {% qs_alter request.GET foo=bar baaz=quux
               delete_value:"facets",value %}

        Conditionally add a parameter only if missing:

            {% qs_alter request.GET add_if_missing:foo=bar %}

        Query string provided as string:

            {% qs_alter "foo=baaz" foo=bar %}

        Store the result in a variable in the template context:

            {% qs_alter request.GET foo=bar baaz=quux delete:corge as new_qs %}

    Args (template usage):
        base_qs: Either a `QueryDict` (for example, `request.GET`) or a string
            containing a query string.
        alterations: Alteration arguments in the formats described above.
        as variable_name: Optional. If provided, the result is saved to the
            named context variable instead of being rendered.

    Returns:
        str: The encoded query string when not using `as variable_name`;
        otherwise an empty string.
    """

    def __init__(self, base_qs: str, as_variable: Optional[str], *args) -> None:
        # The base is kept as an unresolved template Variable; it is looked up
        # against the context on every render.
        self.base_qs = Variable(base_qs)
        self.args = args
        # Controls whether the result is returned or stored in the context.
        self.as_variable = as_variable

    def render(self, context: Any) -> str:
        """
        Render the altered query string.

        Args:
            context: Template rendering context.

        Returns:
            str: The encoded query string, or an empty string when storing the
            result via `as variable_name`.
        """
        base_qs = self.base_qs.resolve(context)

        # Always work on a mutable copy so the caller's QueryDict
        # (e.g. request.GET) is never modified.
        if isinstance(base_qs, QueryDict):
            qs = base_qs.copy()
        else:
            qs = QueryDict(base_qs, mutable=True)

        for arg in self.args:
            if arg.startswith("delete:"):
                v = arg[len("delete:") :]
                if v in qs:
                    del qs[v]
            elif arg.startswith("delete_value:"):
                # maxsplit=1: only the first comma separates field from value
                field, value = arg[len("delete_value:") :].split(",", 1)
                value = Variable(value).resolve(context)

                # A double-quoted field is a literal name; anything else is
                # looked up in the context.
                if not (field[0] == '"' and field[-1] == '"'):
                    field = Variable(field).resolve(context)
                else:
                    field = field.strip("\"'")

                f_list = qs.getlist(field)
                if value in f_list:
                    f_list.remove(value)
                    qs.setlist(field, f_list)
            elif arg.startswith("add_if_missing:"):
                # maxsplit=1 so a value containing "=" does not break the
                # two-name unpack
                k, v = arg[len("add_if_missing:") :].split("=", 1)
                if k not in qs:
                    qs[k] = Variable(v).resolve(context)
            else:
                k, v = arg.split("=", 1)
                qs[k] = Variable(v).resolve(context)

        encoded_qs = escape(qs.urlencode())
        if self.as_variable:
            context[self.as_variable] = encoded_qs
            return ""
        else:
            return encoded_qs

    @classmethod
    def qs_alter_tag(cls, parser: Parser, token: Token) -> "QueryStringAlterer":
        """
        Template tag parser for `qs_alter`.

        Args:
            parser: Django template parser.
            token: Token containing the tag and its arguments.

        Returns:
            QueryStringAlterer: A compiled node ready for rendering.

        Raises:
            TemplateSyntaxError: If the tag is used without a base query
                string argument.
        """
        from django.template import TemplateSyntaxError

        bits = token.split_contents()

        # A trailing "as <name>" selects assignment mode; the length guard
        # keeps the index lookup safe for very short tags.
        if len(bits) >= 3 and bits[-2] == "as":
            as_variable = bits[-1]
            bits = bits[0:-2]
        else:
            as_variable = None

        if len(bits) < 2:
            raise TemplateSyntaxError(
                "'%s' tag requires a base query string as its first argument"
                % bits[0]
            )

        return cls(bits[1], as_variable, *bits[2:])


# Make the node's parser available to templates under the tag name `qs_alter`.
register.tag("qs_alter", QueryStringAlterer.qs_alter_tag)


================================================
FILE: concordia/templatetags/concordia_sharing_tags.py
================================================
from typing import Dict

from django import template

register = template.Library()


@register.inclusion_tag("fragments/sharing-button-group.html")
def share_buttons(url: str, title: str) -> Dict[str, str]:
    """
    Provide the template context for the sharing button fragment.

    Behavior:
        This function is registered as an inclusion tag for
        `fragments/sharing-button-group.html`; the dictionary returned here is
        the context that fragment is rendered with.

    Usage:
        Load this module by its file name and call the tag:

            {% load concordia_sharing_tags %}
            {% share_buttons request.build_absolute_uri object.title %}

        Notes:
            - The name given to `{% load %}` is this module's name,
              `concordia_sharing_tags`.
            - NOTE(review): capturing the output with
              `{% share_buttons ... as name %}` is documented by Django for
              `simple_tag`; confirm that the Django version in use supports it
              for `inclusion_tag` before relying on that form.

    Args:
        url: Absolute URL to share.
        title: Display title to accompany the share action.

    Returns:
        dict: Mapping used by `fragments/sharing-button-group.html` with keys:
            - `title` (str)
            - `url` (str)
    """
    return dict(title=title, url=url)


================================================
FILE: concordia/templatetags/concordia_text_tags.py
================================================
import re

from django import template

register = template.Library()

# Matches a run of one or more consecutive whitespace characters.
WHITESPACE_NORMALIZER = re.compile(r"\s+")


@register.filter
def normalize_whitespace(text: str) -> str:
    """
    Collapse every run of whitespace in `text` into one space.

    Behavior:
        Each match of `WHITESPACE_NORMALIZER` (one or more whitespace
        characters, so newlines and tabs are included) is replaced by a single
        ASCII space. Leading and trailing runs are collapsed too, not removed.

    Usage:
        In a template:

            {% load concordia_text_tags %}
            {{ some_text|normalize_whitespace }}

        In Python:

            normalize_whitespace("a\\n\\n  b\\t\\t c")  # -> "a b c"

    Args:
        text: Input text to normalize.

    Returns:
        str: Text with whitespace collapsed to single spaces.
    """
    collapsed = re.sub(WHITESPACE_NORMALIZER, " ", text)
    return collapsed


@register.filter
def reprchar(character: str) -> str:
    """
    Show a character the way Python would write it in a literal, minus the
    surrounding quotes, for example "\\\\u200b", "\\\\x00", "\\\\n".

    Behavior:
        Takes `repr(character)` and drops its first and last characters, which
        are the quotes `repr` puts around a string.

    Usage:
        In a template:

            {% load concordia_text_tags %}
            Invisible char: {{ some_char|reprchar }}

        In Python:

            reprchar("\\u200b")  # -> "\\\\u200b"

    Args:
        character: A single-character string to represent.

    Returns:
        str: The escaped representation without surrounding quotes.
    """
    quoted = repr(character)
    # Drop the opening and closing quote that repr() wrapped around the text.
    return quoted[1:-1]


================================================
FILE: concordia/templatetags/custom_math.py
================================================
from typing import Any

from django import template

register = template.Library()


@register.filter(name="multiply")
def multiply(value: Any, arg: Any) -> Any:
    """
    Template filter returning `value * arg`.

    Behavior:
        Applies Python's `*` operator to the two operands as given; no type
        conversion is performed, so the result follows the operand types.

    Usage:
        In a template:

            {% load custom_math %}
            {{ 6|multiply:7 }}            {# 42 #}
            {{ price|multiply:quantity }} {# product of variables #}

        In Python:

            multiply(3, 5)   # -> 15
            multiply("a", 3) # -> "aaa"

    Args:
        value: Left operand.
        arg: Right operand.

    Returns:
        Any: The result of `value * arg`.
    """
    product = value * arg
    return product


================================================
FILE: concordia/templatetags/group_list.py
================================================
from typing import Any, Sequence

from django import template

register = template.Library()


@register.filter
def batch(value: Sequence[Any], size: int) -> list[Sequence[Any]]:
    """
    Split a sequence into consecutive slices of at most `size` items.

    Behavior:
        Walks `value` in steps of `size` and collects `value[i : i + size]`
        for each step. Every slice has `size` items except possibly the last.
        An empty `value` yields an empty list.

    Usage:
        In a template:

            {% load group_list %}
            {% for row in items|batch:3 %}
                <div class="row">
                    {% for item in row %}
                        <span>{{ item }}</span>
                    {% endfor %}
                </div>
            {% endfor %}

        In Python:

            batch([1, 2, 3, 4, 5], 2)  # -> [[1, 2], [3, 4], [5]]
            batch(("a", "b", "c"), 4)  # -> [("a", "b", "c")]

    Args:
        value: The sequence to split. Must support `len()` and slicing.
        size: The maximum size of each chunk. It is passed through `int()`
            here, so a numeric string such as `"3"` is accepted. A value of
            zero makes `range()` raise `ValueError`.

    Returns:
        list[Sequence[Any]]: Consecutive slices of `value`, each at most `size`
        elements long.
    """
    step = int(size)
    chunks = []
    for start in range(0, len(value), step):
        chunks.append(value[start : start + step])
    return chunks


================================================
FILE: concordia/templatetags/reject_filter.py
================================================
from typing import Any

from django import template

register = template.Library()


@register.filter
def reject(value: Any, args: str) -> Any:
    """
    Drop unwanted items from a list or from a space-separated string.

    Behavior:
        - A falsy `value` (empty string, empty list, `None`, ...) is returned
          unchanged.
        - A string `value` is split on whitespace into tokens; any other
          `value` is converted with `list()`.
        - `args` is split on commas, without stripping whitespace around the
          pieces, and every item equal to one of those pieces is removed.
          Matching is exact: rejecting `warn` does not remove `warning`.

    Usage:
        In a template:

            {% load reject_filter %}
            {{ "error warn marked-safe"|reject:"marked-safe" }}
            {# -> "error warn" #}

            {{ "error warning marked-safe"|reject:"marked-safe,warn" }}
            {# -> "error warning" ("warning" is not equal to "warn") #}

            {{ my_list|reject:"deprecated,hidden" }}
            {# If my_list == ["ok", "deprecated", "x", "hidden"] then
               -> ["ok", "x"] #}

        In Python:

            reject("a b c", "b")            # -> "a c"
            reject(["a", "b", "c"], "b,c")  # -> ["a"]

    Args:
        value: Input to filter. A space-separated string or an iterable.
        args: Comma-separated items to remove.

    Returns:
        If `value` is a string, a space-joined string of remaining tokens.
        Otherwise a list of remaining items.
    """
    if not value:
        return value

    is_text = isinstance(value, str)
    candidates = value.split() if is_text else list(value)

    unwanted = set(args.split(","))
    kept = [candidate for candidate in candidates if candidate not in unwanted]

    if is_text:
        return " ".join(kept)
    return kept


================================================
FILE: concordia/templatetags/truncation.py
================================================
import unicodedata

from django import template
from django.template.defaultfilters import stringfilter
from django.utils.text import Truncator, add_truncation_text

register = template.Library()


class WordBreakTruncator(Truncator):
    """
    `Truncator` subclass adding `word_break`, a character-count truncation
    that cuts between whitespace-separated words.
    """

    def word_break(self, num: int, truncate: str | None = None) -> str:
        """
        Return the text truncated to no longer than the given number of
        characters, cutting at the most recent word break.

        The wrapped text is NFC-normalized first. Only non-combining Unicode
        code points are counted, both in the text and in the truncation text.

        Args:
            num (int): Maximum length of the resulting string, including any
                truncation text. Passed through `int()`.
            truncate (str | None): The text to append when truncation occurs.
                It is handed to `add_truncation_text`, which decides what to
                use when it is `None`.

        Returns:
            str: The NFC-normalized text unchanged when it has at most `num`
            counted characters; otherwise the shortened text with the
            truncation text applied by `add_truncation_text`.
        """
        self._setup()
        length = int(num)
        text = unicodedata.normalize("NFC", self._wrapped)

        # Calculate the length to truncate to (max length - end_text length).
        # Only non-combining characters of the truncation text are counted,
        # and counting stops as soon as the remaining budget is exactly zero.
        truncate_len = length
        for char in add_truncation_text("", truncate):
            if not unicodedata.combining(char):
                truncate_len -= 1
                if truncate_len == 0:
                    break
        return self._text_word_break(length, truncate, text, truncate_len)

    def _text_word_break(
        self, length: int, truncate: str | None, text: str, truncate_len: int
    ) -> str:
        """
        Truncate a string after a given number of characters, cutting at the
        most recent word break.

        Args:
            length (int): Maximum number of counted characters allowed before
                truncation is triggered.
            truncate (str | None): The text to append when truncation occurs.
            text (str): The normalized source string.
            truncate_len (int): The effective content length budget after
                subtracting the truncation text length.

        Returns:
            str: The original string if no truncation is needed; otherwise the
            truncated string with truncation text appended.
        """
        s_len = 0
        # Index of the first counted character that exceeds `truncate_len`;
        # the kept prefix is `text[:end_index]`.
        end_index = None
        for i, char in enumerate(text):
            if unicodedata.combining(char):
                # Do not count combining characters toward the visible length.
                continue
            s_len += 1
            if end_index is None and s_len > truncate_len:
                end_index = i
            if s_len > length:
                # The text is too long: take the prefix that fits the budget,
                # split it on whitespace, drop its last token and re-join the
                # rest with single spaces before adding the truncation text.
                # NOTE(review): the last token is dropped even when the prefix
                # happens to end exactly on a word boundary, and runs of
                # whitespace in the kept part collapse to one space.
                return add_truncation_text(
                    " ".join(text[: end_index or 0].split()[:-1]), truncate
                )

        # Return the original string since no truncation was necessary.
        return text


@register.filter(is_safe=True)
@stringfilter
def truncatechars_on_word_break(value: str, arg: int | str) -> str:
    """
    Truncate a string after a given number of characters, cutting at the most
    recent word break.

    Behavior:
        - Counts only non-combining Unicode code points toward the limit.
        - If truncation occurs, appends the marker "[…]".
        - Preserves whole words by backing up to the previous word boundary.
        - Delegates the actual work to `WordBreakTruncator.word_break`.

    Usage:
        In a template:

            {% load truncation %}
            {{ long_text|truncatechars_on_word_break:120 }}

        In Python:

            truncatechars_on_word_break("alpha beta gamma", 12)
            # returns "alpha[…]" (assuming Django's `add_truncation_text`
            # appends the marker directly to the kept text)

    Args:
        value (str): The source text to truncate.
        arg (int | str): Maximum length. It is passed through `int()`. Values
            that `int()` rejects, whether by `ValueError` (for example
            `"abc"`) or `TypeError` (for example `None`), cause the original
            text to be returned unchanged.

    Returns:
        str: The truncated string, or the original string if no truncation is
        needed or the argument is invalid.
    """
    try:
        length = int(arg)
    except (TypeError, ValueError):
        # int() rejected the argument (bad literal or unsupported type such as
        # None); fail silently and return the original text.
        return value
    return WordBreakTruncator(value).word_break(length, "[…]")


================================================
FILE: concordia/templatetags/visualization.py
================================================
# concordia/templatetags/visualization.py

from django import template
from django.utils.html import escape, format_html, format_html_join
from django.utils.safestring import SafeString

register = template.Library()


@register.simple_tag
def concordia_visualization(name: str, **attrs) -> SafeString:
    """
    Render the container markup for a named visualization.

    The output is a `<div>` wrapping a `<section>` that wraps a `<canvas>`
    whose `id` is `name`. The `<div>` always carries the
    `visualization-container` class; keyword arguments given to the tag become
    further attributes on the `<div>`.

    Usage:
        Template:

            {% load visualization %}
            {% concordia_visualization "daily-activity"
                style="float:left;" class="chart" %}

        Output (shown wrapped; the tag emits it without line breaks):

            <div style="float:left;" class="visualization-container chart">
                <section>
                    <canvas id="daily-activity"></canvas>
                </section>
            </div>

        Notes:
            - A `class` argument is appended after `visualization-container`.
              Because the class entry is removed and re-added, `class` is
              always the last attribute emitted.
            - All attribute names and values are escaped.
            - This function emits no `<script>` element.
            - NOTE(review): attribute names arrive as keyword arguments, so
              hyphenated names such as `data-role` may not be accepted by
              Django's tag parser; confirm before using them.

    Args:
        name (str): The slug used as the `id` of the `<canvas>` element.
        **attrs: Any HTML attributes to apply to the outer `<div>` container.

    Returns:
        SafeString: Escaped HTML for the container, section, and canvas.
    """
    # The container class always comes first, followed by any caller classes.
    extra_classes = attrs.pop("class", "")
    if extra_classes:
        attrs["class"] = f"visualization-container {extra_classes}"
    else:
        attrs["class"] = "visualization-container"

    # Render `key="value"` pairs separated by spaces; both halves of every
    # pair are escaped before being joined.
    escaped_pairs = ((escape(key), escape(value)) for key, value in attrs.items())
    joined_attrs = format_html_join(" ", '{}="{}"', escaped_pairs)
    # Leading space so the attributes can follow "<div" directly.
    div_attrs = format_html(" {}", joined_attrs)

    # The section lets the canvas's container grow to fit, while the outer div
    # allows extra elements (e.g., a csv) to be added without resizing the
    # section. format_html escapes `name` and returns safe markup.
    return format_html(
        '<div{}><section><canvas id="{}"></canvas></section></div>',
        div_attrs,
        name,
    )


================================================
FILE: concordia/tests/README.md
================================================
# Concordia Tests

This directory contains tests for the concordia app. The tests
use Django's `TestCase`, so the test runner creates a test database
before the tests run.

## Pre-requisites

-   Regarding Django TestCases, since these tests create a test database, the docker container with the db must be running — for example:

    ```console
    $ docker-compose up -d db
    ```

-   Use the settings module with defaults appropriate for testing:

    ```console
    $ export DJANGO_SETTINGS_MODULE=concordia.settings_test
    ```

    or

    ```console
    $ pipenv run manage.py test --settings=concordia.settings_test
    ```

## Running the tests

-   To run all tests:

    ```console
    $ python manage.py test concordia
    ```

*   To run a single unittest module:

    ```console
    $ python manage.py test concordia.tests.test_view
    ```

*   To run a single unittest in a django unittest module:

    ```console
    $ python manage.py test concordia.tests.test_view.ViewTest1.test_addition
    ```


================================================
FILE: concordia/tests/__init__.py
================================================


================================================
FILE: concordia/tests/axe.py
================================================
# Code originally from
# https://github.com/mozilla-services/axe-selenium-python/blob/3cfbdd67c9b40ab03f37b3ba2521f77c2071827b/axe_selenium_python/axe.py
# This Source Code Form is subject to the terms of the Mozilla Public
# License, v. 2.0. If a copy of the MPL was not distributed with this
# file, You can obtain one at http://mozilla.org/MPL/2.0/.

import json
import os
from io import open

from django.conf import settings

# Path of the axe-core script to inject: the DEFAULT_AXE_SCRIPT setting when it
# is truthy, otherwise node_modules/axe-core/axe.min.js next to this file.
_DEFAULT_SCRIPT = settings.DEFAULT_AXE_SCRIPT or os.path.join(
    os.path.dirname(__file__), "node_modules", "axe-core", "axe.min.js"
)


class Axe:
    """
    Helper that injects the axe-core script into a browser session and runs it.

    `py` is the driver object used to execute JavaScript; this class only
    calls its `execute_script` and `execute_async_script` methods.
    `script_path` is the path of the axe-core JavaScript file to inject.
    """

    def __init__(self, py, script_path=_DEFAULT_SCRIPT):
        self.script_path = script_path
        self.py = py

    def violations(self, report=None):
        """
        Injects aXe into the current document then runs it and returns
        any violations found.

        :param report: Whether to generate a report or not. Can be None,
                       True or a string. If True, write_results is run with
                       the default filename, otherwise used as the filename
                       for write_results. If None or False, write_results is
                       not called.
        :type report: bool, str or None
        :returns: The "violations" entry of the response from aXe
        :rtype: list
        """
        self.inject()
        results = self.run()
        if report:
            if report is True:
                self.write_results(results)
            else:
                self.write_results(results, report)
        return results["violations"]

    def inject(self):
        """
        Inject the aXe script into the current document.

        The script file at `script_path` is read as UTF-8 and executed through
        the driver's `execute_script`.
        """
        with open(self.script_path, "r", encoding="utf8") as f:
            self.py.execute_script(f.read())

    def run(self, context=None, options=None):
        """
        Run axe against the current page.

        Arguments are serialized with `json.dumps` so that Python values such
        as `True`, `False` and `None` become valid JavaScript.

        :param context: which page part(s) to analyze and/or what to exclude.
                        A string is sent as a quoted JavaScript string.
        :param options: dictionary of aXe options. A string is inserted
                        verbatim as JavaScript source, as in earlier versions.
        :returns: Whatever the driver's `execute_async_script` returns.
        """
        template = (
            "var callback = arguments[arguments.length - 1];"
            + "axe.run(%s).then(results => callback(results))"
        )

        js_args = []
        if context is not None:
            js_args.append(json.dumps(context))
        if options is not None:
            if isinstance(options, str):
                # Already JavaScript source; pass it through unchanged.
                js_args.append(options)
            else:
                js_args.append(json.dumps(options))

        # The comma delimiter only appears when both parameters are passed.
        command = template % ",".join(js_args)
        return self.py.execute_async_script(command)

    def report(self, violations):
        """
        Return readable report of accessibility violations found.

        :param violations: List of violation dictionaries as returned by
                           `violations()`.
        :type violations: list
        :return report: Readable report of violations.
        :rtype: string
        """
        parts = [f"Found {len(violations)} accessibility violations:"]
        for violation in violations:
            parts.append(
                f"\n\n\nRule Violated:\n{violation['id']} - "
                f"{violation['description']}"
                f"\n\tURL: {violation['helpUrl']}"
                f"\n\tImpact Level: {violation['impact']}"
                "\n\tTags:"
            )
            parts.extend(f" {tag}" for tag in violation["tags"])
            parts.append("\n\tElements Affected:")
            i = 1
            for node in violation["nodes"]:
                for target in node["target"]:
                    # Formatting (rather than concatenating) keeps this from
                    # failing when a target is not a plain string.
                    parts.append(f"\n\t{i}) Target: {target}")
                    i += 1
                for check_group in ("all", "any", "none"):
                    for item in node[check_group]:
                        parts.append(f"\n\t\t{item['message']}")
            parts.append("\n\n\n")
        return "".join(parts)

    def write_results(self, data, name=None):
        """
        Write JSON to file with the specified name.

        :param data: JSON-serializable object to write.
        :param name: Path to the file to be written to. If no path is passed
                     a new JSON file "results.json" will be created in the
                     current working directory.
        """

        if name:
            filepath = os.path.abspath(name)
        else:
            # os.getcwd() is the working-directory lookup; os.path has no
            # getcwd attribute.
            filepath = os.path.join(os.getcwd(), "results.json")

        with open(filepath, "w", encoding="utf8") as f:
            f.write(json.dumps(data, indent=4))


================================================
FILE: concordia/tests/data/site_reports.csv
================================================
created_on,time,campaign
05/27/2024,10:13 PM UTC,1
05/26/2024,10:12 PM UTC,


================================================
FILE: concordia/tests/test_account_views.py
================================================
"""
Tests for user account-related views
"""

from smtplib import SMTPException
from unittest.mock import patch

from django import forms
from django.contrib.messages import get_messages
from django.core import mail, signing
from django.core.cache import cache
from django.test import TestCase, override_settings
from django.urls import reverse
from django.utils.timezone import now

from concordia.models import ConcordiaUser, Transcription, User, UserProfileActivity
from concordia.utils import get_anonymous_user

from .utils import (
    CacheControlAssertions,
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
    create_campaign,
    create_transcription,
)


@override_settings(RATELIMIT_ENABLE=False)
class ConcordiaAccountViewTests(
    CreateTestUsers, JSONAssertMixin, CacheControlAssertions, TestCase
):
    """
    This class contains the unit tests for the view in the concordia app.
    """

    def setUp(self):
        # Clear the cache before every test in this class.
        cache.clear()

    def tearDown(self):
        # Clear the cache again after every test in this class.
        cache.clear()

    def test_AccountProfileView_get(self):
        """
        Test the http GET on route account/profile

        Covers the plain page, the `activity`, `status` and `start`/`end`
        query parameters, and the review totals shown once the user has a
        UserProfileActivity record.
        """

        self.login_user()

        # Plain request: page renders for the logged-in user and shows their
        # username and email.
        response = self.client.get(reverse("user-profile"))
        self.assertEqual(response.status_code, 200)
        self.assertUncacheable(response)
        self.assertTemplateUsed(response, template_name="account/profile.html")
        self.assertEqual(response.context["user"], self.user)
        self.assertContains(response, self.user.username)
        self.assertContains(response, self.user.email)

        # With an activity filter the "recent" tab is expected to be active.
        response = self.client.get(reverse("user-profile"), {"activity": "transcribed"})
        self.assertEqual(response.status_code, 200)
        self.assertUncacheable(response)
        self.assertTemplateUsed(response, template_name="account/profile.html")
        self.assertEqual(response.context["user"], self.user)
        self.assertEqual(response.context["active_tab"], "recent")

        # With a status filter the status is echoed back in the context.
        response = self.client.get(reverse("user-profile"), {"status": "submitted"})
        self.assertEqual(response.status_code, 200)
        self.assertUncacheable(response)
        self.assertTemplateUsed(response, template_name="account/profile.html")
        self.assertEqual(response.context["user"], self.user)
        self.assertEqual(response.context["active_tab"], "recent")
        self.assertEqual(response.context["status_list"], ["submitted"])

        # With a date range both bounds are echoed back in the context.
        response = self.client.get(
            reverse("user-profile"), {"start": "1970-01-01", "end": "1970-01-02"}
        )
        self.assertEqual(response.status_code, 200)
        self.assertUncacheable(response)
        self.assertTemplateUsed(response, template_name="account/profile.html")
        self.assertEqual(response.context["user"], self.user)
        self.assertEqual(response.context["end"], "1970-01-02")
        self.assertEqual(response.context["start"], "1970-01-01")

        # Create a transcription by the anonymous user that the logged-in user
        # has reviewed and accepted.
        anon = get_anonymous_user()
        asset = create_asset()
        t = asset.transcription_set.create(asset=asset, user=anon)
        t.submitted = now()
        t.accepted = now()
        t.reviewed_by = self.user
        t.save()
        # when the transcription is saved, the handler should automatically
        # create or update the corresponding UserProfileActivity object
        user_profile_activity, _ = UserProfileActivity.objects.get_or_create(
            campaign=asset.item.project.campaign, user=self.user
        )
        # Set the review count explicitly so the totals below are known.
        user_profile_activity.review_count = 1
        user_profile_activity.save()
        response = self.client.get(reverse("user-profile"))
        self.assertEqual(response.status_code, 200)
        self.assertUncacheable(response)
        self.assertTemplateUsed(response, template_name="account/profile.html")
        self.assertEqual(response.context["user"], self.user)
        self.assertEqual(response.context["totalReviews"], 1)
        self.assertEqual(response.context["totalCount"], 1)

    def test_AccountProfileView_post(self):
        """
        This unit test tests the post entry for the route account/profile

        It covers rejecting an unchanged email, changing the email with
        reconfirmation disabled, updating first/last name, and leaving the
        names untouched when the name form is invalid.
        """
        test_email = "tester2@example.com"

        self.login_user()

        with self.settings(REQUIRE_EMAIL_RECONFIRMATION=False):
            # First, test trying to 'update' to the already used email
            response = self.client.post(
                reverse("user-profile"),
                {"email": self.user.email, "username": "tester"},
            )

        # The page is re-rendered with an invalid form instead of redirecting.
        self.assertEqual(response.status_code, 200)
        self.assertIn("form", response.context)
        self.assertFalse(response.context["form"].is_valid())

        # Now post a new email address.
        with self.settings(REQUIRE_EMAIL_RECONFIRMATION=False):
            response = self.client.post(
                reverse("user-profile"), {"email": test_email, "username": "tester"}
            )

        self.assertEqual(response.status_code, 302)
        self.assertUncacheable(response)
        # Compare the redirect target without its "#..." fragment.
        index = response.url.find("#")
        self.assertEqual(response.url[:index], reverse("user-profile"))

        # Verify the User was correctly updated
        updated_user = User.objects.get(email=test_email)
        self.assertEqual(updated_user.email, test_email)

        # Test first/last name can be updated
        self.assertNotEqual(updated_user.first_name, "Test")
        self.assertNotEqual(updated_user.last_name, "User")
        response = self.client.post(
            reverse("user-profile"),
            {"submit_name": True, "first_name": "Test", "last_name": "User"},
        )

        self.assertRedirects(response, reverse("user-profile"))
        self.assertUncacheable(response)

        updated_user = User.objects.get(email=test_email)
        first_name = updated_user.first_name
        last_name = updated_user.last_name
        self.assertEqual(first_name, "Test")
        self.assertEqual(last_name, "User")

        # Test name form submission without valid data
        # First/last names should stay the same after post
        # The form can't really be invalid since even blank
        # values just set the names to empty strings,
        # so we need to mock an invalid response
        with patch("concordia.forms.UserNameForm.is_valid") as mock:
            mock.return_value = False
            response = self.client.post(reverse("user-profile"), {"submit_name": True})
        updated_user = User.objects.get(email=test_email)
        self.assertEqual(updated_user.first_name, first_name)
        self.assertEqual(updated_user.last_name, last_name)

    def test_AccountProfileView_post_invalid_form(self):
        """
        Posting an invalid form to the account/profile route re-renders the
        page and leaves the stored user unchanged.
        """
        self.login_user()

        profile_url = reverse("user-profile")
        payload = {"first_name": "Jimmy"}
        response = self.client.post(profile_url, payload)

        self.assertEqual(response.status_code, 200)
        self.assertUncacheable(response)

        # Re-read the user from the database: the first name must still be empty
        stored_user = User.objects.get(id=self.user.id)
        self.assertEqual(stored_user.first_name, "")

    def test_ajax_session_status_anon(self):
        """
        Without logging in, the session status endpoint returns an empty JSON
        object.
        """
        status_url = reverse("ajax-session-status")
        response = self.client.get(status_url)
        self.assertCachePrivate(response)
        payload = self.assertValidJSON(response)
        self.assertEqual(payload, {})

    def test_ajax_session_status(self):
        """
        A regular logged-in user gets their username and a list of links that
        does not include an "Admin Area" entry.
        """
        self.login_user()

        status_url = reverse("ajax-session-status")
        response = self.client.get(status_url)
        self.assertCachePrivate(response)
        payload = self.assertValidJSON(response)

        for expected_key in ("links", "username"):
            self.assertIn(expected_key, payload)

        self.assertEqual(payload["username"], self.user.username)

        has_admin_link = any(
            link["title"] == "Admin Area" for link in payload["links"]
        )
        self.assertFalse(has_admin_link)

    def test_ajax_session_status_staff(self):
        """
        A staff superuser gets their username and a list of links that
        includes an "Admin Area" entry.
        """
        self.login_user(is_staff=True, is_superuser=True)

        status_url = reverse("ajax-session-status")
        response = self.client.get(status_url)
        self.assertCachePrivate(response)
        payload = self.assertValidJSON(response)

        for expected_key in ("links", "username"):
            self.assertIn(expected_key, payload)

        self.assertEqual(payload["username"], self.user.username)

        has_admin_link = any(
            link["title"] == "Admin Area" for link in payload["links"]
        )
        self.assertTrue(has_admin_link)

    def test_ajax_messages(self):
        """
        The messages endpoint returns JSON containing a "messages" key and
        must not be cacheable.
        """
        self.login_user()

        messages_url = reverse("ajax-messages")
        response = self.client.get(messages_url)
        payload = self.assertValidJSON(response)

        self.assertIn("messages", payload)

        # Caching this view would cause the same messages to be displayed
        # multiple times, so it has to be uncacheable.
        self.assertUncacheable(response)

    def test_email_reconfirmation(self):
        """
        Walk through the email-change flow with and without reconfirmation.

        With REQUIRE_EMAIL_RECONFIRMATION enabled, the test covers a failed
        send, a successful send, several rejected confirmation attempts, the
        successful confirmation and finally the re-use of an already consumed
        key. With the setting disabled, the address is expected to change
        immediately and no email is sent.

        The steps depend on each other (mail outbox contents, the pending
        confirmation key), so their order matters.
        """
        self.login_user()
        # Confirm the user doesn't have a reconfirmation key
        concordia_user = ConcordiaUser.objects.get(id=self.user.id)
        with self.assertRaises(ValueError):
            concordia_user.get_email_reconfirmation_key()

        with self.settings(REQUIRE_EMAIL_RECONFIRMATION=True):
            email_data = {"email": "change@example.com"}
            # Simulate a mail failure: the user should be redirected with an
            # error message and nothing should land in the outbox
            with patch("django.core.mail.EmailMultiAlternatives.send") as mock:
                mock.side_effect = SMTPException()
                response = self.client.post(reverse("user-profile"), email_data)
                self.assertRedirects(
                    response, "{}#account".format(reverse("user-profile"))
                )
                messages = [
                    str(message) for message in get_messages(response.wsgi_request)
                ]
                self.assertIn(
                    "Email confirmation could not be sent.",
                    messages,
                )
                self.assertEqual(len(mail.outbox), 0)

            # Same request without the patched send: one confirmation email
            # rendered from the reconfirmation templates
            response = self.client.post(reverse("user-profile"), email_data)
            self.assertRedirects(response, "{}#account".format(reverse("user-profile")))
            self.assertTemplateUsed(response, "emails/email_reconfirmation_subject.txt")
            self.assertTemplateUsed(response, "emails/email_reconfirmation_body.txt")
            self.assertEqual(len(mail.outbox), 1)
            # Reset the outbox so the later count assertion starts from zero
            mail.outbox = []

            # The stored address must not change until the key is confirmed
            updated_user = User.objects.get(id=self.user.id)
            self.assertNotEqual(updated_user.email, email_data["email"])

            concordia_user = ConcordiaUser.objects.get(id=self.user.id)

            self.assertEqual(
                concordia_user.get_email_for_reconfirmation(), email_data["email"]
            )
            confirmation_key = concordia_user.get_email_reconfirmation_key()

            # Check if user failing validation is handled
            with patch("concordia.models.ConcordiaUser.full_clean") as mock:
                mock.side_effect = forms.ValidationError("Testing error")
                error_response = self.client.get(
                    reverse(
                        "email-reconfirmation",
                        kwargs={"confirmation_key": confirmation_key},
                    )
                )
                self.assertEqual(error_response.status_code, 403)
                self.assertTemplateUsed(
                    error_response, "account/email_reconfirmation_failed.html"
                )

            # Check if invalid data from confirmation key is handled
            with patch("django.core.signing.loads") as mock:
                mock.return_value = {
                    "username": "bad-username",
                    "email": "bad-email-address",
                }
                error_response = self.client.get(
                    reverse(
                        "email-reconfirmation",
                        kwargs={"confirmation_key": confirmation_key},
                    )
                )
                self.assertEqual(error_response.status_code, 403)
                self.assertTemplateUsed(
                    error_response, "account/email_reconfirmation_failed.html"
                )

            # Check if signing errors are handled
            with patch("django.core.signing.loads") as mock:
                mock.side_effect = signing.BadSignature()
                error_response = self.client.get(
                    reverse(
                        "email-reconfirmation",
                        kwargs={"confirmation_key": confirmation_key},
                    )
                )
                self.assertEqual(error_response.status_code, 403)
                self.assertTemplateUsed(
                    error_response, "account/email_reconfirmation_failed.html"
                )

                # Same patch, now reporting an expired signature
                mock.side_effect = signing.SignatureExpired()
                error_response = self.client.get(
                    reverse(
                        "email-reconfirmation",
                        kwargs={"confirmation_key": confirmation_key},
                    )
                )
                self.assertEqual(error_response.status_code, 403)
                self.assertTemplateUsed(
                    error_response, "account/email_reconfirmation_failed.html"
                )

            # Unpatched request with the real key: the address is updated
            confirmation_response = self.client.get(
                reverse(
                    "email-reconfirmation",
                    kwargs={"confirmation_key": confirmation_key},
                )
            )
            self.assertRedirects(
                confirmation_response, "{}#account".format(reverse("user-profile"))
            )
            updated_user = User.objects.get(id=self.user.id)
            self.assertEqual(updated_user.email, email_data["email"])

            # Using the same key a second time is expected to be rejected
            error_response = self.client.get(
                reverse(
                    "email-reconfirmation",
                    kwargs={"confirmation_key": confirmation_key},
                )
            )
            self.assertEqual(error_response.status_code, 403)
            self.assertTemplateUsed(
                error_response, "account/email_reconfirmation_failed.html"
            )

        # With reconfirmation disabled the change applies immediately and no
        # email is sent
        with self.settings(REQUIRE_EMAIL_RECONFIRMATION=False):
            email_data = {"email": "change2@example.com"}
            response = self.client.post(reverse("user-profile"), email_data)
            self.assertRedirects(response, "{}#account".format(reverse("user-profile")))
            self.assertEqual(len(mail.outbox), 0)
            updated_user = User.objects.get(id=self.user.id)
            self.assertEqual(updated_user.email, email_data["email"])

    def test_account_letter(self):
        """The user letter endpoint answers with a PDF sent as an attachment."""
        self.login_user()

        letter_response = self.client.get(reverse("user-letter"))

        self.assertEqual(letter_response.status_code, 200)
        # Checked in the same order as before: disposition first, then type
        expected_headers = {
            "Content-Disposition": "attachment; filename=letter.pdf",
            "Content-Type": "application/pdf",
        }
        for header_name, expected_value in expected_headers.items():
            self.assertEqual(letter_response[header_name], expected_value)

    def test_get_pages(self):
        """
        Request the ``get_pages`` view with each supported filter combination.

        Every request must return HTTP 200. All but the first are additionally
        required to be uncacheable.
        """
        self.login_user()
        campaign = create_campaign()
        url = reverse("get_pages")

        response = self.client.get(url, {"activity": "transcribed"})
        self.assertEqual(response.status_code, 200)

        uncacheable_queries = [
            {"activity": "reviewed", "order_by": "date-ascending"},
            {"status": ["completed"], "campaign": campaign.id},
            {"status": ["in_progress", "submitted"]},
            # Previously passed as ``kwargs={...}``, which the test client
            # treats as extra WSGI environ rather than query data, so no date
            # filter was ever sent. Send a start date only; the end-only and
            # start+end combinations are covered by the next two entries.
            {"start": "1900-01-01"},
            {"end": "1999-12-31"},
            {"start": "1900-01-01", "end": "1999-12-31"},
        ]
        for query in uncacheable_queries:
            with self.subTest(query=query):
                response = self.client.get(url, query)
                self.assertEqual(response.status_code, 200)
                self.assertUncacheable(response)

    def test_AccountDeletionView(self):
        """
        Cover the three account deletion outcomes.

        1. A user without transcriptions is removed and notified by email.
        2. A failure while sending the notification is reported as a message.
        3. A user with a transcription is kept but anonymized and deactivated.
        """
        deletion_url = reverse("account-deletion")
        homepage_url = reverse("homepage")

        # 1. Confirmation page, then actual deletion
        self.login_user()

        page = self.client.get(deletion_url)
        self.assertEqual(page.status_code, 200)
        self.assertUncacheable(page)
        self.assertTemplateUsed(page, template_name="account/account_deletion.html")
        self.assertEqual(page.context["user"], self.user)

        deleted = self.client.post(deletion_url)
        self.assertRedirects(deleted, homepage_url)
        with self.assertRaises(User.DoesNotExist):
            User.objects.get(id=self.user.id)
        self.assertEqual(len(mail.outbox), 1)

        # 2. Fresh user, mail backend failing
        mail.outbox = []
        self.user = None
        self.login_user()
        with patch("django.core.mail.EmailMultiAlternatives.send") as send_mock:
            send_mock.side_effect = SMTPException()
            failed_mail = self.client.post(deletion_url)
            self.assertRedirects(failed_mail, homepage_url)
            flashed = [str(item) for item in get_messages(failed_mail.wsgi_request)]
            self.assertIn(
                "Email confirmation of deletion could not be sent.",
                flashed,
            )
            self.assertEqual(len(mail.outbox), 0)

        # 3. Fresh user owning a transcription: the row survives, anonymized
        mail.outbox = []
        self.user = None
        self.login_user()
        owned = create_transcription(user=self.user)
        anonymized = self.client.post(deletion_url)
        self.assertRedirects(anonymized, homepage_url)

        remaining_user = User.objects.get(id=self.user.id)
        owned = Transcription.objects.get(id=owned.id)
        self.assertEqual(owned.user, remaining_user)
        self.assertIn("Anonymized", remaining_user.username)
        self.assertEqual(remaining_user.first_name, "")
        self.assertEqual(remaining_user.last_name, "")
        self.assertEqual(remaining_user.email, "")
        self.assertFalse(remaining_user.has_usable_password())
        self.assertFalse(remaining_user.is_staff)
        self.assertFalse(remaining_user.is_superuser)
        self.assertFalse(remaining_user.is_active)
        self.assertEqual(len(mail.outbox), 1)


================================================
FILE: concordia/tests/test_admin.py
================================================
import io
import zipfile
from datetime import date, datetime
from html import escape
from unittest import mock

from django.contrib import admin
from django.contrib.admin.sites import AdminSite
from django.contrib.auth.models import User
from django.http import HttpResponse, HttpResponseRedirect
from django.test import RequestFactory, TestCase
from django.urls import reverse
from django.utils import timezone
from django.utils.safestring import SafeString
from faker import Faker

from concordia.admin import (
    AssetAdmin,
    CampaignAdmin,
    CampaignRetirementProgressAdmin,
    ConcordiaFileAdmin,
    ConcordiaUserAdmin,
    ItemAdmin,
    KeyMetricsReportAdmin,
    ProjectAdmin,
    SiteReportAdmin,
    TagAdmin,
    TranscriptionAdmin,
)
from concordia.models import (
    Asset,
    Campaign,
    CampaignRetirementProgress,
    ConcordiaFile,
    Item,
    KeyMetricsReport,
    Project,
    SiteReport,
    Tag,
    Transcription,
)
from concordia.tests.utils import (
    CreateTestUsers,
    StreamingTestMixin,
    create_asset,
    create_project,
    create_site_report,
    create_tag_collection,
    create_topic,
    create_transcription,
)


class ConcordiaUserAdminTest(TestCase, CreateTestUsers, StreamingTestMixin):
    """Exercise the count columns and export actions of ``ConcordiaUserAdmin``."""

    def setUp(self):
        self.site = AdminSite()
        self.user = self.create_test_user()
        self.super_user = self.create_super_user()
        self.asset = create_asset()
        self.user_admin = ConcordiaUserAdmin(model=User, admin_site=self.site)
        self.request_factory = RequestFactory()

    def _superuser_request(self):
        # Plain GET request carrying the superuser, as used by every test here
        request = self.request_factory.get("/")
        request.user = self.super_user
        return request

    def test_transcription_count(self):
        """``transcription_count`` follows the profile's ``transcribe_count``."""
        admin_users = self.user_admin.get_queryset(self._superuser_request())
        account = admin_users.get(username=self.user.username)
        self.assertEqual(self.user_admin.transcription_count(account), 0)

        create_transcription(asset=self.asset, user=account)
        # Re-fetch through the admin queryset before updating the profile
        account = admin_users.get(username=self.user.username)
        account.profile.transcribe_count = 1
        account.profile.save()
        self.assertEqual(self.user_admin.transcription_count(account), 1)

    def test_review_count(self):
        """``review_count`` follows the profile's ``review_count``."""
        admin_users = self.user_admin.get_queryset(self._superuser_request())
        reviewer = admin_users.get(username=self.user.username)
        self.assertEqual(self.user_admin.review_count(reviewer), 0)

        reviewed = create_transcription(
            asset=self.asset, user=self.super_user, submitted=timezone.now()
        )
        reviewed.accepted = timezone.now()
        reviewed.reviewed_by = self.user
        reviewed.save()

        reviewer = admin_users.get(username=self.user.username)
        reviewer.profile.review_count = 1
        reviewer.profile.save()
        self.assertEqual(self.user_admin.review_count(reviewer), 1)

    def test_csv_export(self):
        """The CSV export lists a header row followed by one row per user."""
        request = self._superuser_request()
        # TODO: Fix this to mock date_joined rather than removing it
        self.user_admin.EXPORT_FIELDS = [
            name for name in self.user_admin.EXPORT_FIELDS if name != "date_joined"
        ]
        export = self.user_admin.export_users_as_csv(
            request, self.user_admin.get_queryset(request)
        )
        rows = self.get_streaming_content(export).split(b"\r\n")
        self.assertEqual(len(rows), 4)  # Includes empty line at the end of the file
        expected_rows = [
            b"username,email address,first name,last name,active,staff status,"
            b"superuser status,last login,transcription count,review count",
            b"testsuperuser,testsuperuser@example.com,,,True,True,True,,0,0",
            b"testuser,testuser@example.com,,,True,False,False,,0,0",
            b"",
        ]
        self.assertEqual(rows, expected_rows)

    def test_excel_export(self):
        """The Excel export produces a non-empty response body."""
        request = self._superuser_request()
        workbook = self.user_admin.export_users_as_excel(
            request, self.user_admin.get_queryset(request)
        )
        # TODO: Test contents of file (requires a library to read xlsx files)
        self.assertNotEqual(len(workbook.content), 0)


class CampaignAdminTest(TestCase, CreateTestUsers, StreamingTestMixin):
    """Tests for ``CampaignAdmin`` display helpers, retirement view and add form."""

    def setUp(self):
        self.site = AdminSite()
        self.user = self.create_test_user()
        self.staff_user = self.create_staff_user()
        self.super_user = self.create_super_user()
        self.asset = create_asset()
        self.campaign = self.asset.item.project.campaign
        self.campaign_admin = CampaignAdmin(model=Campaign, admin_site=self.site)
        self.fake = Faker()
        self.request_factory = RequestFactory()

    def test_truncated_description(self):
        """``truncated_description`` is empty for no text and a prefix otherwise."""
        self.campaign.description = ""
        self.assertEqual(self.campaign_admin.truncated_description(self.campaign), "")

        self.campaign.description = self.fake.text()
        # This used to call truncated_metadata (copy-paste slip), which left
        # truncated_description untested for non-empty input.
        truncated_description = self.campaign_admin.truncated_description(
            self.campaign
        )
        self.assertNotEqual(truncated_description, "")
        # Drop a possible trailing ellipsis so the check holds whether or not
        # the text was long enough to be cut.
        self.assertIn(
            truncated_description.rstrip("\u2026"), self.campaign.description
        )

    def test_truncated_metadata(self):
        """``truncated_metadata`` is empty for ``{}`` and safe ``<code>`` markup otherwise."""
        self.campaign.metadata = {}
        self.assertEqual(self.campaign_admin.truncated_metadata(self.campaign), "")
        self.campaign.metadata[self.fake.unique.word()] = self.fake.text()
        truncated_metadata = self.campaign_admin.truncated_metadata(self.campaign)
        self.assertIs(type(truncated_metadata), SafeString)
        self.assertRegex(truncated_metadata, r"<code>.*</code>")

    def test_retire(self):
        """The retire view rejects staff users and retires the campaign for superusers."""
        retire_url = reverse(
            "admin:concordia_campaign_retire", args=[self.campaign.slug]
        )

        # Staff users without superuser status are refused
        self.client.force_login(self.staff_user)
        response = self.client.get(retire_url)
        self.assertEqual(response.status_code, 403)

        # An unknown slug redirects instead of rendering the confirmation page
        self.client.logout()
        self.client.force_login(self.super_user)
        response = self.client.get(
            reverse(
                "admin:concordia_campaign_retire", args=[self.campaign.slug + "bad"]
            )
        )
        self.assertEqual(response.status_code, 302)

        # GET shows the confirmation page
        response = self.client.get(retire_url)
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(
            response, template_name="admin/concordia/campaign/retire.html"
        )
        self.assertContains(response, "Are you sure?")

        # POST confirms and the campaign ends up retired
        response = self.client.post(retire_url, {"post": "yes"})
        self.assertEqual(response.status_code, 302)
        campaign = Campaign.objects.get(pk=self.campaign.pk)
        self.assertEqual(campaign.status, Campaign.Status.RETIRED)

    def test_campaign_admin(self):
        """The add form renders and shows the expected field labels."""
        self.client.force_login(self.super_user)
        response = self.client.get(reverse("admin:concordia_campaign_add"))
        self.assertEqual(response.status_code, 200)
        self.assertContains(response, "form")
        self.assertContains(response, "Display on homepage")
        self.assertContains(response, "Next transcription campaign")
        self.assertContains(response, "Next review campaign")


class HelpfulLinkAdminTest(TestCase, CreateTestUsers):
    """Smoke test for the HelpfulLink admin add page."""

    def setUp(self):
        self.super_user = self.create_super_user()

    def test_helpfullink_admin(self):
        """A superuser can load the add form."""
        add_url = reverse("admin:concordia_helpfullink_add")
        self.client.force_login(self.super_user)
        add_page = self.client.get(add_url)
        self.assertEqual(add_page.status_code, 200)


class ConcordiaFileAdminTest(TestCase, CreateTestUsers):
    """Tests for ``ConcordiaFileAdmin.file_url`` and ``get_fields``."""

    def setUp(self):
        self.site = AdminSite()
        self.staff_user = self.create_staff_user()
        self.super_user = self.create_super_user()
        self.concordia_file_admin = ConcordiaFileAdmin(
            model=ConcordiaFile, admin_site=self.site
        )
        self.request_factory = RequestFactory()

    def test_link_url(self):
        """``file_url`` returns the uploaded file's URL without its query string."""

        # Minimal stand-ins: only ``uploaded_file.url`` is provided
        class MockFile:
            url = "http://example.com?arg=true"

        class MockConcordiaFile:
            uploaded_file = MockFile()

        stand_in = MockConcordiaFile()
        self.assertEqual(
            self.concordia_file_admin.file_url(stand_in), "http://example.com"
        )

    def test_get_fields(self):
        """``file_url`` is listed only when an existing object is passed."""
        request = self.request_factory.get("/")

        add_fields = self.concordia_file_admin.get_fields(request)
        self.assertNotIn("path", add_fields)
        self.assertNotIn("file_url", add_fields)

        change_fields = self.concordia_file_admin.get_fields(request, object())
        self.assertNotIn("path", change_fields)
        self.assertIn("file_url", change_fields)


class ProjectAdminTest(TestCase, CreateTestUsers):
    """Tests for ``ProjectAdmin`` lookup filtering and the item import view."""

    def setUp(self):
        self.site = AdminSite()
        self.super_user = self.create_super_user()
        self.staff_user = self.create_staff_user()
        self.project_admin = ProjectAdmin(model=Project, admin_site=self.site)
        self.project = create_project()
        self.url_lookup = "admin:concordia_project_item-import"

    def test_lookup_allowed(self):
        """Only the campaign and campaign-id lookups are permitted."""
        self.assertTrue(self.project_admin.lookup_allowed("campaign__id__exact", 0))
        self.assertTrue(self.project_admin.lookup_allowed("campaign", 0))
        self.assertFalse(self.project_admin.lookup_allowed("campaign__slug__exact", 0))

    def test_item_import_view(self):
        """
        Exercise the item import view.

        Covers permission checks, an unknown project, the initial form, an
        invalid submission, an unsupported URL and the two supported URL types
        (item and collection), each of which should queue its import task.
        """
        import_url = reverse(self.url_lookup, args=[self.project.id])

        # Staff users are not allowed to use the import view
        self.client.force_login(self.staff_user)
        response = self.client.get(import_url)
        self.assertEqual(response.status_code, 403)
        self.client.logout()

        self.client.force_login(self.super_user)
        # Unknown project id
        response = self.client.get(reverse(self.url_lookup, args=[self.project.id + 1]))
        self.assertEqual(response.status_code, 404)

        response = self.client.get(import_url)
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(
            response, template_name="admin/concordia/project/item_import.html"
        )

        # Invalid submission. The POST result used to be discarded, so the
        # assertions below re-checked the earlier GET response instead.
        response = self.client.post(
            import_url,
            {"bad_param": "https://example.com"},
        )
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(
            response, template_name="admin/concordia/project/item_import.html"
        )

        # A URL the importer does not recognise raises ValueError
        with self.assertRaises(ValueError):
            self.client.post(
                import_url,
                {"import_url": "https://example.com"},
            )

        with mock.patch(
            "importer.tasks.items.create_item_import_task.delay"
        ) as task_mock:
            self.client.post(
                import_url,
                {"import_url": "https://www.loc.gov/item/example"},
            )
            self.assertTrue(task_mock.called)

        with mock.patch(
            "importer.tasks.collections.import_collection_task.delay"
        ) as task_mock:
            self.client.post(
                import_url,
                {"import_url": "https://www.loc.gov/collections/example/"},
            )
            self.assertTrue(task_mock.called)


class ItemAdminTest(TestCase, CreateTestUsers):
    """Tests for ``ItemAdmin`` lookups, deletion summary, queryset and columns."""

    def setUp(self):
        self.site = AdminSite()
        self.super_user = self.create_super_user()
        self.staff_user = self.create_staff_user()
        self.user = self.create_test_user()
        self.admin = ItemAdmin(model=Item, admin_site=self.site)
        self.asset = create_asset()
        self.item = self.asset.item
        create_transcription(asset=self.asset, user=self.user)
        self.request_factory = RequestFactory()

    def test_lookup_allowed(self):
        """Only the campaign-id lookup through project is permitted."""
        allowed = self.admin.lookup_allowed
        self.assertTrue(allowed("project__campaign__id__exact", 0))
        self.assertFalse(allowed("project__campaign", 0))
        self.assertFalse(allowed("project__campaign__slug__exact", 0))

    def test_get_deleted_objects(self):
        """Check the deletion summary for bulk and single-item deletes."""
        bulk_objs = range(50)
        request = self.request_factory.get("/")
        bulk_counts = {"items": 50, "assets": 1, "transcriptions": 1}

        # Staff user: same summary, but some permissions are missing
        request.user = self.staff_user
        to_delete, counts, missing_perms, protected = self.admin.get_deleted_objects(
            bulk_objs, request
        )
        self.assertEqual(len(to_delete), 4)
        self.assertEqual(counts, bulk_counts)
        self.assertNotEqual(missing_perms, set())
        self.assertEqual(protected, [])

        # Superuser: nothing missing
        request.user = self.super_user
        to_delete, counts, missing_perms, protected = self.admin.get_deleted_objects(
            bulk_objs, request
        )
        self.assertEqual(len(to_delete), 4)
        self.assertEqual(counts, bulk_counts)
        self.assertEqual(missing_perms, set())
        self.assertEqual(protected, [])

        # Superuser deleting one real item
        to_delete, counts, missing_perms, protected = self.admin.get_deleted_objects(
            [self.item], request
        )
        self.assertEqual(len(to_delete), 1)
        self.assertEqual(counts, {"items": 1, "assets": 1, "transcriptions": 1})
        self.assertEqual(missing_perms, set())
        self.assertEqual(protected, [])

    def test_get_queryset(self):
        """The admin queryset contains the single item created in ``setUp``."""
        items = self.admin.get_queryset(self.request_factory.get("/"))
        self.assertEqual(items.count(), 1)

    def test_campaign_title(self):
        """``campaign_title`` reports the title of the item's campaign."""
        expected_title = self.item.project.campaign.title
        self.assertEqual(expected_title, self.admin.campaign_title(self.item))


class AssetAdminTest(TestCase, CreateTestUsers):
    """Tests for ``AssetAdmin`` helpers, change view and action redirects."""

    def setUp(self):
        self.site = AdminSite()
        self.super_user = self.create_super_user()
        self.staff_user = self.create_staff_user()
        self.user = self.create_test_user()
        self.admin = AssetAdmin(model=Asset, admin_site=self.site)
        self.asset = create_asset()
        create_transcription(asset=self.asset, user=self.user)
        self.request_factory = RequestFactory()

    def test_get_queryset(self):
        """The admin queryset contains the single asset created in ``setUp``."""
        assets = self.admin.get_queryset(self.request_factory.get("/"))
        self.assertEqual(assets.count(), 1)

    def test_lookup_allowed(self):
        """Project-id and campaign-id lookups are permitted, bare project is not."""
        allowed = self.admin.lookup_allowed
        self.assertTrue(allowed("item__project__id__exact", 0))
        self.assertTrue(allowed("item__project__campaign__id__exact", 0))
        self.assertFalse(allowed("item__project", 0))

    def test_item_id(self):
        """``item_id`` reports the ``item_id`` of the asset's item."""
        expected_id = self.asset.item.item_id
        self.assertEqual(expected_id, self.admin.item_id(self.asset))

    def test_truncated_storage_image(self):
        """Long storage image names appear once in full and otherwise cut down."""
        markup = self.admin.truncated_storage_image(self.asset)
        image_name = self.asset.get_existing_storage_image_filename()
        self.assertEqual(markup.count(image_name), 2)

        # Swap in a very long name built from the numbers 0..199
        self.asset.storage_image.name = "".join(map(str, range(200)))
        markup = self.admin.truncated_storage_image(self.asset)
        image_name = self.asset.get_existing_storage_image_filename()
        self.assertEqual(markup.count(image_name), 1)
        self.assertEqual(markup.count(image_name[:99]), 2)

    def test_get_readonly_fields(self):
        """``item`` is read-only only when an existing asset is being edited."""
        request = self.request_factory.get("/")
        self.assertNotIn("item", self.admin.get_readonly_fields(request))
        self.assertIn("item", self.admin.get_readonly_fields(request, self.asset))

    def test_change_view(self):
        """The change page renders with the custom change form template."""
        change_url = reverse("admin:concordia_asset_change", args=[self.asset.id])
        self.client.force_login(self.super_user)
        page = self.client.get(change_url)
        self.assertEqual(page.status_code, 200)
        self.assertTemplateUsed(
            page, template_name="admin/concordia/asset/change_form.html"
        )

    def test_has_reopen_permission(self):
        """``has_reopen_permission`` can be called for superuser and staff requests."""
        request = self.request_factory.get("/")
        # Only checks that the calls do not raise; return values are ignored
        for account in (self.super_user, self.staff_user):
            request.user = account
            self.admin.has_reopen_permission(request)

    def test_response_action_redirects_with_valid_next(self):
        """A local ``next`` value is used as the redirect target."""
        changelist_url = reverse("admin:concordia_asset_changelist")
        request = self.request_factory.post(changelist_url, data={"next": "/admin/"})
        request._messages = mock.MagicMock()
        request.user = self.super_user

        all_assets = Asset.objects.all()
        asset_admin = AssetAdmin(Asset, self.site)
        asset_admin.get_actions = mock.MagicMock(return_value={})
        result = asset_admin.response_action(request, all_assets)

        self.assertIsInstance(result, HttpResponseRedirect)
        self.assertEqual(result.url, "/admin/")

    def test_response_action_falls_back_to_default_without_valid_next(self):
        """An off-site ``next`` value is ignored in favour of the default response."""
        changelist_url = reverse("admin:concordia_asset_changelist")
        request = self.request_factory.post(
            changelist_url, data={"next": "https://example.com/malicious"}
        )
        request._messages = mock.MagicMock()
        request.user = self.super_user

        all_assets = Asset.objects.all()
        asset_admin = AssetAdmin(Asset, self.site)

        parent_result = HttpResponseRedirect("/default/")
        with mock.patch.object(
            admin.ModelAdmin, "response_action", return_value=parent_result
        ):
            result = asset_admin.response_action(request, all_assets)

        self.assertEqual(result.url, "/default/")

    def test_change_view_skips_asset_logic_when_no_object_id(self):
        """Without an object id the call is handed to ``ModelAdmin.change_view``."""
        request = self.request_factory.get("/admin/concordia/asset/add/")
        request.user = self.super_user

        asset_admin = AssetAdmin(Asset, self.site)

        with mock.patch.object(
            admin.ModelAdmin, "change_view", return_value=HttpResponse("OK")
        ) as parent_change_view:
            result = asset_admin.change_view(request, object_id=None)

        self.assertEqual(result.status_code, 200)
        parent_change_view.assert_called_once()

    def test_change_view_handles_submitted_status_as_needs_review(self):
        """The change view works for an asset whose status is ``submitted``."""
        submitted_asset = create_asset(
            item=self.asset.item, slug="test-asset-2", transcription_status="submitted"
        )
        request = self.request_factory.get(
            reverse("admin:concordia_asset_change", args=[submitted_asset.pk])
        )
        request.user = self.super_user

        asset_admin = AssetAdmin(Asset, self.site)

        # Stubbed action table, shaped as (callable, name, description) tuples
        stub_actions = {
            "change_status_to_completed": (
                "func",
                None,
                "Change status to Completed",
            ),
            "change_status_to_needs_review": (
                "func",
                None,
                "Change status to Needs Review",
            ),
            "change_status_to_in_progress": (
                "func",
                None,
                "Change status to In Progress",
            ),
        }

        with mock.patch.object(asset_admin, "get_actions", return_value=stub_actions):
            with mock.patch.object(
                admin.ModelAdmin, "change_view", return_value=HttpResponse("OK")
            ) as parent_change_view:
                result = asset_admin.change_view(request, str(submitted_asset.pk))

        self.assertEqual(result.status_code, 200)
        parent_change_view.assert_called_once()

    def test_response_action_returns_default_when_no_next_url(self):
        """With no ``next`` value the parent's response is returned unchanged."""
        changelist_url = reverse("admin:concordia_asset_changelist")
        request = self.request_factory.post(changelist_url, data={})
        request._messages = mock.MagicMock()
        request.user = self.super_user

        all_assets = Asset.objects.all()
        asset_admin = AssetAdmin(Asset, self.site)

        parent_result = HttpResponseRedirect("/default/")
        with mock.patch.object(
            admin.ModelAdmin, "response_action", return_value=parent_result
        ) as parent_response_action:
            result = asset_admin.response_action(request, all_assets)

        parent_response_action.assert_called_once_with(request, all_assets)
        self.assertEqual(result, parent_result)
        self.assertEqual(result.url, "/default/")


class TagAdminTest(TestCase, CreateTestUsers, StreamingTestMixin):
    """Tests for ``TagAdmin`` lookup filtering and the CSV export action."""

    def setUp(self):
        self.site = AdminSite()
        self.super_user = self.create_super_user()
        self.user = self.create_test_user()
        self.admin = TagAdmin(model=Tag, admin_site=self.site)
        self.request_factory = RequestFactory()

    def test_lookup_allowed(self):
        """The campaign-id lookup and ``id`` are permitted, bare asset is not."""
        allowed = self.admin.lookup_allowed
        self.assertTrue(
            allowed(
                "userassettagcollection__asset__item__project__campaign__id__exact", 0
            )
        )
        self.assertTrue(allowed("id", 0))
        self.assertFalse(allowed("userassettagcollection__asset", 0))

    def test_export_tags_as_csv(self):
        """The CSV export has a header row and one row for the created tag."""
        request = self.request_factory.get("/")
        request.user = self.super_user

        # Pin "now" while the collection is created so the exported creation
        # date can be predicted
        frozen_now = timezone.now()
        with mock.patch("django.utils.timezone.now", return_value=frozen_now):
            self.collection = create_tag_collection(user=self.user)

        export = self.admin.export_tags_as_csv(
            request, self.admin.get_queryset(request)
        )
        rows = self.get_streaming_content(export).split(b"\r\n")
        self.assertEqual(len(rows), 3)  # Includes empty line at the end of the file

        header_row = (
            b"tag value,user asset tag collection date created,"
            b"user asset tag collection user_id,asset id,asset title,"
            b"asset download url,asset resource url,campaign slug"
        )
        tag_row = b"tag-value,%s,%i,%i,Test Asset,,,test-campaign" % (
            frozen_now.isoformat().encode(),
            self.user.id,
            self.collection.asset.id,
        )
        self.assertEqual(rows, [header_row, tag_row, b""])


class TranscriptionAdminTest(TestCase, CreateTestUsers, StreamingTestMixin):
    """Exercise ``TranscriptionAdmin``: lookups, text truncation, the CSV and
    Excel exports, and the ``superseded`` column / ``is_superseded`` annotation.
    """

    def setUp(self):
        self.site = AdminSite()
        self.request_factory = RequestFactory()
        self.fake = Faker()
        self.super_user = self.create_super_user()
        self.user = self.create_test_user()
        self.asset = create_asset()

        # Pin timezone.now() while the transcription is created so the
        # timestamps expected in the CSV export are known.
        frozen_now = timezone.now()
        self.mocked_datetime = frozen_now
        self.mocked_datetime_formatted = frozen_now.isoformat()
        with mock.patch("django.utils.timezone.now", return_value=frozen_now):
            self.transcription = create_transcription(asset=self.asset, user=self.user)

        self.admin = TranscriptionAdmin(model=Transcription, admin_site=self.site)

    def _make_superseded_pair(self, base_text, superseding_text):
        """Create a transcription and a second one superseding it.

        Returns ``(base, superseding, by_pk)`` where ``by_pk`` maps primary key
        to the instance as loaded through the admin's queryset.
        """
        base = create_transcription(asset=self.asset, user=self.user, text=base_text)
        superseding = create_transcription(
            asset=self.asset,
            user=self.user,
            supersedes=base,
            text=superseding_text,
        )
        request = self.request_factory.get("/")
        rows = self.admin.get_queryset(request).filter(
            pk__in=[base.pk, superseding.pk]
        )
        by_pk = {row.pk: row for row in rows}
        return base, superseding, by_pk

    def test_lookup_allowed(self):
        """The campaign-id lookup and ``id`` pass; the project-id lookup fails."""
        is_allowed = self.admin.lookup_allowed
        self.assertTrue(is_allowed("asset__item__project__campaign__id__exact", 0))
        self.assertTrue(is_allowed("id", 0))
        self.assertFalse(is_allowed("asset__item__project__id__exact", 0))

    def test_truncated_text(self):
        """Short text is returned unchanged; long text comes back shortened."""
        self.transcription.text = self.fake.text(50)
        shown = self.admin.truncated_text(self.transcription)
        self.assertEqual(shown, self.transcription.text)

        self.transcription.text = self.fake.text(500)
        shown = self.admin.truncated_text(self.transcription)
        self.assertNotEqual(shown, self.transcription.text)
        # Everything except the final character must come from the original
        # text (the last character is presumably a truncation marker).
        self.assertIn(shown[:-1], self.transcription.text)

    def test_export_to_csv(self):
        """The export streams a header row plus one row for the transcription."""
        request = self.request_factory.get("/")
        request.user = self.super_user
        queryset = self.admin.get_queryset(request)

        response = self.admin.export_to_csv(request, queryset)
        lines = self.get_streaming_content(response).split(b"\r\n")
        self.assertEqual(len(lines), 3)

        header = (
            b"ID,asset__id,asset__slug,user,created on,updated on,supersedes,"
            b"submitted,accepted,rejected,reviewed by,text,ocr generated,"
            b"ocr originated"
        )
        timestamp = self.mocked_datetime_formatted.encode()
        row = b"%i,%i,%s,%i,%s,%s,,,,,,,False,False" % (
            self.transcription.id,
            self.transcription.asset.id,
            self.transcription.asset.slug.encode(),
            self.user.id,
            timestamp,
            timestamp,
        )
        self.assertEqual(lines, [header, row, b""])

    def test_export_to_excel(self):
        """The Excel export produces a non-empty response body."""
        request = self.request_factory.get("/")
        request.user = self.super_user
        queryset = self.admin.get_queryset(request)
        response = self.admin.export_to_excel(request, queryset)
        # TODO: Test contents of file (requires a library to read xlsx files)
        self.assertNotEqual(len(response.content), 0)

    def test_show_full_result_count_is_disabled(self):
        self.assertFalse(self.admin.show_full_result_count)

    def test_list_display_includes_superseded(self):
        self.assertIn("superseded", self.admin.list_display)

    def test_list_filter_includes_superseded_param(self):
        """One of the filters exposing ``parameter_name`` uses ``superseded``."""
        parameter_names = {
            entry.parameter_name
            for entry in self.admin.list_filter
            if hasattr(entry, "parameter_name")
        }
        self.assertIn("superseded", parameter_names)

    def test_get_queryset_adds_is_superseded_annotation(self):
        """Rows from the admin queryset carry a boolean ``is_superseded``."""
        base, superseding, by_pk = self._make_superseded_pair("base", "superseding")
        self.assertIn(base.pk, by_pk)
        self.assertIn(superseding.pk, by_pk)
        self.assertTrue(hasattr(by_pk[base.pk], "is_superseded"))
        self.assertTrue(by_pk[base.pk].is_superseded)
        self.assertFalse(by_pk[superseding.pk].is_superseded)

    def test_superseded_column_uses_annotation_boolean(self):
        """``superseded()`` is true for the base row and false for its successor."""
        base, superseding, by_pk = self._make_superseded_pair(
            "base2", "superseding2"
        )
        self.assertTrue(self.admin.superseded(by_pk[base.pk]))
        self.assertFalse(self.admin.superseded(by_pk[superseding.pk]))


class SiteReportAdminTest(TestCase, CreateTestUsers, StreamingTestMixin):
    """Exercise ``SiteReportAdmin``: report-type labels, exports, the JSON
    debug view and the previous/next-in-series links.
    """

    def setUp(self):
        self.site = AdminSite()
        self.request_factory = RequestFactory()
        self.fake = Faker()
        self.super_user = self.create_super_user()

        # Pin timezone.now() while the report is created so the ``created on``
        # value expected in the CSV export is known.
        frozen_now = timezone.now()
        self.mocked_datetime = frozen_now
        self.mocked_datetime_formatted = frozen_now.isoformat()
        with mock.patch("django.utils.timezone.now", return_value=frozen_now):
            self.site_report = create_site_report()

        self.topic = create_topic()
        first_project = self.topic.project_set.all()[0]
        self.campaign = first_project.campaign
        self.admin = SiteReportAdmin(model=SiteReport, admin_site=self.site)

    def test_report_type(self):
        """The label falls back: report name, campaign, topic, then generic."""
        report = self.site_report
        describe = self.admin.report_type

        report.report_name = "Test name"
        report.campaign = self.campaign
        report.topic = self.topic
        self.assertIn("Report name", describe(report))

        report.report_name = ""
        self.assertIn("Campaign", describe(report))

        report.campaign = None
        self.assertIn("Topic", describe(report))

        report.topic = None
        self.assertIn("SiteReport", describe(report))

    def test_export_to_csv(self):
        """The export streams a header row plus one row for the report."""
        request = self.request_factory.get("/")
        request.user = self.super_user
        queryset = self.admin.get_queryset(request)

        response = self.admin.export_to_csv(request, queryset)
        lines = self.get_streaming_content(response).split(b"\r\n")
        self.assertEqual(len(lines), 3)  # Includes empty line at the end of the file

        header = (
            b"created on,report name,campaign__title,topic__title,assets total,"
            b"assets published,assets not started,assets in progress,"
            b"assets waiting review,assets completed,assets unpublished,"
            b"assets started,items published,items unpublished,projects published,"
            b"projects unpublished,anonymous transcriptions,transcriptions saved,"
            b"daily review actions,distinct tags,tag uses,campaigns published,"
            b"campaigns unpublished,users registered,users activated,"
            b"registered contributors,daily active users"
        )
        # Only the creation timestamp is populated; every other column is empty.
        row = b"%s,,,,,,,,,,,,,,,,,,,,,,,,,," % self.mocked_datetime_formatted.encode()
        self.assertEqual(lines, [header, row, b""])

    def test_export_to_excel(self):
        """The Excel export produces a non-empty response body."""
        request = self.request_factory.get("/")
        request.user = self.super_user
        queryset = self.admin.get_queryset(request)
        response = self.admin.export_to_excel(request, queryset)
        # TODO: Test contents of file (requires a library to read xlsx files)
        self.assertNotEqual(len(response.content), 0)

    def test_report_type_variants(self):
        """Same fallback chain as above, checked against saved reports."""
        describe = self.admin.report_type

        # Report name present
        named = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        self.assertIn("Report name", describe(named))

        # Campaign present, no report name
        for_campaign = SiteReport.objects.create(
            campaign=self.campaign, report_name=""
        )
        label = describe(for_campaign)
        self.assertIn("Campaign", label)
        self.assertIn(self.campaign.title, label)

        # Topic present, no report name or campaign
        for_topic = SiteReport.objects.create(
            topic=self.topic, report_name="", campaign=None
        )
        label = describe(for_topic)
        self.assertIn("Topic", label)
        self.assertIn(self.topic.title, label)

        # None of the above
        bare = SiteReport.objects.create(report_name="", campaign=None, topic=None)
        label = describe(bare)
        self.assertIn("SiteReport:", label)
        self.assertIn(str(bare.id), label)

    def test_report_json_pretty_wrap(self):
        """``report_json`` wraps the escaped debug JSON in a ``<pre>`` element."""
        report = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        raw_json = '{"a":1}'
        with mock.patch.object(SiteReport, "to_debug_json", return_value=raw_json):
            rendered = self.admin.report_json(report)
        self.assertIn("<pre", rendered)
        self.assertIn("</pre>", rendered)
        self.assertIn(escape('{"a":1}'), rendered)

    def test_previous_and_next_in_series_links(self):
        """A middle report links to its neighbours; the ends render a dash."""

        def change_url(report):
            meta = report._meta
            return reverse(
                f"admin:{meta.app_label}_{meta.model_name}_change", args=[report.pk]
            )

        def link_label(report):
            return f"{report.created_on:%Y-%m-%d %H:%M:%S} (id {report.pk})"

        # Build a small series of TOTAL snapshots with known timestamps.
        tz = timezone.get_current_timezone()
        stamps = [
            timezone.make_aware(datetime(2024, 1, 1, hour, 0, 0), tz)
            for hour in (10, 11, 12)
        ]
        created = [
            SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
            for _ in stamps
        ]

        # Set exact created_on values
        for report, stamp in zip(created, stamps):
            SiteReport.objects.filter(pk=report.pk).update(created_on=stamp)

        # Reload from DB to get updated created_on
        first, middle, last = (
            SiteReport.objects.get(pk=report.pk) for report in created
        )

        # Middle record should link back to the first and forward to the last
        prev_html = self.admin.previous_in_series_link(middle)
        next_html = self.admin.next_in_series_link(middle)

        self.assertIn(change_url(first), prev_html)
        self.assertIn(link_label(first), prev_html)
        self.assertIn(change_url(last), next_html)
        self.assertIn(link_label(last), next_html)

        # Edge cases: first has no previous, last has no next
        self.assertEqual(self.admin.previous_in_series_link(first), "—")
        self.assertEqual(self.admin.next_in_series_link(last), "—")


class CampaignRetirementProgressAdminTest(TestCase):
    """Check the percentage string returned by
    ``CampaignRetirementProgressAdmin.completion``.
    """

    def setUp(self):
        self.site = AdminSite()
        self.admin = CampaignRetirementProgressAdmin(
            model=CampaignRetirementProgress, admin_site=self.site
        )

        class MockCompletion:
            # Plain stand-in carrying only the counters this test sets.
            complete = False
            project_total = item_total = asset_total = 0
            projects_removed = items_removed = assets_removed = 0

        self.completion_obj = MockCompletion()

    def test_completion(self):
        progress = self.completion_obj
        render = self.admin.completion

        # A finished retirement is reported as 100%.
        progress.complete = True
        self.assertEqual(render(progress), "100%")
        progress.complete = False

        progress.project_total = 10
        progress.item_total = 100
        progress.asset_total = 1000
        self.assertEqual(render(progress), "0.0%")

        # Expected values below are consistent with removed/total summed over
        # all three kinds (1/1110, then 111/1110).
        progress.projects_removed = 1
        self.assertEqual(render(progress), "0.09%")

        progress.items_removed = 10
        progress.assets_removed = 100
        self.assertEqual(render(progress), "10.0%")


class KeyMetricsReportAdminTests(CreateTestUsers, TestCase):
    """Exercise ``KeyMetricsReportAdmin``: the per-row CSV download link and
    view, and the bulk "download as zip" action.
    """

    def setUp(self):
        self.request_factory = RequestFactory()
        self.site = AdminSite()
        self.admin = KeyMetricsReportAdmin(model=KeyMetricsReport, admin_site=self.site)
        self.super_user = self.create_super_user()

    def _make_monthly(self):
        """Create and return a monthly report covering January 2024."""
        fields = {
            "period_type": KeyMetricsReport.PeriodType.MONTHLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 1, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
            "month": 1,
        }
        return KeyMetricsReport.objects.create(**fields)

    def test_download_csv_link_builds_expected_anchor(self):
        report = self._make_monthly()
        markup = self.admin.download_csv_link(report)
        expected_url = reverse(
            "admin:concordia_keymetricsreport_download_csv", args=[report.pk]
        )
        self.assertIn('class="button"', markup)
        self.assertIn("Download CSV", markup)
        self.assertIn(expected_url, markup)

    def test_get_urls_registers_named_view(self):
        registered = [
            pattern.name
            for pattern in self.admin.get_urls()
            if hasattr(pattern, "name")
        ]
        self.assertIn("concordia_keymetricsreport_download_csv", registered)

    def test_download_csv_view_success(self):
        # Ensure monthly stage is computable in admin URLconf context
        SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)

        report = self._make_monthly()
        url = reverse("admin:concordia_keymetricsreport_download_csv", args=[report.pk])
        self.client.force_login(self.super_user)

        # Replace the model's CSV rendering and file naming with fixed values so
        # the response can be compared exactly.
        csv_patch = mock.patch.object(
            KeyMetricsReport, "render_csv", return_value=b"a,b\n1,2\n"
        )
        name_patch = mock.patch.object(
            KeyMetricsReport, "csv_filename", return_value="report.csv"
        )
        with csv_patch, name_patch:
            resp = self.client.get(url)

        self.assertEqual(resp.status_code, 200)
        self.assertEqual(resp["Content-Type"], "text/csv")
        self.assertIn('attachment; filename="report.csv"', resp["Content-Disposition"])
        self.assertEqual(resp.content, b"a,b\n1,2\n")

    def test_download_csv_view_404_when_missing(self):
        # Login so admin view runs permission checks normally
        self.client.force_login(self.super_user)
        missing_url = reverse(
            "admin:concordia_keymetricsreport_download_csv", args=["99999999"]
        )
        self.assertEqual(self.client.get(missing_url).status_code, 404)

    def test_download_selected_as_zip_streams_zip_with_csvs(self):
        january = self._make_monthly()
        february = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            period_start=date(2024, 2, 1),
            period_end=date(2024, 2, 29),  # 2024 is leap year
            fiscal_year=2024,
            fiscal_quarter=2,
            month=2,
        )
        reports = (january, february)

        with (
            mock.patch.object(
                KeyMetricsReport, "csv_filename", autospec=True
            ) as mock_fname,
            mock.patch.object(
                KeyMetricsReport, "render_csv", autospec=True
            ) as mock_csv,
        ):
            # autospec=True makes the mocks receive the report instance, so each
            # report gets a file name and body derived from its own pk.
            mock_fname.side_effect = lambda report: f"kmr-{report.pk}.csv"
            mock_csv.side_effect = lambda report: f"id,{report.pk}\n".encode("utf-8")

            req = self.request_factory.post("/")
            req.user = self.super_user
            selected = KeyMetricsReport.objects.filter(
                pk__in=[report.pk for report in reports]
            )

            resp = self.admin.download_selected_as_zip(req, selected)

        self.assertEqual(resp.status_code, 200)
        self.assertEqual(resp["Content-Type"], "application/zip")
        self.assertIn(
            'attachment; filename="key_metrics_reports.zip"',
            resp["Content-Disposition"],
        )

        with zipfile.ZipFile(io.BytesIO(resp.content), "r") as archive:
            members = set(archive.namelist())
            for report in reports:
                self.assertIn(f"kmr-{report.pk}.csv", members)
            for report in reports:
                self.assertEqual(
                    archive.read(f"kmr-{report.pk}.csv"),
                    f"id,{report.pk}\n".encode("utf-8"),
                )


================================================
FILE: concordia/tests/test_admin_actions.py
================================================
import uuid
from unittest import mock

from django.contrib.auth.models import User
from django.http import HttpRequest
from django.test import TestCase

from concordia.admin.actions import (
    anonymize_action,
    change_status_to_completed,
    change_status_to_in_progress,
    change_status_to_needs_review,
    publish_action,
    publish_item_action,
    unpublish_action,
    unpublish_item_action,
    verify_assets_action,
)
from concordia.models import (
    Asset,
    Campaign,
    Item,
    Project,
    TranscriptionStatus,
)
from concordia.tests.utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_transcription,
)
from concordia.utils import get_anonymous_user


class MockModelAdmin:
    """Empty placeholder passed as the ``modeladmin`` argument of admin actions."""


# Module-level stand-ins shared by the tests below, which invoke admin actions
# as ``action(modeladmin, request, queryset)``.
request = HttpRequest()
modeladmin = MockModelAdmin()


class UserAdminActionTest(TestCase, CreateTestUsers):
    """``anonymize_action`` scrubs the selected users and leaves others intact."""

    def setUp(self):
        self.user1, self.user2, self.user3 = (
            self.create_user(name) for name in ("user1", "user2", "user3")
        )

    def test_anonymize_action(self):
        # Anonymize users 1 and 3; user 2 is the untouched control.
        selected = User.objects.filter(pk__in=(self.user1.pk, self.user3.pk))
        anonymize_action(modeladmin, request, selected)

        fresh1, fresh2, fresh3 = (
            User.objects.get(pk=original.pk)
            for original in (self.user1, self.user2, self.user3)
        )

        self.assertIn("Anonymized", fresh1.username)
        self.assertEqual(self.user2.username, fresh2.username)
        self.assertIn("Anonymized", fresh3.username)

        self.assertEqual("", fresh1.email)
        self.assertEqual(self.user2.email, fresh2.email)
        self.assertEqual("", fresh3.email)

        self.assertFalse(fresh1.has_usable_password())
        self.assertTrue(fresh2.has_usable_password())
        self.assertFalse(fresh3.has_usable_password())

        # The original raw passwords must only still work for the control user.
        self.assertFalse(fresh1.check_password(self.user1._password))
        self.assertTrue(fresh2.check_password(self.user2._password))
        self.assertFalse(fresh3.check_password(self.user3._password))

        self.assertFalse(fresh1.is_active)
        self.assertTrue(fresh2.is_active)
        self.assertFalse(fresh3.is_active)


class ItemAdminActionTest(TestCase):
    """Item publish/unpublish actions affect the selected items and their assets."""

    def _setUp(self, published=True):
        """Build one project with three items (1, 1 and 2 assets respectively),
        all created with the given ``published`` flag."""
        common = {"published": published}

        self.asset1 = create_asset(**common)
        self.item1 = self.asset1.item
        self.project = self.item1.project

        self.item2 = create_item(project=self.project, item_id="2", **common)
        self.asset2 = create_asset(item=self.item2, slug="test-asset-slug-2", **common)

        self.item3 = create_item(project=self.project, item_id="3", **common)
        self.asset3 = create_asset(item=self.item3, slug="test-asset-slug-3", **common)
        self.asset4 = create_asset(item=self.item3, slug="test-asset-slug-4", **common)

    @staticmethod
    def _is_published(model, instance):
        """Re-read ``instance`` through ``model.objects`` and return ``published``."""
        return model.objects.get(pk=instance.pk).published

    def test_publish_item_action(self):
        self._setUp(False)
        selected = Item.objects.filter(pk__in=[self.item1.pk, self.item3.pk])
        publish_item_action(modeladmin, request, selected)

        published = self._is_published
        self.assertTrue(published(Item, self.item1))
        self.assertTrue(published(Asset, self.asset1))
        # Item 2 was not selected, so it and its asset stay unpublished.
        self.assertFalse(published(Item, self.item2))
        self.assertFalse(published(Asset, self.asset2))
        self.assertTrue(published(Item, self.item3))
        self.assertTrue(published(Asset, self.asset3))
        self.assertTrue(published(Asset, self.asset4))

    def test_unpublish_item_action(self):
        self._setUp(True)
        selected = Item.objects.filter(pk__in=[self.item1.pk, self.item3.pk])
        unpublish_item_action(modeladmin, request, selected)

        published = self._is_published
        self.assertFalse(published(Item, self.item1))
        self.assertFalse(published(Asset, self.asset1))
        # Item 2 was not selected, so it and its asset stay published.
        self.assertTrue(published(Item, self.item2))
        self.assertTrue(published(Asset, self.asset2))
        self.assertFalse(published(Item, self.item3))
        self.assertFalse(published(Asset, self.asset3))
        self.assertFalse(published(Asset, self.asset4))


class AssetAdminActionTest(TestCase, CreateTestUsers):
    """Status-changing asset actions: resulting status and the info message."""

    def setUp(self):
        self.user = self.create_user("testuser")

        # Three assets under one item: one ends up with a reviewed
        # transcription, one with an unreviewed one, one with none at all.
        self.reviewed_asset = create_asset()
        shared_item = self.reviewed_asset.item
        self.unreviewed_asset = create_asset(item=shared_item, slug="unreviewed-asset")
        self.untranscribed_asset = create_asset(
            item=shared_item, slug="untranscribed-asset"
        )
        self.asset_pks = [
            asset.pk
            for asset in (
                self.reviewed_asset,
                self.unreviewed_asset,
                self.untranscribed_asset,
            )
        ]

        self.anon_user = get_anonymous_user()
        self.request = HttpRequest()
        self.request.user = self.user

        create_transcription(asset=self.reviewed_asset, user=self.anon_user)
        create_transcription(asset=self.unreviewed_asset, user=self.anon_user)
        create_transcription(
            asset=self.reviewed_asset, user=self.anon_user, reviewed_by=self.user
        )

    def _assert_action_sets_status(self, action, expected_status):
        """Run ``action`` on all three assets and check each one's new status."""
        action(modeladmin, self.request, Asset.objects.filter(pk__in=self.asset_pks))
        for pk in self.asset_pks:
            self.assertEqual(
                Asset.objects.get(pk=pk).transcription_status, expected_status
            )

    def _info_message_for(self, action, pks):
        """Run ``action`` on the given assets with ``messages.info`` patched and
        return the message text of the last call.

        Also asserts that ``messages.info`` was called with this test's request.
        """
        selected = Asset.objects.filter(pk__in=pks)
        with mock.patch("concordia.admin.actions.messages.info") as mock_info:
            action(modeladmin, self.request, selected)

        self.assertTrue(mock_info.called)
        positional = mock_info.call_args[0]
        self.assertIs(positional[0], self.request)
        return positional[1]

    def test_change_status_to_completed(self):
        self._assert_action_sets_status(
            change_status_to_completed, TranscriptionStatus.COMPLETED
        )

    def test_change_status_to_needs_review(self):
        self._assert_action_sets_status(
            change_status_to_needs_review, TranscriptionStatus.SUBMITTED
        )

    def test_change_status_to_in_progress(self):
        self._assert_action_sets_status(
            change_status_to_in_progress, TranscriptionStatus.IN_PROGRESS
        )

    def test_change_status_to_completed_message_single(self):
        message = self._info_message_for(
            change_status_to_completed, [self.untranscribed_asset.pk]
        )
        self.assertIn("Changed status of", message)
        self.assertIn(self.untranscribed_asset.title, message)
        self.assertIn("to Complete", message)

    def test_change_status_to_completed_message_multiple(self):
        message = self._info_message_for(
            change_status_to_completed,
            [self.unreviewed_asset.pk, self.untranscribed_asset.pk],
        )
        self.assertIn("Changed status of 2 assets to Complete", message)

    def test_change_status_to_needs_review_message_single(self):
        message = self._info_message_for(
            change_status_to_needs_review, [self.untranscribed_asset.pk]
        )
        self.assertIn("Changed status of", message)
        self.assertIn(self.untranscribed_asset.title, message)
        self.assertIn("to Needs Review", message)

    def test_change_status_to_in_progress_message_multiple(self):
        extra_asset = create_asset(
            item=self.reviewed_asset.item, slug="extra-no-tx-for-in-progress"
        )
        message = self._info_message_for(
            change_status_to_in_progress,
            [self.untranscribed_asset.pk, extra_asset.pk],
        )
        self.assertIn("Changed status of 2 assets to In Progress", message)


class AdminActionTest(TestCase):
    """Generic publish/unpublish actions change only the selected rows and do
    not cascade to child objects.
    """

    def _setUp(self, published=True):
        """Build three campaign → project → item → asset chains (the third has
        two assets), all created with the given ``published`` flag."""
        common = {"published": published}

        self.asset1 = create_asset(**common)
        self.item1 = self.asset1.item
        self.project1 = self.item1.project
        self.campaign1 = self.project1.campaign

        self.campaign2 = create_campaign(slug="test-campaign-slug-2", **common)
        self.project2 = create_project(
            campaign=self.campaign2, slug="test-project-slug-2", **common
        )
        self.item2 = create_item(project=self.project2, item_id="2", **common)
        self.asset2 = create_asset(item=self.item2, slug="test-asset-slug-2", **common)

        self.campaign3 = create_campaign(slug="test-campaign-slug-3", **common)
        self.project3 = create_project(
            campaign=self.campaign3, slug="test-project-slug-3", **common
        )
        self.item3 = create_item(project=self.project3, item_id="3", **common)
        self.asset3 = create_asset(item=self.item3, slug="test-asset-slug-3", **common)
        self.asset4 = create_asset(item=self.item3, slug="test-asset-slug-4", **common)

    @staticmethod
    def _is_published(model, instance):
        """Re-read ``instance`` through ``model.objects`` and return ``published``."""
        return model.objects.get(pk=instance.pk).published

    def test_publish_action(self):
        self._setUp(False)
        published = self._is_published

        # Campaigns 1 and 3 are published; campaign 2 and project 1 are not.
        selected = Campaign.objects.filter(
            pk__in=[self.campaign1.pk, self.campaign3.pk]
        )
        publish_action(modeladmin, request, selected)
        self.assertTrue(published(Campaign, self.campaign1))
        self.assertFalse(published(Campaign, self.campaign2))
        self.assertTrue(published(Campaign, self.campaign3))
        self.assertFalse(published(Project, self.project1))

        # Only project 2 is published; its item is not.
        selected = Project.objects.filter(pk__in=[self.project2.pk])
        publish_action(modeladmin, request, selected)
        self.assertFalse(published(Project, self.project1))
        self.assertTrue(published(Project, self.project2))
        self.assertFalse(published(Project, self.project3))
        self.assertFalse(published(Item, self.item2))

        # Assets 1-3 are published; unselected asset 4 is not.
        selected = Asset.objects.filter(
            pk__in=[self.asset1.pk, self.asset2.pk, self.asset3.pk]
        )
        publish_action(modeladmin, request, selected)
        self.assertTrue(published(Asset, self.asset1))
        self.assertTrue(published(Asset, self.asset2))
        self.assertTrue(published(Asset, self.asset3))
        self.assertFalse(published(Asset, self.asset4))

    def test_unpublish_action(self):
        self._setUp(True)
        published = self._is_published

        # Campaigns 1 and 3 are unpublished; campaign 2 and project 1 are not.
        selected = Campaign.objects.filter(
            pk__in=[self.campaign1.pk, self.campaign3.pk]
        )
        unpublish_action(modeladmin, request, selected)
        self.assertFalse(published(Campaign, self.campaign1))
        self.assertTrue(published(Campaign, self.campaign2))
        self.assertFalse(published(Campaign, self.campaign3))
        self.assertTrue(published(Project, self.project1))

        # Only project 2 is unpublished; its item stays published.
        selected = Project.objects.filter(pk__in=[self.project2.pk])
        unpublish_action(modeladmin, request, selected)
        self.assertTrue(published(Project, self.project1))
        self.assertFalse(published(Project, self.project2))
        self.assertTrue(published(Project, self.project3))
        self.assertTrue(published(Item, self.item2))

        # Assets 1-3 are unpublished; unselected asset 4 stays published.
        selected = Asset.objects.filter(
            pk__in=[self.asset1.pk, self.asset2.pk, self.asset3.pk]
        )
        unpublish_action(modeladmin, request, selected)
        self.assertFalse(published(Asset, self.asset1))
        self.assertFalse(published(Asset, self.asset2))
        self.assertFalse(published(Asset, self.asset3))
        self.assertTrue(published(Asset, self.asset4))


class VerifyAssetsActionTest(TestCase):
    """
    Exercise ``verify_assets_action`` for Campaign, Project, Item and Asset
    admins, plus a model the action does not support.

    ``create_verify_asset_image_job_batch`` is patched in every test, so the
    tests only check which asset ids are handed to it and which message is
    reported back through ``message_user``.
    """

    # Dotted path of the batch helper as it is looked up by the action module.
    BATCH_HELPER = "concordia.admin.actions.create_verify_asset_image_job_batch"

    class DummyAdmin:
        """Stand-in admin object that records every ``message_user`` call."""

        def __init__(self, model):
            self.model = model
            self.messages = []

        def message_user(self, request, msg, **kwargs):
            self.messages.append((request, msg, kwargs))

    def setUp(self):
        # Campaign A with two assets
        self.asset_a1 = create_asset()
        project_a = self.asset_a1.item.project
        self.item_a2 = create_item(project=project_a, item_id="a2", published=True)
        self.asset_a2 = create_asset(item=self.item_a2, slug="asset-a2", published=True)

        # Campaign B with one asset
        self.campaign_b = create_campaign(slug="camp-b")
        self.project_b = create_project(campaign=self.campaign_b, slug="proj-b")
        self.item_b1 = create_item(project=self.project_b, item_id="b1")
        self.asset_b1 = create_asset(item=self.item_b1, slug="asset-b1")

        self.request = HttpRequest()

    def _single_message(self, admin_obj):
        """Assert exactly one message was recorded; return ``(msg, kwargs)``."""
        self.assertEqual(len(admin_obj.messages), 1)
        _request, message, extra = admin_obj.messages[0]
        return message, extra

    def test_verify_assets_action_for_campaign(self):
        """Selecting both campaigns passes all three asset ids to the batch helper."""
        admin_obj = self.DummyAdmin(model=Campaign)
        campaign_a = self.asset_a1.item.project.campaign
        queryset = Campaign.objects.filter(pk__in=[campaign_a.pk, self.campaign_b.pk])

        # Pin the uuid so the batch id shown in the message is predictable.
        fixed_uuid = uuid.UUID("12345678-1234-1234-1234-1234567890ab")
        with (
            mock.patch("concordia.admin.actions.uuid.uuid4", return_value=fixed_uuid),
            mock.patch(
                self.BATCH_HELPER, return_value=(3, "http://example/jobs")
            ) as batch_helper,
        ):
            verify_assets_action(admin_obj, self.request, queryset)

        # Assert the selected asset IDs were passed through
        handed_over = list(batch_helper.call_args[0][0])
        expected_ids = [self.asset_a1.pk, self.asset_a2.pk, self.asset_b1.pk]
        self.assertCountEqual(handed_over, expected_ids)

        # Assert the message content
        message, _extra = self._single_message(admin_obj)
        self.assertIn(
            "Created 3 VerifyAssetImageJobs as part of batch "
            "12345678-1234-1234-1234-1234567890ab",
            message,
        )
        self.assertIn('href="http://example/jobs"', message)

    def test_verify_assets_action_for_project(self):
        """Selecting project A passes both of its asset ids to the batch helper."""
        admin_obj = self.DummyAdmin(model=Project)
        project_a = self.asset_a1.item.project
        queryset = Project.objects.filter(pk__in=[project_a.pk])

        with mock.patch(
            self.BATCH_HELPER, return_value=(2, "http://example/proj")
        ) as batch_helper:
            verify_assets_action(admin_obj, self.request, queryset)

        handed_over = list(batch_helper.call_args[0][0])
        self.assertCountEqual(handed_over, [self.asset_a1.pk, self.asset_a2.pk])

        message, _extra = self._single_message(admin_obj)
        self.assertIn("Created 2 VerifyAssetImageJobs", message)

    def test_verify_assets_action_for_item(self):
        """Selecting two items passes the asset id of each to the batch helper."""
        admin_obj = self.DummyAdmin(model=Item)
        selected_pks = [self.asset_a1.item.pk, self.item_b1.pk]
        queryset = Item.objects.filter(pk__in=selected_pks)

        with mock.patch(
            self.BATCH_HELPER, return_value=(2, "http://example/item")
        ) as batch_helper:
            verify_assets_action(admin_obj, self.request, queryset)

        handed_over = list(batch_helper.call_args[0][0])
        self.assertCountEqual(handed_over, [self.asset_a1.pk, self.asset_b1.pk])

        message, _extra = self._single_message(admin_obj)
        self.assertIn("Created 2 VerifyAssetImageJobs", message)

    def test_verify_assets_action_for_asset(self):
        """Selecting assets directly passes exactly those ids to the batch helper."""
        admin_obj = self.DummyAdmin(model=Asset)
        selected_pks = [self.asset_a2.pk, self.asset_b1.pk]
        queryset = Asset.objects.filter(pk__in=selected_pks)

        with mock.patch(
            self.BATCH_HELPER, return_value=(2, "http://example/asset")
        ) as batch_helper:
            verify_assets_action(admin_obj, self.request, queryset)

        handed_over = list(batch_helper.call_args[0][0])
        self.assertCountEqual(handed_over, [self.asset_a2.pk, self.asset_b1.pk])

        message, _extra = self._single_message(admin_obj)
        self.assertIn("Created 2 VerifyAssetImageJobs", message)

    def test_verify_assets_action_for_unsupported_model(self):
        """An unsupported model yields an error message and no batch is created."""
        admin_obj = self.DummyAdmin(model=User)  # unsupported branch
        queryset = User.objects.none()

        with mock.patch(self.BATCH_HELPER) as batch_helper:
            verify_assets_action(admin_obj, self.request, queryset)

        # No batch call for unsupported model
        batch_helper.assert_not_called()

        # Error message sent
        message, extra = self._single_message(admin_obj)
        self.assertIn("This action is not available for this model.", message)
        self.assertEqual(extra.get("level"), "error")


================================================
FILE: concordia/tests/test_admin_filters.py
================================================
from django.contrib.admin import ModelAdmin
from django.test import RequestFactory, TestCase
from django.utils import timezone

from concordia.admin import (
    CardAdmin,
    HelpfulLinkAdmin,
    ItemAdmin,
    ProjectAdmin,
    SiteReportAdmin,
    TranscriptionAdmin,
)
from concordia.admin.filters import (
    CardCampaignListFilter,
    ItemProjectListFilter,
    NextAssetCampaignListFilter,
    OcrGeneratedFilter,
    ProjectCampaignListFilter,
    ProjectCampaignStatusListFilter,
    SiteReportCampaignListFilter,
    SubmittedFilter,
    SupersededListFilter,
    TopicListFilter,
)
from concordia.admin_site import ConcordiaAdminSite
from concordia.models import (
    Campaign,
    Card,
    HelpfulLink,
    Item,
    NextTranscribableCampaignAsset,
    Project,
    SiteReport,
    Transcription,
)
from concordia.tests.utils import (
    CreateTestUsers,
    create_asset,
    create_card,
    create_card_family,
    create_helpful_link,
    create_item,
    create_project,
    create_site_report,
    create_topic,
    create_transcription,
)


class NullableTimestampFilterTest(CreateTestUsers, TestCase):
    """Check ``SubmittedFilter`` against a single submitted transcription."""

    def setUp(self):
        # The only transcription in the database has ``submitted`` set.
        tester = self.create_user(username="tester")
        create_transcription(user=tester, submitted=timezone.now())

    def test_lookups(self):
        """
        "null" matches nothing, "not-null" matches the one row, and a value
        that is neither of those still yields the one row.
        """
        expectations = (
            ("null", 0),
            ("not-null", 1),
            (timezone.now(), 1),
        )
        for submitted_value, expected_count in expectations:
            timestamp_filter = SubmittedFilter(
                None,
                {"submitted": (submitted_value,)},
                Transcription,
                TranscriptionAdmin,
            )
            matched = timestamp_filter.queryset(None, Transcription.objects.all())
            self.assertEqual(matched.count(), expected_count)


class CampaignListFilterTests(CreateTestUsers, TestCase):
    """Tests for the campaign-based admin list filters (card, project, site report)."""

    def setUp(self):
        self.campaign = create_project().campaign

    def test_card_filter(self):
        """Cards only show up once the campaign's card family contains a card."""
        factory = RequestFactory()

        # Empty campaign parameter: no cards exist, so nothing is returned.
        blank_request = factory.get("/admin/concordia/card/?campaign=")
        blank_filter = CardCampaignListFilter(blank_request, {}, Card, CardAdmin)
        self.assertEqual(blank_filter.queryset(None, Card.objects.all()).count(), 0)

        # Campaign selected, but it has no card family yet.
        campaign_request = factory.get(
            "/admin/concordia/card/?campaign=%s" % self.campaign.id
        )
        campaign_filter = CardCampaignListFilter(
            campaign_request, {"campaign": (self.campaign.id,)}, Card, CardAdmin
        )
        self.assertEqual(
            campaign_filter.queryset(None, Card.objects.all()).count(), 0
        )

        # Attach a card family with one card; the same filter now finds it.
        self.campaign.card_family = create_card_family()
        self.campaign.card_family.cards.add(create_card())
        self.campaign.save()
        self.assertEqual(
            campaign_filter.queryset(None, Card.objects.all()).count(), 1
        )

    def test_project_filter(self):
        """Filtering by campaign id or by campaign status both return the project."""
        cases = (
            (
                "/admin/concordia/project/?campaign__id__exact=%s" % self.campaign.id,
                {"campaign__id__exact": (self.campaign.id,)},
            ),
            (
                "/admin/concordia/project/?campaign__status=1",
                {"campaign__status": (Campaign.Status.ACTIVE,)},
            ),
        )
        for url, params in cases:
            request = RequestFactory().get(url)
            project_filter = ProjectCampaignListFilter(
                request, params, Project, ProjectAdmin
            )
            matched = project_filter.queryset(None, Project.objects.all())
            self.assertEqual(matched.count(), 1)

    def test_site_report_filter(self):
        """
        Check output flag, expected parameters and rendered choices of
        ``SiteReportCampaignListFilter``, with and without the empty choice.
        """
        create_site_report(campaign=self.campaign)
        param = "campaign__id__exact"
        request = RequestFactory().get(
            "/admin/concordia/sitereport/?%s=%s" % (param, self.campaign.id)
        )
        site_report_admin = SiteReportAdmin(SiteReport, ConcordiaAdminSite())
        report_filter = SiteReportCampaignListFilter(
            request,
            {param: (self.campaign.id,)},
            SiteReport,
            site_report_admin,
        )
        self.assertTrue(report_filter.has_output())
        self.assertIn(param, report_filter.expected_parameters())

        # Building the changelist needs an authenticated user on the request.
        self.login_user()
        request.user = self.user
        changelist = site_report_admin.get_changelist_instance(request)

        rendered = list(report_filter.choices(changelist))
        self.assertEqual(rendered[0]["display"], "All")
        self.assertEqual(rendered[1]["display"], "Test Campaign")
        self.assertEqual(rendered[-1]["display"], "-")

        # Without the empty choice the filter reports no output and the
        # trailing "-" entry is gone.
        report_filter.include_empty_choice = False
        self.assertFalse(report_filter.has_output())

        rendered = list(report_filter.choices(changelist))
        self.assertEqual(rendered[-1]["display"], "Test Campaign")


class ItemFilterTests(CreateTestUsers, TestCase):
    """Tests for ``ItemProjectListFilter``."""

    def setUp(self):
        self.project = create_item().project

    def test_project_filter(self):
        """Filtering by project or by the project's campaign returns the item."""
        campaign_pk = self.project.campaign.pk
        cases = (
            (
                "/admin/concordia/item/?project__in=%s" % self.project.pk,
                {"project__in": (self.project.id,)},
            ),
            (
                "/admin/concordia/item/?project__campaign__id__exact=%s"
                % campaign_pk,
                {"project__campaign__id__exact": (campaign_pk,)},
            ),
        )
        for url, params in cases:
            request = RequestFactory().get(url)
            item_filter = ItemProjectListFilter(request, params, Item, ItemAdmin)
            matched = item_filter.queryset(None, Item.objects.all())
            self.assertEqual(matched.count(), 1)


class ProjectFilterTests(TestCase):
    """Tests for ``ProjectCampaignStatusListFilter``."""

    def setUp(self):
        self.project = create_item().project

    def test_project_campaign_status_list_filter(self):
        """The project is returned with no parameters and with the ACTIVE status."""
        parameter_sets = (
            {},
            {"campaign__status": (Campaign.Status.ACTIVE,)},
        )
        for params in parameter_sets:
            status_filter = ProjectCampaignStatusListFilter(
                None, params, Project, ProjectAdmin
            )
            matched = status_filter.queryset(None, Project.objects.all())
            self.assertEqual(matched.count(), 1)


class TranscriptionFilterTests(CreateTestUsers, TestCase):
    """Tests for ``OcrGeneratedFilter``."""

    def setUp(self):
        tester = self.create_user(username="tester")
        create_transcription(user=tester)

    def test_ocr_filter(self):
        """The transcription is returned with no parameters and with ``False``."""
        parameter_sets = (
            {},
            {"ocr_generated": (False,)},
        )
        for params in parameter_sets:
            # The string "No" is passed in the request position, as in the
            # original test.
            ocr_filter = OcrGeneratedFilter(
                "No", params, Transcription, TranscriptionAdmin
            )
            matched = ocr_filter.queryset(None, Transcription.objects.all())
            self.assertEqual(matched.count(), 1)


class TopicListFilterTests(TestCase):
    """Tests for ``TopicListFilter`` on the HelpfulLink admin."""

    def setUp(self):
        # One helpful link is created with the topic, one without passing it.
        self.topic = create_topic()
        self.helpful_link_1 = create_helpful_link(topic=self.topic)
        self.helpful_link_2 = create_helpful_link()

    def test_helpfullink_topic_list_filter(self):
        """No parameters returns both links; the topic id narrows it to one."""
        expectations = (
            ({}, 2),
            ({"topic__id__exact": (self.topic.id,)}, 1),
        )
        for params, expected_count in expectations:
            topic_filter = TopicListFilter(None, params, HelpfulLink, HelpfulLinkAdmin)
            matched = topic_filter.queryset(None, HelpfulLink.objects.all())
            self.assertEqual(matched.count(), expected_count)


class NextAssetCampaignListFilterTests(TestCase):
    """Tests for ``NextAssetCampaignListFilter``."""

    def setUp(self):
        # Register a single asset as a next-transcribable asset for its campaign.
        asset = create_asset()
        item = asset.item
        project = item.project
        NextTranscribableCampaignAsset.objects.create(
            asset=asset,
            campaign=asset.campaign,
            item=item,
            item_item_id=item.item_id,
            project=project,
            project_slug=project.slug,
            sequence=asset.sequence,
            transcription_status=asset.transcription_status,
        )
        self.campaign = asset.campaign

    def test_lookups_only_includes_used_campaigns(self):
        """The filter offers exactly one lookup: the campaign created in setUp."""

        class DummyAdmin(ModelAdmin):
            model = NextTranscribableCampaignAsset

        admin_instance = DummyAdmin(NextTranscribableCampaignAsset, None)
        request = RequestFactory().get(
            "/admin/concordia/nexttranscribablecampaignasset/"
        )
        campaign_filter = NextAssetCampaignListFilter(
            request, {}, NextTranscribableCampaignAsset, admin_instance
        )

        offered = list(campaign_filter.lookups(request, admin_instance))
        self.assertEqual(len(offered), 1)
        only_lookup = offered[0]
        self.assertEqual(only_lookup[0], self.campaign.id)
        self.assertEqual(only_lookup[1], self.campaign.title)


class SupersededListFilterTests(CreateTestUsers, TestCase):
    """
    Tests for ``SupersededListFilter``.

    Fixtures: ``base`` is superseded by ``superseding`` (same asset), and
    ``independent`` is a transcription on a second asset of the same item.
    """

    def setUp(self):
        self.user = self.create_user(username="tester")
        self.base = create_transcription(user=self.user, text="base")
        self.superseding = create_transcription(
            user=self.user,
            supersedes=self.base,
            text="superseding",
            asset=self.base.asset,
        )
        second_asset = create_asset(item=self.base.asset.item, slug="asset-2")
        self.independent = create_transcription(
            user=self.user, text="independent", asset=second_asset
        )

    def _filtered(self, params):
        """Build the filter with ``params`` and apply it to every transcription."""
        superseded_filter = SupersededListFilter(
            None, params, Transcription, TranscriptionAdmin
        )
        return superseded_filter.queryset(None, Transcription.objects.all())

    def _filtered_ids(self, params):
        """Return the set of transcription ids left after filtering with ``params``."""
        return set(self._filtered(params).values_list("id", flat=True))

    def test_lookups(self):
        """The filter offers "yes" and "no" with their human-readable labels."""
        request = RequestFactory().get("/admin/concordia/transcription/")
        superseded_filter = SupersededListFilter(
            request, {}, Transcription, TranscriptionAdmin
        )
        model_admin = TranscriptionAdmin(Transcription, None)
        labels = dict(superseded_filter.lookups(request, model_admin))
        self.assertIn("yes", labels)
        self.assertIn("no", labels)
        self.assertEqual(labels["yes"], "Superseded")
        self.assertEqual(labels["no"], "Not superseded")

    def test_queryset_superseded_yes(self):
        """"yes" returns only the transcription that has been superseded."""
        filtered = self._filtered({"superseded": ("yes",)})
        self.assertQuerySetEqual(
            filtered.order_by("id").values_list("id", flat=True),
            [self.base.id],
            transform=lambda x: x,
        )

    def test_queryset_superseded_no(self):
        """"no" returns the two transcriptions that have not been superseded."""
        remaining = self._filtered_ids({"superseded": ("no",)})
        self.assertEqual(remaining, {self.superseding.id, self.independent.id})

    def test_queryset_no_param_returns_all(self):
        """Without the parameter every transcription is returned."""
        remaining = self._filtered_ids({})
        self.assertEqual(
            remaining, {self.base.id, self.superseding.id, self.independent.id}
        )

    def test_queryset_ignores_unknown_value(self):
        """A value other than "yes"/"no" leaves the queryset unfiltered."""
        remaining = self._filtered_ids({"superseded": ("maybe",)})
        self.assertEqual(
            remaining, {self.base.id, self.superseding.id, self.independent.id}
        )


================================================
FILE: concordia/tests/test_admin_forms.py
================================================
from django.test import TestCase, override_settings

from concordia.admin.forms import SanitizedDescriptionAdminForm, get_cache_name_choices
from concordia.models import Campaign


class SanitizedDescriptionAdminFormTests(TestCase):
    """Tests for the HTML clean-up done by ``SanitizedDescriptionAdminForm``."""

    def test_clean(self):
        """
        The cleaned short description drops the wrapping ``div`` and the
        cleaned description drops the ``script`` element, keeping the rest.
        """
        short_description = "<p>Arm</p>"
        script_markup = "<script src=example.com/evil.js></script>"
        kept_markup = "<strong>Arm</strong>"
        # NOTE(review): the closing tag in the wrapper below is malformed
        # ("</<div>"); confirm whether that is deliberate test input.
        form = SanitizedDescriptionAdminForm(
            {
                "slug": "test",
                "title": "Test",
                "status": Campaign.Status.ACTIVE,
                "ordering": 0,
                "short_description": "<div>%s</<div>" % short_description,
                "description": script_markup + kept_markup,
            }
        )
        self.assertTrue(form.is_valid())
        self.assertEqual(form.clean_short_description(), short_description)
        self.assertEqual(form.clean_description(), kept_markup)


class ClearCacheFormTests(TestCase):
    """Tests for the cache choices offered by the clear-cache admin form."""

    @override_settings(
        CACHES={
            "default": {
                "BACKEND": "django.core.cache.backends.dummy.DummyCache",
            },
            "view_cache": {
                "BACKEND": "django.core.cache.backends.dummy.DummyCache",
            },
        }
    )
    def test_cache_name_choices(self):
        """The "default" cache is not offered as a choice; "view_cache" is."""
        offered_names = [name for name, _description in get_cache_name_choices()]
        self.assertNotIn("default", offered_names)
        self.assertIn("view_cache", offered_names)


================================================
FILE: concordia/tests/test_admin_views.py
================================================
import copy
import json
from functools import wraps
from http import HTTPStatus
from io import BytesIO
from unittest import mock

from django.contrib.messages import get_messages
from django.core.files.uploadedfile import SimpleUploadedFile
from django.test import RequestFactory, TestCase
from django.urls import reverse
from django.utils import timezone
from django.utils.text import slugify
from django.utils.timezone import now

from concordia.admin.views import SerializedObjectView
from concordia.models import Campaign, Project, TranscriptionStatus
from concordia.tests.utils import (
    CreateTestUsers,
    StreamingTestMixin,
    create_asset,
    create_campaign,
    create_card,
    create_item,
    create_project,
    create_site_report,
    create_transcription,
)
from concordia.utils import get_anonymous_user
from importer.tests.utils import create_import_asset


class TestProjectLevelExportView(CreateTestUsers, TestCase):
    """Tests for the ``admin:project-level-export`` view as a superuser."""

    def setUp(self):
        self.login_user(is_staff=True, is_superuser=True)
        self.url = reverse("admin:project-level-export")
        # Three assets that all belong to the same item.
        self.asset = create_asset(download_url="http://example.com/1234.jpg")
        shared_item = self.asset.item
        self.asset2 = create_asset(
            slug="asset-2",
            item=shared_item,
            download_url="http://example.com/5678.jpg",
        )
        self.asset3 = create_asset(
            slug="asset-3",
            item=shared_item,
            download_url="http://example.com/9012.jpg",
        )

    def test_get(self):
        """A plain GET lists the campaign title in a table cell."""
        campaign = self.asset.item.project.campaign
        response = self.client.get(self.url)
        self.assertEqual(response.status_code, 200)
        self.assertContains(response, f"<td>{campaign.title}</td>", html=True)

    def test_get_campaign(self):
        """A GET with a campaign id lists that campaign's project title."""
        project = self.asset.item.project
        response = self.client.get(self.url, {"id": project.campaign.id})
        self.assertContains(response, f"<td>{project.title}</td>", html=True)

    def test_post(self):
        """A POST returns a zip response without touching the patched boto3 resource."""
        project = self.asset.item.project
        with mock.patch("exporter.views.boto3.resource", autospec=True) as bucket_mock:
            # The parameter is 'project_name', but it actually expects the project id.
            response = self.client.post(
                f"{self.url}?slug={project.campaign.slug}",
                {"project_name": f"{project.id}"},
            )
            self.assertEqual(response.status_code, 200)
            self.assertEqual(response["Content-Type"], "application/zip")
            self.assertFalse(bucket_mock.called)


class TestFunctionBasedViews(CreateTestUsers, TestCase, StreamingTestMixin):
    """Tests for the bulk-review and site-report admin views as a superuser."""

    # Header row shared by both site-report CSV exports.
    EXPECTED_CSV_HEADER = (
        b"Date,report name,Campaign,topic__title,assets total,assets published,"
        b"assets not started,assets in progress,assets waiting review,"
        b"assets completed,assets unpublished,assets started,items published,"
        b"items unpublished,projects published,projects unpublished,"
        b"anonymous transcriptions,transcriptions saved,daily review actions,"
        b"distinct tags,tag uses,campaigns published,campaigns unpublished,"
        b"users registered,users activated,registered contributors,"
        b"daily active users"
    )

    def test_admin_bulk_import_review(self):
        """The bulk-review page answers 200 to both GET and an empty POST."""
        self.login_user(is_staff=True, is_superuser=True)
        for flag in (
            self.user.is_active,
            self.user.is_staff,
            self.user.is_superuser,
        ):
            self.assertTrue(flag)

        path = reverse("admin:bulk-review")
        self.assertEqual(self.client.get(path).status_code, 200)
        self.assertEqual(self.client.post(path, data={}).status_code, 200)

    def test_admin_site_report_view(self):
        """The site-report CSV has the header plus one row for the created report."""
        self.login_user(is_staff=True, is_superuser=True)
        # Pin "now" while the report is created so its timestamp is known.
        frozen_now = timezone.now()
        frozen_now_iso = frozen_now.isoformat()
        with mock.patch("django.utils.timezone.now", return_value=frozen_now):
            create_site_report()

        response = self.client.get(reverse("admin:site-report"))
        self.assertEqual(response.status_code, 200)
        csv_lines = self.get_streaming_content(response).split(b"\r\n")
        self.assertEqual(len(csv_lines), 3)  # Includes empty line at the end of the file
        expected_lines = [
            self.EXPECTED_CSV_HEADER,
            b"%s,,,,,,,,,,,,,,,,,,,,,,,,,," % frozen_now_iso.encode(),
            b"",
        ]
        self.assertEqual(csv_lines, expected_lines)

    def test_admin_retired_site_report_view(self):
        """The retired site-report CSV has the header plus an all-zero total row."""
        self.login_user(is_staff=True, is_superuser=True)

        response = self.client.get(reverse("admin:retired-site-report"))
        self.assertEqual(response.status_code, 200)
        csv_lines = self.get_streaming_content(response).split(b"\r\n")
        self.assertEqual(len(csv_lines), 3)  # Includes empty line at the end of the file
        expected_lines = [
            self.EXPECTED_CSV_HEADER,
            b",RETIRED TOTAL,,,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0",
            b"",
        ]
        self.assertEqual(csv_lines, expected_lines)


class TestAdminBulkImportView(CreateTestUsers, TestCase):
    def setUp(self):
        """Log in as a superuser and prepare one valid spreadsheet row."""
        self.login_user(is_staff=True, is_superuser=True)
        self.path = reverse("admin:bulk-import")

        # One spreadsheet row with every column populated.
        self.spreadsheet_data = {
            "Campaign": "Test Campaign",
            "Campaign Short Description": "Short description",
            "Campaign Long Description": "Long description",
            "Campaign Slug": "test-campaign",
            "Project Slug": "test-project",
            "Project": "Test Project",
            "Project Description": "Project description",
            "Import URLs": "http://example.com",
        }

        # Individual values, exposed for use in the tests' assertions.
        row = self.spreadsheet_data
        self.campaign_title = row["Campaign"]
        self.campaign_short_description = row["Campaign Short Description"]
        self.campaign_long_description = row["Campaign Long Description"]
        self.campaign_slug = row["Campaign Slug"]
        self.project_slug = row["Project Slug"]
        self.project_title = row["Project"]
        self.project_description = row["Project Description"]
        self.url = row["Import URLs"]

        # The upload itself is empty; tests patch the form and the reader.
        self.post_data = {"spreadsheet_file": BytesIO()}

    def test_get(self):
        """A GET renders the page with a form in the template context."""
        page = self.client.get(self.path)
        self.assertEqual(page.status_code, 200)
        self.assertIn("form", page.context)

    def test_invalid_form(self):
        """A POST without any data re-renders the page with the form."""
        page = self.client.post(self.path)
        self.assertEqual(page.status_code, 200)
        self.assertIn("form", page.context)

    def test_fully_valid_form(self):
        """
        A complete row creates the campaign and project and queues the import;
        posting the same row again reuses both instead of creating duplicates.
        """
        queued_message = (
            f"Queued {self.campaign_title} {self.project_title} "
            f"import for {self.url}"
        )

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as slurp,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            # The form always validates and the reader returns the prepared row.
            form_cls.return_value.is_valid.return_value = True
            form_cls.return_value.cleaned_data = {}
            slurp.return_value = [self.spreadsheet_data]

            first_response = self.client.post(self.path, data=self.post_data)

            self.assertEqual(first_response.status_code, 200)
            first_messages = [
                str(message) for message in get_messages(first_response.wsgi_request)
            ]
            self.assertEqual(
                first_messages,
                [
                    f"Created new campaign {self.campaign_title}",
                    f"Created new project {self.project_title}",
                    queued_message,
                ],
            )

            campaign = Campaign.objects.get()
            self.assertEqual(campaign.title, self.campaign_title)
            self.assertEqual(campaign.slug, self.campaign_slug)
            self.assertEqual(campaign.description, self.campaign_long_description)
            self.assertEqual(
                campaign.short_description, self.campaign_short_description
            )

            project = Project.objects.get()
            self.assertEqual(project.title, self.project_title)
            self.assertEqual(project.slug, self.project_slug)
            self.assertEqual(project.description, self.project_description)

            # Submit it again to test that it doesn't re-create the campaign or project
            second_response = self.client.post(self.path, data=self.post_data)
            self.assertEqual(second_response.status_code, 200)
            second_messages = [
                str(message) for message in get_messages(second_response.wsgi_request)
            ]
            self.assertEqual(
                second_messages,
                [
                    f"Reusing campaign {self.campaign_title} without modification",
                    f"Reusing project {self.project_title} without modification",
                    queued_message,
                ],
            )
            self.assertEqual(1, Campaign.objects.count())
            self.assertEqual(1, Project.objects.count())

    def test_missing_field(self):
        """A row lacking the "Campaign" column is skipped with a single message."""
        row_without_campaign = {
            column: value
            for column, value in self.spreadsheet_data.items()
            if column != "Campaign"
        }

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as slurp,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            form_cls.return_value.is_valid.return_value = True
            form_cls.return_value.cleaned_data = {}
            slurp.return_value = [row_without_campaign]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        reported = [str(message) for message in get_messages(response.wsgi_request)]
        self.assertEqual(len(reported), 1)
        self.assertEqual(reported[0], "Skipping row 0: missing fields ['Campaign']")

    def test_empty_field(self):
        """A row whose required "Campaign" value is blank is skipped with a message."""
        # Only three fields require values: Campaign, Project and Import URLs.
        # Other fields must be present but can be empty.
        # This test covers the blank-value check for one of the required fields.
        row_with_blank_campaign = {**self.spreadsheet_data, "Campaign": ""}

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as slurp,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            form_cls.return_value.is_valid.return_value = True
            form_cls.return_value.cleaned_data = {}

            # Test one empty field
            slurp.return_value = [row_with_blank_campaign]

            response = self.client.post(self.path, data=self.post_data)
            self.assertEqual(response.status_code, 200)
            reported = [str(message) for message in get_messages(response.wsgi_request)]
            self.assertEqual(len(reported), 1)
            self.assertEqual(
                reported[0],
                "Skipping row 0: at least one required field "
                "(Campaign, Project, Import URLs) is empty",
            )

    def test_all_empty_fields(self):
        """A row in which every value is empty produces no messages at all."""
        # If all values in a spreadsheet row are empty, the row is skipped silently
        blank_row = dict.fromkeys(self.spreadsheet_data, "")

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as slurp,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            form_cls.return_value.is_valid.return_value = True
            form_cls.return_value.cleaned_data = {}
            slurp.return_value = [blank_row]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        reported = [str(message) for message in get_messages(response.wsgi_request)]
        self.assertEqual(len(reported), 0)

    def test_empty_campaign_slug(self):
        # A blank "Campaign Slug" cell must not block the import; the slug is
        # then expected to be derived from the campaign title.
        row = copy.copy(self.spreadsheet_data)
        row["Campaign Slug"] = ""

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as read_rows,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            # Short-circuit form validation and spreadsheet parsing so the view
            # processes exactly the row prepared above.
            bound_form = form_cls.return_value
            bound_form.is_valid.return_value = True
            bound_form.cleaned_data = {}
            read_rows.return_value = [row]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        emitted = [str(entry) for entry in get_messages(response.wsgi_request)]
        queued_notice = (
            f"Queued {self.campaign_title} {self.project_title} "
            f"import for {self.url}"
        )
        self.assertEqual(
            emitted,
            [
                f"Created new campaign {self.campaign_title}",
                f"Created new project {self.project_title}",
                queued_notice,
            ],
        )

        # With no slug supplied, the stored slug should be the slugified title.
        # ``get()`` also verifies that exactly one campaign was created.
        expected_slug = slugify(self.campaign_title, allow_unicode=True)
        self.assertEqual(Campaign.objects.get().slug, expected_slug)

    def test_bad_campaign_slug(self):
        # A campaign slug containing characters outside the slug pattern is
        # reported twice: once by the pattern check and once as the model
        # validation error that prevents the campaign from being created.
        row = copy.copy(self.spreadsheet_data)
        row["Campaign Slug"] = "bad#slug@"

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as read_rows,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            # Short-circuit form validation and spreadsheet parsing so the view
            # processes exactly the row prepared above.
            bound_form = form_cls.return_value
            bound_form.is_valid.return_value = True
            bound_form.cleaned_data = {}
            read_rows.return_value = [row]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        emitted = [str(entry) for entry in get_messages(response.wsgi_request)]
        creation_failure = (
            "Unable to create campaign Test Campaign: {'slug': "
            "['Enter a valid “slug” consisting of Unicode letters, "
            "numbers, underscores, or hyphens.']}"
        )
        self.assertEqual(
            emitted,
            ["Campaign slug doesn't match pattern.", creation_failure],
        )

    def test_empty_project_slug(self):
        # A blank "Project Slug" cell must not block the import; the slug is
        # then expected to be derived from the project title.
        row = copy.copy(self.spreadsheet_data)
        row["Project Slug"] = ""

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as read_rows,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            # Short-circuit form validation and spreadsheet parsing so the view
            # processes exactly the row prepared above.
            bound_form = form_cls.return_value
            bound_form.is_valid.return_value = True
            bound_form.cleaned_data = {}
            read_rows.return_value = [row]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        emitted = [str(entry) for entry in get_messages(response.wsgi_request)]
        queued_notice = (
            f"Queued {self.campaign_title} {self.project_title} "
            f"import for {self.url}"
        )
        self.assertEqual(
            emitted,
            [
                f"Created new campaign {self.campaign_title}",
                f"Created new project {self.project_title}",
                queued_notice,
            ],
        )

        # With no slug supplied, the stored slug should be the slugified title.
        # ``get()`` also verifies that exactly one project was created.
        expected_slug = slugify(self.project_title, allow_unicode=True)
        self.assertEqual(Project.objects.get().slug, expected_slug)

    def test_bad_project_slug(self):
        # The campaign is still created, but a project slug containing
        # characters outside the slug pattern is reported by the pattern check
        # and again as the validation error that blocks project creation.
        row = copy.copy(self.spreadsheet_data)
        row["Project Slug"] = "bad#slug@"

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as read_rows,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            # Short-circuit form validation and spreadsheet parsing so the view
            # processes exactly the row prepared above.
            bound_form = form_cls.return_value
            bound_form.is_valid.return_value = True
            bound_form.cleaned_data = {}
            read_rows.return_value = [row]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        emitted = [str(entry) for entry in get_messages(response.wsgi_request)]
        creation_failure = (
            "Unable to create project Test Project: {'slug': "
            "['Enter a valid “slug” consisting of Unicode letters, "
            "numbers, underscores, or hyphens.']}"
        )
        self.assertEqual(
            emitted,
            [
                f"Created new campaign {self.campaign_title}",
                "Project slug doesn't match pattern.",
                creation_failure,
            ],
        )

    def test_bad_url(self):
        # An "Import URLs" value the view does not recognize (here an ftp URL)
        # is skipped with a message, after the campaign and project are created.
        unsupported_url = "ftp://example.com"
        row = copy.copy(self.spreadsheet_data)
        row["Import URLs"] = unsupported_url

        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as read_rows,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ),
        ):
            # Short-circuit form validation and spreadsheet parsing so the view
            # processes exactly the row prepared above.
            bound_form = form_cls.return_value
            bound_form.is_valid.return_value = True
            bound_form.cleaned_data = {}
            read_rows.return_value = [row]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        emitted = [str(entry) for entry in get_messages(response.wsgi_request)]
        self.assertEqual(
            emitted,
            [
                f"Created new campaign {self.campaign_title}",
                f"Created new project {self.project_title}",
                f"Skipping unrecognized URL value: {unsupported_url}",
            ],
        )

    def test_import_task_exception(self):
        # When the import function itself raises, the view must still respond
        # normally and report the failure as a message for the affected URL.
        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_cls,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as read_rows,
            mock.patch(
                "concordia.admin.views.import_items_into_project_from_url",
                autospec=True,
            ) as importer,
        ):
            # Short-circuit form validation and spreadsheet parsing, and make
            # the import call fail.
            bound_form = form_cls.return_value
            bound_form.is_valid.return_value = True
            bound_form.cleaned_data = {}
            read_rows.return_value = [self.spreadsheet_data]
            importer.side_effect = Exception("Test Exception")

            response = self.client.post(self.path, data=self.post_data)

            self.assertEqual(response.status_code, 200)
            emitted = [str(entry) for entry in get_messages(response.wsgi_request)]
            self.assertEqual(
                emitted,
                [
                    f"Created new campaign {self.campaign_title}",
                    f"Created new project {self.project_title}",
                    f"Unhandled error attempting to import {self.url}: "
                    "Test Exception",
                ],
            )


class TestAdminBulkChangeAssetStatus(CreateTestUsers, TestCase):
    # Exercises the admin "bulk-change" view with a mocked spreadsheet reader.

    def setUp(self):
        parent_item = create_item()
        # Four assets under one item; the first keeps the factory's default slug.
        self.assets = [create_asset(item=parent_item)]
        for suffix in (2, 3, 4):
            self.assets.append(
                create_asset(item=parent_item, slug=f"test-asset-{suffix}")
            )
        first, second, third, fourth = self.assets

        # Seed each asset with an existing transcription in a known state
        self.accepted_transcription = create_transcription(
            asset=first, accepted=now()
        )
        self.rejected_transcription = create_transcription(
            asset=second, rejected=now()
        )
        self.submitted_transcription = create_transcription(asset=third)
        self.accepted_transcription2 = create_transcription(
            asset=fourth, accepted=now()
        )

        # One spreadsheet row per asset, in asset order, all attributed to the
        # anonymous user.
        anonymous_id = get_anonymous_user().id
        requested_statuses = ("submitted", "completed", "completed", "in_progress")
        self.spreadsheet_data = [
            {
                "asset__slug": asset.slug,
                "New Status": requested,
                "user": anonymous_id,
            }
            for asset, requested in zip(self.assets, requested_statuses)
        ]

    def test_admin_bulk_change_asset_status(self):
        self.login_user(is_staff=True, is_superuser=True)

        upload = SimpleUploadedFile(
            "test.xlsx", b"x", content_type="application/vnd.ms-excel"
        )
        # Expected status of each asset after the view has run, in asset order.
        expected_statuses = (
            TranscriptionStatus.SUBMITTED,
            TranscriptionStatus.COMPLETED,
            TranscriptionStatus.COMPLETED,
            TranscriptionStatus.IN_PROGRESS,
        )

        with mock.patch(
            "concordia.admin.views.slurp_excel", autospec=True
        ) as read_rows:
            # The uploaded bytes are never parsed; the view sees these rows.
            read_rows.return_value = self.spreadsheet_data

            response = self.client.post(
                reverse("admin:bulk-change"), data={"spreadsheet_file": upload}
            )
            for asset in self.assets:
                asset.refresh_from_db()

            self.assertEqual(response.status_code, 200)
            read_rows.assert_called()
            for asset, expected in zip(self.assets, expected_statuses):
                self.assertEqual(asset.transcription_status, expected)


class TestAdminBulkImportReview(CreateTestUsers, TestCase):
    # Tests for the admin "bulk-review" view. The upload form, the spreadsheet
    # reader and fetch_all_urls are mocked, so each test only checks which
    # messages the view emits for a given spreadsheet row.

    # Messages that close every mocked run that makes a single fetch call: the
    # message returned by the mocked fetch_all_urls, followed by the asset total
    # and the completion notice.
    SUMMARY_MESSAGES = (
        "Fetch test message",
        "Total Asset Count:1",
        "All Processes Completed",
    )

    def setUp(self):
        self.login_user(is_staff=True, is_superuser=True)
        self.path = reverse("admin:bulk-review")
        self.campaign_title = "Test Campaign"
        self.campaign_short_description = "Short description"
        self.campaign_long_description = "Long description"
        self.campaign_slug = "test-campaign"
        self.project_slug = "test-project"
        self.project_title = "Test Project"
        self.project_description = "Project description"
        self.url = "http://example.com"
        self.spreadsheet_data = {
            "Campaign": self.campaign_title,
            "Campaign Short Description": self.campaign_short_description,
            "Campaign Long Description": self.campaign_long_description,
            "Campaign Slug": self.campaign_slug,
            "Project Slug": self.project_slug,
            "Project": self.project_title,
            "Project Description": self.project_description,
            "Import URLs": self.url,
        }
        self.post_data = {"spreadsheet_file": BytesIO()}

    def _post_row(self, row):
        # POST to the view with form validation, spreadsheet parsing and URL
        # fetching mocked out, so that the view processes exactly ``row``.
        # Asserts a 200 response and returns the emitted messages as strings.
        with (
            mock.patch(
                "concordia.admin.views.AdminProjectBulkImportForm", autospec=True
            ) as form_mock,
            mock.patch(
                "concordia.admin.views.slurp_excel", autospec=True
            ) as slurp_mock,
            mock.patch(
                "concordia.admin.views.fetch_all_urls",
                autospec=True,
            ) as fetch_mock,
        ):
            form_mock.return_value.is_valid.return_value = True
            form_mock.return_value.cleaned_data = {}
            slurp_mock.return_value = [row]
            # Every fetch call reports one message and an asset count of 1
            fetch_mock.return_value = [["Fetch test message"], 1]

            response = self.client.post(self.path, data=self.post_data)

        self.assertEqual(response.status_code, 200)
        return [str(message) for message in get_messages(response.wsgi_request)]

    def test_get(self):
        response = self.client.get(self.path)
        self.assertEqual(response.status_code, 200)
        self.assertIn("form", response.context)

    def test_invalid_form(self):
        # Posting without a file re-renders the page with the form
        response = self.client.post(self.path)
        self.assertEqual(response.status_code, 200)
        self.assertIn("form", response.context)

    def test_fully_valid_form(self):
        messages = self._post_row(self.spreadsheet_data)
        self.assertEqual(messages, [*self.SUMMARY_MESSAGES])

    def test_missing_field(self):
        # A row lacking one of the expected columns is skipped with a message
        row = {
            key: value
            for key, value in self.spreadsheet_data.items()
            if key != "Campaign"
        }

        messages = self._post_row(row)
        self.assertEqual(
            messages,
            ["Skipping row 0: missing fields ['Campaign']", *self.SUMMARY_MESSAGES],
        )

    def test_empty_field(self):
        # Only three fields require values: Campaign, Project and Import URLs.
        # Other fields must be present but can be empty.
        # This tests that blank value check
        row = {**self.spreadsheet_data, "Campaign": ""}

        messages = self._post_row(row)
        self.assertEqual(
            messages,
            [
                "Skipping row 0: at least one required field "
                "(Campaign, Project, Import URLs) is empty",
                *self.SUMMARY_MESSAGES,
            ],
        )

    def test_all_empty_fields(self):
        # If all values in a spreadsheet row are empty, the row is skipped silently
        row = dict.fromkeys(self.spreadsheet_data, "")

        messages = self._post_row(row)
        self.assertEqual(messages, [*self.SUMMARY_MESSAGES])

    def test_empty_campaign_slug(self):
        # A blank campaign slug is accepted without any extra message
        row = {**self.spreadsheet_data, "Campaign Slug": ""}

        messages = self._post_row(row)
        self.assertEqual(messages, [*self.SUMMARY_MESSAGES])

    def test_bad_campaign_slug(self):
        row = {**self.spreadsheet_data, "Campaign Slug": "bad#slug@"}

        messages = self._post_row(row)
        self.assertEqual(
            messages,
            ["Campaign slug doesn't match pattern.", *self.SUMMARY_MESSAGES],
        )

    def test_empty_project_slug(self):
        # A blank project slug is accepted without any extra message
        row = {**self.spreadsheet_data, "Project Slug": ""}

        messages = self._post_row(row)
        self.assertEqual(messages, [*self.SUMMARY_MESSAGES])

    def test_bad_project_slug(self):
        row = {**self.spreadsheet_data, "Project Slug": "bad#slug@"}

        messages = self._post_row(row)
        self.assertEqual(
            messages,
            ["Project slug doesn't match pattern.", *self.SUMMARY_MESSAGES],
        )

    def test_bad_url(self):
        bad_url = "ftp://example.com"
        row = {**self.spreadsheet_data, "Import URLs": bad_url}

        messages = self._post_row(row)
        self.assertEqual(
            messages,
            [f"Skipping unrecognized URL value: {bad_url}", *self.SUMMARY_MESSAGES],
        )

    def test_large_number_urls(self):
        row = {
            **self.spreadsheet_data,
            "Import URLs": " ".join([self.url for i in range(51)]),
        }

        messages = self._post_row(row)
        # The fetch message appears twice and the total is 2 even though 51 URLs
        # were supplied. This count is weird because we mock the fetch_all_urls
        # function: each mocked call reports a count of 1, so the view
        # presumably split the URLs into two fetch calls.
        self.assertEqual(
            messages,
            [
                "Fetch test message",
                "Fetch test message",
                "Total Asset Count:2",
                "All Processes Completed",
            ],
        )


class TestCeleryTaskReview(CreateTestUsers, TestCase):
    # Tests for the admin "celery-review" dashboard, both the campaign listing
    # (no ``id`` query parameter) and the per-campaign import summary.

    def setUp(self):
        # We don't set up our data here because we want to test
        # both with and without data
        self.login_user(is_staff=True, is_superuser=True)
        self.path = reverse("admin:celery-review")

    def add_campaigns(self):
        self.add_active_campaigns()
        self.add_completed_campaigns()
        self.add_retired_campaigns()

    def add_active_campaigns(self):
        self.campaign1 = create_campaign(
            slug="test-active-campaign-1", title="Test Active Campaign 1"
        )
        self.campaign2 = create_campaign(
            slug="test-active-campaign-2", title="Test Active Campaign 2"
        )

    def add_completed_campaigns(self):
        self.completed_campaign1 = create_campaign(
            slug="test-completed-campaign-1",
            title="Test Completed Campaign 1",
            status=Campaign.Status.COMPLETED,
        )
        self.completed_campaign2 = create_campaign(
            slug="test-completed-campaign-2",
            title="Test Completed Campaign 2",
            status=Campaign.Status.COMPLETED,
        )

    def add_retired_campaigns(self):
        self.retired_campaign1 = create_campaign(
            slug="test-retired-campaign-1",
            title="Test Retired Campaign 1",
            status=Campaign.Status.RETIRED,
        )
        self.retired_campaign2 = create_campaign(
            slug="test-retired-campaign-2",
            title="Test Retired Campaign 2",
            status=Campaign.Status.RETIRED,
        )

    def add_projects(self):
        # Requires add_active_campaigns() and add_completed_campaigns() to have
        # been called first.

        # Active campaign 1, three projects
        create_project(
            campaign=self.campaign1,
            slug="campaign1-project-1",
            title="Campaign 1 Project 1",
        )
        create_project(
            campaign=self.campaign1,
            slug="campaign1-project-2",
            title="Campaign 1 Project 2",
        )
        create_project(
            campaign=self.campaign1,
            slug="campaign1-project-3",
            title="Campaign 1 Project 3",
        )

        # Active campaign 2, two projects
        create_project(
            campaign=self.campaign2,
            slug="campaign2-project-1",
            title="Campaign 2 Project 1",
        )
        create_project(
            campaign=self.campaign2,
            slug="campaign2-project-2",
            title="Campaign 2 Project 2",
        )

        # Completed campaign 1, two projects
        create_project(
            campaign=self.completed_campaign1,
            slug="completed-campaign1-project-1",
            title="Completed Campaign 1 Project 1",
        )
        create_project(
            campaign=self.completed_campaign1,
            slug="completed-campaign1-project-2",
            title="Completed Campaign 1 Project 2",
        )

        # Completed campaign 2, one project
        create_project(
            campaign=self.completed_campaign2,
            slug="completed-campaign2-project-1",
            title="Completed Campaign 2 Project 1",
        )

        # We don't create any for retired campaigns since the campaigns
        # are only created to make sure the view ignores them

    def add_tasks(self, campaign):
        # For every project in ``campaign``, create four import assets that
        # share one import item and job: one with no timestamps, one started,
        # one failed and one completed. Returns the per-project summary the
        # test expects the view to report (one asset in each state).
        data = []
        for project in campaign.project_set.all():
            # The first asset supplies the import item and job reused below
            import_asset = create_import_asset(1, project=project)
            item = import_asset.import_item
            import_job = item.job
            create_import_asset(
                2,
                import_item=item,
                import_job=import_job,
                project=project,
                last_started=timezone.now(),
            )
            create_import_asset(
                3,
                import_item=item,
                import_job=import_job,
                project=project,
                failed=timezone.now(),
                last_started=timezone.now(),
            )
            create_import_asset(
                4,
                import_item=item,
                import_job=import_job,
                project=project,
                completed=timezone.now(),
                last_started=timezone.now(),
            )
            data.append(
                {
                    "title": project.title,
                    "id": project.id,
                    "campaign_id": str(campaign.id),
                    "successful": 1,
                    "incomplete": 1,
                    "unstarted": 1,
                    "failure": 1,
                }
            )
        return data

    def _get_dashboard_campaigns(self):
        # GET the dashboard without a campaign id, check the response and
        # return the campaigns from its context as a list.
        response = self.client.get(self.path)
        self.assertEqual(response.status_code, 200)
        self.assertIn("campaigns", response.context)
        return list(response.context["campaigns"])

    def test_empty_dashboard(self):
        self.assertEqual(self._get_dashboard_campaigns(), [])

    def test_dashboard(self):
        # Campaigns are added in stages so each status is checked on its own
        self.add_active_campaigns()
        campaigns = self._get_dashboard_campaigns()
        self.assertIn(self.campaign1, campaigns)
        self.assertIn(self.campaign2, campaigns)

        self.add_completed_campaigns()
        campaigns = self._get_dashboard_campaigns()
        self.assertIn(self.campaign1, campaigns)
        self.assertIn(self.campaign2, campaigns)
        self.assertIn(self.completed_campaign1, campaigns)
        self.assertIn(self.completed_campaign2, campaigns)

        # Retired campaigns must not be listed
        self.add_retired_campaigns()
        campaigns = self._get_dashboard_campaigns()
        self.assertIn(self.campaign1, campaigns)
        self.assertIn(self.campaign2, campaigns)
        self.assertIn(self.completed_campaign1, campaigns)
        self.assertIn(self.completed_campaign2, campaigns)
        self.assertNotIn(self.retired_campaign1, campaigns)
        self.assertNotIn(self.retired_campaign2, campaigns)

    def test_campaign_dashboard(self):
        self.add_campaigns()
        self.add_projects()

        # Each project gets four import assets from add_tasks(), so the
        # expected total is four times the campaign's project count.
        expectations = (
            (self.campaign1, 12),
            (self.campaign2, 8),
            (self.completed_campaign1, 8),
            (self.completed_campaign2, 4),
        )
        for campaign, expected_total in expectations:
            expected_projects = self.add_tasks(campaign)
            response = self.client.get(self.path, {"id": campaign.id})
            context = response.context
            self.assertIn("campaigns", context)
            self.assertEqual(context["campaigns"], [])
            self.assertIn("totalassets", context)
            self.assertEqual(
                context["totalassets"], expected_total, msg=campaign.slug
            )
            self.assertIn("projects", context)
            self.assertEqual(context["projects"], expected_projects)


class TestSerializedObjectView(TestCase):
    """Tests for ``SerializedObjectView``, invoked directly via a request factory."""

    def setUp(self):
        self.card = create_card()
        # Every test needs access to the request factory.
        self.factory = RequestFactory()

    def test_exists(self):
        """Requesting a field of an existing object returns it with a 200."""
        request = self.factory.get(
            "/admin/card/",
            {"model_name": "Card", "object_id": self.card.id, "field_name": "title"},
        )
        response = SerializedObjectView.as_view()(request)
        self.assertEqual(response.status_code, HTTPStatus.OK)
        self.assertEqual(json.loads(response.content)["title"], self.card.title)

    def test_dne(self):
        """Requesting an object id that does not exist returns a 404 JSON body."""
        # Derive the missing id from the card created in setUp instead of
        # hard-coding one: primary key sequences are not necessarily reset
        # between tests, so a fixed id could happen to be self.card's id.
        # NOTE(review): assumes no other Card rows exist with a higher id.
        missing_id = self.card.id + 1
        request = self.factory.get(
            "/admin/card/",
            {"model_name": "Card", "object_id": missing_id, "field_name": "title"},
        )
        response = SerializedObjectView.as_view()(request)
        self.assertEqual(response.status_code, HTTPStatus.NOT_FOUND)
        self.assertJSONEqual(response.content, {"status": "false"})


def mock_cache(object_to_patch):
    def decorator(cls):
        # Decorator to mock `django.core.cache.caches`.
        # Passes the mock cache and caches_mock to each
        # test method as additional arguments.
        # We have to write this as a custom decorator
        # in order to not have to create these mocks in
        # each invidivual test method, since we need to override
        # __getitem__ on the caches mock

        # We need to create a helper function so each method
        # gets a unique wrapper and mocks
        def create_wrapper(attr):
            @wraps(attr)
            def wrapper(self, *args, **kwargs):
                with mock.patch(object_to_patch) as caches_mock:
                    cache_mock = mock.MagicMock()
                    caches_mock.__getitem__.return_value = cache_mock
                    return attr(self, caches_mock, cache_mock, *args, **kwargs)

            return wrapper

        # Wrap each test method to include the mocks as arguments
        for attr_name in dir(cls):
            attr = getattr(cls, attr_name)
            if callable(attr) and attr_name.startswith("test_"):
                setattr(cls, attr_name, create_wrapper(attr))

        return cls

    return decorator


@mock_cache("concordia.admin.views.caches")
class TestClearCacheView(CreateTestUsers, TestCase):
    """Tests for the admin clear-cache view.

    The class decorator hands ``caches_mock`` and ``cache_mock`` to every
    ``test_*`` method as extra arguments.
    """

    def setUp(self):
        self.login_user(is_staff=True, is_superuser=True)
        self.path = reverse("admin:clear-cache")

    def _assert_form_without_clear(self, response, caches_mock, cache_mock):
        """Require a 200 response showing the form, with no cache touched."""
        self.assertEqual(response.status_code, HTTPStatus.OK)
        self.assertIn("form", response.context)
        caches_mock.__getitem__.assert_not_called()
        cache_mock.clear.assert_not_called()

    def test_get(self, caches_mock, cache_mock):
        self._assert_form_without_clear(
            self.client.get(self.path), caches_mock, cache_mock
        )

    def test_invalid_form(self, caches_mock, cache_mock):
        self._assert_form_without_clear(
            self.client.post(self.path), caches_mock, cache_mock
        )

    def test_valid_form(self, caches_mock, cache_mock):
        response = self.client.post(self.path, {"cache_name": "view_cache"})
        self.assertEqual(response.status_code, HTTPStatus.FOUND)
        first_message = str(list(get_messages(response.wsgi_request))[0])
        self.assertEqual(first_message, "Successfully cleared 'view_cache' cache")
        caches_mock.__getitem__.assert_called()
        cache_mock.clear.assert_called()

    def test_form_with_invalid_data(self, caches_mock, cache_mock):
        self._assert_form_without_clear(
            self.client.post(self.path, {"cache_name": "default"}),
            caches_mock,
            cache_mock,
        )

    def test_exception(self, caches_mock, cache_mock):
        # Make the cache lookup itself fail
        caches_mock.__getitem__.side_effect = Exception("Test Exception")
        response = self.client.post(self.path, {"cache_name": "view_cache"})
        first_message = str(list(get_messages(response.wsgi_request))[0])
        self.assertEqual(
            first_message,
            "Couldn't clear cache 'view_cache', something went wrong. "
            "Received error: Test Exception",
        )


================================================
FILE: concordia/tests/test_api_views.py
================================================
from datetime import date
from unittest import mock
from urllib.parse import urlparse

from django.test import TestCase, override_settings
from django.urls import reverse
from django.utils.timezone import now

from concordia import api_views
from concordia.models import (
    Asset,
    Campaign,
    Item,
    Project,
    Topic,
    Transcription,
    User,
)
from concordia.utils import get_anonymous_user

from .utils import (
    JSONAssertMixin,
    create_asset,
    create_item,
    create_project,
    create_topic,
)


class URLAwareEncoderTest(TestCase):
    """Tests for ``api_views.URLAwareEncoder.default``."""

    def test_default(self):
        encoder = api_views.URLAwareEncoder()
        self.assertIsNone(encoder.default(None))

        # An object that only exposes ``url`` is encoded as that attribute
        obj = mock.Mock(spec=["url"])
        self.assertEqual(encoder.default(obj), obj.url)

        # An object that only exposes ``get_absolute_url`` is encoded as the
        # result of calling it
        obj = mock.Mock(spec=["get_absolute_url"])
        self.assertEqual(encoder.default(obj), obj.get_absolute_url())

        # Test non-model object. The expectation is derived from the same
        # date instance: calling date.today() a second time could yield a
        # different day if the test runs across midnight.
        obj = date.today()
        self.assertEqual(encoder.default(obj), obj.isoformat())


class APIViewMixinTest(TestCase):
    """Tests for the serialization helpers of ``api_views.APIViewMixin``."""

    def setUp(self):
        self.mixin = api_views.APIViewMixin()

    def test_serialize_conctext(self):
        original = {"test-key": "test-value"}
        serialized = self.mixin.serialize_context(original)
        self.assertEqual(serialized, original)

    @mock.patch("concordia.api_views.model_to_dict")
    def test_serialize_object(self, mtd_mock):
        model_data = {"test-key": "test-value"}
        mtd_mock.return_value = model_data

        # With get_absolute_url available, a "url" entry is added
        with_url = mock.Mock(spec=["get_absolute_url"])
        self.assertEqual(
            self.mixin.serialize_object(with_url),
            {**model_data, "url": with_url.get_absolute_url()},
        )

        # Without it, only the model_to_dict data is expected
        without_url = mock.Mock(spec=[])
        self.assertEqual(self.mixin.serialize_object(without_url), model_data)


@mock.patch("concordia.api_views.time")
class APIListViewTest(TestCase):
    """Tests for ``api_views.APIListView`` with ``api_views.time`` patched."""

    def test_serialize_context(self, time_mock):
        time_mock.return_value = "test-time"

        serialized = api_views.APIListView().serialize_context({"object_list": []})

        self.assertEqual(serialized, {"objects": [], "sent": "test-time"})


@override_settings(RATELIMIT_ENABLE=False)
class ConcordiaViewTests(JSONAssertMixin, TestCase):
    @classmethod
    def setUpTestData(cls):
        """Build the fixtures shared by every test in this class.

        Creates a reviewer user, one project with a topic, three items,
        sixteen assets per item (one with an IIIF download URL followed by
        fifteen plain ones) and three transcriptions per asset. The very last
        transcription is then marked as submitted.
        """
        cls.anon_user = get_anonymous_user()
        cls.reviewer = User.objects.create_user(
            username="reviewer", email="tester@example.com"
        )

        # clear data from other tests
        for model in (Project, Topic):
            model.objects.all().delete()

        cls.test_project = create_project()
        cls.test_topic = create_topic(project=cls.test_project)

        cls.items = []
        for index in range(3):
            cls.items.append(
                create_item(
                    item_id=f"item_{index}",
                    title=f"Item {index}",
                    project=cls.test_project,
                    do_save=False,
                )
            )
        Item.objects.bulk_create(cls.items)

        iiif_download_url = (
            "http://tile.loc.gov/image-services/iiif/"
            "service:music:mussuffrage:mussuffrage-100183:mussuffrage-100183.0001/"
            "full/pct:100/0/default.jpg"
        )
        cls.assets = []
        for item in cls.items:
            cls.assets.append(
                create_asset(
                    title=f"Thumbnail URL test for {item.id}",
                    item=item,
                    download_url=iiif_download_url,
                    do_save=False,
                )
            )
            cls.assets.extend(
                create_asset(title=f"{item.id} — {n}", item=item, do_save=False)
                for n in range(15)
            )
        Asset.objects.bulk_create(cls.assets)

        # Every transcription is created with supersedes=None: no chain of
        # superseding transcriptions is built here.
        cls.transcriptions = [
            Transcription(
                asset=asset,
                supersedes=None,
                text=f"{asset} — {n}",
                user=cls.anon_user,
            )
            for asset in cls.assets
            for n in range(3)
        ]
        Transcription.objects.bulk_create(cls.transcriptions)

        # Mark the last transcription as submitted
        submitted_t = cls.transcriptions[-1]
        submitted_t.submitted = now()
        submitted_t.full_clean()
        submitted_t.save()

    def get_api_response(self, url, **request_args):
        """
        Call one of our API views and confirm that the response follows our
        basic convention of returning a valid JSON response.

        Extra keyword arguments are sent as query-string parameters and take
        precedence over the default ``format=json``. Returns the response and
        the value produced by ``assertValidJSON`` for it.
        """
        query = {"format": "json", **request_args}
        response = self.client.get(url, query)
        return response, self.assertValidJSON(response)

    def get_api_list_response(self, url, page_size=10, **request_args):
        """
        Call one of our API list views and confirm that the response follows
        our basic conventions of returning a top level object with members
        “objects” (list) and “pagination” (object).

        ``page_size`` is sent as ``per_page`` and is also the maximum number of
        objects accepted in the response. Returns the response and its data.
        """
        query = {"per_page": page_size, **request_args}
        response, payload = self.get_api_response(url, **query)

        top_level_members = ("objects", "pagination")
        for member in top_level_members:
            self.assertIn(member, payload)

        self.assertLessEqual(len(payload["objects"]), page_size)

        for member in top_level_members:
            self.assertAbsoluteURLs(payload[member])

        return response, payload

    def assertAbsoluteUrl(self, url, allow_none=True):
        """Require a URL to be absolute; None is accepted when allow_none is set"""
        if allow_none and url is None:
            return

        scheme, netloc = urlparse(url)[:2]
        self.assertIn(
            scheme, ["http", "https"], msg=f"Expected {url} to have HTTP scheme"
        )
        self.assertTrue(netloc)

    def assertAbsoluteURLs(self, data):
        """Recursively check the URLs found in a dictionary or list.

        Dictionary values stored under a key ending in "url" are passed to
        ``assertAbsoluteUrl``; other dictionary values are descended into only
        when they are dictionaries or lists. Every list element is descended
        into. Raises ``TypeError`` for any other kind of ``data``.
        """
        if isinstance(data, list):
            for element in data:
                self.assertAbsoluteURLs(element)
            return

        if not isinstance(data, dict):
            raise TypeError(
                "assertAbsoluteURLs must be called with a dictionary or list"
            )

        for key, value in data.items():
            if key.endswith("url"):
                self.assertAbsoluteUrl(value)
            elif isinstance(value, (dict, list)):
                self.assertAbsoluteURLs(value)

    def assertAssetStatuses(self, asset_list, expected_statuses):
        """Require every asset in ``asset_list`` to have an expected status.

        ``asset_list`` holds serialized assets (dictionaries with an ``id``);
        the check passes when none of those assets has a
        ``transcription_status`` outside ``expected_statuses``.
        """
        listed_pks = [entry["id"] for entry in asset_list]
        unexpected = Asset.objects.filter(pk__in=listed_pks).exclude(
            transcription_status__in=expected_statuses
        )
        self.assertQuerySetEqual(unexpected, [])

    def assertAssetsHaveLatestTranscriptions(self, asset_list):
        """Require each serialized asset to carry its newest transcription.

        ``asset_list`` holds serialized assets (dictionaries with ``id`` and
        ``latest_transcription``). For every matching asset in the database,
        ``latest_transcription`` must be None when the asset has no
        transcriptions, or otherwise a dictionary with the id, text and user
        id of the transcription with the highest primary key.
        """
        asset_pks = {i["id"]: i for i in asset_list}

        for asset in Asset.objects.filter(pk__in=asset_pks.keys()):
            # first() returns None for an asset without transcriptions;
            # latest("pk") would raise DoesNotExist instead, which made the
            # None branch below unreachable.
            latest_trans = asset.transcription_set.order_by("-pk").first()

            if latest_trans is None:
                self.assertIsNone(asset_pks[asset.id]["latest_transcription"])
            else:
                self.assertDictEqual(
                    asset_pks[asset.id]["latest_transcription"],
                    {
                        "id": latest_trans.pk,
                        "text": latest_trans.text,
                        "submitted_by": latest_trans.user_id,
                    },
                )

    def test_topic_detail(self):
        """The topic detail API returns the topic as a single ``object``."""
        topic = self.test_topic
        detail_url = reverse("topic-detail", kwargs={"slug": topic.slug})
        _, data = self.get_api_response(detail_url)

        self.assertIn("object", data)
        self.assertNotIn("objects", data)

        serialized_topic = data["object"]
        for key in ("id", "url"):
            self.assertIn(key, serialized_topic)

        expected_fields = {
            "id": topic.id,
            "title": topic.title,
            "description": topic.description,
            "slug": topic.slug,
            "thumbnail_image": topic.thumbnail_image,
        }
        # Merging in the expected fields must leave the data unchanged, i.e.
        # each expected key is already present with the expected value.
        self.assertEqual(serialized_topic, {**serialized_topic, **expected_fields})
        self.assertURLEqual(
            serialized_topic["url"], f"http://testserver{topic.get_absolute_url()}"
        )

    def test_campaign_list(self):
        """Each listed campaign matches the published campaign of the same id."""
        _, data = self.get_api_list_response(reverse("transcriptions:campaign-list"))

        self.assertGreater(len(data["objects"]), 0)

        published_rows = Campaign.objects.published().values(
            "id", "title", "description", "short_description", "slug"
        )
        campaigns_by_id = {row["id"]: row for row in published_rows}

        for serialized in data["objects"]:
            for key in ("id", "url"):
                self.assertIn(key, serialized)
            expected_fields = campaigns_by_id[serialized["id"]]
            # Merging in the expected fields must leave the data unchanged
            self.assertEqual(serialized, {**serialized, **expected_fields})

    def test_campaign_detail(self):
        """The campaign detail API returns the campaign as a single ``object``."""
        campaign = self.test_project.campaign
        detail_url = reverse(
            "transcriptions:campaign-detail", kwargs={"slug": campaign.slug}
        )
        _, data = self.get_api_response(detail_url)

        self.assertIn("object", data)
        self.assertNotIn("objects", data)

        serialized_campaign = data["object"]
        for key in ("id", "url"):
            self.assertIn(key, serialized_campaign)

        expected_fields = {
            "id": campaign.id,
            "title": campaign.title,
            "description": campaign.description,
            "slug": campaign.slug,
            "metadata": campaign.metadata,
            "thumbnail_image": campaign.thumbnail_image,
        }
        # Merging in the expected fields must leave the data unchanged, i.e.
        # each expected key is already present with the expected value.
        self.assertEqual(
            serialized_campaign, {**serialized_campaign, **expected_fields}
        )
        self.assertURLEqual(
            serialized_campaign["url"],
            f"http://testserver{campaign.get_absolute_url()}",
        )

    def test_project_detail(self):
        """The project API returns the project plus a list of child objects."""
        project = self.test_project
        project_path = project.get_absolute_url()

        _, data = self.get_api_list_response(project_path)

        # Until we clean up the project view code, projects have two key
        # elements: objects lists the children (i.e. items) and the project
        # itself is in a second top-level “project” object:
        for key in ("objects", "project"):
            self.assertIn(key, data)
        self.assertNotIn("object", data)

        serialized_project = data["project"]
        for key in ("id", "url"):
            self.assertIn(key, serialized_project)

        self.assertURLEqual(
            serialized_project["url"], f"http://testserver{project_path}"
        )

        expected_fields = {
            "description": project.description,
            "id": project.id,
            "metadata": project.metadata,
            "slug": project.slug,
            "thumbnail_image": project.thumbnail_image,
            "title": project.title,
        }
        # Merging in the expected fields must leave the data unchanged
        self.assertEqual(serialized_project, {**serialized_project, **expected_fields})

        child_keys = (
            "description",
            "item_id",
            "item_url",
            "metadata",
            "thumbnail_url",
            "title",
            "url",
        )
        for child in data["objects"]:
            for key in child_keys:
                self.assertIn(key, child)

    def test_item_detail(self):
        """The item API returns the item plus a list of its child objects."""
        item = self.test_project.item_set.first()
        resp, data = self.get_api_list_response(item.get_absolute_url())

        # Item responses have two key elements: objects lists the children
        # and the item itself is in a second top-level “item” object:
        self.assertIn("objects", data)
        self.assertIn("item", data)
        self.assertNotIn("object", data)

        serialized_item = data["item"]

        self.assertIn("id", serialized_item)
        self.assertIn("url", serialized_item)
        self.assertIn("thumbnail_url", serialized_item)

        self.assertURLEqual(
            serialized_item["url"], f"http://testserver{item.get_absolute_url()}"
        )
        self.assertEqual(
            serialized_item,
            serialized_item
            | {
                "description": item.description,
                "id": item.id,
                "item_id": item.item_id,
                "metadata": item.metadata,
                "title": item.title,
            },
        )

        for obj in data["objects"]:
            self.assertIn("description", obj)
            self.assertIn("difficulty", obj)
            self.assertIn("metadata", obj)
            self.assertIn("image_url", obj)
            self.assertIn("thumbnail_url", obj)
            self.assertIn("resource_url", obj)
            self.assertIn("title", obj)
            self.assertIn("slug", obj)
            self.assertIn("url", obj)
            self.assertIn("year", obj)
            # This prefix must match the title given in setUpTestData to the
            # assets that have a download URL ("Thumbnail URL test for ...");
            # with any other text the check below never runs.
            if "Thumbnail URL test" in obj["title"]:
                self.assertIn("https", obj["thumbnail_url"])


================================================
FILE: concordia/tests/test_authentication.py
================================================
from django.test import RequestFactory, TestCase

from concordia.authentication_backends import EmailOrUsernameModelBackend

from .utils import CreateTestUsers


class AuthenticationBackendTests(TestCase, CreateTestUsers):
    """Tests for ``EmailOrUsernameModelBackend``."""

    def _assert_username_and_email_logins(self, backend, request, account):
        """Check logins for ``account`` by username and by email address.

        For each identifier, authentication must fail without a password and
        succeed with the correct one; afterwards, for each identifier, it
        must fail with an incorrect password.
        """
        identifiers = (account.username, account.email)

        for identifier in identifiers:
            # Fail to authenticate with no password
            self.assertIsNone(backend.authenticate(request, identifier))
            # Authenticate with correct password
            self.assertEqual(
                backend.authenticate(request, identifier, account._password),
                account,
            )

        for identifier in identifiers:
            # Fail to authenticate with incorrect password
            self.assertIsNone(
                backend.authenticate(request, identifier, "bad-password")
            )

    def test_EmailOrUsernameModelBackend(self):
        backend = EmailOrUsernameModelBackend()
        request = RequestFactory().get("/")
        first_user = self.create_user("tester")

        # Fail to authenticate with no information
        self.assertIsNone(backend.authenticate(request))

        self._assert_username_and_email_logins(backend, request, first_user)

        # Same tests, with user with a username
        # the same as the first user's email address
        second_user = self.create_user(first_user.email)
        self._assert_username_and_email_logins(backend, request, second_user)


================================================
FILE: concordia/tests/test_celery.py
================================================
import tempfile
from types import SimpleNamespace
from unittest import mock

from django.test import TestCase

import concordia.celery as celery_mod
from concordia.celery import import_all_submodules


class ConcordiaCeleryTests(TestCase):
    """Tests for ``import_all_submodules`` and the task-module loading hook."""

    def test_returns_early_for_non_package(self):
        plain_module = SimpleNamespace(__name__="not_a_pkg")  # no __path__

        import_patch = mock.patch.object(
            celery_mod.importlib, "import_module", return_value=plain_module
        )
        walk_patch = mock.patch.object(celery_mod.pkgutil, "walk_packages")
        with import_patch as mock_import, walk_patch as mock_walk:
            import_all_submodules("not_a_pkg")

        mock_import.assert_called_once_with("not_a_pkg")
        mock_walk.assert_not_called()

    def test_imports_all_submodules_for_package(self):
        submodules = [SimpleNamespace(name=f"dummy_pkg.sub{n}") for n in (1, 2)]

        with tempfile.TemporaryDirectory() as tmp_dir:
            package = SimpleNamespace(__name__="dummy_pkg", __path__=[tmp_dir])

            def fake_import(name):
                # The package itself, or a bare stand-in for any submodule
                if name == "dummy_pkg":
                    return package
                return SimpleNamespace(__name__=name)

            with (
                mock.patch.object(
                    celery_mod.importlib, "import_module", side_effect=fake_import
                ) as mock_import,
                mock.patch.object(
                    celery_mod.pkgutil, "walk_packages", return_value=submodules
                ) as mock_walk,
            ):
                import_all_submodules("dummy_pkg")

        mock_walk.assert_called_once()
        walk_args, _walk_kwargs = mock_walk.call_args
        self.assertEqual(walk_args[0], package.__path__)
        self.assertEqual(walk_args[1], f"{package.__name__}.")

        for module_name in ("dummy_pkg", "dummy_pkg.sub1", "dummy_pkg.sub2"):
            self.assertIn(mock.call(module_name), mock_import.mock_calls)

    def test_package_with_no_submodules(self):
        with tempfile.TemporaryDirectory() as tmp_dir:
            package = SimpleNamespace(__name__="empty_pkg", __path__=[tmp_dir])

            def fake_import(name):
                if name == "empty_pkg":
                    return package
                return SimpleNamespace(__name__=name)

            with (
                mock.patch.object(
                    celery_mod.importlib, "import_module", side_effect=fake_import
                ) as mock_import,
                mock.patch.object(
                    celery_mod.pkgutil, "walk_packages", return_value=[]
                ) as mock_walk,
            ):
                import_all_submodules("empty_pkg")

        mock_walk.assert_called_once()
        mock_import.assert_called_once_with("empty_pkg")

    def test__load_all_task_modules_invokes_imports(self):
        expected_calls = [mock.call("concordia.tasks"), mock.call("importer.tasks")]

        with mock.patch.object(celery_mod, "import_all_submodules") as mock_import_all:
            celery_mod._load_all_task_modules(sender=celery_mod.app)

        mock_import_all.assert_has_calls(expected_calls, any_order=False)

    def test_on_after_finalize_signal_triggers_handler(self):
        expected_calls = [mock.call("concordia.tasks"), mock.call("importer.tasks")]

        with mock.patch.object(celery_mod, "import_all_submodules") as mock_import_all:
            celery_mod.app.on_after_finalize.send(sender=celery_mod.app)

        mock_import_all.assert_has_calls(expected_calls, any_order=False)
        self.assertEqual(mock_import_all.call_count, 2)


================================================
FILE: concordia/tests/test_consumers.py
================================================
from asgiref.sync import sync_to_async
from channels.testing import WebsocketCommunicator
from django.test import RequestFactory, TransactionTestCase
from django.urls import reverse

from concordia.consumers import AssetConsumer
from concordia.utils import get_or_create_reservation_token
from concordia.views.ajax import obtain_reservation

from .utils import CreateTestUsers, create_asset, create_item, create_transcription


class TestAssetConsumer(CreateTestUsers, TransactionTestCase):
    """
    Normally defining communicator would be in setUp
    and communicator.disconnect would be called in tearDown
    Asynchronous code doesn't seem to work well with those methods
    so each test awaits the connection helper itself and
    disconnects explicitly at its end.
    """

    async def _connect(self):
        """Open a communicator to ``AssetConsumer`` and require it to connect."""
        communicator = WebsocketCommunicator(
            AssetConsumer.as_asgi(), "ws/asset/asset_updates/"
        )
        connected, _subprotocol = await communicator.connect()
        self.assertTrue(connected)
        return communicator

    async def test_asset_update(self):
        communicator = await self._connect()

        # Creating an asset is announced as a not-started asset update
        asset = await sync_to_async(create_asset)()
        message = (await communicator.receive_json_from())["message"]
        self.assertEqual(message["type"], "asset_update")
        self.assertEqual(message["asset_pk"], asset.pk)
        self.assertEqual(message["status"], "not_started")
        self.assertIsNone(message["latest_transcription"])

        # Creating an item sends nothing
        await sync_to_async(create_item)(item_id="item-2", project=asset.item.project)
        self.assertTrue(await communicator.receive_nothing())

        # Creating a transcription is announced as an in-progress asset update
        user = await sync_to_async(self.create_test_user)()
        transcription = await sync_to_async(create_transcription)(
            asset=asset, user=user
        )
        message = (await communicator.receive_json_from())["message"]
        self.assertEqual(message["type"], "asset_update")
        self.assertEqual(message["asset_pk"], asset.pk)
        self.assertEqual(message["status"], "in_progress")
        self.assertEqual(message["latest_transcription"]["id"], transcription.pk)

        await communicator.disconnect()

    async def test_asset_reservation_obtained(self):
        asset = await sync_to_async(create_asset)()
        communicator = await self._connect()

        request = RequestFactory().get("/")
        request.session = {}
        token = get_or_create_reservation_token(request)
        await sync_to_async(obtain_reservation)(asset.pk, token)

        message = (await communicator.receive_json_from())["message"]
        self.assertEqual(message["type"], "asset_reservation_obtained")
        self.assertEqual(message["asset_pk"], asset.pk)

        await communicator.disconnect()

    async def test_asset_reservation_released(self):
        asset = await sync_to_async(create_asset)()
        reserve_url = reverse("reserve-asset", kwargs={"asset_pk": asset.pk})
        await self.async_client.get(reserve_url)

        communicator = await self._connect()

        await self.async_client.post(reserve_url, {"release": "release"})
        message = (await communicator.receive_json_from())["message"]
        self.assertEqual(message["type"], "asset_reservation_released")
        self.assertEqual(message["asset_pk"], asset.pk)
        await communicator.disconnect()


================================================
FILE: concordia/tests/test_contextmanagers.py
================================================
from unittest import TestCase
from unittest.mock import patch

from concordia.contextmanagers import DEFAULT_LOCK_DURATION, cache_lock


class CacheLockTests(TestCase):
    """Tests for ``cache_lock`` with the cache and ``time.monotonic`` mocked."""

    def setUp(self):
        self.lock_id = "test-lock"
        self.oid = "worker-1"
        self.start_time = 100.0

        self.cache_patch = patch("concordia.contextmanagers.cache")
        self.time_patch = patch("concordia.contextmanagers.time.monotonic")

        self.mock_cache = self.cache_patch.start()
        self.addCleanup(self.cache_patch.stop)

        self.mock_monotonic = self.time_patch.start()
        self.addCleanup(self.time_patch.stop)

        # By default the clock does not advance
        self.mock_monotonic.return_value = self.start_time

    def test_acquires_and_releases_lock(self):
        self.mock_cache.add.return_value = True

        with cache_lock(self.lock_id, self.oid) as got_lock:
            self.assertTrue(got_lock)
            self.mock_cache.add.assert_called_once_with(
                self.lock_id, self.oid, DEFAULT_LOCK_DURATION
            )

        self.mock_cache.delete.assert_called_once_with(self.lock_id)

    def test_does_not_release_if_lock_not_acquired(self):
        self.mock_cache.add.return_value = False

        with cache_lock(self.lock_id, self.oid) as got_lock:
            self.assertFalse(got_lock)

        self.mock_cache.delete.assert_not_called()

    def test_does_not_release_if_expired(self):
        self.mock_cache.add.return_value = True

        # Simulate expiration: time has passed beyond timeout
        expired_time = self.start_time + DEFAULT_LOCK_DURATION + 1
        self.mock_monotonic.side_effect = [self.start_time, expired_time]

        with cache_lock(self.lock_id, self.oid) as got_lock:
            self.assertTrue(got_lock)

        self.mock_cache.delete.assert_not_called()


================================================
FILE: concordia/tests/test_decorators.py
================================================
from unittest import TestCase
from unittest.mock import MagicMock, patch

from celery import Task

from concordia.decorators import locked_task


class LockedTaskDecoratorTests(TestCase):
    """Tests for the ``locked_task`` decorator with ``cache_lock`` mocked out.

    ``concordia.decorators.cache_lock`` and ``concordia.decorators.logger``
    are patched in ``setUp``; each test sets the value the mocked lock yields
    on ``__enter__`` to decide whether the lock counts as acquired.
    """

    def setUp(self):
        self.hostname = "test-worker"
        self.logger_patch = patch("concordia.decorators.logger")
        self.logger = self.logger_patch.start()
        self.addCleanup(self.logger_patch.stop)

        self.cache_lock_patch = patch("concordia.decorators.cache_lock")
        self.mock_cache_lock = self.cache_lock_patch.start()
        self.addCleanup(self.cache_lock_patch.stop)

    def make_task_instance(self, name="test-task"):
        """Return a ``MagicMock`` specced on Celery's ``Task``.

        The mock carries the given ``name`` and reports ``self.hostname`` as
        ``request.hostname``.
        """
        task = MagicMock(spec=Task)
        task.name = name
        task.request.hostname = self.hostname
        return task

    def test_lock_by_args_allows_only_one_execution(self):
        task = self.make_task_instance()

        calls = []

        @locked_task
        def dummy(self, arg):
            calls.append(arg)
            return f"Ran with {arg}"

        # Bind the decorated function to the mock task so it acts as ``self``.
        dummy_task = dummy.__get__(task)

        # Lock acquired: the wrapped body runs.
        self.mock_cache_lock.return_value.__enter__.return_value = True
        result = dummy_task("foo")
        self.assertEqual(result, "Ran with foo")
        self.assertEqual(calls, ["foo"])

        # Lock not acquired: the call is skipped and logged at info level.
        self.mock_cache_lock.return_value.__enter__.return_value = False
        result = dummy_task("foo")
        self.assertIsNone(result)
        # The body must not have been executed a second time.
        self.assertEqual(calls, ["foo"])
        self.logger.info.assert_called_once()

    def test_lock_by_task_name(self):
        task = self.make_task_instance()

        calls = []

        @locked_task(lock_by_args=False)
        def dummy(self, arg):
            calls.append(arg)
            return f"Ran with {arg}"

        dummy_task = dummy.__get__(task)

        self.mock_cache_lock.return_value.__enter__.return_value = True
        result = dummy_task("foo")
        self.assertEqual(result, "Ran with foo")
        self.assertEqual(calls, ["foo"])

    def test_force_runs_even_if_lock_not_acquired(self):
        task = self.make_task_instance()

        calls = []

        @locked_task
        def dummy(self, arg):
            calls.append(arg)
            return f"Forced {arg}"

        dummy_task = dummy.__get__(task)

        # Even without the lock, ``force=True`` must run the body exactly
        # once and emit a warning.
        self.mock_cache_lock.return_value.__enter__.return_value = False
        result = dummy_task("bar", force=True)
        self.assertEqual(result, "Forced bar")
        self.assertEqual(calls, ["bar"])
        self.logger.warning.assert_called_once()

    def test_error_in_key_generation_logs_and_raises(self):
        task = self.make_task_instance()

        @locked_task
        def dummy(self, arg):
            return "This shouldn't run"

        dummy_task = dummy.__get__(task)

        # Use a non-repr-able object to simulate key generation failure
        class Unreprable:
            def __repr__(self):
                raise ValueError("Can't repr")

        with self.assertRaises(ValueError):
            dummy_task(Unreprable())

        self.logger.exception.assert_called_once_with(
            "Unable to create cache key from arguments for %s.", task.name
        )


================================================
FILE: concordia/tests/test_fields.py
================================================
from unittest import mock
from urllib.error import HTTPError

from django.forms import ValidationError
from django.test import TestCase, override_settings

from concordia.turnstile.fields import TurnstileField


class TestFields(TestCase):
    """Tests for ``TurnstileField`` with the HTTP layer mocked out."""

    @override_settings(
        TURNSTILE_PROXIES={},
        TURNSTILE_SECRET="test-secret",  # nosec B106: test-only dummy secret
        TURNSTILE_VERIFY_URL="http://example.com",
        TURNSTILE_TIMEOUT=0,
    )
    def test_TurnstileField(self):
        # Walks through widget attributes, the three validation outcomes
        # (success, failure payload, HTTP error) and the special URL
        # parameters, all against a mocked opener.
        default_config = override_settings(
            TURNSTILE_DEFAULT_CONFIG={"appearance": "interaction-only"}
        )
        request_patch = mock.patch("concordia.turnstile.fields.Request")
        opener_patch = mock.patch("concordia.turnstile.fields.build_opener")

        with default_config, request_patch, opener_patch as opener_mock:
            open_mock = opener_mock.return_value.open
            read_mock = open_mock.return_value.read

            optional_field = TurnstileField(required=False)

            # Only the default config shows up as data-* attributes.
            self.assertEqual(
                optional_field.widget_attrs(optional_field.widget),
                {"data-appearance": "interaction-only"},
            )

            # Successful validation from Turnstile
            success_body = '{"success" : true}'.encode()
            read_mock.return_value = success_body
            self.assertEqual(optional_field.validate("test-value"), None)

            # Unsuccessful validation from Turnstile
            failure_body = '{"test-key" : "test-value"}'.encode()
            read_mock.return_value = failure_body
            with self.assertRaises(ValidationError):
                optional_field.validate("test-value")

            # Error trying to contact Turnstile
            open_mock.side_effect = HTTPError(
                "http://example.com", 404, "Test message%", "", mock.MagicMock()
            )
            with self.assertRaises(ValidationError):
                optional_field.validate("test-value")

            # Testing special parameters on the widget: onload/render/hl end
            # up in ``extra_url``, any other keyword becomes a data-* attribute.
            custom_field = TurnstileField(
                onload="testOnload()",
                render="test-render",
                hl="test-hl",
                test_parameter="test-data",
            )
            expected_attrs = {
                "data-appearance": "interaction-only",
                "data-test_parameter": "test-data",
            }
            expected_extra_url = {
                "onload": "testOnload()",
                "render": "test-render",
                "hl": "test-hl",
            }
            self.assertEqual(
                custom_field.widget_attrs(custom_field.widget), expected_attrs
            )
            self.assertEqual(custom_field.widget.extra_url, expected_extra_url)


================================================
FILE: concordia/tests/test_logging.py
================================================
import warnings
from types import SimpleNamespace
from unittest.mock import MagicMock, patch

from django.test import TestCase

from concordia.logging import ConcordiaLogger


class ConcordiaLoggerTests(TestCase):
    """Unit tests for ``ConcordiaLogger`` wrapping a mocked structlog logger."""

    def setUp(self):
        self.mock_structlog_logger = MagicMock()
        self.logger = ConcordiaLogger(self.mock_structlog_logger)

    def _kwargs_logged_at(self, level):
        # Keyword arguments of the most recent call to the mocked structlog
        # method named ``level`` (for example "info").
        return getattr(self.mock_structlog_logger, level).call_args.kwargs

    def test_debug_logs_with_event(self):
        self.logger.debug("debug msg", event_code="debug_event", key1="value1")

        debug_mock = self.mock_structlog_logger.debug
        debug_mock.assert_called_once()
        self.assertEqual(debug_mock.call_args.args[0], "debug msg")
        logged = debug_mock.call_args.kwargs
        self.assertEqual(logged["event_code"], "debug_event")
        self.assertEqual(logged["key1"], "value1")

    def test_info_logs_with_event(self):
        self.logger.info("info msg", event_code="info_event", key2="value2")

        info_mock = self.mock_structlog_logger.info
        info_mock.assert_called_once()
        self.assertEqual(info_mock.call_args.args[0], "info msg")
        logged = info_mock.call_args.kwargs
        self.assertEqual(logged["event_code"], "info_event")
        self.assertEqual(logged["key2"], "value2")

    def test_warning_requires_reason_and_reason_code(self):
        # ``reason`` without ``reason_code`` is rejected with TypeError.
        self.assertRaises(
            TypeError,
            self.logger.warning,
            "warning msg",
            event_code="warn_event",
            reason="only_reason",
        )

        self.logger.warning(
            "warning msg",
            event_code="warn_event",
            reason="test reason",
            reason_code="warn_code",
            key3="value3",
        )
        # Exactly one call reached structlog: the complete one above.
        self.mock_structlog_logger.warning.assert_called_once()
        logged = self._kwargs_logged_at("warning")
        self.assertEqual(logged["event_code"], "warn_event")
        self.assertEqual(logged["reason"], "test reason")
        self.assertEqual(logged["reason_code"], "warn_code")
        self.assertEqual(logged["key3"], "value3")

    def test_error_requires_reason_and_reason_code(self):
        # ``reason_code`` without ``reason`` is rejected with TypeError.
        self.assertRaises(
            TypeError,
            self.logger.error,
            "error msg",
            event_code="error_event",
            reason_code="only_code",
        )

        self.logger.error(
            "error msg",
            event_code="error_event",
            reason="error reason",
            reason_code="error_code",
        )
        self.mock_structlog_logger.error.assert_called_once()
        logged = self._kwargs_logged_at("error")
        self.assertEqual(logged["event_code"], "error_event")
        self.assertEqual(logged["reason"], "error reason")
        self.assertEqual(logged["reason_code"], "error_code")

    def test_missing_event_raises(self):
        self.assertRaises(ValueError, self.logger.info, "msg", event_code=None)

    def test_log_merges_context_correctly(self):
        thing = SimpleNamespace(id=42)
        self.logger.register_extractor("thing", lambda o: {"thing_id": o.id})

        self.logger.info("msg", event_code="test_event", thing=thing)

        self.assertEqual(self._kwargs_logged_at("info")["thing_id"], 42)

    def test_log_explicit_key_overrides_extracted(self):
        thing = SimpleNamespace(id=42)
        self.logger.register_extractor("thing", lambda o: {"thing_id": 123})

        self.logger.info("msg", event_code="test_event", thing=thing, thing_id=999)

        # The explicitly passed thing_id wins over the extractor's 123.
        self.assertEqual(self._kwargs_logged_at("info")["thing_id"], 999)

    def test_bind_merges_context(self):
        bound_logger = self.logger.bind(foo="bar")

        self.assertIsInstance(bound_logger, ConcordiaLogger)
        self.assertIn("foo", bound_logger._context)
        self.assertEqual(bound_logger._context["foo"], "bar")

    def test_bind_merges_context_into_logging(self):
        bound_logger = self.logger.bind(user="uval")
        bound_logger.register_extractor("user", lambda o: {"user_id": o})

        bound_logger.info("msg", event_code="bound_event")

        self.assertEqual(self._kwargs_logged_at("info")["user_id"], "uval")

    def test_unregister_extractor_removes_extractor(self):
        self.logger.register_extractor("foo", lambda o: {"foo_id": 1})
        self.logger.unregister_extractor("foo")

        self.assertNotIn("foo", self.logger._extractors)

    def test_register_extractor_warns_on_chained_override(self):
        def fake_asset_extractor(x):
            return {"asset_id": 1, "item_id": 2}

        with warnings.catch_warnings(record=True) as caught:
            warnings.simplefilter("always")
            self.logger.register_extractor("asset", fake_asset_extractor)
            messages = [str(entry.message) for entry in caught]
            self.assertTrue(
                any(
                    "default extractors may still reference" in text
                    for text in messages
                )
            )

    def test_log_raises_when_message_is_none(self):
        self.assertRaises(ValueError, self.logger.info, None, event_code="event")

    def test_log_raises_when_message_is_none_direct(self):
        self.assertRaises(
            ValueError, self.logger.log, "info", None, event_code="event"
        )

    def test_log_raises_when_message_is_empty(self):
        self.assertRaises(ValueError, self.logger.info, "", event_code="event")

    def test_log_raises_when_message_is_empty_direct(self):
        self.assertRaises(ValueError, self.logger.log, "info", "", event_code="event")

    def test_log_skips_none_values_from_extractor(self):
        class ThingWithoutId:
            def __init__(self):
                self.id = None

        self.logger.register_extractor("thing", lambda o: {"thing_id": o.id})

        self.logger.info("msg", event_code="event", thing=ThingWithoutId())

        self.assertNotIn("thing_id", self._kwargs_logged_at("info"))

    def test_log_includes_nonextractor_bound_context(self):
        bound_logger = self.logger.bind(extra1="foo", extra2="bar")

        bound_logger.info("msg", event_code="event")

        logged = self._kwargs_logged_at("info")
        self.assertEqual(logged["extra1"], "foo")
        self.assertEqual(logged["extra2"], "bar")

    def test_log_skips_none_values_in_context(self):
        self.logger.info("msg", event_code="event", explicit=None)

        self.assertNotIn("explicit", self._kwargs_logged_at("info"))

    def test_log_overrides_bound_and_extracted_context(self):
        thing = SimpleNamespace(id=123)
        bound_logger = self.logger.bind(thing=thing, value="a")
        bound_logger.register_extractor(
            "thing", lambda o: {"thing_id": o.id, "value": "b"}
        )

        bound_logger.info("msg", event_code="event", value="c")

        logged = self._kwargs_logged_at("info")
        # Extracted value ("b") overridden by explicit context ("c")
        self.assertEqual(logged["value"], "c")
        self.assertEqual(logged["thing_id"], 123)

    def test_extractor_returns_none_value_skipped(self):
        thing = SimpleNamespace()
        self.logger.register_extractor("thing", lambda o: {"thing_id": None})

        self.logger.info("msg", event_code="event", thing=thing)

        self.assertNotIn("thing_id", self._kwargs_logged_at("info"))

    def test_get_logger_uses_structlog(self):
        with patch("concordia.logging.structlog.get_logger") as mock_get_logger:
            structlog_logger = MagicMock()
            mock_get_logger.return_value = structlog_logger

            wrapped = ConcordiaLogger.get_logger("concordia.tests")

            # The requested name is passed on with a "structlog." prefix.
            mock_get_logger.assert_called_once_with("structlog.concordia.tests")
            self.assertIsInstance(wrapped, ConcordiaLogger)
            self.assertEqual(wrapped._logger, structlog_logger)

    def test_log_raises_valueerror_for_empty_reason_and_code(self):
        # Empty reason on a warning.
        self.assertRaises(
            ValueError,
            self.logger.log,
            "warning",
            "bad",
            event_code="something",
            reason="",
            reason_code="fail",
        )

        # ``None`` reason_code on an error.
        self.assertRaises(
            ValueError,
            self.logger.log,
            "error",
            "bad",
            event_code="something",
            reason="fail",
            reason_code=None,
        )

    def test_exception_logs_with_exc_info(self):
        # Call ``exception`` from inside an active ``except`` block.
        try:
            raise ValueError("Something went wrong")
        except ValueError:
            self.logger.exception(
                "Exception occurred",
                event_code="test_exception",
                reason="An error was raised",
                reason_code="value_error",
                extra="context",
            )

        # The call is forwarded to structlog's ``error`` with exc_info set.
        error_mock = self.mock_structlog_logger.error
        error_mock.assert_called_once()
        self.assertEqual(error_mock.call_args.args[0], "Exception occurred")
        logged = error_mock.call_args.kwargs
        self.assertEqual(logged["event_code"], "test_exception")
        self.assertEqual(logged["reason"], "An error was raised")
        self.assertEqual(logged["reason_code"], "value_error")
        self.assertEqual(logged["extra"], "context")
        self.assertTrue(logged.get("exc_info"))


================================================
FILE: concordia/tests/test_maintenance.py
================================================
from django.core.cache import cache
from django.test import RequestFactory, TestCase
from maintenance_mode.core import set_maintenance_mode

from concordia.maintenance import need_maintenance_response

from .utils import CreateTestUsers


class TestMaintenance(TestCase, CreateTestUsers):
    """Checks ``need_maintenance_response`` for each maintenance-mode setup.

    The cache is cleared before and after every test so the
    ``maintenance_mode_frontend_available`` flag never leaks between tests.
    """

    def setUp(self):
        self.request_factory = RequestFactory()
        cache.clear()

    def tearDown(self):
        cache.clear()

    def _root_request(self):
        # Plain GET request for "/" with no user attached.
        return self.request_factory.get("/")

    def test_need_maintenance_response_maintenance_default(self):
        self.assertFalse(need_maintenance_response(self._root_request()))

    def test_need_maintenance_response_maintenance_off(self):
        set_maintenance_mode(False)
        self.assertFalse(need_maintenance_response(self._root_request()))

    def test_need_maintenance_response_maintenance_on(self):
        set_maintenance_mode(True)
        req = self._root_request()
        self.assertTrue(need_maintenance_response(req))

        staff_user = self.create_test_user()
        req.user = staff_user
        staff_user.is_staff = True

        # A staff user is attached, but the frontend flag is off (the
        # default), so the maintenance response is still required.
        self.assertTrue(need_maintenance_response(req))

    def test_need_maintenance_response_maintenance_frontend(self):
        set_maintenance_mode(True)
        req = self._root_request()
        user = self.create_test_user()
        req.user = user
        cache.set("maintenance_mode_frontend_available", True)

        # A user is attached but is not staff, so the maintenance response
        # is still required.
        self.assertTrue(need_maintenance_response(req))

        # Once the user is staff, no maintenance response is needed.
        user.is_staff = True
        self.assertFalse(need_maintenance_response(req))


================================================
FILE: concordia/tests/test_management_commands.py
================================================
from io import StringIO
from unittest import mock

from django.core.management import call_command
from django.test import TestCase

from concordia.tests.utils import create_asset, create_campaign


class EnsureInitialSiteConfigurationTests(TestCase):
    """Smoke test for the ``ensure_initial_site_configuration`` command.

    The test only checks that the command runs without raising; nothing is
    asserted about the captured output.
    """

    def test_command_output(self, *args, **kwargs):
        command = "ensure_initial_site_configuration"
        buffer = StringIO()

        call_command(command, admin_email="admin@loc.gov", stdout=buffer)
        call_command(command, site_domain="crowd.loc.gov", stdout=buffer)

        # Run once more with ``Site.objects.update`` patched to return 0.
        with mock.patch(
            "django.contrib.sites.models.Site.objects.update", return_value=0
        ):
            call_command(command, site_domain="crowd.loc.gov", stdout=buffer)


class ImportSiteReportsTests(TestCase):
    """Smoke test for the ``import_site_reports`` management command."""

    def test_command_output(self, *args, **kwargs):
        # A campaign with id 1 is created before the fixture CSV is imported.
        # The test passes as long as the command does not raise.
        create_campaign(id=1)
        buffer = StringIO()
        command_options = {
            "csv_file": "concordia/tests/data/site_reports.csv",
            "stdout": buffer,
        }
        call_command("import_site_reports", **command_options)


class PrintFrontendTestUrlsTests(TestCase):
    """Smoke test for the ``print_frontend_test_urls`` management command."""

    def test_command_output(self, *args, **kwargs):
        # NOTE(review): "" is a substring of every string, so both
        # assertions below can only fail if the command itself raises.
        # Replace them with checks on the real output once the expected
        # URLs are known.
        buffer = StringIO()

        # First run: no asset exists yet.
        call_command("print_frontend_test_urls", stdout=buffer)
        self.assertIn("", buffer.getvalue())

        # Second run: one asset exists; output is appended to the same buffer.
        create_asset()
        call_command("print_frontend_test_urls", stdout=buffer)
        self.assertIn("", buffer.getvalue())


================================================
FILE: concordia/tests/test_models.py
================================================
import json
from datetime import date, datetime, timedelta
from decimal import Decimal
from secrets import token_hex
from unittest import mock

from django.conf import settings
from django.core.exceptions import ObjectDoesNotExist, ValidationError
from django.db.models import signals
from django.test import TestCase
from django.utils import timezone

from concordia.models import (
    Asset,
    AssetTranscriptionReservation,
    Campaign,
    CardFamily,
    ConcordiaUser,
    HelpfulLink,
    KeyMetricsReport,
    MediaType,
    NextReviewableCampaignAsset,
    NextReviewableTopicAsset,
    NextTranscribableCampaignAsset,
    NextTranscribableTopicAsset,
    SiteReport,
    Topic,
    Transcription,
    TranscriptionStatus,
    UserProfile,
    UserProfileActivity,
    _update_useractivity_cache,
    resource_file_upload_path,
    update_userprofileactivity_table,
    validated_get_or_create,
)
from concordia.signals.handlers import create_user_profile, on_transcription_save
from concordia.utils import get_anonymous_user

from .utils import (
    CreateTestUsers,
    create_asset,
    create_banner,
    create_campaign,
    create_campaign_retirement_progress,
    create_card,
    create_card_family,
    create_carousel_slide,
    create_concordia_file,
    create_guide,
    create_helpful_link,
    create_item,
    create_simple_page,
    create_tag,
    create_tag_collection,
    create_topic,
    create_transcription,
    create_user_profile_activity,
)


class AssetTestCase(CreateTestUsers, TestCase):
    """Tests for ``Asset`` model behaviour (OCR, storage paths, rollforward).

    ``setUp`` creates one asset with two transcriptions: one by the anonymous
    user, and one by ``tester`` that the anonymous user reviewed.
    """

    def setUp(self):
        self.asset = create_asset()
        self.anon = get_anonymous_user()
        create_transcription(asset=self.asset, user=self.anon)
        create_transcription(
            asset=self.asset,
            user=self.create_test_user(username="tester"),
            reviewed_by=self.anon,
        )

    def test_get_ocr_transcript(self):
        self.asset.storage_image = "tests/test-european.jpg"
        self.asset.save()
        phrase = "marrón rápido salta sobre el perro"
        # assertIn/assertNotIn report the phrase and the OCR text on failure,
        # unlike assertTrue/assertFalse on a pre-evaluated ``in`` expression.
        # The phrase is only expected when the language is set to "spa".
        self.assertNotIn(phrase, self.asset.get_ocr_transcript())
        self.assertNotIn(
            phrase, self.asset.get_ocr_transcript(language="bad-language-code")
        )
        self.assertIn(phrase, self.asset.get_ocr_transcript(language="spa"))

    def test_get_contributor_count(self):
        # The anonymous user and "tester" from setUp.
        self.assertEqual(self.asset.get_contributor_count(), 2)

    def test_turn_off_ocr(self):
        # The flag is checked in turn on the asset, its item and the
        # item's project.
        self.assertFalse(self.asset.turn_off_ocr())
        self.asset.disable_ocr = True
        self.asset.save()
        self.assertTrue(self.asset.turn_off_ocr())

        self.assertFalse(self.asset.item.turn_off_ocr())
        self.asset.item.disable_ocr = True
        self.asset.item.save()
        self.assertTrue(self.asset.item.turn_off_ocr())

        self.assertFalse(self.asset.item.project.turn_off_ocr())
        self.asset.item.project.disable_ocr = True
        self.asset.item.project.save()
        self.assertTrue(self.asset.item.project.turn_off_ocr())

    def test_get_storage_path(self):
        self.assertEqual(
            self.asset.get_storage_path(filename=self.asset.storage_image.name),
            "test-campaign/test-project/testitem.0123456789/1.jpg",
        )

    def test_saving_without_campaign(self):
        # Creating an asset without passing a campaign must not raise.
        try:
            Asset.objects.create(
                item=self.asset.item,
                title="No campaign",
                slug="no-campaign",
                media_type=MediaType.IMAGE,
                storage_image="unittest1.jpg",
            )
        except (ValidationError, ObjectDoesNotExist):
            self.fail("Creating an Asset without a campaign failed validation.")

    def test_rollforward_with_only_rollforward_transcriptions(self):
        asset = create_asset(slug="rollforward-test", item=self.asset.item)
        create_transcription(asset=asset, user=self.anon, rolled_forward=True)
        with self.assertRaisesMessage(
            ValueError,
            "Can not rollforward transcription on an asset with "
            "no non-rollforward transcriptions",
        ):
            asset.rollforward_transcription(self.anon)

    def test_rollforward_with_too_many_rollforward_transcriptions(self):
        # One ordinary transcription followed by two rollforwards of it.
        asset = create_asset(slug="rollforward-test", item=self.asset.item)
        transcription1 = create_transcription(asset=asset, user=self.anon)
        create_transcription(
            asset=asset, user=self.anon, supersedes=transcription1, rolled_forward=True
        )
        create_transcription(
            asset=asset, user=self.anon, supersedes=transcription1, rolled_forward=True
        )
        with self.assertRaisesMessage(
            ValueError,
            "More rollforward transcription exist than non-roll-forward "
            "transcriptions, which shouldn't be possible. Possibly "
            "incorrectly modified transcriptions for this asset.",
        ):
            asset.rollforward_transcription(self.anon)

    def test_rollforward_with_no_superseded_transcription(self):
        # This isn't a state that would happen normally, but could be created
        # accidentally when manually editing transcription history
        asset = create_asset(slug="rollforward-test", item=self.asset.item)
        transcription1 = create_transcription(asset=asset, user=self.anon)
        create_transcription(asset=asset, user=self.anon, supersedes=transcription1)
        create_transcription(
            asset=asset, user=self.anon, rolled_back=True, source=transcription1
        )
        with self.assertRaisesMessage(
            ValueError,
            "Can not rollforward transcription on an asset if the latest "
            "rollback transcription did not supersede a previous transcription",
        ):
            asset.rollforward_transcription(self.anon)

    def test_get_storage_path_handles_jpeg(self):
        # Ensure ".jpeg" is normalized to ".jpg"
        expected = self.asset.get_asset_image_filename("jpg")
        self.assertEqual(self.asset.get_storage_path("anything.jpeg"), expected)


class ItemModelTests(TestCase):
    """Tests for how ``Item.thumbnail_link`` picks between its two sources."""

    def test_thumbnail_link_prefers_image_url_when_present(self):
        item = create_item()

        # Minimal stand-in that exposes a ``url`` attribute.
        class StubImage:
            url = "http://example.test/media/thumb.jpg"

        item.thumbnail_image = StubImage()

        self.assertEqual(item.thumbnail_link, StubImage.url)

    def test_thumbnail_link_falls_back_when_image_url_raises(self):
        # If .url access raises ValueError, fall back to thumbnail_url
        item = create_item()

        class BrokenImage:
            @property
            def url(self):
                raise ValueError("missing from storage")

        fallback_url = "http://example.test/media/fallback.jpg"
        item.thumbnail_image = BrokenImage()
        item.thumbnail_url = fallback_url

        self.assertEqual(item.thumbnail_link, item.thumbnail_url)

    def test_thumbnail_link_returns_thumbnail_url_when_no_image(self):
        item = create_item()
        fallback_url = "http://example.test/media/fallback.jpg"
        item.thumbnail_image = None
        item.thumbnail_url = fallback_url

        self.assertEqual(item.thumbnail_link, item.thumbnail_url)

    def test_thumbnail_link_returns_none_when_no_image_or_url(self):
        # With neither an image nor a URL the property returns None.
        item = create_item()
        item.thumbnail_image = None
        item.thumbnail_url = None

        self.assertIsNone(item.thumbnail_link)


class TranscriptionManagerTestCase(CreateTestUsers, TestCase):
    """Tests for the ``Transcription`` manager's review/transcribe queries.

    Covers ``recent_review_actions``, ``review_actions``, ``review_incidents``
    and ``transcribe_incidents`` on ``Transcription.objects``, plus
    ``ConcordiaUser.review_incidents``. The tests depend on the exact
    timestamps assigned to each transcription, so statement order matters.
    """

    def setUp(self):
        # transcription1: by "tester1", rejected two days ago.
        # transcription2: same asset, by the anonymous user, no review state.
        self.transcription1 = create_transcription(
            user=self.create_user(username="tester1"),
            rejected=timezone.now() - timedelta(days=2),
        )
        self.transcription2 = create_transcription(
            asset=self.transcription1.asset, user=get_anonymous_user()
        )

    def test_recent_review_actions(self):
        # The two-day-old rejection from setUp is not counted as recent.
        # NOTE(review): the length of the "recent" window is not visible
        # here - confirm against the manager.
        transcriptions = Transcription.objects
        self.assertEqual(transcriptions.recent_review_actions().count(), 0)

        # An acceptance timestamped now is counted.
        self.transcription1.accepted = timezone.now()
        self.transcription1.save()
        self.assertEqual(transcriptions.recent_review_actions().count(), 1)

        # So is a rejection timestamped now.
        self.transcription2.rejected = timezone.now()
        self.transcription2.save()
        self.assertEqual(transcriptions.recent_review_actions().count(), 2)

    def test_review_actions(self):
        # Only transcription1's rejection (two days ago) falls inside the
        # five-days-ago to one-day-ago window.
        start = timezone.now() - timedelta(days=5)
        end = timezone.now() - timedelta(days=1)
        self.assertEqual(Transcription.objects.review_actions(start, end).count(), 1)

    def test_review_incidents(self):
        # Two accepts 29 seconds apart by the same reviewer ("tester2").
        self.transcription1.accepted = timezone.now()
        self.transcription1.reviewed_by = self.create_user(username="tester2")
        self.transcription1.save()
        self.transcription2.accepted = self.transcription1.accepted + timedelta(
            seconds=29
        )
        self.transcription2.reviewed_by = self.transcription1.reviewed_by
        self.transcription2.save()
        # Two rejections by the same reviewer, 29 and 58 seconds after the
        # second accept.
        create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=self.transcription1.reviewed_by,
            rejected=self.transcription2.accepted + timedelta(seconds=29),
        )
        create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=self.transcription1.reviewed_by,
            rejected=self.transcription2.accepted + timedelta(seconds=58),
        )
        users = Transcription.objects.review_incidents()
        self.assertNotIn(self.transcription1.user.id, users)

        # Add a third accept 58 seconds after the first, then a fourth
        # accept 61 seconds after the third.
        transcription3 = create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=self.transcription1.reviewed_by,
            accepted=self.transcription1.accepted + timedelta(seconds=58),
        )
        transcription4 = create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=self.transcription1.reviewed_by,
            accepted=transcription3.accepted + timedelta(minutes=1, seconds=1),
        )
        users = Transcription.objects.review_incidents()
        self.assertEqual(len(users), 1)
        # NOTE(review): the tuple looks like (reviewer id, reviewer username,
        # incident count, accepted-review count) - confirm the meaning of the
        # last two fields against the manager.
        self.assertEqual(
            users[0],
            (
                self.transcription1.reviewed_by.id,
                self.transcription1.reviewed_by.username,
                2,
                4,
            ),
        )

        # Two more accepts, 29 and 58 seconds after the fourth, raise both
        # trailing numbers by two.
        create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=self.transcription1.reviewed_by,
            accepted=transcription4.accepted + timedelta(seconds=29),
        )
        create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=self.transcription1.reviewed_by,
            accepted=transcription4.accepted + timedelta(seconds=58),
        )
        users = Transcription.objects.review_incidents()
        self.assertEqual(len(users), 1)
        self.assertEqual(
            users[0],
            (
                self.transcription1.reviewed_by.id,
                self.transcription1.reviewed_by.username,
                4,
                6,
            ),
        )

    def test_transcribe_incidents(self):
        # Two submissions by the same user, 29 seconds apart, on the same
        # asset: no incident is reported.
        self.transcription1.submitted = timezone.now()
        self.transcription1.save()
        self.transcription2.submitted = self.transcription1.submitted + timedelta(
            seconds=29
        )
        self.transcription2.user = self.transcription1.user
        self.transcription2.save()
        users = Transcription.objects.transcribe_incidents()
        self.assertEqual(len(users), 0)
        self.assertNotIn(self.transcription1.user.id, users)

        # Add submissions on two further assets, plus a second submission on
        # the last of them 59 seconds later.
        transcription3 = create_transcription(
            asset=create_asset(slug="asset-two", item=self.transcription1.asset.item),
            user=self.transcription1.user,
            submitted=self.transcription1.submitted + timedelta(seconds=58),
        )
        transcription4 = create_transcription(
            asset=create_asset(slug="asset-three", item=self.transcription1.asset.item),
            user=self.transcription1.user,
            submitted=transcription3.submitted + timedelta(minutes=1, seconds=1),
        )
        create_transcription(
            asset=transcription4.asset,
            user=self.transcription1.user,
            submitted=transcription4.submitted + timedelta(seconds=59),
        )
        users = Transcription.objects.transcribe_incidents()
        self.assertEqual(len(users), 1)
        # NOTE(review): the tuple looks like (user id, username, incident
        # count, submission count) - confirm against the manager.
        self.assertEqual(
            users[0],
            (self.transcription1.user.id, self.transcription1.user.username, 2, 5),
        )

        # One more submission on a new asset, 1m59s after the first, raises
        # both trailing numbers by one.
        create_transcription(
            asset=create_asset(slug="asset-five", item=self.transcription1.asset.item),
            user=self.transcription1.user,
            submitted=self.transcription1.submitted + timedelta(minutes=1, seconds=59),
        )
        users = Transcription.objects.transcribe_incidents()
        self.assertEqual(len(users), 1)
        self.assertEqual(
            users[0],
            (self.transcription1.user.id, self.transcription1.user.username, 3, 6),
        )

    def test_review_incidents_returns_empty_when_counts_zero(self):
        # Two accepts by the same reviewer, 61 seconds apart, produce an
        # empty result list.
        reviewer = self.create_user(username="rev-zero")
        asset = self.transcription1.asset

        t1 = create_transcription(
            asset=asset,
            user=self.create_user(username="u-a"),
            reviewed_by=reviewer,
            accepted=timezone.now() - timedelta(minutes=5),
        )
        create_transcription(
            asset=asset,
            user=self.create_user(username="u-b"),
            reviewed_by=reviewer,
            accepted=t1.accepted + timedelta(seconds=61),
        )

        out = Transcription.objects.review_incidents()
        self.assertEqual(out, [])

    def test_user_review_incidents_no_threshold_hit(self):
        # Same 61-second gap, checked through ConcordiaUser.review_incidents
        # with the default threshold: zero incidents.
        asset = self.transcription1.asset

        reviewer = self.create_user("reviewer-1")
        # Re-fetch the reviewer as a ConcordiaUser to reach review_incidents().
        reviewer_proxy = ConcordiaUser.objects.get(pk=reviewer.pk)

        base = timezone.now()
        create_transcription(
            asset=asset,
            user=self.create_user("ri_u1"),
            reviewed_by=reviewer_proxy,
            accepted=base,
        )
        create_transcription(
            asset=asset,
            user=self.create_user("ri_u2"),
            reviewed_by=reviewer_proxy,
            accepted=base + timedelta(seconds=61),
        )

        recent = Transcription.objects.filter(accepted__isnull=False)
        incidents = reviewer_proxy.review_incidents(recent)
        self.assertEqual(incidents, 0)

    def test_review_incidents_no_threshold_match_inner_loop_break(self):
        # Two accepts for same reviewer but >60s apart:
        a1 = create_asset(slug="rev-gap-a1", item=self.transcription1.asset.item)
        a2 = create_asset(slug="rev-gap-a2", item=a1.item)
        reviewer = self.create_user("reviewer-1")

        t0 = timezone.now()
        create_transcription(
            asset=a1, user=self.create_user("u1"), reviewed_by=reviewer, accepted=t0
        )
        create_transcription(
            asset=a2,
            user=self.create_user("u2"),
            reviewed_by=reviewer,
            accepted=t0 + timedelta(seconds=61),
        )

        recent = Transcription.objects.filter(accepted__isnull=False)
        reviewer_proxy = ConcordiaUser.objects.get(pk=reviewer.pk)

        incidents = reviewer_proxy.review_incidents(recent)
        self.assertEqual(incidents, 0)

    def test_review_incidents_loops_until_threshold(self):
        reviewer = self.create_user(username="test-reviewer-1")

        # Three accepts within 60s so threshold=3 will require two inner
        # iterations (count goes 1->2, not equal to threshold, then 2->3)
        base = timezone.now()
        create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=reviewer,
            accepted=base,
        )
        create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=reviewer,
            accepted=base + timedelta(seconds=20),
        )
        create_transcription(
            asset=self.transcription1.asset,
            user=self.transcription1.user,
            reviewed_by=reviewer,
            accepted=base + timedelta(seconds=40),
        )

        # Restrict the queryset to the three accepts created above.
        recent_accepts = Transcription.objects.filter(
            accepted__gte=base - timedelta(seconds=1)
        )

        reviewer_proxy = ConcordiaUser.objects.get(id=reviewer.id)

        incidents = reviewer_proxy.review_incidents(
            recent_accepts=recent_accepts, threshold=3
        )
        self.assertEqual(incidents, 1)


class TranscriptionTestCase(CreateTestUsers, TestCase):
    """Tests for ``Transcription`` validation, save signalling and status."""

    def setUp(self):
        # One asset with a rejected transcription by ``user`` and a plain
        # transcription by ``user2``.
        self.user = self.create_user("test-user-1")
        self.user2 = self.create_user("test-user-2")
        self.asset = create_asset()
        self.transcription1 = create_transcription(
            user=self.user,
            asset=self.asset,
            rejected=timezone.now() - timedelta(days=2),
        )
        self.transcription2 = create_transcription(asset=self.asset, user=self.user2)

    def test_campaign_slug(self):
        """``campaign_slug()`` matches the slug of the asset's campaign."""
        self.assertEqual(
            self.asset.item.project.campaign.slug, self.transcription1.campaign_slug()
        )

    def test_clean(self):
        """``clean()`` passes for a plain instance and rejects two bad ones."""
        # No review information at all: validation must not raise.
        unreviewed = Transcription(asset=self.asset, user=self.user)
        unreviewed.clean()

        # The transcriber is also the reviewer accepting the transcription.
        self_accepted = Transcription(
            asset=self.asset,
            user=self.user,
            reviewed_by=self.user,
            accepted=timezone.now(),
        )
        with self.assertRaises(ValidationError):
            self_accepted.clean()

        # Accepted and rejected timestamps are both set.
        accepted_and_rejected = Transcription(
            asset=self.asset,
            user=self.user,
            reviewed_by=self.user2,
            accepted=timezone.now(),
            rejected=timezone.now(),
        )
        with self.assertRaises(ValidationError):
            accepted_and_rejected.clean()

    @mock.patch("concordia.tests.test_models.on_transcription_save")
    def test_save(self, mock_handler):
        """Each save of a ``Transcription`` fires the connected receiver once."""
        # While the patch is active this module-level name resolves to the mock.
        handler = on_transcription_save
        signals.post_save.connect(handler, sender=Transcription)
        # Register the disconnect immediately so that a failing assertion
        # below cannot leave the receiver attached for later tests.
        self.addCleanup(signals.post_save.disconnect, handler, sender=Transcription)

        transcription = create_transcription(asset=self.asset)
        self.assertTrue(mock_handler.called)
        self.assertEqual(mock_handler.call_count, 1)

        transcription.save()
        self.assertEqual(mock_handler.call_count, 2)

    def test_status(self):
        """``status`` reflects in-progress, submitted and completed states."""
        transcription = create_transcription(user=self.user, asset=self.asset)
        self.assertEqual(
            transcription.status,
            TranscriptionStatus.CHOICE_MAP[TranscriptionStatus.IN_PROGRESS],
        )

        transcription2 = create_transcription(
            asset=transcription.asset, user=self.user, submitted=timezone.now()
        )
        self.assertEqual(
            transcription2.status,
            TranscriptionStatus.CHOICE_MAP[TranscriptionStatus.SUBMITTED],
        )

        transcription3 = create_transcription(
            asset=transcription.asset,
            user=self.user,
            reviewed_by=self.user2,
            accepted=timezone.now(),
        )
        self.assertEqual(
            transcription3.status,
            TranscriptionStatus.CHOICE_MAP[TranscriptionStatus.COMPLETED],
        )


class SignalHandlersTest(CreateTestUsers, TestCase):
    """Checks what ``_update_useractivity_cache`` writes to the cache."""

    def test_update_useractivity_cache(self):
        # Patch ``set`` first and ``get`` second, the same order the stacked
        # decorators used to apply them in.
        with (
            mock.patch("django.core.cache.cache.set") as cache_set,
            mock.patch("django.core.cache.cache.get") as cache_get,
        ):
            campaign = create_campaign()
            transcriber = self.create_test_user()
            cache_key = f"userprofileactivity_{campaign.pk}"

            # Empty cache + one "transcribe" action -> (1, 0) for that user.
            cache_get.return_value = {}
            _update_useractivity_cache(transcriber.id, campaign.id, "transcribe")
            self.assertEqual(cache_set.call_count, 1)
            cache_set.assert_called_with(
                cache_key, {transcriber.id: (1, 0)}, timeout=None
            )

            # Empty cache + one "review" action -> (0, 1) for the reviewer.
            reviewer = self.create_test_user(username="testuser2")
            cache_get.return_value = {}
            _update_useractivity_cache(reviewer.id, campaign.id, "review")
            self.assertEqual(cache_set.call_count, 2)
            cache_set.assert_called_with(
                cache_key, {reviewer.id: (0, 1)}, timeout=None
            )


class AssetTranscriptionReservationTest(CreateTestUsers, TestCase):
    """Checks that a reservation token splits back into token and user parts."""

    def setUp(self):
        self.asset = create_asset()
        self.user = self.create_user("test-user")

        # The stored token is a random hex string followed by the user id
        # left-padded with zeros to six characters.
        self.token = token_hex(22)
        user_id_text = str(self.user.id)
        self.uid = user_id_text.zfill(6)
        self.reservation_token = self.token + self.uid

        self.reservation = AssetTranscriptionReservation.objects.create(
            asset=self.asset,
            reservation_token=self.reservation_token,
        )

    def test_get_token(self):
        extracted_token = self.reservation.get_token()
        self.assertEqual(extracted_token, self.token)

    def test_get_user(self):
        extracted_user = self.reservation.get_user()
        self.assertEqual(extracted_user, self.uid)


class UserProfileActivityTestCase(TestCase):
    """Tests for the small helper methods on ``UserProfileActivity``."""

    def setUp(self):
        # Unsaved instances are enough for the status and total checks.
        self.user_profile_activity = UserProfileActivity(
            campaign=Campaign(),
            transcribe_count=135,
            review_count=204,
        )

    def test_get_status(self):
        activity = self.user_profile_activity
        expected_labels = (
            (Campaign.Status.ACTIVE, "Active"),
            (Campaign.Status.COMPLETED, "Completed"),
            (Campaign.Status.RETIRED, "Retired"),
        )
        for status, label in expected_labels:
            activity.campaign.status = status
            self.assertEqual(activity.get_status(), label)

    def test_total_actions(self):
        # 135 transcriptions + 204 reviews
        total = self.user_profile_activity.total_actions()
        self.assertEqual(total, 339)

    def test_str(self):
        saved_activity = create_user_profile_activity()
        expected = f"{saved_activity.user} - {saved_activity.campaign}"
        self.assertEqual(expected, str(saved_activity))


class UserProfileTestCase(CreateTestUsers, TestCase):
    """Tests for ``update_userprofileactivity_table`` with profile
    auto-creation switched off."""

    def setUp(self):
        super().setUp()
        # Detach the profile-creating receiver so each test controls whether
        # a profile exists. The reconnect is registered as a cleanup so it
        # still runs when an assertion fails; doing it on the last line of
        # each test would leave the receiver detached for every later test.
        signals.post_save.disconnect(
            create_user_profile, sender=settings.AUTH_USER_MODEL
        )
        self.addCleanup(
            signals.post_save.connect,
            create_user_profile,
            sender=settings.AUTH_USER_MODEL,
        )

    def test_update_userprofileactivity_table(self):
        """A missing profile is created and its transcribe count becomes 1."""
        user = self.create_test_user()
        self.assertFalse(hasattr(user, "profile"))

        transcription = create_transcription(user=user)
        update_userprofileactivity_table(
            user, transcription.asset.item.project.campaign.id, "transcribe_count"
        )

        self.assertTrue(hasattr(user, "profile"))
        self.assertEqual(user.profile.transcribe_count, 1)

    def test_update_userprofileactivity_table_updates_existing_and_profile(self):
        """Existing activity and profile rows are incremented."""
        user = self.create_test_user()
        UserProfile.objects.create(user=user)

        transcription = create_transcription(user=user)
        campaign = transcription.asset.item.project.campaign
        upa, _ = UserProfileActivity.objects.get_or_create(
            user=user, campaign=campaign, defaults={"transcribe_count": 1}
        )

        update_userprofileactivity_table(user, campaign.id, "transcribe_count")

        # F() increments apply on save; refresh to observe DB values
        upa.refresh_from_db()
        user.refresh_from_db()
        user.profile.refresh_from_db()

        self.assertEqual(upa.transcribe_count, 2)
        self.assertEqual(user.profile.transcribe_count, 1)


class CampaignTestCase(TestCase):
    """Checks the ``unlisted``, ``completed`` and ``retired`` manager filters."""

    def test_queryset(self):
        campaign = create_campaign(unlisted=True)
        self.assertIn(campaign, Campaign.objects.unlisted())

        # After each status change the matching manager method must return
        # the campaign.
        status_filters = (
            (Campaign.Status.COMPLETED, Campaign.objects.completed),
            (Campaign.Status.RETIRED, Campaign.objects.retired),
        )
        for new_status, filtered in status_filters:
            campaign.status = new_status
            campaign.save()
            self.assertIn(campaign, filtered())


class CardTestCase(TestCase):
    """``str(card)`` is the card's title."""

    def test_str(self):
        new_card = create_card()
        rendered = str(new_card)
        self.assertEqual(new_card.title, rendered)


class CardFamilyTestCase(TestCase):
    """Tests for ``CardFamily`` string form and save signalling."""

    def setUp(self):
        self.family1 = create_card_family(default=True)

    def test_str(self):
        """``str(family)`` is the family's slug."""
        self.assertEqual(self.family1.slug, str(self.family1))

    def test_on_cardfamily_save(self):
        """Saving a ``CardFamily`` calls a connected ``post_save`` receiver once."""
        with mock.patch("concordia.models.on_cardfamily_save") as mocked_handler:
            signals.post_save.connect(mocked_handler, sender=CardFamily)
            # Detach the mock again whatever happens below, so it cannot
            # linger on the signal and be invoked by later tests.
            self.addCleanup(
                signals.post_save.disconnect, mocked_handler, sender=CardFamily
            )
            self.family1.save()
            self.assertTrue(mocked_handler.called)
            self.assertEqual(mocked_handler.call_count, 1)


class HelpfulLinkTestCase(TestCase):
    """Tests for ``HelpfulLink`` string form and manager filters."""

    def setUp(self):
        self.helpful_link = create_helpful_link()

    def test_str(self):
        link = self.helpful_link
        self.assertEqual(link.title, str(link))

    def test_queryset(self):
        # The link made in setUp is counted by related_links().
        related_total = HelpfulLink.objects.related_links().count()
        self.assertEqual(related_total, 1)

        # Add one completed-transcription link and count that kind.
        completed_type = HelpfulLink.HelpfulLinkType.COMPLETED_TRANSCRIPTION_LINK
        create_helpful_link(link_type=completed_type)
        completed_total = HelpfulLink.objects.completed_transcription_links().count()
        self.assertEqual(completed_total, 1)


class ConcordiaFileTestCase(TestCase):
    """Tests for ``ConcordiaFile`` string form, deletion and upload paths."""

    def setUp(self):
        self.concordia_file = create_concordia_file()

    def _delete_called(self, concordia_file, *, file_exists):
        """Delete ``concordia_file`` with its storage mocked.

        ``file_exists`` is what the mocked ``storage.exists`` reports. Returns
        whether the uploaded file's own ``delete`` was called.
        """
        uploaded = concordia_file.uploaded_file
        with (
            mock.patch.object(uploaded, "delete") as delete_mock,
            mock.patch.object(uploaded, "storage", autospec=True) as storage_mock,
        ):
            storage_mock.exists.return_value = file_exists
            concordia_file.delete()
            return delete_mock.called

    def test_str(self):
        self.assertEqual(self.concordia_file.name, str(self.concordia_file))

    def test_delete(self):
        # Storage reports the file exists: the uploaded file is deleted too.
        self.assertTrue(self._delete_called(self.concordia_file, file_exists=True))

        # Storage reports no such file: the uploaded file is left alone.
        second_file = create_concordia_file()
        self.assertFalse(self._delete_called(second_file, file_exists=False))

    def test_concordia_file_upload_path(self):
        current_year = date.today().year

        # With the file's path still set, the passed filename is not used.
        preset = resource_file_upload_path(self.concordia_file, "SHOULDNTBEUSED.PDF")
        self.assertEqual(preset, "file.pdf")

        # With the path cleared, the result is built from the filename.
        self.concordia_file.path = None
        generated_cases = (
            ("TEST.PDF", f"cm-uploads/resources/{current_year}/test.pdf"),
            ("TEST%%s.PDF", f"cm-uploads/resources/{current_year}/test%s.pdf"),
            ("%%YTEST.PDF", f"cm-uploads/resources/{current_year}/%ytest.pdf"),
        )
        for filename, expected_path in generated_cases:
            generated = resource_file_upload_path(self.concordia_file, filename)
            self.assertEqual(generated, expected_path)


class TagTestCase(TestCase):
    """``str(tag)`` is the tag's value."""

    def test_str(self):
        new_tag = create_tag()
        rendered = str(new_tag)
        self.assertEqual(new_tag.value, rendered)


class UserAssetTagCollectionTestCase(TestCase):
    """``str(collection)`` is "<asset> - <user>"."""

    def test_str(self):
        collection = create_tag_collection()
        expected = f"{collection.asset} - {collection.user}"
        self.assertEqual(expected, str(collection))


class BannerTestCase(TestCase):
    """Tests for ``Banner`` string form and its CSS class helpers."""

    def setUp(self):
        self.banner = create_banner()

    def test_str(self):
        expected = f"Banner: {self.banner.slug}"
        self.assertEqual(expected, str(self.banner))

    def test_alert_class(self):
        # The class is "alert-" plus the lower-cased alert status.
        status_suffix = self.banner.alert_status.lower()
        self.assertEqual(self.banner.alert_class(), f"alert-{status_suffix}")

    def test_btn_class(self):
        # The class is "btn-" plus the lower-cased alert status.
        status_suffix = self.banner.alert_status.lower()
        self.assertEqual(self.banner.btn_class(), f"btn-{status_suffix}")


class CarouselSlideTestCase(TestCase):
    """``str(slide)`` is "CarouselSlide: <headline>"."""

    def test_str(self):
        new_slide = create_carousel_slide()
        expected = f"CarouselSlide: {new_slide.headline}"
        self.assertEqual(expected, str(new_slide))


class CampaignRetirementProgressTestCase(TestCase):
    """``str(progress)`` is "Removal progress for <campaign>"."""

    def test_str(self):
        retirement = create_campaign_retirement_progress()
        expected = f"Removal progress for {retirement.campaign}"
        self.assertEqual(expected, str(retirement))


class GuideTestCase(TestCase):
    """``str(guide)`` is the guide's title."""

    def test_str(self):
        new_guide = create_guide()
        rendered = str(new_guide)
        self.assertEqual(new_guide.title, rendered)


class SimplePageTestCase(TestCase):
    """``str(page)`` is "SimplePage: <path>"."""

    def test_str(self):
        page = create_simple_page()
        expected = f"SimplePage: {page.path}"
        self.assertEqual(expected, str(page))


class ValidatedGetOrCreateTestCase(TestCase):
    """``validated_get_or_create`` creates once, then returns the same row."""

    def test_validated_get_or_create(self):
        lookup = dict(title="Test Campaign", slug="test-campaign")

        # First call: nothing matches yet, so the campaign is created.
        _, was_created = validated_get_or_create(Campaign, **lookup)
        self.assertTrue(was_created)

        # Second call with identical arguments: the existing row comes back.
        existing, was_created = validated_get_or_create(Campaign, **lookup)
        self.assertFalse(was_created)
        self.assertEqual(existing.title, lookup["title"])


class NextAssetModelTests(TestCase):
    """Tests for the four "next asset" cache models and their managers."""

    def setUp(self):
        self.asset = create_asset()
        self.topic = create_topic(project=self.asset.item.project)
        self.campaign = self.asset.campaign
        self.project = self.asset.item.project

    def _asset_fields(self, **extra):
        """Return the keyword arguments every next-asset row is created with.

        ``extra`` carries the series key: ``campaign=...`` or ``topic=...``.
        """
        fields = {
            "asset": self.asset,
            "item": self.asset.item,
            "item_item_id": self.asset.item.item_id,
            "project": self.project,
            "project_slug": self.project.slug,
            "sequence": self.asset.sequence,
        }
        fields.update(extra)
        return fields

    def test_create_next_transcribable_campaign_asset(self):
        obj = NextTranscribableCampaignAsset.objects.create(
            **self._asset_fields(campaign=self.campaign)
        )
        self.assertEqual(str(obj), self.asset.title)
        self.assertEqual(obj.transcription_status, "not_started")

    def test_create_next_reviewable_campaign_asset(self):
        obj = NextReviewableCampaignAsset.objects.create(
            **self._asset_fields(campaign=self.campaign)
        )
        self.assertEqual(str(obj), self.asset.title)
        self.assertEqual(obj.transcriber_ids, [])

    def test_create_next_transcribable_topic_asset(self):
        obj = NextTranscribableTopicAsset.objects.create(
            **self._asset_fields(topic=self.topic)
        )
        self.assertEqual(obj.transcription_status, "not_started")

    def test_create_next_reviewable_topic_asset(self):
        obj = NextReviewableTopicAsset.objects.create(
            **self._asset_fields(topic=self.topic)
        )
        self.assertEqual(obj.transcriber_ids, [])

    def test_needed_for_campaign_respects_target_count(self):
        manager = NextTranscribableCampaignAsset.objects
        current_needed = manager.needed_for_campaign(self.campaign.id)
        # NOTE: the setting name is spelled this way in the project settings.
        self.assertEqual(current_needed, settings.NEXT_TRANSCRIBABE_ASSET_COUNT)

        # Add one and check count again
        manager.create(**self._asset_fields(campaign=self.campaign))
        new_needed = manager.needed_for_campaign(self.campaign.id)
        self.assertEqual(new_needed, settings.NEXT_TRANSCRIBABE_ASSET_COUNT - 1)

    def test_needed_for_topic_respects_target_count(self):
        manager = NextReviewableTopicAsset.objects
        current_needed = manager.needed_for_topic(self.topic.id)
        self.assertEqual(current_needed, settings.NEXT_REVIEWABLE_ASSET_COUNT)

        manager.create(**self._asset_fields(topic=self.topic))
        new_needed = manager.needed_for_topic(self.topic.id)
        self.assertEqual(new_needed, settings.NEXT_REVIEWABLE_ASSET_COUNT - 1)

    def test_needed_for_campaign_raises_without_target(self):
        from django.db import models

        from concordia.models import NextCampaignAssetManager

        class DummyManager(NextCampaignAssetManager):
            target_count = None

        # The model name is unique to this test: declaring two models with
        # the same name under one app_label would re-register that model.
        class TargetlessCampaignDummyModel(models.Model):
            campaign = models.ForeignKey("concordia.Campaign", on_delete=models.CASCADE)
            objects = DummyManager()

            class Meta:
                app_label = "concordia"

        with self.assertRaises(NotImplementedError):
            TargetlessCampaignDummyModel.objects.needed_for_campaign(self.campaign.id)

    def test_needed_for_topic_raises_without_target(self):
        from django.db import models

        from concordia.models import NextTopicAssetManager

        class DummyManager(NextTopicAssetManager):
            target_count = None

        # The model name is unique to this test: declaring two models with
        # the same name under one app_label would re-register that model.
        class TargetlessTopicDummyModel(models.Model):
            topic = models.ForeignKey("concordia.Topic", on_delete=models.CASCADE)
            objects = DummyManager()

            class Meta:
                app_label = "concordia"

        with self.assertRaises(NotImplementedError):
            TargetlessTopicDummyModel.objects.needed_for_topic(self.topic.id)

    def test_needed_for_campaign_with_explicit_target_count(self):
        manager = NextTranscribableCampaignAsset.objects
        # Should return full count when no assets exist yet
        needed = manager.needed_for_campaign(self.campaign.id, target_count=10)
        self.assertEqual(needed, 10)

        # Add one asset
        manager.create(**self._asset_fields(campaign=self.campaign))

        needed = manager.needed_for_campaign(self.campaign.id, target_count=10)
        self.assertEqual(needed, 9)

    def test_needed_for_topic_with_explicit_target_count(self):
        manager = NextReviewableTopicAsset.objects
        needed = manager.needed_for_topic(self.topic.id, target_count=5)
        self.assertEqual(needed, 5)

        manager.create(**self._asset_fields(topic=self.topic))

        needed = manager.needed_for_topic(self.topic.id, target_count=5)
        self.assertEqual(needed, 4)


class SiteReportAndManagerTestCase(TestCase):
    """Tests for ``SiteReport`` helpers and the series queries on its manager."""

    def _aware(self, y, m, d, hh=12, mm=0, ss=0):
        """Return the given wall-clock time as an aware datetime in the
        current timezone; the time of day defaults to noon."""
        naive = datetime(y, m, d, hh, mm, ss)
        return timezone.make_aware(naive, timezone.get_current_timezone())

    def _stamp(self, report, when):
        """Set ``created_on`` for ``report`` directly in the database.

        Only the row is updated; the in-memory ``report`` is not refreshed.
        """
        SiteReport.objects.filter(pk=report.pk).update(created_on=when)

    def _mk_sr(
        self,
        *,
        dt,
        report_name=None,
        campaign=None,
        topic=None,
        **kwargs,
    ):
        """Create a ``SiteReport``, force ``created_on`` to ``dt`` and return
        a freshly loaded instance."""
        created = SiteReport.objects.create(
            report_name=report_name or "",
            campaign=campaign,
            topic=topic,
            **kwargs,
        )
        # created_on is overwritten so ordering in the tests is deterministic.
        self._stamp(created, dt)
        return SiteReport.objects.get(pk=created.pk)

    def test_calculate_assets_started(self):
        # Columns: previous total, previous not-started, current total,
        # current not-started, expected result.
        cases = (
            # Ordinary growth between two snapshots.
            (100, 100, 107, 92, 15),
            # Missing previous values.
            (None, None, 200, 190, 10),
            # A decrease never produces a negative result.
            (107, 92, 100, 90, 0),
        )
        for prev_total, prev_idle, cur_total, cur_idle, expected in cases:
            started = SiteReport.calculate_assets_started(
                previous_assets_total=prev_total,
                previous_assets_not_started=prev_idle,
                current_assets_total=cur_total,
                current_assets_not_started=cur_idle,
            )
            self.assertEqual(started, expected)

    def test_series_navigation_and_sums(self):
        total_series = SiteReport.ReportName.TOTAL

        # Three site-wide TOTAL snapshots on 10, 20 and 31 January 2024.
        r1, r2, r3 = (
            self._mk_sr(
                dt=self._aware(2024, 1, day),
                report_name=total_series,
                assets_started=started,
            )
            for day, started in ((10, 3), (20, 7), (31, 10))
        )

        # Latest snapshot strictly before 25 January is the one from the 20th.
        prev = SiteReport.objects.previous_in_series(
            report_name=total_series,
            before=self._aware(2024, 1, 25),
        )
        self.assertEqual(prev.pk, r2.pk)

        # last_on_or_before_date_for_series
        last = SiteReport.objects.last_on_or_before_date_for_series(
            report_name=total_series,
            on_or_before_date=date(2024, 1, 31),
        )
        self.assertEqual(last.pk, r3.pk)

        # Only the snapshot from the 20th lies inside 15-29 January.
        first = SiteReport.objects.first_on_or_after_date_for_series(
            report_name=total_series,
            on_or_after_date=date(2024, 1, 15),
            on_or_before_date=date(2024, 1, 29),
        )
        self.assertEqual(first.pk, r2.pk)

        # Instance-level navigation from the middle snapshot.
        self.assertEqual(r2.previous_in_series().pk, r1.pk)
        self.assertEqual(r2.next_in_series().pk, r3.pk)

        summed = SiteReport.objects.sum_assets_started_for_series_between_dates(
            report_name=total_series,
            start_date=date(2024, 1, 1),
            end_date=date(2024, 1, 31),
        )
        self.assertEqual(summed, 3 + 7 + 10)

    def test_per_campaign_and_topic_series_filters(self):
        camp = Campaign.objects.create(title="C1", slug="c1")

        # Two consecutive snapshots in the same per-campaign series.
        older = self._mk_sr(dt=self._aware(2023, 12, 1), campaign=camp, assets_total=1)
        newer = self._mk_sr(dt=self._aware(2023, 12, 2), campaign=camp, assets_total=2)

        before_newer = SiteReport.objects.previous_for_instance(newer)
        after_older = SiteReport.objects.next_for_instance(older)
        self.assertEqual(before_newer.pk, older.pk)
        self.assertEqual(after_older.pk, newer.pk)

        # Unspecified series (fallback), ensure no crash and no result
        self.assertIsNone(SiteReport.objects.previous_in_series())

    def test__series_filter_campaign_branch(self):
        camp = Campaign.objects.create(title="C", slug="c")

        # Two rows in the same per-campaign series, one day apart.
        s1 = SiteReport.objects.create(campaign=camp, assets_total=1)
        s2 = SiteReport.objects.create(campaign=camp, assets_total=2)
        self._stamp(s1, self._aware(2024, 1, 1))
        self._stamp(s2, self._aware(2024, 1, 2))

        prev = SiteReport.objects.previous_in_series(
            campaign=camp, before=self._aware(2024, 1, 3)
        )
        self.assertEqual(prev.pk, s2.pk)

        # The last_on_or_before path with the same campaign filter.
        last = SiteReport.objects.last_on_or_before_date_for_series(
            campaign=camp, on_or_before_date=date(2024, 1, 2)
        )
        self.assertEqual(last.pk, s2.pk)

    def test__series_filter_topic_branch(self):
        topic = Topic.objects.create(title="T", slug="t")
        s1 = SiteReport.objects.create(topic=topic, assets_total=1)
        s2 = SiteReport.objects.create(topic=topic, assets_total=2)
        self._stamp(s1, self._aware(2024, 2, 1))
        self._stamp(s2, self._aware(2024, 2, 2))

        first = SiteReport.objects.first_on_or_after_date_for_series(
            topic=topic,
            on_or_after_date=date(2024, 2, 1),
            on_or_before_date=date(2024, 2, 5),
        )
        self.assertEqual(first.pk, s1.pk)

    def test_series_filter_for_instance_topic_branch(self):
        topic = Topic.objects.create(title="T2", slug="t2")
        a = SiteReport.objects.create(topic=topic, assets_total=10)
        b = SiteReport.objects.create(topic=topic, assets_total=20)
        self._stamp(a, self._aware(2024, 3, 1))
        self._stamp(b, self._aware(2024, 3, 2))

        # IMPORTANT: reload both so the instances carry the updated created_on.
        for report in (a, b):
            report.refresh_from_db()

        self.assertEqual(b.previous_in_series().pk, a.pk)
        self.assertEqual(a.next_in_series().pk, b.pk)

    def test_series_filter_for_instance_retired_and_fallback(self):
        # A RETIRED_TOTAL row on its own has no neighbours in its series.
        retired = SiteReport.objects.create(
            report_name=SiteReport.ReportName.RETIRED_TOTAL, assets_total=1
        )
        self.assertIsNone(retired.previous_in_series())
        self.assertIsNone(retired.next_in_series())

        # A row with no report name, campaign or topic has none either.
        blank = SiteReport.objects.create(assets_total=3)  # report_name=""
        self.assertIsNone(blank.previous_in_series())
        self.assertIsNone(blank.next_in_series())

    def test_to_debug_dict_includes_related_fields_and_counters(self):
        camp = Campaign.objects.create(title="CTitle", slug="cslug")
        topic = Topic.objects.create(title="TTitle", slug="tslug")

        sr_campaign = SiteReport.objects.create(
            campaign=camp, assets_total=9, assets_published=3
        )
        sr_topic = SiteReport.objects.create(
            topic=topic, items_published=4, items_unpublished=1
        )

        # Campaign-bound report: related fields plus its counters.
        campaign_debug = sr_campaign.to_debug_dict()
        self.assertIn("campaign", campaign_debug)
        campaign_info = campaign_debug["campaign"]
        self.assertEqual(campaign_info["id"], camp.id)
        self.assertEqual(campaign_info["title"], "CTitle")
        self.assertEqual(campaign_info["slug"], "cslug")
        self.assertIn("counters", campaign_debug)
        self.assertEqual(campaign_debug["counters"]["assets_total"], 9)
        self.assertEqual(campaign_debug["counters"]["assets_published"], 3)

        # Topic-bound report: related fields plus its counters.
        topic_debug = sr_topic.to_debug_dict()
        self.assertIn("topic", topic_debug)
        topic_info = topic_debug["topic"]
        self.assertEqual(topic_info["id"], topic.id)
        self.assertEqual(topic_info["title"], "TTitle")
        self.assertEqual(topic_info["slug"], "tslug")
        self.assertEqual(topic_debug["counters"]["items_published"], 4)
        self.assertEqual(topic_debug["counters"]["items_unpublished"], 1)

    def test_first_on_or_after_with_upper_bound_campaign(self):
        camp = Campaign.objects.create(title="C-Bound", slug="c-bound")
        a = SiteReport.objects.create(campaign=camp)
        b = SiteReport.objects.create(campaign=camp)
        self._stamp(a, self._aware(2024, 5, 1))
        self._stamp(b, self._aware(2024, 5, 2))

        # Lower and upper bound are the same day, so only ``a`` qualifies.
        single_day = date(2024, 5, 1)
        out = SiteReport.objects.first_on_or_after_date_for_series(
            campaign=camp,
            on_or_after_date=single_day,
            on_or_before_date=single_day,
        )
        self.assertEqual(out.pk, a.pk)

    def test_previous_in_series_defaults_to_now(self):
        total_series = SiteReport.ReportName.TOTAL
        r1 = SiteReport.objects.create(report_name=total_series)
        r2 = SiteReport.objects.create(report_name=total_series)
        self._stamp(r1, self._aware(2024, 1, 10))
        self._stamp(r2, self._aware(2024, 1, 20))

        # No ``before`` argument: the later of the two rows is returned.
        out = SiteReport.objects.previous_in_series(report_name=total_series)
        self.assertEqual(out.pk, r2.pk)

    def test_sum_assets_started_treats_null_as_zero(self):
        total_series = SiteReport.ReportName.TOTAL
        r1 = SiteReport.objects.create(report_name=total_series, assets_started=None)
        r2 = SiteReport.objects.create(report_name=total_series, assets_started=None)
        self._stamp(r1, self._aware(2024, 2, 1))
        self._stamp(r2, self._aware(2024, 2, 2))

        total = SiteReport.objects.sum_assets_started_for_series_between_dates(
            report_name=total_series,
            start_date=date(2024, 2, 1),
            end_date=date(2024, 2, 28),
        )
        self.assertEqual(total, 0)

    def test_to_debug_dict_campaign_status_and_topic_loop(self):
        # status is not passed here; the original note says it has a default
        camp = Campaign.objects.create(title="Camp", slug="camp")
        topic = Topic.objects.create(title="Top", slug="top")

        sr_campaign = SiteReport.objects.create(campaign=camp, assets_total=1)
        sr_topic = SiteReport.objects.create(topic=topic, assets_total=2)

        # Campaign entry carries title, slug and status.
        campaign_debug = sr_campaign.to_debug_dict()
        self.assertIn("campaign", campaign_debug)
        self.assertEqual(campaign_debug["campaign"]["title"], "Camp")
        self.assertEqual(campaign_debug["campaign"]["slug"], "camp")
        self.assertIn("status", campaign_debug["campaign"])

        # Topic entry carries title and slug.
        topic_debug = sr_topic.to_debug_dict()
        self.assertIn("topic", topic_debug)
        self.assertEqual(topic_debug["topic"]["title"], "Top")
        self.assertEqual(topic_debug["topic"]["slug"], "top")

    def test_to_debug_json_serializes_and_includes_counters(self):
        camp = Campaign.objects.create(title="CJ", slug="cj")
        sr = SiteReport.objects.create(
            campaign=camp, assets_total=4, assets_published=2
        )

        parsed = json.loads(sr.to_debug_json())

        # basic shape checks
        self.assertIn("created_on", parsed)  # ISO string
        self.assertEqual(parsed["report_name"], "")
        self.assertEqual(parsed["campaign"]["id"], camp.id)

        # counters included and numeric values preserved
        counters = parsed["counters"]
        self.assertEqual(counters["assets_total"], 4)
        self.assertEqual(counters["assets_published"], 2)

    def test_first_on_or_after_without_upper_bound_topic(self):
        # Create two topic reports; a query without an upper bound should
        # still return the earliest report on or after the given date.
        topic = Topic.objects.create(title="UBT", slug="ubt")
        s1 = SiteReport.objects.create(topic=topic)
        s2 = SiteReport.objects.create(topic=topic)
        self._stamp(s1, self._aware(2024, 6, 1))
        self._stamp(s2, self._aware(2024, 6, 2))

        out = SiteReport.objects.first_on_or_after_date_for_series(
            topic=topic,
            on_or_after_date=date(2024, 6, 2),
            # no on_or_before_date here on purpose
        )
        self.assertEqual(out.pk, s2.pk)

    def test_to_debug_dict_skips_none_campaign_attrs(self):
        # Force the related-object cache to a stub that lacks some attrs
        from types import SimpleNamespace

        camp = Campaign.objects.create(title="C", slug="c")
        sr = SiteReport.objects.create(campaign=camp, assets_total=1)

        # With fields_cache populated, sr.campaign yields this stub rather
        # than loading the real campaign.
        sr._state.fields_cache["campaign"] = SimpleNamespace(title="OnlyTitle")
        campaign_info = sr.to_debug_dict().get("campaign")

        self.assertIsNotNone(campaign_info)
        self.assertEqual(campaign_info["id"], camp.id)
        # title is present; slug and status are missing on the stub and so
        # must be left out of the output
        self.assertEqual(campaign_info["title"], "OnlyTitle")
        self.assertNotIn("slug", campaign_info)
        self.assertNotIn("status", campaign_info)

    def test_to_debug_dict_skips_none_topic_attrs(self):
        # Force the related-object cache to a stub that lacks one of the attrs
        from types import SimpleNamespace

        t = Topic.objects.create(title="TT", slug="tt")
        sr = SiteReport.objects.create(topic=t, assets_total=2)

        sr._state.fields_cache["topic"] = SimpleNamespace(slug="only-slug")
        topic_info = sr.to_debug_dict().get("topic")

        self.assertIsNotNone(topic_info)
        self.assertEqual(topic_info["id"], t.id)
        # slug is present; title is missing on the stub and so must be left
        # out of the output
        self.assertEqual(topic_info["slug"], "only-slug")
        self.assertNotIn("title", topic_info)


class KeyMetricsReportTestCase(TestCase):
    def _aware(self, y, m, d, hh=12, mm=0, ss=0):
        # Build a timezone-aware datetime in the current timezone; the time of
        # day defaults to 12:00:00 when not given.
        naive = datetime(y, m, d, hh, mm, ss)
        return timezone.make_aware(naive, timezone.get_current_timezone())

    def _mk_sr(self, dt, report_name, **counters):
        # Create a SiteReport in the given series with the supplied counters,
        # then set created_on to ``dt`` through a queryset update and return a
        # freshly loaded copy of the row.
        created = SiteReport.objects.create(report_name=report_name, **counters)
        pk = created.pk
        SiteReport.objects.filter(pk=pk).update(created_on=dt)
        return SiteReport.objects.get(pk=pk)

    def test_helpers(self):
        # Fiscal year: 1 Oct 2023 and 30 Sep 2024 are both expected in FY2024.
        for day in (date(2023, 10, 1), date(2024, 9, 30)):
            self.assertEqual(KeyMetricsReport.get_fiscal_year_for_date(day), 2024)

        # Fiscal quarter: February is expected in Q2 and October in Q1.
        quarter_cases = (
            (date(2024, 2, 1), 2),
            (date(2024, 10, 1), 1),
        )
        for day, expected_quarter in quarter_cases:
            self.assertEqual(
                KeyMetricsReport.get_fiscal_quarter_for_date(day),
                expected_quarter,
            )

        # Month bounds for a leap-year February run from the 1st to the 29th.
        first_day, last_day = KeyMetricsReport.month_bounds(date(2024, 2, 10))
        self.assertEqual(first_day, date(2024, 2, 1))
        self.assertEqual(last_day, date(2024, 2, 29))

    def test_upsert_month_from_sitereports(self):
        # Cumulative counters are snapshotted on 2023-12-31 (baseline) and on
        # 2024-01-31 (end of month), once for each of the two series.
        baseline_at = self._aware(2023, 12, 31, 9, 0, 0)
        month_end_at = self._aware(2024, 1, 31, 23, 0, 0)
        total = SiteReport.ReportName.TOTAL
        retired = SiteReport.ReportName.RETIRED_TOTAL

        counter_names = (
            "assets_published",
            "assets_completed",
            "users_activated",
            "anonymous_transcriptions",
            "transcriptions_saved",
            "tag_uses",
        )
        # Values are listed in the same order as counter_names.
        cumulative_snapshots = (
            (baseline_at, total, (100, 50, 10, 5, 20, 40)),
            (month_end_at, total, (130, 70, 16, 8, 26, 50)),
            (baseline_at, retired, (10, 5, 1, 2, 3, 4)),
            (month_end_at, retired, (15, 8, 2, 3, 5, 6)),
        )
        for when, series, values in cumulative_snapshots:
            self._mk_sr(when, series, **dict(zip(counter_names, values)))

        # Per-day assets_started inside January: TOTAL 10 + 5, RETIRED 3 + 2,
        # which adds up to 20 across both series.
        daily_started = (
            (10, total, 10),
            (20, total, 5),
            (11, retired, 3),
            (21, retired, 2),
        )
        for day, series, started in daily_started:
            self._mk_sr(self._aware(2024, 1, day), series, assets_started=started)

        report = KeyMetricsReport.upsert_month(year=2024, month=1)
        self.assertIsNotNone(report)
        self.assertEqual(report.fiscal_year, 2024)
        self.assertEqual(report.fiscal_quarter, 2)
        self.assertEqual(report.month, 1)

        # Expected deltas are (TOTAL + RETIRED at end of month) minus
        # (TOTAL + RETIRED at baseline), e.g. (130 + 15) - (100 + 10) = 35.
        expected_deltas = dict(zip(counter_names, (35, 23, 7, 4, 8, 12)))
        for field, value in expected_deltas.items():
            self.assertEqual(getattr(report, field), value)
        self.assertEqual(report.assets_started, 20)

        # Label and CSV filename for the monthly row.
        self.assertIn("FY2024M01", str(report))
        filename = report.csv_filename()
        self.assertTrue(filename.startswith("key_metrics_monthly_fy2024"))

    def test_upsert_quarter_and_fiscal_year_rollups(self):
        # Monthly rows exist for January and February of FY2024 Q2 only.
        # January carries avg_visit_seconds but no crowd_visits; February
        # carries crowd_visits but no avg_visit_seconds.
        january = {
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 1, 31),
            "month": 1,
            "assets_published": 10,
            "assets_started": 2,
            "assets_completed": 3,
            "users_activated": 5,
            "anonymous_transcriptions": 7,
            "transcriptions_saved": 11,
            "tag_uses": 13,
            "crowd_visits": None,
            "avg_visit_seconds": Decimal("10.50"),
        }
        february = {
            "period_start": date(2024, 2, 1),
            "period_end": date(2024, 2, 29),
            "month": 2,
            "assets_published": 20,
            "assets_started": 3,
            "assets_completed": 4,
            "users_activated": 6,
            "anonymous_transcriptions": 8,
            "transcriptions_saved": 12,
            "tag_uses": 14,
            "crowd_visits": 100,
            "avg_visit_seconds": None,
        }
        for month_row in (january, february):
            KeyMetricsReport.objects.create(
                period_type=KeyMetricsReport.PeriodType.MONTHLY,
                fiscal_year=2024,
                fiscal_quarter=2,
                **month_row,
            )

        # Quarter rollup: calculated fields are summed over both months; the
        # manual fields use whichever month supplied a value.
        quarter = KeyMetricsReport.upsert_quarter(fiscal_year=2024, fiscal_quarter=2)
        self.assertIsNotNone(quarter)
        expected_quarter = (
            ("assets_published", 30),
            ("assets_started", 5),
            ("assets_completed", 7),
            ("users_activated", 11),
            ("anonymous_transcriptions", 15),
            ("transcriptions_saved", 23),
            ("tag_uses", 27),
            ("crowd_visits", 100),
            ("avg_visit_seconds", Decimal("10.50")),
        )
        for field, value in expected_quarter:
            self.assertEqual(getattr(quarter, field), value)

        # Fiscal-year rollup: with only these two months stored it matches
        # the January + February figures.
        year = KeyMetricsReport.upsert_fiscal_year(fiscal_year=2024)
        self.assertIsNotNone(year)
        self.assertEqual(year.assets_published, 30)
        self.assertEqual(year.crowd_visits, 100)
        self.assertEqual(year.avg_visit_seconds, Decimal("10.50"))

        # Labels and CSV filenames for both rollups.
        self.assertIn("FY2024 Q2", str(quarter))
        quarter_filename = quarter.csv_filename()
        self.assertTrue(quarter_filename.startswith("key_metrics_quarterly_fy2024"))
        self.assertIn("FY2024 Report", str(year))
        year_filename = year.csv_filename()
        self.assertTrue(year_filename.startswith("key_metrics_fiscal_year_fy2024"))

    def test___str___fallback_when_fields_incomplete(self):
        period = KeyMetricsReport.PeriodType

        # A quarterly row with fiscal_quarter left unset should use the
        # generic label that spells out the period type and both dates.
        quarterly = KeyMetricsReport.objects.create(
            period_type=period.QUARTERLY,
            period_start=date(2024, 4, 1),
            period_end=date(2024, 6, 30),
            fiscal_year=2024,
            fiscal_quarter=None,
        )
        quarterly_label = str(quarterly)
        for fragment in ("KeyMetricsReport QUARTERLY", "2024-04-01", "2024-06-30"):
            self.assertIn(fragment, quarterly_label)

        # A monthly row with month left unset should use the generic label too.
        monthly = KeyMetricsReport.objects.create(
            period_type=period.MONTHLY,
            period_start=date(2024, 5, 1),
            period_end=date(2024, 5, 31),
            fiscal_year=2024,
            month=None,
        )
        self.assertIn("KeyMetricsReport MONTHLY", str(monthly))

    def test_quarter_helper_edges(self):
        # 1 April is expected in fiscal Q3 and 1 July in fiscal Q4.
        edge_cases = (
            (date(2024, 4, 1), 3),
            (date(2024, 7, 1), 4),
        )
        for day, expected_quarter in edge_cases:
            actual = KeyMetricsReport.get_fiscal_quarter_for_date(day)
            self.assertEqual(actual, expected_quarter)

    def test__format_value_for_csv_variants(self):
        report = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
            period_start=date(2023, 10, 1),
            period_end=date(2024, 9, 30),
            fiscal_year=2024,
        )

        # (field name, raw value, expected CSV cell), checked in this order.
        cases = (
            # crowd_visits: None renders as an empty cell
            ("crowd_visits", None, ""),
            # avg_visit_seconds: a Decimal is rendered with two decimals
            ("avg_visit_seconds", Decimal("10"), "10.00"),
            # crowd_visits: a real zero is kept as 0
            ("crowd_visits", 0, 0),
            # assets_started: None renders as 0
            ("assets_started", None, 0),
            # unknown field: None becomes "", anything else passes through
            ("unknown_field", None, ""),
            ("unknown_field", "x", "x"),
        )
        for field, raw, expected_cell in cases:
            self.assertEqual(report._format_value_for_csv(field, raw), expected_cell)

    def test_upsert_month_returns_none_when_no_snapshots(self):
        # No SiteReport rows are created here, so the upsert should yield None.
        self.assertIsNone(KeyMetricsReport.upsert_month(year=2025, month=6))

    def test_upsert_quarter_invalid_quarter_raises(self):
        # A fiscal quarter of 5 is expected to be rejected with ValueError.
        invalid_request = {"fiscal_year": 2024, "fiscal_quarter": 5}
        with self.assertRaises(ValueError):
            KeyMetricsReport.upsert_quarter(**invalid_request)

    def test_quarter_month_specs_all_quarters(self):
        # Covers Q1, Q3 and Q4 of FY2024. Each entry lists the fiscal quarter,
        # its period bounds and the (calendar year, month) pairs expected
        # from _quarter_month_specs().
        cases = (
            (
                1,
                date(2023, 10, 1),
                date(2023, 12, 31),
                [(2023, 10), (2023, 11), (2023, 12)],
            ),
            (
                3,
                date(2024, 4, 1),
                date(2024, 6, 30),
                [(2024, 4), (2024, 5), (2024, 6)],
            ),
            (
                4,
                date(2024, 7, 1),
                date(2024, 9, 30),
                [(2024, 7), (2024, 8), (2024, 9)],
            ),
        )
        for fiscal_quarter, starts_on, ends_on, expected_specs in cases:
            quarter = KeyMetricsReport.objects.create(
                period_type=KeyMetricsReport.PeriodType.QUARTERLY,
                period_start=starts_on,
                period_end=ends_on,
                fiscal_year=2024,
                fiscal_quarter=fiscal_quarter,
            )
            self.assertEqual(quarter._quarter_month_specs(), expected_specs)

    def test_month_bounds_handles_december(self):
        # December bounds should stay inside the same calendar year.
        first_day, last_day = KeyMetricsReport.month_bounds(date(2024, 12, 10))
        self.assertEqual(first_day, date(2024, 12, 1))
        self.assertEqual(last_day, date(2024, 12, 31))

    def test__monthly_from_sitereports_returns_empty_dict_when_no_eom(self):
        # No snapshots exist at all, so the helper should return an empty dict.
        month_start, month_end = date(2030, 5, 1), date(2030, 5, 31)
        computed = KeyMetricsReport._monthly_from_sitereports(
            month_start=month_start,
            month_end=month_end,
        )
        self.assertEqual(computed, {})

    def test__monthly_from_sitereports_baseline_fallback_inside_month(self):
        # Nothing is recorded before 1 March; each series' first snapshot
        # falls inside the month and has to serve as its baseline.
        month_start = date(2024, 3, 1)
        month_end = date(2024, 3, 31)
        total = SiteReport.ReportName.TOTAL
        retired = SiteReport.ReportName.RETIRED_TOTAL

        # (timestamp parts, series, cumulative assets_published)
        snapshots = (
            ((2024, 3, 5, 9, 0, 0), total, 10),
            ((2024, 3, 31, 23, 0, 0), total, 15),
            ((2024, 3, 10, 9, 0, 0), retired, 4),
            ((2024, 3, 31, 23, 0, 0), retired, 7),
        )
        for stamp, series, published in snapshots:
            self._mk_sr(self._aware(*stamp), series, assets_published=published)

        computed = KeyMetricsReport._monthly_from_sitereports(
            month_start=month_start, month_end=month_end
        )
        # Expected delta: (15 + 7) - (10 + 4) = 8
        self.assertEqual(computed["assets_published"], 8)

    def test__monthly_from_sitereports_treats_missing_series_as_zero(self):
        # Only the TOTAL series has snapshots in April; no RETIRED_TOTAL rows
        # are created.
        month_start = date(2024, 4, 1)
        month_end = date(2024, 4, 30)

        # First snapshot inside the month (100), end-of-month snapshot (110).
        for stamp, published in (
            ((2024, 4, 5, 9, 0, 0), 100),
            ((2024, 4, 30, 23, 0, 0), 110),
        ):
            self._mk_sr(
                self._aware(*stamp),
                SiteReport.ReportName.TOTAL,
                assets_published=published,
            )

        computed = KeyMetricsReport._monthly_from_sitereports(
            month_start=month_start, month_end=month_end
        )
        # The absent series is expected to add nothing: 110 - 100 = 10.
        self.assertEqual(computed["assets_published"], 10)

    def test_upsert_quarter_returns_none_when_no_monthlies_all_quarters(self):
        # No monthly rows are created for FY2027 in this test, so every
        # fiscal quarter is expected to produce no quarterly report. Q2 is
        # included so the test covers what its name promises; subTest reports
        # each quarter separately if one of them regresses.
        for fiscal_quarter in (1, 2, 3, 4):
            with self.subTest(fiscal_quarter=fiscal_quarter):
                out = KeyMetricsReport.upsert_quarter(
                    fiscal_year=2027, fiscal_quarter=fiscal_quarter
                )
                self.assertIsNone(out)

    def test_upsert_fiscal_year_returns_none_when_no_monthlies(self):
        # No monthly rows are created for FY2029, so the rollup yields None.
        self.assertIsNone(KeyMetricsReport.upsert_fiscal_year(fiscal_year=2029))

    def test__calendar_year_for_month_in_fy_helper(self):
        # The instance is built in memory only; it is never saved.
        report = KeyMetricsReport(
            period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
            period_start=date(2023, 10, 1),
            period_end=date(2024, 9, 30),
            fiscal_year=2024,
        )
        # (month, fiscal year, expected calendar year): October of FY2024 is
        # expected in calendar 2023, June of FY2024 in calendar 2024.
        for month, fiscal_year, calendar_year in ((10, 2024, 2023), (6, 2024, 2024)):
            self.assertEqual(
                report._calendar_year_for_month_in_fy(month, fiscal_year),
                calendar_year,
            )

    def test_quarter_month_specs_q2(self):
        # FY2024 Q2 should map to January through March of calendar 2024.
        quarter = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 3, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
        )
        expected_specs = [(2024, month) for month in (1, 2, 3)]
        self.assertEqual(quarter._quarter_month_specs(), expected_specs)


class KeyMetricsReportCsvTestCase(TestCase):
    def setUp(self):
        create = KeyMetricsReport.objects.create
        period = KeyMetricsReport.PeriodType

        # Stored fiscal-year row for FY2023 (feeds the lifetime columns).
        self.fy23 = create(
            period_type=period.FISCAL_YEAR,
            period_start=date(2022, 10, 1),
            period_end=date(2023, 9, 30),
            fiscal_year=2023,
            assets_published=50,
            assets_started=5,
            assets_completed=7,
            users_activated=11,
            anonymous_transcriptions=13,
            transcriptions_saved=17,
            tag_uses=19,
            crowd_visits=30,
            avg_visit_seconds=Decimal("9.00"),
        )

        # Stored quarterly row for FY2024 Q1; crowd_visits is left empty.
        self.q1_24 = create(
            period_type=period.QUARTERLY,
            period_start=date(2023, 10, 1),
            period_end=date(2023, 12, 31),
            fiscal_year=2024,
            fiscal_quarter=1,
            assets_published=7,
            assets_started=1,
            assets_completed=2,
            users_activated=3,
            anonymous_transcriptions=4,
            transcriptions_saved=5,
            tag_uses=6,
            crowd_visits=None,
            avg_visit_seconds=Decimal("8.00"),
        )

        # Monthly rows for FY2024 Q2: only January and February exist, and
        # only February has a crowd_visits value.
        q2_month_common = {
            "period_type": period.MONTHLY,
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
        }
        self.jan24 = create(
            period_start=date(2024, 1, 1),
            period_end=date(2024, 1, 31),
            month=1,
            assets_published=10,
            assets_started=2,
            assets_completed=3,
            users_activated=5,
            anonymous_transcriptions=7,
            transcriptions_saved=11,
            tag_uses=13,
            crowd_visits=None,
            **q2_month_common,
        )
        self.feb24 = create(
            period_start=date(2024, 2, 1),
            period_end=date(2024, 2, 29),
            month=2,
            assets_published=20,
            assets_started=3,
            assets_completed=4,
            users_activated=6,
            anonymous_transcriptions=8,
            transcriptions_saved=12,
            tag_uses=14,
            crowd_visits=100,
            **q2_month_common,
        )

        # Roll the monthly rows up into Q2 and FY2024 rows; these must run
        # after the monthly rows above have been stored.
        self.q2_24 = KeyMetricsReport.upsert_quarter(fiscal_year=2024, fiscal_quarter=2)
        self.fy24 = KeyMetricsReport.upsert_fiscal_year(fiscal_year=2024)

    def _csv_as_lines(self, rep: KeyMetricsReport) -> list[list[str]]:
        raw = rep.render_csv().decode("utf-8")
        return [line.split(",") for line in raw.strip().splitlines()]

    def test_monthly_csv_headers_and_values(self):
        # A stand-alone June row is enough to check the monthly header label
        # and a single metric value.
        june = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            period_start=date(2024, 6, 1),
            period_end=date(2024, 6, 30),
            fiscal_year=2024,
            fiscal_quarter=3,
            month=6,
            assets_published=1,
        )
        rows = self._csv_as_lines(june)
        header, body = rows[0], rows[1:]

        # The second header cell is the bare month name.
        self.assertEqual(header[0], "Metric")
        self.assertEqual(header[1], "June")

        # Look up the "Assets published" row by its label.
        labels = [cells[0] for cells in body]
        values = [cells[1] for cells in body]
        published_at = labels.index("Assets published")
        self.assertEqual(int(values[published_at]), 1)

    def test_quarterly_csv_headers_totals_and_lifetime(self):
        rows = self._csv_as_lines(self.q2_24)
        header, body = rows[0], rows[1:]

        # Header: the months that exist (January, February), followed by the
        # quarter totals and lifetime totals columns.
        self.assertEqual(header[0], "Metric")
        expected_columns = (
            "January",
            "February",
            "FY24 Q2 totals",
            "FY24 Lifetime totals",
        )
        for column in expected_columns:
            self.assertIn(column, header)

        labels = [cells[0] for cells in body]

        # Assets published, columns [Jan, Feb, Q2 total, Lifetime]:
        # Jan 10 + Feb 20 = 30 for the quarter; the lifetime cell is expected
        # to be the FY2023 row (50) plus FY2024 Q1 (7) = 57.
        published = body[labels.index("Assets published")]
        for position, expected in enumerate((10, 20, 30, 57), start=1):
            self.assertEqual(int(published[position]), expected)

        # Crowd.loc.gov visits is a manual field: January has no value and is
        # blank, February is 100, so the quarter total is 100. The lifetime
        # cell is expected to be the FY2023 row (30) with nothing from Q1.
        visits = body[labels.index("Crowd.loc.gov visits")]
        self.assertEqual(visits[1], "")
        for position, expected in enumerate((100, 100, 30), start=2):
            self.assertEqual(int(visits[position]), expected)

    def test_fiscal_year_csv_headers_totals_and_lifetime(self):
        # setUp already stored the FY2023 and FY2024 fiscal-year rows.
        rows = self._csv_as_lines(self.fy24)
        header, body = rows[0], rows[1:]

        # Header layout: Metric, one totals column per quarter that exists
        # (Q1 and Q2 here), then the year totals and lifetime totals columns.
        q1_column = "FY24 Q1 totals"
        q2_column = "Q2 totals"
        year_column = "FY24 totals"
        lifetime_column = "FY24 Lifetime totals"
        self.assertEqual(header[0], "Metric")
        for column in (q1_column, q2_column, year_column, lifetime_column):
            self.assertIn(column, header)

        labels = [cells[0] for cells in body]
        published = body[labels.index("Assets published")]

        # Q1 was stored with 7 and Q2 rolls up to 30 (Jan + Feb), giving a
        # year total of 37. The lifetime expectation is taken from the stored
        # FY2023 and FY2024 rows rather than hard-coded. Columns are located
        # by header text because absent quarters have no column.
        expected_lifetime = self.fy23.assets_published + self.fy24.assets_published
        expected_cells = (
            (q1_column, 7),
            (q2_column, 30),
            (year_column, 37),
            (lifetime_column, expected_lifetime),
        )
        for column, expected in expected_cells:
            self.assertEqual(int(published[header.index(column)]), expected)

    def test_str_formats(self):
        # October of FY2024 falls in calendar 2023; the label should show the
        # fiscal code together with the calendar month and year.
        october = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            period_start=date(2023, 10, 1),
            period_end=date(2023, 10, 31),
            fiscal_year=2024,
            fiscal_quarter=1,
            month=10,
        )
        label = str(october)
        for fragment in ("FY2024M10", "(October 2023)"):
            self.assertIn(fragment, label)

    def test_quarterly_csv_when_no_monthlies_and_no_priors(self):
        # A stand-alone FY2020 Q1 row: no monthly rows fall inside the
        # quarter, and every row created in setUp belongs to a later fiscal
        # year.
        q = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY,
            period_start=date(2019, 10, 1),
            period_end=date(2019, 12, 31),
            fiscal_year=2020,
            fiscal_quarter=1,
        )
        lines = self._csv_as_lines(q)
        header = lines[0]

        # Header should be exactly:
        # Metric | FY20 Q1 totals | FY20 Lifetime totals
        # (no month columns, because no monthly rows exist).
        self.assertEqual(header[0], "Metric")
        self.assertIn("FY20 Q1 totals", header)
        self.assertIn("FY20 Lifetime totals", header)
        self.assertEqual(len(header), 3)

        labels = [r[0] for r in lines[1:]]
        # Calculated field: both totals are numeric zeros
        ap_i = labels.index("Assets published")
        ap_row = lines[1 + ap_i]
        self.assertEqual(int(ap_row[1]), 0)  # quarter total
        self.assertEqual(int(ap_row[2]), 0)  # lifetime total

        # Manual field: totals should be blank when no values
        cv_i = labels.index("Crowd.loc.gov visits")
        cv_row = lines[1 + cv_i]
        self.assertEqual(cv_row[1], "")  # quarter total blank
        self.assertEqual(cv_row[2], "")  # lifetime total blank

    def test_fiscal_year_csv_headers_when_q1_missing(self):
        # FY2026 gets a fiscal-year row plus quarterly rows for Q2 and Q4
        # only; Q1 and Q3 are never created.
        create = KeyMetricsReport.objects.create
        period = KeyMetricsReport.PeriodType
        fiscal_year_row = create(
            period_type=period.FISCAL_YEAR,
            period_start=date(2025, 10, 1),
            period_end=date(2026, 9, 30),
            fiscal_year=2026,
        )
        present_quarters = (
            (2, date(2026, 1, 1), date(2026, 3, 31), 12),
            (4, date(2026, 7, 1), date(2026, 9, 30), 8),
        )
        for fiscal_quarter, starts_on, ends_on, published in present_quarters:
            create(
                period_type=period.QUARTERLY,
                period_start=starts_on,
                period_end=ends_on,
                fiscal_year=2026,
                fiscal_quarter=fiscal_quarter,
                assets_published=published,
            )

        rows = self._csv_as_lines(fiscal_year_row)
        header, body = rows[0], rows[1:]

        # Only the quarters that exist should get a totals column.
        self.assertEqual(header[0], "Metric")
        self.assertNotIn("FY26 Q1 totals", header)
        self.assertIn("Q2 totals", header)
        self.assertNotIn("Q3 totals", header)
        self.assertIn("Q4 totals", header)
        self.assertIn("FY26 totals", header)
        self.assertIn("FY26 Lifetime totals", header)

        labels = [cells[0] for cells in body]
        published_row = body[labels.index("Assets published")]

        q2_at = header.index("Q2 totals")
        q4_at = header.index("Q4 totals")
        year_at = header.index("FY26 totals")
        lifetime_at = header.index("FY26 Lifetime totals")

        # Year total is Q2 (12) + Q4 (8) = 20.
        self.assertEqual(int(published_row[q2_at]), 12)
        self.assertEqual(int(published_row[q4_at]), 8)
        self.assertEqual(int(published_row[year_at]), 20)

        # Lifetime covers the fiscal-year rows up to FY2026: FY2023, FY2024
        # and FY2026, the last of which was stored without a value here.
        fy26_stored = 0
        expected_lifetime = (
            self.fy23.assets_published + self.fy24.assets_published + fy26_stored
        )
        self.assertEqual(int(published_row[lifetime_at]), expected_lifetime)

    def test_format_value_for_csv_non_decimal_avg(self):
        # A float (not a Decimal) avg_visit_seconds is expected to come back
        # as its plain string form.
        report = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
            period_start=date(2025, 10, 1),
            period_end=date(2026, 9, 30),
            fiscal_year=2026,
        )
        formatted = report._format_value_for_csv("avg_visit_seconds", 12.3)
        self.assertEqual(formatted, "12.3")


================================================
FILE: concordia/tests/test_parser.py
================================================
from types import SimpleNamespace
from unittest import mock

import requests
from django.test import TestCase
from requests.models import Response

import concordia.parser as parser_mod
from concordia.parser import extract_og_image, fetch_blog_posts, paginate_blog_posts

# Title and link of the first feed item; interpolated into RSS below.
TITLE = "What’s New Online at the Library of Congress: May 2025"
LINK = "https://blogs.loc.gov/thesignal/2025/05/new-loc-may-2025/"

# Two-item RSS fixture: the first item has a title and a link, the second
# item has a title but no <link> element.
RSS = f"""<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0">
  <channel>
    <title>The Signal</title>
    <item>
      <title>{TITLE}</title>
      <link>{LINK}</link>
      <description><![CDATA[Interested in learning more about what’...]]></description>
    </item>
    <item>
      <title>Volunteers Leverage OCR to Transcribe Library of Congress Digit...</title>
      <description>
        <![CDATA[Today’s guest post is from Lauren Algee, a Senior Digital Collec...]]>
      </description>
    </item>
  </channel>
</rss>"""

# Image URL advertised through the og:image meta tag of the HTML fixture.
IMAGE = "https://blogs.loc.gov/thesignal/files/2025/05/loc-2017698702.png"
HTML = f"""<html>
  <head>
    <meta property="og:image" content="{IMAGE}"/>
  </head>
  <body></body>
</html>"""


class ParserTestCase(TestCase):
    @mock.patch("requests.get")
    def test_extract_og_image(self, mock_urlopen):
        # requests.get is stubbed to hand back the HTML fixture, whose
        # og:image meta tag points at IMAGE.
        mock_urlopen.return_value = mock.MagicMock(
            spec=Response,
            text=HTML,
            headers={"Content-Type": "text/html"},
        )

        self.assertEqual(extract_og_image("https://example.com/post1"), IMAGE)

    @mock.patch("concordia.parser.extract_og_image")
    @mock.patch("requests.get")
    def test_paginate_blog_posts(self, mock_urlopen, mock_extract_og_image):
        # requests.get returns the two-item RSS fixture with a 200 status and
        # the og:image lookup is stubbed to always yield IMAGE.
        mock_urlopen.return_value = mock.MagicMock(
            spec=Response,
            content=RSS,
            status_code=200,
        )
        mock_extract_og_image.return_value = IMAGE

        pages = paginate_blog_posts()

        # Both items are expected on a single page.
        self.assertEqual(len(pages), 1)
        first_page = pages[0]
        self.assertEqual(len(first_page), 2)

        first_item = first_page[0]
        expected_fields = (("title", TITLE), ("link", LINK), ("og_image", IMAGE))
        for key, expected in expected_fields:
            self.assertEqual(first_item[key], expected)

    @mock.patch("concordia.parser.structured_logger.warning")
    @mock.patch("concordia.parser.requests.get")
    def test_get_http_error(self, mock_get, mock_logger):
        # The response's raise_for_status() raises HTTPError; the fetch
        # should return an empty list and log a warning.
        http_error = requests.exceptions.HTTPError("500 Server Error")
        failing_response = mock.Mock()
        failing_response.raise_for_status.side_effect = http_error
        mock_get.return_value = failing_response

        self.assertEqual(fetch_blog_posts(), [])
        mock_logger.assert_called()

    @mock.patch("concordia.parser.structured_logger.warning")
    @mock.patch("concordia.parser.requests.get")
    def test_get_exception_timeout(self, mock_get, mock_logger):
        # requests.get itself raises Timeout; the fetch should return an
        # empty list and log a warning.
        timeout = requests.exceptions.Timeout()
        mock_get.side_effect = timeout

        posts = fetch_blog_posts()

        self.assertEqual(posts, [])
        mock_logger.assert_called()

    @mock.patch("concordia.parser.structured_logger.warning")
    @mock.patch("concordia.parser.requests.get")
    def test_get_connection_error(self, mock_get, mock_logger):
        # requests.get raises ConnectionError; the fetch should return an
        # empty list and log a warning.
        connection_error = requests.exceptions.ConnectionError()
        mock_get.side_effect = connection_error

        posts = fetch_blog_posts()

        self.assertEqual(posts, [])
        mock_logger.assert_called()

    @mock.patch("concordia.parser.structured_logger.warning")
    @mock.patch("concordia.parser.requests.get")
    def test_get_request_exception(self, mock_get, mock_logger):
        # A bare RequestException should yield an empty list and a warning
        # whose reason_code keyword is "blog_req_error".
        mock_get.side_effect = requests.exceptions.RequestException()

        posts = fetch_blog_posts()

        self.assertEqual(posts, [])
        mock_logger.assert_called()
        logged_kwargs = mock_logger.call_args.kwargs
        self.assertEqual("blog_req_error", logged_kwargs["reason_code"])

    def test_ogimageparser_parses_meta_and_sets_og_image(self):
        # The document carries an og:title and an og:image meta tag; only the
        # og:image content should end up on parser.og_image.
        markup = (
            "<html><head>"
            '<meta property="og:title" content="ignored"/>'
            '<meta property="og:image" content="http://ex.com/img.png?x=Tom&amp;Jerry"/>'
            "</head><body></body></html>"
        )
        # The "&amp;" in the fixture is turned into a bare "&" before feeding.
        unescaped_markup = markup.replace("&amp;", "&")

        og_parser = parser_mod.OGImageParser()
        og_parser.feed(unescaped_markup)

        self.assertEqual(og_parser.og_image, "http://ex.com/img.png?x=Tom&Jerry")

    @mock.patch.object(parser_mod.structured_logger, "warning")
    @mock.patch.object(parser_mod.requests, "get")
    def test_extract_og_image_request_exception_logs_and_returns_none(
        self, requests_get_mock, logger_warning_mock
    ):
        # When the HTTP fetch raises RequestException the extractor should
        # return None and log a warning with reason_code "ogi_req_fail_fetch".
        requests_get_mock.side_effect = parser_mod.requests.RequestException

        self.assertIsNone(parser_mod.extract_og_image("http://ex.com/bad"))

        logged_kwargs = logger_warning_mock.call_args.kwargs
        self.assertEqual(logged_kwargs.get("reason_code"), "ogi_req_fail_fetch")

    @mock.patch.object(parser_mod, "extract_og_image", return_value="fetched.png")
    @mock.patch.object(parser_mod, "cache")
    def test_get_og_image_calls_extract_on_cache_miss(
        self, cache_mock, extract_og_image_mock
    ):
        # cache.get returns None (a miss), so the image has to come from
        # extract_og_image, called exactly once with the post URL.
        post_url = "http://ex.com/post2"
        cache_mock.get.return_value = None

        self.assertEqual(parser_mod.get_og_image(post_url), "fetched.png")
        extract_og_image_mock.assert_called_once_with(post_url)

    @mock.patch.object(parser_mod, "extract_og_image")
    @mock.patch.object(parser_mod, "cache")
    def test_get_og_image_uses_cache_when_present(
        self, cache_mock, extract_og_image_mock
    ):
        # cache.get returns a value, so it should be returned as-is and
        # extract_og_image must not be called.
        cache_mock.get.return_value = "cached.png"

        self.assertEqual(parser_mod.get_og_image("http://ex.com/post"), "cached.png")
        extract_og_image_mock.assert_not_called()

    def _make_item_element(self, title, link):
        # Build a minimal stand-in for a feed item: an object whose
        # find("title") / find("link") return objects with a ``text``
        # attribute, and whose find() returns None for any other tag.
        def find(tag):
            if tag == "title":
                text = title
            elif tag == "link":
                text = link
            else:
                return None
            return SimpleNamespace(text=text)

        return SimpleNamespace(find=find)

    @mock.patch.object(parser_mod, "get_og_image")
    @mock.patch.object(parser_mod, "fetch_blog_posts")
    def test_paginate_blog_posts_segments_and_includes_og_images(
        self, fetch_blog_posts_mock, get_og_image_mock
    ):
        # Six fake feed items are supplied; the og image lookup resolves for
        # posts 1-4 and returns None for posts 5 and 6.
        def image_for(url):
            post_number = int(url.rsplit("/", 1)[-1])
            if post_number > 4:
                return None
            return f"http://img/{post_number}.png"

        fetch_blog_posts_mock.return_value = [
            self._make_item_element(f"T{number}", f"http://ex.com/{number}")
            for number in range(1, 7)
        ]
        get_og_image_mock.side_effect = image_for

        pages = paginate_blog_posts()

        # Two pages of three items each are expected.
        self.assertEqual(len(pages), 2)
        for page_index in (0, 1):
            self.assertEqual(len(pages[page_index]), 3)

        # The first item has an image.
        opening_item = pages[0][0]
        self.assertEqual(opening_item["title"], "T1")
        self.assertEqual(opening_item["link"], "http://ex.com/1")
        self.assertEqual(opening_item["og_image"], "http://img/1.png")

        # The last item had no image, so the og_image key is left out.
        closing_item = pages[1][2]
        self.assertEqual(closing_item["title"], "T6")
        self.assertEqual(closing_item["link"], "http://ex.com/6")
        self.assertNotIn("og_image", closing_item)

    @mock.patch.object(parser_mod, "fetch_blog_posts", return_value=[])
    def test_paginate_blog_posts_with_no_items_returns_single_empty_segment(
        self, fetch_blog_posts_mock
    ):
        # With no feed items the result should be one page that is empty.
        self.assertEqual(paginate_blog_posts(), [[]])


================================================
FILE: concordia/tests/test_registration_views.py
================================================
"""
Tests for user registration-related views
"""

from logging import getLogger
from unittest import mock

from django.contrib.auth import get_user_model
from django.contrib.auth.tokens import default_token_generator
from django.core import mail
from django.test import TestCase, override_settings, tag
from django.urls import reverse
from django.utils.encoding import force_bytes
from django.utils.http import urlsafe_base64_encode

from .utils import CacheControlAssertions, CreateTestUsers, JSONAssertMixin

# Active user model; the tests below re-fetch users through it after a reset.
User = get_user_model()


logger = getLogger(__name__)


# URL token and session key the reset tests use when posting straight to the
# "password_reset_confirm" view.
# NOTE(review): these look like copies of the values Django's
# PasswordResetConfirmView uses internally - confirm they still match the
# installed Django version.
INTERNAL_RESET_URL_TOKEN = "set-password"  # nosec
INTERNAL_RESET_SESSION_TOKEN = "_password_reset_token"  # nosec


@override_settings(RATELIMIT_ENABLE=False)
@tag("registration")
class ConcordiaViewTests(
    JSONAssertMixin, CacheControlAssertions, TestCase, CreateTestUsers
):
    """Login and password-reset flows for inactive and active accounts."""

    def _confirm_password_reset(self, user):
        # Perform the last step of the reset flow for ``user``: store a freshly
        # generated reset token in the test client's session, then POST a new
        # password to the confirmation URL. Returns the response to that POST.
        new_password = "ASdf12&&"
        form_data = {"new_password1": new_password, "new_password2": new_password}
        reset_token = default_token_generator.make_token(user)
        encoded_pk = urlsafe_base64_encode(force_bytes(user.pk))

        client_session = self.client.session
        client_session[INTERNAL_RESET_SESSION_TOKEN] = reset_token
        client_session.save()

        confirm_url = reverse(
            "password_reset_confirm",
            kwargs={"uidb64": encoded_pk, "token": INTERNAL_RESET_URL_TOKEN},
        )
        return self.client.post(confirm_url, form_data)

    def _assert_reset_completed(self, response):
        # A successful reset redirects to the "done" page and must not be cached.
        self.assertRedirects(response, "/account/reset/done/")
        self.assertUncacheable(response)

    def test_send_activation_email_on_inactive_login(self):
        self.user = self.create_inactive_user("tester")
        credentials = {
            "username": self.user.username,
            "password": self.user._password,
        }

        login_response = self.client.post(reverse("registration_login"), credentials)

        # The login page explains the problem and one email goes out.
        self.assertContains(
            login_response, "This account has not yet been activated."
        )
        self.assertEqual(len(mail.outbox), 1)

    def test_inactive_user_can_password_reset(self):
        self.user = self.create_inactive_user("tester")
        reset_url = reverse("password_reset")

        self.client.post(reset_url, {"email": self.user.email})

        self.assertEqual(len(mail.outbox), 1)

    @mock.patch("concordia.forms.user_activated.send")
    def test_password_reset_will_activate_user(self, signal_mock):
        self.user = self.create_inactive_user("tester2")

        confirm_response = self._confirm_password_reset(self.user)
        self._assert_reset_completed(confirm_response)

        # Completing the reset activates the previously inactive account ...
        refreshed_user = User.objects.get(pk=self.user.pk)
        self.assertEqual(refreshed_user.is_active, True)

        # ... and the activation signal is sent for it.
        self.assertTrue(signal_mock.called)

    @mock.patch("concordia.forms.user_activated.send")
    def test_password_reset_with_activate_user(self, signal_mock):
        self.user = self.create_user("tester")

        confirm_response = self._confirm_password_reset(self.user)
        self._assert_reset_completed(confirm_response)

        # An already active account simply stays active ...
        refreshed_user = User.objects.get(pk=self.user.pk)
        self.assertEqual(refreshed_user.is_active, True)

        # ... and no activation signal is sent.
        self.assertFalse(signal_mock.called)


================================================
FILE: concordia/tests/test_s3.py
================================================
import os
from unittest.mock import MagicMock, patch

from django.core.files.base import ContentFile
from django.test import TestCase, override_settings

from .utils import create_asset


class S3StorageAPITest(TestCase):
    """Saves a file through the S3 asset storage with the HTTP layer mocked."""

    # Environment applied both by the decorator and inside the test body.
    # Static credentials make botocore use the "env" provider; the last two
    # switches keep it away from shared config/profile resolution and IMDS.
    _AWS_TEST_ENV = {
        "AWS_ACCESS_KEY_ID": "test",
        "AWS_SECRET_ACCESS_KEY": "test",
        "AWS_SESSION_TOKEN": "test",
        "AWS_DEFAULT_REGION": "us-east-1",
        "AWS_SDK_LOAD_CONFIG": "0",
        "AWS_EC2_METADATA_DISABLED": "true",
    }

    @staticmethod
    def _forget_asset_storage():
        # Drop whatever backend ASSET_STORAGE currently wraps and hand the lazy
        # object back. Imported here rather than at module level so it is not
        # evaluated before a test has overridden the storage settings.
        from concordia.storage import ASSET_STORAGE

        ASSET_STORAGE._wrapped = None
        return ASSET_STORAGE

    def setUp(self):
        super().setUp()
        # Make sure the storage is evaluated again under the new settings.
        self._forget_asset_storage()

    def tearDown(self):
        # Rebuild the storage so later tests do not inherit the overridden
        # settings.
        self._forget_asset_storage()._setup()
        super().tearDown()

    @override_settings(
        STORAGES={
            "default": {
                "BACKEND": "storages.backends.s3boto3.S3Boto3Storage",
            },
            "assets": {
                "BACKEND": "storages.backends.s3boto3.S3Boto3Storage",
                "OPTIONS": {
                    "querystring_auth": False,
                },
            },
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    @patch.dict(os.environ, _AWS_TEST_ENV, clear=False)
    @patch("botocore.auth.SigV4Auth.add_auth")
    @patch("botocore.endpoint.Endpoint._send")
    def test_s3_upload_api_layer(self, mock_send, mock_add_auth):
        # Canned HTTP response so that no real network call is made.
        mock_send.return_value = MagicMock(status_code=200, headers={}, content=b"")

        # clear=False keeps PATH, HOME and the rest of the environment intact.
        with patch.dict(os.environ, self._AWS_TEST_ENV, clear=False):
            # The profile variables have to be truly absent: an empty string
            # causes an error because boto tries to use it as a profile name.
            for profile_variable in ("AWS_PROFILE", "AWS_DEFAULT_PROFILE"):
                os.environ.pop(profile_variable, None)

            # Imported here so it is not evaluated before the storage settings
            # have been overridden.
            from concordia.storage import ASSET_STORAGE

            ASSET_STORAGE._setup()

            # Save straight to the storage backend, then point an asset at the
            # stored file.
            stored_name = "test-campaign/test-project/1.jpg"
            upload = ContentFile(b"abc123", name="test.jpg")
            ASSET_STORAGE.save(stored_name, upload)
            asset = create_asset(storage_image=stored_name)

            self.assertTrue(asset.storage_image.name.endswith("1.jpg"))
            mock_send.assert_called()


================================================
FILE: concordia/tests/test_selenium.py
================================================
import json
from logging import getLogger
from secrets import token_hex

from django.conf import settings
from django.contrib.staticfiles.testing import StaticLiveServerTestCase
from django.template.loader import render_to_string
from django.test import tag
from django.urls import reverse
from pylenium.config import PyleniumConfig
from pylenium.driver import Pylenium

from .axe import Axe
from .utils import CreateTestUsers, create_simple_page

# Module-level logger; SeleniumTests.setUpClass uses it to warn when the Pylenium
# config file is missing.
logger = getLogger(__name__)


@tag("selenium", "axe")
class SeleniumTests(CreateTestUsers, StaticLiveServerTestCase):
    """Browser-driven checks (Pylenium plus axe) against the live test server."""

    @classmethod
    def setUpClass(cls):
        # Set up the live server, then create the Pylenium driver and the axe
        # helper that every test in this class shares.
        super().setUpClass()
        try:
            # JSON is UTF-8 by specification; do not depend on the locale default.
            with open(settings.PYLENIUM_CONFIG, encoding="utf-8") as file:
                _json = json.load(file)
            config = PyleniumConfig(**_json)
        except FileNotFoundError:
            logger.warning(
                "settings.PYLENIUM_CONFIG (%s) was not found; using defaults.",
                settings.PYLENIUM_CONFIG,
            )
            config = PyleniumConfig()

        cls.py = Pylenium(config)
        cls.axe = Axe(cls.py)

    @classmethod
    def tearDownClass(cls):
        # Close the browser before the live server is shut down.
        cls.py.quit()
        super().tearDownClass()

    def reverse(self, name):
        # Absolute URL of the named route on the live test server.
        return f"{self.live_server_url}{reverse(name)}"

    def test_login(self):
        self.py.viewport(1280, 800)
        self.py.visit(self.reverse("registration_login"))
        violations = self.axe.violations()
        self.assertEqual(len(violations), 0, self.axe.report(violations))

        # Random credentials: the login must fail and stay on the login page.
        self.py.get("[name='username']").type(token_hex(8))
        self.py.get("[name='password']").type(token_hex(24))
        self.py.get("button#login").click()
        self.assertTrue(
            self.py.should().have_url(f"{self.live_server_url}/account/login/")
        )

        # The error state of the form is checked for accessibility as well.
        violations = self.axe.violations()
        self.assertEqual(len(violations), 0, self.axe.report(violations))

        self.assertTrue(
            self.py.get("form#login-form")
            .should()
            .contain_text("Please enter a correct username and password")
        )

        # Now log in with a real account and check the resulting page.
        user = self.create_user("login-test")
        self.py.visit(self.reverse("registration_login"))
        self.py.get("[name='username']").type(user.username)
        self.py.get("[name='password']").type(user._password)
        self.py.get("button#login").click()

        violations = self.axe.violations()
        self.assertEqual(len(violations), 0, self.axe.report(violations))

    def test_blog_carousel(self):
        # Render the carousel fragment with two (empty) slides and serve it as
        # the body of the "about" page.
        context = {"blog_posts": [[{}], [{}]]}
        html_string = render_to_string("fragments/featured_blog_posts.html", context)
        create_simple_page(path="/about/", title="About", body=html_string)
        self.py.visit(self.reverse("about"))

        carousel = self.py.get("#blog-carousel")
        self.assertTrue(carousel.should().be_visible())

        inner = carousel.get(".carousel-inner")
        items = inner.find(".carousel-item")
        # This check also fails when exactly one item is rendered, so the
        # message states the real expectation.
        self.assertGreater(len(items), 1, "Expected more than one carousel item")

        # Exactly one slide may be marked active at a time.
        active_items = [
            item for item in items if "active" in item.get_attribute("class")
        ]
        self.assertEqual(len(active_items), 1)


================================================
FILE: concordia/tests/test_sentry.py
================================================
import importlib
import os
from unittest import mock

from django.test import TestCase

from concordia import celery


class TestSentry(TestCase):
    """Checks the arguments ``concordia.celery`` passes to ``sentry_sdk.init``."""

    @mock.patch.dict(
        os.environ,
        {
            "SENTRY_BACKEND_DSN": "http://example.com",
            "CONCORDIA_ENVIRONMENT": "dummy_environment",
        },
    )
    def test_sentry_config(self):
        # The celery module is imported during start up, so it has to be
        # reloaded once Sentry is patched. "release" and "integrations" are
        # only matched loosely: because of how everything is imported they
        # cannot be mocked, and the functions that produce them are tested
        # elsewhere.
        sentry_init_patch = mock.patch("concordia.celery.sentry_sdk.init")
        with sentry_init_patch as sentry_init:
            importlib.reload(celery)
            sentry_init.assert_called_with(
                "http://example.com",
                environment="dummy_environment",
                release=mock.ANY,
                integrations=mock.ANY,
            )


================================================
FILE: concordia/tests/test_signals.py
================================================
from unittest import mock

from django.conf import settings
from django.contrib.auth.models import Group
from django.contrib.auth.signals import user_logged_in
from django.core import mail
from django.http import HttpResponse
from django.test import RequestFactory, TestCase
from django.urls import reverse
from django.utils import timezone
from django_registration.signals import user_activated, user_registered
from structlog.contextvars import bind_contextvars, clear_contextvars

from concordia.models import TranscriptionStatus
from concordia.signals.handlers import add_request_id_to_response

from .utils import CreateTestUsers, create_asset, create_transcription


class TestSignalHandlers(CreateTestUsers, TestCase):
    """Fires the login, activation and registration signals and checks effects."""

    # Patch target for the flag lookup used in the activation tests.
    FLAG_ENABLED = "concordia.signals.handlers.flag_enabled"

    def setUp(self):
        self.user = self.create_test_user()
        self.asset = create_asset()
        self.request_factory = RequestFactory()

    def _send_user_activated(self, request):
        # Fire ``user_activated`` for the fixture user with the given request.
        user_activated.send(sender=self.__class__, user=self.user, request=request)

    def test_clear_reservation_token(self):
        self.login_user()
        response = self.client.get(reverse("redirect-to-next-transcribable-asset"))
        # Visiting the redirect view leaves a reservation token in the session.
        self.assertIsNotNone(self.client.session.get("reservation_token"))

        user_logged_in.send(
            sender=self.__class__, user=self.user, request=response.wsgi_request
        )

        # After the login signal the token is gone again.
        self.assertIsNone(self.client.session.get("reservation_token"))

    def test_user_successfully_activated(self):
        with mock.patch(self.FLAG_ENABLED, return_value=True):
            request = self.client.get("/").wsgi_request
            self._send_user_activated(request)
            self.assertTrue(request.user.is_authenticated)
            self.assertEqual(len(mail.outbox), 1)

    def test_user_successfully_activated_no_request(self):
        with mock.patch(self.FLAG_ENABLED, return_value=True):
            self._send_user_activated(None)
            self.assertEqual(len(mail.outbox), 1)

    def test_user_successfully_activated_no_welcome_email(self):
        # With the flag off the user is still logged in, but no mail is sent.
        with mock.patch(self.FLAG_ENABLED, return_value=False):
            request = self.client.get("/").wsgi_request
            self._send_user_activated(request)
            self.assertTrue(request.user.is_authenticated)
            self.assertEqual(len(mail.outbox), 0)

    def test_add_user_to_newsletter(self):
        def newsletter_members():
            group = Group.objects.get(name=settings.NEWSLETTER_GROUP_NAME)
            return group.user_set.all()

        def register_with(**post_kwargs):
            # POST to the home page and reuse that request for the signal.
            response = self.client.post("/", **post_kwargs)
            user_registered.send(
                sender=self.__class__, user=self.user, request=response.wsgi_request
            )

        self.login_user()

        # Without the opt-in field the user is not added to the group.
        register_with()
        self.assertNotIn(self.user, newsletter_members())

        # With the opt-in field the user becomes a member.
        register_with(data={"newsletterOptIn": True})
        self.assertIn(self.user, newsletter_members())


class UpdateAssetStatusSignalTests(CreateTestUsers, TestCase):
    """Checks the asset's transcription status after transcriptions are saved."""

    def setUp(self):
        self.user1 = self.create_user("user-1")
        self.user2 = self.create_user("user-2")
        self.asset = create_asset()

    def _assert_asset_status(self, expected_status):
        # Reload the asset from the database and compare its stored status.
        self.asset.refresh_from_db()
        self.assertEqual(self.asset.transcription_status, expected_status)

    def test_accepted_transcription_sets_completed_status(self):
        create_transcription(asset=self.asset, user=self.user1, accepted=timezone.now())

        self._assert_asset_status(TranscriptionStatus.COMPLETED)

    def test_submitted_transcription_sets_submitted_status(self):
        create_transcription(
            asset=self.asset, user=self.user1, submitted=timezone.now()
        )

        self._assert_asset_status(TranscriptionStatus.SUBMITTED)

    def test_rejected_transcription_sets_in_progress_status(self):
        create_transcription(asset=self.asset, user=self.user1, rejected=timezone.now())

        self._assert_asset_status(TranscriptionStatus.IN_PROGRESS)

    def test_default_transcription_sets_in_progress_status(self):
        create_transcription(asset=self.asset, user=self.user1)

        self._assert_asset_status(TranscriptionStatus.IN_PROGRESS)

    def test_outdated_transcription_does_not_update_status(self):
        older = create_transcription(
            asset=self.asset, user=self.user1, submitted=timezone.now()
        )
        create_transcription(asset=self.asset, user=self.user2, accepted=timezone.now())

        # Saving the older transcription again triggers the signal. Because it
        # is no longer the latest one, a warning is expected to be logged.
        with self.assertLogs("concordia.signals.handlers", level="WARNING") as log_cm:
            older.rejected = timezone.now()
            older.save()

        # The newer, accepted transcription still decides the status.
        self._assert_asset_status(TranscriptionStatus.COMPLETED)

        # The warning names the situation, the transcription and the asset.
        for fragment in (
            "An older transcription",
            str(older.id),
            str(self.asset.id),
        ):
            self.assertTrue(any(fragment in line for line in log_cm.output))

    @mock.patch("concordia.signals.handlers.remove_next_asset_objects")
    @mock.patch("concordia.signals.handlers.calculate_difficulty_values")
    def test_tasks_called_on_latest_transcription(self, mock_calc, mock_remove):
        create_transcription(asset=self.asset, user=self.user1, accepted=timezone.now())

        mock_remove.assert_called_once_with(self.asset.id)
        mock_calc.assert_called_once()

        # The first positional argument is a queryset holding just this asset.
        positional_args = mock_calc.call_args[0]
        queryset_pks = list(positional_args[0].values_list("pk", flat=True))
        self.assertEqual(queryset_pks, [self.asset.pk])


class RequestIDHeaderTests(TestCase):
    """Checks when ``add_request_id_to_response`` sets ``X-Request-ID``."""

    def setUp(self):
        self.factory = RequestFactory()
        # Start from an empty structlog context holding only the id under test.
        clear_contextvars()
        bind_contextvars(request_id="test-id-123")

    def tearDown(self):
        clear_contextvars()

    def make_response(self, cache_control_header=None):
        # Plain "ok" response, optionally carrying a Cache-Control header.
        response = HttpResponse("ok")
        if not cache_control_header:
            return response
        response["Cache-Control"] = cache_control_header
        return response

    def _handled_response(self, cache_control_header=None):
        # Build a response and pass it through the handler under test.
        response = self.make_response(cache_control_header)
        add_request_id_to_response(response=response, logger=None)
        return response

    @mock.patch(
        "structlog.contextvars.get_merged_contextvars",
        return_value={"request_id": "test-id-123"},
    )
    def test_adds_header_when_no_cache_control(self, mock_contextvars):
        handled = self._handled_response()
        self.assertEqual(handled["X-Request-ID"], "test-id-123")

    @mock.patch(
        "structlog.contextvars.get_merged_contextvars",
        return_value={"request_id": "test-id-123"},
    )
    def test_adds_header_when_private(self, mock_contextvars):
        handled = self._handled_response("private, no-store")
        self.assertEqual(handled["X-Request-ID"], "test-id-123")

    @mock.patch(
        "structlog.contextvars.get_merged_contextvars",
        return_value={"request_id": "test-id-123"},
    )
    def test_skips_header_when_public_with_max_age(self, mock_contextvars):
        handled = self._handled_response("public, max-age=600")
        self.assertNotIn("X-Request-ID", handled)

    @mock.patch(
        "structlog.contextvars.get_merged_contextvars",
        return_value={"request_id": "test-id-123"},
    )
    def test_adds_header_when_no_store_present(self, mock_contextvars):
        handled = self._handled_response("public, no-store")
        self.assertEqual(handled["X-Request-ID"], "test-id-123")


================================================
FILE: concordia/tests/test_tasks_assets.py
================================================
from unittest import mock
from unittest.mock import PropertyMock

from django.test import TestCase

from concordia.models import Asset, TranscriptionStatus
from concordia.tasks.assets import (
    calculate_difficulty_values,
    fix_storage_images,
    populate_asset_years,
)

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_transcription,
)


class CalculateDifficultyValuesTests(CreateTestUsers, TestCase):
    """Covers ``calculate_difficulty_values`` for explicit and default querysets."""

    def setUp(self):
        self.user1 = self.create_test_user("cdv-user-1")
        self.user2 = self.create_test_user("cdv-user-2")
        self.reviewer = self.create_test_user("cdv-reviewer")
        self.campaign = create_campaign(slug="cdv-c")
        self.project = create_project(campaign=self.campaign, slug="cdv-p")
        self.item = create_item(project=self.project, item_id="cdv-i")

    @staticmethod
    def _signal_task_stubbed():
        # Replace the task reference used by the signal handlers, so that
        # creating transcriptions does not run it before the test does.
        return mock.patch(
            "concordia.signals.handlers.calculate_difficulty_values", return_value=None
        )

    def test_no_changes_when_difficulty_matches(self):
        asset = create_asset(item=self.item, slug="cdv-a1")
        only_this_asset = Asset.objects.filter(pk=asset.pk)

        # Default difficulty is zero and there are no transcriptions, so there
        # is nothing to update.
        self.assertEqual(calculate_difficulty_values(only_this_asset), 0)

        asset.refresh_from_db()
        self.assertEqual(asset.difficulty, 0)

    def test_updates_difficulty_for_explicit_queryset(self):
        asset = create_asset(item=self.item, slug="cdv-a2")
        with self._signal_task_stubbed():
            # Two transcriptions by two users, one of them reviewed.
            create_transcription(asset=asset, user=self.user1)
            create_transcription(
                asset=asset, user=self.user2, reviewed_by=self.reviewer
            )

        only_this_asset = Asset.objects.filter(pk=asset.pk)
        self.assertEqual(calculate_difficulty_values(only_this_asset), 1)

        asset.refresh_from_db()
        # transcription_count is 2; transcriber_count is 2; reviewer_count is 1
        # difficulty is 2 * (2 + 1), so difficulty should be 6
        self.assertEqual(asset.difficulty, 6)

    def test_default_published_queryset_and_chunking(self):
        # Build 501 published assets so we traverse more than one chunk
        bulk_assets = [
            create_asset(
                item=self.item,
                slug=f"cdv-bulk-{number}",
                sequence=number,
            )
            for number in range(1, 502)
        ]
        first, last = bulk_assets[0], bulk_assets[-1]

        with self._signal_task_stubbed():
            # One transcription each on the first and last asset forces two
            # updates.
            for asset in (first, last):
                create_transcription(asset=asset, user=self.user1)

        self.assertEqual(calculate_difficulty_values(), 2)

        for asset in (first, last):
            asset.refresh_from_db()
        self.assertEqual(first.difficulty, 1)
        self.assertEqual(last.difficulty, 1)


class PopulateAssetYearsTests(TestCase):
    """Covers ``populate_asset_years`` against item metadata date entries."""

    def setUp(self):
        self.campaign = create_campaign(slug="pay-c")
        self.project = create_project(campaign=self.campaign, slug="pay-p")

        self.item1 = create_item(project=self.project, item_id="pay-i1")
        self.asset1 = create_asset(item=self.item1, slug="pay-a1")

        self.item2 = create_item(project=self.project, item_id="pay-i2")
        self.asset2 = create_asset(item=self.item2, slug="pay-a2")

        # Give both assets the metadata shape the task expects and a stored
        # year that matches it. Each test can then decide which rows need an
        # update, without KeyErrors or unintended updates.
        for asset in (self.asset1, self.asset2):
            self._set_metadata_dates(asset, "2000")
        both_assets = Asset.objects.filter(pk__in=[self.asset1.pk, self.asset2.pk])
        both_assets.update(year="2000")

    def _set_metadata_dates(self, asset, *years):
        # Store the minimal metadata structure the task expects on the asset's
        # item: one single-key dict per year under item -> dates.
        date_entries = []
        for year in years:
            date_entries.append({year: {}})

        item = asset.item
        item.metadata = {
            "item": {"dates": date_entries},
        }
        item.save(update_fields=["metadata"])

    def test_updates_year_from_last_date_key(self):
        # asset1's metadata now disagrees with its stored year (2000), so it
        # needs an update; asset2 stays matched.
        self._set_metadata_dates(self.asset1, "1900", "1901")

        update_count = populate_asset_years()
        self.assertGreaterEqual(update_count, 1)

        self.asset1.refresh_from_db()
        self.assertEqual(self.asset1.year, "1901")

    def test_skips_when_year_unchanged(self):
        # asset1's stored year equals its extracted year and asset2 is already
        # matched, so nothing should change.
        self._set_metadata_dates(self.asset1, "1900")
        Asset.objects.filter(pk=self.asset1.pk).update(year="1900")

        self.assertEqual(populate_asset_years(), 0)

    def test_multiple_assets_count_returned(self):
        # Both assets get metadata that differs from their stored year.
        self._set_metadata_dates(self.asset1, "1910")
        self._set_metadata_dates(self.asset2, "1920")

        for asset in (self.asset1, self.asset2):
            Asset.objects.filter(pk=asset.pk).update(year="1900")

        self.assertEqual(populate_asset_years(), 2)

        self.asset1.refresh_from_db()
        self.asset2.refresh_from_db()
        self.assertEqual(self.asset1.year, "1910")
        self.assertEqual(self.asset2.year, "1920")

    def test_skips_empty_date_dicts_and_uses_last_year(self):
        # Truly empty dicts ({}) have no keys to loop over; the task should
        # still pick the last non-empty year.
        item = self.asset1.item
        item.metadata = {"item": {"dates": [{}, {"1955": {}}, {}, {"1957": {}}]}}
        item.save(update_fields=["metadata"])

        # Make sure an update is needed.
        Asset.objects.filter(pk=self.asset1.pk).update(year="2000")

        self.assertEqual(populate_asset_years(), 1)

        self.asset1.refresh_from_db()
        self.assertEqual(self.asset1.year, "1957")


class FixStorageImagesTests(TestCase):
    """Covers ``fix_storage_images`` with storage and HTTP access mocked out."""

    # Patch targets shared by the tests below.
    STORAGE_EXISTS = "django.core.files.storage.FileSystemStorage.exists"
    REQUESTS_GET = "concordia.tasks.assets.requests.get"
    STORAGE_SAVE = "concordia.tasks.assets.ASSET_STORAGE.save"

    def setUp(self):
        self.campaign1 = create_campaign(slug="fsi-c1")
        self.project1 = create_project(campaign=self.campaign1, slug="fsi-p1")
        self.item1 = create_item(project=self.project1, item_id="fsi-i1")

        self.campaign2 = create_campaign(slug="fsi-c2")
        self.project2 = create_project(campaign=self.campaign2, slug="fsi-p2")
        self.item2 = create_item(project=self.project2, item_id="fsi-i2")

        # Two assets in campaign 1 and one in campaign 2.
        self.asset1 = create_asset(
            item=self.item1,
            slug="fsi-a1",
            sequence=1,
            transcription_status=TranscriptionStatus.NOT_STARTED,
        )
        self.asset2 = create_asset(
            item=self.item1,
            slug="fsi-a2",
            sequence=2,
            transcription_status=TranscriptionStatus.IN_PROGRESS,
        )
        self.asset3 = create_asset(
            item=self.item2,
            slug="fsi-a3",
            sequence=3,
            transcription_status=TranscriptionStatus.SUBMITTED,
        )

    def _storage_exists(self, exists):
        # Patch that makes every storage existence check answer ``exists``.
        return mock.patch(self.STORAGE_EXISTS, return_value=exists)

    @staticmethod
    def _stub_download_url():
        # Patch that gives every asset the same fixed download URL.
        return mock.patch.object(
            Asset,
            "download_url",
            new_callable=PropertyMock,
            return_value="https://example.invalid/img.jpg",
        )

    @staticmethod
    def _fake_download(chunks):
        # Fake HTTP response that streams ``chunks`` and reports no error.
        response = mock.MagicMock()
        response.iter_content.return_value = chunks
        response.raise_for_status.return_value = None
        return response

    def _campaign1_filename(self, asset):
        # Storage path expected for an asset that belongs to item1.
        path_parts = [
            self.campaign1.slug,
            self.project1.slug,
            self.item1.item_id,
            f"{asset.sequence}.jpg",
        ]
        return "/".join(path_parts)

    def test_skips_when_storage_image_exists(self):
        with (
            self._storage_exists(True),
            mock.patch(self.REQUESTS_GET) as mock_get,
            mock.patch(self.STORAGE_SAVE) as mock_save,
        ):
            fix_storage_images()

            mock_get.assert_not_called()
            mock_save.assert_not_called()

    def test_downloads_and_saves_when_missing_success(self):
        expected_filename = self._campaign1_filename(self.asset1)

        with (
            self._storage_exists(False),
            self._stub_download_url(),
            mock.patch(self.REQUESTS_GET) as mock_get,
            mock.patch(self.STORAGE_SAVE) as mock_save,
        ):
            mock_get.return_value = self._fake_download([b"abc", b"def"])

            fix_storage_images(campaign_slug=self.campaign1.slug)

            mock_get.assert_called()
            mock_save.assert_any_call(expected_filename, mock.ANY)

    def test_raises_and_logs_when_save_fails(self):
        with (
            self._storage_exists(False),
            self._stub_download_url(),
            mock.patch(self.REQUESTS_GET) as mock_get,
            mock.patch(self.STORAGE_SAVE, side_effect=RuntimeError("save failed")),
            mock.patch("concordia.tasks.assets.logger") as mock_logger,
        ):
            mock_get.return_value = self._fake_download([b"abc"])

            # The storage error propagates to the caller ...
            with self.assertRaises(RuntimeError):
                fix_storage_images(campaign_slug=self.campaign1.slug)

            # ... and is logged through logger.exception.
            self.assertTrue(mock_logger.exception.called)

    def test_filters_by_campaign_and_asset_start_id(self):
        with (
            self._storage_exists(False),
            self._stub_download_url(),
            mock.patch(self.REQUESTS_GET) as mock_get,
            mock.patch(self.STORAGE_SAVE) as mock_save,
        ):
            mock_get.return_value = self._fake_download([b"x"])

            fix_storage_images(
                campaign_slug=self.campaign1.slug,
                asset_start_id=self.asset2.id,
            )

            # Exactly one file is saved, and it is the one for asset2.
            self.assertEqual(mock_save.call_count, 1)
            mock_save.assert_called_with(
                self._campaign1_filename(self.asset2), mock.ANY
            )

    def test_skips_when_storage_image_is_falsy(self):
        # Give both campaign1 assets a falsy storage_image to make sure that
        # case is handled sanely.
        campaign1_assets = Asset.objects.filter(
            pk__in=[self.asset1.pk, self.asset2.pk]
        )
        campaign1_assets.update(storage_image="")

        with (
            self._storage_exists(True) as mock_exists,
            mock.patch(self.REQUESTS_GET) as mock_get,
            mock.patch(self.STORAGE_SAVE) as mock_save,
        ):
            fix_storage_images(campaign_slug=self.campaign1.slug)

            # Nothing should be fetched or saved when storage_image is falsy.
            mock_get.assert_not_called()
            mock_save.assert_not_called()
            # Existence should never even be checked for these assets.
            mock_exists.assert_not_called()


================================================
FILE: concordia/tests/test_tasks_blog.py
================================================
from unittest import mock

from django.test import TestCase
from requests.models import Response

from concordia.tasks.blog import fetch_and_cache_blog_images


class BlogTaskTestCase(TestCase):
    """Tests for the ``fetch_and_cache_blog_images`` task."""

    @mock.patch("concordia.tasks.blog.extract_og_image")
    @mock.patch("concordia.parser.requests.get")
    def test_fetch_and_cache_blog_images(self, mock_get, mock_extract):
        """Each ``<link>`` in the fetched feed is passed to ``extract_og_image``."""
        link1 = "https://blogs.loc.gov/thesignal/2025/05/volunteers-ocr/"
        link2 = "https://blogs.loc.gov/thesignal/2025/02/douglass-day-2025/"
        rss = f"""<?xml version="1.0" encoding="UTF-8"?>
        <rss version="2.0">
          <channel>
            <item><link>{link1}</link></item><item><link>{link2}</link></item>
          </channel>
        </rss>"""
        # Stand-in for the response handed back by the patched requests.get.
        mock_get.return_value = mock.MagicMock(
            spec=Response, content=rss, status_code=200
        )

        # Run the celery task synchronously.
        fetch_and_cache_blog_images()

        for expected_link in (link1, link2):
            mock_extract.assert_any_call(expected_link)
        self.assertEqual(mock_extract.call_count, 2)

    @mock.patch("concordia.tasks.blog.extract_og_image")
    @mock.patch("concordia.tasks.blog.fetch_blog_posts")
    def test_skips_items_with_no_link(self, mock_fetch, mock_extract):
        """Feed items lacking a link are ignored; linked items are processed."""

        class StubLink:
            # Minimal object exposing only the ``text`` attribute.
            def __init__(self, text):
                self.text = text

        class StubItem:
            # Minimal feed item: ``find("link")`` yields the stored link
            # (possibly None); any other lookup yields None.
            def __init__(self, link):
                self._link = link

            def find(self, name):
                if name == "link":
                    return self._link
                return None

        # One item without a link followed by one with a link.
        mock_fetch.return_value = [
            StubItem(None),
            StubItem(StubLink("https://example.invalid/post")),
        ]

        fetch_and_cache_blog_images()

        mock_extract.assert_called_once_with("https://example.invalid/post")


================================================
FILE: concordia/tests/test_tasks_housekeeping.py
================================================
from unittest import mock

from django.test import TestCase

from concordia.tasks.housekeeping import clear_sessions


class ClearSessionsTaskTests(TestCase):
    """Tests for the ``clear_sessions`` housekeeping task."""

    @mock.patch("concordia.tasks.housekeeping.call_command")
    def test_calls_django_clearsessions_command(self, call_command_mock):
        """The task calls ``call_command("clearsessions")`` and returns None."""
        outcome = clear_sessions()
        self.assertIsNone(outcome)
        call_command_mock.assert_called_once_with("clearsessions")

    @mock.patch(
        "concordia.tasks.housekeeping.call_command",
        side_effect=RuntimeError("boom"),
    )
    def test_raises_when_call_command_fails(self, _call_command_mock):
        """An exception raised by ``call_command`` propagates out of the task."""
        self.assertRaises(RuntimeError, clear_sessions)


================================================
FILE: concordia/tests/test_tasks_next_asset.py
================================================
from unittest import mock

from django.test import TestCase
from django.utils import timezone

from concordia.models import (
    NextReviewableCampaignAsset,
    NextReviewableTopicAsset,
    NextTranscribableCampaignAsset,
    NextTranscribableTopicAsset,
    TranscriptionStatus,
)
from concordia.tasks.next_asset.renew import renew_next_asset_cache
from concordia.tasks.next_asset.reviewable import (
    clean_next_reviewable_for_campaign,
    clean_next_reviewable_for_topic,
    populate_next_reviewable_for_campaign,
    populate_next_reviewable_for_topic,
)
from concordia.tasks.next_asset.transcribable import (
    clean_next_transcribable_for_campaign,
    clean_next_transcribable_for_topic,
    populate_next_transcribable_for_campaign,
    populate_next_transcribable_for_topic,
)
from concordia.utils import get_anonymous_user

from .utils import (
    CreateTestUsers,
    create_asset,
    create_topic,
    create_transcription,
)


class PopulateNextAssetTasksTests(CreateTestUsers, TestCase):
    """Tests for the tasks that populate the next-asset cache tables."""

    def setUp(self):
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        self.asset1 = create_asset(slug="test-asset-1", title="Test Asset 1")
        parent_item = self.asset1.item
        # Second asset shares the first asset's item (and so its campaign).
        self.asset2 = create_asset(
            item=parent_item, slug="test-asset-2", title="Test Asset 2"
        )
        self.topic = create_topic(project=parent_item.project)
        self.campaign = self.asset1.campaign

    # ------------------------------------------------------------------
    # Helpers
    # ------------------------------------------------------------------

    @staticmethod
    def _shared_cache_fields(asset):
        """Return the keyword arguments common to every cache row for ``asset``."""
        item = asset.item
        project = item.project
        return {
            "asset": asset,
            "item": item,
            "item_item_id": item.item_id,
            "project": project,
            "project_slug": project.slug,
            "sequence": asset.sequence,
        }

    def _cache_transcribable(self, model, asset, **target):
        """Create a transcribable cache row; ``target`` is campaign= or topic=."""
        return model.objects.create(
            transcription_status=asset.transcription_status,
            **self._shared_cache_fields(asset),
            **target,
        )

    def _cache_reviewable(self, model, asset, **target):
        """Create a reviewable cache row; ``target`` is campaign= or topic=."""
        return model.objects.create(
            transcriber_ids=[self.user.id],
            **self._shared_cache_fields(asset),
            **target,
        )

    def _submit_transcription(self, asset, user):
        """Create a transcription for ``asset`` by ``user`` submitted right now."""
        return create_transcription(asset=asset, user=user, submitted=timezone.now())

    # ------------------------------------------------------------------
    # Happy path: both assets end up cached
    # ------------------------------------------------------------------

    def test_populate_next_transcribable_for_campaign(self):
        populate_next_transcribable_for_campaign(campaign_id=self.campaign.id)
        cached = NextTranscribableCampaignAsset.objects.filter(campaign=self.campaign)
        self.assertEqual(cached.count(), 2)

    def test_populate_next_transcribable_for_topic(self):
        populate_next_transcribable_for_topic(topic_id=self.topic.id)
        cached = NextTranscribableTopicAsset.objects.filter(topic=self.topic)
        self.assertEqual(cached.count(), 2)

    def test_populate_next_reviewable_for_campaign(self):
        self._submit_transcription(self.asset1, self.anon)
        self._submit_transcription(self.asset2, self.user)
        populate_next_reviewable_for_campaign(campaign_id=self.campaign.id)
        cached = NextReviewableCampaignAsset.objects.filter(campaign=self.campaign)
        self.assertEqual(cached.count(), 2)

    def test_populate_next_reviewable_for_topic(self):
        self._submit_transcription(self.asset1, self.anon)
        self._submit_transcription(self.asset2, self.user)
        populate_next_reviewable_for_topic(topic_id=self.topic.id)
        cached = NextReviewableTopicAsset.objects.filter(topic=self.topic)
        self.assertEqual(cached.count(), 2)

    # ------------------------------------------------------------------
    # ID 9999 is passed as a campaign/topic id: exactly one error is logged
    # ------------------------------------------------------------------

    def test_populate_next_transcribable_for_campaign_missing(self):
        with mock.patch("concordia.tasks.next_asset.transcribable.logger") as log:
            populate_next_transcribable_for_campaign(campaign_id=9999)
        log.error.assert_called_once()

    def test_populate_next_transcribable_for_topic_missing(self):
        with mock.patch("concordia.tasks.next_asset.transcribable.logger") as log:
            populate_next_transcribable_for_topic(topic_id=9999)
        log.error.assert_called_once()

    def test_populate_next_reviewable_for_campaign_missing(self):
        with mock.patch("concordia.tasks.next_asset.reviewable.logger") as log:
            populate_next_reviewable_for_campaign(campaign_id=9999)
        log.error.assert_called_once()

    def test_populate_next_reviewable_for_topic_missing(self):
        with mock.patch("concordia.tasks.next_asset.reviewable.logger") as log:
            populate_next_reviewable_for_topic(topic_id=9999)
        log.error.assert_called_once()

    # ------------------------------------------------------------------
    # 100 rows already cached: the task logs that the cache already has them
    # ------------------------------------------------------------------

    @mock.patch("concordia.tasks.next_asset.transcribable.logger")
    def test_populate_next_transcribable_for_campaign_none_needed(self, task_logger):
        parent_item = self.asset1.item
        for n in range(3, 103):
            extra = create_asset(item=parent_item, slug=f"dummy-{n}")
            self._cache_transcribable(
                NextTranscribableCampaignAsset, extra, campaign=self.campaign
            )
        populate_next_transcribable_for_campaign(campaign_id=self.campaign.id)
        task_logger.info.assert_any_call(
            "Campaign %s already has %s next transcribable assets", self.campaign, 100
        )

    @mock.patch("concordia.tasks.next_asset.transcribable.logger")
    def test_populate_next_transcribable_for_topic_none_needed(self, task_logger):
        parent_item = self.asset1.item
        for n in range(3, 103):
            extra = create_asset(item=parent_item, slug=f"dummy-{n}")
            self._cache_transcribable(
                NextTranscribableTopicAsset, extra, topic=self.topic
            )
        populate_next_transcribable_for_topic(topic_id=self.topic.id)
        task_logger.info.assert_any_call(
            "Topic %s already has %s next transcribable assets", self.topic, 100
        )

    @mock.patch("concordia.tasks.next_asset.reviewable.logger")
    def test_populate_next_reviewable_for_campaign_none_needed(self, task_logger):
        self._submit_transcription(self.asset1, self.user)
        parent_item = self.asset1.item
        for n in range(3, 103):
            extra = create_asset(item=parent_item, slug=f"r-{n}")
            self._submit_transcription(extra, self.user)
            self._cache_reviewable(
                NextReviewableCampaignAsset, extra, campaign=self.campaign
            )

        populate_next_reviewable_for_campaign(campaign_id=self.campaign.id)
        task_logger.info.assert_any_call(
            "Campaign %s already has %s next reviewable assets", self.campaign, 100
        )

    @mock.patch("concordia.tasks.next_asset.reviewable.logger")
    def test_populate_next_reviewable_for_topic_none_needed(self, task_logger):
        self._submit_transcription(self.asset1, self.user)
        parent_item = self.asset1.item
        for n in range(3, 103):
            extra = create_asset(item=parent_item, slug=f"t-{n}")
            self._submit_transcription(extra, self.user)
            self._cache_reviewable(NextReviewableTopicAsset, extra, topic=self.topic)

        populate_next_reviewable_for_topic(topic_id=self.topic.id)
        task_logger.info.assert_any_call(
            "Topic %s already has %s next reviewable assets", self.topic, 100
        )

    # ------------------------------------------------------------------
    # Existing assets already cached: the task logs that none were found
    # ------------------------------------------------------------------

    @mock.patch("concordia.tasks.next_asset.reviewable.logger")
    def test_populate_next_reviewable_for_campaign_none_found(self, task_logger):
        self._submit_transcription(self.asset1, self.user)
        self._cache_reviewable(
            NextReviewableCampaignAsset, self.asset1, campaign=self.campaign
        )

        populate_next_reviewable_for_campaign(campaign_id=self.campaign.id)
        task_logger.info.assert_any_call(
            "No reviewable assets found in campaign %s", self.campaign
        )

    @mock.patch("concordia.tasks.next_asset.reviewable.logger")
    def test_populate_next_reviewable_for_topic_none_found(self, task_logger):
        self._submit_transcription(self.asset1, self.user)
        self._cache_reviewable(NextReviewableTopicAsset, self.asset1, topic=self.topic)

        populate_next_reviewable_for_topic(topic_id=self.topic.id)
        task_logger.info.assert_any_call(
            "No reviewable assets found in topic %s", self.topic
        )

    @mock.patch("concordia.tasks.next_asset.transcribable.logger")
    def test_populate_next_transcribable_for_campaign_none_found(self, task_logger):
        for existing in (self.asset1, self.asset2):
            self._cache_transcribable(
                NextTranscribableCampaignAsset, existing, campaign=self.campaign
            )

        populate_next_transcribable_for_campaign(campaign_id=self.campaign.id)
        task_logger.info.assert_any_call(
            "No transcribable assets found in campaign %s", self.campaign
        )

    @mock.patch("concordia.tasks.next_asset.transcribable.logger")
    def test_populate_next_transcribable_for_topic_none_found(self, task_logger):
        for existing in (self.asset1, self.asset2):
            self._cache_transcribable(
                NextTranscribableTopicAsset, existing, topic=self.topic
            )

        populate_next_transcribable_for_topic(topic_id=self.topic.id)
        task_logger.info.assert_any_call(
            "No transcribable assets found in topic %s", self.topic
        )


class CleanNextAssetTasksTests(TestCase):
    """Tests for the ``clean_next_*`` tasks and ``renew_next_asset_cache``."""

    def setUp(self):
        self.asset = create_asset()
        self.campaign = self.asset.campaign
        item = self.asset.item
        project = item.project
        self.topic = create_topic(project=project)

        # Fields shared by all four cache rows created for the single asset.
        shared = {
            "asset": self.asset,
            "item": item,
            "item_item_id": item.item_id,
            "project": project,
            "project_slug": project.slug,
            "sequence": self.asset.sequence,
        }
        self.campaign_transcribable = NextTranscribableCampaignAsset.objects.create(
            campaign=self.campaign,
            transcription_status=TranscriptionStatus.NOT_STARTED,
            **shared,
        )
        self.topic_transcribable = NextTranscribableTopicAsset.objects.create(
            topic=self.topic,
            transcription_status=TranscriptionStatus.IN_PROGRESS,
            **shared,
        )
        self.campaign_reviewable = NextReviewableCampaignAsset.objects.create(
            campaign=self.campaign, **shared
        )
        self.topic_reviewable = NextReviewableTopicAsset.objects.create(
            topic=self.topic, **shared
        )

    def _set_asset_status(self, status):
        """Persist ``status`` as the asset's transcription status."""
        self.asset.transcription_status = status
        self.asset.save()

    # ------------------------------------------------------------------
    # Cleaning removes the cached row and queues a repopulation
    # ------------------------------------------------------------------

    @mock.patch(
        "concordia.tasks.next_asset.transcribable.populate_next_transcribable_for_campaign.delay"
    )
    def test_clean_next_transcribable_for_campaign(self, repopulate):
        self._set_asset_status(TranscriptionStatus.COMPLETED)
        clean_next_transcribable_for_campaign(self.campaign.id)
        leftover = NextTranscribableCampaignAsset.objects.filter(campaign=self.campaign)
        self.assertFalse(leftover.exists())
        repopulate.assert_called_once_with(self.campaign.id)

    @mock.patch(
        "concordia.tasks.next_asset.transcribable.populate_next_transcribable_for_topic.delay"
    )
    def test_clean_next_transcribable_for_topic(self, repopulate):
        self._set_asset_status(TranscriptionStatus.COMPLETED)
        clean_next_transcribable_for_topic(self.topic.id)
        leftover = NextTranscribableTopicAsset.objects.filter(topic=self.topic)
        self.assertFalse(leftover.exists())
        repopulate.assert_called_once_with(self.topic.id)

    @mock.patch(
        "concordia.tasks.next_asset.reviewable.populate_next_reviewable_for_campaign.delay"
    )
    def test_clean_next_reviewable_for_campaign(self, repopulate):
        self._set_asset_status(TranscriptionStatus.IN_PROGRESS)
        clean_next_reviewable_for_campaign(self.campaign.id)
        leftover = NextReviewableCampaignAsset.objects.filter(campaign=self.campaign)
        self.assertFalse(leftover.exists())
        repopulate.assert_called_once_with(self.campaign.id)

    @mock.patch(
        "concordia.tasks.next_asset.reviewable.populate_next_reviewable_for_topic.delay"
    )
    def test_clean_next_reviewable_for_topic(self, repopulate):
        self._set_asset_status(TranscriptionStatus.NOT_STARTED)
        clean_next_reviewable_for_topic(self.topic.id)
        leftover = NextReviewableTopicAsset.objects.filter(topic=self.topic)
        self.assertFalse(leftover.exists())
        repopulate.assert_called_once_with(self.topic.id)

    # ------------------------------------------------------------------
    # renew_next_asset_cache queues all four clean tasks
    # ------------------------------------------------------------------

    def test_renew_next_asset_cache(self):
        with (
            mock.patch(
                "concordia.tasks.next_asset.reviewable.clean_next_reviewable_for_campaign.delay"
            ) as rev_campaign,
            mock.patch(
                "concordia.tasks.next_asset.transcribable.clean_next_transcribable_for_campaign.delay"
            ) as trans_campaign,
            mock.patch(
                "concordia.tasks.next_asset.reviewable.clean_next_reviewable_for_topic.delay"
            ) as rev_topic,
            mock.patch(
                "concordia.tasks.next_asset.transcribable.clean_next_transcribable_for_topic.delay"
            ) as trans_topic,
        ):
            renew_next_asset_cache()

        trans_campaign.assert_called_once_with(campaign_id=self.campaign.id)
        rev_campaign.assert_called_once_with(campaign_id=self.campaign.id)
        trans_topic.assert_called_once_with(topic_id=self.topic.id)
        rev_topic.assert_called_once_with(topic_id=self.topic.id)

    # ------------------------------------------------------------------
    # A failing delete() is logged via logger.exception exactly once
    # ------------------------------------------------------------------

    @mock.patch("concordia.tasks.next_asset.transcribable.logger")
    def test_clean_next_transcribable_for_campaign_exception(self, task_logger):
        row = self.campaign_transcribable
        with (
            mock.patch.object(row, "delete", side_effect=Exception("fail")),
            mock.patch(
                "concordia.tasks.next_asset.transcribable.find_invalid_next_transcribable_campaign_assets",
                return_value=[row],
            ),
        ):
            clean_next_transcribable_for_campaign(self.campaign.id)
        task_logger.exception.assert_called_once()

    @mock.patch("concordia.tasks.next_asset.transcribable.logger")
    def test_clean_next_transcribable_for_topic_exception(self, task_logger):
        row = self.topic_transcribable
        with (
            mock.patch.object(row, "delete", side_effect=Exception("fail")),
            mock.patch(
                "concordia.tasks.next_asset.transcribable.find_invalid_next_transcribable_topic_assets",
                return_value=[row],
            ),
        ):
            clean_next_transcribable_for_topic(self.topic.id)
        task_logger.exception.assert_called_once()

    @mock.patch("concordia.tasks.next_asset.reviewable.logger")
    def test_clean_next_reviewable_for_campaign_exception(self, task_logger):
        row = self.campaign_reviewable
        with (
            mock.patch.object(row, "delete", side_effect=Exception("fail")),
            mock.patch(
                "concordia.tasks.next_asset.reviewable.find_invalid_next_reviewable_campaign_assets",
                return_value=[row],
            ),
        ):
            clean_next_reviewable_for_campaign(self.campaign.id)
        task_logger.exception.assert_called_once()

    @mock.patch("concordia.tasks.next_asset.reviewable.logger")
    def test_clean_next_reviewable_for_topic_exception(self, task_logger):
        row = self.topic_reviewable
        with (
            mock.patch.object(row, "delete", side_effect=Exception("fail")),
            mock.patch(
                "concordia.tasks.next_asset.reviewable.find_invalid_next_reviewable_topic_assets",
                return_value=[row],
            ),
        ):
            clean_next_reviewable_for_topic(self.topic.id)
        task_logger.exception.assert_called_once()


================================================
FILE: concordia/tests/test_tasks_reports_backfill.py
================================================
from django.test import TestCase
from django.utils import timezone

from concordia.models import Campaign, SiteReport, Topic
from concordia.tasks.reports.backfill import (
    backfill_assets_started_for_site_reports,
)


class BackfillAssetsStartedTaskTests(TestCase):
    def _dt(self, days_ago):
        """Return ``timezone.now()`` shifted back by ``days_ago`` days.

        Args:
            days_ago: Number of days to subtract from the current time.

        Returns:
            The datetime produced by ``timezone.now()`` minus ``days_ago`` days.
        """
        # ``timedelta`` is only an incidental import inside
        # ``django.utils.timezone`` and is not part of its documented API, so
        # take it from the standard library instead.
        from datetime import timedelta

        return timezone.now() - timedelta(days=days_ago)

    def test_updates_total_and_skips_existing_by_default(self):
        """Default run fills null ``assets_started`` and skips populated rows."""

        def total_row(total, not_started, published, started):
            # One snapshot row in the TOTAL series.
            return SiteReport.objects.create(
                report_name=SiteReport.ReportName.TOTAL,
                assets_total=total,
                assets_not_started=not_started,
                assets_published=published,
                assets_started=started,
            )

        def campaign_row(campaign, total, not_started):
            # One snapshot row in a per-campaign series, not yet backfilled.
            return SiteReport.objects.create(
                campaign=campaign,
                assets_total=total,
                assets_not_started=not_started,
                assets_published=0,
                assets_started=None,
            )

        def stamp(report, when):
            # Overwrite created_on through a queryset update.
            SiteReport.objects.filter(pk=report.pk).update(created_on=when)

        # Three TOTAL rows in time order. The last is already populated and
        # should be skipped in default mode.
        r1 = total_row(100, 100, 10, None)
        r2 = total_row(107, 92, 17, None)
        r3 = total_row(100, 90, 20, 5)

        dt1, dt2, dt3 = self._dt(3), self._dt(2), self._dt(1)
        for report, when in ((r1, dt1), (r2, dt2), (r3, dt3)):
            stamp(report, when)

        # The TOTAL series assets_started is now expected to be rolled up from
        # per-campaign series that were generated on the same reporting day.
        camp1 = Campaign.objects.create(title="C1", slug="c1")
        camp2 = Campaign.objects.create(title="C2", slug="c2")

        c1_prev = campaign_row(camp1, 50, 50)
        c1_curr = campaign_row(camp1, 50, 40)
        c2_prev = campaign_row(camp2, 50, 50)
        c2_curr = campaign_row(camp2, 52, 47)

        for report, when in (
            (c1_prev, dt1),
            (c1_curr, dt2),
            (c2_prev, dt1),
            (c2_curr, dt2),
        ):
            stamp(report, when)

        updated = backfill_assets_started_for_site_reports.run()
        # Campaign series (2 campaigns x 2 rows) + TOTAL series (2 rows).
        self.assertEqual(updated, 6)

        for report in (r1, r2, r3, c1_prev, c1_curr, c2_prev, c2_curr):
            report.refresh_from_db()

        expected_started = (
            (c1_prev, 0),
            (c1_curr, 10),
            (c2_prev, 0),
            (c2_curr, 5),
            (r1, 0),
            (r2, 15),
            (r3, 5),
        )
        for report, expected in expected_started:
            self.assertEqual(report.assets_started, expected)

    def test_recompute_when_skip_existing_is_false(self):
        """``skip_existing=False`` recomputes rows that already hold a value.

        Builds a TOTAL series with two rows. The first row is given a wrong,
        non-null ``assets_started`` so it should be recomputed when
        ``skip_existing`` is False.

        The TOTAL series ``assets_started`` is expected to be rolled up from
        per-campaign series generated on the same reporting day.
        """
        prev = SiteReport.objects.create(
            report_name=SiteReport.ReportName.TOTAL,
            assets_total=100,
            assets_not_started=100,
            assets_published=10,
        )
        curr = SiteReport.objects.create(
            report_name=SiteReport.ReportName.TOTAL,
            assets_total=105,
            assets_not_started=90,
            assets_published=15,
        )

        # Use the class helper rather than ``timezone.timedelta``, which is
        # only an incidental import inside ``django.utils.timezone``.
        dt_prev = self._dt(2)
        dt_curr = self._dt(1)

        # Enforce chronological order for the iterator
        SiteReport.objects.filter(pk=prev.pk).update(created_on=dt_prev)
        SiteReport.objects.filter(pk=curr.pk).update(created_on=dt_curr)

        # Wrong non-null on first row, null on second.
        SiteReport.objects.filter(pk=prev.pk).update(assets_started=5)
        SiteReport.objects.filter(pk=curr.pk).update(assets_started=None)

        camp = Campaign.objects.create(title="C", slug="c")

        c_prev = SiteReport.objects.create(
            campaign=camp,
            assets_total=100,
            assets_not_started=100,
            assets_published=0,
            assets_started=None,
        )
        c_curr = SiteReport.objects.create(
            campaign=camp,
            assets_total=105,
            assets_not_started=90,
            assets_published=0,
            assets_started=None,
        )
        # The campaign rows share the TOTAL rows' timestamps.
        SiteReport.objects.filter(pk=c_prev.pk).update(created_on=dt_prev)
        SiteReport.objects.filter(pk=c_curr.pk).update(created_on=dt_curr)

        updated = backfill_assets_started_for_site_reports.run(skip_existing=False)
        # Campaign series (2 rows) + TOTAL series (2 rows).
        self.assertEqual(updated, 4)

        prev_refreshed = SiteReport.objects.get(pk=prev.pk)
        curr_refreshed = SiteReport.objects.get(pk=curr.pk)
        c_prev.refresh_from_db()
        c_curr.refresh_from_db()

        self.assertEqual(c_prev.assets_started, 0)
        self.assertEqual(c_curr.assets_started, 15)

        self.assertEqual(prev_refreshed.assets_started, 0)
        self.assertEqual(curr_refreshed.assets_started, 15)

    def test_processes_retired_campaign_and_topic_series(self):
        """Single-row RETIRED_TOTAL, campaign and topic series are each set to 0."""

        def stamp(report, days_ago):
            # Overwrite created_on through a queryset update.
            when = self._dt(days_ago)
            SiteReport.objects.filter(pk=report.pk).update(created_on=when)

        # One RETIRED_TOTAL row
        retired_row = SiteReport.objects.create(
            report_name=SiteReport.ReportName.RETIRED_TOTAL,
            assets_not_started=10,
            assets_published=2,
            assets_started=None,
        )
        stamp(retired_row, 3)

        # One per-campaign row
        campaign_row = SiteReport.objects.create(
            campaign=Campaign.objects.create(title="C", slug="c"),
            assets_not_started=7,
            assets_published=1,
            assets_started=None,
        )
        stamp(campaign_row, 2)

        # One per-topic row
        topic_row = SiteReport.objects.create(
            topic=Topic.objects.create(title="T", slug="t"),
            assets_not_started=5,
            assets_published=0,
            assets_started=None,
        )
        stamp(topic_row, 1)

        updated = backfill_assets_started_for_site_reports.run()
        # Each single-row series sets assets_started to 0
        self.assertEqual(updated, 3)

        all_rows = (retired_row, campaign_row, topic_row)
        for row in all_rows:
            row.refresh_from_db()
        for row in all_rows:
            self.assertEqual(row.assets_started, 0)

    def test_skip_existing_branch_emits_heartbeat_due_to_time(self):
        """A heartbeat is logged for a skipped row when the patched clock advances."""
        from unittest import mock

        # First row already populated (skipped); second row needs update.
        skipped = SiteReport.objects.create(
            report_name=SiteReport.ReportName.TOTAL,
            assets_not_started=100,
            assets_published=10,
            assets_started=0,
        )
        pending = SiteReport.objects.create(
            report_name=SiteReport.ReportName.TOTAL,
            assets_not_started=90,
            assets_published=15,
            assets_started=None,
        )

        for report, days_ago in ((skipped, 2), (pending, 1)):
            when = self._dt(days_ago)
            SiteReport.objects.filter(pk=report.pk).update(created_on=when)

        def ticking_clock(step=11.0):
            # Replacement for time.monotonic: every call returns a value
            # ``step`` larger than the previous one, so it never runs out of
            # values the way a finite side_effect list would.
            elapsed = 0.0

            def tick():
                nonlocal elapsed
                elapsed += step
                return elapsed

            return tick

        # Keyword arguments the heartbeat log call for the skipped row must carry.
        wanted = {
            "event_code": "assets_started_backfill_series_heartbeat",
            "series": "TOTAL",
            "scanned_rows": 1,
            "last_seen_site_report_id": skipped.id,
        }

        with (
            mock.patch("concordia.tasks.reports.backfill.structured_logger") as slog,
            mock.patch(
                "concordia.tasks.reports.backfill.time.monotonic",
                new=ticking_clock(),
            ),
        ):
            updated = backfill_assets_started_for_site_reports.run()
            self.assertEqual(updated, 1)

            heartbeats = []
            for logged in slog.info.call_args_list:
                if all(logged.kwargs.get(key) == val for key, val in wanted.items()):
                    heartbeats.append(logged)
            self.assertTrue(heartbeats)

    def test_post_scan_heartbeat_emitted_due_to_time(self):
        """A heartbeat is logged after the single row of a series is saved."""
        from unittest import mock

        # Single-row series where a save occurs, then a heartbeat fires due to
        # elapsed time.
        only_row = SiteReport.objects.create(
            report_name=SiteReport.ReportName.TOTAL,
            assets_not_started=50,
            assets_published=5,
            assets_started=None,
        )
        SiteReport.objects.filter(pk=only_row.pk).update(created_on=self._dt(1))

        def ticking_clock(step=11.0):
            # Replacement for time.monotonic: every call returns a value
            # ``step`` larger than the previous one.
            elapsed = 0.0

            def tick():
                nonlocal elapsed
                elapsed += step
                return elapsed

            return tick

        expected_fields = {
            "event_code": "assets_started_backfill_series_heartbeat",
            "series": "TOTAL",
            "scanned_rows": 1,
            "updated_rows": 1,
            "last_seen_site_report_id": only_row.id,
        }

        with (
            mock.patch("concordia.tasks.reports.backfill.structured_logger") as slog,
            mock.patch(
                "concordia.tasks.reports.backfill.time.monotonic",
                new=ticking_clock(),
            ),
        ):
            updated = backfill_assets_started_for_site_reports.run()
            self.assertEqual(updated, 1)

            slog.info.assert_any_call("Scanning series...", **expected_fields)

    def test_no_update_when_equal_with_skip_existing_false(self):
        # The older row already holds the value a recompute would produce
        # (zero for the first snapshot), so recomputing must not save it again.
        from unittest import mock

        total = SiteReport.ReportName.TOTAL
        older = SiteReport.objects.create(
            report_name=total,
            assets_not_started=100,
            assets_published=10,
            assets_started=0,
        )
        newer = SiteReport.objects.create(
            report_name=total,
            assets_not_started=90,
            assets_published=15,
            assets_started=None,
        )

        for report, days_ago in ((older, 2), (newer, 1)):
            SiteReport.objects.filter(pk=report.pk).update(
                created_on=self._dt(days_ago)
            )

        with mock.patch("concordia.tasks.reports.backfill.structured_logger") as slog:
            updated = backfill_assets_started_for_site_reports.run(skip_existing=False)
            self.assertEqual(updated, 1)

            # Ids named by per-row log entries: the newer row must be there,
            # the already-matching older row must not.
            logged_ids = {
                call.kwargs.get("site_report_id")
                for call in slog.info.call_args_list
                if call.kwargs.get("event_code") == "assets_started_backfill_row"
            }
            self.assertIn(newer.id, logged_ids)
            self.assertNotIn(older.id, logged_ids)

    def test_total_assets_started_is_rolled_up_from_campaign_series(self):
        # When campaign series rows exist for the same reporting days, the
        # TOTAL series must take assets_started from them instead of deriving
        # it from its own assets_total/assets_not_started deltas.
        campaign = Campaign.objects.create(title="C", slug="c")

        total_name = SiteReport.ReportName.TOTAL
        total_prev = SiteReport.objects.create(
            report_name=total_name,
            assets_total=999,
            assets_not_started=999,
            assets_started=None,
        )
        total_curr = SiteReport.objects.create(
            report_name=total_name,
            assets_total=999,
            assets_not_started=0,
            assets_started=None,
        )
        campaign_prev = SiteReport.objects.create(
            campaign=campaign,
            assets_total=20,
            assets_not_started=20,
            assets_started=None,
        )
        campaign_curr = SiteReport.objects.create(
            campaign=campaign,
            assets_total=20,
            assets_not_started=15,
            assets_started=None,
        )

        # Both series share the same two reporting timestamps.
        earlier = self._dt(2)
        later = self._dt(1)
        for report, stamp in (
            (total_prev, earlier),
            (total_curr, later),
            (campaign_prev, earlier),
            (campaign_curr, later),
        ):
            SiteReport.objects.filter(pk=report.pk).update(created_on=stamp)

        updated = backfill_assets_started_for_site_reports.run(skip_existing=False)
        self.assertEqual(updated, 4)

        reports = (total_prev, total_curr, campaign_prev, campaign_curr)
        for report in reports:
            report.refresh_from_db()

        # Campaign rows first, then the TOTAL rows that mirror them.
        for report, expected in (
            (campaign_prev, 0),
            (campaign_curr, 5),
            (total_prev, 0),
            (total_curr, 5),
        ):
            self.assertEqual(report.assets_started, expected)


================================================
FILE: concordia/tests/test_tasks_reports_key_metrics.py
================================================
from datetime import date, datetime
from types import SimpleNamespace
from unittest import mock

from django.test import TestCase
from django.utils import timezone

from concordia.models import KeyMetricsReport, SiteReport
from concordia.tasks.reports.key_metrics import build_key_metrics_reports


class BuildKeyMetricsReportsTaskTests(TestCase):
    def _dt(self, days_ago):
        # Return timezone.now() shifted back by `days_ago` days.
        #
        # timedelta is imported from the standard library here instead of
        # being reached as `timezone.timedelta`: django.utils.timezone only
        # exposes that name because it imports it for its own use, so it is
        # not an API this helper should depend on.
        from datetime import timedelta

        return timezone.now() - timedelta(days=days_ago)

    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_recompute_all_calls_all_upserts(self, mock_localdate):
        # Pin "today" to a mid-month date so the run is deterministic.
        today = date(2024, 3, 15)
        mock_localdate.return_value = today

        # The only SiteReport falls inside the current month, so just one
        # month is walked.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_time = timezone.make_aware(
            datetime(2024, 3, 10, 12, 0, 0), timezone.get_current_timezone()
        )
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_time)

        # Fields shared by the pre-existing MONTHLY and QUARTERLY rows.
        period_fields = {
            "period_start": today.replace(day=1),
            "period_end": today,
            "fiscal_year": KeyMetricsReport.get_fiscal_year_for_date(today),
            "fiscal_quarter": KeyMetricsReport.get_fiscal_quarter_for_date(today),
        }
        KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            month=today.month,
            **period_fields,
        )
        KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY,
            **period_fields,
        )

        def blank_report():
            # Stand-in for the report object each upsert returns.
            return mock.Mock(period_start=None, period_end=None)

        with (
            mock.patch.object(
                KeyMetricsReport, "upsert_month", return_value=blank_report()
            ) as up_m,
            mock.patch.object(
                KeyMetricsReport, "upsert_quarter", return_value=blank_report()
            ) as up_q,
            mock.patch.object(
                KeyMetricsReport, "upsert_fiscal_year", return_value=blank_report()
            ) as up_y,
        ):
            changed = build_key_metrics_reports.run(recompute_all=True)

        # One month, four quarters, one fiscal year
        self.assertEqual(changed, 6)
        self.assertEqual(
            (up_m.call_count, up_q.call_count, up_y.call_count),
            (1, 4, 1),
        )

    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_incremental_refresh_and_creates(self, mock_localdate):
        # Pin "today" to a mid-month date so the month logic is deterministic.
        today = date(2024, 3, 15)
        mock_localdate.return_value = today

        current_tz = timezone.get_current_timezone()

        # A single SiteReport inside this month so the month is considered.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        SiteReport.objects.filter(pk=snapshot.pk).update(
            created_on=timezone.make_aware(datetime(2024, 3, 10, 12, 0, 0), current_tz)
        )

        period_fields = {
            "period_start": today.replace(day=1),
            "period_end": today,
            "fiscal_year": KeyMetricsReport.get_fiscal_year_for_date(today),
            "fiscal_quarter": KeyMetricsReport.get_fiscal_quarter_for_date(today),
        }
        # Old timestamp shared by both pre-existing rows.
        stale = timezone.make_aware(datetime(2024, 3, 1, 0, 0, 0), current_tz)

        # Existing MONTHLY row with an old updated_on so it is refreshed.
        monthly_row = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            month=today.month,
            **period_fields,
        )
        KeyMetricsReport.objects.filter(pk=monthly_row.pk).update(updated_on=stale)

        # Existing QUARTERLY row for the same quarter. The other three quarters
        # are missing and will be created. Its updated_on equals the MONTHLY
        # row's, so only the missing quarters are upserted.
        quarterly_row = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY,
            **period_fields,
        )
        KeyMetricsReport.objects.filter(pk=quarterly_row.pk).update(updated_on=stale)

        def blank_report():
            # Stand-in for the report object each upsert returns.
            return mock.Mock(period_start=None, period_end=None)

        # There is no FY row yet, so the FY stage creates one.
        with (
            mock.patch.object(
                KeyMetricsReport, "upsert_month", return_value=blank_report()
            ) as up_m,
            mock.patch.object(
                KeyMetricsReport, "upsert_quarter", return_value=blank_report()
            ) as up_q,
            mock.patch.object(
                KeyMetricsReport, "upsert_fiscal_year", return_value=blank_report()
            ) as up_y,
        ):
            changed = build_key_metrics_reports(recompute_all=False)

        # One monthly refresh, three quarterly creates (no refresh since the
        # mock does not bump monthly.updated_on), and one fiscal year create.
        self.assertEqual(changed, 5)
        self.assertEqual(
            (up_m.call_count, up_q.call_count, up_y.call_count),
            (1, 3, 1),
        )

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch("concordia.tasks.reports.key_metrics.SiteReport")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_early_return_after_backsteps(self, mock_local, mock_sr, slog):
        # "Today" is mid-March, so last_month_start starts at Mar 1.
        mock_local.return_value = date(2024, 3, 15)

        manager = mock_sr.objects

        # The earliest snapshot is mid-December, so first_month_start is Dec 1.
        first_seen = timezone.make_aware(datetime(2023, 12, 15, 12, 0, 0))
        manager.order_by.return_value.first.return_value = SimpleNamespace(
            created_on=first_seen
        )

        # Report "no snapshots by end of month" for every month checked.
        manager.filter.return_value.exists.return_value = False

        changed = build_key_metrics_reports(recompute_all=False)
        self.assertEqual(changed, 0)

        # The "no months" message must have been logged.
        logged_codes = [
            call.kwargs.get("event_code")
            for call in slog.info.call_args_list
            if call.kwargs
        ]
        self.assertIn("key_metrics_build_no_months", logged_codes)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_recompute_all_month_upsert_and_december_rollover(
        self, mock_local, upsert_month, slog
    ):
        # Put "today" in December so December is the month being processed.
        mock_local.return_value = date(2023, 12, 20)

        # A TOTAL snapshot in December keeps the scan from returning early.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        december_stamp = timezone.make_aware(datetime(2023, 12, 15, 10, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=december_stamp)

        # The monthly upsert hands back a stub so the "upserted" logging runs.
        december_report = SimpleNamespace(
            period_start=date(2023, 12, 1),
            period_end=date(2023, 12, 31),
        )
        upsert_month.return_value = december_report

        changed = build_key_metrics_reports(recompute_all=True)
        self.assertGreaterEqual(changed, 1)

        logged_codes = [
            call.kwargs.get("event_code")
            for call in slog.info.call_args_list
            if call.kwargs
        ]
        self.assertIn("key_metrics_month_upserted", logged_codes)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_incremental_month_create_and_refresh(
        self,
        mock_local,
        upsert_month,
        upsert_year,
        upsert_quarter,
        slog,
    ):
        mock_local.return_value = date(2024, 2, 1)

        # Two TOTAL snapshots: the January one is created first, then December.
        for snapshot_time in (
            datetime(2024, 1, 10, 9, 0, 0),
            datetime(2023, 12, 20, 9, 0, 0),
        ):
            snapshot = SiteReport.objects.create(
                report_name=SiteReport.ReportName.TOTAL
            )
            SiteReport.objects.filter(pk=snapshot.pk).update(
                created_on=timezone.make_aware(snapshot_time)
            )

        # A December MONTHLY row already exists, with an old updated_on.
        december_row = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            period_start=date(2023, 12, 1),
            period_end=date(2023, 12, 31),
            fiscal_year=2024,
            fiscal_quarter=1,
            month=12,
        )
        old_stamp = timezone.make_aware(datetime(2023, 12, 1, 0, 0, 0))
        KeyMetricsReport.objects.filter(pk=december_row.pk).update(
            updated_on=old_stamp
        )

        # Each monthly upsert returns a stub, so every call counts as a change.
        upsert_month.return_value = SimpleNamespace(
            period_start=date(2024, 1, 1), period_end=date(2024, 1, 31)
        )
        # Quarterly and fiscal-year upserts return nothing, so they add no
        # increments.
        upsert_quarter.return_value = None
        upsert_year.return_value = None

        changed = build_key_metrics_reports(recompute_all=False)
        self.assertEqual(changed, 2)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.objects")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_quarter_recompute_all_logs(
        self, mock_local, upsert_month, upsert_quarter, kmr_objects, slog
    ):
        mock_local.return_value = date(2024, 1, 15)

        # One snapshot anywhere is enough to avoid the early return.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        SiteReport.objects.filter(pk=snapshot.pk).update(
            created_on=timezone.make_aware(datetime(2024, 1, 1, 8, 0, 0))
        )

        # Monthly upserts are not exercised here.
        upsert_month.return_value = None

        # Everything below configures the object the mocked manager returns
        # from filter(...).
        filtered = kmr_objects.filter.return_value
        # monthly_rows -> one fiscal year (2024)
        filtered.values.return_value.annotate.return_value = [{"fiscal_year": 2024}]
        # quarter_exists .first() can be anything; ignored in recompute_all.
        filtered.first.return_value = None
        # No quarter years are reported later, which keeps the FY stage idle.
        filtered.values_list.return_value = []

        upsert_quarter.return_value = SimpleNamespace(
            period_start=date(2024, 1, 1), period_end=date(2024, 3, 31)
        )

        changed = build_key_metrics_reports(recompute_all=True)
        # Four quarters upserted
        self.assertGreaterEqual(changed, 4)
        self.assertEqual(upsert_quarter.call_count, 4)

        logged_codes = [
            call.kwargs.get("event_code")
            for call in slog.info.call_args_list
            if call.kwargs
        ]
        self.assertIn("key_metrics_quarter_upserted", logged_codes)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.objects")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_quarter_incremental_refresh_all_quarters(
        self, mock_local, upsert_month, kmr_objects, upsert_quarter, slog
    ):
        # Incremental run in which every quarter row already exists and a
        # newer monthly row is reported, so all four quarters are refreshed.
        mock_local.return_value = date(2024, 6, 15)

        # Ensure we do not early-return.
        sr = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        SiteReport.objects.filter(pk=sr.pk).update(
            created_on=timezone.make_aware(datetime(2024, 5, 10, 8, 0, 0))
        )

        # No monthly creation in this test.
        upsert_month.return_value = None

        # quarter_exists present for all four quarters.
        quarter_stub = SimpleNamespace(
            updated_on=timezone.make_aware(datetime(2024, 1, 1, 0, 0, 0))
        )

        class FakeQuerySet:
            # Minimal stand-in for what the patched
            # KeyMetricsReport.objects.filter() returns. Every filter() call
            # is answered by filter_side_effect below, so this class is the
            # single place where the fake query results are defined.
            def __init__(self, exists_value=False):
                self._exists = exists_value

            def first(self):
                # Always yield a stub so the "refresh" path is taken.
                return quarter_stub

            def exists(self):
                return self._exists

            def values(self, *a, **k):
                return self

            def annotate(self, *a, **k):
                # Signal that we have monthly rows for fiscal_year=2024.
                return [{"fiscal_year": 2024}]

            def values_list(self, *a, **k):
                # Avoid FY stage in this test
                return []

        def filter_side_effect(*args, **kwargs):
            pt = kwargs.get("period_type")
            if pt == KeyMetricsReport.PeriodType.MONTHLY and "updated_on__gt" in kwargs:
                # Make monthly_newer_exists True
                return FakeQuerySet(exists_value=True)
            return FakeQuerySet()

        # side_effect takes precedence over filter.return_value, so no
        # return_value chain is configured on the mock.
        kmr_objects.filter.side_effect = filter_side_effect

        upsert_quarter.return_value = SimpleNamespace(
            period_start=date(2024, 4, 1), period_end=date(2024, 6, 30)
        )

        changed = build_key_metrics_reports(recompute_all=False)
        # Four refreshes (Q1..Q4)
        self.assertGreaterEqual(changed, 4)
        self.assertEqual(upsert_quarter.call_count, 4)

        codes = [kw.get("event_code") for _, kw in slog.info.call_args_list if kw]
        self.assertIn("key_metrics_quarter_refreshed", codes)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.objects")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_recompute_all_logs(
        self, mock_local, upsert_month, kmr_objects, upsert_year, slog
    ):
        mock_local.return_value = date(2024, 1, 15)

        # One snapshot so the task does not return early.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_time = timezone.make_aware(datetime(2024, 1, 2, 8, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_time)

        upsert_month.return_value = None

        # The mocked manager's filter(...) result: no monthlies needed, and
        # quarters present for FY 2027.
        filtered = kmr_objects.filter.return_value
        filtered.values.return_value.annotate.return_value = []
        filtered.values_list.return_value = [2027]
        filtered.first.return_value = None

        upsert_year.return_value = SimpleNamespace(
            period_start=date(2026, 10, 1), period_end=date(2027, 9, 30)
        )

        changed = build_key_metrics_reports(recompute_all=True)
        self.assertGreaterEqual(changed, 1)

        logged_codes = [
            call.kwargs.get("event_code")
            for call in slog.info.call_args_list
            if call.kwargs
        ]
        self.assertIn("key_metrics_year_upserted", logged_codes)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.objects")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_incremental_create_and_refresh(
        self, mock_local, upsert_month, kmr_objects, upsert_year, slog
    ):
        mock_local.return_value = date(2024, 5, 1)

        # One snapshot so the task does not return early.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        SiteReport.objects.filter(pk=snapshot.pk).update(
            created_on=timezone.make_aware(datetime(2024, 4, 15, 8, 0, 0))
        )
        upsert_month.return_value = None

        def fake_filter(fy_row, newer_exists):
            # Build a replacement for objects.filter(). Its result answers
            # values_list() with FY 2026 (the "fiscal_years_with_quarters"
            # query), annotate() with no rows, first() with `fy_row` and
            # exists() with `newer_exists`.
            def _filter(*args, **kwargs):
                qs = SimpleNamespace()
                qs.values_list = lambda *a, **k: [2026]
                qs.first = lambda: fy_row
                qs.values = lambda *a, **k: qs
                qs.annotate = lambda *a, **k: []
                qs.exists = lambda: newer_exists
                return qs

            return _filter

        def fy_report():
            # Fresh stub for the report returned by the fiscal-year upsert.
            return SimpleNamespace(
                period_start=date(2025, 10, 1), period_end=date(2026, 9, 30)
            )

        def logged_codes():
            # Event codes of every slog.info call recorded so far.
            return [
                call.kwargs.get("event_code")
                for call in slog.info.call_args_list
                if call.kwargs
            ]

        # Phase 1, "create" path: quarters exist, FY row is missing.
        kmr_objects.filter.side_effect = fake_filter(fy_row=None, newer_exists=False)
        upsert_year.return_value = fy_report()

        created_count = build_key_metrics_reports(recompute_all=False)
        self.assertGreaterEqual(created_count, 1)
        self.assertIn("key_metrics_year_created", logged_codes())

        # Phase 2, "refresh" path: the FY row exists and a quarter newer than
        # its updated_on is reported.
        existing_fy = SimpleNamespace(
            updated_on=timezone.make_aware(datetime(2024, 3, 1, 0, 0, 0))
        )
        kmr_objects.filter.side_effect = fake_filter(
            fy_row=existing_fy, newer_exists=True
        )
        upsert_year.return_value = fy_report()

        refreshed_count = build_key_metrics_reports(recompute_all=False)
        self.assertGreaterEqual(refreshed_count, 1)
        self.assertIn("key_metrics_year_refreshed", logged_codes())

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_recompute_all_quarter_upserts_only(
        self, mock_local, mock_month, mock_quarter, mock_year, slog
    ):
        mock_local.return_value = date(2024, 2, 1)

        # One site snapshot gives the task a start month (Jan 2024).
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_time = timezone.make_aware(datetime(2024, 1, 10, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_time)

        # A MONTHLY row so the quarter loop sees FY 2024 in the set.
        KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 1, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
            month=1,
        )

        # Monthly and FY upserts return nothing; each quarter upsert gets a
        # newly built stub report.
        mock_month.return_value = None
        mock_year.return_value = None
        mock_quarter.side_effect = lambda **kwargs: SimpleNamespace(
            period_start=date(2024, 1, 1), period_end=date(2024, 3, 31)
        )

        changed = build_key_metrics_reports(recompute_all=True)

        # Only quarters (4) should have counted.
        self.assertEqual((changed, mock_quarter.call_count), (4, 4))

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_incremental_quarter_refresh_only(
        self, mock_local, mock_month, mock_quarter, mock_year, slog
    ):
        mock_local.return_value = date(2024, 4, 1)

        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        SiteReport.objects.filter(pk=snapshot.pk).update(
            created_on=timezone.make_aware(datetime(2024, 1, 10, 9, 0, 0))
        )

        period_types = KeyMetricsReport.PeriodType

        # Monthlies for Q2; newer than the quarter row we will refresh
        monthly_stamp = timezone.make_aware(datetime(2024, 3, 31, 12, 0, 0))
        for month_number in (1, 2, 3):
            month_end = KeyMetricsReport.month_bounds(date(2024, month_number, 15))[1]
            monthly = KeyMetricsReport.objects.create(
                period_type=period_types.MONTHLY,
                period_start=date(2024, month_number, 1),
                period_end=month_end,
                fiscal_year=2024,
                fiscal_quarter=2,
                month=month_number,
            )
            KeyMetricsReport.objects.filter(pk=monthly.pk).update(
                updated_on=monthly_stamp
            )

        # Q1, Q3 and Q4 exist up front so the task does not create them.
        existing_quarters = {
            1: (date(2023, 10, 1), date(2023, 12, 31)),
            3: (date(2024, 4, 1), date(2024, 6, 30)),
            4: (date(2024, 7, 1), date(2024, 9, 30)),
        }
        for quarter_number, (starts, ends) in existing_quarters.items():
            KeyMetricsReport.objects.create(
                period_type=period_types.QUARTERLY,
                period_start=starts,
                period_end=ends,
                fiscal_year=2024,
                fiscal_quarter=quarter_number,
            )

        # Q2 exists with an older updated_on, so it is the only quarter that
        # refreshes.
        second_quarter = KeyMetricsReport.objects.create(
            period_type=period_types.QUARTERLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 3, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
        )
        KeyMetricsReport.objects.filter(pk=second_quarter.pk).update(
            updated_on=timezone.make_aware(datetime(2024, 1, 15, 0, 0, 0))
        )

        mock_month.return_value = None
        mock_year.return_value = None
        mock_quarter.return_value = SimpleNamespace(
            period_start=date(2024, 1, 1), period_end=date(2024, 3, 31)
        )

        changed = build_key_metrics_reports(recompute_all=False)

        self.assertEqual((changed, mock_quarter.call_count), (1, 1))

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_recompute_all_year_upsert_only(
        self, mock_local, mock_month, mock_quarter, mock_year, slog
    ):
        mock_local.return_value = date(2024, 2, 1)

        # A snapshot so the task can pick a month.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_time = timezone.make_aware(datetime(2024, 1, 10, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_time)

        # A QUARTERLY row keeps the 'fiscal_years_with_quarters' set non-empty.
        quarterly_fields = {
            "period_type": KeyMetricsReport.PeriodType.QUARTERLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 3, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
        }
        KeyMetricsReport.objects.create(**quarterly_fields)

        # Monthly and quarterly upserts return nothing; only the FY upsert
        # returns a stub report.
        mock_month.return_value = None
        mock_quarter.return_value = None
        mock_year.return_value = SimpleNamespace(
            period_start=date(2024, 10, 1), period_end=date(2025, 9, 30)
        )

        changed = build_key_metrics_reports(recompute_all=True)

        self.assertEqual((changed, mock_year.call_count), (1, 1))

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_incremental_year_create(
        self, mock_local, mock_month, mock_quarter, mock_year, slog
    ):
        mock_local.return_value = date(2024, 2, 1)

        # A snapshot plus one quarterly row, so the year loop triggers.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_time = timezone.make_aware(datetime(2024, 1, 10, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_time)

        quarterly_fields = {
            "period_type": KeyMetricsReport.PeriodType.QUARTERLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 3, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
        }
        KeyMetricsReport.objects.create(**quarterly_fields)

        # Only the fiscal-year upsert returns a report.
        mock_month.return_value = None
        mock_quarter.return_value = None
        mock_year.return_value = SimpleNamespace(
            period_start=date(2024, 10, 1), period_end=date(2025, 9, 30)
        )

        changed = build_key_metrics_reports(recompute_all=False)

        self.assertEqual((changed, mock_year.call_count), (1, 1))

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_incremental_year_refresh(
        self, mock_local, mock_month, mock_quarter, mock_year, slog
    ):
        # Incremental run where an existing fiscal-year row carries an older
        # updated_on than a quarterly row of the same fiscal year. The test
        # expects one fiscal-year upsert call and a returned count of 1.
        mock_local.return_value = date(2024, 4, 1)
        rows = KeyMetricsReport.objects
        period_types = KeyMetricsReport.PeriodType

        # Quarterly row, stamped 2024-03-31 12:00.
        quarter_row = rows.create(
            period_type=period_types.QUARTERLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 3, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
        )
        quarter_stamp = timezone.make_aware(datetime(2024, 3, 31, 12, 0, 0))
        rows.filter(pk=quarter_row.pk).update(updated_on=quarter_stamp)

        # Fiscal-year row, stamped earlier (2024-01-01) so it should be
        # refreshed.
        year_row = rows.create(
            period_type=period_types.FISCAL_YEAR,
            period_start=date(2023, 10, 1),
            period_end=date(2024, 9, 30),
            fiscal_year=2024,
        )
        year_stamp = timezone.make_aware(datetime(2024, 1, 1, 0, 0, 0))
        rows.filter(pk=year_row.pk).update(updated_on=year_stamp)

        # A snapshot is needed so the task can initialize months; the month
        # and quarter stages themselves are neutralized below.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(datetime(2024, 1, 10, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        mock_month.return_value = None
        mock_quarter.return_value = None
        mock_year.return_value = SimpleNamespace(
            period_start=date(2023, 10, 1), period_end=date(2024, 9, 30)
        )

        rows_changed = build_key_metrics_reports(recompute_all=False)

        self.assertEqual(rows_changed, 1)
        self.assertEqual(mock_year.call_count, 1)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_quarter_recompute_all_upserts_and_continue(
        self,
        mock_localdate,
        mock_upsert_month,
        mock_upsert_quarter,
        mock_upsert_year,
        slog,
    ):
        # Full recompute through the task's ``run`` entry point with one
        # MONTHLY row seeded for fiscal year 2024. The test expects four
        # quarter upsert calls and a returned count of 4.
        mock_localdate.return_value = date(2024, 4, 1)

        # Month and fiscal-year upserts return None so they add nothing to
        # the count.
        for inert_upsert in (mock_upsert_month, mock_upsert_year):
            inert_upsert.return_value = None

        # Minimal SiteReport so the monthly stage can compute bounds safely.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(datetime(2024, 1, 10, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        # MONTHLY row that lets fiscal year 2024 be discovered.
        monthly_seed = {
            "period_type": KeyMetricsReport.PeriodType.MONTHLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 1, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
            "month": 1,
        }
        KeyMetricsReport.objects.create(**monthly_seed)

        # Every quarter upsert returns a non-None object.
        quarter_result = SimpleNamespace(
            period_start=date(2024, 1, 1), period_end=date(2024, 3, 31)
        )
        mock_upsert_quarter.return_value = quarter_result

        rows_changed = build_key_metrics_reports.run(recompute_all=True)

        # Four quarters upserted; monthly and FY upserts return None.
        self.assertEqual(rows_changed, 4)
        self.assertEqual(mock_upsert_quarter.call_count, 4)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_recompute_all_upserts_and_continue(
        self,
        mock_localdate,
        mock_upsert_month,
        mock_upsert_quarter,
        mock_upsert_year,
        slog,
    ):
        # Full recompute through the task's ``run`` entry point with one
        # QUARTERLY row seeded for fiscal year 2024. The test expects one
        # fiscal-year upsert call and a returned count of 1.
        mock_localdate.return_value = date(2024, 4, 1)

        # Month and quarter upserts return None; only the fiscal-year upsert
        # returns an object.
        for inert_upsert in (mock_upsert_month, mock_upsert_quarter):
            inert_upsert.return_value = None
        mock_upsert_year.return_value = SimpleNamespace(
            period_start=date(2023, 10, 1), period_end=date(2024, 9, 30)
        )

        # Quarter row so the FY stage finds a fiscal year to process.
        quarter_seed = {
            "period_type": KeyMetricsReport.PeriodType.QUARTERLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 3, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
        }
        KeyMetricsReport.objects.create(**quarter_seed)

        # Earliest SiteReport so the earlier stages do not error.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(datetime(2024, 1, 5, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        rows_changed = build_key_metrics_reports.run(recompute_all=True)

        # Only the FY upsert counts (quarter/month upserts return None).
        self.assertEqual(rows_changed, 1)
        self.assertEqual(mock_upsert_year.call_count, 1)

    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_quarter_recompute_all_non_none_continue_edge(
        self, mock_localdate, mock_upsert_quarter, mock_upsert_month
    ):
        # Full recompute with the month upsert patched to None and the
        # quarter upsert returning a MagicMock. The fiscal-year upsert is not
        # patched in this test. Expects four quarter upsert calls and a
        # returned count of 4.
        mock_localdate.return_value = date(2024, 5, 20)
        mock_upsert_quarter.return_value = mock.MagicMock(
            period_start=date(2024, 1, 1), period_end=date(2024, 3, 31)
        )

        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(datetime(2024, 5, 10, 12, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        # One MONTHLY row for May 2024 (fiscal year 2024, fiscal quarter 3).
        monthly_seed = {
            "period_type": KeyMetricsReport.PeriodType.MONTHLY,
            "period_start": date(2024, 5, 1),
            "period_end": date(2024, 5, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 3,
            "month": 5,
        }
        KeyMetricsReport.objects.create(**monthly_seed)

        rows_changed = build_key_metrics_reports(recompute_all=True)

        self.assertEqual(rows_changed, 4)
        self.assertEqual(mock_upsert_quarter.call_count, 4)

    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=mock.MagicMock(
            period_start=date(2024, 10, 1), period_end=date(2025, 9, 30)
        ),
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_quarter_incremental_refresh_monthly_newer(
        self,
        mock_localdate,
        mock_upsert_fy,
        mock_upsert_quarter,
        mock_upsert_month,
    ):
        # Incremental run where a MONTHLY row in fiscal quarter 2 carries a
        # newer updated_on than the Q2 quarterly row. The other quarters and
        # the fiscal-year row are stamped with the later ``now`` value. The
        # test expects a returned count of 1 and at least one quarter upsert.

        # ``timedelta`` is taken from the standard library. The name is not
        # listed in ``django.utils.timezone.__all__``; it is only reachable
        # there because that module imports it for its own use.
        from datetime import timedelta

        mock_localdate.return_value = date(2024, 1, 20)

        sr = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        SiteReport.objects.filter(pk=sr.pk).update(
            created_on=timezone.make_aware(datetime(2024, 1, 10, 9, 0, 0))
        )

        jan = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 1, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
            month=1,
        )
        # The monthly stamp is taken before ``now`` below, so it is never
        # later than the stamps given to Q1, Q3, Q4 and the fiscal-year row.
        KeyMetricsReport.objects.filter(pk=jan.pk).update(updated_on=timezone.now())

        now = timezone.now()
        older = now - timedelta(days=10)

        # (fiscal quarter, period start, period end, updated_on). Only Q2 is
        # stamped older than the monthly row.
        quarter_specs = [
            (1, date(2023, 10, 1), date(2023, 12, 31), now),
            (2, date(2024, 1, 1), date(2024, 3, 31), older),
            (3, date(2024, 4, 1), date(2024, 6, 30), now),
            (4, date(2024, 7, 1), date(2024, 9, 30), now),
        ]
        for fiscal_quarter, period_start, period_end, stamp in quarter_specs:
            quarter_row = KeyMetricsReport.objects.create(
                period_type=KeyMetricsReport.PeriodType.QUARTERLY,
                period_start=period_start,
                period_end=period_end,
                fiscal_year=2024,
                fiscal_quarter=fiscal_quarter,
            )
            KeyMetricsReport.objects.filter(pk=quarter_row.pk).update(
                updated_on=stamp
            )

        fy = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
            period_start=date(2023, 10, 1),
            period_end=date(2024, 9, 30),
            fiscal_year=2024,
        )
        KeyMetricsReport.objects.filter(pk=fy.pk).update(updated_on=now)

        # Override the decorator's ``return_value=None`` so the quarter
        # upsert returns an object.
        mock_upsert_quarter.return_value = mock.MagicMock(
            period_start=date(2024, 1, 1), period_end=date(2024, 3, 31)
        )

        changed = build_key_metrics_reports(recompute_all=False)

        self.assertEqual(changed, 1)
        self.assertGreaterEqual(mock_upsert_quarter.call_count, 1)

    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=mock.MagicMock(
            period_start=date(2024, 10, 1), period_end=date(2025, 9, 30)
        ),
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_recompute_all_non_none_continue_edge(
        self, mock_localdate, mock_upsert_fy, mock_upsert_quarter, mock_upsert_month
    ):
        # Full recompute with month and quarter upserts patched to None and
        # the fiscal-year upsert patched to return a MagicMock. Expects a
        # returned count of 1.
        mock_localdate.return_value = date(2024, 5, 20)

        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(datetime(2024, 5, 10, 12, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        # Single QUARTERLY row for fiscal year 2024.
        quarter_seed = {
            "period_type": KeyMetricsReport.PeriodType.QUARTERLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 3, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
        }
        KeyMetricsReport.objects.create(**quarter_seed)

        rows_changed = build_key_metrics_reports(recompute_all=True)
        self.assertEqual(rows_changed, 1)

    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=mock.MagicMock(
            period_start=date(2024, 10, 1), period_end=date(2025, 9, 30)
        ),
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_incremental_create_missing(
        self,
        mock_localdate,
        mock_upsert_fy,
        mock_upsert_quarter,
        mock_upsert_month,
    ):
        # Incremental run with all four quarterly rows of fiscal year 2024
        # seeded and no fiscal-year row. Expects a returned count of 1.
        mock_localdate.return_value = date(2024, 5, 20)

        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        current_tz = timezone.get_current_timezone()
        snapshot_created = timezone.make_aware(
            datetime(2024, 5, 10, 12, 0, 0), current_tz
        )
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        # Quarter bounds in fiscal order; the position in the tuple (from 1)
        # is the fiscal quarter number.
        quarter_bounds = (
            (date(2023, 10, 1), date(2023, 12, 31)),
            (date(2024, 1, 1), date(2024, 3, 31)),
            (date(2024, 4, 1), date(2024, 6, 30)),
            (date(2024, 7, 1), date(2024, 9, 30)),
        )
        for quarter_number, (first_day, last_day) in enumerate(quarter_bounds, 1):
            KeyMetricsReport.objects.create(
                period_type=KeyMetricsReport.PeriodType.QUARTERLY,
                period_start=first_day,
                period_end=last_day,
                fiscal_year=2024,
                fiscal_quarter=quarter_number,
            )

        rows_changed = build_key_metrics_reports(recompute_all=False)
        self.assertEqual(rows_changed, 1)

    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=mock.MagicMock(
            period_start=date(2024, 10, 1), period_end=date(2025, 9, 30)
        ),
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_incremental_refresh_when_quarter_newer(
        self, mock_localdate, mock_upsert_fy, mock_upsert_quarter, mock_upsert_month
    ):
        # Incremental run where the fiscal-year row is stamped seven days
        # older than the Q2 quarterly row of the same fiscal year. Month and
        # quarter upserts are patched to None and the fiscal-year upsert to a
        # MagicMock. Expects a returned count of 1.

        # ``timedelta`` is taken from the standard library. The name is not
        # listed in ``django.utils.timezone.__all__``; it is only reachable
        # there because that module imports it for its own use.
        from datetime import timedelta

        mock_localdate.return_value = date(2024, 5, 20)

        sr = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        SiteReport.objects.filter(pk=sr.pk).update(
            created_on=timezone.make_aware(datetime(2024, 5, 10, 12, 0, 0))
        )

        older = timezone.now() - timedelta(days=7)
        newer = timezone.now()

        # Fiscal-year row carrying the older stamp.
        fy = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
            period_start=date(2023, 10, 1),
            period_end=date(2024, 9, 30),
            fiscal_year=2024,
        )
        KeyMetricsReport.objects.filter(pk=fy.pk).update(updated_on=older)

        # Quarterly row carrying the newer stamp.
        q2 = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 3, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
        )
        KeyMetricsReport.objects.filter(pk=q2.pk).update(updated_on=newer)

        changed = build_key_metrics_reports(recompute_all=False)
        self.assertEqual(changed, 1)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_quarter_recompute_all_none_branch_continue(
        self, mock_localdate, upsert_quarter, upsert_month, upsert_year, slog
    ):
        # Full recompute with every upsert patched to return None. Expects
        # four quarter upsert calls and a returned count of 0.

        # Keep the monthly scan minimal and stable.
        today = date(2024, 2, 10)
        mock_localdate.return_value = today

        # Site snapshot so the task computes month bounds.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(
            datetime(2024, 2, 9, 12, 0, 0), timezone.get_current_timezone()
        )
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        # A MONTHLY row gives the quarterly stage a fiscal year to iterate;
        # the fiscal year is derived from the mocked "today".
        fiscal_year = KeyMetricsReport.get_fiscal_year_for_date(today)
        monthly_seed = {
            "period_type": KeyMetricsReport.PeriodType.MONTHLY,
            "period_start": date(2024, 2, 1),
            "period_end": date(2024, 2, 29),
            "fiscal_year": fiscal_year,
            "fiscal_quarter": 2,
            "month": 2,
        }
        KeyMetricsReport.objects.create(**monthly_seed)

        # upsert_quarter returns None on every call.
        rows_changed = build_key_metrics_reports(recompute_all=True)

        # Nothing is counted: monthly and FY upserts are neutralized and
        # each quarter upsert returned None.
        self.assertEqual(rows_changed, 0)
        self.assertEqual(upsert_quarter.call_count, 4)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_quarter_incremental_refresh_none_branch_continue(
        self,
        mock_localdate,
        mock_upsert_quarter,
        mock_upsert_month,
        mock_upsert_year,
        slog,
    ):
        # Incremental run where a MONTHLY row in fiscal quarter 2 is newer
        # than the Q2 quarterly row, while every upsert is patched to return
        # None. Expects exactly one quarter upsert call and a returned count
        # of 0.

        # ``timedelta`` is taken from the standard library. The name is not
        # listed in ``django.utils.timezone.__all__``; it is only reachable
        # there because that module imports it for its own use.
        from datetime import timedelta

        # Ensure monthly scan has a valid window
        mock_localdate.return_value = date(2024, 2, 10)

        # Seed one site snapshot so month range can be computed
        sr = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        tz = timezone.get_current_timezone()
        SiteReport.objects.filter(pk=sr.pk).update(
            created_on=timezone.make_aware(datetime(2024, 1, 5, 12, 0, 0), tz)
        )

        # Provide a MONTHLY row in FY 2024; make it "newer" than Q2
        jan = KeyMetricsReport.objects.create(
            period_type=KeyMetricsReport.PeriodType.MONTHLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 1, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
            month=1,
        )
        KeyMetricsReport.objects.filter(pk=jan.pk).update(updated_on=timezone.now())

        # Create quarter rows so the incremental branch runs.
        # Only Q2 should be older than the monthly row to trigger refresh.
        now = timezone.now()
        older = now - timedelta(days=10)
        quarters = {
            1: ((date(2023, 10, 1), date(2023, 12, 31)), now),
            2: ((date(2024, 1, 1), date(2024, 3, 31)), older),
            3: ((date(2024, 4, 1), date(2024, 6, 30)), now),
            4: ((date(2024, 7, 1), date(2024, 9, 30)), now),
        }
        for fq, ((ps, pe), updated) in quarters.items():
            q = KeyMetricsReport.objects.create(
                period_type=KeyMetricsReport.PeriodType.QUARTERLY,
                period_start=ps,
                period_end=pe,
                fiscal_year=2024,
                fiscal_quarter=fq,
            )
            KeyMetricsReport.objects.filter(pk=q.pk).update(updated_on=updated)

        # upsert_quarter is mocked to return None, so the Q2 refresh attempt
        # is expected not to increment the returned count.
        changed = build_key_metrics_reports(recompute_all=False)

        # No rows changed: month and year upserts return None, and the Q2
        # refresh returned None. Only one refresh attempt is expected.
        self.assertEqual(changed, 0)
        self.assertEqual(mock_upsert_quarter.call_count, 1)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_recompute_all_none_branch_continue(
        self,
        mock_localdate,
        mock_upsert_month,
        mock_upsert_quarter,
        mock_upsert_year,
        slog,
    ):
        # Full recompute with every upsert patched to return None. Expects
        # one fiscal-year upsert call, a returned count of 0, and no
        # "key_metrics_year_upserted" event code passed to the patched
        # logger's ``info``.
        mock_localdate.return_value = date(2024, 5, 20)

        # Snapshot so the monthly scan can initialize.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        current_tz = timezone.get_current_timezone()
        snapshot_created = timezone.make_aware(
            datetime(2024, 5, 10, 12, 0, 0), current_tz
        )
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        # At least one fiscal year must be present for the FY stage.
        quarter_seed = {
            "period_type": KeyMetricsReport.PeriodType.QUARTERLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 3, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
        }
        KeyMetricsReport.objects.create(**quarter_seed)

        # Month, quarter and FY upserts all return None.
        rows_changed = build_key_metrics_reports(recompute_all=True)

        # Nothing is counted because the FY upsert returned None.
        self.assertEqual(rows_changed, 0)
        self.assertEqual(mock_upsert_year.call_count, 1)

        # Collect event codes from info() calls that carried keyword
        # arguments.
        logged_codes = []
        for _, call_kwargs in slog.info.call_args_list:
            if call_kwargs:
                logged_codes.append(call_kwargs.get("event_code"))
        self.assertNotIn("key_metrics_year_upserted", logged_codes)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter",
        return_value=None,
    )
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month",
        return_value=None,
    )
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_fiscal_year_incremental_refresh_none_branch_continue(
        self,
        mock_localdate,
        mock_upsert_month,
        mock_upsert_quarter,
        mock_upsert_year,
        slog,
    ):
        # Incremental run where the fiscal-year row is older than a quarterly
        # row, while every upsert is patched to return None. Expects one
        # fiscal-year upsert call, a returned count of 0, and none of the
        # year-related event codes passed to the patched logger's ``info``.
        mock_localdate.return_value = date(2024, 5, 20)
        current_tz = timezone.get_current_timezone()
        rows = KeyMetricsReport.objects

        # Make the monthly stage computable.
        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(
            datetime(2024, 5, 10, 12, 0, 0), current_tz
        )
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        # Existing FY row with the older updated_on (2024-03-01).
        year_row = rows.create(
            period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
            period_start=date(2023, 10, 1),
            period_end=date(2024, 9, 30),
            fiscal_year=2024,
        )
        year_stamp = timezone.make_aware(datetime(2024, 3, 1, 0, 0, 0), current_tz)
        rows.filter(pk=year_row.pk).update(updated_on=year_stamp)

        # Quarter stamped later than the FY row (2024-03-15).
        quarter_row = rows.create(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 3, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
        )
        quarter_stamp = timezone.make_aware(
            datetime(2024, 3, 15, 0, 0, 0), current_tz
        )
        rows.filter(pk=quarter_row.pk).update(updated_on=quarter_stamp)

        # The FY upsert returns None, so nothing should be counted.
        rows_changed = build_key_metrics_reports(recompute_all=False)

        self.assertEqual(rows_changed, 0)
        self.assertEqual(mock_upsert_year.call_count, 1)

        # Collect event codes from info() calls that carried keyword
        # arguments.
        logged_codes = []
        for _, call_kwargs in slog.info.call_args_list:
            if call_kwargs:
                logged_codes.append(call_kwargs.get("event_code"))
        for unexpected_code in (
            "key_metrics_year_refreshed",
            "key_metrics_year_created",
            "key_metrics_year_upserted",
        ):
            self.assertNotIn(unexpected_code, logged_codes)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_incremental_fiscal_year_created_branch(
        self,
        mock_localdate,
        mock_upsert_month,
        mock_upsert_quarter,
        mock_upsert_year,
        slog,
    ):
        # Incremental run with a quarterly row for fiscal year 2024 and no
        # fiscal-year row. Expects one fiscal-year upsert call and a returned
        # count of 1.
        mock_localdate.return_value = date(2024, 4, 1)
        for inert_upsert in (mock_upsert_month, mock_upsert_quarter):
            inert_upsert.return_value = None
        mock_upsert_year.return_value = SimpleNamespace(
            period_start=date(2023, 10, 1), period_end=date(2024, 9, 30)
        )

        # Quarter exists for FY discovery; no FY row exists yet.
        quarter_seed = {
            "period_type": KeyMetricsReport.PeriodType.QUARTERLY,
            "period_start": date(2024, 1, 1),
            "period_end": date(2024, 3, 31),
            "fiscal_year": 2024,
            "fiscal_quarter": 2,
        }
        KeyMetricsReport.objects.create(**quarter_seed)

        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(datetime(2024, 1, 2, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        rows_changed = build_key_metrics_reports(recompute_all=False)

        self.assertEqual(rows_changed, 1)
        self.assertEqual(mock_upsert_year.call_count, 1)

    @mock.patch("concordia.tasks.reports.key_metrics.structured_logger")
    @mock.patch(
        "concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_fiscal_year"
    )
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_quarter")
    @mock.patch("concordia.tasks.reports.key_metrics.KeyMetricsReport.upsert_month")
    @mock.patch("concordia.tasks.reports.key_metrics.timezone.localdate")
    def test_incremental_fiscal_year_refresh_due_to_newer_quarter(
        self,
        mock_localdate,
        mock_upsert_month,
        mock_upsert_quarter,
        mock_upsert_year,
        slog,
    ):
        # Incremental run where the fiscal-year row (stamped 2024-03-01) is
        # older than a quarterly row (stamped 2024-03-15). Expects one
        # fiscal-year upsert call and a returned count of 1.
        mock_localdate.return_value = date(2024, 4, 1)
        for inert_upsert in (mock_upsert_month, mock_upsert_quarter):
            inert_upsert.return_value = None
        mock_upsert_year.return_value = SimpleNamespace(
            period_start=date(2023, 10, 1), period_end=date(2024, 9, 30)
        )
        rows = KeyMetricsReport.objects

        # Existing FY row with the earlier updated_on.
        year_row = rows.create(
            period_type=KeyMetricsReport.PeriodType.FISCAL_YEAR,
            period_start=date(2023, 10, 1),
            period_end=date(2024, 9, 30),
            fiscal_year=2024,
        )
        year_stamp = timezone.make_aware(datetime(2024, 3, 1, 0, 0, 0))
        rows.filter(pk=year_row.pk).update(updated_on=year_stamp)

        # Quarter with the newer updated_on to trigger the refresh path.
        quarter_row = rows.create(
            period_type=KeyMetricsReport.PeriodType.QUARTERLY,
            period_start=date(2024, 1, 1),
            period_end=date(2024, 3, 31),
            fiscal_year=2024,
            fiscal_quarter=2,
        )
        quarter_stamp = timezone.make_aware(datetime(2024, 3, 15, 0, 0, 0))
        rows.filter(pk=quarter_row.pk).update(updated_on=quarter_stamp)

        snapshot = SiteReport.objects.create(report_name=SiteReport.ReportName.TOTAL)
        snapshot_created = timezone.make_aware(datetime(2024, 1, 3, 9, 0, 0))
        SiteReport.objects.filter(pk=snapshot.pk).update(created_on=snapshot_created)

        rows_changed = build_key_metrics_reports(recompute_all=False)

        self.assertEqual(rows_changed, 1)
        self.assertEqual(mock_upsert_year.call_count, 1)


================================================
FILE: concordia/tests/test_tasks_reports_sitereport.py
================================================
from datetime import timedelta

from django.test import TestCase
from django.utils import timezone

from concordia.models import Asset, Campaign, SiteReport, Transcription
from concordia.tasks.reports.sitereport import (
    _daily_active_users,
    campaign_report,
    retired_total_report,
    site_report,
)
from concordia.utils import get_anonymous_user

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_tag,
    create_tag_collection,
    create_topic,
    create_transcription,
)


class SiteReportTestCase(CreateTestUsers, TestCase):
    """
    Check the values stored by ``site_report()`` for a fixed set of fixtures.

    Every row is created once in ``setUpTestData``; the individual tests only
    read the ``SiteReport`` rows captured there (except the zero-assets test,
    which adds an empty topic and runs the report again).
    """

    @classmethod
    def setUpTestData(cls):
        # setUpTestData is used in place of setUp so the database is populated
        # a single time for the whole test case, not once per test method.
        cls.user1 = cls.create_user(username="tester1")
        cls.user2 = cls.create_user(username="tester2")
        cls.user3 = cls.create_user(username="tester3")
        cls.anonymous_user = get_anonymous_user()

        # First asset; its parent item/project/campaign come from the helper.
        cls.asset1 = create_asset()
        cls.item1 = cls.asset1.item
        cls.project1 = cls.item1.project
        cls.campaign1 = cls.project1.campaign
        cls.asset1_transcription1 = create_transcription(
            asset=cls.asset1, user=cls.user1, accepted=timezone.now()
        )
        cls.asset1_transcription2 = create_transcription(
            asset=cls.asset1,
            user=cls.anonymous_user,
            rejected=timezone.now(),
            reviewed_by=cls.user1,
        )
        cls.topic1 = create_topic(project=cls.project1)
        cls.tag1 = create_tag()
        cls.tag_collection1 = create_tag_collection(
            tag=cls.tag1, asset=cls.asset1, user=cls.user1
        )

        # Second campaign: one project, one item, one asset, its own topic.
        cls.campaign2 = create_campaign(slug="test-campaign-slug-2")
        cls.project2 = create_project(
            campaign=cls.campaign2, slug="test-project-slug-2"
        )
        cls.item2 = create_item(project=cls.project2, item_id="2")
        cls.asset2 = create_asset(item=cls.item2, slug="test-asset-slug-2")
        cls.topic2 = create_topic(
            project=cls.asset2.item.project, slug="test-topic-slug-2"
        )
        cls.tag_collection2 = create_tag_collection(
            tag=cls.tag1, asset=cls.asset2, user=cls.user1
        )

        # Third campaign: a mix of published and unpublished items/assets.
        cls.campaign3 = create_campaign(slug="test-campaign-slug-3")
        cls.project3 = create_project(
            campaign=cls.campaign3, slug="test-project-slug-3"
        )
        cls.item3 = create_item(project=cls.project3, item_id="3")
        cls.asset3 = create_asset(item=cls.item3, slug="test-asset-slug-3")
        cls.asset4 = create_asset(
            item=cls.item3, slug="test-asset-slug-4", published=False
        )
        cls.item4 = create_item(project=cls.project3, item_id="4", published=False)
        cls.asset5 = create_asset(
            item=cls.item4, slug="test-asset-slug-5", published=False
        )

        cls.project3.topics.add(cls.topic1)
        cls.project3.topics.add(cls.topic2)

        # Campaign that gets "retired" further down.
        cls.retired_campaign = create_campaign(slug="retired-campaign-slug")
        cls.retired_project = create_project(
            campaign=cls.retired_campaign, slug="retired-project-slug"
        )
        cls.retired_item = create_item(project=cls.retired_project)
        cls.retired_asset = create_asset(
            item=cls.retired_item, slug="retired-asset-slug"
        )

        accepted_stamp = timezone.now() - timedelta(days=1, hours=1)
        cls.retired_asset_transcription1 = create_transcription(
            asset=cls.retired_asset, user=cls.user1, accepted=accepted_stamp
        )
        # A queryset update is the way to override auto_now_add and auto_now
        Transcription.objects.filter(pk=cls.retired_asset_transcription1.pk).update(
            created_on=accepted_stamp, updated_on=accepted_stamp
        )

        rejected_stamp = timezone.now() - timedelta(days=1, seconds=1)
        cls.retired_asset_transcription2 = create_transcription(
            asset=cls.retired_asset,
            user=cls.user2,
            rejected=rejected_stamp,
            reviewed_by=cls.user1,
        )
        # A queryset update is the way to override auto_now_add and auto_now
        Transcription.objects.filter(pk=cls.retired_asset_transcription2.pk).update(
            created_on=rejected_stamp, updated_on=rejected_stamp
        )

        # The campaign report has to exist before the campaign is "retired" so
        # that the retired total report has something to draw from.
        cls.retired_campaign_report = campaign_report(campaign=cls.retired_campaign)
        cls.retired_asset.delete()
        cls.retired_item.delete()
        cls.retired_project.delete()
        cls.retired_campaign.status = Campaign.Status.RETIRED
        cls.retired_campaign.save()

        site_report()

        def first_matching(**criteria):
            return SiteReport.objects.filter(**criteria).first()

        cls.site_report = first_matching(report_name=SiteReport.ReportName.TOTAL)
        cls.retired_site_report = first_matching(
            report_name=SiteReport.ReportName.RETIRED_TOTAL
        )
        cls.campaign1_report = first_matching(campaign=cls.campaign1)
        cls.topic1_report = first_matching(topic=cls.topic1)

    def _assert_report_values(self, report, expected):
        """Assert, in mapping order, that each attribute of ``report`` matches."""
        for field_name, wanted in expected.items():
            self.assertEqual(getattr(report, field_name), wanted, msg=field_name)

    def test_daily_active_users(self):
        active_count = _daily_active_users()
        self.assertEqual(active_count, 2)

    def test_site_report(self):
        self._assert_report_values(
            self.site_report,
            {
                "assets_total": 5,
                "assets_published": 3,
                "assets_not_started": 4,
                "assets_in_progress": 1,
                "assets_waiting_review": 0,
                "assets_completed": 0,
                "assets_unpublished": 2,
                "items_published": 3,
                "items_unpublished": 1,
                "projects_published": 3,
                "projects_unpublished": 0,
                "anonymous_transcriptions": 1,
                "transcriptions_saved": 2,
                "daily_review_actions": 2,
                "distinct_tags": 1,
                "tag_uses": 2,
                "campaigns_published": 4,
                "campaigns_unpublished": 0,
                "users_registered": 4,
                "users_activated": 4,
                "daily_active_users": 2,
            },
        )

    def test_retired_site_report(self):
        self._assert_report_values(
            self.retired_site_report,
            {
                "assets_total": 1,
                "assets_published": 1,
                "assets_not_started": 0,
                "assets_in_progress": 1,
                "assets_waiting_review": 0,
                "assets_completed": 0,
                "assets_unpublished": 0,
                "items_published": 1,
                "items_unpublished": 0,
                "projects_published": 1,
                "projects_unpublished": 0,
                "anonymous_transcriptions": 0,
                "transcriptions_saved": 2,
                "daily_review_actions": 0,
                "distinct_tags": 0,
                "tag_uses": 0,
                "registered_contributors": 2,
            },
        )

    def test_campaign_report(self):
        self._assert_report_values(
            self.campaign1_report,
            {
                "assets_total": 1,
                "assets_published": 1,
                "assets_not_started": 0,
                "assets_in_progress": 1,
                "assets_waiting_review": 0,
                "assets_completed": 0,
                "assets_unpublished": 0,
                "items_published": 1,
                "items_unpublished": 0,
                "projects_published": 1,
                "projects_unpublished": 0,
                "anonymous_transcriptions": 1,
                "transcriptions_saved": 2,
                "daily_review_actions": 2,
                "distinct_tags": 1,
                "tag_uses": 1,
                "registered_contributors": 2,
            },
        )

    def test_topic_report(self):
        self._assert_report_values(
            self.topic1_report,
            {
                "assets_total": 4,
                "assets_published": 2,
                "assets_not_started": 3,
                "assets_in_progress": 1,
                "assets_waiting_review": 0,
                "assets_completed": 0,
                "assets_unpublished": 2,
                "items_published": 2,
                "items_unpublished": 1,
                "projects_published": 2,
                "projects_unpublished": 0,
                "anonymous_transcriptions": 1,
                "transcriptions_saved": 2,
                "daily_review_actions": 2,
                "distinct_tags": 1,
                "tag_uses": 1,
            },
        )

    def test_topic_report_zero_assets_emits_warning(self):
        # A fresh topic is attached to a project that has no items or assets,
        # so its topic report totals zero assets and a warning is expected.
        from unittest import mock

        bare_campaign = create_campaign(slug="sr-empty-c")
        bare_project = create_project(campaign=bare_campaign, slug="sr-empty-p")
        bare_topic = create_topic(project=bare_project, slug="sr-empty-t")

        with mock.patch(
            "concordia.tasks.reports.sitereport.structured_logger"
        ) as patched_logger:
            site_report()

            matching_warnings = []
            for logged in patched_logger.warning.call_args_list:
                if logged.kwargs.get("event_code") != "topic_report_zero_assets":
                    continue
                if logged.kwargs.get("topic") == bare_topic:
                    matching_warnings.append(logged)
            self.assertTrue(matching_warnings)


class SiteReportAssetsStartedRollupTests(CreateTestUsers, TestCase):
    """Tests for the ``assets_started`` value on TOTAL and RETIRED_TOTAL reports."""

    @staticmethod
    def _lookup_date(moment):
        """
        Return the calendar date a ``created_on__date`` filter matches for
        ``moment``.

        With ``USE_TZ`` enabled, Django's ``__date`` lookup converts the stored
        value to the current time zone before comparing, while ``.date()`` on
        the aware value returned by ``timezone.now()`` yields the UTC date.
        Those two dates can differ close to midnight UTC when the active time
        zone is not UTC, so aware values are converted with
        ``timezone.localtime`` first. Naive values are returned unchanged.
        """
        if timezone.is_aware(moment):
            return timezone.localtime(moment).date()
        return moment.date()

    def test_total_assets_started_rolls_up_campaign_deltas_ignoring_retirements(
        self,
    ):
        """
        The TOTAL assets_started value should be derived from per-campaign
        daily deltas for the same reporting day.

        This protects the site-wide daily count from being suppressed when a
        campaign retires and its already-started assets are removed from the
        active asset tables.
        """
        from unittest import mock

        active_campaign = create_campaign(slug="rollup-active-c")
        retiring_campaign = create_campaign(slug="rollup-retiring-c")

        active_project = create_project(
            campaign=active_campaign, slug="rollup-active-p"
        )
        active_item = create_item(project=active_project, item_id="ra")
        active_asset = create_asset(item=active_item, slug="rollup-active-a")

        retiring_project = create_project(
            campaign=retiring_campaign, slug="rollup-retiring-p"
        )
        retiring_item = create_item(project=retiring_project, item_id="rb")
        retiring_asset = create_asset(item=retiring_item, slug="rollup-retiring-a")

        # Day 1 snapshot: one not-started asset in the active campaign and one
        # already-started asset in the campaign that will retire.
        Asset.objects.filter(pk=active_asset.pk).update(
            transcription_status="not_started"
        )
        Asset.objects.filter(pk=retiring_asset.pk).update(
            transcription_status="in_progress"
        )

        base_now = timezone.now()
        day1 = base_now - timedelta(days=2)
        day2 = base_now - timedelta(days=1)
        # Date used to find the day-2 rows; see _lookup_date for why this is
        # not simply day2.date().
        day2_date = self._lookup_date(day2)

        with mock.patch("django.utils.timezone.now", return_value=day1):
            site_report()

        # Between snapshots, the active campaign starts its asset.
        Asset.objects.filter(pk=active_asset.pk).update(
            transcription_status="in_progress"
        )

        # The other campaign is retired and its content is removed.
        retiring_asset.delete()
        retiring_item.delete()
        retiring_project.delete()
        retiring_campaign.status = Campaign.Status.RETIRED
        retiring_campaign.save()

        with mock.patch("django.utils.timezone.now", return_value=day2):
            site_report()

        total_day2 = (
            SiteReport.objects.filter(
                report_name=SiteReport.ReportName.TOTAL,
                campaign__isnull=True,
                topic__isnull=True,
                created_on__date=day2_date,
            )
            .order_by("-created_on", "-pk")
            .first()
        )
        active_day2 = (
            SiteReport.objects.filter(
                campaign=active_campaign, created_on__date=day2_date
            )
            .order_by("-created_on", "-pk")
            .first()
        )

        self.assertIsNotNone(total_day2)
        self.assertIsNotNone(active_day2)

        self.assertEqual(active_day2.assets_started, 1)
        self.assertEqual(total_day2.assets_started, 1)

    def test_retired_total_assets_started_is_always_zero(self):
        """
        ``retired_total_report()`` should store ``assets_started == 0`` even
        when the retired campaign's own reports carry non-zero values.
        """
        retired_campaign = create_campaign(slug="rollup-retired-c")
        retired_campaign.status = Campaign.Status.RETIRED
        retired_campaign.save()

        r1 = SiteReport.objects.create(
            campaign=retired_campaign,
            assets_total=10,
            assets_not_started=0,
            assets_started=4,
        )
        r2 = SiteReport.objects.create(
            campaign=retired_campaign,
            assets_total=10,
            assets_not_started=0,
            assets_started=7,
        )

        # Backdate the two campaign reports to consecutive earlier days via a
        # queryset update so the stored created_on values are replaced.
        now = timezone.now()
        SiteReport.objects.filter(pk=r1.pk).update(created_on=now - timedelta(days=2))
        SiteReport.objects.filter(pk=r2.pk).update(created_on=now - timedelta(days=1))

        # Sanity check: the most recent campaign report still holds 7.
        self.assertEqual(SiteReport.objects.get(pk=r2.pk).assets_started, 7)

        retired_total_report()

        retired_total = (
            SiteReport.objects.filter(report_name=SiteReport.ReportName.RETIRED_TOTAL)
            .order_by("-created_on", "-pk")
            .first()
        )

        self.assertIsNotNone(retired_total)
        self.assertEqual(retired_total.assets_started, 0)


================================================
FILE: concordia/tests/test_tasks_retirement.py
================================================
from unittest import mock

from django.core.exceptions import ObjectDoesNotExist
from django.test import TestCase

from concordia.models import Asset, Project
from concordia.tasks.retirement import (
    assets_removal_success,
    delete_asset,
    item_removal_success,
    project_removal_success,
    remove_next_assets,
    remove_next_item,
    remove_next_project,
    retire_campaign,
)

from .utils import (
    create_asset,
    create_campaign,
    create_campaign_retirement_progress,
    create_item,
    create_project,
)


class RetirementTasksTests(TestCase):
    """
    Unit tests for the campaign retirement tasks.

    Each test calls one task function directly and patches the follow-up
    task's ``.delay`` (or the chord/signature helpers), so only the step under
    test runs.
    """

    def test_retire_campaign_initializes_totals_and_sets_status_and_triggers(self):
        """Totals are recorded, status becomes RETIRED, project removal queued."""
        # Build a campaign with 2 projects, 2 items, 3 assets.
        camp = create_campaign(slug="ret-c1")
        p1 = create_project(campaign=camp, slug="ret-p1")
        p2 = create_project(campaign=camp, slug="ret-p2")
        i1 = create_item(project=p1, item_id="ret-i1")
        i2 = create_item(project=p2, item_id="ret-i2")
        a1 = create_asset(item=i1, slug="ret-a1")
        a2 = create_asset(item=i1, slug="ret-a2")
        a3 = create_asset(item=i2, slug="ret-a3")
        self.assertTrue(all([a1.pk, a2.pk, a3.pk]))

        with mock.patch(
            "concordia.tasks.retirement.remove_next_project.delay"
        ) as m_delay:
            prog = retire_campaign(camp.id)

        prog.refresh_from_db()
        self.assertEqual(prog.project_total, 2)
        self.assertEqual(prog.item_total, 2)
        self.assertEqual(prog.asset_total, 3)
        camp.refresh_from_db()
        # Status must be set to RETIRED.
        self.assertEqual(camp.status, camp.Status.RETIRED)  # type: ignore[attr-defined]
        m_delay.assert_called_once_with(camp.id)

    def test_retire_campaign_existing_progress_and_already_retired(self):
        """Existing progress totals are kept and removal is still queued."""
        camp = create_campaign(slug="ret-c2")
        # Pre-create progress so the totals branch is skipped.
        prog = create_campaign_retirement_progress(campaign=camp)
        prog.project_total = 7
        prog.item_total = 8
        prog.asset_total = 9
        prog.save()
        # Mark campaign retired to skip status change.
        camp.status = camp.Status.RETIRED  # type: ignore[attr-defined]
        camp.save()

        with mock.patch(
            "concordia.tasks.retirement.remove_next_project.delay"
        ) as m_delay:
            retire_campaign(camp.id)

        prog.refresh_from_db()
        self.assertEqual(prog.project_total, 7)
        self.assertEqual(prog.item_total, 8)
        self.assertEqual(prog.asset_total, 9)
        camp.refresh_from_db()
        self.assertEqual(camp.status, camp.Status.RETIRED)  # type: ignore[attr-defined]
        m_delay.assert_called_once_with(camp.id)

    def test_remove_next_project_calls_remove_next_item_when_project_exists(self):
        """With a project present, item removal is queued for that project."""
        camp = create_campaign(slug="ret-c3")
        proj = create_project(campaign=camp, slug="ret-p3")
        create_campaign_retirement_progress(campaign=camp)

        with mock.patch("concordia.tasks.retirement.remove_next_item.delay") as m_delay:
            remove_next_project(camp.id)

        m_delay.assert_called_once_with(proj.id)

    def test_remove_next_project_marks_complete_when_no_projects(self):
        """With no projects left, progress is marked complete; nothing queued."""
        camp = create_campaign(slug="ret-c4")
        prog = create_campaign_retirement_progress(campaign=camp)

        with mock.patch("concordia.tasks.retirement.remove_next_item.delay") as m_delay:
            remove_next_project(camp.id)

        prog.refresh_from_db()
        self.assertTrue(prog.complete)
        self.assertIsNotNone(prog.completed_on)
        m_delay.assert_not_called()

    def test_project_removal_success_increments_and_triggers_next(self):
        """The removed-project counter and log are updated; next step queued."""
        camp = create_campaign(slug="ret-c5")
        prog = create_campaign_retirement_progress(campaign=camp)
        self.assertEqual(prog.projects_removed, 0)

        with mock.patch(
            "concordia.tasks.retirement.remove_next_project.delay"
        ) as m_delay:
            project_removal_success(project_id=123, campaign_id=camp.id)

        prog.refresh_from_db()
        self.assertEqual(prog.projects_removed, 1)
        self.assertTrue(any(e.get("id") == 123 for e in prog.removal_log))
        m_delay.assert_called_once_with(camp.id)

    def test_remove_next_item_calls_remove_next_assets_when_item_exists(self):
        """With an item present, asset removal is queued for that item."""
        camp = create_campaign(slug="ret-c6")
        proj = create_project(campaign=camp, slug="ret-p6")
        itm = create_item(project=proj, item_id="ret-i6")

        with mock.patch(
            "concordia.tasks.retirement.remove_next_assets.delay"
        ) as m_delay:
            remove_next_item(proj.id)

        m_delay.assert_called_once_with(itm.id)

    def test_remove_next_item_deletes_project_and_triggers_when_no_items(self):
        """With no items, the project is deleted and success is queued."""
        camp = create_campaign(slug="ret-c7")
        proj = create_project(campaign=camp, slug="ret-p7")

        with mock.patch(
            "concordia.tasks.retirement.project_removal_success.delay"
        ) as m_delay:
            remove_next_item(proj.id)

        with self.assertRaises(ObjectDoesNotExist):
            Project.objects.get(pk=proj.id)
        m_delay.assert_called_once_with(proj.id, camp.id)

    def test_assets_removal_success_updates_counts_and_triggers_next(self):
        """Every removed asset id is counted and logged; next batch queued."""
        camp = create_campaign(slug="ret-c8")
        prog = create_campaign_retirement_progress(campaign=camp)
        self.assertEqual(prog.assets_removed, 0)

        with mock.patch(
            "concordia.tasks.retirement.remove_next_assets.delay"
        ) as m_delay:
            assets_removal_success([10, 11, 12], campaign_id=camp.id, item_id=55)

        prog.refresh_from_db()
        self.assertEqual(prog.assets_removed, 3)
        self.assertTrue(any(e.get("id") == 10 for e in prog.removal_log))
        self.assertTrue(any(e.get("id") == 11 for e in prog.removal_log))
        self.assertTrue(any(e.get("id") == 12 for e in prog.removal_log))
        m_delay.assert_called_once_with(55)

    def test_remove_next_assets_when_no_assets_deletes_item_and_triggers(self):
        """With no assets, the item is deleted and success is queued."""
        camp = create_campaign(slug="ret-c9")
        proj = create_project(campaign=camp, slug="ret-p9")
        itm = create_item(project=proj, item_id="ret-i9")

        with mock.patch(
            "concordia.tasks.retirement.item_removal_success.delay"
        ) as m_delay:
            remove_next_assets(itm.id)

        with self.assertRaises(ObjectDoesNotExist):
            # Item should be deleted.
            type(itm).objects.get(pk=itm.id)  # type: ignore[attr-defined]
        m_delay.assert_called_once_with(itm.id, camp.id, proj.id)

    def test_remove_next_assets_with_assets_uses_chord_in_chunks_of_10(self):
        """Only the first ten asset ids (by id) go into the chord header."""
        camp = create_campaign(slug="ret-c10")
        proj = create_project(campaign=camp, slug="ret-p10")
        itm = create_item(project=proj, item_id="ret-i10")
        # Create 12 assets; only 10 should be in the chord header.
        for n in range(12):
            create_asset(item=itm, slug=f"ret-a10-{n}", sequence=n)
        first_ten = list(
            Asset.objects.filter(item=itm)
            .order_by("id")
            .values_list("id", flat=True)[:10]
        )

        with (
            mock.patch("concordia.tasks.retirement.chord") as m_chord,
            mock.patch("concordia.tasks.retirement.delete_asset.s") as m_del_sig,
            mock.patch(
                "concordia.tasks.retirement.assets_removal_success.s"
            ) as m_body_sig,
        ):
            # chord(header) returns a callable that is then invoked with the
            # body signature; stand-in strings make both easy to compare.
            runner = mock.MagicMock()
            m_chord.return_value = runner
            m_del_sig.side_effect = lambda aid: f"S({aid})"
            m_body_sig.return_value = "BODY"

            remove_next_assets(itm.id)

            # Header should contain exactly 10 signatures, matching first ten ids.
            header_iter = m_chord.call_args[0][0]
            header_list = list(header_iter)
            self.assertEqual(header_list, [f"S({aid})" for aid in first_ten])
            # The body signature should be called with campaign and item ids.
            m_body_sig.assert_called_once_with(camp.id, itm.id)
            runner.assert_called_once_with("BODY")

    def test_delete_asset_deletes_storage_and_model_and_returns_id(self):
        """The asset row is removed, storage delete is called, id is returned."""
        itm = create_item(item_id="ret-i11")
        a = create_asset(item=itm, slug="ret-a11", sequence=11)

        with mock.patch("django.core.files.storage.FileSystemStorage.delete") as m_del:
            ret_id = delete_asset(a.id)

        self.assertEqual(ret_id, a.id)
        self.assertFalse(Asset.objects.filter(pk=a.id).exists())
        m_del.assert_called()

    def test_item_removal_success_increments_and_triggers_next(self):
        """The removed-item counter and log are updated; next item queued."""
        camp = create_campaign(slug="ret-c12")
        proj = create_project(campaign=camp, slug="ret-p12")
        itm = create_item(project=proj, item_id="ret-i12")
        prog = create_campaign_retirement_progress(campaign=camp)
        self.assertEqual(prog.items_removed, 0)

        with mock.patch("concordia.tasks.retirement.remove_next_item.delay") as m_delay:
            item_removal_success(
                item_id=itm.id, campaign_id=camp.id, project_id=proj.id
            )

        prog.refresh_from_db()
        self.assertEqual(prog.items_removed, 1)
        self.assertTrue(
            any(
                entry.get("type") == "item" and entry.get("id") == itm.id
                for entry in prog.removal_log
            )
        )
        m_delay.assert_called_once_with(proj.id)


================================================
FILE: concordia/tests/test_tasks_search_index.py
================================================
from unittest import mock

from django.test import TestCase

from concordia.tasks.search_index import (
    create_opensearch_indices,
    delete_opensearch_indices,
    populate_opensearch_assets_indices,
    populate_opensearch_indices,
    populate_opensearch_users_indices,
    rebuild_opensearch_indices,
)


class SearchIndexTasksTests(TestCase):
    """
    Each search-index task should return ``None`` and make exactly one
    ``call_command`` call with the expected arguments.
    """

    def _check_task(self, task, *command_args, **command_kwargs):
        """Run ``task`` with ``call_command`` patched and verify the one call."""
        with mock.patch("concordia.tasks.search_index.call_command") as patched:
            outcome = task()
        self.assertIsNone(outcome)
        patched.assert_called_once_with(*command_args, **command_kwargs)

    def test_create_opensearch_indices_calls_management_command(self):
        self._check_task(
            create_opensearch_indices,
            "opensearch",
            "index",
            "create",
            verbosity=2,
            force=True,
            ignore_error=True,
        )

    def test_delete_opensearch_indices_calls_management_command(self):
        self._check_task(
            delete_opensearch_indices,
            "opensearch",
            "index",
            "delete",
            force=True,
            ignore_error=True,
        )

    def test_rebuild_opensearch_indices_calls_management_command(self):
        self._check_task(
            rebuild_opensearch_indices,
            "opensearch",
            "index",
            "rebuild",
            verbosity=2,
            force=True,
            ignore_error=True,
        )

    def test_populate_users_indices_calls_management_command(self):
        self._check_task(
            populate_opensearch_users_indices,
            "opensearch",
            "document",
            "index",
            "--indices",
            "users",
            "--force",
            "--parallel",
        )

    def test_populate_assets_indices_calls_management_command(self):
        self._check_task(
            populate_opensearch_assets_indices,
            "opensearch",
            "document",
            "index",
            "--indices",
            "assets",
            "--force",
            "--parallel",
        )

    def test_populate_all_indices_calls_management_command(self):
        self._check_task(
            populate_opensearch_indices,
            "opensearch",
            "document",
            "index",
            "--force",
            "--parallel",
        )


================================================
FILE: concordia/tests/test_tasks_thumbnails.py
================================================
from unittest import mock

from django.test import TestCase

from concordia.tasks.thumbnails import (
    download_item_thumbnail_task,
    download_missing_thumbnails_task,
)

from .utils import create_campaign, create_item, create_project


class ThumbnailsTasksTests(TestCase):
    """
    Tests for the thumbnail download tasks.

    The download helper and the ``group`` / ``.s`` signature helpers are
    patched in every test, so no real download or task dispatch takes place.
    """

    def test_download_item_thumbnail_task_returns_skip_when_no_url(self):
        """An item with an empty ``thumbnail_url`` yields the skip message."""
        # Item has no thumbnail_url; task should return skip message.
        proj = create_project(campaign=create_campaign(slug="t-c1"), slug="t-p1")
        item = create_item(project=proj, item_id="t-i1", thumbnail_url="")

        with mock.patch("importer.tasks.items.download_and_set_item_thumbnail") as m_dl:
            result = download_item_thumbnail_task.run(item.id, force=False)

        self.assertEqual(result, "No thumbnail URL available.")
        m_dl.assert_not_called()

    def test_download_item_thumbnail_task_calls_helper_with_force(self):
        """The helper receives the item, its URL and ``force``; result is passed on."""
        # Item has a thumbnail_url; helper should be called with force flag.
        proj = create_project(campaign=create_campaign(slug="t-c2"), slug="t-p2")
        item = create_item(
            project=proj,
            item_id="t-i2",
            thumbnail_url="https://ex.invalid/t.jpg",
            thumbnail_image="",
        )

        with mock.patch("importer.tasks.items.download_and_set_item_thumbnail") as m_dl:
            m_dl.return_value = "stored/path/t.jpg"
            result = download_item_thumbnail_task.run(item.id, force=True)

        self.assertEqual(result, "stored/path/t.jpg")
        m_dl.assert_called_once()
        # First arg is the Item instance, second the source URL.
        args, kwargs = m_dl.call_args
        self.assertEqual(args[0].id, item.id)
        self.assertEqual(args[1], "https://ex.invalid/t.jpg")
        self.assertTrue(kwargs.get("force"))

    def test_download_missing_thumbnails_task_returns_zero_when_none(self):
        """With no items in the database the task returns 0 and builds no group."""
        # No items meet the filter; should log and return 0, no group calls.
        with mock.patch("concordia.tasks.thumbnails.group") as m_group:
            count = download_missing_thumbnails_task.run()

        self.assertEqual(count, 0)
        m_group.assert_not_called()

    def test_download_missing_thumbnails_task_filters_and_batches_once(self):
        """Only the two eligible items of the chosen project are dispatched."""
        camp = create_campaign(slug="t-c3")
        proj_a = create_project(campaign=camp, slug="t-p3a")
        proj_b = create_project(campaign=camp, slug="t-p3b")

        i1 = create_item(
            project=proj_a,
            item_id="t-i3-1",
            thumbnail_url="http://example.com/img1.jpg",
            thumbnail_image="",
        )
        i2 = create_item(
            project=proj_a,
            item_id="t-i3-2",
            thumbnail_url="http://example.com/img2.jpg",
            thumbnail_image="",
        )
        create_item(  # wrong project -> not eligible
            project=proj_b,
            item_id="t-i3-3",
            thumbnail_url="http://example.com/img3.jpg",
            thumbnail_image="",
        )
        create_item(  # already has image -> not eligible
            project=proj_a,
            item_id="t-i3-4",
            thumbnail_url="http://example.com/img4.jpg",
            thumbnail_image="has-file",
        )

        with (
            mock.patch("concordia.tasks.thumbnails.group") as m_group,
            mock.patch(
                "concordia.tasks.thumbnails.download_item_thumbnail_task.s"
            ) as m_sig,
        ):
            runner = mock.MagicMock()
            runner.apply_async.return_value.get.return_value = None

            def fake_group(header_iter):
                # Force generator evaluation so .s(...) is actually called.
                list(header_iter)
                return runner

            m_group.side_effect = fake_group

            count = download_missing_thumbnails_task.run(
                project_id=proj_a.id, batch_size=2, limit=10, force=True
            )

        self.assertEqual(count, 2)
        m_sig.assert_has_calls(
            [mock.call(i1.id, force=True), mock.call(i2.id, force=True)],
            any_order=False,
        )
        m_group.assert_called_once()
        runner.apply_async.assert_called_once()
        runner.apply_async.return_value.get.assert_called_once_with(
            disable_sync_subtasks=False
        )

    def test_download_missing_thumbnails_task_multiple_waves(self):
        """Five items with ``batch_size=2`` are dispatched in three groups."""
        camp = create_campaign(slug="t-c4")
        proj = create_project(campaign=camp, slug="t-p4")
        items = [
            create_item(
                project=proj,
                item_id=f"t-i4-{n}",
                thumbnail_url=f"http://example.com/{n}.jpg",
                thumbnail_image="",
            )
            for n in range(5)
        ]

        with (
            mock.patch("concordia.tasks.thumbnails.group") as m_group,
            mock.patch(
                "concordia.tasks.thumbnails.download_item_thumbnail_task.s"
            ) as m_sig,
        ):
            # One stand-in runner per expected wave, handed out in order.
            runners = [mock.MagicMock() for _ in range(3)]
            for r in runners:
                r.apply_async.return_value.get.return_value = None
            it = iter(runners)

            def fake_group(header_iter):
                # Force generator consumption each wave.
                list(header_iter)
                return next(it)

            m_group.side_effect = fake_group

            count = download_missing_thumbnails_task.run(
                project_id=proj.id, batch_size=2, limit=None, force=False
            )

        self.assertEqual(count, 5)
        self.assertEqual(m_group.call_count, 3)
        expected = [mock.call(itm.id, force=False) for itm in items]
        self.assertEqual(m_sig.call_args_list, expected)


================================================
FILE: concordia/tests/test_tasks_unusualactivity.py
================================================
from datetime import UTC, datetime, timedelta
from unittest import mock

from django.test import TestCase, override_settings
from django.utils import timezone

from concordia.tasks.unusualactivity import unusual_activity


class UnusualActivityTaskTests(TestCase):
    """Tests for ``unusual_activity`` with its collaborators replaced by mocks."""

    def _stub_collaborators(
        self,
        site_mock,
        localtime_mock,
        template_loader_mock,
        email_cls_mock,
        manager_mock,
        *,
        stamp,
        domain,
        text_body,
        html_body,
    ):
        """Configure the patched collaborators for a run that sends a report.

        Returns ``(text_template, html_template, message)`` so the caller can
        assert on how each of them was used.
        """
        formatted_time = mock.Mock()
        formatted_time.strftime.return_value = stamp
        localtime_mock.return_value = formatted_time

        site_mock.return_value = mock.Mock(domain=domain)

        text_template = mock.Mock()
        text_template.render.return_value = text_body
        html_template = mock.Mock()
        html_template.render.return_value = html_body

        def pick_template(name):
            # Template names ending in ".txt" get the text stub; anything else
            # gets the HTML stub.
            if name.endswith(".txt"):
                return text_template
            return html_template

        template_loader_mock.side_effect = pick_template

        manager_mock.transcribe_incidents.return_value = []
        manager_mock.review_incidents.return_value = []

        message = mock.Mock()
        email_cls_mock.return_value = message
        return text_template, html_template, message

    def _assert_report_sent(
        self,
        text_template,
        html_template,
        message,
        manager_mock,
        *,
        cutoff,
        html_body,
    ):
        """Check rendering, the incident query cutoff, and message delivery."""
        text_template.render.assert_called_once()
        html_template.render.assert_called_once()
        self.assertEqual(manager_mock.transcribe_incidents.call_args.args[0], cutoff)
        self.assertEqual(manager_mock.review_incidents.call_args.args[0], cutoff)
        message.attach_alternative.assert_called_once_with(html_body, "text/html")
        message.send.assert_called_once()

    @override_settings(CONCORDIA_ENVIRONMENT="development")
    def test_noop_when_not_production_and_not_ignored(self):
        """Outside production and without ``ignore_env`` the task does nothing."""
        with (
            mock.patch(
                "concordia.tasks.unusualactivity.loader.get_template"
            ) as template_loader_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.EmailMultiAlternatives"
            ) as email_cls_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.Transcription.objects"
            ) as manager_mock,
        ):
            unusual_activity(ignore_env=False)

        # No template lookup, no message construction, no incident queries.
        untouched_mocks = (
            template_loader_mock,
            email_cls_mock,
            manager_mock.transcribe_incidents,
            manager_mock.review_incidents,
        )
        for untouched in untouched_mocks:
            untouched.assert_not_called()

    @override_settings(
        CONCORDIA_ENVIRONMENT="production",
        DEFAULT_FROM_EMAIL="noreply@example.com",
        DEFAULT_TO_EMAIL="",
    )
    def test_runs_in_production_without_default_to(self):
        """In production the subject has no suffix and there is one recipient."""
        frozen_now = timezone.make_aware(datetime(2025, 1, 1, 12, 0), timezone=UTC)
        cutoff = frozen_now - timedelta(days=1)

        with (
            mock.patch(
                "concordia.tasks.unusualactivity.Site.objects.get_current"
            ) as site_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.timezone.localtime"
            ) as localtime_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.timezone.now",
                return_value=frozen_now,
            ),
            mock.patch(
                "concordia.tasks.unusualactivity.loader.get_template"
            ) as template_loader_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.EmailMultiAlternatives"
            ) as email_cls_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.Transcription.objects"
            ) as manager_mock,
        ):
            text_template, html_template, message = self._stub_collaborators(
                site_mock,
                localtime_mock,
                template_loader_mock,
                email_cls_mock,
                manager_mock,
                stamp="STAMP",
                domain="example.com",
                text_body="TEXT",
                html_body="HTML",
            )

            unusual_activity(ignore_env=False)

        email_kwargs = email_cls_mock.call_args.kwargs
        self.assertEqual(
            email_kwargs["subject"], "Unusual User Activity Report for STAMP"
        )
        self.assertEqual(email_kwargs["from_email"], "noreply@example.com")
        self.assertEqual(email_kwargs["to"], ["rsar@loc.gov"])
        self.assertEqual(email_kwargs["reply_to"], ["noreply@example.com"])

        self._assert_report_sent(
            text_template,
            html_template,
            message,
            manager_mock,
            cutoff=cutoff,
            html_body="HTML",
        )

    @override_settings(
        CONCORDIA_ENVIRONMENT="test",
        DEFAULT_FROM_EMAIL="notify@example.com",
        DEFAULT_TO_EMAIL="extra@example.com",
    )
    def test_ignore_env_appends_suffix_and_includes_default_to(self):
        """With ``ignore_env`` the subject gets ``[TEST]`` and a second recipient."""
        frozen_now = timezone.make_aware(datetime(2025, 1, 2, 9, 30), timezone=UTC)
        cutoff = frozen_now - timedelta(days=1)

        with (
            mock.patch(
                "concordia.tasks.unusualactivity.Site.objects.get_current"
            ) as site_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.timezone.localtime"
            ) as localtime_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.timezone.now",
                return_value=frozen_now,
            ),
            mock.patch(
                "concordia.tasks.unusualactivity.loader.get_template"
            ) as template_loader_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.EmailMultiAlternatives"
            ) as email_cls_mock,
            mock.patch(
                "concordia.tasks.unusualactivity.Transcription.objects"
            ) as manager_mock,
        ):
            text_template, html_template, message = self._stub_collaborators(
                site_mock,
                localtime_mock,
                template_loader_mock,
                email_cls_mock,
                manager_mock,
                stamp="STAMP2",
                domain="example.net",
                text_body="TEXT2",
                html_body="HTML2",
            )

            unusual_activity(ignore_env=True)

        email_kwargs = email_cls_mock.call_args.kwargs
        self.assertEqual(
            email_kwargs["subject"],
            "Unusual User Activity Report for STAMP2 [TEST]",
        )
        self.assertEqual(email_kwargs["to"], ["rsar@loc.gov", "extra@example.com"])
        self.assertEqual(email_kwargs["from_email"], "notify@example.com")
        self.assertEqual(email_kwargs["reply_to"], ["notify@example.com"])

        self._assert_report_sent(
            text_template,
            html_template,
            message,
            manager_mock,
            cutoff=cutoff,
            html_body="HTML2",
        )


================================================
FILE: concordia/tests/test_tasks_useractivity.py
================================================
from unittest import mock

from django.core import mail
from django.core.cache import cache
from django.test import TestCase

from concordia.exceptions import CacheLockedError
from concordia.models import Campaign, Transcription, UserProfileActivity
from concordia.tasks.unusualactivity import unusual_activity
from concordia.tasks.useractivity import (
    populate_active_campaign_counts,
    populate_completed_campaign_counts,
    update_useractivity_cache,
    update_userprofileactivity_from_cache,
)
from concordia.utils import get_anonymous_user

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_tag,
    create_tag_collection,
    create_transcription,
)


class UserActivityTaskTestCase(CreateTestUsers, TestCase):
    """Tests for the user-activity tasks and the unusual-activity report task."""

    def setUp(self):
        """Clear the cache and create one user, one campaign and its cache key."""
        cache.clear()
        self.user = self.create_test_user()
        self.campaign = create_campaign()
        self.key = f"userprofileactivity_{self.campaign.pk}"

    @mock.patch("concordia.tasks.useractivity.update_userprofileactivity_table")
    def test_update_userprofileactivity_from_cache_no_updates(self, mock_update_table):
        """A cached ``None`` for the campaign key is logged and skipped."""
        cache.set(self.key, None)
        with mock.patch("concordia.logging.ConcordiaLogger.debug") as mock_debug:
            update_userprofileactivity_from_cache()
            self.assertEqual(mock_debug.call_count, 2)
            # ``assert_called_with`` inspects the most recent debug call only.
            mock_debug.assert_called_with(
                "Cache contained no updates for key. Skipping",
                event_code="update_userprofileactivity_from_cache_no_updates",
                key=self.key,
            )
        self.assertEqual(mock_update_table.call_count, 0)

    @mock.patch("concordia.tasks.useractivity.update_userprofileactivity_table")
    def test_update_userprofileactivity_from_cache_update(self, mock_update_table):
        """Cached counts are written per field and the cache key is emptied."""
        cache.set(self.key, {self.user.pk: (1, 0)})
        update_userprofileactivity_from_cache()
        self.assertEqual(mock_update_table.call_count, 2)
        mock_update_table.assert_has_calls(
            [
                mock.call(self.user, self.campaign.id, "transcribe_count", 1),
                mock.call(self.user, self.campaign.id, "review_count", 0),
            ]
        )
        self.assertIsNone(cache.get(self.key))

    def test_unusual_activity(self):
        """With no incidents the task still sends exactly one report email."""
        # Build the empty querysets BEFORE patching. The patch below replaces
        # ``objects`` on the model class itself (assuming the task module uses
        # the same ``Transcription`` class imported here), so calling
        # ``Transcription.objects.none()`` while it is active would return a
        # MagicMock instead of a real empty queryset.
        no_transcribe_incidents = Transcription.objects.none()
        no_review_incidents = Transcription.objects.none()

        with mock.patch(
            "concordia.tasks.unusualactivity.Transcription.objects"
        ) as mock_transcription:
            mock_transcription.transcribe_incidents.return_value = (
                no_transcribe_incidents
            )
            mock_transcription.review_incidents.return_value = no_review_incidents
            unusual_activity(ignore_env=True)

        self.assertEqual(len(mail.outbox), 1)
        expected_subject = "Unusual User Activity Report"
        self.assertIn(expected_subject, mail.outbox[0].subject)

    @mock.patch("django.core.cache.cache.add")
    @mock.patch("django.core.cache.cache.delete")
    @mock.patch("concordia.tasks.useractivity._update_useractivity_cache")
    def test_update_useractivity_cache(self, mock_update, mock_delete, mock_add):
        """The task raises while locked, else updates and deletes the lock key."""
        user = self.user
        campaign = self.campaign

        # ``cache.add`` returning False is treated as "lock already held".
        mock_add.return_value = False
        with self.assertRaises(CacheLockedError):
            update_useractivity_cache(user.id, campaign.id, "transcribe")
        self.assertEqual(mock_update.call_count, 0)
        self.assertEqual(mock_delete.call_count, 0)

        # Lock acquired: the update runs and the lock key is deleted afterwards.
        mock_add.return_value = True
        update_useractivity_cache(user.id, campaign.id, "transcribe")
        self.assertEqual(mock_update.call_count, 1)
        mock_update.assert_called_with(user.id, campaign.id, "transcribe")
        self.assertEqual(mock_delete.call_count, 1)
        mock_delete.assert_called_with("userprofileactivity_cache_lock")

        update_useractivity_cache(user.id, campaign.id, "review")
        self.assertEqual(mock_update.call_count, 2)
        mock_update.assert_called_with(user.id, campaign.id, "review")
        self.assertEqual(mock_delete.call_count, 2)
        mock_delete.assert_called_with("userprofileactivity_cache_lock")

    def test_populate_active_campaign_counts_computes_user_and_anon_rows(self):
        """One activity row is produced per contributor, including anonymous."""
        camp = create_campaign(slug="ua-camp-a")
        proj = create_project(campaign=camp, slug="ua-proj-a")
        item = create_item(project=proj, item_id="ua-item-a")
        a1 = create_asset(item=item, slug="ua-a1", sequence=1)
        a2 = create_asset(item=item, slug="ua-a2", sequence=2)

        u1 = self.create_test_user("ua-u1")
        u2 = self.create_test_user("ua-u2")
        anon = get_anonymous_user()

        # Transcriptions: u1 wrote 1, u2 wrote 2, anon wrote 1; each of the
        # three reviewed exactly one.
        create_transcription(asset=a1, user=u1, reviewed_by=u2)
        create_transcription(asset=a2, user=u2, reviewed_by=u1)
        create_transcription(asset=a1, user=anon)
        create_transcription(asset=a2, user=u2, reviewed_by=anon)

        # Tag collections: two for u1, none for u2, one for anon.
        t1 = create_tag(value="ua-t1")
        t2 = create_tag(value="ua-t2")
        create_tag_collection(tag=t1, asset=a1, user=u1)
        create_tag_collection(tag=t2, asset=a2, user=u1)
        create_tag_collection(tag=t1, asset=a2, user=anon)

        populate_active_campaign_counts.run()

        rows = UserProfileActivity.objects.filter(campaign=camp)
        self.assertEqual(rows.count(), 3)

        r_u1 = rows.get(user=u1)
        r_u2 = rows.get(user=u2)
        r_an = rows.get(user=anon)

        self.assertEqual(r_u1.asset_count, 2)
        self.assertEqual(r_u1.asset_tag_count, 2)
        self.assertEqual(r_u1.transcribe_count, 1)
        self.assertEqual(r_u1.review_count, 1)

        self.assertEqual(r_u2.asset_count, 2)
        self.assertEqual(r_u2.asset_tag_count, 0)
        self.assertEqual(r_u2.transcribe_count, 2)
        self.assertEqual(r_u2.review_count, 1)

        self.assertEqual(r_an.asset_count, 2)
        self.assertEqual(r_an.asset_tag_count, 1)
        self.assertEqual(r_an.transcribe_count, 1)
        self.assertEqual(r_an.review_count, 1)

    def test_populate_completed_campaign_counts_processes_non_active_only(self):
        """Only the retired campaign gets activity rows; the default one does not."""
        active = create_campaign(slug="ua-act-1")
        p1 = create_project(campaign=active, slug="ua-act-proj")
        it1 = create_item(project=p1, item_id="ua-act-item")
        a_act = create_asset(item=it1, slug="ua-act-a")
        u_act = self.create_test_user("ua-act-u")
        create_transcription(asset=a_act, user=u_act)

        retired = create_campaign(slug="ua-ret-1", status=Campaign.Status.RETIRED)
        p2 = create_project(campaign=retired, slug="ua-ret-proj")
        it2 = create_item(project=p2, item_id="ua-ret-item")
        a_ret = create_asset(item=it2, slug="ua-ret-a")
        u_ret = self.create_test_user("ua-ret-u")
        create_transcription(asset=a_ret, user=u_ret)

        populate_completed_campaign_counts.run()

        self.assertFalse(UserProfileActivity.objects.filter(campaign=active).exists())
        self.assertTrue(UserProfileActivity.objects.filter(campaign=retired).exists())

    def test_update_useractivity_cache_lock_max_retries_sends_email(self):
        """A lock failure with no retries left logs, emails and re-raises."""
        with (
            mock.patch("django.core.cache.cache.add", return_value=False),
            # max_retries is forced to 0 — presumably so the retry budget is
            # already exhausted on the first failure; confirm against the task.
            mock.patch.object(update_useractivity_cache, "max_retries", 0, create=True),
            mock.patch("concordia.tasks.useractivity.send_mail") as m_send,
            mock.patch("concordia.logging.ConcordiaLogger.warning") as m_warn,
            mock.patch("concordia.logging.ConcordiaLogger.exception") as m_exc,
            mock.patch("concordia.tasks.useractivity.logger.error") as m_err,
        ):
            with self.assertRaises(CacheLockedError):
                update_useractivity_cache.run(
                    self.user.id, self.campaign.id, "transcribe"
                )

        # Structured logs were emitted
        self.assertTrue(m_warn.called)
        self.assertTrue(m_exc.called)

        # Email sent with expected subject (first positional argument)
        self.assertTrue(m_send.called)
        sent_args = m_send.call_args.args
        self.assertEqual(
            sent_args[0],
            "Task update_useractivity_cache failed: cache is locked.",
        )
        # Unstructured error log emitted
        self.assertTrue(m_err.called)

    def test_update_useractivity_cache_update_exception_releases_lock(self):
        """An error inside the update still deletes the lock and sends no mail."""
        with (
            mock.patch("concordia.tasks.useractivity.cache.add", return_value=True),
            mock.patch("concordia.tasks.useractivity.cache.delete") as m_del,
            mock.patch(
                "concordia.tasks.useractivity._update_useractivity_cache",
                side_effect=RuntimeError("boom"),
            ),
            mock.patch("concordia.tasks.useractivity.send_mail") as m_mail,
        ):
            with self.assertRaises(RuntimeError):
                update_useractivity_cache.run(self.user.id, self.campaign.id, "review")

        m_del.assert_called_once_with("userprofileactivity_cache_lock")
        m_mail.assert_not_called()


class UpdateUserprofileactivityFromCacheTestCase(CreateTestUsers, TestCase):
    """Tests for ``update_userprofileactivity_from_cache`` with the table
    updater mocked out."""

    def setUp(self):
        """Start from an empty cache with one user, one campaign and its key."""
        cache.clear()
        self.user = self.create_test_user()
        self.campaign = create_campaign()
        self.key = "userprofileactivity_{}".format(self.campaign.pk)

    def test_no_updates(self):
        """A cached ``None`` is logged as "no updates" and nothing is written."""
        with mock.patch(
            "concordia.tasks.useractivity.update_userprofileactivity_table"
        ) as table_updater:
            cache.set(self.key, None)
            with mock.patch("concordia.logging.ConcordiaLogger.debug") as debug_log:
                update_userprofileactivity_from_cache()
                self.assertEqual(debug_log.call_count, 2)
                # Only the most recent debug call is compared here.
                debug_log.assert_called_with(
                    "Cache contained no updates for key. Skipping",
                    event_code="update_userprofileactivity_from_cache_no_updates",
                    key=self.key,
                )
            table_updater.assert_not_called()

    def test_update(self):
        """Cached ``(transcribe, review)`` counts are written, then cleared."""
        with mock.patch(
            "concordia.tasks.useractivity.update_userprofileactivity_table"
        ) as table_updater:
            cache.set(self.key, {self.user.pk: (1, 0)})
            update_userprofileactivity_from_cache()

            expected_writes = [
                mock.call(self.user, self.campaign.id, "transcribe_count", 1),
                mock.call(self.user, self.campaign.id, "review_count", 0),
            ]
            self.assertEqual(table_updater.call_count, 2)
            table_updater.assert_has_calls(expected_writes)
            self.assertIsNone(cache.get(self.key))


================================================
FILE: concordia/tests/test_tasks_visualizations.py
================================================
from datetime import timedelta
from unittest import mock

from django.core.cache import caches
from django.test import TestCase, override_settings
from django.utils import timezone

from concordia.models import Campaign, SiteReport, TranscriptionStatus
from concordia.tasks.visualizations import (
    populate_asset_status_visualization_cache,
    populate_daily_activity_visualization_cache,
)

from .utils import create_asset, create_campaign, create_item, create_project


@override_settings(
    CACHES={
        "default": {
            "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        },
        "visualization_cache": {
            "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        },
    }
)
class VisualizationCacheTasksTests(TestCase):
    """Tests for the tasks that populate the ``visualization_cache`` entries.

    Both cache aliases are overridden with local-memory backends, and the
    visualization cache is cleared before every test.
    """

    class _UploadFailed(Exception):
        """Sentinel error raised by the patched storage ``save`` call."""

    def setUp(self):
        """Bind and empty the visualization cache."""
        self.cache = caches["visualization_cache"]
        self.cache.clear()

    def _create_single_campaign_item(self):
        """Create one active campaign titled "Only" and return an item in it."""
        campaign = create_campaign(status=Campaign.Status.ACTIVE, title="Only")
        project = create_project(campaign=campaign)
        return create_item(project=project)

    def _create_two_total_reports(self, first, second):
        """Create two TOTAL site reports dated two days ago and yesterday.

        ``first`` and ``second`` are ``(transcriptions_saved,
        daily_review_actions)`` pairs for the older and newer report.
        """
        today = timezone.localdate()
        reports = [
            SiteReport.objects.create(
                report_name=SiteReport.ReportName.TOTAL,
                transcriptions_saved=saved,
                daily_review_actions=reviews,
            )
            for saved, reviews in (first, second)
        ]
        # Set specific created_on dates directly in DB
        for report, days_back in zip(reports, (2, 1)):
            SiteReport.objects.filter(pk=report.pk).update(
                created_on=today - timedelta(days=days_back)
            )

    def test_populate_asset_status_visualization_cache(self):
        """Status labels and per-status totals are cached across campaigns."""
        c1 = create_campaign(status=Campaign.Status.ACTIVE, title="Alpha")
        c2 = create_campaign(status=Campaign.Status.ACTIVE, title="Beta")
        p1 = create_project(campaign=c1)
        i1 = create_item(project=p1)
        p2 = create_project(campaign=c2)
        i2 = create_item(project=p2)
        create_asset(item=i1, transcription_status=TranscriptionStatus.NOT_STARTED)
        create_asset(
            item=i2,
            slug="test-asset-2",
            transcription_status=TranscriptionStatus.IN_PROGRESS,
        )
        create_asset(
            item=i2,
            slug="test-asset-3",
            transcription_status=TranscriptionStatus.SUBMITTED,
        )
        create_asset(
            item=i2,
            slug="test-asset-4",
            transcription_status=TranscriptionStatus.COMPLETED,
        )

        populate_asset_status_visualization_cache.run()

        overview = self.cache.get("asset-status-overview")
        expected_labels = [
            TranscriptionStatus.CHOICE_MAP[key]
            for key, _ in TranscriptionStatus.CHOICES
        ]
        self.assertEqual(overview["status_labels"], expected_labels)
        # Totals: 1 not_started, 1 in_progress, 1 submitted, 1 completed
        self.assertEqual(overview["total_counts"], [1, 1, 1, 1])

    def test_populate_daily_activity_visualization_cache(self):
        """Daily saved counts are derived from totals; reviews are used as-is."""
        self._create_two_total_reports((5, 1), (10, 2))

        populate_daily_activity_visualization_cache.run()

        result = self.cache.get("daily-transcription-activity-last-28-days")
        self.assertIsNotNone(result)

        # NOTE(review): the cached date labels are not asserted by this test.

        # Extract the two datasets
        datasets = result["transcription_datasets"]
        self.assertEqual(len(datasets), 2)
        trans = next(ds for ds in datasets if ds["label"] == "Transcriptions")
        reviews = next(ds for ds in datasets if ds["label"] == "Reviews")

        # transcriptions = 5 on date1, 10 - 5 = 5 on date2
        # reviews = 1 on date1, 2 on date2
        self.assertEqual(trans["data"][-2:], [5, 5])  # last two days in the data range
        self.assertEqual(reviews["data"][-2:], [1, 2])

    def test_negative_daily_saved_clamps_to_zero(self):
        """A decreasing saved total yields 0 for that day, not a negative."""
        # The second total (5) is lower than the first (10), which should not
        # happen in real data.
        self._create_two_total_reports((10, 0), (5, 0))

        populate_daily_activity_visualization_cache.run()

        result = self.cache.get("daily-transcription-activity-last-28-days")
        self.assertIsNotNone(result)

        datasets = result["transcription_datasets"]
        trans = next(ds for ds in datasets if ds["label"] == "Transcriptions")

        # Should clamp the second day to 0
        self.assertEqual(trans["data"][-2:], [10, 0])

    def test_asset_status_unchanged_skips_upload_and_cache_update(self):
        """Matching cached counts mean no upload and no cache rewrite."""
        item = self._create_single_campaign_item()
        create_asset(item=item, transcription_status=TranscriptionStatus.NOT_STARTED)
        create_asset(
            item=item, slug="a2", transcription_status=TranscriptionStatus.IN_PROGRESS
        )
        create_asset(
            item=item, slug="a3", transcription_status=TranscriptionStatus.SUBMITTED
        )
        create_asset(
            item=item, slug="a4", transcription_status=TranscriptionStatus.COMPLETED
        )

        expected_counts = [1, 1, 1, 1]

        existing_payload = {
            "status_labels": [
                TranscriptionStatus.CHOICE_MAP[key]
                for key, _ in TranscriptionStatus.CHOICES
            ],
            "total_counts": expected_counts,
            "csv_url": "https://old.example/asset-status.csv",
        }
        self.cache.set("asset-status-overview", existing_payload, None)

        with (
            mock.patch(
                "concordia.tasks.visualizations.VISUALIZATION_STORAGE.save"
            ) as mock_save,
            mock.patch("concordia.tasks.visualizations.structured_logger") as mock_log,
        ):
            populate_asset_status_visualization_cache.run()

            mock_save.assert_not_called()
            # Cache should remain as-is
            self.assertEqual(self.cache.get("asset-status-overview"), existing_payload)
            # Logged unchanged
            self.assertTrue(mock_log.info.called)
            self.assertEqual(
                mock_log.info.call_args.kwargs.get("event_code"),
                "asset_status_vis_unchanged",
            )

    def test_asset_status_upload_failure_with_prior_url_falls_back(self):
        """A failed upload keeps the old CSV URL but caches the new counts."""
        item = self._create_single_campaign_item()
        create_asset(item=item, transcription_status=TranscriptionStatus.NOT_STARTED)

        # Ensure "existing" differs so code takes the non-unchanged path
        self.cache.set(
            "asset-status-overview",
            {
                "status_labels": [],
                "total_counts": [0, 0, 0, 0],
                "csv_url": "https://old.example/asset-status.csv",
            },
            None,
        )

        with (
            mock.patch(
                "concordia.tasks.visualizations.VISUALIZATION_STORAGE.save",
                side_effect=self._UploadFailed("test exception"),
            ),
            mock.patch("concordia.tasks.visualizations.structured_logger") as mock_log,
        ):
            # Should not raise because we have a prior CSV URL to fall back to
            populate_asset_status_visualization_cache.run()

            updated = self.cache.get("asset-status-overview")
            # Counts should reflect the new data (1 in NOT_STARTED; others 0)
            expected = [
                1 if key == TranscriptionStatus.NOT_STARTED else 0
                for key, _ in TranscriptionStatus.CHOICES
            ]
            self.assertEqual(updated["total_counts"], expected)
            # URL should remain the old one
            self.assertEqual(updated["csv_url"], "https://old.example/asset-status.csv")

            # Logged exception with the non-missing-url code
            self.assertTrue(mock_log.exception.called)
            self.assertEqual(
                mock_log.exception.call_args.kwargs.get("event_code"),
                "asset_status_vis_csv_error",
            )

    def test_asset_status_upload_failure_without_prior_url_raises(self):
        """A failed upload with no cached URL is logged and re-raised."""
        item = self._create_single_campaign_item()
        create_asset(item=item, transcription_status=TranscriptionStatus.NOT_STARTED)

        # No existing cache entry, so no prior URL
        with (
            mock.patch(
                "concordia.tasks.visualizations.VISUALIZATION_STORAGE.save",
                side_effect=self._UploadFailed("test exception"),
            ),
            mock.patch("concordia.tasks.visualizations.structured_logger") as mock_log,
        ):
            with self.assertRaises(self._UploadFailed):
                populate_asset_status_visualization_cache.run()

            self.assertTrue(mock_log.exception.called)
            self.assertEqual(
                mock_log.exception.call_args.kwargs.get("event_code"),
                "asset_status_vis_csv_missing_url_error",
            )

    def test_daily_activity_unchanged_skips_upload_and_cache_update(self):
        """Matching cached series mean no upload and no cache rewrite."""
        # With no SiteReports, both series are 28 zeros; pre-populate matching cache
        zeros = [0] * 28
        existing = {
            "labels": [],  # labels do not matter for the dedupe
            "transcription_datasets": [
                {"label": "Transcriptions", "data": zeros},
                {"label": "Reviews", "data": zeros},
            ],
            "csv_url": "https://old.example/daily.csv",
        }
        self.cache.set("daily-transcription-activity-last-28-days", existing, None)

        with (
            mock.patch(
                "concordia.tasks.visualizations.VISUALIZATION_STORAGE.save"
            ) as mock_save,
            mock.patch("concordia.tasks.visualizations.structured_logger") as mock_log,
        ):
            populate_daily_activity_visualization_cache.run()

            mock_save.assert_not_called()
            self.assertEqual(
                self.cache.get("daily-transcription-activity-last-28-days"), existing
            )
            self.assertTrue(mock_log.info.called)
            self.assertEqual(
                mock_log.info.call_args.kwargs.get("event_code"),
                "daily_activity_vis_unchanged",
            )

    def test_daily_activity_upload_failure_with_prior_url_falls_back(self):
        """A failed upload keeps serving the previously cached CSV URL."""
        # Build reports so new data will not be all zeros (ensures "changed" path)
        self._create_two_total_reports((3, 1), (5, 2))

        # Prior cache with different series and a CSV URL to fall back to
        self.cache.set(
            "daily-transcription-activity-last-28-days",
            {
                "labels": [],
                "transcription_datasets": [
                    {"label": "Transcriptions", "data": [0] * 28},
                    {"label": "Reviews", "data": [0] * 28},
                ],
                "csv_url": "https://old.example/daily.csv",
            },
            None,
        )

        with (
            mock.patch(
                "concordia.tasks.visualizations.VISUALIZATION_STORAGE.save",
                side_effect=self._UploadFailed("test exception"),
            ),
            mock.patch("concordia.tasks.visualizations.structured_logger") as mock_log,
        ):
            # Should not raise because we have a prior CSV URL
            populate_daily_activity_visualization_cache.run()

            updated = self.cache.get("daily-transcription-activity-last-28-days")
            self.assertIsNotNone(updated)
            # Still using the old URL
            self.assertEqual(updated["csv_url"], "https://old.example/daily.csv")
            # Logged exception with the non-missing-url code
            self.assertTrue(mock_log.exception.called)
            self.assertEqual(
                mock_log.exception.call_args.kwargs.get("event_code"),
                "daily_activity_vis_csv_error",
            )

    def test_daily_activity_upload_failure_without_prior_url_raises(self):
        """A failed upload with no cached URL is logged and re-raised."""
        # No existing cache entry -> csv_url is None
        with (
            mock.patch(
                "concordia.tasks.visualizations.VISUALIZATION_STORAGE.save",
                side_effect=self._UploadFailed("test exception"),
            ),
            mock.patch("concordia.tasks.visualizations.structured_logger") as mock_log,
        ):
            with self.assertRaises(self._UploadFailed):
                populate_daily_activity_visualization_cache.run()

            self.assertTrue(mock_log.exception.called)
            self.assertEqual(
                mock_log.exception.call_args.kwargs.get("event_code"),
                "daily_activity_vis_csv_missing_url_error",
            )


================================================
FILE: concordia/tests/test_templatetags.py
================================================
from django.http import QueryDict
from django.template import Context, Template
from django.templatetags.static import static
from django.test import TestCase, override_settings
from django.utils.html import escape, format_html

from concordia.models import TranscriptionStatus
from concordia.templatetags.concordia_filtering_tags import transcription_status_filters
from concordia.templatetags.concordia_text_tags import reprchar
from concordia.templatetags.custom_math import multiply
from concordia.templatetags.reject_filter import reject
from concordia.templatetags.truncation import (
    WordBreakTruncator,
    truncatechars_on_word_break,
)
from concordia.templatetags.visualization import concordia_visualization


class TestTemplateTags(TestCase):
    """Tests for concordia's custom template tags and filters."""

    def test_truncatechars_on_word_break(self):
        """Check truncation output for a range of length arguments."""
        sample = "Lorem ipsum \u0317 dolor sit amet, consectetur adipiscing elit"

        # (length argument, expected output); a non-numeric length is expected
        # to leave the string untouched.
        expectations = [
            (0, "[…]"),
            (1, "[…]"),
            (10, "Lorem[…]"),
            (30, "Lorem ipsum \u0317 dolor sit[…]"),
            (1000, sample),
            ("badvalue", sample),
        ]
        for length, expected in expectations:
            self.assertEqual(truncatechars_on_word_break(sample, length), expected)

        # The truncator can also be used directly with a custom suffix.
        truncator = WordBreakTruncator(sample)
        self.assertEqual(
            truncator.word_break(30, "[\u0317]"),
            "Lorem ipsum \u0317 dolor sit[\u0317]",
        )

    def test_multiply(self):
        """``multiply`` should return the product of its two arguments."""
        for left, right in ((5, 5), (0, 5), (1, 2)):
            self.assertEqual(multiply(left, right), left * right)

    def test_transcription_status_filters(self):
        """Smoke test: the tag runs for each argument combination (no asserts)."""
        status_counts = [(choice, 0, 1) for choice in TranscriptionStatus.CHOICES]

        transcription_status_filters(status_counts, "")
        transcription_status_filters(status_counts, "", reversed_order=True)
        transcription_status_filters(status_counts, TranscriptionStatus.CHOICES[0][0])

    def test_qs_alter(self):
        """Render ``qs_alter`` with several operations and compare the output."""

        def render(tag, **variables):
            # Each call builds a fresh Template and a fresh Context so that
            # nothing set by one rendering is visible to the next.
            template = Template("{% load concordia_querystring %}" + tag)
            return template.render(Context(variables or None))

        # A literal query string as the first argument
        self.assertEqual(
            render("{% qs_alter 'bar=baz&baz=taz' foo='bar' %}"),
            "bar=baz&amp;baz=taz&amp;foo=bar",
        )

        data = QueryDict("bar=baz&baz=taz&bar=foo")
        unchanged = "bar=baz&amp;bar=foo&amp;baz=taz"
        cases = [
            ("{% qs_alter data foo='bar' %}", unchanged + "&amp;foo=bar"),
            ("{% qs_alter data delete:bar %}", "baz=taz"),
            ("{% qs_alter data delete:taz %}", unchanged),
            ("{% qs_alter data delete_value:\"bar\",'foo' %}", "bar=baz&amp;baz=taz"),
            ("{% qs_alter data delete_value:'bar','taz' %}", unchanged),
            (
                "{% qs_alter data foo='bar' as new_data %}{{ new_data }}",
                unchanged + "&amp;foo=bar",
            ),
            # Test add_if_missing when the key already exists
            # (should not overwrite)
            ("{% qs_alter data add_if_missing:bar='newvalue' %}", unchanged),
        ]
        for tag, expected in cases:
            self.assertEqual(render(tag, data=data), expected)

    def test_reprchar_variants(self):
        """``reprchar`` output for printable, control and escape characters."""
        expected_by_char = {
            "A": "A",
            "\n": "\\n",
            "\x00": "\\x00",
            "\u200b": "\\u200b",
            "\\": "\\\\",
        }
        for char, expected in expected_by_char.items():
            self.assertEqual(reprchar(char), expected)


class RejectFilterTests(TestCase):
    """Tests for the ``reject`` filter with string and iterable inputs."""

    def test_returns_input_when_falsy(self):
        """Falsy values are expected back unchanged."""
        self.assertEqual(reject("", "x"), "")
        self.assertEqual(reject([], "x"), [])
        self.assertIsNone(reject(None, "x"))
        self.assertEqual(reject((), "x"), ())

    def test_string_single_reject(self):
        """One rejected token is dropped from a space-separated string."""
        filtered = reject("error warn marked-safe", "marked-safe")
        self.assertEqual(filtered, "error warn")

    def test_string_multiple_rejects(self):
        """A comma-separated argument rejects several tokens at once."""
        filtered = reject("error warn marked-safe", "marked-safe,warn")
        self.assertEqual(filtered, "error")

    def test_string_no_match(self):
        """A string without the rejected token is returned as-is."""
        filtered = reject("one two", "three")
        self.assertEqual(filtered, "one two")

    def test_string_empty_args(self):
        """An empty argument rejects nothing."""
        filtered = reject("one two", "")
        self.assertEqual(filtered, "one two")

    def test_string_whitespace_split_and_join(self):
        """Mixed whitespace in the input collapses to single spaces."""
        filtered = reject("a   b\tc", "b")
        self.assertEqual(filtered, "a c")

    def test_string_case_sensitivity(self):
        """Matching is case-sensitive: "a" does not reject "A"."""
        filtered = reject("A a", "a")
        self.assertEqual(filtered, "A")

    def test_iterable_list(self):
        """Rejected members are removed from a list."""
        source = ["ok", "deprecated", "x", "hidden"]
        self.assertEqual(reject(source, "deprecated,hidden"), ["ok", "x"])

    def test_iterable_tuple_and_duplicates(self):
        """A tuple yields a list, with every occurrence of the token removed."""
        source = ("a", "b", "c", "b")
        self.assertEqual(reject(source, "b"), ["a", "c"])

    def test_iterable_no_match(self):
        """A list without the rejected token keeps all of its members."""
        source = ["one", "two"]
        self.assertEqual(reject(source, "three"), ["one", "two"])

    def test_iterable_empty_args(self):
        """An empty argument leaves a list unchanged."""
        source = ["one", "two"]
        self.assertEqual(reject(source, ""), ["one", "two"])


@override_settings(
    STORAGES={
        "default": {"BACKEND": "django.core.files.storage.FileSystemStorage"},
        "staticfiles": {
            "BACKEND": "django.contrib.staticfiles.storage.StaticFilesStorage",
        },
    },
    STATICFILES_STORAGE="django.contrib.staticfiles.storage.StaticFilesStorage",
)
class VisualizationTagsTests(TestCase):
    """
    Tests for the ``concordia_visualization`` template tag.

    Static files storage is overridden with the plain ``StaticFilesStorage``
    backend for the duration of these tests.
    """

    def test_without_attrs_renders_section_and_script(self):
        # No attributes: the tag output must match the bare container markup.
        # Only the container/section/canvas markup is compared here; no
        # <script> element is part of the expected output.
        result = concordia_visualization("daily-activity")
        expected_section = (
            '<div class="visualization-container"><section>'
            '<canvas id="daily-activity"></canvas></section></div>'
        )
        self.assertHTMLEqual(result, expected_section)

    def test_with_attrs_and_escaping(self):
        # Attributes that include characters needing HTML escaping
        attrs = {"class": "test-class", "style": "width:100%;", "data-info": "<alert>"}
        result = concordia_visualization("chart1", **attrs)

        escaped_value = escape("<alert>")
        # Only the line that interpolates a value needs to be an f-string.
        expected_section = (
            '<div class="visualization-container test-class" '
            f'style="width:100%;" data-info="{escaped_value}">'
            "<section >"
            '<canvas id="chart1"></canvas>'
            "</section>"
            "</div>"
        )
        self.assertHTMLEqual(result, expected_section)

    def test_name_escaping_in_id_and_script_src(self):
        # Name contains characters needing HTML escaping
        name = 'x"><script>alert(1)</script>'
        script_src = static(f"js/visualizations/{name}.js")
        # NOTE(review): the <script> element is assembled by this test with
        # format_html and appended to the tag output, so the ``src`` assertion
        # below exercises format_html's escaping rather than the tag itself.
        script_html = format_html(
            '<script type="module" src="{}"></script>', script_src
        )
        result = concordia_visualization(name) + script_html

        # The id attribute must have the name escaped
        self.assertIn(f'id="{escape(name)}"', result)

        # The script src must also be escaped
        self.assertIn(f'src="{escape(script_src)}"', result)


================================================
FILE: concordia/tests/test_top_level_views.py
================================================
"""
Tests for the top-level & “CMS” views
"""

from unittest.mock import patch

from django.core.cache import cache
from django.test import RequestFactory, TestCase
from django.urls import reverse
from maintenance_mode.core import get_maintenance_mode, set_maintenance_mode

from concordia.models import (
    Banner,
    CarouselSlide,
    Guide,
    OverlayPosition,
    SimplePage,
    SiteReport,
)
from concordia.views.simple_pages import simple_page

from .utils import (
    CacheControlAssertions,
    CreateTestUsers,
    JSONAssertMixin,
    create_guide,
    create_site_report,
)


class TopLevelViewTests(
    JSONAssertMixin, CreateTestUsers, CacheControlAssertions, TestCase
):
    """
    Request-level tests for the health check, homepage, contact redirect and
    the ``SimplePage``-backed views.
    """

    def setUp(self):
        # Every test starts with an empty cache...
        cache.clear()

    def tearDown(self):
        # ...and leaves one behind.
        cache.clear()

    def _assert_homepage_ok(self):
        """Fetch the homepage, check status and template, return its context."""
        response = self.client.get(reverse("homepage"))
        context = response.context
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, "home.html")
        return context

    def test_healthz(self):
        """The health endpoint returns JSON containing the expected keys."""
        payload = self.assertValidJSON(self.client.get("/healthz"))

        expected_keys = (
            "current_time",
            "load_average",
            "debug",
            "database_has_data",
            "application_version",
        )
        for key in expected_keys:
            self.assertIn(key, payload)

    def test_homepage(self):
        """The homepage renders bare, with an active banner, and with a slide."""
        # Nothing configured
        self._assert_homepage_ok()

        # With an active banner
        banner = Banner.objects.create(
            slug="test-banner", text="Test Banner", active=True
        )
        context = self._assert_homepage_ok()
        self.assertIn("banner", context)
        self.assertEqual(context["banner"].text, banner.text)
        banner.delete()

        # With a published carousel slide
        slide = CarouselSlide.objects.create(
            published=True,
            overlay_position=OverlayPosition.LEFT,
            headline="Test Headline",
        )
        context = self._assert_homepage_ok()
        self.assertIn("firstslide", context)
        self.assertEqual(context["firstslide"].headline, slide.headline)
        slide.delete()

    def test_contact_us_redirect(self):
        """The contact URL issues a 302 to the external help site."""
        response = self.client.get(reverse("contact"))

        self.assertEqual(response.status_code, 302)
        self.assertEqual(response["Location"], "https://ask.loc.gov/crowd")

    def test_simple_page(self):
        """English and Spanish welcome guides render from SimplePage rows."""
        english_path = reverse("welcome-guide")
        spanish_path = reverse("welcome-guide-spanish")

        english_page = SimplePage.objects.create(
            title="Get Started 123",
            body="not the real body",
            path=english_path,
        )
        spanish_page = SimplePage.objects.create(
            title="Get Started Spanish 123",
            body="not the real spanish body",
            path=spanish_path,
        )

        resp = self.client.get(english_path)
        self.assertEqual(200, resp.status_code)
        self.assertEqual(english_page.title, resp.context["title"])
        self.assertEqual(
            [(english_path, english_page.title)], resp.context["breadcrumbs"]
        )
        self.assertEqual(resp.context["body"], f"<p>{english_page.body}</p>")

        # Call the view function directly with an explicit path argument
        request = RequestFactory().get("/")
        resp = simple_page(request, path=english_path)
        self.assertEqual(200, resp.status_code)

        resp = self.client.get(spanish_path)
        self.assertEqual(200, resp.status_code)
        self.assertEqual(spanish_page.title, resp.context["title"])
        self.assertEqual("es", resp.context["language_code"])
        self.assertEqual(
            [(spanish_path, spanish_page.title)], resp.context["breadcrumbs"]
        )
        self.assertEqual(resp.context["body"], f"<p>{spanish_page.body}</p>")

    def test_nested_simple_page(self):
        """A nested page lists its parent page first in the breadcrumbs."""
        parent_path = reverse("welcome-guide")
        child_path = reverse("how-to-tag")

        Guide.objects.create(title="How to Tag")
        parent_page = SimplePage.objects.create(
            title="Get Started",
            body="not the real body",
            path=parent_path,
        )
        child_page = SimplePage.objects.create(
            title="How to Tag",
            body="This is _not_ the real page",
            path=child_path,
        )

        resp = self.client.get(child_path)
        self.assertEqual(200, resp.status_code)
        self.assertEqual(child_page.title, resp.context["title"])
        self.assertEqual(
            resp.context["breadcrumbs"],
            [(parent_path, parent_page.title), (child_path, child_page.title)],
        )
        self.assertHTMLEqual(
            resp.context["body"], "<p>This is <em>not</em> the real page</p>"
        )

        # The parent page must still render once a guide is attached to it
        create_guide(page=parent_page)
        resp = self.client.get(parent_path)
        self.assertEqual(200, resp.status_code)

    def test_simple_page_with_context(self):
        """The about page body is rendered with site report totals."""
        path = reverse("about")
        page_body = (
            "<p>{{ assets_published}}</p> "
            "<p>{{ campaigns_published }}</p> "
            "<p>{{ assets_completed }}</p> "
            "<p>{{ assets_waiting_review }}</p> "
            "<p>{{ users_activated }}</p>"
        )
        about_page = SimplePage.objects.create(
            title="About",
            body=page_body,
            path=path,
        )

        def rendered_body():
            # Request the page and return only the rendered body.
            return self.client.get(path).context["body"]

        # Test with no SiteReports
        response = self.client.get(path)
        context = response.context
        self.assertEqual(200, response.status_code)
        self.assertEqual(about_page.title, context["title"])
        self.assertEqual([(path, about_page.title)], context["breadcrumbs"])
        self.assertEqual(
            context["body"], "<p>0</p>\n<p>0</p>\n<p>0</p>\n<p>0</p>\n<p>0</p>"
        )

        # Test with only active SiteReport
        cache.clear()
        create_site_report(
            report_name=SiteReport.ReportName.TOTAL,
            campaigns_published=1,
            assets_published=1,
            assets_completed=1,
            assets_waiting_review=1,
            users_activated=1,
        )
        self.assertEqual(
            rendered_body(), "<p>1</p>\n<p>1</p>\n<p>1</p>\n<p>1</p>\n<p>1</p>"
        )

        # Test with both SiteReports, but with cached values from above
        # So we should expect the retired SiteReport to not be included in data
        create_site_report(
            report_name=SiteReport.ReportName.RETIRED_TOTAL,
            assets_published=1,
            assets_completed=1,
            assets_waiting_review=1,
        )
        self.assertEqual(
            rendered_body(), "<p>1</p>\n<p>1</p>\n<p>1</p>\n<p>1</p>\n<p>1</p>"
        )

        # Test without bad cached data
        cache.clear()
        self.assertEqual(
            rendered_body(), "<p>2</p>\n<p>1</p>\n<p>2</p>\n<p>2</p>\n<p>1</p>"
        )


class HelpCenterRedirectTests(TestCase):
    """Old ``/help-center/`` URLs must redirect to the matching SimplePage."""

    def test_HelpCenterRedirectView(self):
        """An English help-center URL redirects under ``/get-started/``."""
        destination = "/get-started/page/"
        SimplePage.objects.create(
            title="Get Started Page",
            body="Page Body",
            path=destination,
        )

        response = self.client.get("/help-center/page/")
        self.assertRedirects(response, destination)

    def test_HelpCenterSpanishRedirectView(self):
        """A Spanish help-center URL redirects under ``/get-started-esp/``."""
        destination = "/get-started-esp/page-esp/"
        SimplePage.objects.create(
            title="Get Started Page",
            body="Page Body",
            path=destination,
        )

        response = self.client.get("/help-center/page-esp/")
        self.assertRedirects(response, destination)


class MaintenanceModeTests(TestCase, CreateTestUsers):
    """
    Tests for the maintenance-mode toggle views.

    Each test issues the same request twice: once as a superuser, where the
    toggle is expected to take effect, and once as a regular test user, where
    the state is expected to stay as it was.
    """

    FRONTEND_KEY = "maintenance_mode_frontend_available"

    def setUp(self):
        cache.clear()
        self.timestamp_value = 1
        self.user = None

    def tearDown(self):
        # Some tests finish with maintenance mode switched on. Turn it off
        # explicitly so the state cannot leak into later tests when the
        # maintenance-mode state backend is not the cache cleared below.
        set_maintenance_mode(False)
        cache.clear()

    def _login_as(self, user):
        """Store ``user`` on the test case and log the test client in as them."""
        self.user = user
        self.login_user()

    def _assert_timestamp_redirect(self, url_name, **redirect_kwargs):
        """
        GET ``url_name`` with ``time`` patched in the view module and assert a
        redirect to ``/?t=<timestamp>``.

        Extra keyword arguments (e.g. ``target_status_code``) are passed
        through to ``assertRedirects``.
        """
        with patch("concordia.views.maintenance_mode.time") as mock_time:
            mock_time.return_value = self.timestamp_value
            self.assertRedirects(
                self.client.get(reverse(url_name)),
                f"/?t={self.timestamp_value}",
                **redirect_kwargs,
            )

    def test_maintenance_mode_off(self):
        # Superuser: maintenance mode is switched off
        self._login_as(self.create_super_user())
        set_maintenance_mode(True)
        self._assert_timestamp_redirect("maintenance_mode_off")
        self.assertEqual(get_maintenance_mode(), False)

        # Regular user: mode stays on, so the redirect target answers 503
        self._login_as(self.create_test_user())
        set_maintenance_mode(True)
        self._assert_timestamp_redirect("maintenance_mode_off", target_status_code=503)
        self.assertEqual(get_maintenance_mode(), True)

    def test_maintenance_mode_on_without_frontend(self):
        cache.set(self.FRONTEND_KEY, False, None)

        # Superuser: mode is switched on; the redirect target answers 503
        self._login_as(self.create_super_user())
        set_maintenance_mode(False)
        self._assert_timestamp_redirect("maintenance_mode_on", target_status_code=503)
        self.assertEqual(get_maintenance_mode(), True)

        # Regular user: nothing changes
        self._login_as(self.create_test_user())
        set_maintenance_mode(False)
        self._assert_timestamp_redirect("maintenance_mode_on")
        self.assertEqual(get_maintenance_mode(), False)

    def test_maintenance_mode_on_with_frontend(self):
        cache.set(self.FRONTEND_KEY, True, None)

        # Superuser: mode is switched on and the redirect target still loads
        self._login_as(self.create_super_user())
        set_maintenance_mode(False)
        self._assert_timestamp_redirect("maintenance_mode_on")
        self.assertEqual(get_maintenance_mode(), True)

        # Regular user: nothing changes
        self._login_as(self.create_test_user())
        set_maintenance_mode(False)
        self._assert_timestamp_redirect("maintenance_mode_on")
        self.assertEqual(get_maintenance_mode(), False)

    def test_maintenance_mode_frontend_available(self):
        # Superuser: the cached flag flips to True
        self._login_as(self.create_super_user())
        cache.set(self.FRONTEND_KEY, False, None)
        self._assert_timestamp_redirect("maintenance_mode_frontend_available")
        self.assertEqual(cache.get(self.FRONTEND_KEY), True)

        # Regular user: the cached flag is left alone
        self._login_as(self.create_test_user())
        cache.set(self.FRONTEND_KEY, False, None)
        self._assert_timestamp_redirect("maintenance_mode_frontend_available")
        self.assertEqual(cache.get(self.FRONTEND_KEY), False)

    def test_maintenance_mode_frontend_unavailable(self):
        # Superuser: the cached flag flips to False
        self._login_as(self.create_super_user())
        cache.set(self.FRONTEND_KEY, True, None)
        self._assert_timestamp_redirect("maintenance_mode_frontend_unavailable")
        self.assertEqual(cache.get(self.FRONTEND_KEY), False)

        # Regular user: the cached flag is left alone
        self._login_as(self.create_test_user())
        cache.set(self.FRONTEND_KEY, True, None)
        self._assert_timestamp_redirect("maintenance_mode_frontend_unavailable")
        self.assertEqual(cache.get(self.FRONTEND_KEY), True)


================================================
FILE: concordia/tests/test_utils_celery.py
================================================
from types import SimpleNamespace
from unittest import mock

from django.test import TestCase

from concordia.utils.celery import get_registered_task


class CeleryUtilsTests(TestCase):
    """Tests for ``get_registered_task`` against a stand-in Celery app."""

    APP_PATH = "concordia.utils.celery.concordia_celery_app"

    def test_get_registered_task_returns_task_from_registry(self):
        """A registered name returns the exact object held in ``app.tasks``."""
        task_name = "pkg.tasks.do_thing"
        registered = object()
        fake_app = SimpleNamespace(
            tasks={task_name: registered}, send_task=mock.Mock()
        )

        with mock.patch(self.APP_PATH, fake_app):
            result = get_registered_task(task_name)

        self.assertIs(result, registered)
        fake_app.send_task.assert_not_called()

    def test_get_registered_task_raises_runtime_error_with_cause(self):
        """An unknown name raises RuntimeError chained from a KeyError."""
        task_name = "pkg.tasks.missing"
        fake_app = SimpleNamespace(tasks={}, send_task=mock.Mock())

        with mock.patch(self.APP_PATH, fake_app), self.assertRaises(
            RuntimeError
        ) as raised:
            get_registered_task(task_name)

        error = raised.exception
        text = str(error)
        self.assertIn(f"Task {task_name} is not registered.", text)
        self.assertIn("Did you typo it?", text)
        self.assertIsInstance(error.__cause__, KeyError)
        fake_app.send_task.assert_not_called()


================================================
FILE: concordia/tests/test_utils_logging.py
================================================
from types import SimpleNamespace

from django.test import TestCase

from concordia.logging import get_logging_user_id
from concordia.utils import get_anonymous_user

from .utils import CreateTestUsers


class LoggingTests(CreateTestUsers, TestCase):
    """Tests for ``get_logging_user_id`` with different kinds of user object."""

    def test_get_logging_user_id_authenticated_user(self):
        """A real, saved user is identified by the string form of its id."""
        account = self.create_test_user()
        logged_id = get_logging_user_id(account)
        self.assertEqual(logged_id, str(account.id))

    def test_get_logging_user_id_anonymous_user(self):
        """The project's anonymous user is reported as "anonymous"."""
        logged_id = get_logging_user_id(get_anonymous_user())
        self.assertEqual(logged_id, "anonymous")

    def test_get_logging_user_id_missing_auth_attribute(self):
        """An object without any auth attributes is reported as "anonymous"."""
        bare_object = object()
        self.assertEqual(get_logging_user_id(bare_object), "anonymous")

    def test_get_logging_user_id_authenticated_no_id(self):
        """An authenticated object that has no ``id`` is reported as "anonymous"."""
        id_less_user = SimpleNamespace(is_authenticated=True, username="someuser")
        self.assertEqual(get_logging_user_id(id_less_user), "anonymous")


================================================
FILE: concordia/tests/test_utils_next_asset_reviewable_campaign.py
================================================
from unittest.mock import MagicMock, patch

from django.test import TestCase
from django.utils.timezone import now

from concordia.models import (
    AssetTranscriptionReservation,
    NextReviewableCampaignAsset,
)
from concordia.utils import get_anonymous_user
from concordia.utils.next_asset import (
    find_new_reviewable_campaign_assets,
    find_next_reviewable_campaign_asset,
    find_reviewable_campaign_asset,
)
from concordia.utils.next_asset.reviewable.campaign import (
    _eligible_reviewable_base_qs,
    _find_reviewable_in_item,
    _find_reviewable_in_project,
    _next_seq_after,
    _reserved_asset_ids_subq,
    find_and_order_potential_reviewable_campaign_assets,
    find_invalid_next_reviewable_campaign_assets,
)

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_transcription,
)


class NextReviewableCampaignAssetTests(CreateTestUsers, TestCase):
    """
    Tests for the public helpers that choose the next reviewable asset in a
    campaign.

    ``setUp`` creates two assets in the same item (sequences 1 and 2), a
    regular test user and the anonymous user.
    """

    def setUp(self):
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        self.asset1 = create_asset(sequence=1)
        self.asset2 = create_asset(
            item=self.asset1.item, sequence=2, slug="test-asset-2"
        )
        self.campaign = self.asset1.campaign

    def _cache_next_reviewable(self, asset, transcriber_ids=()):
        """
        Create a ``NextReviewableCampaignAsset`` row for ``asset`` in
        ``self.campaign``, copying item/project/sequence data from the asset.
        """
        item = asset.item
        project = item.project
        return NextReviewableCampaignAsset.objects.create(
            asset=asset,
            campaign=self.campaign,
            item=item,
            item_item_id=item.item_id,
            project=project,
            project_slug=project.slug,
            sequence=asset.sequence,
            transcriber_ids=list(transcriber_ids),
        )

    def test_find_new_reviewable_campaign_assets_filters_correctly(self):
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())

        queryset = find_new_reviewable_campaign_assets(self.campaign, self.user)
        self.assertIn(self.asset1, queryset)

    def test_find_new_reviewable_campaign_assets_without_user(self):
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())
        # Exercise the code path taken when no user is supplied.
        queryset = find_new_reviewable_campaign_assets(self.campaign, None)
        self.assertIn(self.asset1, queryset)

    def test_find_reviewable_campaign_asset_from_next_table(self):
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())
        self._cache_next_reviewable(self.asset1)

        asset = find_reviewable_campaign_asset(self.campaign, self.user)
        self.assertEqual(asset, self.asset1)

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_find_reviewable_campaign_asset_falls_back_and_spawns_task(
        self, mock_get_task
    ):
        # No NextReviewableCampaignAsset rows exist here, and the test expects
        # the populate task to be looked up and queued.
        create_transcription(asset=self.asset2, user=self.anon, submitted=now())
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        asset = find_reviewable_campaign_asset(self.campaign, self.user)
        self.assertEqual(asset, self.asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_find_next_reviewable_campaign_asset_orders_and_falls_back(
        self, mock_get_task
    ):
        """
        With short-circuiting: project-level returns the eligible asset
        and we do not spawn a task.
        """
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        asset = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(asset, self.asset1)
        # Short-circuit satisfied -> no cache fallback -> no task spawned
        self.assertFalse(mock_get_task.called)
        self.assertFalse(mock_task.delay.called)

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_find_next_reviewable_campaign_asset_when_next_asset_exists(
        self, mock_get_task
    ):
        create_transcription(asset=self.asset2, user=self.anon, submitted=now())
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        self._cache_next_reviewable(self.asset2)

        asset = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug=self.asset2.item.project.slug,
            item_id=self.asset2.item.item_id,
            # The asset preceding asset2 in the item; referenced directly
            # rather than assuming primary keys are consecutive.
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(asset, self.asset2)
        self.assertFalse(mock_get_task.called)
        self.assertFalse(mock_task.delay.called)

    def test_short_circuit_same_item_excludes_users_own_work(self):
        """
        Reviewable item short-circuit must not return assets
        transcribed by the requesting user.
        """
        # Two submitted in same item: one by self.user, one by anon
        mine = self.asset1
        other = self.asset2
        create_transcription(asset=mine, user=self.user, submitted=now())
        create_transcription(asset=other, user=self.anon, submitted=now())

        chosen = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug=mine.item.project.slug,
            item_id=mine.item.item_id,
            original_asset_id=mine.id,
        )
        self.assertEqual(chosen, other)

    def test_item_short_circuit_reviewable_respects_after_sequence_and_reservations(
        self,
    ):
        """
        Item reviewable short-circuit should choose next by sequence
        and skip reserved assets.
        """
        # Three submitted in the same item (none by self.user)
        asset1 = self.asset1
        asset2 = self.asset2
        asset3 = create_asset(item=asset1.item, sequence=3, slug="rev-a3")
        for asset in (asset1, asset2, asset3):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        lookup_kwargs = {
            "project_slug": asset1.item.project.slug,
            "item_id": asset1.item.item_id,
            "original_asset_id": asset1.id,
        }

        # After asset1, pick asset2
        chosen = find_next_reviewable_campaign_asset(
            self.campaign, self.user, **lookup_kwargs
        )
        self.assertEqual(chosen, asset2)

        # Reserve asset2, so should pick asset3
        AssetTranscriptionReservation.objects.create(
            asset=asset2, reservation_token="rv"  # nosec
        )
        chosen2 = find_next_reviewable_campaign_asset(
            self.campaign, self.user, **lookup_kwargs
        )
        self.assertEqual(chosen2, asset3)

    def test_project_short_circuit_when_item_has_only_users_work(self):
        """
        If the only SUBMITTED assets in the item were transcribed by the user,
        the function should fall back to other assets in the same project.
        """
        # Item-level: only user's work
        create_transcription(asset=self.asset1, user=self.user, submitted=now())
        create_transcription(asset=self.asset2, user=self.user, submitted=now())

        # Project-level: someone else's work
        other_item = create_item(project=self.asset1.item.project, item_id="p2")
        project_asset = create_asset(item=other_item, slug="rev-p-asset")
        create_transcription(asset=project_asset, user=self.anon, submitted=now())

        chosen = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(chosen, project_asset)

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_cache_excludes_user_and_triggers_spawn_task(self, mock_get_task):
        """
        When the only cached asset is excluded via transcriber_ids containing the user,
        the function should skip cache, fall back to manual and spawn a populate task.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Cached entry references the user's own work (excluded by contains)
        create_transcription(asset=self.asset1, user=self.user, submitted=now())
        self._cache_next_reviewable(self.asset1, transcriber_ids=[self.user.id])

        # A valid reviewable exists elsewhere
        other = create_asset(item=self.asset1.item, sequence=3, slug="rev-other")
        create_transcription(asset=other, user=self.anon, submitted=now())

        # Pass empty project/item to ensure we hit cache (and thus spawn task)
        chosen = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id=None,
        )
        self.assertEqual(chosen, other)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)


class ReviewableCampaignInternalsTests(CreateTestUsers, TestCase):
    def setUp(self):
        """Create a test user plus two assets (sequences 1 and 2) in one item."""
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        first = create_asset(sequence=1, slug="rc-a1")
        # The second asset reuses the first asset's item with a higher sequence.
        second = create_asset(item=first.item, sequence=2, slug="rc-a2")
        self.asset1, self.asset2 = first, second
        self.campaign = first.campaign

    def test_reserved_asset_ids_subq_filters_to_campaign(self):
        """Reserved ids for self.campaign omit a reservation in another campaign."""
        reserve = AssetTranscriptionReservation.objects.create
        reserve(asset=self.asset1, reservation_token="r1")  # nosec

        # Build a second campaign that has its own reserved asset.
        foreign_campaign = create_campaign(slug="rc-camp-a", title="rc-camp-a")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="rc-proj-a", title="rc-proj-a"
        )
        foreign_item = create_item(project=foreign_project, item_id="rc-other-item")
        foreign_asset = create_asset(item=foreign_item, slug="rc-other-camp-a")
        reserve(asset=foreign_asset, reservation_token="r2")  # nosec

        reserved_rows = _reserved_asset_ids_subq(self.campaign)
        reserved_ids = set(reserved_rows.values_list("asset_id", flat=True))

        self.assertIn(self.asset1.id, reserved_ids)
        self.assertNotIn(foreign_asset.id, reserved_ids)

    def test_eligible_reviewable_base_qs_excludes_user_and_requires_submitted(self):
        """
        asset1 is submitted by anon, asset2 by the user, and a third asset has
        no transcription; membership is checked with and without a user.
        """
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())
        create_transcription(asset=self.asset2, user=self.user, submitted=now())
        untranscribed = create_asset(item=self.asset1.item, sequence=3, slug="rc-a3")

        # (user passed in, assets expected present, assets expected absent)
        expectations = (
            (self.user, (self.asset1,), (self.asset2, untranscribed)),
            (None, (self.asset1, self.asset2), (untranscribed,)),
        )
        for viewer, included, excluded in expectations:
            eligible = _eligible_reviewable_base_qs(self.campaign, user=viewer)
            for asset in included:
                self.assertIn(asset, eligible)
            for asset in excluded:
                self.assertNotIn(asset, eligible)

    def test_next_seq_after_none_missing_and_valid(self):
        """None and pk 99999999 give None; asset2's pk gives asset2's sequence."""
        for absent in (None, 99999999):
            self.assertIsNone(_next_seq_after(absent))
        known = self.asset2
        self.assertEqual(_next_seq_after(known.pk), known.sequence)

    def test_find_reviewable_in_item_after_none_returns_first(self):
        """With no after-asset, the item lookup is expected to yield asset1."""
        for asset in (self.asset1, self.asset2):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        target_item_id = self.asset1.item.item_id
        found = _find_reviewable_in_item(
            self.campaign, self.user, item_id=target_item_id, after_asset_pk=None
        )
        self.assertEqual(found, self.asset1)

    def test_find_reviewable_in_item_after_asset_in_other_item_ignores_gate(self):
        """
        The after-asset lives in a different item of the same project; the
        lookup for asset1's item is still expected to return asset1.
        """
        for asset in (self.asset1, self.asset2):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        home_item = self.asset1.item
        sibling_item = create_item(project=home_item.project, item_id="rc-other-item")
        outsider = create_asset(item=sibling_item, slug="rc-other-asset")
        create_transcription(asset=outsider, user=self.anon, submitted=now())

        found = _find_reviewable_in_item(
            self.campaign,
            self.user,
            item_id=home_item.item_id,
            after_asset_pk=outsider.id,
        )
        self.assertEqual(found, self.asset1)

    def test_find_reviewable_in_item_after_asset_missing_ignores_gate(self):
        """
        An after-asset pk of 987654321 (the "missing" case this test is named
        for) is still expected to yield asset1.
        """
        for asset in (self.asset1, self.asset2):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        target_item_id = self.asset1.item.item_id
        found = _find_reviewable_in_item(
            self.campaign,
            self.user,
            item_id=target_item_id,
            after_asset_pk=987654321,
        )
        self.assertEqual(found, self.asset1)

    def test_find_reviewable_in_item_after_asset_sidc_ignores_gate(self):
        """
        The after-asset belongs to another campaign whose item reuses asset1's
        item_id; the lookup within self.campaign should still return asset1.
        """
        for asset in (self.asset1, self.asset2):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        shared_item_id = self.asset1.item.item_id

        # A second campaign containing an item with the very same item_id.
        foreign_campaign = create_campaign(slug="rc-camp-b", title="rc-camp-b")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="rc-proj-b", title="rc-proj-b"
        )
        foreign_item = create_item(project=foreign_project, item_id=shared_item_id)
        foreign_asset = create_asset(item=foreign_item, slug="rc-cross-camp")
        create_transcription(asset=foreign_asset, user=self.anon, submitted=now())

        found = _find_reviewable_in_item(
            self.campaign,
            self.user,
            item_id=shared_item_id,
            after_asset_pk=foreign_asset.id,
        )
        self.assertEqual(found, self.asset1)

    def test_find_reviewable_in_project_orders_and_excludes_user(self):
        """
        A second item holds the user's own submission (sequence 1) and an
        anonymous one (sequence 2); the project lookup should pick the latter.
        """
        project = self.asset1.item.project
        second_item = create_item(project=project, item_id="rc-p-item")
        own_asset = create_asset(item=second_item, sequence=1, slug="rc-p-mine")
        anon_asset = create_asset(item=second_item, sequence=2, slug="rc-p-theirs")
        create_transcription(asset=own_asset, user=self.user, submitted=now())
        create_transcription(asset=anon_asset, user=self.anon, submitted=now())

        found = _find_reviewable_in_project(
            self.campaign,
            self.user,
            project_slug=project.slug,
            after_asset_pk=self.asset1.id,
        )
        self.assertEqual(found, anon_asset)

    def test_find_reviewable_in_project_returns_none_when_only_users_work(self):
        """The only submission in the project is the user's own, so expect None."""
        project = self.asset1.item.project
        second_item = create_item(project=project, item_id="rc-p2")
        own_asset = create_asset(item=second_item, sequence=1, slug="rc-p2-mine")
        create_transcription(asset=own_asset, user=self.user, submitted=now())

        found = _find_reviewable_in_project(
            self.campaign,
            self.user,
            project_slug=project.slug,
            after_asset_pk=self.asset1.id,
        )
        self.assertIsNone(found)

    def test_find_new_reviewable_campaign_assets_excludes_reserved_and_next_table(
        self,
    ):
        """
        Neither a reserved asset nor an asset that already has a
        NextReviewableCampaignAsset row may appear among the new candidates.

        Both assets receive an anonymous submitted transcription, so the
        reservation and the cache row are the only things that set them apart.
        """
        asset_reserved = create_asset(
            item=self.asset1.item, sequence=3, slug="rc-a-res"
        )
        asset_cached = create_asset(
            item=self.asset1.item, sequence=4, slug="rc-a-cached"
        )
        for asset in (asset_reserved, asset_cached):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        AssetTranscriptionReservation.objects.create(
            asset=asset_reserved, reservation_token="rv"  # nosec
        )

        NextReviewableCampaignAsset.objects.create(
            asset=asset_cached,
            campaign=self.campaign,
            item=asset_cached.item,
            item_item_id=asset_cached.item.item_id,
            project=asset_cached.item.project,
            project_slug=asset_cached.item.project.slug,
            sequence=asset_cached.sequence,
            transcriber_ids=[],
        )

        queryset = find_new_reviewable_campaign_assets(self.campaign, self.user)
        self.assertNotIn(asset_reserved, queryset)
        self.assertNotIn(asset_cached, queryset)

    def test_find_and_order_potential_reviewable_campaign_assets_ordering(self):
        """
        Three cached candidates exist: one in asset1's item, one in another
        item of the same project, and one in another project. With asset1 as
        the reference asset they are expected back in that order.
        """
        anchor_item = self.asset1.item

        in_item = create_asset(item=anchor_item, sequence=10, slug="rc-ci-next")

        sibling_item = create_item(project=anchor_item.project, item_id="rc-it-2")
        in_project = create_asset(item=sibling_item, sequence=5, slug="rc-p-next")

        second_project = create_project(
            campaign=self.campaign, slug="rc-proj", title="rc-proj"
        )
        second_project_item = create_item(project=second_project, item_id="rc-it-3")
        elsewhere = create_asset(item=second_project_item, sequence=1, slug="rc-op")

        candidates = (in_item, in_project, elsewhere)
        for asset in candidates:
            create_transcription(asset=asset, user=self.anon, submitted=now())

        # One cache row per candidate, created after all transcriptions exist.
        for asset in candidates:
            NextReviewableCampaignAsset.objects.create(
                asset=asset,
                campaign=self.campaign,
                item=asset.item,
                item_item_id=asset.item.item_id,
                project=asset.item.project,
                project_slug=asset.item.project.slug,
                sequence=asset.sequence,
                transcriber_ids=[],
            )

        ranked = find_and_order_potential_reviewable_campaign_assets(
            self.campaign,
            self.user,
            project_slug=anchor_item.project.slug,
            item_id=anchor_item.item_id,
            asset_pk=self.asset1.id,
        )
        ranked_ids = list(ranked.values_list("asset_id", flat=True))

        self.assertEqual(ranked_ids[0], in_item.id)
        self.assertEqual(ranked_ids[1], in_project.id)
        self.assertIn(elsewhere.id, ranked_ids[2:])

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_find_reviewable_campaign_asset_no_eligible_spawns_task_and_returns_none(
        self, mock_get_task
    ):
        """No transcriptions are created here; expect None and a delay() call."""
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        self.assertIsNone(find_reviewable_campaign_asset(self.campaign, self.user))
        mock_get_task.assert_called()
        spawn.assert_called()

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_manual_fallback_orders_and_spawns_task(self, mock_get_task):
        """
        No cache rows exist. Two submitted assets (sequences 7 and 8) are
        created and the first is passed as the original asset; the second is
        expected back and delay() is expected to have been called.
        """
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        item = self.asset1.item
        earlier = create_asset(item=item, sequence=7, slug="rc-mf-x")
        later = create_asset(item=item, sequence=8, slug="rc-mf-y")
        for asset in (earlier, later):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        # Using `earlier` as the original asset should make `later` the result.
        result = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id=earlier.id,
        )

        self.assertEqual(result, later)
        mock_get_task.assert_called()
        spawn.assert_called()

    def test_find_invalid_next_reviewable_campaign_assets_reserved_and_wrong_status(
        self,
    ):
        """
        Cache rows must be reported invalid both when their asset is reserved
        and when their asset's transcription was never submitted.
        """
        # Case 1: submitted transcription, but the asset is reserved.
        reserved_asset = create_asset(
            item=self.asset1.item, sequence=30, slug="rc-inv-res"
        )
        create_transcription(asset=reserved_asset, user=self.anon, submitted=now())
        AssetTranscriptionReservation.objects.create(
            asset=reserved_asset, reservation_token="rv"  # nosec
        )
        self._cache_campaign_row(reserved_asset)

        # Case 2: transcription created without `submitted` (the original
        # author's note labels the resulting asset status IN_PROGRESS).
        wrong_status_asset = create_asset(
            item=self.asset1.item, sequence=31, slug="rc-inv-wrong"
        )
        create_transcription(asset=wrong_status_asset, user=self.anon)
        self._cache_campaign_row(wrong_status_asset)

        invalid = list(
            find_invalid_next_reviewable_campaign_assets(self.campaign.id).values_list(
                "asset_id", flat=True
            )
        )
        self.assertIn(reserved_asset.id, invalid)
        self.assertIn(wrong_status_asset.id, invalid)

    def _cache_campaign_row(self, asset):
        """Create a NextReviewableCampaignAsset row for `asset` with no transcribers."""
        return NextReviewableCampaignAsset.objects.create(
            asset=asset,
            campaign=self.campaign,
            item=asset.item,
            item_item_id=asset.item.item_id,
            project=asset.item.project,
            project_slug=asset.item.project.slug,
            sequence=asset.sequence,
            transcriber_ids=[],
        )

    def test_item_short_circuit_internal_applies_after_and_skips_reserved(self):
        """
        All three assets in the item are submitted and asset2 is reserved;
        starting after asset1, the lookup should land on the third asset.
        """
        first, second = self.asset1, self.asset2
        third = create_asset(item=first.item, sequence=3, slug="rc-int-a3")
        for asset in (first, second, third):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        AssetTranscriptionReservation.objects.create(
            asset=second, reservation_token="rv-int"  # nosec
        )

        found = _find_reviewable_in_item(
            self.campaign,
            self.user,
            item_id=first.item.item_id,
            after_asset_pk=first.id,
        )
        self.assertEqual(found, third)

    def test_item_short_circuit_internal_excludes_users_own_work(self):
        """asset1 is the user's own submission, so asset2 (anon) is expected."""
        own_asset, anon_asset = self.asset1, self.asset2
        create_transcription(asset=own_asset, user=self.user, submitted=now())
        create_transcription(asset=anon_asset, user=self.anon, submitted=now())

        found = _find_reviewable_in_item(
            self.campaign,
            self.user,
            item_id=own_asset.item.item_id,
            after_asset_pk=None,
        )
        self.assertEqual(found, anon_asset)

    def test_project_short_circuit_internal_skips_reserved_first(self):
        """
        A second item has two submitted assets and the lower-sequence one is
        reserved; the project lookup should return the other one.
        """
        project = self.asset1.item.project
        second_item = create_item(project=project, item_id="rc-proj-int")
        reserved = create_asset(item=second_item, sequence=1, slug="rc-proj-int-1")
        available = create_asset(item=second_item, sequence=2, slug="rc-proj-int-2")
        for asset in (reserved, available):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        AssetTranscriptionReservation.objects.create(
            asset=reserved, reservation_token="rv-proj-int"  # nosec
        )

        found = _find_reviewable_in_project(
            self.campaign,
            self.user,
            project_slug=project.slug,
            after_asset_pk=self.asset1.id,
        )
        self.assertEqual(found, available)

    def test_order_potential_without_after_prefers_item_then_project(self):
        """
        Same three-way setup as the ordering test (same item, same project,
        other project) but with asset_pk=None; the same-item candidate is
        expected first and the same-project candidate second.
        """
        anchor_item = self.asset1.item

        in_item = create_asset(item=anchor_item, sequence=9, slug="rc-ci-none")

        sibling_item = create_item(project=anchor_item.project, item_id="rc-it-np")
        in_project = create_asset(item=sibling_item, sequence=2, slug="rc-p-none")

        second_project = create_project(
            campaign=self.campaign, slug="rc-proj-none", title="rc-proj-none"
        )
        second_project_item = create_item(
            project=second_project, item_id="rc-it-op-none"
        )
        elsewhere = create_asset(
            item=second_project_item, sequence=1, slug="rc-op-none"
        )

        candidates = (in_item, in_project, elsewhere)
        for asset in candidates:
            create_transcription(asset=asset, user=self.anon, submitted=now())

        # One cache row per candidate, in the same order they were created.
        for asset in candidates:
            NextReviewableCampaignAsset.objects.create(
                asset=asset,
                campaign=self.campaign,
                item=asset.item,
                item_item_id=asset.item.item_id,
                project=asset.item.project,
                project_slug=asset.item.project.slug,
                sequence=asset.sequence,
                transcriber_ids=[],
            )

        # asset_pk=None: per the original author's note this makes next_asset 0.
        ranked = find_and_order_potential_reviewable_campaign_assets(
            self.campaign,
            self.user,
            project_slug=anchor_item.project.slug,
            item_id=anchor_item.item_id,
            asset_pk=None,
        )
        ranked_ids = list(ranked.values_list("asset_id", flat=True))

        self.assertEqual(ranked_ids[0], in_item.id)
        self.assertEqual(ranked_ids[1], in_project.id)
        self.assertIn(elsewhere.id, ranked_ids[2:])

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_next_reviewable_manual_fallback_no_after_spawns_and_picks_lowest_seq(
        self, mock_get_task
    ):
        """
        No cache rows and no original asset: with asset1 and asset2 both
        submitted by anon, asset1 is expected and delay() should be called.
        """
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        first, second = self.asset1, self.asset2
        for asset in (first, second):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        # original_asset_id=None: the original author's note says this triggers
        # the Value(0) annotation branch.
        result = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id=None,
        )

        self.assertEqual(result, first)
        mock_get_task.assert_called()
        spawn.assert_called()

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_next_reviewable_manual_fallback_invalid_after_str(self, mock_get_task):
        """
        A non-numeric original_asset_id ("not-an-int") must not break the
        lookup: asset1 is expected and delay() should be called.
        """
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        first, second = self.asset1, self.asset2
        for asset in (first, second):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        result = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id="not-an-int",
        )

        self.assertEqual(result, first)
        mock_get_task.assert_called()
        spawn.assert_called()

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_next_reviewable_cached_path_when_short_circuits_fail(self, mock_get_task):
        """
        Both assets in the current item carry only the user's own submissions,
        and a cache row points at an asset in another project. The cached asset
        is expected back, with no get_registered_task or delay() call.
        """
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        for own_asset in (self.asset1, self.asset2):
            create_transcription(asset=own_asset, user=self.user, submitted=now())

        # The cached candidate sits in a separate project of the same campaign.
        other_project = create_project(
            campaign=self.campaign, slug="rc-cached-proj", title="rc-cached-proj"
        )
        other_item = create_item(project=other_project, item_id="rc-cached-item")
        cached = create_asset(item=other_item, slug="rc-cached-asset")
        create_transcription(asset=cached, user=self.anon, submitted=now())

        NextReviewableCampaignAsset.objects.create(
            asset=cached,
            campaign=self.campaign,
            item=cached.item,
            item_item_id=cached.item.item_id,
            project=cached.item.project,
            project_slug=cached.item.project.slug,
            sequence=cached.sequence,
            transcriber_ids=[],
        )

        current_item = self.asset1.item
        result = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug=current_item.project.slug,
            item_id=current_item.item_id,
            original_asset_id=self.asset1.id,
        )

        self.assertEqual(result, cached)
        mock_get_task.assert_not_called()
        spawn.assert_not_called()

    @patch("concordia.utils.next_asset.reviewable.campaign.get_registered_task")
    def test_next_reviewable_uses_cache_when_bypassing_short_circuits(
        self, mock_get_task
    ):
        """
        Blank project/item arguments are passed and one cache row exists; the
        cached asset is expected back, with no get_registered_task or delay()
        call.
        """
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        other_project = create_project(
            campaign=self.campaign,
            slug="rc-cached-proj-2",
            title="rc-cached-proj-2",
        )
        other_item = create_item(project=other_project, item_id="rc-cached-item-2")
        cached = create_asset(item=other_item, slug="rc-cached-asset-2")
        create_transcription(asset=cached, user=self.anon, submitted=now())

        NextReviewableCampaignAsset.objects.create(
            asset=cached,
            campaign=self.campaign,
            item=cached.item,
            item_item_id=cached.item.item_id,
            project=cached.item.project,
            project_slug=cached.item.project.slug,
            sequence=cached.sequence,
            transcriber_ids=[],
        )

        result = find_next_reviewable_campaign_asset(
            self.campaign,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id=None,
        )

        self.assertEqual(result, cached)
        mock_get_task.assert_not_called()
        spawn.assert_not_called()


================================================
FILE: concordia/tests/test_utils_next_asset_reviewable_topic.py
================================================
from unittest.mock import MagicMock, patch

from django.test import TestCase
from django.utils.timezone import now

from concordia.models import (
    AssetTranscriptionReservation,
    NextReviewableTopicAsset,
)
from concordia.utils import get_anonymous_user
from concordia.utils.next_asset import (
    find_new_reviewable_topic_assets,
    find_next_reviewable_topic_asset,
    find_reviewable_topic_asset,
)
from concordia.utils.next_asset.reviewable.topic import (
    _eligible_reviewable_base_qs as topic_eligible_reviewable_base_qs,
)
from concordia.utils.next_asset.reviewable.topic import (
    _find_reviewable_in_item as topic_find_reviewable_in_item,
)
from concordia.utils.next_asset.reviewable.topic import (
    _find_reviewable_in_project as topic_find_reviewable_in_project,
)
from concordia.utils.next_asset.reviewable.topic import (
    _next_seq_after as topic_next_seq_after,
)
from concordia.utils.next_asset.reviewable.topic import (
    _reserved_asset_ids_subq as topic_reserved_asset_ids_subq,
)
from concordia.utils.next_asset.reviewable.topic import (
    find_and_order_potential_reviewable_topic_assets,
    find_invalid_next_reviewable_topic_assets,
)
from concordia.utils.next_asset.reviewable.topic import (
    find_next_reviewable_topic_assets as find_cached_reviewable_topic_assets,
)

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_topic,
    create_transcription,
)


class NextReviewableTopicAssetTests(CreateTestUsers, TestCase):
    def setUp(self):
        """Create a user, two assets in one item, and a topic via create_topic."""
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        first = create_asset(sequence=1)
        second = create_asset(item=first.item, sequence=2, slug="test-asset-2")
        self.asset1, self.asset2 = first, second
        # The topic is created with the project both assets belong to.
        self.topic = create_topic(project=first.item.project)

    def test_find_new_reviewable_topic_assets_filters_correctly(self):
        """An asset submitted by anon shows up as a new candidate for the user."""
        submitted_asset = self.asset1
        create_transcription(asset=submitted_asset, user=self.anon, submitted=now())

        candidates = find_new_reviewable_topic_assets(self.topic, self.user)
        self.assertIn(submitted_asset, candidates)

    def test_find_new_reviewable_topic_assets_without_user(self):
        """Passing None as the user still lists the anon-submitted asset."""
        submitted_asset = self.asset1
        create_transcription(asset=submitted_asset, user=self.anon, submitted=now())

        candidates = find_new_reviewable_topic_assets(self.topic, None)
        self.assertIn(submitted_asset, candidates)

    def test_find_reviewable_topic_asset_from_next_table(self):
        """A cache row for asset1 exists, so asset1 is expected for the topic."""
        cached = self.asset1
        create_transcription(asset=cached, user=self.anon, submitted=now())

        NextReviewableTopicAsset.objects.create(
            asset=cached,
            topic=self.topic,
            item=cached.item,
            item_item_id=cached.item.item_id,
            project=cached.item.project,
            project_slug=cached.item.project.slug,
            sequence=cached.sequence,
            transcriber_ids=[],
        )

        result = find_reviewable_topic_asset(self.topic, self.user)
        self.assertEqual(result, cached)

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_find_reviewable_topic_asset_falls_back_and_spawns_task(
        self, mock_get_task
    ):
        """
        No cache rows exist; asset2 (submitted by anon) is expected and
        delay() should have been called.
        """
        create_transcription(asset=self.asset2, user=self.anon, submitted=now())
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        result = find_reviewable_topic_asset(self.topic, self.user)

        self.assertEqual(result, self.asset2)
        mock_get_task.assert_called()
        spawn.assert_called()

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_find_next_reviewable_topic_asset_orders_and_falls_back(
        self, mock_get_task
    ):
        """
        Only asset1 is submitted and it is also passed as the original asset.
        asset1 is expected back with no get_registered_task or delay() call.
        """
        origin = self.asset1
        create_transcription(asset=origin, user=self.anon, submitted=now())
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        result = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug=origin.item.project.slug,
            item_id=origin.item.item_id,
            original_asset_id=origin.id,
        )

        self.assertEqual(result, origin)
        # Nothing should have been looked up or queued.
        mock_get_task.assert_not_called()
        spawn.assert_not_called()

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_find_next_reviewable_topic_asset_when_next_asset_exists(
        self, mock_get_task
    ):
        """
        asset2 is submitted by anon and has a cache row; starting from asset1,
        asset2 must be returned without looking up or queueing any task.
        """
        create_transcription(asset=self.asset2, user=self.anon, submitted=now())
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        NextReviewableTopicAsset.objects.create(
            asset=self.asset2,
            topic=self.topic,
            item=self.asset2.item,
            item_item_id=self.asset2.item.item_id,
            project=self.asset2.item.project,
            project_slug=self.asset2.item.project.slug,
            sequence=self.asset2.sequence,
            transcriber_ids=[],
        )

        asset = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug=self.asset2.item.project.slug,
            item_id=self.asset2.item.item_id,
            # Name the preceding asset explicitly rather than assuming that
            # primary keys are consecutive (asset2.id - 1).
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(asset, self.asset2)
        self.assertFalse(mock_get_task.called)
        self.assertFalse(mock_task.delay.called)

    def test_short_circuit_same_item_topic_excludes_users_own_work(self):
        """asset1 is the user's own submission, so asset2 (anon) is expected."""
        own_asset, anon_asset = self.asset1, self.asset2
        create_transcription(asset=own_asset, user=self.user, submitted=now())
        create_transcription(asset=anon_asset, user=self.anon, submitted=now())

        result = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug=own_asset.item.project.slug,
            item_id=own_asset.item.item_id,
            original_asset_id=own_asset.id,
        )
        self.assertEqual(result, anon_asset)

    def test_item_short_circuit_topic_reviewable_respects_after_and_reservations(self):
        """
        With three submitted assets in the item and asset1 as the original,
        asset2 is expected first; once asset2 is reserved the same call is
        expected to return the third asset.
        """
        item = self.asset1.item
        third = create_asset(item=item, sequence=3, slug="rev-topic-a3")
        for asset in (self.asset1, self.asset2, third):
            create_transcription(asset=asset, user=self.anon, submitted=now())

        def next_after_first():
            # Identical arguments are used before and after the reservation.
            return find_next_reviewable_topic_asset(
                self.topic,
                self.user,
                project_slug=item.project.slug,
                item_id=item.item_id,
                original_asset_id=self.asset1.id,
            )

        self.assertEqual(next_after_first(), self.asset2)

        AssetTranscriptionReservation.objects.create(
            asset=self.asset2, reservation_token="rv"  # nosec
        )
        self.assertEqual(next_after_first(), third)

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_cache_excludes_user_and_triggers_spawn_task_topic(self, mock_get_task):
        """
        The only cache row lists the user in transcriber_ids; a different
        anon-submitted asset is expected and delay() should have been called.
        """
        spawn = MagicMock()
        mock_get_task.return_value.delay = spawn

        cached = self.asset1
        create_transcription(asset=cached, user=self.user, submitted=now())
        NextReviewableTopicAsset.objects.create(
            asset=cached,
            topic=self.topic,
            item=cached.item,
            item_item_id=cached.item.item_id,
            project=cached.item.project,
            project_slug=cached.item.project.slug,
            sequence=cached.sequence,
            transcriber_ids=[self.user.id],
        )

        # A third asset in the same item, submitted by the anonymous user.
        fallback = create_asset(item=cached.item, sequence=3, slug="rev-topic-other")
        create_transcription(asset=fallback, user=self.anon, submitted=now())

        result = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id=None,
        )

        self.assertEqual(result, fallback)
        mock_get_task.assert_called()
        spawn.assert_called()

    def test_find_next_reviewable_topic_assets_excludes_user(self):
        """
        Of two cache rows, the one listing the user in transcriber_ids must be
        absent from the cached lookup and the other one present.
        """
        create_transcription(asset=self.asset1, user=self.user, submitted=now())

        # (asset, transcriber_ids) for each cache row, in creation order.
        rows = ((self.asset1, [self.user.id]), (self.asset2, []))
        for asset, transcribers in rows:
            NextReviewableTopicAsset.objects.create(
                asset=asset,
                topic=self.topic,
                item=asset.item,
                item_item_id=asset.item.item_id,
                project=asset.item.project,
                project_slug=asset.item.project.slug,
                sequence=asset.sequence,
                transcriber_ids=transcribers,
            )

        cached = find_cached_reviewable_topic_assets(self.topic, self.user)
        self.assertNotIn(self.asset1.id, cached.values_list("asset_id", flat=True))
        self.assertIn(self.asset2.id, cached.values_list("asset_id", flat=True))

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_next_reviewable_cached_path_when_short_circuits_fail_topic(
        self, mock_get_task
    ):
        """
        All submitted work in the current item/project belongs to the
        requesting user, so the item and project short-circuits have nothing
        to offer. The expected result is the cached asset from another
        project, and no task should be spawned.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        # Everything submitted in the current item was written by the user
        for own_asset in (self.asset1, self.asset2):
            create_transcription(asset=own_asset, user=self.user, submitted=now())

        # Eligible asset in a different project; only the cache can surface it
        far_project = create_project(
            campaign=self.asset1.campaign,
            slug="topic-cached-proj",
            title="topic-cached-proj",
        )
        far_item = create_item(project=far_project, item_id="topic-cached-item")
        far_asset = create_asset(item=far_item, slug="topic-cached-asset")
        create_transcription(asset=far_asset, user=self.anon, submitted=now())

        row_item = far_asset.item
        row_project = row_item.project
        NextReviewableTopicAsset.objects.create(
            asset=far_asset,
            topic=self.topic,
            item=row_item,
            item_item_id=row_item.item_id,
            project=row_project,
            project_slug=row_project.slug,
            sequence=far_asset.sequence,
            transcriber_ids=[],
        )

        origin_item = self.asset1.item
        result = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug=origin_item.project.slug,
            item_id=origin_item.item_id,
            original_asset_id=self.asset1.id,
        )

        self.assertEqual(result, far_asset)
        self.assertFalse(mock_get_task.called)
        self.assertFalse(delay_mock.called)

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_next_reviewable_uses_cache_when_bypassing_short_circuits_topic(
        self, mock_get_task
    ):
        """
        With blank project/item arguments the short-circuits are bypassed, so
        the cached row is expected to be returned without spawning a task.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        far_project = create_project(
            campaign=self.asset1.campaign,
            slug="topic-cached-proj-2",
            title="topic-cached-proj-2",
        )
        far_item = create_item(project=far_project, item_id="topic-cached-item-2")
        far_asset = create_asset(item=far_item, slug="topic-cached-asset-2")
        create_transcription(asset=far_asset, user=self.anon, submitted=now())

        row_item = far_asset.item
        row_project = row_item.project
        NextReviewableTopicAsset.objects.create(
            asset=far_asset,
            topic=self.topic,
            item=row_item,
            item_item_id=row_item.item_id,
            project=row_project,
            project_slug=row_project.slug,
            sequence=far_asset.sequence,
            transcriber_ids=[],
        )

        result = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id=None,
        )

        self.assertEqual(result, far_asset)
        self.assertFalse(mock_get_task.called)
        self.assertFalse(delay_mock.called)

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_next_reviewable_manual_fallback_no_after_spawns_and_picks_lowest_seq_topic(
        self, mock_get_task
    ):
        """
        Nothing is cached and no "after" asset is given: the lower-sequence of
        two submitted assets is expected, and the task should be spawned.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        fallback_item = create_item(
            project=self.asset1.item.project, item_id="t-mf-item"
        )
        lower = create_asset(item=fallback_item, sequence=7, slug="t-mf-x")
        higher = create_asset(item=fallback_item, sequence=8, slug="t-mf-y")
        for candidate in (lower, higher):
            create_transcription(asset=candidate, user=self.anon, submitted=now())

        result = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id=None,
        )

        self.assertEqual(result, lower)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(delay_mock.called)

    @patch("concordia.utils.next_asset.reviewable.topic.get_registered_task")
    def test_next_reviewable_manual_fallback_invalid_after_str_topic(
        self, mock_get_task
    ):
        """
        A non-integer string passed as ``original_asset_id`` must not break the
        lookup: the lowest-sequence submitted asset is expected and the task
        should be spawned.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        fallback_item = create_item(
            project=self.asset1.item.project, item_id="t-mf-item-2"
        )
        lower = create_asset(item=fallback_item, sequence=1, slug="t-mf-a")
        higher = create_asset(item=fallback_item, sequence=2, slug="t-mf-b")
        for candidate in (lower, higher):
            create_transcription(asset=candidate, user=self.anon, submitted=now())

        result = find_next_reviewable_topic_asset(
            self.topic,
            self.user,
            project_slug="",
            item_id="",
            original_asset_id="not-an-int",
        )

        self.assertEqual(result, lower)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(delay_mock.called)


class ReviewableTopicInternalsTests(CreateTestUsers, TestCase):
    """
    Tests aimed at the helper functions behind the reviewable-topic next-asset
    lookup (reservation subquery, eligibility base queryset, item/project
    short-circuits, cache ordering and cache invalidation).
    """

    def setUp(self):
        """Create the users, two assets in a single item, and a topic."""
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        self.asset1 = create_asset(sequence=1, slug="rt-a1")
        self.asset2 = create_asset(item=self.asset1.item, sequence=2, slug="rt-a2")
        self.topic = create_topic(project=self.asset1.item.project)

    # ------------------------------------------------------------------
    # Private fixtures shared by the tests below
    # ------------------------------------------------------------------

    def _submit_transcriptions(self, user, *assets):
        """Create one submitted transcription by ``user`` per asset, in order."""
        for asset in assets:
            create_transcription(asset=asset, user=user, submitted=now())

    def _add_cache_row(self, asset):
        """Insert a cache row for ``asset`` under ``self.topic``, no transcribers."""
        item = asset.item
        project = item.project
        return NextReviewableTopicAsset.objects.create(
            asset=asset,
            topic=self.topic,
            item=item,
            item_item_id=item.item_id,
            project=project,
            project_slug=project.slug,
            sequence=asset.sequence,
            transcriber_ids=[],
        )

    def _pick_in_first_item(self, after_asset_pk):
        """Run the item-level lookup against the item that holds ``asset1``."""
        return topic_find_reviewable_in_item(
            self.topic,
            self.user,
            item_id=self.asset1.item.item_id,
            after_asset_pk=after_asset_pk,
        )

    def _pick_in_project_after_first(self, project_slug):
        """Run the project-level lookup with ``asset1`` as the "after" asset."""
        return topic_find_reviewable_in_project(
            self.topic,
            self.user,
            project_slug=project_slug,
            after_asset_pk=self.asset1.id,
        )

    # ------------------------------------------------------------------
    # Reservation subquery / eligibility / sequence helpers
    # ------------------------------------------------------------------

    def test_topic_reserved_asset_ids_subq_unfiltered(self):
        """Reservations from any campaign/project show up in the subquery."""
        # Reservation on an asset that belongs to this test's topic project
        AssetTranscriptionReservation.objects.create(
            asset=self.asset1,
            reservation_token="rt-r1",  # nosec
        )
        # Reservation on an asset in an unrelated campaign and project
        foreign_campaign = create_campaign(slug="rt-camp-x", title="rt-camp-x")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="rt-proj-x", title="rt-proj-x"
        )
        foreign_item = create_item(project=foreign_project, item_id="rt-item-x")
        foreign_asset = create_asset(item=foreign_item, slug="rt-asset-x")
        AssetTranscriptionReservation.objects.create(
            asset=foreign_asset,
            reservation_token="rt-r2",  # nosec
        )

        reserved_ids = set(
            topic_reserved_asset_ids_subq().values_list("asset_id", flat=True)
        )
        for expected in (self.asset1, foreign_asset):
            self.assertIn(expected.id, reserved_ids)

    def test_topic_eligible_reviewable_base_qs_excludes_user_and_requires_submitted(
        self,
    ):
        """
        With a user, that user's own submission is filtered out; with
        ``user=None`` it is kept. An asset without any transcription is never
        included.
        """
        self._submit_transcriptions(self.anon, self.asset1)
        self._submit_transcriptions(self.user, self.asset2)
        # Never transcribed, so it cannot count as submitted
        untouched = create_asset(item=self.asset1.item, sequence=3, slug="rt-a3")

        for_user = topic_eligible_reviewable_base_qs(self.topic, user=self.user)
        self.assertIn(self.asset1, for_user)
        self.assertNotIn(self.asset2, for_user)
        self.assertNotIn(untouched, for_user)

        for_nobody = topic_eligible_reviewable_base_qs(self.topic, user=None)
        self.assertIn(self.asset1, for_nobody)
        self.assertIn(self.asset2, for_nobody)
        self.assertNotIn(untouched, for_nobody)

    def test_topic_next_seq_after_none_missing_and_valid(self):
        """``None`` and an unknown pk give ``None``; a real pk gives its sequence."""
        for absent in (None, 987654321):
            self.assertIsNone(topic_next_seq_after(absent))
        self.assertEqual(topic_next_seq_after(self.asset2.pk), self.asset2.sequence)

    # ------------------------------------------------------------------
    # Item-level short-circuit
    # ------------------------------------------------------------------

    def test_topic_find_reviewable_in_item_after_none_returns_first(self):
        """Without an "after" asset the first asset of the item is returned."""
        self._submit_transcriptions(self.anon, self.asset1, self.asset2)

        self.assertEqual(self._pick_in_first_item(None), self.asset1)

    def test_topic_find_reviewable_in_item_after_asset_in_other_item_ignores_gate(
        self,
    ):
        """An "after" asset from a different item does not gate the result."""
        self._submit_transcriptions(self.anon, self.asset1, self.asset2)

        sibling_item = create_item(
            project=self.asset1.item.project, item_id="rt-other-item"
        )
        sibling_asset = create_asset(item=sibling_item, slug="rt-other-asset")
        self._submit_transcriptions(self.anon, sibling_asset)

        self.assertEqual(self._pick_in_first_item(sibling_asset.id), self.asset1)

    def test_topic_find_reviewable_in_item_after_asset_missing_ignores_gate(self):
        """An "after" pk that matches no asset does not gate the result."""
        self._submit_transcriptions(self.anon, self.asset1, self.asset2)

        self.assertEqual(self._pick_in_first_item(123456789), self.asset1)

    def test_topic_find_reviewable_in_item_after_asset_sidc_ignores_gate(self):
        """
        An "after" asset whose item shares the ``item_id`` but lives in another
        campaign/project does not gate the result.
        """
        self._submit_transcriptions(self.anon, self.asset1, self.asset2)

        foreign_campaign = create_campaign(slug="rt-camp-b", title="rt-camp-b")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="rt-proj-b", title="rt-proj-b"
        )
        # Deliberately reuses the item_id of the item under test
        twin_item = create_item(
            project=foreign_project, item_id=self.asset1.item.item_id
        )
        twin_asset = create_asset(item=twin_item, slug="rt-cross")
        self._submit_transcriptions(self.anon, twin_asset)

        self.assertEqual(self._pick_in_first_item(twin_asset.id), self.asset1)

    # ------------------------------------------------------------------
    # Project-level short-circuit
    # ------------------------------------------------------------------

    def test_topic_find_reviewable_in_project_orders_and_excludes_user(self):
        """The user's own submission is skipped in favour of someone else's."""
        project = self.asset1.item.project
        extra_item = create_item(project=project, item_id="rt-p-item")
        own = create_asset(item=extra_item, sequence=1, slug="rt-p-mine")
        foreign = create_asset(item=extra_item, sequence=2, slug="rt-p-theirs")
        self._submit_transcriptions(self.user, own)
        self._submit_transcriptions(self.anon, foreign)

        self.assertEqual(self._pick_in_project_after_first(project.slug), foreign)

    def test_topic_find_reviewable_in_project_returns_none_when_only_users_work(self):
        """If the only submission is the user's own, the lookup yields ``None``."""
        project = self.asset1.item.project
        extra_item = create_item(project=project, item_id="rt-p2")
        own = create_asset(item=extra_item, sequence=1, slug="rt-p2-mine")
        self._submit_transcriptions(self.user, own)

        self.assertIsNone(self._pick_in_project_after_first(project.slug))

    # ------------------------------------------------------------------
    # Cache ordering
    # ------------------------------------------------------------------

    def test_find_and_order_potential_reviewable_topic_assets_ordering(self):
        """
        With an "after" asset: same-item row first, same-project row second,
        other-project row somewhere after those.
        """
        origin_item = self.asset1.item

        in_same_item = create_asset(item=origin_item, sequence=10, slug="rt-ci-next")
        project_sibling_item = create_item(
            project=origin_item.project, item_id="rt-it-2"
        )
        in_same_project = create_asset(
            item=project_sibling_item,
            sequence=5,
            slug="rt-p-next",
        )
        far_project = create_project(
            campaign=self.asset1.campaign, slug="rt-proj", title="rt-proj"
        )
        far_item = create_item(project=far_project, item_id="rt-it-3")
        in_other_project = create_asset(item=far_item, sequence=1, slug="rt-op")

        for candidate in (in_same_item, in_same_project, in_other_project):
            self._submit_transcriptions(self.anon, candidate)
            self._add_cache_row(candidate)

        ranked_ids = list(
            find_and_order_potential_reviewable_topic_assets(
                self.topic,
                self.user,
                project_slug=origin_item.project.slug,
                item_id=origin_item.item_id,
                asset_pk=self.asset1.id,
            ).values_list("asset_id", flat=True)
        )

        self.assertEqual(ranked_ids[0], in_same_item.id)
        self.assertEqual(ranked_ids[1], in_same_project.id)
        self.assertIn(in_other_project.id, ranked_ids[2:])

    def test_order_potential_without_after_prefers_item_then_project_topic(self):
        """
        Without an "after" asset the same item/project/other ranking is still
        expected.
        """
        origin_item = self.asset1.item

        in_same_item = create_asset(item=origin_item, sequence=9, slug="rt-ci-none")
        project_sibling_item = create_item(
            project=origin_item.project, item_id="rt-it-np"
        )
        in_same_project = create_asset(
            item=project_sibling_item,
            sequence=2,
            slug="rt-p-none",
        )
        far_project = create_project(
            campaign=self.asset1.campaign, slug="rt-proj-none", title="rt-proj-none"
        )
        far_item = create_item(project=far_project, item_id="rt-it-op-none")
        in_other_project = create_asset(item=far_item, sequence=1, slug="rt-op-none")

        for candidate in (in_same_item, in_same_project, in_other_project):
            self._submit_transcriptions(self.anon, candidate)
            self._add_cache_row(candidate)

        ranked_ids = list(
            find_and_order_potential_reviewable_topic_assets(
                self.topic,
                self.user,
                project_slug=origin_item.project.slug,
                item_id=origin_item.item_id,
                asset_pk=None,  # next_asset==0 branch
            ).values_list("asset_id", flat=True)
        )

        self.assertEqual(ranked_ids[0], in_same_item.id)
        self.assertEqual(ranked_ids[1], in_same_project.id)
        self.assertIn(in_other_project.id, ranked_ids[2:])

    # ------------------------------------------------------------------
    # Cache invalidation
    # ------------------------------------------------------------------

    def test_find_invalid_next_reviewable_topic_assets_reserved_and_wrong_status(
        self,
    ):
        """Cached rows for a reserved asset and for a non-submitted asset are invalid."""
        # Case 1: submitted but currently reserved
        held = create_asset(item=self.asset1.item, sequence=30, slug="rt-inv-res")
        self._submit_transcriptions(self.anon, held)
        AssetTranscriptionReservation.objects.create(
            asset=held, reservation_token="rt-rv"  # nosec
        )
        self._add_cache_row(held)

        # Case 2: transcription exists but was never submitted (IN_PROGRESS)
        unsubmitted = create_asset(
            item=self.asset1.item, sequence=31, slug="rt-inv-wrong"
        )
        create_transcription(asset=unsubmitted, user=self.anon)
        self._add_cache_row(unsubmitted)

        flagged_ids = list(
            find_invalid_next_reviewable_topic_assets(self.topic.id).values_list(
                "asset_id", flat=True
            )
        )
        for expected in (held, unsubmitted):
            self.assertIn(expected.id, flagged_ids)

    # ------------------------------------------------------------------
    # Short-circuits combined with reservations / own work
    # ------------------------------------------------------------------

    def test_topic_project_short_circuit_internal_skips_reserved_first(self):
        """A reserved first asset is passed over for the next one in the project."""
        project = self.asset1.item.project
        extra_item = create_item(project=project, item_id="rt-proj-int")
        leading = create_asset(item=extra_item, sequence=1, slug="rt-proj-int-1")
        trailing = create_asset(item=extra_item, sequence=2, slug="rt-proj-int-2")
        self._submit_transcriptions(self.anon, leading, trailing)
        AssetTranscriptionReservation.objects.create(
            asset=leading, reservation_token="rt-proj-int"  # nosec
        )

        self.assertEqual(self._pick_in_project_after_first(project.slug), trailing)

    def test_topic_item_short_circuit_internal_excludes_users_own_work(self):
        """Within an item, the user's own submission is skipped."""
        own, foreign = self.asset1, self.asset2
        self._submit_transcriptions(self.user, own)
        self._submit_transcriptions(self.anon, foreign)

        self.assertEqual(self._pick_in_first_item(None), foreign)

    def test_topic_item_short_circuit_internal_applies_after_and_skips_reserved(self):
        """After ``asset1``, the reserved ``asset2`` is skipped and the third wins."""
        third = create_asset(item=self.asset1.item, sequence=3, slug="rt-int-a3")
        self._submit_transcriptions(self.anon, self.asset1, self.asset2, third)
        AssetTranscriptionReservation.objects.create(
            asset=self.asset2, reservation_token="rt-int-rv"  # nosec
        )

        self.assertEqual(self._pick_in_first_item(self.asset1.id), third)


================================================
FILE: concordia/tests/test_utils_next_asset_transcribable_campaign.py
================================================
from unittest.mock import MagicMock, patch

from django.test import TestCase
from django.utils.timezone import now

from concordia.models import (
    Asset,
    AssetTranscriptionReservation,
    NextTranscribableCampaignAsset,
    TranscriptionStatus,
)
from concordia.utils import get_anonymous_user
from concordia.utils.next_asset import (
    find_new_transcribable_campaign_assets,
    find_next_transcribable_campaign_asset,
    find_transcribable_campaign_asset,
)
from concordia.utils.next_asset.transcribable.campaign import (
    _eligible_transcribable_base_qs as tc_eligible_base_qs,
)
from concordia.utils.next_asset.transcribable.campaign import (
    _find_transcribable_in_item as tc_find_in_item,
)
from concordia.utils.next_asset.transcribable.campaign import (
    _find_transcribable_not_started_in_project as tc_find_ns_in_proj,
)
from concordia.utils.next_asset.transcribable.campaign import (
    _next_seq_after as tc_next_seq_after,
)
from concordia.utils.next_asset.transcribable.campaign import (
    _order_unstarted_first as tc_order_unstarted_first,
)
from concordia.utils.next_asset.transcribable.campaign import (
    _reserved_asset_ids_subq as tc_reserved_ids_subq,
)
from concordia.utils.next_asset.transcribable.campaign import (
    find_and_order_potential_transcribable_campaign_assets,
    find_invalid_next_transcribable_campaign_assets,
)
from concordia.utils.next_asset.transcribable.campaign import (
    find_next_transcribable_campaign_assets as find_cached_transcribable_assets,
)

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_transcription,
)


class NextTranscribableCampaignAssetTests(CreateTestUsers, TestCase):
    def setUp(self):
        """Create the users, two sequential assets in one item, and keep the campaign."""
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()

        first = create_asset(sequence=1, slug="test-asset-1", title="Test Asset 1")
        second = create_asset(
            item=first.item, sequence=2, slug="test-asset-2", title="Test Asset 2"
        )
        self.asset1 = first
        self.asset2 = second
        self.campaign = first.campaign

    def test_find_new_transcribable_campaign_assets_filters_correctly(self):
        """A submitted asset is filtered out; an untouched one is kept."""
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())

        candidates = find_new_transcribable_campaign_assets(self.campaign)

        self.assertNotIn(self.asset1, candidates)
        self.assertIn(self.asset2, candidates)

    def test_find_transcribable_campaign_asset_from_next_table(self):
        """An asset present in the cache table is the one returned."""
        cached = self.asset1
        cached_item = cached.item
        cached_project = cached_item.project
        row_fields = {
            "asset": cached,
            "campaign": self.campaign,
            "item": cached_item,
            "item_item_id": cached_item.item_id,
            "project": cached_project,
            "project_slug": cached_project.slug,
            "sequence": cached.sequence,
            "transcription_status": TranscriptionStatus.NOT_STARTED,
        }
        NextTranscribableCampaignAsset.objects.create(**row_fields)

        self.assertEqual(find_transcribable_campaign_asset(self.campaign), cached)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_find_transcribable_campaign_asset_falls_back_and_spawns_task(
        self, mock_get_task
    ):
        """With nothing cached, ``asset1`` is expected and the task is spawned."""
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        result = find_transcribable_campaign_asset(self.campaign)

        self.assertEqual(result, self.asset1)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(delay_mock.called)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_find_next_transcribable_campaign_asset_orders_and_falls_back(
        self, mock_get_task
    ):
        """
        The item-level short-circuit is expected to supply the asset that
        follows ``asset1``, so no task should be spawned.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        origin = self.asset1
        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=origin.item.project.slug,
            item_id=origin.item.item_id,
            original_asset_id=origin.id,
        )

        self.assertEqual(result, self.asset2)
        # The short-circuit answered, so the cache fallback and task are not used
        self.assertFalse(mock_get_task.called)
        self.assertFalse(delay_mock.called)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_find_next_transcribable_campaign_asset_when_next_asset_exists(
        self, mock_get_task
    ):
        """
        With blank project/item arguments and ``asset2`` cached, the cached
        asset is expected and no task should be spawned.
        """
        cached = self.asset2
        # An unsubmitted transcription leaves asset2 IN_PROGRESS (still eligible)
        create_transcription(asset=cached, user=self.anon)

        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        # Put asset2 into the cache table
        cached_item = cached.item
        cached_project = cached_item.project
        NextTranscribableCampaignAsset.objects.create(
            asset=cached,
            campaign=self.campaign,
            item=cached_item,
            item_item_id=cached_item.item_id,
            project=cached_project,
            project_slug=cached_project.slug,
            sequence=cached.sequence,
            transcription_status=TranscriptionStatus.IN_PROGRESS,
        )

        # Blank slug/item id skip both short-circuits so the cache is consulted
        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug="",
            item_id="",
            original_asset_id=None,
        )

        self.assertEqual(result, cached)
        self.assertFalse(mock_get_task.called)
        self.assertFalse(delay_mock.called)

    def test_short_circuit_same_item_respects_after_sequence_and_reservations(self):
        """
        Item-level short-circuit expectations:
        - the asset with the next sequence after the original is chosen
        - a reserved asset is passed over
        """
        third = create_asset(
            item=self.asset1.item, sequence=3, slug="test-asset-3", title="Test Asset 3"
        )

        def next_after_first():
            # Same lookup both times; only the reservation state changes between calls
            return find_next_transcribable_campaign_asset(
                self.campaign,
                project_slug=self.asset1.item.project.slug,
                item_id=self.asset1.item.item_id,
                original_asset_id=self.asset1.id,
            )

        # No reservations yet: asset2 directly follows asset1
        self.assertEqual(next_after_first(), self.asset2)

        # With asset2 reserved the lookup should move on to the third asset
        AssetTranscriptionReservation.objects.create(
            asset=self.asset2, reservation_token="tkn"  # nosec
        )
        self.assertEqual(next_after_first(), third)

    def test_project_short_circuit_prefers_not_started_over_in_progress(self):
        """
        Once the current item has nothing eligible left, the project-level
        step is expected to:
        - choose NOT_STARTED ahead of IN_PROGRESS
        - order by (item_id, sequence) within the same status
        """
        # Submit both assets of the current item so it is exhausted
        for exhausted in (self.asset1, self.asset2):
            create_transcription(asset=exhausted, user=self.anon, submitted=now())

        sibling_item = create_item(
            project=self.asset1.item.project, item_id="proj-only-item"
        )
        started = create_asset(
            item=sibling_item, slug="proj-inprog", title="Proj InProg"
        )
        create_transcription(asset=started, user=self.anon)  # IN_PROGRESS

        untouched = create_asset(
            item=sibling_item, slug="proj-notstarted", title="Proj NotStarted"
        )

        origin = self.asset1
        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=origin.item.project.slug,
            item_id=origin.item.item_id,  # current item, already exhausted
            original_asset_id=origin.id,
        )

        self.assertEqual(result, untouched)

    def test_project_short_circuit_when_item_id_empty_string(self):
        """
        An empty ``item_id`` skips the item short-circuit, leaving the
        project-level step to find the asset.
        """
        sibling_item = create_item(project=self.asset1.item.project, item_id="proj2")
        expected = create_asset(
            item=sibling_item, slug="proj-asset", title="Proj Asset"
        )

        # Submit both assets of the current item so neither is eligible
        for exhausted in (self.asset1, self.asset2):
            create_transcription(asset=exhausted, user=self.anon, submitted=now())

        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=self.asset1.item.project.slug,
            item_id="",  # blank on purpose: no item short-circuit
            original_asset_id=self.asset1.id,
        )

        self.assertEqual(result, expected)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_find_transcribable_campaign_asset_none_spawns(self, mock_get_task):
        """
        If no NOT_STARTED/IN_PROGRESS asset remains, ``None`` is expected and
        the populate task should still be triggered.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        # Submit both assets so nothing transcribable is left
        for exhausted in (self.asset1, self.asset2):
            create_transcription(asset=exhausted, user=self.anon, submitted=now())

        result = find_transcribable_campaign_asset(self.campaign)

        self.assertIsNone(result)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(delay_mock.called)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_next_transcribable_manual_no_after_prefers_not_started(
        self, mock_get_task
    ):
        """
        No short-circuit applies and the cache is empty: the NOT_STARTED asset
        is expected even though the IN_PROGRESS one has the lower sequence,
        and the task should be spawned.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        fresh_campaign = create_campaign(slug="tc-na-camp", title="tc-na-camp")
        fresh_project = create_project(
            campaign=fresh_campaign, slug="tc-na-proj", title="tc-na-proj"
        )
        fresh_item = create_item(project=fresh_project, item_id="tc-na-item")

        untouched = create_asset(
            item=fresh_item, sequence=2, slug="tc-na-ns", title="TC NA NS"
        )
        started = create_asset(
            item=fresh_item, sequence=1, slug="tc-na-ip", title="TC NA IP"
        )
        create_transcription(asset=started, user=self.anon)  # IN_PROGRESS

        result = find_next_transcribable_campaign_asset(
            fresh_campaign, project_slug="", item_id="", original_asset_id=None
        )

        self.assertEqual(result, untouched)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(delay_mock.called)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_next_transcribable_manual_invalid_after_str(self, mock_get_task):
        """
        Treat a non-integer "after" like None: choose NOT_STARTED and spawn task.

        The lookup is called with a string that cannot be parsed as an asset
        pk. The expected outcome matches the no-"after" case: the NOT_STARTED
        asset is returned and the populate task is spawned.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Make existing setup assets ineligible for selection.
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())
        create_transcription(asset=self.asset2, user=self.anon, submitted=now())

        other_item = create_item(
            project=self.asset1.item.project, item_id="tc-mf-item-2"
        )
        asset_a = create_asset(
            item=other_item, sequence=1, slug="tc-mf-a", title="TC MF A"
        )
        asset_b = create_asset(
            item=other_item, sequence=2, slug="tc-mf-b", title="TC MF B"
        )
        create_transcription(asset=asset_b, user=self.anon)  # IN_PROGRESS

        # Pass a genuinely non-integer value so the invalid-"after" path is
        # exercised; passing None here would only repeat the no-"after" test.
        chosen = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug="",
            item_id="",
            original_asset_id="not-an-int",
        )
        self.assertEqual(chosen, asset_a)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_next_transcribable_none_anywhere_spawns(self, mock_get_task):
        """
        A campaign created here with no assets yields ``None``.

        Despite the test name, the assertions require that neither the task
        lookup nor ``delay`` is invoked.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        empty_campaign = create_campaign(slug="tc-none-camp", title="tc-none-camp")
        result = find_next_transcribable_campaign_asset(
            empty_campaign, project_slug="", item_id="", original_asset_id=None
        )

        self.assertIsNone(result)
        mock_get_task.assert_not_called()
        delay_mock.assert_not_called()

    def test_item_short_circuit_missing_after_pk_treated_as_none_top(self):
        """
        An ``original_asset_id`` that should match no Asset is ignored at item
        level, so the first fixture asset is expected back.
        """
        current_item = self.asset1.item
        absent_pk = 987_654_321  # presumed not to exist in the test database
        lookup = {
            "project_slug": current_item.project.slug,
            "item_id": current_item.item_id,
            "original_asset_id": absent_pk,
        }

        result = find_next_transcribable_campaign_asset(self.campaign, **lookup)

        # No usable "after" sequence, so the pick falls on asset1.
        self.assertEqual(result, self.asset1)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_cache_excludes_original_pk_and_chooses_next(self, mock_get_task):
        """
        Two cache rows exist; passing the first asset's id as the original
        should return the second asset without touching the task machinery.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        project = self.asset1.item.project
        extra_item = create_item(project=project, item_id="tc-cache-pk-item")
        first = create_asset(item=extra_item, sequence=1, slug="tc-cache-first")
        second = create_asset(item=extra_item, sequence=2, slug="tc-cache-second")

        # Cache both new assets as NOT_STARTED candidates, in creation order.
        for cached in (first, second):
            cached_item = cached.item
            cached_project = cached_item.project
            NextTranscribableCampaignAsset.objects.create(
                asset=cached,
                campaign=self.campaign,
                item=cached_item,
                item_item_id=cached_item.item_id,
                project=cached_project,
                project_slug=cached_project.slug,
                sequence=cached.sequence,
                transcription_status=TranscriptionStatus.NOT_STARTED,
            )

        result = find_next_transcribable_campaign_asset(
            self.campaign, project_slug="", item_id="", original_asset_id=first.id
        )

        self.assertEqual(result, second)
        mock_get_task.assert_not_called()
        delay_mock.assert_not_called()

    def test_project_short_circuit_without_original_id(self):
        """
        With both fixture assets submitted and ``original_asset_id=None``, the
        asset created in a sibling item of the same project is expected back.
        """
        # Exhaust the current item.
        for finished in (self.asset1, self.asset2):
            create_transcription(asset=finished, user=self.anon, submitted=now())

        current_item = self.asset1.item
        project = current_item.project
        sibling_item = create_item(project=project, item_id="tc-proj-no-orig")
        expected = create_asset(item=sibling_item, sequence=5, slug="tc-proj-pick")

        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=project.slug,
            item_id=current_item.item_id,
            original_asset_id=None,
        )

        self.assertEqual(result, expected)

    def test_item_short_circuit_after_pk_in_other_item_ignores_gate(self):
        """
        ``original_asset_id`` names a real asset that belongs to a different
        item; the first fixture asset of the requested item is still expected.
        """
        current_item = self.asset1.item
        project = current_item.project
        foreign_item = create_item(project=project, item_id="tc-oth-it-ignores-gate")
        foreign_asset = create_asset(item=foreign_item, slug="tc-oth-a-ignores-gate")

        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=project.slug,
            item_id=current_item.item_id,
            original_asset_id=foreign_asset.id,
        )

        # The foreign asset gives no "after" position inside the current item.
        self.assertEqual(result, self.asset1)

    def test_next_transcribable_after_pk_missing_treats_as_no_after(self):
        """
        An integer ``original_asset_id`` with no matching Asset must not gate
        the item-level pick; the first fixture asset is expected.
        """
        origin_item = self.asset1.item
        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=origin_item.project.slug,
            item_id=origin_item.item_id,
            original_asset_id=987654321,  # presumed absent from the test database
        )
        self.assertEqual(result, self.asset1)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_no_ns_anywhere_and_no_ip_in_item_returns_none(self, mock_get_task):
        """
        Both fixture assets are submitted, so the lookup is expected to return
        ``None`` and leave the mocked task lookup and ``delay`` uncalled.
        """
        # Exhaust the item used by the lookup below.
        for finished in (self.asset1, self.asset2):
            create_transcription(asset=finished, user=self.anon, submitted=now())

        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        origin_item = self.asset1.item
        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=origin_item.project.slug,
            item_id=origin_item.item_id,
            original_asset_id=self.asset1.id,
        )

        self.assertIsNone(result)
        mock_get_task.assert_not_called()
        delay_mock.assert_not_called()

    def test_after_pk_digit_string_missing_treats_as_no_after(self):
        """
        ``original_asset_id`` is given as a digit-only string that should match
        no Asset. The first fixture asset is expected, as if no "after" had
        been supplied. This is a separate case from a non-digit string.
        """
        origin_item = self.asset1.item
        lookup = {
            "project_slug": origin_item.project.slug,
            "item_id": origin_item.item_id,
            "original_asset_id": "987654321",  # digit string, no such Asset
        }
        result = find_next_transcribable_campaign_asset(self.campaign, **lookup)
        self.assertEqual(result, self.asset1)

    def test_same_item_inprogress_selected_when_no_ns_and_no_after(self):
        """
        asset2 has an unsubmitted transcription and asset1 a submitted one.
        With ``original_asset_id=None`` the lookup is expected to return the
        IN_PROGRESS asset2 from the same item.
        """
        in_progress, finished = self.asset2, self.asset1
        create_transcription(asset=in_progress, user=self.anon)  # IN_PROGRESS
        create_transcription(asset=finished, user=self.anon, submitted=now())

        origin_item = self.asset1.item
        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=origin_item.project.slug,
            item_id=origin_item.item_id,
            original_asset_id=None,  # no "after" position is supplied
        )

        self.assertEqual(result, in_progress)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_manual_invalid_after_str_campaign_valueerror_branch(self, mock_get_task):
        """
        ``original_asset_id`` is a non-digit string and no project/item hints
        are given. The first NOT_STARTED fixture asset is expected, and the
        mocked task's ``delay`` must have been called.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        result = find_next_transcribable_campaign_asset(
            self.campaign, project_slug="", item_id="", original_asset_id="not-an-int"
        )

        # asset1 comes first among the NOT_STARTED fixture assets.
        self.assertEqual(result, self.asset1)
        mock_get_task.assert_called()
        delay_mock.assert_called()


class TranscribableCampaignInternalsTests(CreateTestUsers, TestCase):
    """Tests for campaign-level transcribable queries and their cache rows."""

    def setUp(self):
        """Create the anonymous user, a test user and two assets in one item."""
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        first = create_asset(sequence=1, slug="tc-a1")
        self.asset1 = first
        self.asset2 = create_asset(item=first.item, sequence=2, slug="tc-a2")
        self.campaign = first.campaign

    def _cache_next_row(self, asset):
        """Create a NOT_STARTED cache row for ``asset`` under ``self.campaign``."""
        item = asset.item
        project = item.project
        return NextTranscribableCampaignAsset.objects.create(
            asset=asset,
            campaign=self.campaign,
            item=item,
            item_item_id=item.item_id,
            project=project,
            project_slug=project.slug,
            sequence=asset.sequence,
            transcription_status=TranscriptionStatus.NOT_STARTED,
        )

    def test_new_transcribable_excludes_reserved_and_cached(self):
        """A reserved asset and an already-cached asset are not reported as new."""
        shared_item = self.asset1.item
        reserved = create_asset(item=shared_item, sequence=3, slug="tc-res")
        cached = create_asset(item=shared_item, sequence=4, slug="tc-cached")
        # asset2 receives a submitted transcription before the query runs.
        create_transcription(asset=self.asset2, user=self.anon, submitted=now())
        # One new asset is reserved, the other is placed in the cache table.
        AssetTranscriptionReservation.objects.create(
            asset=reserved, reservation_token="tc-rv"  # nosec
        )
        self._cache_next_row(cached)

        new_assets = find_new_transcribable_campaign_assets(self.campaign)

        for excluded in (reserved, cached):
            self.assertNotIn(excluded, new_assets)

    def test_order_potential_transcribable_pref(self):
        """
        With ``asset_pk`` supplied, cached rows are expected in this order:
        same-item asset, same-project asset, then the other-project asset.
        """
        base_item = self.asset1.item
        same_item_next = create_asset(item=base_item, sequence=10, slug="tc-ci-next")

        sibling_item = create_item(project=base_item.project, item_id="tc-it-2")
        same_project = create_asset(item=sibling_item, sequence=5, slug="tc-p-next")

        foreign_project = create_project(
            campaign=self.campaign, slug="tc-op-proj", title="tc-op-proj"
        )
        foreign_item = create_item(project=foreign_project, item_id="tc-op-item")
        other_project_asset = create_asset(item=foreign_item, sequence=1, slug="tc-op")

        for candidate in (same_item_next, same_project, other_project_asset):
            self._cache_next_row(candidate)

        ordered = list(
            find_and_order_potential_transcribable_campaign_assets(
                self.campaign,
                project_slug=base_item.project.slug,
                item_id=base_item.item_id,
                asset_pk=self.asset1.id,
            ).values_list("asset_id", flat=True)
        )

        self.assertEqual(ordered[0], same_item_next.id)
        self.assertEqual(ordered[1], same_project.id)
        self.assertIn(other_project_asset.id, ordered[2:])

    def test_order_potential_transcribable_no_after(self):
        """
        With ``asset_pk=None``, the same-item row is expected first and the
        same-project row second.
        """
        base_item = self.asset1.item
        same_item = create_asset(item=base_item, sequence=9, slug="tc-ci-none")

        sibling_item = create_item(project=base_item.project, item_id="tc-it-np")
        same_project = create_asset(item=sibling_item, sequence=2, slug="tc-p-none")

        foreign_project = create_project(
            campaign=self.campaign, slug="tc-proj-none", title="tc-proj-none"
        )
        foreign_item = create_item(project=foreign_project, item_id="tc-it-op-none")
        other_project_asset = create_asset(
            item=foreign_item, sequence=1, slug="tc-op-none"
        )

        for candidate in (same_item, same_project, other_project_asset):
            self._cache_next_row(candidate)

        ordered = list(
            find_and_order_potential_transcribable_campaign_assets(
                self.campaign,
                project_slug=base_item.project.slug,
                item_id=base_item.item_id,
                asset_pk=None,
            ).values_list("asset_id", flat=True)
        )

        self.assertEqual(ordered[0], same_item.id)
        self.assertEqual(ordered[1], same_project.id)
        self.assertIn(other_project_asset.id, ordered[2:])

    def test_invalid_next_transcribable_reserved_and_submitted(self):
        """
        Cache rows for a reserved asset and for an asset with a submitted
        transcription are both expected among the invalid rows.
        """
        shared_item = self.asset1.item

        reserved = create_asset(item=shared_item, sequence=30, slug="tc-inv-res")
        AssetTranscriptionReservation.objects.create(
            asset=reserved, reservation_token="tc-rv-2"  # nosec
        )
        self._cache_next_row(reserved)

        # The row says NOT_STARTED while the asset has a submitted transcription.
        submitted = create_asset(item=shared_item, sequence=31, slug="tc-inv-wrong")
        create_transcription(asset=submitted, user=self.anon, submitted=now())
        self._cache_next_row(submitted)

        invalid_rows = find_invalid_next_transcribable_campaign_assets(
            self.campaign.id
        )
        invalid_ids = list(invalid_rows.values_list("asset_id", flat=True))

        for asset in (reserved, submitted):
            self.assertIn(asset.id, invalid_ids)


class TranscribableCampaignMoreInternalsTests(CreateTestUsers, TestCase):
    """Further tests of campaign transcribable helpers and the next-asset lookup."""

    def setUp(self):
        """Create users plus two titled assets that share one item."""
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        first = create_asset(sequence=1, slug="tc-more-a1", title="TC More A1")
        self.asset1 = first
        self.asset2 = create_asset(
            item=first.item, sequence=2, slug="tc-more-a2", title="TC More A2"
        )
        self.campaign = first.campaign

    def _cache_next_row(self, asset):
        """Create a NOT_STARTED cache row for ``asset`` under ``self.campaign``."""
        item = asset.item
        project = item.project
        return NextTranscribableCampaignAsset.objects.create(
            asset=asset,
            campaign=self.campaign,
            item=item,
            item_item_id=item.item_id,
            project=project,
            project_slug=project.slug,
            sequence=asset.sequence,
            transcription_status=TranscriptionStatus.NOT_STARTED,
        )

    def _submit_setup_assets(self):
        """Give asset1, then asset2, a submitted transcription."""
        for asset in (self.asset1, self.asset2):
            create_transcription(asset=asset, user=self.anon, submitted=now())

    def test_tc_reserved_ids_filters_to_campaign(self):
        """Only the reservation on this campaign's asset appears in the subquery."""
        AssetTranscriptionReservation.objects.create(
            asset=self.asset1, reservation_token="tc-res-here"  # nosec
        )
        foreign_campaign = create_campaign(slug="tc-other-c", title="tc-other-c")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="tc-other-p", title="tc-other-p"
        )
        foreign_item = create_item(project=foreign_project, item_id="tc-other-it")
        foreign_asset = create_asset(item=foreign_item, slug="tc-other-a")
        AssetTranscriptionReservation.objects.create(
            asset=foreign_asset, reservation_token="tc-res-there"  # nosec
        )

        reserved_rows = tc_reserved_ids_subq(self.campaign)
        reserved_ids = set(reserved_rows.values_list("asset_id", flat=True))

        self.assertIn(self.asset1.id, reserved_ids)
        self.assertNotIn(foreign_asset.id, reserved_ids)

    def test_tc_next_seq_after_variants(self):
        """``None`` and an unknown pk give ``None``; a real pk gives its sequence."""
        for unusable in (None, 999_999_999):
            self.assertIsNone(tc_next_seq_after(unusable))
        known = self.asset2
        self.assertEqual(tc_next_seq_after(known.id), known.sequence)

    def test_tc_order_unstarted_first_prefers_not_started(self):
        """The untouched asset1 sorts ahead of asset2, which has a transcription."""
        create_transcription(asset=self.asset2, user=self.anon)
        pair = Asset.objects.filter(id__in=[self.asset1.id, self.asset2.id])

        ranked_ids = list(tc_order_unstarted_first(pair).values_list("id", flat=True))

        self.assertEqual(ranked_ids[0], self.asset1.id)
        self.assertEqual(ranked_ids[1], self.asset2.id)

    def test_find_in_item_after_none_returns_first_not_started(self):
        """Without an "after" pk, the item lookup returns asset1."""
        result = tc_find_in_item(
            self.campaign, item_id=self.asset1.item.item_id, after_asset_pk=None
        )
        self.assertEqual(result, self.asset1)

    def test_find_in_item_skips_inprog_and_reserved_and_advances(self):
        """
        asset1 has an unsubmitted transcription and a third asset is reserved;
        looking after asset1 is expected to return asset2.
        """
        shared_item = self.asset1.item
        create_transcription(asset=self.asset1, user=self.anon)
        reserved = create_asset(item=shared_item, sequence=3, slug="tc-more-a3")
        AssetTranscriptionReservation.objects.create(
            asset=reserved, reservation_token="tc-res-a3"  # nosec
        )

        result = tc_find_in_item(
            self.campaign,
            item_id=shared_item.item_id,
            after_asset_pk=self.asset1.id,
        )

        self.assertEqual(result, self.asset2)

    def test_find_in_item_after_missing_excludes_id_only(self):
        """An "after" pk that should match no Asset still yields asset1."""
        absent_pk = 987654321
        result = tc_find_in_item(
            self.campaign,
            item_id=self.asset1.item.item_id,
            after_asset_pk=absent_pk,
        )
        self.assertEqual(result, self.asset1)

    def test_find_ns_in_proj_excludes_item_and_reserved(self):
        """
        With the setUp item excluded and the first asset of a second item
        reserved, the second asset of that item is expected.
        """
        project = self.asset1.item.project
        self._submit_setup_assets()
        second_item = create_item(project=project, item_id="tc-more-it-2")
        reserved = create_asset(item=second_item, sequence=1, slug="tc-more-ns1")
        expected = create_asset(item=second_item, sequence=2, slug="tc-more-ns2")
        AssetTranscriptionReservation.objects.create(
            asset=reserved, reservation_token="tc-res-ns1"  # nosec
        )

        result = tc_find_ns_in_proj(
            self.campaign,
            project_slug=project.slug,
            exclude_item_id=self.asset1.item.item_id,
        )

        self.assertEqual(result, expected)

    def test_find_ns_in_proj_blank_slug_none(self):
        """An empty project slug produces ``None``."""
        result = tc_find_ns_in_proj(self.campaign, project_slug="")
        self.assertIsNone(result)

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_cache_same_item_is_ignored_then_manual_selects(self, mock_get_task):
        """
        A cache row pointing at the current item's asset2 must not be returned.
        The asset created in another item is expected instead, and the mocked
        task's ``delay`` must have been called.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        self._submit_setup_assets()
        self._cache_next_row(self.asset2)

        current_item = self.asset1.item
        manual_item = create_item(project=current_item.project, item_id="tc-more-it-man")
        expected = create_asset(item=manual_item, sequence=10, slug="tc-more-pick")

        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug="",  # skip project-level short-circuit
            item_id=current_item.item_id,  # forces same-item short-circuit first
            original_asset_id=self.asset1.id,
        )

        self.assertEqual(result, expected)
        mock_get_task.assert_called()
        delay_mock.assert_called()

    @patch("concordia.utils.next_asset.transcribable.campaign.get_registered_task")
    def test_manual_excludes_original_pk_and_same_item(self, mock_get_task):
        """
        With the current item exhausted and the original pk set to the second
        asset of another item, that item's first asset is expected and the
        mocked task's ``delay`` must have been called.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        self._submit_setup_assets()

        current_item = self.asset1.item
        extra_item = create_item(project=current_item.project, item_id="tc-more-it-3")
        expected = create_asset(item=extra_item, sequence=1, slug="tc-more-keep")
        original = create_asset(item=extra_item, sequence=2, slug="tc-more-toss")

        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug="",
            item_id=current_item.item_id,
            original_asset_id=original.id,
        )

        self.assertEqual(result, expected)
        mock_get_task.assert_called()
        delay_mock.assert_called()

    def test_same_item_inprog_after_when_no_not_started(self):
        """
        asset2 is IN_PROGRESS and asset1 is submitted; looking after asset1 in
        the same item is expected to return asset2.
        """
        create_transcription(asset=self.asset2, user=self.anon)  # IN_PROGRESS
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())

        current_item = self.asset1.item
        result = find_next_transcribable_campaign_asset(
            self.campaign,
            project_slug=current_item.project.slug,
            item_id=current_item.item_id,
            original_asset_id=self.asset1.id,
        )

        self.assertEqual(result, self.asset2)

    def test_eligible_base_qs_filters_status_and_published(self):
        """
        The base queryset includes a NOT_STARTED and an IN_PROGRESS asset of
        this campaign. It leaves out the submitted asset1 and an asset that
        belongs to another campaign.
        """
        shared_item = self.asset1.item
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())
        untouched = create_asset(item=shared_item, sequence=3, slug="tc-more-ns-ok")
        started = create_asset(item=shared_item, sequence=4, slug="tc-more-ip-ok")
        create_transcription(asset=started, user=self.anon)  # IN_PROGRESS

        foreign_campaign = create_campaign(slug="tc-ebq-c", title="tc-ebq-c")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="tc-ebq-p", title="tc-ebq-p"
        )
        foreign_item = create_item(project=foreign_project, item_id="tc-ebq-i")
        foreign_asset = create_asset(item=foreign_item, slug="tc-ebq-a")

        eligible_ids = set(
            tc_eligible_base_qs(self.campaign).values_list("id", flat=True)
        )

        self.assertIn(untouched.id, eligible_ids)
        self.assertIn(started.id, eligible_ids)
        self.assertNotIn(self.asset1.id, eligible_ids)
        self.assertNotIn(foreign_asset.id, eligible_ids)

    def test_cached_transcribable_accessor_returns_rows(self):
        """A cache row created for asset1 is visible through the accessor."""
        row = self._cache_next_row(self.asset1)
        cached_rows = find_cached_transcribable_assets(self.campaign)
        self.assertIn(row.id, cached_rows.values_list("id", flat=True))

    def test_find_in_item_blank_item_id_none(self):
        """An empty item id produces ``None``."""
        result = tc_find_in_item(self.campaign, item_id="", after_asset_pk=None)
        self.assertIsNone(result)

    def test_find_ns_in_proj_without_exclude_includes_same_item(self):
        """
        No ``exclude_item_id`` is passed, so assets of the setUp item remain
        candidates and asset1 is expected.
        """
        project_slug = self.asset1.item.project.slug
        result = tc_find_ns_in_proj(self.campaign, project_slug=project_slug)
        self.assertEqual(result, self.asset1)


================================================
FILE: concordia/tests/test_utils_next_asset_transcribable_topic.py
================================================
from unittest.mock import MagicMock, patch

from django.test import TestCase
from django.utils.timezone import now

from concordia.models import (
    Asset,
    AssetTranscriptionReservation,
    NextTranscribableTopicAsset,
    TranscriptionStatus,
)
from concordia.utils import get_anonymous_user
from concordia.utils.next_asset import (
    find_new_transcribable_topic_assets,
    find_next_transcribable_topic_asset,
    find_transcribable_topic_asset,
)
from concordia.utils.next_asset.transcribable.topic import (
    _eligible_transcribable_base_qs as topic_transcribable_eligible_base_qs,
)
from concordia.utils.next_asset.transcribable.topic import (
    _find_transcribable_in_item_for_topic as topic_find_in_item_for_topic,
)
from concordia.utils.next_asset.transcribable.topic import (
    _find_transcribable_not_started_in_project_for_topic,
    find_and_order_potential_transcribable_topic_assets,
    find_invalid_next_transcribable_topic_assets,
)
from concordia.utils.next_asset.transcribable.topic import (
    _next_seq_after as topic_next_seq_after_for_transcribable,
)
from concordia.utils.next_asset.transcribable.topic import (
    _order_unstarted_first as topic_order_unstarted_first,
)
from concordia.utils.next_asset.transcribable.topic import (
    _reserved_asset_ids_subq as topic_transcribable_reserved_ids_subq,
)

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_topic,
    create_transcription,
)

# Module-level aliases for two names imported above from
# concordia.utils.next_asset.transcribable.topic. Each alias is bound to the
# same object as the imported name it is assigned from.
topic_find_not_started_in_project_for_topic = (
    _find_transcribable_not_started_in_project_for_topic
)
find_invalid_next_transcribable_topic_assets_fn = (
    find_invalid_next_transcribable_topic_assets
)


class NextTranscribableTopicAssetTests(CreateTestUsers, TestCase):
    """Tests for topic-level lookup of the next transcribable asset."""

    def setUp(self):
        """Create users, two assets in one item, and a topic on their project."""
        self.anon = get_anonymous_user()
        self.user = self.create_test_user()
        first = create_asset(slug="topic-asset-1", sequence=1, title="Topic Asset 1")
        self.asset1 = first
        self.asset2 = create_asset(
            item=first.item,
            sequence=2,
            slug="topic-asset-2",
            title="Topic Asset 2",
        )
        self.topic = create_topic(project=first.item.project)

    def _cache_next_row(self, asset, status=TranscriptionStatus.NOT_STARTED):
        """Create a cache row for ``asset`` under ``self.topic`` with ``status``."""
        item = asset.item
        project = item.project
        return NextTranscribableTopicAsset.objects.create(
            asset=asset,
            topic=self.topic,
            item=item,
            item_item_id=item.item_id,
            project=project,
            project_slug=project.slug,
            sequence=asset.sequence,
            transcription_status=status,
        )

    def _next_after_asset1(self):
        """Run the lookup with asset1's project, item and id as context."""
        origin_item = self.asset1.item
        return find_next_transcribable_topic_asset(
            self.topic,
            project_slug=origin_item.project.slug,
            item_id=origin_item.item_id,
            original_asset_id=self.asset1.id,
        )

    def test_find_new_transcribable_topic_assets_filters_correctly(self):
        """The submitted asset1 is left out while asset2 is still included."""
        create_transcription(asset=self.asset1, user=self.anon, submitted=now())

        new_assets = find_new_transcribable_topic_assets(self.topic)

        self.assertNotIn(self.asset1, new_assets)
        self.assertIn(self.asset2, new_assets)

    def test_find_transcribable_topic_asset_from_next_table(self):
        """An asset cached for the topic is the one returned."""
        self._cache_next_row(self.asset1)
        result = find_transcribable_topic_asset(self.topic)
        self.assertEqual(result, self.asset1)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_find_transcribable_topic_asset_falls_back_and_spawns_task(
        self, mock_get_task
    ):
        """
        No cache rows are created here; asset1 is still expected and the
        mocked task's ``delay`` must have been called.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        result = find_transcribable_topic_asset(self.topic)

        self.assertEqual(result, self.asset1)
        mock_get_task.assert_called()
        delay_mock.assert_called()

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_find_next_transcribable_topic_asset_orders_and_falls_back(
        self, mock_get_task
    ):
        """
        Looking after asset1 within its item is expected to return asset2
        without any task lookup or ``delay`` call.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        result = self._next_after_asset1()

        self.assertEqual(result, self.asset2)
        # The item-level answer is enough, so no task is expected.
        mock_get_task.assert_not_called()
        delay_mock.assert_not_called()

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_find_next_transcribable_topic_asset_when_next_asset_exists(
        self, mock_get_task
    ):
        """
        asset2 is IN_PROGRESS and cached as such; with no project/item/original
        hints it is expected back and no task activity may occur.
        """
        create_transcription(asset=self.asset2, user=self.anon)
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        self._cache_next_row(self.asset2, status=TranscriptionStatus.IN_PROGRESS)

        result = find_next_transcribable_topic_asset(
            self.topic, project_slug="", item_id="", original_asset_id=None
        )

        self.assertEqual(result, self.asset2)
        mock_get_task.assert_not_called()
        delay_mock.assert_not_called()

    def test_short_circuit_same_item_topic_respects_after_sequence_and_reservations(
        self,
    ):
        """
        After asset1 the lookup gives asset2. Once asset2 is reserved, the same
        lookup is expected to give the third asset of the item.
        """
        third = create_asset(
            item=self.asset1.item,
            sequence=3,
            slug="topic-asset-3",
            title="Topic Asset 3",
        )

        before_reservation = self._next_after_asset1()
        self.assertEqual(before_reservation, self.asset2)

        AssetTranscriptionReservation.objects.create(
            asset=self.asset2, reservation_token="tkn"  # nosec
        )
        after_reservation = self._next_after_asset1()
        self.assertEqual(after_reservation, third)

    def test_project_short_circuit_topic_prefers_not_started_over_in_progress(self):
        """
        With the setUp item exhausted, another item of the project holds an
        IN_PROGRESS asset (sequence 1) and a NOT_STARTED asset (sequence 2);
        the NOT_STARTED one is expected.
        """
        # Exhaust the setUp item.
        for finished in (self.asset1, self.asset2):
            create_transcription(asset=finished, user=self.anon, submitted=now())

        sibling_item = create_item(
            project=self.asset1.item.project, item_id="tproj-item"
        )
        started = create_asset(
            item=sibling_item, sequence=1, slug="tproj-inprog", title="TProj InProg"
        )
        create_transcription(asset=started, user=self.anon)

        untouched = create_asset(
            item=sibling_item,
            sequence=2,
            slug="tproj-notstarted",
            title="TProj NotStarted",
        )

        result = self._next_after_asset1()

        self.assertEqual(result, untouched)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_project_short_circuit_topic_without_item_id_allows_same_item(
        self, mock_get_task
    ):
        """
        With an empty ``item_id`` and no original asset, the project-level
        lookup is expected to return asset1 with no task activity.
        """
        delay_mock = MagicMock()
        mock_get_task.return_value.delay = delay_mock

        result = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id="",  # falsy -> do not exclude same item
            original_asset_id=None,  # no exclusion of original
        )

        # Both setUp assets are untouched in the same item; asset1 is expected.
        self.assertEqual(result, self.asset1)
        mock_get_task.assert_not_called()
        delay_mock.assert_not_called()


class TranscribableTopicInternalsTests(CreateTestUsers, TestCase):
    """
    Tests for the helper functions used by the topic-scoped transcribable
    asset lookup.

    Fixture: two assets (sequence 1 and 2) sharing one item, plus a topic
    created for that item's project.
    """

    def setUp(self):
        self.anonymous = get_anonymous_user()
        self.user = self.create_test_user()
        self.asset1 = create_asset(sequence=1, slug="tt-int-a1")
        shared_item = self.asset1.item
        self.asset2 = create_asset(item=shared_item, sequence=2, slug="tt-int-a2")
        self.topic = create_topic(project=shared_item.project)

    def _reserve_asset(self, asset, token):
        """Create a transcription reservation for ``asset`` using ``token``."""
        AssetTranscriptionReservation.objects.create(
            asset=asset, reservation_token=token
        )

    def test_topic_transcribable_reserved_ids_is_unfiltered(self):
        """Reservations inside and outside the fixture project are both listed."""
        self._reserve_asset(self.asset1, "tt-res-here")

        foreign_campaign = create_campaign(slug="tt-oc", title="tt-oc")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="tt-op", title="tt-op"
        )
        foreign_item = create_item(project=foreign_project, item_id="tt-oi")
        foreign_asset = create_asset(item=foreign_item, slug="tt-oa")
        self._reserve_asset(foreign_asset, "tt-res-there")

        reserved_ids = set(
            topic_transcribable_reserved_ids_subq().values_list("asset_id", flat=True)
        )
        for reserved in (self.asset1, foreign_asset):
            self.assertIn(reserved.id, reserved_ids)

    def test_topic_transcribable_eligible_base_qs_filters_correctly(self):
        """Untouched and unsubmitted assets are kept; submitted/foreign are not."""
        # asset2 receives a submitted transcription -> expected to be dropped.
        create_transcription(asset=self.asset2, user=self.anonymous, submitted=now())
        # asset1 stays without any transcription -> expected to be kept.
        untouched = self.asset1
        # A third asset with an unsubmitted transcription -> expected to be kept.
        drafted = create_asset(item=self.asset1.item, sequence=3, slug="tt-int-ip")
        create_transcription(asset=drafted, user=self.anonymous)
        # An asset under a separate campaign/project -> expected to be dropped.
        foreign_campaign = create_campaign(slug="tt-ebq-c", title="tt-ebq-c")
        foreign_project = create_project(
            campaign=foreign_campaign, slug="tt-ebq-p", title="tt-ebq-p"
        )
        foreign_item = create_item(project=foreign_project, item_id="tt-ebq-i")
        foreign_asset = create_asset(item=foreign_item, slug="tt-ebq-a")

        eligible = topic_transcribable_eligible_base_qs(self.topic)
        eligible_ids = set(eligible.values_list("id", flat=True))

        self.assertIn(untouched.id, eligible_ids)
        self.assertIn(drafted.id, eligible_ids)
        self.assertNotIn(self.asset2.id, eligible_ids)
        self.assertNotIn(foreign_asset.id, eligible_ids)

    def test_topic_next_seq_after_variants_for_transcribable(self):
        """None and an unknown pk give None; a real pk gives its sequence."""
        for absent_pk in (None, 987654321):
            self.assertIsNone(topic_next_seq_after_for_transcribable(absent_pk))

        found_sequence = topic_next_seq_after_for_transcribable(self.asset2.id)
        self.assertEqual(found_sequence, self.asset2.sequence)

    def test_topic_find_in_item_for_topic_after_none_returns_first_not_started(self):
        """Without an "after" asset, the item's first untouched asset is returned."""
        item_id = self.asset1.item.item_id
        result = topic_find_in_item_for_topic(
            self.topic, item_id=item_id, after_asset_pk=None
        )
        self.assertEqual(result, self.asset1)

    def test_topic_find_in_item_for_topic_skips_reserved_and_advances(self):
        """A reserved asset after the original is passed over for the next one."""
        third = create_asset(item=self.asset1.item, sequence=3, slug="tt-int-a3")
        self._reserve_asset(self.asset2, "tt-int-a2")

        result = topic_find_in_item_for_topic(
            self.topic,
            item_id=self.asset1.item.item_id,
            after_asset_pk=self.asset1.id,
        )
        self.assertEqual(result, third)

    def test_topic_find_in_item_for_topic_after_missing_excludes_only_id(self):
        """An "after" pk that matches no asset leaves asset1 selectable."""
        unknown_pk = 987654321
        result = topic_find_in_item_for_topic(
            self.topic,
            item_id=self.asset1.item.item_id,
            after_asset_pk=unknown_pk,
        )
        self.assertEqual(result, self.asset1)

    def test_topic_find_in_item_for_topic_blank_item_id_returns_none(self):
        """An empty item_id yields no asset."""
        result = topic_find_in_item_for_topic(
            self.topic, item_id="", after_asset_pk=None
        )
        self.assertIsNone(result)

    def test_topic_find_not_started_in_project_excludes_item_and_reserved(self):
        """The excluded item and reserved assets are both skipped."""
        project = self.asset1.item.project
        sibling_item = create_item(project=project, item_id="tt-int-ex")
        reserved_candidate = create_asset(
            item=sibling_item, sequence=1, slug="tt-int-ns1"
        )
        free_candidate = create_asset(item=sibling_item, sequence=2, slug="tt-int-ns2")
        self._reserve_asset(reserved_candidate, "tt-int-res")

        result = topic_find_not_started_in_project_for_topic(
            self.topic,
            project_slug=project.slug,
            exclude_item_id=self.asset1.item.item_id,
        )
        self.assertEqual(result, free_candidate)

    def test_topic_find_not_started_in_project_blank_slug_none(self):
        """An empty project slug yields no asset."""
        result = topic_find_not_started_in_project_for_topic(
            self.topic, project_slug=""
        )
        self.assertIsNone(result)

    def test_topic_order_unstarted_first_prefers_not_started(self):
        """The untouched asset is ordered ahead of the one with a transcription."""
        drafted = create_asset(item=self.asset1.item, sequence=4, slug="tt-int-ip-2")
        create_transcription(asset=drafted, user=self.anonymous)

        candidates = Asset.objects.filter(id__in=[self.asset1.id, drafted.id])
        ordered_ids = list(
            topic_order_unstarted_first(candidates).values_list("id", flat=True)
        )
        self.assertEqual(ordered_ids[0], self.asset1.id)
        self.assertEqual(ordered_ids[1], drafted.id)

    def test_topic_find_not_started_in_project_without_exclude_includes_same_item(
        self,
    ):
        """
        When exclude_item_id is falsy, the helper is expected to search the
        fixture item as well and return its first untouched asset, covering
        the branch where no item exclusion is applied.
        """
        slug = self.asset1.item.project.slug
        result = topic_find_not_started_in_project_for_topic(
            self.topic, project_slug=slug, exclude_item_id=""
        )
        self.assertEqual(result, self.asset1)


class NextTranscribableTopicMoreTests(CreateTestUsers, TestCase):
    """
    Additional coverage for topic-scoped "next transcribable asset" selection.

    Fixture: two assets (sequence 1 and 2) sharing one item, plus a topic
    created for that item's project. Neither asset has a transcription after
    setUp; individual tests add transcriptions, reservations and cache rows.
    """

    def setUp(self):
        self.anonymous = get_anonymous_user()
        self.user = self.create_test_user()
        self.asset1 = create_asset(slug="tt-more-a1", sequence=1, title="TT More A1")
        self.asset2 = create_asset(
            item=self.asset1.item, slug="tt-more-a2", sequence=2, title="TT More A2"
        )
        self.topic = create_topic(project=self.asset1.item.project)

    def _cache_asset(self, asset, status=TranscriptionStatus.NOT_STARTED):
        """
        Insert a NextTranscribableTopicAsset cache row for ``asset`` under
        ``self.topic``, copying the denormalized item/project/sequence fields
        from the asset and recording ``status`` as the cached status.

        Returns the created row.
        """
        return NextTranscribableTopicAsset.objects.create(
            asset=asset,
            topic=self.topic,
            item=asset.item,
            item_item_id=asset.item.item_id,
            project=asset.item.project,
            project_slug=asset.item.project.slug,
            sequence=asset.sequence,
            transcription_status=status,
        )

    def test_new_transcribable_topic_excludes_reserved_and_cached(self):
        """Reserved assets and already-cached assets are not offered as new."""
        reserved_asset = create_asset(
            item=self.asset1.item, sequence=3, slug="tt-more-res"
        )
        cached_asset = create_asset(
            item=self.asset1.item, sequence=4, slug="tt-more-cached"
        )
        self._cache_asset(cached_asset)
        AssetTranscriptionReservation.objects.create(
            asset=reserved_asset, reservation_token="tt-more-rv"  # nosec
        )
        queryset = find_new_transcribable_topic_assets(self.topic)
        self.assertNotIn(reserved_asset, queryset)
        self.assertNotIn(cached_asset, queryset)

    def test_find_and_order_potential_transcribable_topic_assets_ordering(self):
        """Cached rows come back same-item first, then same-project, then others."""
        base_item = self.asset1.item
        same_item_next = create_asset(
            item=base_item, sequence=10, slug="tt-pot-ci-next"
        )
        same_project_other_item = create_asset(
            item=create_item(project=base_item.project, item_id="tt-pot-it-2"),
            sequence=5,
            slug="tt-pot-proj",
        )
        other_project = create_project(
            campaign=self.asset1.campaign,
            slug="tt-pot-proj-oth",
            title="tt-pot-proj-oth",
        )
        other_item = create_item(project=other_project, item_id="tt-pot-it-3")
        other_project_asset = create_asset(
            item=other_item, sequence=1, slug="tt-pot-op"
        )

        for asset in (same_item_next, same_project_other_item, other_project_asset):
            self._cache_asset(asset)

        ordered = find_and_order_potential_transcribable_topic_assets(
            self.topic,
            project_slug=base_item.project.slug,
            item_id=base_item.item_id,
            asset_pk=self.asset1.id,
        ).values_list("asset_id", flat=True)

        ordered = list(ordered)
        # Prefer same item, then same project, then others
        self.assertEqual(ordered[0], same_item_next.id)
        self.assertEqual(ordered[1], same_project_other_item.id)
        self.assertIn(other_project_asset.id, ordered[2:])

    def test_find_invalid_next_transcribable_topic_assets_reserved_and_status(self):
        """Cache rows for reserved assets or with a stale status are reported."""
        # Cached as IN_PROGRESS and actually in progress, but reserved.
        reserved_asset = create_asset(
            item=self.asset1.item, sequence=30, slug="tt-inv-res"
        )
        create_transcription(asset=reserved_asset, user=self.anonymous)
        AssetTranscriptionReservation.objects.create(
            asset=reserved_asset, reservation_token="tt-inv-rv"  # nosec
        )
        self._cache_asset(reserved_asset, TranscriptionStatus.IN_PROGRESS)

        # Cached as NOT_STARTED although a submitted transcription exists.
        wrong_status_asset = create_asset(
            item=self.asset1.item, sequence=31, slug="tt-inv-wrong"
        )
        create_transcription(
            asset=wrong_status_asset, user=self.anonymous, submitted=now()
        )
        self._cache_asset(wrong_status_asset)

        bad = list(
            find_invalid_next_transcribable_topic_assets_fn(self.topic.id).values_list(
                "asset_id", flat=True
            )
        )
        self.assertIn(reserved_asset.id, bad)
        self.assertIn(wrong_status_asset.id, bad)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_cache_same_item_is_ignored_then_manual_selects_topic(self, mock_get_task):
        """A cached row from the current item is skipped; manual lookup picks."""
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Same-item cached row should be excluded, forcing manual fallback.
        self._cache_asset(self.asset2)
        # Make same-item short-circuit fail by reserving the only candidate.
        AssetTranscriptionReservation.objects.create(
            asset=self.asset2, reservation_token="tt-cache-same"  # nosec
        )
        # Provide a valid choice elsewhere to be picked by manual fallback.
        other_item = create_item(
            project=self.asset1.item.project, item_id="tt-cache-oth"
        )
        picked = create_asset(item=other_item, sequence=5, slug="tt-cache-pick")

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug="",
            item_id=self.asset1.item.item_id,
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(chosen, picked)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_cache_excludes_original_pk_and_chooses_next_topic(self, mock_get_task):
        """The cached row for the original asset is skipped for the next row."""
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        other_item = create_item(
            project=self.asset1.item.project, item_id="tt-cache-exc"
        )
        first = create_asset(item=other_item, sequence=1, slug="tt-cache-first")
        second = create_asset(item=other_item, sequence=2, slug="tt-cache-second")
        for asset in (first, second):
            self._cache_asset(asset)

        chosen = find_next_transcribable_topic_asset(
            self.topic, project_slug="", item_id="", original_asset_id=first.id
        )
        self.assertEqual(chosen, second)
        self.assertFalse(mock_get_task.called)
        self.assertFalse(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_same_item_inprogress_selected_when_no_not_started_topic(
        self, mock_get_task
    ):
        """With nothing untouched left, the same-item IN_PROGRESS asset is used."""
        # This fixture and argument set is the one for which
        # test_inprogress_fallback_spawns_task_with_item_id_topic asserts that
        # the background task is dispatched, so the task lookup is patched here
        # to keep the real task from being triggered by this test.
        mock_get_task.return_value.delay = MagicMock()

        create_transcription(asset=self.asset2, user=self.anonymous)
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())
        got = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=None,
        )
        self.assertEqual(got, self.asset2)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_next_transcribable_topic_none_anywhere_returns_none_no_spawn(
        self, mock_get_task
    ):
        """A topic without any assets yields None and requests no task."""
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Use a brand-new topic with no eligible assets anywhere.
        empty_campaign = create_campaign(slug="tt-none-c", title="tt-none-c")
        empty_project = create_project(
            campaign=empty_campaign, slug="tt-none-p", title="tt-none-p"
        )
        empty_topic = create_topic(project=empty_project)

        chosen = find_next_transcribable_topic_asset(
            topic=empty_topic, project_slug="", item_id="", original_asset_id=None
        )
        self.assertIsNone(chosen)
        self.assertFalse(mock_get_task.called)
        self.assertFalse(mock_task.delay.called)

    def test_item_gate_ignored_when_original_is_other_item_topic(self):
        """
        original_asset_id exists but belongs to a different item; item gate is ignored
        and we return the first NOT_STARTED in the requested item
        """
        other_item = create_item(
            project=self.asset1.item.project, item_id="tt-oth-item"
        )
        other_asset = create_asset(item=other_item, slug="tt-oth-a")

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=other_asset.id,
        )
        self.assertEqual(chosen, self.asset1)

    def test_item_digit_string_missing_treats_as_no_after_topic(self):
        """A numeric-string pk that matches no asset does not block asset1."""
        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id="987654321",  # valid digits, missing PK
        )
        self.assertEqual(chosen, self.asset1)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_manual_same_item_ip_when_no_ns_anywhere_topic(self, mock_get_task):
        """
        Manual fallback path with item_id present: when there are
        no NOT_STARTED anywhere, choose same-item IN_PROGRESS.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # No NOT_STARTED anywhere in this topic's project; only same-item IN_PROGRESS
        create_transcription(asset=self.asset2, user=self.anonymous)  # IN_PROGRESS
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())

        got = find_next_transcribable_topic_asset(
            self.topic,
            project_slug="",  # bypass short-circuit so we hit the manual path
            item_id=self.asset1.item.item_id,
            original_asset_id=None,
        )
        self.assertEqual(got, self.asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    def test_item_invalid_after_str_valueerror_branch_topic(self):
        """A non-numeric original_asset_id is tolerated and asset1 is returned."""
        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id="not-an-int",
        )
        self.assertEqual(chosen, self.asset1)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_manual_valid_after_excludes_original_and_picks_next_topic(
        self, mock_get_task
    ):
        """
        Manual fallback with a valid original_asset_id: use after_seq to exclude the
        original and return the next NOT_STARTED
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        other_item = create_item(
            project=self.asset1.item.project, item_id="tt-man-item"
        )
        first = create_asset(item=other_item, sequence=1, slug="tt-man-first")
        second = create_asset(item=other_item, sequence=2, slug="tt-man-second")

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug="",
            item_id="",
            original_asset_id=first.id,
        )
        self.assertEqual(chosen, second)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_inprogress_fallback_spawns_and_uses_after_gate_topic(self, mock_get_task):
        """Same-item IN_PROGRESS after the original is returned; task requested."""
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Make original (seq=1) SUBMITTED so it can't be chosen; keep it as "original".
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())
        # Only candidate anywhere: same-item IN_PROGRESS (seq=2).
        create_transcription(asset=self.asset2, user=self.anonymous)  # IN_PROGRESS

        # Ensure there are no other items/assets in the topic to be found
        # by manual path (manual path excludes same item when item_id is provided).
        # No cached rows either.

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=self.asset1.id,
        )

        self.assertEqual(chosen, self.asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_inprogress_fallback_with_digit_string_original_id(self, mock_get_task):
        """
        Same scenario as test_inprogress_fallback_spawns_and_uses_after_gate_topic,
        but pass original_asset_id as a DIGIT STRING to exercise the
        int(original_asset_id) path inside the after-seq filter.
        Also ensures exclude(pk=original_asset_id) runs without ValueError.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Original: SUBMITTED, seq=1
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())
        # Only candidate: same-item IN_PROGRESS, seq=2
        create_transcription(asset=self.asset2, user=self.anonymous)

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=str(self.asset1.id),
        )

        self.assertEqual(chosen, self.asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_inprogress_fallback_spawns_and_returns_asset_topic(self, mock_get_task):
        """IN_PROGRESS fallback on a fresh topic returns the asset; task requested."""
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Use a brand-new topic/project so no cached rows can interfere.
        campaign = create_campaign(slug="tt-ip-c1", title="tt-ip-c1")
        project = create_project(
            campaign=campaign,
            slug="tt-ip-p1",
            title="tt-ip-p1",
        )
        topic = create_topic(project=project)
        item = create_item(project=project, item_id="tt-ip-i1")

        asset1 = create_asset(item=item, sequence=1, slug="tt-ip-a1")
        asset2 = create_asset(item=item, sequence=2, slug="tt-ip-a2")
        create_transcription(asset=asset1, user=get_anonymous_user(), submitted=now())
        create_transcription(asset=asset2, user=get_anonymous_user())

        chosen = find_next_transcribable_topic_asset(
            topic=topic,
            project_slug=project.slug,
            item_id=item.item_id,
            original_asset_id=asset1.id,
        )

        self.assertEqual(chosen, asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_inprogress_fallback_with_digit_str_original_id_topic(self, mock_get_task):
        """
        Same scenario as test_inprogress_fallback_spawns_and_returns_asset_topic,
        but pass original_asset_id as a DIGIT STRING to run the int(...) path
        inside the after-seq filter and still spawn the task.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        campaign = create_campaign(slug="tt-ip-c2", title="tt-ip-c2")
        project = create_project(
            campaign=campaign,
            slug="tt-ip-p2",
            title="tt-ip-p2",
        )
        topic = create_topic(project=project)
        item = create_item(project=project, item_id="tt-ip-i2")

        asset1 = create_asset(item=item, sequence=1, slug="tt-ip2-a1")
        asset2 = create_asset(item=item, sequence=2, slug="tt-ip2-a2")
        create_transcription(asset=asset1, user=get_anonymous_user(), submitted=now())
        create_transcription(asset=asset2, user=get_anonymous_user())  # IN_PROGRESS

        chosen = find_next_transcribable_topic_asset(
            topic=topic,
            project_slug=project.slug,
            item_id=item.item_id,
            original_asset_id=str(asset1.id),  # digit-string pk
        )

        self.assertEqual(chosen, asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    def test_project_short_circuit_topic_excludes_current_item_via_item_filter(self):
        """
        project-level short-circuit executes with item_id truthy,
        so the code runs candidate = candidate.exclude(item__item_id=item_id).
        Item-level has no NOT_STARTED, so we land in the project block.
        """
        # Exhaust current item (no NOT_STARTED left there)
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())
        create_transcription(asset=self.asset2, user=self.anonymous, submitted=now())

        # Create a NOT_STARTED candidate in the same project but a different item
        other_item = create_item(
            project=self.asset1.item.project, item_id="tt-proj-ex-branch"
        )
        pick = create_asset(item=other_item, sequence=1, slug="tt-proj-ex-pick")

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(chosen, pick)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_inprogress_fallback_spawns_task_with_item_id_topic(self, mock_get_task):
        """Same-item IN_PROGRESS fallback returns asset2 and requests the task."""
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Same item: one IN_PROGRESS, one SUBMITTED -> no NOT_STARTED anywhere.
        create_transcription(asset=self.asset2, user=self.anonymous)
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())

        # With item_id set, manual fallback excludes same-item candidates, so
        # it returns nothing (spawn_task=True). Then the IN_PROGRESS fallback
        # must return asset2 and trigger the task.
        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=None,
        )
        self.assertEqual(chosen, self.asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_manual_same_item_inprogress_triggers_spawn_task_topic(self, mock_get_task):
        """
        When there are no NOT_STARTED candidates anywhere (after excluding current
        item/original in the manual fallback), the same-item IN_PROGRESS fallback
        should return an asset AND spawn the cache population task.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Same item only:
        # - original (NOT_STARTED) will be excluded by manual fallback,
        # - next is IN_PROGRESS (eligible for final fallback).
        create_transcription(asset=self.asset2, user=self.anonymous)

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug="",
            item_id=self.asset1.item.item_id,
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(chosen, self.asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_project_short_circuit_excludes_current_item_topic(self, mock_get_task):
        """Project-level pick comes from another item and requests no task."""
        # Submit both assets of the current item so it offers no candidates.
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())
        create_transcription(asset=self.asset2, user=self.anonymous, submitted=now())

        other_item = create_item(
            project=self.asset1.item.project, item_id="topic-proj-exclude-item"
        )
        pick = create_asset(item=other_item, sequence=5, slug="topic-proj-exclude-pick")

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=self.asset1.id,
        )
        self.assertEqual(chosen, pick)
        self.assertFalse(mock_get_task.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_manual_inprogress_fallback_triggers_spawn_task_topic(self, mock_get_task):
        """IN_PROGRESS fallback after an empty manual lookup requests the task."""
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())
        create_transcription(asset=self.asset2, user=self.anonymous)

        chosen = find_next_transcribable_topic_asset(
            self.topic,
            project_slug=self.asset1.item.project.slug,
            item_id=self.asset1.item.item_id,
            original_asset_id=None,
        )
        self.assertEqual(chosen, self.asset2)
        self.assertTrue(mock_get_task.called)
        self.assertTrue(mock_task.delay.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_inprogress_fallback_item_id_returns_none_when_no_candidates_topic(
        self, mock_get_task
    ):
        """
        With item_id truthy but no same-item IN_PROGRESS (and no NOT_STARTED anywhere),
        the IN_PROGRESS fallback should yield no asset and the function returns None.
        Ensures the path where `asset` is falsy in the IN_PROGRESS block is covered.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Fresh topic/project with a single item and no transcribable assets at all.
        campaign = create_campaign(slug="tt-ip-none-c", title="tt-ip-none-c")
        project = create_project(
            campaign=campaign, slug="tt-ip-none-p", title="tt-ip-none-p"
        )
        topic = create_topic(project=project)
        item = create_item(project=project, item_id="tt-ip-none-i")

        a1 = create_asset(item=item, sequence=1, slug="tt-ip-none-a1")
        a2 = create_asset(item=item, sequence=2, slug="tt-ip-none-a2")
        # Make both SUBMITTED so neither NOT_STARTED nor IN_PROGRESS exists.
        create_transcription(asset=a1, user=get_anonymous_user(), submitted=now())
        create_transcription(asset=a2, user=get_anonymous_user(), submitted=now())

        got = find_next_transcribable_topic_asset(
            topic=topic,
            project_slug=project.slug,
            item_id=item.item_id,  # truthy, so we enter the IN_PROGRESS fallback
            original_asset_id=None,
        )
        self.assertIsNone(got)
        # No task should be spawned since the IN_PROGRESS block found nothing.
        self.assertFalse(mock_get_task.called)

    @patch("concordia.utils.next_asset.transcribable.topic.get_registered_task")
    def test_inprogress_fallback_returns_asset_without_spawning(self, mock_get_task):
        """
        Force a path where the cache stage is exercised (so spawn_task stays False),
        but yields no usable asset (simulated by making the cached asset retrieval
        return None). The function should then fall through to the IN_PROGRESS
        fallback, return that asset and NOT spawn the population task.
        """
        mock_task = mock_get_task.return_value
        mock_task.delay = MagicMock()

        # Current item: seq1 SUBMITTED, seq2 IN_PROGRESS -> same-item NOT_STARTED fails.
        create_transcription(asset=self.asset1, user=self.anonymous, submitted=now())
        create_transcription(asset=self.asset2, user=self.anonymous)  # IN_PROGRESS

        # Prepare a cached candidate in a DIFFERENT project so project short-circuit
        # doesn't grab it (only checks current project_slug).
        other_campaign = create_campaign(slug="tt-ip-cache-c", title="tt-ip-cache-c")
        other_project = create_project(
            campaign=other_campaign, slug="tt-ip-cache-p", title="tt-ip-cache-p"
        )
        other_item = create_item(project=other_project, item_id="tt-ip-cache-i")
        cached_asset = create_asset(item=other_item, sequence=1, slug="tt-ip-cache-a")

        self._cache_asset(cached_asset)

        # Patch Asset.objects.filter only for id=cached_asset.id so the cache lookup
        # produces an asset_id (spawn_task remains False) but then returns no row,
        # forcing the function into the IN_PROGRESS fallback.
        real_filter = Asset.objects.filter

        def filter_side_effect(*args, **kwargs):
            # Only the exact keyword lookup {"id": <cached pk>} is intercepted;
            # every other filter() call is passed through to the real manager.
            if kwargs == {"id": cached_asset.id}:
                qs_mock = MagicMock()
                qs_mock.select_for_update.return_value = qs_mock
                qs_mock.select_related.return_value = qs_mock
                qs_mock.first.return_value = None  # simulate skip-locked/missing row
                return qs_mock
            return real_filter(*args, **kwargs)

        with patch.object(Asset.objects, "filter", side_effect=filter_side_effect):
            chosen = find_next_transcribable_topic_asset(
                self.topic,
                project_slug=self.asset1.item.project.slug,
                item_id=self.asset1.item.item_id,
                original_asset_id=None,
            )

        # Should fall back to same-item IN_PROGRESS and NOT spawn the task.
        self.assertEqual(chosen, self.asset2)
        self.assertFalse(mock_get_task.called)


================================================
FILE: concordia/tests/test_validators.py
================================================
import string

from django.core.exceptions import ValidationError
from django.test import TestCase

from concordia.passwords.validators import ComplexityValidator
from concordia.validators import DjangoPasswordsValidator


class TestValidators(TestCase):
    """Checks for the ``DjangoPasswordsValidator`` password validator."""

    def test_DjangoPasswordsValidator(self):
        """
        A password with a lowercase letter, an uppercase letter, a digit and a
        special character validates; dropping any one of those raises a
        ``ValidationError`` with code ``complexity`` and a specific message.
        """
        validator = DjangoPasswordsValidator()
        self.assertIsNone(validator.validate("Ab1!"))

        message_template = "Must be more complex (%s)"
        # (password missing one character class, detail expected in the message)
        rejected = (
            ("AB1!", "must contain 1 or more unique lowercase characters"),
            ("ab1!", "must contain 1 or more unique uppercase characters"),
            ("Ab!", "must contain 1 or more unique digits"),
            ("Ab1", "must contain 1 or more non unique special characters"),
        )
        for password, detail in rejected:
            with self.assertRaises(ValidationError) as caught:
                validator.validate(password)
            error = caught.exception
            self.assertEqual(error.messages, [message_template % detail])
            self.assertEqual(error.error_list[0].code, "complexity")

        self.assertEqual(
            validator.get_help_text(),
            "Your password fails to meet our complexity requirements.",
        )


class ComplexityValidatorTests(TestCase):
    """Threshold tests for each complexity class of ``ComplexityValidator``."""

    def assertValid(self, validator, string):
        """Fail the test if ``validator(string)`` raises ``ValidationError``."""
        try:
            validator(string)
        except ValidationError:
            self.fail(f"String {string} failed validation unexpectedly")

    def assertInvalid(self, validator, string):
        """Require ``validator(string)`` to raise ``ValidationError``."""
        with self.assertRaises(ValidationError):
            validator(string)

    def make_validator(self, **complexities):
        """Build a validator whose ``complexities`` are the given keywords."""
        return ComplexityValidator(complexities=complexities)

    def _expect(self, validator, rejected=(), accepted=()):
        """Check every ``rejected`` sample fails and every ``accepted`` passes."""
        for candidate in rejected:
            self.assertInvalid(validator, candidate)
        for candidate in accepted:
            self.assertValid(validator, candidate)

    def test_empty_validator(self):
        """With no complexities configured, even the empty string is valid."""
        self.assertValid(ComplexityValidator(complexities=None), "")

    def test_minimum_uppercase_count(self):
        """UPPER thresholds of 0, 1 and 100 against three sample strings."""
        samples = ("no uppercase", "Some UpperCase", "ALL UPPERCASE")

        self._expect(self.make_validator(UPPER=0), accepted=samples)
        self._expect(
            self.make_validator(UPPER=1), rejected=samples[:1], accepted=samples[1:]
        )
        self._expect(self.make_validator(UPPER=100), rejected=samples)

    def test_minimum_lowercase_count(self):
        """LOWER thresholds of 0, 1 and 100 against three sample strings."""
        samples = ("NO LOWERCASE", "sOME lOWERCASE", "all lowercase")

        self._expect(self.make_validator(LOWER=0), accepted=samples)
        self._expect(
            self.make_validator(LOWER=1), rejected=samples[:1], accepted=samples[1:]
        )
        self._expect(self.make_validator(LOWER=100), rejected=samples)

    def test_minimum_letter_count(self):
        """LETTERS thresholds of 0, 1 and 100 against three sample strings."""
        samples = ("1234. ?", "soME 123", "allletters")

        self._expect(self.make_validator(LETTERS=0), accepted=samples)
        self._expect(
            self.make_validator(LETTERS=1), rejected=samples[:1], accepted=samples[1:]
        )
        self._expect(self.make_validator(LETTERS=100), rejected=samples)

    def test_minimum_digit_count(self):
        """DIGITS thresholds of 0 and 1; only the empty string lacks a digit."""
        samples = ("", "0", "1", "11", "one 1")

        self._expect(self.make_validator(DIGITS=0), accepted=samples)
        self._expect(
            self.make_validator(DIGITS=1), rejected=samples[:1], accepted=samples[1:]
        )

    def test_minimum_punctuation_count(self):
        """SPECIAL thresholds of 0, 1 and 100 against punctuation samples."""
        samples = (
            "no punctuation",
            "ffs!",
            r"w@oo%lo(om!ol~oo&",
            string.punctuation,
        )

        self._expect(self.make_validator(SPECIAL=0), accepted=samples)
        self._expect(
            self.make_validator(SPECIAL=1), rejected=samples[:1], accepted=samples[1:]
        )
        self._expect(self.make_validator(SPECIAL=100), rejected=samples)

    def test_minimum_nonascii_count(self):
        """SPECIAL thresholds against control and whitespace characters."""
        samples = (
            "regularchars and numbers 100",
            "\x00",  # null
            "\x00\x01\x02\x03\x04\x05\t\n\r",
        )

        self._expect(self.make_validator(SPECIAL=0), accepted=samples)
        self._expect(
            self.make_validator(SPECIAL=1), rejected=samples[:1], accepted=samples[1:]
        )
        self._expect(self.make_validator(SPECIAL=100), rejected=samples)

    def test_minimum_words_count(self):
        """WORDS thresholds of 0, 1, 10 and 100 against four sample strings."""
        samples = (
            "",
            "oneword",
            "one or two words",
            "a b c d e f g h i 1 2 3 4 5 6 7 8 9 { $ # ! )}",
        )

        self._expect(self.make_validator(WORDS=0), accepted=samples)
        self._expect(
            self.make_validator(WORDS=1), rejected=samples[:1], accepted=samples[1:]
        )
        self._expect(
            self.make_validator(WORDS=10), rejected=samples[:3], accepted=samples[3:]
        )
        self._expect(self.make_validator(WORDS=100), rejected=samples)


================================================
FILE: concordia/tests/test_view_decorators.py
================================================
from unittest.mock import MagicMock, patch

from django.core.exceptions import ObjectDoesNotExist, ValidationError
from django.http import HttpRequest
from django.test import TestCase

from concordia.views.decorators import next_asset_rate


class TestNextAssetRate(TestCase):
    """Tests of ``next_asset_rate`` for authenticated and anonymous users."""

    CONFIGURATION_VALUE = "concordia.views.decorators.configuration_value"
    VALIDATE_RATE = "concordia.views.decorators.validate_rate"

    def setUp(self):
        self.request = HttpRequest()

    def _set_user(self, authenticated):
        """Attach a mock user with the given ``is_authenticated`` flag."""
        self.request.user = MagicMock(is_authenticated=authenticated)

    def test_authenticated_user_returns_none(self):
        """Authenticated requests get ``None`` back."""
        self._set_user(True)
        self.assertIsNone(next_asset_rate("any.group", self.request))

    def test_anonymous_user_valid_rate(self):
        """A configured rate that validates is returned as-is."""
        with (
            patch(self.VALIDATE_RATE) as validate_rate,
            patch(self.CONFIGURATION_VALUE) as configured,
        ):
            self._set_user(False)
            configured.return_value = "10/m"
            validate_rate.return_value = "10/m"

            rate = next_asset_rate("next_asset", self.request)

        self.assertEqual(rate, "10/m")

    def test_anonymous_user_invalid_rate_falls_back(self):
        """A configured rate that fails validation yields ``"4/m"``."""
        with (
            patch(self.VALIDATE_RATE) as validate_rate,
            patch(self.CONFIGURATION_VALUE) as configured,
        ):
            self._set_user(False)
            configured.return_value = "invalid"
            validate_rate.side_effect = ValidationError("bad")

            rate = next_asset_rate("next_asset", self.request)

        self.assertEqual(rate, "4/m")

    def test_anonymous_user_missing_value_falls_back(self):
        """A missing configuration value yields ``"4/m"``."""
        with patch(self.CONFIGURATION_VALUE) as configured:
            self._set_user(False)
            configured.side_effect = ObjectDoesNotExist()

            rate = next_asset_rate("next_asset", self.request)

        self.assertEqual(rate, "4/m")


================================================
FILE: concordia/tests/test_views.py
================================================
import json
from datetime import date, timedelta
from unittest.mock import patch

from django import forms
from django.contrib.auth.models import AnonymousUser
from django.core.cache import caches
from django.db.models.signals import post_save
from django.http import HttpResponse, JsonResponse
from django.test import (
    Client,
    RequestFactory,
    TestCase,
    override_settings,
)
from django.urls import reverse
from django.utils.decorators import method_decorator
from django.utils.timezone import now

from concordia.models import (
    Asset,
    Campaign,
    Transcription,
)
from concordia.signals.handlers import on_transcription_save
from concordia.tasks.reports.sitereport import campaign_report
from concordia.utils import get_anonymous_user
from concordia.views.accounts import AccountProfileView, registration_rate
from concordia.views.campaigns import CompletedCampaignListView
from concordia.views.decorators import reserve_rate, user_cache_control
from concordia.views.items import FilteredItemDetailView
from concordia.views.projects import FilteredProjectDetailView
from concordia.views.rate_limit import ratelimit_view
from concordia.views.visualizations import VisualizationDataView

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
    create_campaign,
    create_card_family,
    create_guide,
    create_item,
    create_project,
    create_research_center,
    create_tag_collection,
    create_topic,
    create_transcription,
)


def setup_view(view, request, user=None, *args, **kwargs):
    """
    Attach a request and URL arguments to a view instance so its methods can
    be called directly in a test.

    When ``user`` is truthy it is stored on ``request.user``. The view then
    receives ``request``, ``args`` and ``kwargs`` as attributes and is
    returned.

    https://stackoverflow.com/a/33647251/10320488
    """
    if user:
        request.user = user
    for attribute, value in (
        ("request", request),
        ("args", args),
        ("kwargs", kwargs),
    ):
        setattr(view, attribute, value)
    return view


class AccountProfileViewTests(CreateTestUsers, TestCase):
    """
    Unit tests for AccountProfileView.
    """

    def test_get_queryset(self):
        """
        get_queryset() returns an empty queryset for the logged-in test user.
        """
        self.login_user()
        request = RequestFactory().get("account/password_reset/")
        view = setup_view(AccountProfileView(), request, user=self.user)
        self.assertEqual(view.get_queryset().count(), 0)


class CompletedCampaignListViewTests(TestCase):
    """
    This class contains the unit tests for the CompletedCampaignListView
    """

    def setUp(self):
        """
        Create one research center and two published campaigns that were
        completed yesterday: ``campaign2`` (COMPLETED, linked to the research
        center) and ``campaign3`` (RETIRED, no research center).
        """
        today = date.today()
        yesterday = today - timedelta(days=1)

        self.research_center = create_research_center()
        self.campaign2 = create_campaign(
            published=True,
            status=Campaign.Status.COMPLETED,
            slug="test-campaign-2",
            completed_date=yesterday,
        )
        self.campaign2.research_centers.add(self.research_center)
        self.campaign3 = create_campaign(
            published=True,
            status=Campaign.Status.RETIRED,
            slug="test-campaign-3",
            completed_date=yesterday,
        )

    def test_get_all_campaigns(self):
        """
        ``_get_all_campaigns`` never returns a campaign created without an
        explicit status, and honours the ``type`` query parameter.
        """
        active = create_campaign(
            published=True,
            slug="test-campaign-4",
            completed_date=self.campaign2.completed_date,
        )
        view = CompletedCampaignListView()

        # No type filter: both completed and retired campaigns are returned.
        view.request = RequestFactory().get("/campaigns/completed/")
        completed_and_retired = view._get_all_campaigns()
        self.assertNotIn(active, completed_and_retired)
        self.assertIn(self.campaign2, completed_and_retired)
        self.assertIn(self.campaign3, completed_and_retired)

        view.request = RequestFactory().get("/campaigns/completed/?type=completed")
        completed_campaigns = view._get_all_campaigns()
        self.assertNotIn(active, completed_campaigns)
        self.assertIn(self.campaign2, completed_campaigns)
        self.assertNotIn(self.campaign3, completed_campaigns)

        view.request = RequestFactory().get("/campaigns/completed/?type=retired")
        retired_campaigns = view._get_all_campaigns()
        self.assertNotIn(active, retired_campaigns)
        self.assertNotIn(self.campaign2, retired_campaigns)
        self.assertIn(self.campaign3, retired_campaigns)

    def test_queryset(self):
        """
        ``get_queryset`` puts the most recently completed campaign first and
        returns a single row for ``type=retired``.
        """
        today = date.today()
        # A campaign completed today, so the first and last rows have
        # different completion dates.
        create_campaign(
            published=True, status=Campaign.Status.COMPLETED, completed_date=today
        )

        view = CompletedCampaignListView()

        # Test default
        view.request = RequestFactory().get("/campaigns/completed/")
        queryset = view.get_queryset()
        self.assertGreater(
            queryset.first().completed_date, queryset.last().completed_date
        )

        # Test retired
        view.request = RequestFactory().get("/campaigns/completed/?type=retired")
        queryset = view.get_queryset()
        self.assertEqual(queryset.count(), 1)

    def test_context_data(self):
        """
        ``result_count`` in the context reflects the unfiltered list and each
        of the ``type`` and ``research_center`` filters.
        """
        # Unfiltered: the completed and the retired campaign from setUp.
        request = RequestFactory().get("/campaigns/completed/")
        response = CompletedCampaignListView.as_view()(request)
        self.assertIsInstance(response.context_data, dict)
        self.assertEqual(response.context_data["result_count"], 2)

        request = RequestFactory().get("/campaigns/completed/?type=completed")
        response = CompletedCampaignListView.as_view()(request)
        self.assertIsInstance(response.context_data, dict)
        self.assertEqual(response.context_data["result_count"], 1)

        # This request used to repeat ``type=completed``; check the retired
        # filter instead so both type filters are covered.
        request = RequestFactory().get("/campaigns/completed/?type=retired")
        response = CompletedCampaignListView.as_view()(request)
        self.assertIsInstance(response.context_data, dict)
        self.assertEqual(response.context_data["result_count"], 1)

        # Only campaign2 is linked to the research center.
        request = RequestFactory().get(
            f"/campaigns/completed/?research_center={self.research_center.id}"
        )
        response = CompletedCampaignListView.as_view()(request)
        self.assertIsInstance(response.context_data, dict)
        self.assertEqual(response.context_data["result_count"], 1)

    def test_research_centers(self):
        """
        Filtering by research center returns only the linked campaign, and the
        rendered context lists that research center.
        """
        today = date.today()

        # Completed campaign with no research center; it must be filtered out.
        create_campaign(
            published=True, status=Campaign.Status.COMPLETED, completed_date=today
        )

        url = f"/campaigns/completed/?research_center={self.research_center.id}"

        # Test queryset directly
        view = CompletedCampaignListView()
        view.request = RequestFactory().get(url)
        queryset = view.get_queryset()

        self.assertEqual(queryset.count(), 1)

        # Test get_context_data through a get
        response = self.client.get(url)

        self.assertIn("research_centers", response.context)
        self.assertEqual(response.context["research_centers"][0], self.research_center)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class ConcordiaViewTests(CreateTestUsers, JSONAssertMixin, TestCase):
    """
    This class contains the unit tests for the view in the concordia app.
    """

    def setUp(self):
        """Clear every configured cache before each test."""
        for backend in caches.all():
            backend.clear()

    def tearDown(self):
        """Clear every configured cache after each test."""
        for backend in caches.all():
            backend.clear()

    def test_ratelimit_view(self):
        """
        /error/429/ answers with status 429: an HttpResponse for a plain
        request and a JsonResponse when X-Requested-With is XMLHttpRequest.
        """
        client = Client()

        plain = client.get("/error/429/")
        self.assertIsInstance(plain, HttpResponse)
        self.assertEqual(plain.status_code, 429)

        ajax = client.get("/error/429/", HTTP_X_REQUESTED_WITH="XMLHttpRequest")
        self.assertIsInstance(ajax, JsonResponse)
        self.assertEqual(ajax.status_code, 429)

    def test_campaign_topic_list_view(self):
        """
        Test the GET method for route /campaigns-topics

        Listed campaign and topic titles appear in the page; unlisted ones
        do not.
        """
        # Listed campaign with a project, item and asset
        campaign = create_campaign(title="Hello Everyone")
        topic_project = create_project(campaign=campaign)
        create_asset(item=create_item(project=topic_project))

        # Unlisted campaign with the same structure
        unlisted_campaign = create_campaign(
            title="Hello to only certain people", unlisted=True
        )
        unlisted_topic_project = create_project(campaign=unlisted_campaign)
        create_asset(item=create_item(project=unlisted_topic_project))

        topic = create_topic(title="A Listed Topic", project=topic_project)
        unlisted_topic = create_topic(
            title="An Unlisted Topic", unlisted=True, project=unlisted_topic_project
        )

        response = self.client.get(reverse("campaign-topic-list"))

        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(
            response, template_name="transcriptions/campaign_topic_list.html"
        )
        for listed, unlisted in ((topic, unlisted_topic), (campaign, unlisted_campaign)):
            self.assertContains(response, listed.title)
            self.assertNotContains(response, unlisted.title)

    def test_campaign_list_view(self):
        """
        Test the GET method for route /campaigns

        The listed campaign's title is rendered; the unlisted one's is not.
        """
        listed = create_campaign(title="Hello Everyone 2")
        hidden = create_campaign(title="Hello to only certain people 2", unlisted=True)

        list_url = reverse("transcriptions:campaign-list")
        response = self.client.get(list_url)

        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(
            response, template_name="transcriptions/campaign_list.html"
        )
        self.assertContains(response, listed.title)
        self.assertNotContains(response, hidden.title)

    def test_campaign_detail_view(self):
        """
        Test GET on route /campaigns/<slug-value> (campaign)

        Covers a plain campaign (with and without query parameters), then
        unlisted, completed and retired campaigns, checking the template used
        for each.
        """

        def check_detail(target, template, query=None):
            # GET the campaign detail page; expect a 200 rendered with
            # ``template`` that contains the campaign title.
            url = reverse("transcriptions:campaign-detail", args=(target.slug,))
            response = self.client.get(url, query)
            self.assertEqual(response.status_code, 200)
            self.assertTemplateUsed(response, template_name=template)
            self.assertContains(response, target.title)

        default_template = "transcriptions/campaign_detail.html"

        campaign = create_campaign(title="GET Campaign", slug="get-campaign")
        check_detail(campaign, default_template)
        # Filter by reviewable parameter check
        check_detail(campaign, default_template, {"filter_by_reviewable": True})
        # Bad status parameter check
        check_detail(
            campaign, default_template, {"transcription_status": "bad_parameter"}
        )

        # Unlisted
        campaign = create_campaign(
            title="GET Unlisted Campaign", unlisted=True, slug="get-unlisted-campaign"
        )
        check_detail(campaign, default_template)

        # Completed
        campaign = create_campaign(
            title="GET Completed Campaign",
            slug="get-completed-campaign",
            status=Campaign.Status.COMPLETED,
        )
        check_detail(campaign, "transcriptions/campaign_detail_completed.html")

        # Retired
        campaign = create_campaign(
            title="GET Retired Campaign",
            slug="get-retired-campaign",
            status=Campaign.Status.RETIRED,
        )
        # We need a site report for a retired campaign because
        # that's where the view pulls data from
        campaign_report(campaign=campaign)
        check_detail(campaign, "transcriptions/campaign_detail_retired.html")

    def test_campaign_unicode_slug(self):
        """Confirm that Unicode characters are usable in Campaign URLs"""
        unicode_campaign = create_campaign(title="你好 World")
        self.assertEqual(unicode_campaign.slug, "你好-world")

        campaign_url = unicode_campaign.get_absolute_url()
        self.assertEqual(self.client.get(campaign_url).status_code, 200)

    def test_concordiaCampaignView_get_page2(self):
        """
        Test GET on route /campaigns/<slug-value>/ (campaign) on page 2
        """
        campaign = create_campaign()
        detail_url = reverse("transcriptions:campaign-detail", args=(campaign.slug,))

        response = self.client.get(detail_url, {"page": 2})

        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(
            response, template_name="transcriptions/campaign_detail.html"
        )

    def test_empty_item_detail_view(self):
        """
        Test item detail display with no assets

        Every status percentage in the context is expected to be zero.
        """
        item = create_item()
        route_args = (item.project.campaign.slug, item.project.slug, item.item_id)

        response = self.client.get(
            reverse("transcriptions:item-detail", args=route_args)
        )

        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(
            response, template_name="transcriptions/item_detail.html"
        )
        self.assertContains(response, item.title)
        for context_key in (
            "not_started_percent",
            "in_progress_percent",
            "submitted_percent",
            "completed_percent",
        ):
            self.assertEqual(0, response.context[context_key])

    def test_item_detail_view(self):
        """
        Test item detail display with assets

        Also covers the reviewable filter, an invalid status parameter and
        the redirect for an item id that does not exist.
        """

        self.login_user()  # Implicitly create the test account
        anonymous = get_anonymous_user()

        item = create_item()
        # Ten assets: 1-4 get no transcription, 5-7 an unsubmitted one,
        # 8-9 a submitted one and 10 a submitted and accepted one, so the
        # percentages below can be checked.
        for number in range(1, 11):
            asset = create_asset(item=item, sequence=number, slug=f"test-{number}")
            if number <= 4:
                continue

            transcription = asset.transcription_set.create(asset=asset, user=anonymous)
            if number > 7:
                transcription.submitted = now()
            if number > 9:
                transcription.accepted = now()
                transcription.reviewed_by = self.user

            transcription.full_clean()
            transcription.save()

        campaign_slug = item.project.campaign.slug
        project_slug = item.project.slug
        item_url = reverse(
            "transcriptions:item-detail",
            args=(campaign_slug, project_slug, item.item_id),
        )
        item_template = "transcriptions/item_detail.html"

        response = self.client.get(item_url)
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, template_name=item_template)
        self.assertContains(response, item.title)
        # We have 10 total, 6 of which have transcription records and of those
        # 6, 3 have been submitted and one of those was accepted:
        expected_percentages = {
            "not_started_percent": 40,
            "in_progress_percent": 30,
            "submitted_percent": 20,
            "completed_percent": 10,
        }
        for context_key, expected in expected_percentages.items():
            self.assertEqual(expected, response.context[context_key])

        # Filter by reviewable parameter check, then bad status parameter check
        for query in (
            {"filter_by_reviewable": True},
            {"transcription_status": "bad_parameter"},
        ):
            response = self.client.get(item_url, query)
            self.assertEqual(response.status_code, 200)
            self.assertTemplateUsed(response, template_name=item_template)

        # Non-existent item in an existing campaign
        missing_item_url = reverse(
            "transcriptions:item-detail",
            args=(campaign_slug, project_slug, "bad-id"),
        )
        response = self.client.get(missing_item_url)
        self.assertRedirects(
            response,
            reverse("transcriptions:campaign-detail", args=(campaign_slug,)),
        )

    def test_asset_unicode_slug(self):
        """Confirm that Unicode characters are usable in Asset URLs"""
        unicode_asset = create_asset(title="你好 World")
        self.assertEqual(unicode_asset.slug, "你好-world")

        asset_url = unicode_asset.get_absolute_url()
        self.assertEqual(self.client.get(asset_url).status_code, 200)

    def test_asset_detail_view(self):
        """
        Test GET on the asset detail route for an asset that already has a
        transcription.

        Checks the cards, guides and tags in the context, the previous and
        next asset URLs, the thumbnail URL built from an IIIF download URL,
        and the redirect for an asset slug that does not exist.
        """
        self.login_user()

        asset = create_asset(sequence=100)

        self.transcription = asset.transcription_set.create(
            user_id=self.user.id, text="Test transcription 1"
        )
        self.transcription.save()

        campaign = asset.item.project.campaign
        campaign.card_family = create_card_family()
        campaign.save()
        guide_title = "Transcription: Basic Rules"
        create_guide(title=guide_title)

        tag_collection = create_tag_collection(asset=asset)

        def get_detail(slug):
            # GET the detail page of the asset with ``slug`` within this
            # asset's campaign, project and item.
            return self.client.get(
                reverse(
                    "transcriptions:asset-detail",
                    kwargs={
                        "campaign_slug": asset.item.project.campaign.slug,
                        "project_slug": asset.item.project.slug,
                        "item_id": asset.item.item_id,
                        "slug": slug,
                    },
                )
            )

        response = get_detail(asset.slug)
        self.assertEqual(response.status_code, 200)
        context = response.context
        self.assertIn("cards", context)
        self.assertIn("guides", context)
        self.assertEqual(guide_title, context["guides"][0]["title"])
        self.assertIn("tags", context)
        self.assertEqual([tag_collection.tags.all()[0].value], context["tags"])

        # Next and previous asset checks
        previous_asset = create_asset(
            item=asset.item, slug="previous-asset", sequence=1
        )
        next_asset = create_asset(item=asset.item, slug="next-asset", sequence=1000)
        response = get_detail(asset.slug)
        self.assertEqual(response.status_code, 200)
        for context_key, neighbour in (
            ("previous_asset_url", previous_asset),
            ("next_asset_url", next_asset),
        ):
            self.assertIn(context_key, response.context)
            self.assertEqual(
                neighbour.get_absolute_url(), response.context[context_key]
            )

        # Download URL iiif check
        asset.download_url = "http://tile.loc.gov/image-services/iiif/service:music:mussuffrage:mussuffrage-100183:mussuffrage-100183.0001/full/pct:100/0/default.jpg"
        asset.save()
        response = get_detail(asset.slug)
        self.assertEqual(response.status_code, 200)
        self.assertIn("thumbnail_url", response.context)
        self.assertEqual(
            "https://tile.loc.gov/image-services/iiif/service:music:mussuffrage:mussuffrage-100183:mussuffrage-100183.0001/full/!512,512/0/default.jpg",
            response.context["thumbnail_url"],
        )

        # Non-existent asset in an existing campaign
        response = get_detail("bad-slug")
        self.assertRedirects(
            response,
            reverse(
                "transcriptions:campaign-detail",
                args=(asset.item.project.campaign.slug,),
            ),
        )

    @patch.object(Asset, "get_ocr_transcript")
    def test_generate_ocr_transcription(self, mock):
        """
        Exercise the generate-ocr-transcription endpoint with
        ``Asset.get_ocr_transcript`` mocked out: anonymous and logged-in
        POSTs, an explicit language, and both outcomes of the patched
        ``get_transcription_superseded`` helper.
        """
        first_asset = create_asset(storage_image="tests/test-european.jpg")
        first_url = reverse(
            "generate-ocr-transcription", kwargs={"asset_pk": first_asset.pk}
        )

        # Anonymous user test; should redirect without calling the OCR method
        anonymous_response = self.client.post(first_url)
        self.assertEqual(302, anonymous_response.status_code)
        self.assertFalse(mock.called)
        mock.reset_mock()

        # Logged-in user, no language supplied
        self.login_user()
        logged_in_response = self.client.post(first_url)
        self.assertEqual(201, logged_in_response.status_code)
        self.assertTrue(mock.called)
        mock.reset_mock()

        # Second asset on the same item, with an explicit language
        second_asset = create_asset(
            item=first_asset.item,
            slug="test-asset-2",
            storage_image="tests/test-european.jpg",
        )
        second_url = reverse(
            "generate-ocr-transcription", kwargs={"asset_pk": second_asset.pk}
        )
        language_response = self.client.post(second_url, data={"language": "spa"})
        self.assertEqual(201, language_response.status_code)
        mock.assert_called_with("spa")
        mock.reset_mock()

        with patch(
            "concordia.views.ajax.get_transcription_superseded"
        ) as superseded_mock:
            # Test case if the transcription being replaced has already been
            # superseded
            superseded_mock.return_value = HttpResponse(status=409)
            conflict_response = self.client.post(second_url)
            self.assertEqual(409, conflict_response.status_code)
            self.assertTrue(superseded_mock.called)
            self.assertFalse(mock.called)

            # Test case if the transcription being replaced hasn't been superseded
            superseded_mock.reset_mock()
            superseded_mock.return_value = create_transcription(
                asset=second_asset, user=get_anonymous_user(), submitted=now()
            )
            created_response = self.client.post(second_url)
            self.assertEqual(201, created_response.status_code)
            self.assertTrue(superseded_mock.called)
            self.assertTrue(mock.called)

    def test_project_detail_view(self):
        """
        Test GET on the project detail view, with and without query
        parameters, plus the redirect for an unknown project slug
        """
        project = create_project()
        campaign_slug = project.campaign.slug
        detail_url = reverse(
            "transcriptions:project-detail", args=(campaign_slug, project.slug)
        )

        # A plain request, the reviewable filter, and a bad status parameter
        # are each expected to render the project detail template
        query_variants = (
            None,
            {"filter_by_reviewable": True},
            {"transcription_status": "bad_parameter"},
        )
        for query in query_variants:
            response = self.client.get(detail_url, query)
            self.assertEqual(response.status_code, 200)
            self.assertTemplateUsed(
                response, template_name="transcriptions/project_detail.html"
            )

        # Non-existent project in an existing campaign
        missing_project_url = reverse(
            "transcriptions:project-detail", args=(campaign_slug, "bad-slug")
        )
        response = self.client.get(missing_project_url)
        self.assertRedirects(
            response,
            reverse("transcriptions:campaign-detail", args=(campaign_slug,)),
        )

    def test_project_unicode_slug(self):
        """Project URLs must work when the slug contains Unicode characters"""
        unicode_project = create_project(title="你好 World")
        self.assertEqual(unicode_project.slug, "你好-world")

        detail_response = self.client.get(unicode_project.get_absolute_url())
        self.assertEqual(detail_response.status_code, 200)

    def test_campaign_report(self):
        """
        Test the campaign report view, including a non-integer and an
        out-of-range page parameter
        """
        item = create_item()
        campaign = item.project.campaign
        # Ten assets under one item so the reported total can be checked
        for sequence in range(1, 11):
            create_asset(item=item, sequence=sequence, slug=f"test-{sequence}")

        report_url = reverse(
            "transcriptions:campaign-report",
            kwargs={"campaign_slug": campaign.slug},
        )

        response = self.client.get(report_url)
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, "transcriptions/campaign_report.html")

        context = response.context
        self.assertEqual(context["title"], campaign.title)
        self.assertEqual(context["total_asset_count"], 10)

        # Both a non-integer page and a page far past the end are expected to
        # land on the first page of projects
        for page in ("not-an-int", 10000):
            response = self.client.get(report_url, {"page": page})
            context = response.context

            self.assertEqual(response.status_code, 200)
            self.assertTemplateUsed(response, "transcriptions/campaign_report.html")
            self.assertEqual(context["projects"].number, 1)


class UserCacheControlTest(CreateTestUsers, TestCase):
    """
    Tests for the user_cache_control decorator
    """

    def setUp(self):
        self.user = self.create_user("testuser")
        self.factory = RequestFactory()

    def test_vary_on_cookie(self):
        """A view wrapped with user_cache_control still returns a 200 response"""

        def plain_view(request):
            return HttpResponse()

        decorate = method_decorator(user_cache_control, name="dispatch")
        decorated_view = decorate(plain_view)

        get_request = self.factory.get("/rand")
        get_request.user = self.user
        # The wrapped callable is invoked method-style, so a placeholder is
        # passed in the leading (self) position
        result = decorated_view(None, get_request)
        self.assertEqual(result.status_code, 200)


class FilteredCampaignDetailViewTests(CreateTestUsers, TestCase):
    """Context checks for the filtered campaign detail view"""

    def test_get_context_data(self):
        """filter_by_reviewable is falsy for a non-staff user, truthy for staff"""
        campaign = create_campaign()
        url_kwargs = {"slug": campaign.slug}
        url = reverse("transcriptions:filtered-campaign-detail", kwargs=url_kwargs)

        # Non-staff user
        self.login_user(is_staff=False)
        regular_context = self.client.get(url, url_kwargs).context
        self.assertFalse(regular_context.get("filter_by_reviewable", False))
        self.logout_user()

        # Staff user
        self.user = self.create_staff_user()
        self.login_user()
        staff_context = self.client.get(url, url_kwargs).context
        self.assertTrue(staff_context.get("filter_by_reviewable"))


class FilteredProjectDetailViewTests(CreateTestUsers, TestCase):
    """Tests for FilteredProjectDetailView's queryset and context data"""

    def setUp(self):
        project = create_project()
        self.project = project
        self.kwargs = {
            "campaign_slug": project.campaign.slug,
            "slug": project.slug,
        }
        self.url = reverse("transcriptions:filtered-project-detail", kwargs=self.kwargs)
        self.login_user()

    def tearDown(self):
        # Connect the Transcription post_save handler again after each test
        post_save.connect(on_transcription_save, sender=Transcription)

    def test_get_context_data(self):
        context = self.client.get(self.url, self.kwargs).context
        self.assertTrue(context.get("filter_by_reviewable"))

    def test_get_queryset(self):
        # Item in the project under test; its asset has a transcription
        # submitted by the anonymous user
        expected_item = create_item(project=self.project, item_id="testitem.012345679")
        create_transcription(
            asset=create_asset(item=expected_item),
            user=get_anonymous_user(),
            submitted=now(),
        )

        # Item in a second project of the same campaign; its asset has a
        # transcription submitted by the logged-in user
        other_project = create_project(
            slug="project-two", campaign=self.project.campaign
        )
        excluded_item = create_item(project=other_project)
        create_transcription(
            asset=create_asset(item=excluded_item),
            user=self.user,
            submitted=now(),
        )

        request = RequestFactory().get(self.url, self.kwargs)
        request.user = self.user
        view = FilteredProjectDetailView()
        view.kwargs = self.kwargs
        view.request = request

        items = view.get_queryset()
        self.assertIn(expected_item, items)
        self.assertNotIn(excluded_item, items)


class FilteredItemDetailViewTests(CreateTestUsers, TestCase):
    """Tests for FilteredItemDetailView's queryset and context data"""

    def setUp(self):
        item = create_item()
        self.item = item
        self.kwargs = {
            "campaign_slug": item.project.campaign.slug,
            "project_slug": item.project.slug,
            "item_id": item.item_id,
        }
        self.url = reverse("transcriptions:filtered-item-detail", kwargs=self.kwargs)
        self.login_user()

    def tearDown(self):
        # Connect the Transcription post_save handler again after each test
        post_save.connect(on_transcription_save, sender=Transcription)

    def test_get_context_data(self):
        context = self.client.get(self.url, self.kwargs).context
        self.assertTrue(context.get("filter_by_reviewable"))

    def test_get_queryset(self):
        # Asset whose transcription was submitted by the anonymous user
        expected_asset = create_asset(item=self.item)
        create_transcription(
            asset=expected_asset, user=get_anonymous_user(), submitted=now()
        )

        # Asset whose transcription was submitted by the logged-in user
        excluded_asset = create_asset(item=self.item, slug="asset-two")
        create_transcription(asset=excluded_asset, user=self.user, submitted=now())

        request = RequestFactory().get(self.url, self.kwargs)
        request.user = self.user
        view = FilteredItemDetailView()
        view.kwargs = self.kwargs
        view.request = request

        assets = view.get_queryset()
        self.assertIn(expected_asset, assets)
        self.assertNotIn(excluded_asset, assets)


class RateLimitTests(CreateTestUsers, TestCase):
    """Tests for the rate helpers and the rate-limited (429) response view"""

    def setUp(self):
        self.request_factory = RequestFactory()
        self.user = self.create_user("test-user")

    def test_registration_rate(self):
        """registration_rate returns "10/h" normally and None with the form patched"""
        request = self.request_factory.get("/")
        self.assertEqual(registration_rate(None, request), "10/h")
        with patch("concordia.views.accounts.UserRegistrationForm", autospec=True):
            # This causes the form to test as valid even though there's no data
            self.assertIsNone(registration_rate(None, request))

    def test_ratelimit_view(self):
        """ratelimit_view answers 429 with a non-zero Retry-After header"""
        request = self.request_factory.post("/")
        exception = Exception()
        response = ratelimit_view(request, exception)
        self.assertEqual(response.status_code, 429)
        # Header values read back from a response are strings, so the
        # comparison has to be against "0"; comparing with the integer 0
        # could never fail.
        self.assertNotEqual(response["Retry-After"], "0")

    def test_reserve_rate(self):
        """reserve_rate returns "100/m" for anonymous users and None otherwise"""
        request = self.request_factory.post("/")

        request.user = AnonymousUser()
        self.assertEqual("100/m", reserve_rate("test.group", request))

        request.user = self.user
        self.assertIsNone(reserve_rate("test.group", request))


class LoginTests(TestCase, CreateTestUsers):
    """Login view behaviour with Turnstile validation failing and passing"""

    def setUp(self):
        self.user = self.create_user("test-user")

    def test_ConcordiaLoginView(self):
        login_url = reverse("registration_login")
        credentials = {
            "username": self.user.username,
            "password": self.user._password,
        }
        turnstile_validate = "concordia.turnstile.fields.TurnstileField.validate"

        # Turnstile validation raises: the user must stay unauthenticated
        turnstile_error = forms.ValidationError(
            "Testing error", code="invalid_turnstile"
        )
        with patch(turnstile_validate, side_effect=turnstile_error):
            failed_response = self.client.post(login_url, data=credentials)
        self.assertIn("user", failed_response.context)
        self.assertFalse(failed_response.context["user"].is_authenticated)

        # Turnstile validation passes: login redirects to the homepage
        with patch(turnstile_validate, return_value=True):
            successful_response = self.client.post(
                login_url, data=credentials, follow=True
            )
        self.assertRedirects(
            successful_response,
            expected_url=reverse("homepage"),
            target_status_code=200,
        )
        self.assertIn("user", successful_response.context)
        self.assertTrue(successful_response.context["user"].is_authenticated)


class TranscriptionViewTests(CreateTestUsers, TestCase):
    """Tests for the rollback-transcription and rollforward-transcription views"""

    def setUp(self):
        self.asset = create_asset()

    def _assert_error_response(self, response):
        """Assert a 400 response whose JSON body contains an "error" key."""
        self.assertEqual(400, response.status_code)
        self.assertIn("error", response.json())

    def _assert_transcription_response(
        self, response, text, undo_available, redo_available
    ):
        """
        Assert a 201 response whose JSON body has an "id" plus the expected
        "text", "undo_available" and "redo_available" values.
        """
        self.assertEqual(201, response.status_code)
        response_json = response.json()
        self.assertIn("id", response_json)
        self.assertIn("text", response_json)
        self.assertEqual(response_json["text"], text)
        self.assertIn("undo_available", response_json)
        self.assertEqual(response_json["undo_available"], undo_available)
        self.assertIn("redo_available", response_json)
        self.assertEqual(response_json["redo_available"], redo_available)

    def test_rollback_transcription(self):
        path = reverse("rollback-transcription", args=[self.asset.id])
        self.login_user()

        # Test rollback when there are no transcriptions
        self._assert_error_response(self.client.post(path))

        transcription1 = create_transcription(
            asset=self.asset, text="Test transcription 1"
        )
        user = transcription1.user

        # Test rollback when there are no transcriptions to rollback to
        self._assert_error_response(self.client.post(path))

        # Test successful rollback
        create_transcription(asset=self.asset, user=user, text="Test transcription 2")
        response = self.client.post(path)
        self._assert_transcription_response(
            response, transcription1.text, undo_available=False, redo_available=True
        )

        # Test after a rollforward
        self.asset.rollforward_transcription(user)
        response = self.client.post(path)
        self._assert_transcription_response(
            response, transcription1.text, undo_available=False, redo_available=True
        )

        # Test anonymous user
        self.client.logout()
        create_transcription(asset=self.asset, user=user, text="Test transcription 3")
        with patch(
            "concordia.turnstile.fields.TurnstileField.validate", return_value=True
        ):
            response = self.client.post(path)
        self._assert_transcription_response(
            response, transcription1.text, undo_available=False, redo_available=True
        )

    def test_rollforward_transcription(self):
        path = reverse("rollforward-transcription", args=[self.asset.id])
        self.login_user()

        # Test rollforward when there are no transcriptions
        self._assert_error_response(self.client.post(path))

        transcription1 = create_transcription(
            asset=self.asset, text="Test transcription 1"
        )
        user = transcription1.user

        # Test rollforward when there are no transcriptions to rollforward to
        self._assert_error_response(self.client.post(path))

        # Test successful rollforward, which requires a rollback first
        transcription2 = create_transcription(
            asset=self.asset, user=user, text="Test transcription 2"
        )
        self.asset.rollback_transcription(user)
        response = self.client.post(path)
        self._assert_transcription_response(
            response, transcription2.text, undo_available=True, redo_available=False
        )

        # Test after rolling back then creating a new transcription
        self.asset.rollback_transcription(user)
        create_transcription(asset=self.asset, user=user, text="Test transcription 3")
        self._assert_error_response(self.client.post(path))

        # Test anonymous user after a rollback
        self.client.logout()
        transcription3 = create_transcription(
            asset=self.asset, user=user, text="Test transcription 3"
        )
        self.asset.rollback_transcription(user)
        with patch(
            "concordia.turnstile.fields.TurnstileField.validate", return_value=True
        ):
            response = self.client.post(path)
        self._assert_transcription_response(
            response, transcription3.text, undo_available=True, redo_available=False
        )

    def tearDown(self):
        # Connect the Transcription post_save handler again after each test
        post_save.connect(on_transcription_save, sender=Transcription)


@override_settings(
    CACHES={
        "visualization_cache": {
            "BACKEND": "django.core.cache.backends.locmem.LocMemCache",
        }
    }
)
class VisualizationDataViewTests(TestCase):
    """Tests for VisualizationDataView backed by a local-memory cache"""

    def setUp(self):
        self.factory = RequestFactory()
        self.cache = caches["visualization_cache"]
        # Point the view at the test cache for the duration of one test only.
        # patch.object puts the previous class attribute back (or removes it
        # if there was none) on cleanup, so the test cache does not leak into
        # tests that run afterwards.
        cache_patcher = patch.object(
            VisualizationDataView, "cache", self.cache, create=True
        )
        cache_patcher.start()
        self.addCleanup(cache_patcher.stop)
        self.cache.clear()
        self.view = VisualizationDataView.as_view()

    def test_get_missing_data_returns_404(self):
        # If no entry exists in the cache under the given name,
        # the view should return a 404 with a JSON error message.
        request = self.factory.get("/visualizations/data/missing-key/")
        response = self.view(request, name="missing-key")
        self.assertEqual(response.status_code, 404)
        self.assertEqual(response["Content-Type"], "application/json")
        data = json.loads(response.content)
        self.assertEqual(
            data, {"error": "No visualization data found for 'missing-key'"}
        )

    def test_get_existing_data_returns_200_and_json(self):
        # When the cache contains data for the given name,
        # the view should return it as JSON with status 200.
        sample_data = {"foo": "bar", "numbers": [1, 2, 3]}
        self.cache.set("sample-key", sample_data)
        request = self.factory.get("/visualizations/data/sample-key/")
        response = self.view(request, name="sample-key")
        self.assertEqual(response.status_code, 200)
        self.assertEqual(response["Content-Type"], "application/json")
        data = json.loads(response.content)
        self.assertEqual(data, sample_data)


================================================
FILE: concordia/tests/test_views_asset_reservation.py
================================================
from datetime import timedelta

from django.conf import settings
from django.contrib.auth.models import User
from django.db.models.signals import post_save
from django.test import (
    RequestFactory,
    TransactionTestCase,
    override_settings,
)
from django.urls import reverse
from django.utils.timezone import now

from concordia.models import (
    AssetTranscriptionReservation,
    Transcription,
)
from concordia.signals.handlers import on_transcription_save
from concordia.tasks.reservations import (
    delete_old_tombstoned_reservations,
    expire_inactive_asset_reservations,
    tombstone_old_active_asset_reservations,
)
from concordia.utils import get_anonymous_user, get_or_create_reservation_token

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class AssetReservationViewTests(CreateTestUsers, JSONAssertMixin, TransactionTestCase):
    """
    Tests for the "reserve-asset" view: acquiring, refreshing and releasing
    reservations, competing users, expiration and tombstoning.

    Most tests pin the exact number of database queries per request, so the
    expected counts vary with the session engine and with whether the
    request is anonymous.
    """

    def test_asset_reservation(self):
        """
        Test the basic Asset reservation process
        """

        self.login_user()
        self._asset_reservation_test_payload(self.user.pk)

    def test_asset_reservation_anonymously(self):
        """
        Test the basic Asset reservation process as an anonymous user
        """

        anon_user = get_anonymous_user()
        self._asset_reservation_test_payload(anon_user.pk, anonymous=True)

    def _asset_reservation_test_payload(self, user_id, anonymous=False):
        """
        Shared acquire / refresh / release scenario for a new asset.

        user_id: primary key of the acting user; not referenced by the body
            of this helper.
        anonymous: whether the requests are made without a logged-in user,
            which changes the expected query counts.
        """
        asset = create_asset()

        # Acquire the reservation: 1 acquire
        # + 1 reservation check
        # + 1 logging if not anonymous
        # + 1 session if not anonymous and using a database session engine:
        expected_update_queries = 2
        if not anonymous:
            expected_update_queries += 1  # Added by django-structlog middleware
            if settings.SESSION_ENGINE.endswith("db"):
                expected_update_queries += 1  # Added by database session engine
            # We don't need to add an extra query for accessing request.user
            # because the django-structlog middleware will do that for non-anonymous
            expected_acquire_queries = expected_update_queries
        else:
            # Anonymous acquisition is expected to take one query more than
            # an anonymous update
            expected_acquire_queries = expected_update_queries + 1

        with self.assertNumQueries(expected_acquire_queries):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))
        data = self.assertValidJSON(resp, expected_status=200)

        reservation = AssetTranscriptionReservation.objects.get()
        self.assertEqual(reservation.reservation_token, data["reservation_token"])
        self.assertEqual(reservation.asset, asset)

        # Confirm that an update did not change the pk when it updated the timestamp:

        with self.assertNumQueries(expected_update_queries):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertEqual(1, AssetTranscriptionReservation.objects.count())
        updated_reservation = AssetTranscriptionReservation.objects.get()
        self.assertEqual(
            updated_reservation.reservation_token, data["reservation_token"]
        )
        self.assertEqual(updated_reservation.asset, asset)
        self.assertEqual(reservation.created_on, updated_reservation.created_on)
        self.assertLess(reservation.created_on, updated_reservation.updated_on)

        # Release the reservation now that we're done:
        # 1 release
        # + 1 logging if not anonymous
        # + 1 session if not anonymous and using a database
        expected_release_queries = 1
        if not anonymous:
            expected_release_queries += 1  # Added by django-structlog middleware
            if settings.SESSION_ENGINE.endswith("db"):
                expected_release_queries += 1

        with self.assertNumQueries(expected_release_queries):
            resp = self.client.post(
                reverse("reserve-asset", args=(asset.pk,)), data={"release": True}
            )
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertEqual(
            updated_reservation.reservation_token, data["reservation_token"]
        )

        self.assertEqual(0, AssetTranscriptionReservation.objects.count())

    def test_asset_reservation_competition(self):
        """
        Confirm that two users cannot reserve the same asset at the same time
        """

        asset = create_asset()

        # We'll reserve the test asset as the anonymous user and then attempt
        # to edit it after logging in

        # 6 queries =
        # 1 expiry + 1 acquire + 2 get user ID + 2 get user profile from request
        with self.assertNumQueries(6):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))
        self.assertEqual(200, resp.status_code)
        self.assertEqual(1, AssetTranscriptionReservation.objects.count())

        # Clear the login session so the reservation_token will be regenerated:
        self.client.logout()
        self.login_user()

        # 1 session check + 1 acquire + get user ID from request
        with self.assertNumQueries(3 if settings.SESSION_ENGINE.endswith("db") else 2):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))
        self.assertEqual(409, resp.status_code)
        self.assertEqual(1, AssetTranscriptionReservation.objects.count())

    def test_asset_reservation_expiration(self):
        """
        Simulate an expired reservation which should not cause the request to fail
        """
        asset = create_asset()

        stale_reservation = AssetTranscriptionReservation(  # nosec
            asset=asset, reservation_token="stale"
        )
        stale_reservation.full_clean()
        stale_reservation.save()
        # Backdate the object as if it happened 31 minutes ago:
        old_timestamp = now() - timedelta(minutes=31)
        AssetTranscriptionReservation.objects.update(
            created_on=old_timestamp, updated_on=old_timestamp
        )

        expire_inactive_asset_reservations()

        self.login_user()

        # 1 reservation check + 1 acquire + 1 get user ID from request
        expected_queries = 3
        if settings.SESSION_ENGINE.endswith("db"):
            # 1 session check
            expected_queries += 1

        with self.assertNumQueries(expected_queries):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))

        data = self.assertValidJSON(resp, expected_status=200)
        self.assertEqual(1, AssetTranscriptionReservation.objects.count())
        reservation = AssetTranscriptionReservation.objects.get()
        self.assertEqual(reservation.reservation_token, data["reservation_token"])

    def test_asset_reservation_tombstone(self):
        """
        Simulate a tombstoned reservation which should:
            - return 408 during the tombstone period
            - during the tombstone period, another user may
              obtain the reservation but the original user may not
        """
        asset = create_asset()
        self.login_user()
        # Generate a reservation token from a throwaway request and store it
        # in the test client's session so later requests present that token
        request_factory = RequestFactory()
        request = request_factory.get("/")
        request.session = {}
        reservation_token = get_or_create_reservation_token(request)

        session = self.client.session
        session["reservation_token"] = reservation_token
        session.save()

        tombstone_reservation = AssetTranscriptionReservation(  # nosec
            asset=asset, reservation_token=reservation_token
        )
        tombstone_reservation.full_clean()
        tombstone_reservation.save()
        # Backdate the object as if it was created hours ago,
        # even if it was recently updated
        old_timestamp = now() - timedelta(
            hours=settings.TRANSCRIPTION_RESERVATION_TOMBSTONE_HOURS + 1
        )
        current_timestamp = now()
        AssetTranscriptionReservation.objects.update(
            created_on=old_timestamp, updated_on=current_timestamp
        )

        tombstone_old_active_asset_reservations()
        self.assertEqual(1, AssetTranscriptionReservation.objects.count())
        reservation = AssetTranscriptionReservation.objects.get()
        self.assertEqual(reservation.tombstoned, True)

        # 1 session check + 1 reservation check + 1 logging
        if settings.SESSION_ENGINE.endswith("db"):
            expected_queries = 3
        else:
            expected_queries = 2

        with self.assertNumQueries(expected_queries):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))

        self.assertEqual(resp.status_code, 408)
        self.assertEqual(1, AssetTranscriptionReservation.objects.count())
        reservation = AssetTranscriptionReservation.objects.get()
        self.assertEqual(reservation.reservation_token, reservation_token)

        self.client.logout()

        # 1 reservation check + 1 acquire + 1 get user ID
        expected_queries = 3
        if settings.SESSION_ENGINE.endswith("db"):
            # + 1 session check
            expected_queries += 1

        # Create the "anonymous" user outside the counted block
        # NOTE(review): presumably so the request does not have to create it
        # inside the query count - confirm against get_anonymous_user
        User.objects.create_user(username="anonymous")
        with self.assertNumQueries(expected_queries):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))

        self.assertValidJSON(resp, expected_status=200)
        self.assertEqual(2, AssetTranscriptionReservation.objects.count())

    def test_asset_reservation_tombstone_expiration(self):
        """
        Simulate a tombstoned reservation which should expire after
        the configured period of time, allowing the original user
        to reserve the asset again
        """
        asset = create_asset()
        self.login_user()
        # Generate a reservation token from a throwaway request and store it
        # in the test client's session so later requests present that token
        request_factory = RequestFactory()
        request = request_factory.get("/")
        request.session = {}
        reservation_token = get_or_create_reservation_token(request)

        session = self.client.session
        session["reservation_token"] = reservation_token
        session.save()

        tombstone_reservation = AssetTranscriptionReservation(  # nosec
            asset=asset, reservation_token=reservation_token
        )
        tombstone_reservation.full_clean()
        tombstone_reservation.save()
        # Backdate the object as if it was created hours ago
        # and tombstoned hours ago
        old_timestamp = now() - timedelta(
            hours=settings.TRANSCRIPTION_RESERVATION_TOMBSTONE_HOURS
            + settings.TRANSCRIPTION_RESERVATION_TOMBSTONE_LENGTH_HOURS
            + 1
        )
        not_as_old_timestamp = now() - timedelta(
            hours=settings.TRANSCRIPTION_RESERVATION_TOMBSTONE_LENGTH_HOURS + 1
        )
        AssetTranscriptionReservation.objects.update(
            created_on=old_timestamp, updated_on=not_as_old_timestamp, tombstoned=True
        )

        delete_old_tombstoned_reservations()
        self.assertEqual(0, AssetTranscriptionReservation.objects.count())

        # 1 session check + 1 reservation check + 1 acquire + 1 logging
        if settings.SESSION_ENGINE.endswith("db"):
            expected_queries = 4
        else:
            expected_queries = 3

        with self.assertNumQueries(expected_queries):
            resp = self.client.post(reverse("reserve-asset", args=(asset.pk,)))

        data = self.assertValidJSON(resp, expected_status=200)
        self.assertEqual(1, AssetTranscriptionReservation.objects.count())
        reservation = AssetTranscriptionReservation.objects.get()
        self.assertEqual(reservation.reservation_token, data["reservation_token"])
        self.assertEqual(reservation.tombstoned, False)

    def tearDown(self):
        # We'll test the signal handler separately
        post_save.connect(on_transcription_save, sender=Transcription)


================================================
FILE: concordia/tests/test_views_redirect_next_reviewable.py
================================================
from unittest.mock import patch

from django.db.models.signals import post_save
from django.test import (
    TransactionTestCase,
    override_settings,
)
from django.urls import reverse
from django.utils.timezone import now

from concordia.models import (
    Transcription,
)
from concordia.signals.handlers import on_transcription_save
from concordia.utils import get_anonymous_user

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_topic,
)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class NextReviewableRedirectViewTests(
    CreateTestUsers, JSONAssertMixin, TransactionTestCase
):
    """
    Tests for the views that redirect a visitor to the next reviewable asset.

    The site-wide redirect and its campaign- and topic-scoped variants are
    exercised for anonymous and logged-in users. Rate limiting is disabled
    and sessions are kept in the cache backend for every test.
    """

    @staticmethod
    def _submit_transcription(asset, user):
        """
        Validate and save a submitted transcription of ``asset`` by ``user``.

        Returns the saved ``Transcription`` instance.
        """
        transcription = Transcription(
            asset=asset, user=user, text="test", submitted=now()
        )
        transcription.full_clean()
        transcription.save()
        return transcription

    def test_find_next_reviewable_no_campaign(self):
        """Walk the site-wide redirect through its fallback scenarios."""
        next_reviewable_url = reverse("redirect-to-next-reviewable-asset")
        registered_user = self.create_user("test-user")
        anonymous_user = get_anonymous_user()

        # With no reviewable assets at all the visitor is sent to "/"
        resp = self.client.get(next_reviewable_url)
        self.assertRedirects(resp, expected_url="/")

        first_asset = create_asset(slug="test-asset-1", title="Test Asset 1")
        shared_item = first_asset.item
        second_asset = create_asset(
            item=shared_item, slug="test-asset-2", title="Test Asset 2"
        )
        third_asset = create_asset(
            item=shared_item, slug="test-asset-3", title="Test Asset 3"
        )
        campaign = shared_item.project.campaign

        self._submit_transcription(first_asset, registered_user)
        self._submit_transcription(second_asset, anonymous_user)
        self._submit_transcription(third_asset, anonymous_user)

        resp = self.client.get(next_reviewable_url)
        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

        # Logged-in user (login_user creates a new user here).
        # The first asset is no longer available because the request above
        # reserved it.
        self.login_user()
        resp = self.client.get(next_reviewable_url)
        self.assertRedirects(resp, expected_url=second_asset.get_absolute_url())

        # Configure the campaign to be the next review campaign for the
        # checks below
        campaign.next_review_campaign = True
        campaign.save()

        # The next reviewable campaign doesn't exist and there are no other
        # campaigns/assets
        with patch("concordia.models.Campaign.objects.get", side_effect=IndexError):
            resp = self.client.get(next_reviewable_url)
        self.assertRedirects(resp, expected_url="/")

        # A campaign is configured to be the default next reviewable one
        resp = self.client.get(next_reviewable_url)
        self.assertRedirects(resp, expected_url=third_asset.get_absolute_url())

        # The next reviewable campaign has no reviewable assets
        first_asset.delete()
        second_asset.delete()
        resp = self.client.get(next_reviewable_url)
        self.assertRedirects(resp, expected_url="/")

        # The next reviewable campaign has no reviewable assets, and other
        # campaigns exist but have no reviewable assets either
        create_campaign(slug="test-campaign-2")
        resp = self.client.get(next_reviewable_url)
        self.assertRedirects(resp, expected_url="/")

    def test_find_next_reviewable_campaign(self):
        """The campaign-scoped redirect serves assets of that campaign."""
        anonymous_user = get_anonymous_user()

        first_asset = create_asset(slug="test-review-asset-1", title="Test Asset 1")
        second_asset = create_asset(
            item=first_asset.item, slug="test-review-asset-2", title="Test Asset 2"
        )

        self._submit_transcription(first_asset, anonymous_user)
        self._submit_transcription(second_asset, anonymous_user)

        campaign = first_asset.item.project.campaign
        campaign_redirect_url = reverse(
            "transcriptions:redirect-to-next-reviewable-campaign-asset",
            kwargs={"campaign_slug": campaign.slug},
        )

        # Anonymous user
        resp = self.client.get(campaign_redirect_url)
        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

        # Authenticated user: the first asset is no longer available since
        # the previous request reserved it
        self.login_user()
        resp = self.client.get(campaign_redirect_url)
        self.assertRedirects(resp, expected_url=second_asset.get_absolute_url())

    def test_find_next_reviewable_topic(self):
        """The topic-scoped redirect serves assets belonging to that topic."""
        anonymous_user = get_anonymous_user()

        first_asset = create_asset(slug="test-review-asset-1")
        second_asset = create_asset(item=first_asset.item, slug="test-review-asset-2")
        topic = create_topic(project=first_asset.item.project)

        self._submit_transcription(first_asset, anonymous_user)
        self._submit_transcription(second_asset, anonymous_user)

        topic_redirect_url = reverse(
            "redirect-to-next-reviewable-topic-asset",
            kwargs={"topic_slug": topic.slug},
        )

        # Anonymous user
        resp = self.client.get(topic_redirect_url)
        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

        # Authenticated user.
        # We expect that the first asset is no longer available. Even though
        # anonymous users can't reserve assets for review, we still will
        # have removed the asset from the NextReviewableTopicAsset table
        # to ensure two users don't receive the same asset
        self.login_user()
        resp = self.client.get(topic_redirect_url)
        self.assertRedirects(resp, expected_url=second_asset.get_absolute_url())

    def test_find_next_reviewable_unlisted_campaign(self):
        """The campaign-scoped redirect also works for an unlisted campaign."""
        anonymous_user = get_anonymous_user()

        campaign = create_campaign(
            slug="campaign-transcribe-redirect-unlisted",
            title="Test Unlisted Review Redirect Campaign",
            unlisted=True,
        )
        project = create_project(
            title="Unlisted Project",
            slug="unlisted-project",
            campaign=campaign,
        )
        item = create_item(
            title="Unlisted Item",
            item_id="unlisted-item",
            item_url="https://blah.com/unlisted-item",
            project=project,
        )

        first_asset = create_asset(slug="test-asset-1", item=item)
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")

        self._submit_transcription(first_asset, anonymous_user)
        self._submit_transcription(second_asset, anonymous_user)

        resp = self.client.get(
            reverse(
                "transcriptions:redirect-to-next-reviewable-campaign-asset",
                kwargs={"campaign_slug": campaign.slug},
            )
        )

        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

    def tearDown(self):
        """Connect ``on_transcription_save`` to ``post_save`` after each test."""
        # The signal handler itself is covered by separate tests
        post_save.connect(receiver=on_transcription_save, sender=Transcription)


================================================
FILE: concordia/tests/test_views_redirect_next_transcribable.py
================================================
from unittest.mock import patch

from django.db.models.signals import post_save
from django.test import (
    TransactionTestCase,
    override_settings,
)
from django.urls import reverse

from concordia.models import (
    AssetTranscriptionReservation,
    Transcription,
    TranscriptionStatus,
)
from concordia.signals.handlers import on_transcription_save

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_topic,
)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class NextTranscribableRedirectViewTests(
    CreateTestUsers, JSONAssertMixin, TransactionTestCase
):
    """
    Tests for the views that redirect a visitor to the next transcribable asset.

    The site-wide redirect and its campaign- and topic-scoped variants are
    exercised, including the order in which candidate assets are selected.
    Rate limiting is disabled and sessions are kept in the cache backend.
    """

    @staticmethod
    def _campaign_redirect_url(campaign):
        """Return the campaign-scoped next-transcribable URL for ``campaign``."""
        return reverse(
            "transcriptions:redirect-to-next-transcribable-campaign-asset",
            kwargs={"campaign_slug": campaign.slug},
        )

    def test_find_next_transcribable_no_campaign(self):
        """Walk the site-wide redirect through its fallback scenarios."""
        next_transcribable_url = reverse("redirect-to-next-transcribable-asset")

        # With no transcribable assets at all the visitor is sent to "/"
        resp = self.client.get(next_transcribable_url)
        self.assertRedirects(resp, expected_url="/")

        first_asset = create_asset(slug="test-asset-1")
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")
        campaign = first_asset.item.project.campaign

        resp = self.client.get(next_transcribable_url)
        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

        # Configure the next transcription campaign for the checks below
        campaign.next_transcription_campaign = True
        campaign.save()

        # The next transcribable campaign doesn't exist and there are no
        # other campaigns/assets
        with patch("concordia.models.Campaign.objects.get", side_effect=IndexError):
            resp = self.client.get(next_transcribable_url)
        self.assertRedirects(resp, expected_url="/")

        # A campaign is configured to be the default next transcribable one
        resp = self.client.get(next_transcribable_url)
        self.assertRedirects(resp, expected_url=second_asset.get_absolute_url())

        # The next transcribable campaign has no transcribable assets
        first_asset.delete()
        second_asset.delete()
        resp = self.client.get(next_transcribable_url)
        self.assertRedirects(resp, expected_url="/")

        # The next transcription campaign has no transcribable assets, and
        # other campaigns exist but have no transcribable assets either
        create_campaign(slug="test-campaign-2")
        resp = self.client.get(next_transcribable_url)
        self.assertRedirects(resp, expected_url="/")

    def test_find_next_transcribable_campaign(self):
        """The campaign-scoped redirect serves assets of that campaign."""
        first_asset = create_asset(slug="test-asset-1")
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")
        redirect_url = self._campaign_redirect_url(first_asset.item.project.campaign)

        # Anonymous user
        resp = self.client.get(redirect_url)
        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

        # Authenticated user
        self.login_user()
        resp = self.client.get(redirect_url)
        self.assertRedirects(resp, expected_url=second_asset.get_absolute_url())

    def test_find_next_transcribable_topic(self):
        """The topic-scoped redirect serves assets belonging to that topic."""
        first_asset = create_asset(slug="test-asset-1")
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")
        topic = create_topic(project=first_asset.item.project)
        redirect_url = reverse(
            "redirect-to-next-transcribable-topic-asset",
            kwargs={"topic_slug": topic.slug},
        )

        # Anonymous user
        resp = self.client.get(redirect_url)
        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

        # Authenticated user
        self.login_user()
        resp = self.client.get(redirect_url)
        self.assertRedirects(resp, expected_url=second_asset.get_absolute_url())

    def test_find_next_transcribable_unlisted_campaign(self):
        """The campaign-scoped redirect also works for an unlisted campaign."""
        campaign = create_campaign(
            slug="campaign-transcribe-redirect-unlisted",
            title="Test Unlisted Transcribe Redirect Campaign",
            unlisted=True,
        )
        project = create_project(
            title="Unlisted Project",
            slug="unlisted-project",
            campaign=campaign,
        )
        item = create_item(
            title="Unlisted Item",
            item_id="unlisted-item",
            item_url="https://blah.com/unlisted-item",
            project=project,
        )

        first_asset = create_asset(slug="test-asset-1", item=item)
        create_asset(item=first_asset.item, slug="test-asset-2")

        resp = self.client.get(self._campaign_redirect_url(campaign))

        self.assertRedirects(resp, expected_url=first_asset.get_absolute_url())

    def test_find_next_transcribable_single_asset(self):
        """A campaign with a single default asset redirects to that asset."""
        only_asset = create_asset()
        redirect_url = self._campaign_redirect_url(only_asset.item.project.campaign)

        resp = self.client.get(redirect_url)

        self.assertRedirects(resp, expected_url=only_asset.get_absolute_url())

    def test_find_next_transcribable_in_singleton_campaign(self):
        """If the only asset is already submitted, redirect to the homepage."""
        submitted_asset = create_asset(
            transcription_status=TranscriptionStatus.SUBMITTED
        )
        redirect_url = self._campaign_redirect_url(
            submitted_asset.item.project.campaign
        )

        resp = self.client.get(redirect_url)

        self.assertRedirects(resp, expected_url=reverse("homepage"))

    def test_find_next_transcribable_project_redirect(self):
        """Same as the singleton case, with a ``project`` query parameter."""
        submitted_asset = create_asset(
            transcription_status=TranscriptionStatus.SUBMITTED
        )
        project = submitted_asset.item.project
        base_url = self._campaign_redirect_url(project.campaign)

        resp = self.client.get("%s?project=%s" % (base_url, project.slug))

        self.assertRedirects(resp, expected_url=reverse("homepage"))

    def test_find_next_transcribable_hierarchy(self):
        """Confirm that find-next-page selects assets in the expected order"""

        start_asset = create_asset()
        item = start_asset.item
        project = item.project
        campaign = project.campaign

        asset_in_item = create_asset(item=item, slug="test-asset-in-same-item")
        in_progress_asset_in_item = create_asset(
            item=item,
            slug="inprogress-asset-in-same-item",
            transcription_status=TranscriptionStatus.IN_PROGRESS,
        )

        sibling_item = create_item(
            project=project, item_id="other-item-in-same-project"
        )
        asset_in_project = create_asset(
            item=sibling_item,
            title="test-asset-in-same-project",
        )

        other_project = create_project(campaign=campaign, title="other project")
        item_in_other_project = create_item(
            project=other_project,
            item_id="another-item-in-different-project",
            title="item in other project",
        )
        asset_in_campaign = create_asset(
            item=item_in_other_project,
            slug="test-asset-in-same-campaign",
        )

        # Now that we have test assets we'll see what find-next-page gives us as
        # successive test records are marked as submitted and thus ineligible.
        # The expected ordering is that it will favor moving forward (i.e. not
        # landing you on the same asset unless that's the only one available),
        # and will keep you closer to the asset you started from (i.e. within
        # the same item or project in that order).

        redirect_url = self._campaign_redirect_url(campaign)
        starting_point = {
            "project": project.slug,
            "item": item.item_id,
            "asset": start_asset.pk,
        }

        for expected_asset in (asset_in_item, asset_in_project, asset_in_campaign):
            self.assertRedirects(
                self.client.get(redirect_url, starting_point),
                expected_asset.get_absolute_url(),
            )

            # Take the asset just served out of the running and drop any
            # reservations before asking again
            expected_asset.transcription_status = TranscriptionStatus.SUBMITTED
            expected_asset.save()
            AssetTranscriptionReservation.objects.all().delete()

        # Only the in-progress asset in the starting item is left
        self.assertRedirects(
            self.client.get(redirect_url, starting_point),
            in_progress_asset_in_item.get_absolute_url(),
        )

    def tearDown(self):
        """Connect ``on_transcription_save`` to ``post_save`` after each test."""
        # The signal handler itself is covered by separate tests
        post_save.connect(receiver=on_transcription_save, sender=Transcription)


================================================
FILE: concordia/tests/test_views_tags.py
================================================
from unittest.mock import patch

from django import forms
from django.contrib.auth.models import User
from django.db.models.signals import post_save
from django.test import (
    TransactionTestCase,
    override_settings,
)
from django.urls import reverse

from concordia.models import (
    Transcription,
)
from concordia.signals.handlers import on_transcription_save

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class TagSubmissionViewTests(CreateTestUsers, JSONAssertMixin, TransactionTestCase):
    """
    Tests for the ``submit-tags`` view.

    Each test posts tag lists for an asset and checks the JSON response,
    which reports the posting user's tags (``user_tags``) and the tags of
    all users for that asset (``all_tags``).
    """

    def test_anonymous_tag_submission(self):
        """Confirm that anonymous users cannot submit tags"""
        asset = create_asset()
        submit_url = reverse("submit-tags", kwargs={"asset_pk": asset.pk})

        resp = self.client.post(submit_url, data={"tags": ["foo", "bar"]})
        self.assertRedirects(resp, "%s?next=%s" % (reverse("login"), submit_url))

    def test_tag_submission(self):
        """Confirm that a logged-in user's tags are stored and returned sorted"""
        asset = create_asset()

        self.login_user()

        test_tags = ["foo", "bar"]

        resp = self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": test_tags},
        )
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertIn("user_tags", data)
        self.assertIn("all_tags", data)

        self.assertEqual(sorted(test_tags), data["user_tags"])
        self.assertEqual(sorted(test_tags), data["all_tags"])

    def test_invalid_tag_submission(self):
        """Confirm that a tag failing validation yields a 400 with an error"""
        asset = create_asset()

        self.login_user()

        test_tags = ["foo", "bar"]

        # Force validation of every Tag to fail
        with patch("concordia.models.Tag.full_clean") as mock:
            mock.side_effect = forms.ValidationError("Testing error")
            resp = self.client.post(
                reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
                data={"tags": test_tags},
            )
            data = self.assertValidJSON(resp, expected_status=400)
            self.assertIn("error", data)

    def test_tag_submission_with_diacritics(self):
        """Confirm that tags containing accented characters are accepted"""
        asset = create_asset()

        self.login_user()

        test_tags = ["Café", "château", "señor", "façade"]

        resp = self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": test_tags},
        )
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertIn("user_tags", data)
        self.assertIn("all_tags", data)

        self.assertEqual(sorted(test_tags), data["user_tags"])
        self.assertEqual(sorted(test_tags), data["all_tags"])

    def test_tag_submission_with_multiple_users(self):
        """Confirm that two users can submit the same tags for one asset"""
        asset = create_asset()
        submit_url = reverse("submit-tags", kwargs={"asset_pk": asset.pk})
        test_tags = ["foo", "bar"]

        # First user
        self.login_user()
        resp = self.client.post(submit_url, data={"tags": test_tags})
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertIn("user_tags", data)
        self.assertIn("all_tags", data)

        self.assertEqual(sorted(test_tags), data["user_tags"])
        self.assertEqual(sorted(test_tags), data["all_tags"])

        # Second user submits the very same tags
        self.client.logout()
        second_user = self.create_test_user("second_user")
        self.client.login(username=second_user.username, password=second_user._password)

        resp = self.client.post(submit_url, data={"tags": test_tags})
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertIn("user_tags", data)
        self.assertIn("all_tags", data)

        # The second user has their own collection, and shared values are
        # reported only once in the combined list
        self.assertEqual(sorted(test_tags), data["user_tags"])
        self.assertEqual(sorted(test_tags), data["all_tags"])
        self.assertEqual(asset.userassettagcollection_set.count(), 2)

    def test_duplicate_tag_submission(self):
        """Confirm that tag values cannot be duplicated"""
        asset = create_asset()

        self.login_user()

        resp = self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": ["foo", "bar", "baaz"]},
        )
        self.assertValidJSON(resp, expected_status=200)

        second_user = self.create_test_user(
            username="second_tester", email="second_tester@example.com"
        )
        self.client.login(username=second_user.username, password=second_user._password)

        resp = self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": ["foo", "bar", "quux"]},
        )
        data = self.assertValidJSON(resp, expected_status=200)

        # The second user re-submitted values ("foo" and "bar") that the
        # first user had already stored; each value is still reported once:
        self.assertEqual(["bar", "foo", "quux"], data["user_tags"])
        # Users are allowed to delete other users' tags, so since the second
        # user didn't send the "baaz" tag, it was removed
        self.assertEqual(["bar", "foo", "quux"], data["all_tags"])

    def test_tag_deletion(self):
        """Confirm that a tag omitted from a later submission is removed"""
        asset = create_asset()
        self.login_user()

        initial_tags = ["foo", "bar"]
        self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": initial_tags},
        )
        updated_tags = [
            "foo",
        ]
        resp = self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": updated_tags},
        )
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertIn("user_tags", data)
        self.assertIn("all_tags", data)

        self.assertCountEqual(updated_tags, data["user_tags"])
        self.assertCountEqual(updated_tags, data["all_tags"])

    def test_tag_deletion_with_multiple_users(self):
        """Confirm that each user gets a collection when tags are pruned"""
        asset = create_asset()
        self.login_user("first_user")
        initial_tags = ["foo", "bar"]
        resp = self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": initial_tags},
        )
        self.assertIn(
            "first_user",
            asset.userassettagcollection_set.values_list("user__username", flat=True),
        )
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertIn("user_tags", data)
        self.assertIn("all_tags", data)
        self.assertCountEqual(initial_tags, data["user_tags"])
        self.assertCountEqual(initial_tags, data["all_tags"])

        self.client.logout()

        second_user = self.create_test_user("second_user")
        self.client.login(username=second_user.username, password=second_user._password)
        updated_tags = [
            "foo",
        ]
        resp = self.client.post(
            reverse("submit-tags", kwargs={"asset_pk": asset.pk}),
            data={"tags": updated_tags},
        )
        data = self.assertValidJSON(resp, expected_status=200)

        self.assertIn(
            "second_user",
            asset.userassettagcollection_set.values_list("user__username", flat=True),
        )
        # Both users now own a tag collection for this asset
        self.assertEqual(asset.userassettagcollection_set.count(), 2)
        self.assertEqual(
            User.objects.filter(userassettagcollection__asset=asset).count(), 2
        )
        self.assertIn("user_tags", data)
        self.assertIn("all_tags", data)
        self.assertCountEqual(updated_tags, data["user_tags"])

    def tearDown(self):
        """Connect ``on_transcription_save`` to ``post_save`` after each test."""
        # We'll test the signal handler separately
        post_save.connect(on_transcription_save, sender=Transcription)


================================================
FILE: concordia/tests/test_views_topics.py
================================================
from django.core.cache import caches
from django.test import TestCase, override_settings
from django.urls import reverse

from concordia.models import ProjectTopic, TranscriptionStatus

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_topic,
)


@override_settings(
    RATELIMIT_ENABLE=False,
    SESSION_ENGINE="django.contrib.sessions.backends.cache",
    CACHES={
        "default": {"BACKEND": "django.core.cache.backends.dummy.DummyCache"},
        "view_cache": {"BACKEND": "django.core.cache.backends.dummy.DummyCache"},
    },
)
class TopicDetailViewTests(CreateTestUsers, JSONAssertMixin, TestCase):
    """
    Focused tests for the Topic detail view.

    The tests request the ``topic-detail`` URL and check the rendered project
    links and the ``sublevel_querystring`` context value for different
    combinations of the ``transcription_status`` query parameter and the
    per-project ``ProjectTopic.url_filter``.
    """

    TEMPLATE_NAME = "transcriptions/topic_detail.html"

    def setUp(self):
        self._clear_caches()

    def tearDown(self):
        self._clear_caches()

    # ------------------------------------------------------------------
    # Helpers
    # ------------------------------------------------------------------

    @staticmethod
    def _clear_caches():
        """Clear every cache returned by ``caches.all()``."""
        for cache in caches.all():
            cache.clear()

    @staticmethod
    def _create_filter_fixture():
        """
        Create a topic with two projects of one campaign attached to it.

        The first project is linked with ``url_filter=SUBMITTED``, the second
        with ``url_filter=None``. No items or assets are created.

        Returns:
            tuple: ``(topic, campaign, project_with_filter,
            project_without_filter)``.
        """
        topic = create_topic(title="Filter Topic", slug="filter-topic")
        campaign = create_campaign(title="Filter Test Campaign", slug="filter-test")

        project_with_filter = create_project(
            campaign=campaign, title="Project With Filter", slug="with-filter"
        )
        project_without_filter = create_project(
            campaign=campaign, title="Project Without Filter", slug="without-filter"
        )

        ProjectTopic.objects.create(
            project=project_with_filter,
            topic=topic,
            url_filter=TranscriptionStatus.SUBMITTED,
        )
        ProjectTopic.objects.create(
            project=project_without_filter,
            topic=topic,
            url_filter=None,
        )
        return topic, campaign, project_with_filter, project_without_filter

    @staticmethod
    def _set_status(asset, status):
        """Persist ``status`` as the asset's ``transcription_status``."""
        asset.transcription_status = status
        asset.save(update_fields=["transcription_status"])

    @classmethod
    def _add_asset(cls, project, status=None):
        """
        Create one item with one asset in ``project`` and return the asset.

        When ``status`` is given, it is saved as the asset's
        ``transcription_status`` after creation.
        """
        asset = create_asset(item=create_item(project=project))
        if status is not None:
            cls._set_status(asset, status)
        return asset

    @staticmethod
    def _project_link(campaign, project, status=""):
        """
        Build the project URL fragment the tests look for in the response.

        With the default empty ``status`` the result ends in
        ``?transcription_status=``, which matches a link carrying any status.
        """
        return (
            f"/campaigns/{campaign.slug}/{project.slug}/"
            f"?transcription_status={status}"
        )

    def _get_topic(self, topic, params=None):
        """GET the detail page for ``topic`` with optional query ``params``."""
        return self.client.get(reverse("topic-detail", args=(topic.slug,)), params)

    def _assert_sublevel_querystring(self, response, expected):
        """Assert the context has ``sublevel_querystring`` equal to ``expected``."""
        self.assertIn("sublevel_querystring", response.context)
        self.assertEqual(response.context["sublevel_querystring"], expected)

    # ------------------------------------------------------------------
    # Tests
    # ------------------------------------------------------------------

    def test_topic_detail_basic(self):
        topic = create_topic(title="GET Topic", slug="get-topic")
        response = self._get_topic(topic)
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, template_name=self.TEMPLATE_NAME)
        self.assertContains(response, topic.title)

    def test_unlisted_topic_detail_view(self):
        topic = create_topic(
            title="GET Unlisted Topic", unlisted=True, slug="get-unlisted-topic"
        )

        response = self._get_topic(topic)

        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, template_name=self.TEMPLATE_NAME)
        self.assertContains(response, topic.title)

    def test_topic_detail_with_status_sets_querystring(self):
        """
        When a valid transcription_status is supplied, sublevel_querystring
        contains only that param.
        """
        topic = create_topic(title="GET Topic", slug="get-topic")
        response = self._get_topic(topic, {"transcription_status": "not_started"})
        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, template_name=self.TEMPLATE_NAME)
        self.assertContains(response, topic.title)
        self._assert_sublevel_querystring(
            response, "transcription_status=not_started"
        )

    def test_url_filter_links_without_sublevel_querystring(self):
        """
        With a project-level url_filter and no sublevel filter, links for that
        project include transcription_status=<url_filter>, while projects without
        a url_filter do not include a transcription_status param.
        """
        topic, campaign, with_filter, without_filter = self._create_filter_fixture()

        response = self._get_topic(topic)
        self.assertEqual(response.status_code, 200)

        # project_with_filter has ?transcription_status=submitted
        # (appears twice: image + title)
        self.assertContains(
            response, self._project_link(campaign, with_filter, "submitted"), count=2
        )
        # project_without_filter should not include any transcription_status param
        self.assertNotContains(
            response, self._project_link(campaign, without_filter)
        )

    def test_sublevel_querystring_only_keeps_transcription_status(self):
        """
        If extra params are provided along with transcription_status, only
        transcription_status is retained in sublevel_querystring.
        """
        topic = create_topic(title="GET Topic", slug="get-topic")
        response = self._get_topic(
            topic,
            {"transcription_status": "not_started", "another_param": "some_value"},
        )
        self.assertEqual(response.status_code, 200)
        self._assert_sublevel_querystring(
            response, "transcription_status=not_started"
        )

    def test_with_status_and_no_assets_excludes_projects(self):
        """
        When a transcription_status is present and projects have no assets,
        those projects are excluded (no links rendered).
        """
        topic, campaign, with_filter, without_filter = self._create_filter_fixture()

        response = self._get_topic(
            topic,
            {"transcription_status": "not_started", "another_param": "some_value"},
        )
        self.assertEqual(response.status_code, 200)
        self._assert_sublevel_querystring(
            response, "transcription_status=not_started"
        )

        # No assets exist, so neither project should appear with the filter applied
        for project in (with_filter, without_filter):
            self.assertNotContains(
                response, self._project_link(campaign, project, "not_started")
            )

    def test_with_status_and_assets_uses_sublevel_and_overrides_url_filter(self):
        """
        When assets exist and a transcription_status is supplied, projects with no
        url_filter are shown using the sublevel filter. Projects with a url_filter
        that does not match the sublevel filter are excluded.
        """
        topic, campaign, with_filter, without_filter = self._create_filter_fixture()

        # Add assets so eligible projects will display
        self._add_asset(with_filter)
        self._add_asset(without_filter)

        response = self._get_topic(
            topic,
            {"transcription_status": "not_started", "another_param": "some_value"},
        )
        self.assertEqual(response.status_code, 200)
        self._assert_sublevel_querystring(
            response, "transcription_status=not_started"
        )

        # Project WITH a mismatching url_filter should be excluded
        self.assertNotContains(
            response, self._project_link(campaign, with_filter, "not_started")
        )

        # Project WITHOUT a url_filter should use the sublevel filter
        # (appears twice: image + title)
        self.assertContains(
            response,
            self._project_link(campaign, without_filter, "not_started"),
            count=2,
        )

    def test_with_status_and_assets_includes_matching_url_filter(self):
        """
        When assets exist and a transcription_status is supplied, projects with a
        matching url_filter should be included, and links should use that status.
        """
        topic, campaign, with_filter, without_filter = self._create_filter_fixture()

        # Ensure both projects have at least one asset counted as "submitted"
        self._add_asset(with_filter, status=TranscriptionStatus.SUBMITTED)
        self._add_asset(without_filter, status=TranscriptionStatus.SUBMITTED)

        response = self._get_topic(topic, {"transcription_status": "submitted"})
        self.assertEqual(response.status_code, 200)
        self._assert_sublevel_querystring(response, "transcription_status=submitted")

        # Both the project WITH a matching url_filter and the project WITHOUT
        # a url_filter should be included (2 links each: image + title)
        for project in (with_filter, without_filter):
            self.assertContains(
                response,
                self._project_link(campaign, project, "submitted"),
                count=2,
            )

    def test_topic_detail_with_invalid_status_ignores_filter(self):
        """
        If transcription_status is present but invalid, the view should treat it
        as absent: no filtering by status and no sublevel_querystring.
        """
        topic, campaign, with_filter, without_filter = self._create_filter_fixture()

        # Make both projects eligible to display
        self._add_asset(with_filter)
        self._add_asset(without_filter)

        # Supply an invalid status
        response = self._get_topic(
            topic,
            {"transcription_status": "not-a-real-status", "another_param": "x"},
        )
        self.assertEqual(response.status_code, 200)

        # sublevel_querystring should be empty (invalid status ignored)
        self._assert_sublevel_querystring(response, "")

        # Project WITH a url_filter should use its own filter in links
        self.assertContains(
            response, self._project_link(campaign, with_filter, "submitted"), count=2
        )
        # Project WITHOUT a url_filter should not include a transcription_status param
        self.assertNotContains(
            response, self._project_link(campaign, without_filter)
        )

    def test_url_filter_empty_string_treated_as_missing(self):
        """
        A ProjectTopic whose url_filter is the empty string behaves like one
        whose url_filter is None, with and without a sublevel filter.
        """
        topic = create_topic(title="Filter Topic", slug="filter-topic")
        campaign = create_campaign(title="Filter Test Campaign", slug="filter-test")

        project_empty_filter = create_project(
            campaign=campaign, title="Project Empty Filter", slug="empty-filter"
        )
        project_none_filter = create_project(
            campaign=campaign, title="Project None Filter", slug="none-filter"
        )

        ProjectTopic.objects.create(
            project=project_empty_filter, topic=topic, url_filter=""
        )
        ProjectTopic.objects.create(
            project=project_none_filter, topic=topic, url_filter=None
        )
        projects = (project_empty_filter, project_none_filter)

        # Make both eligible
        assets = [self._add_asset(project) for project in projects]

        # no sublevel filter, so neither link should have transcription_status
        unfiltered = self._get_topic(topic)
        self.assertEqual(unfiltered.status_code, 200)
        for project in projects:
            self.assertNotContains(
                unfiltered, self._project_link(campaign, project)
            )

        # Set at least one asset to SUBMITTED for each project (so they are
        # not excluded)
        for asset in assets:
            self._set_status(asset, TranscriptionStatus.SUBMITTED)

        # valid sublevel filter, so both included and use that status in links
        filtered = self._get_topic(topic, {"transcription_status": "submitted"})
        self.assertEqual(filtered.status_code, 200)
        for project in projects:
            self.assertContains(
                filtered,
                self._project_link(campaign, project, "submitted"),
                count=2,
            )


================================================
FILE: concordia/tests/test_views_transcription_review.py
================================================
from django.core.cache import caches
from django.db.models.signals import post_save
from django.test import (
    TransactionTestCase,
    override_settings,
)
from django.urls import reverse
from django.utils.timezone import now

from concordia.models import (
    Asset,
    Transcription,
    TranscriptionStatus,
)
from concordia.signals.handlers import on_transcription_save
from concordia.utils import get_anonymous_user
from configuration.models import Configuration

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
    create_transcription,
)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class ReviewTranscriptionViewTests(
    CreateTestUsers, JSONAssertMixin, TransactionTestCase
):
    """
    Tests for the ``review-transcription`` endpoint.

    Each test posts an ``action`` for a transcription and checks the JSON
    response status, the transcription's accepted/rejected fields and, where
    relevant, the owning asset's ``transcription_status``.
    """

    # Value stored under the "review_rate_limit" configuration key by the
    # rate-limit tests; one more review than this is attempted.
    REVIEW_RATE_LIMIT = 4

    # ------------------------------------------------------------------
    # Helpers
    # ------------------------------------------------------------------

    @staticmethod
    def _clear_caches():
        """Clear every cache returned by ``caches.all()``."""
        for cache in caches.all():
            cache.clear()

    @staticmethod
    def _submit_transcription(asset, user, **extra_fields):
        """
        Create, validate and save a submitted transcription with text "test".

        ``extra_fields`` are passed through to the ``Transcription``
        constructor (for example ``supersedes``).
        """
        transcription = Transcription(
            asset=asset, user=user, text="test", submitted=now(), **extra_fields
        )
        transcription.full_clean()
        transcription.save()
        return transcription

    @staticmethod
    def _asset_status(asset):
        """Return the asset's ``transcription_status`` as stored in the database."""
        return Asset.objects.get(pk=asset.pk).transcription_status

    def _review(self, transcription, action, expected_status):
        """
        POST ``action`` to the review endpoint for ``transcription``.

        Asserts the response is valid JSON with ``expected_status`` and
        returns the decoded payload.
        """
        resp = self.client.post(
            reverse("review-transcription", args=(transcription.pk,)),
            data={"action": action},
        )
        return self.assertValidJSON(resp, expected_status=expected_status)

    @staticmethod
    def _configure_review_rate_limit(limit):
        """
        Store ``limit`` under ``review_rate_limit`` and make sure the related
        message configuration entries exist.

        The limit entry is created or overwritten; the message entries are
        only created when missing.
        """
        Configuration.objects.update_or_create(
            key="review_rate_limit",
            defaults={
                "value": str(limit),
                "data_type": Configuration.DataType.NUMBER,
            },
        )
        for key in (
            "review_rate_limit_popup_message",
            "review_rate_limit_popup_title",
            "review_rate_limit_banner_message",
        ):
            Configuration.objects.get_or_create(
                key=key,
                defaults={
                    "value": "Test message",
                    "data_type": Configuration.DataType.HTML,
                },
            )

    @staticmethod
    def _create_transcriptions(user, count):
        """
        Create ``count`` transcriptions by ``user``, each on its own asset.

        The first asset uses the ``create_asset`` defaults; the others share
        its item and get the slugs ``test-asset-2`` .. ``test-asset-<count>``.
        """
        first_asset = create_asset()
        transcriptions = [create_transcription(user=user, asset=first_asset)]
        for number in range(2, count + 1):
            extra_asset = create_asset(
                item=first_asset.item, slug=f"test-asset-{number}"
            )
            transcriptions.append(
                create_transcription(user=user, asset=extra_asset)
            )
        return transcriptions

    # ------------------------------------------------------------------
    # Tests
    # ------------------------------------------------------------------

    def test_transcription_review(self):
        asset = create_asset()

        anon = get_anonymous_user()

        t1 = self._submit_transcription(asset, anon)

        self.login_user()

        # An unknown action is rejected and leaves the transcription unreviewed
        data = self._review(t1, "foobar", expected_status=400)
        self.assertIn("error", data)

        self.assertEqual(
            1, Transcription.objects.filter(pk=t1.pk, accepted__isnull=True).count()
        )

        self._review(t1, "accept", expected_status=200)

        self.assertEqual(
            1, Transcription.objects.filter(pk=t1.pk, accepted__isnull=False).count()
        )

    def test_transcription_review_rate_limit(self):
        """
        With the limit configured, reviews up to the limit succeed and the
        next one is answered with a 429 JSON error.
        """
        self._clear_caches()
        anon = get_anonymous_user()
        self.login_user()
        self._configure_review_rate_limit(self.REVIEW_RATE_LIMIT)

        *within_limit, over_limit = self._create_transcriptions(
            anon, self.REVIEW_RATE_LIMIT + 1
        )

        for transcription in within_limit:
            self._review(transcription, "accept", expected_status=200)

        data = self._review(over_limit, "accept", expected_status=429)
        self.assertIn("error", data)

    def test_transcription_review_rate_limit_superuser(self):
        """
        A superuser can review more transcriptions than the configured limit.
        """
        self._clear_caches()
        anon = get_anonymous_user()
        self.user = self.create_super_user()
        self.login_user()
        self._configure_review_rate_limit(self.REVIEW_RATE_LIMIT)

        transcriptions = self._create_transcriptions(
            anon, self.REVIEW_RATE_LIMIT + 1
        )

        for transcription in transcriptions:
            self._review(transcription, "accept", expected_status=200)

    def test_transcription_review_asset_status_updates(self):
        """
        Confirm that the Asset.transcription_status field is correctly updated
        throughout the review process
        """
        asset = create_asset()

        anon = get_anonymous_user()

        # We should see NOT_STARTED only when no transcription records exist:
        self.assertEqual(asset.transcription_set.count(), 0)
        self.assertEqual(self._asset_status(asset), TranscriptionStatus.NOT_STARTED)

        t1 = self._submit_transcription(asset, anon)

        self.assertEqual(self._asset_status(asset), TranscriptionStatus.SUBMITTED)

        # "Login" so we can review the anonymous transcription:
        self.login_user()

        self.assertEqual(
            1, Transcription.objects.filter(pk=t1.pk, accepted__isnull=True).count()
        )

        self._review(t1, "reject", expected_status=200)

        # After rejecting a transcription, the asset status should be reset to
        # in-progress:
        self.assertEqual(
            1,
            Transcription.objects.filter(
                pk=t1.pk, accepted__isnull=True, rejected__isnull=False
            ).count(),
        )
        self.assertEqual(self._asset_status(asset), TranscriptionStatus.IN_PROGRESS)

        # We'll simulate a second attempt:
        t2 = self._submit_transcription(asset, anon, supersedes=t1)

        self.assertEqual(self._asset_status(asset), TranscriptionStatus.SUBMITTED)

        self._review(t2, "accept", expected_status=200)

        self.assertEqual(
            1, Transcription.objects.filter(pk=t2.pk, accepted__isnull=False).count()
        )
        self.assertEqual(self._asset_status(asset), TranscriptionStatus.COMPLETED)

    def test_transcription_disallow_self_review(self):
        asset = create_asset()

        self.login_user()

        t1 = self._submit_transcription(asset, self.user)

        data = self._review(t1, "accept", expected_status=400)
        self.assertIn("error", data)
        self.assertEqual("You cannot accept your own transcription", data["error"])

    def test_transcription_allow_self_reject(self):
        asset = create_asset()

        self.login_user()

        t1 = self._submit_transcription(asset, self.user)

        self._review(t1, "reject", expected_status=200)
        self.assertEqual(self._asset_status(asset), TranscriptionStatus.IN_PROGRESS)
        self.assertEqual(Transcription.objects.get(pk=t1.pk).reviewed_by, self.user)

    def test_transcription_double_review(self):
        asset = create_asset()

        anon = get_anonymous_user()

        t1 = self._submit_transcription(asset, anon)

        self.login_user()

        self._review(t1, "accept", expected_status=200)

        # A second review of the same transcription must be refused
        data = self._review(t1, "reject", expected_status=400)
        self.assertIn("error", data)
        self.assertEqual("This transcription has already been reviewed", data["error"])

    def tearDown(self):
        # We'll test the signal handler separately.
        # NOTE(review): nothing in this class disconnects the handler; this
        # connect call looks like a safeguard carried over from a class that
        # did -- confirm whether it is still needed.
        post_save.connect(on_transcription_save, sender=Transcription)


================================================
FILE: concordia/tests/test_views_transcription_save.py
================================================
import sys
from unittest.mock import patch

from django import forms
from django.db.models.signals import post_save
from django.test import (
    TransactionTestCase,
    override_settings,
)
from django.urls import reverse

from concordia.models import (
    Transcription,
)
from concordia.signals.handlers import on_transcription_save

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class SaveTranscriptionViewTests(CreateTestUsers, JSONAssertMixin, TransactionTestCase):
    """
    Tests for the ``save-transcription`` view.

    Every test posts to the view for the single asset created in ``setUp``.
    Except where a Turnstile failure is simulated on purpose, Turnstile
    validation is patched to pass so the view's own logic is what is tested.
    """

    # Dotted path of the Turnstile validation hook patched by these tests
    _TURNSTILE_VALIDATE = "concordia.turnstile.fields.TurnstileField.validate"

    def setUp(self):
        self.asset = create_asset()

    def _save_url(self):
        """Return the ``save-transcription`` URL for the test asset."""
        return reverse("save-transcription", args=(self.asset.pk,))

    def _save_transcription(self, **data):
        """
        POST ``data`` to the save view with Turnstile validation passing.

        Returns the test client's response.
        """
        with patch(self._TURNSTILE_VALIDATE, return_value=True):
            return self.client.post(self._save_url(), data=data)

    def _latest_transcription(self):
        """Return the test asset's transcription with the highest pk."""
        return self.asset.transcription_set.order_by("pk").last()

    def test_turnstile_validation_fails(self):
        # Test when Turnstile validation fails
        with patch(self._TURNSTILE_VALIDATE) as mock:
            mock.side_effect = forms.ValidationError(
                "Testing error", code="invalid_turnstile"
            )
            resp = self.client.post(self._save_url(), data={"text": "test"})
            data = self.assertValidJSON(resp, expected_status=401)
            self.assertIn("error", data)

    def test_initial_save_success(self):
        resp = self._save_transcription(text="test")
        data = self.assertValidJSON(resp, expected_status=201)
        self.assertIn("submissionUrl", data)

    def test_duplicate_without_supersedes_conflict(self):
        self._save_transcription(text="test")
        # Test attempts to create a second transcription without marking that it
        # supersedes the previous one:
        resp = self._save_transcription(text="test")
        data = self.assertValidJSON(resp, expected_status=409)
        self.assertIn("error", data)

    def test_save_with_url_error(self):
        self._save_transcription(text="test")
        # If a transcription contains a URL, it should return an error
        resp = self._save_transcription(
            text="http://example.com",
            supersedes=self.asset.transcription_set.get().pk,
        )
        data = self.assertValidJSON(resp, expected_status=400)
        self.assertIn("error", data)

    def test_unacceptable_characters_are_removed_on_save(self):
        bad_text = "He\u200bllo\tWorld\xa0\u3000\u2003!\nBad\x00Char\x1fHere\u200b"
        resp = self._save_transcription(text=bad_text)
        data = self.assertValidJSON(resp, expected_status=201)
        self.assertIn("submissionUrl", data)
        t = self.asset.transcription_set.get()
        self.assertEqual(t.text, "Hello\tWorld\xa0\u3000\u2003!\nBadCharHere")

    def test_unacceptable_characters_are_removed_when_superseding(self):
        self._save_transcription(text="first")
        bad_text = "b\u200bad\x00"
        resp = self._save_transcription(
            text=bad_text,
            supersedes=self.asset.transcription_set.get().pk,
        )
        data = self.assertValidJSON(resp, expected_status=201)
        self.assertIn("submissionUrl", data)
        new_t = self._latest_transcription()
        self.assertEqual(new_t.text, "bad")

    def test_save_with_supersedes_success(self):
        self._save_transcription(text="test")
        # Test that it correctly works when supersedes is set
        resp = self._save_transcription(
            text="test",
            supersedes=self.asset.transcription_set.get().pk,
        )
        data = self.assertValidJSON(resp, expected_status=201)
        self.assertIn("submissionUrl", data)

    def test_supersedes_sets_ocr_originated_when_previous_was_ocr_originated(self):
        self._save_transcription(text="test")
        # Test that it correctly works when supersedes is set and confirm
        # ocr_originated is properly set
        transcription = self._latest_transcription()
        transcription.ocr_originated = True
        transcription.save()
        resp = self._save_transcription(
            text="test",
            supersedes=self._latest_transcription().pk,
        )
        data = self.assertValidJSON(resp, expected_status=201)
        self.assertIn("submissionUrl", data)
        new_transcription = self._latest_transcription()
        self.assertTrue(new_transcription.ocr_originated)

    def test_supersede_already_superseded_conflict(self):
        first_resp = self._save_transcription(text="test")
        self.assertValidJSON(first_resp, expected_status=201)
        first_pk = self.asset.transcription_set.order_by("pk").first().pk

        # Supersede the first transcription once. This has to succeed for
        # the conflict checked below to be meaningful, so verify it.
        second_resp = self._save_transcription(text="test 2", supersedes=first_pk)
        self.assertValidJSON(second_resp, expected_status=201)

        # We should see an error if you attempt to supersede a transcription
        # which has already been superseded:
        resp = self._save_transcription(text="test", supersedes=first_pk)
        data = self.assertValidJSON(resp, expected_status=409)
        self.assertIn("error", data)

    def test_supersede_nonexistent_returns_400(self):
        # We should get an error if you attempt to supersede a transcription
        # that doesn't exist
        resp = self._save_transcription(text="test", supersedes=sys.maxsize)
        data = self.assertValidJSON(resp, expected_status=400)
        self.assertIn("error", data)

    def test_supersede_invalid_pk_returns_400(self):
        # We should get an error if you attempt to supersede
        # with a pk that is invalid (i.e., a string instead of int)
        resp = self._save_transcription(text="test", supersedes="bad-pk")
        data = self.assertValidJSON(resp, expected_status=400)
        self.assertIn("error", data)

    def test_logged_in_user_can_take_over_from_anonymous(self):
        anon_resp = self._save_transcription(text="test")
        self.assertValidJSON(anon_resp, expected_status=201)

        # A logged in user can take over from an anonymous user:
        self.login_user()
        resp = self._save_transcription(
            text="test",
            supersedes=self._latest_transcription().pk,
        )
        data = self.assertValidJSON(resp, expected_status=201)
        self.assertIn("submissionUrl", data)

    def tearDown(self):
        # We'll test the signal handler separately
        # NOTE(review): setUp in this class never disconnects the handler,
        # so this connect looks redundant -- confirm before relying on it.
        post_save.connect(on_transcription_save, sender=Transcription)


================================================
FILE: concordia/tests/test_views_transcription_submit.py
================================================
from unittest.mock import patch

from django import forms
from django.db.models.signals import post_save
from django.test import (
    TransactionTestCase,
    override_settings,
)
from django.urls import reverse

from concordia.models import (
    Transcription,
)
from concordia.signals.handlers import on_transcription_save
from concordia.utils import get_anonymous_user

from .utils import (
    CreateTestUsers,
    JSONAssertMixin,
    create_asset,
)


@override_settings(
    RATELIMIT_ENABLE=False, SESSION_ENGINE="django.contrib.sessions.backends.cache"
)
class SubmitTranscriptionViewTests(
    CreateTestUsers, JSONAssertMixin, TransactionTestCase
):
    """
    Tests for the ``submit-transcription`` view.

    Turnstile validation is patched in every request, either to pass or to
    raise a validation error, so the tests never call the real validator.
    """

    # Dotted path of the Turnstile validation hook patched by these tests
    _TURNSTILE_VALIDATE = "concordia.turnstile.fields.TurnstileField.validate"

    def _make_transcription(self, **fields):
        """Build, validate and save a Transcription from ``fields``."""
        transcription = Transcription(**fields)
        transcription.full_clean()
        transcription.save()
        return transcription

    def _submit(self, transcription):
        """
        POST to the submit view for ``transcription`` with Turnstile
        validation passing, and return the response.
        """
        with patch(self._TURNSTILE_VALIDATE, return_value=True):
            return self.client.post(
                reverse("submit-transcription", args=(transcription.pk,))
            )

    def test_anonymous_transcription_submission(self):
        asset = create_asset()
        anon = get_anonymous_user()
        transcription = self._make_transcription(
            asset=asset, user=anon, text="previous entry"
        )

        # A failed Turnstile check yields a 401 and nothing gets submitted
        with patch(self._TURNSTILE_VALIDATE) as mock:
            mock.side_effect = forms.ValidationError(
                "Testing error", code="invalid_turnstile"
            )
            resp = self.client.post(
                reverse("submit-transcription", args=(transcription.pk,))
            )
        data = self.assertValidJSON(resp, expected_status=401)
        self.assertIn("error", data)

        self.assertFalse(Transcription.objects.filter(submitted__isnull=False).exists())

        # With Turnstile passing, the same request marks it as submitted
        self._submit(transcription)
        self.assertTrue(Transcription.objects.filter(submitted__isnull=False).exists())

    def test_transcription_submission(self):
        asset = create_asset()

        # Create the transcription through the save view. Only the status
        # matters here, so the decoded body is not kept.
        with patch(self._TURNSTILE_VALIDATE, return_value=True):
            resp = self.client.post(
                reverse("save-transcription", args=(asset.pk,)), data={"text": "test"}
            )
        self.assertValidJSON(resp, expected_status=201)

        transcription = Transcription.objects.get()
        self.assertIsNone(transcription.submitted)

        resp = self._submit(transcription)
        data = self.assertValidJSON(resp, expected_status=200)
        self.assertIn("id", data)
        self.assertEqual(data["id"], transcription.pk)

        transcription = Transcription.objects.get()
        self.assertTrue(transcription.submitted)

    def test_stale_transcription_submission(self):
        asset = create_asset()
        anon = get_anonymous_user()

        # t1 is superseded by t2, so submitting t1 must be refused
        t1 = self._make_transcription(asset=asset, user=anon, text="test")
        self._make_transcription(asset=asset, user=anon, text="test", supersedes=t1)

        resp = self._submit(t1)
        data = self.assertValidJSON(resp, expected_status=400)
        self.assertIn("error", data)

    def tearDown(self):
        # We'll test the signal handler separately
        # NOTE(review): no setUp in this class disconnects the handler,
        # so this connect looks redundant -- confirm before relying on it.
        post_save.connect(on_transcription_save, sender=Transcription)


================================================
FILE: concordia/tests/test_views_utils.py
================================================
import datetime
from time import time

from django.contrib.auth.models import AnonymousUser
from django.test import RequestFactory, TestCase, override_settings
from django.utils.timezone import make_aware, now

from concordia.models import (
    Asset,
    Transcription,
    TranscriptionStatus,
)
from concordia.views.utils import (
    AnonymousUserValidationCheckMixin,
    _get_pages,
    annotate_children_with_progress_stats,
    calculate_asset_stats,
)

from .utils import (
    CreateTestUsers,
    create_asset,
    create_campaign,
    create_item,
    create_project,
    create_transcription,
)


class GetPagesTests(CreateTestUsers, TestCase):
    """
    Tests for ``_get_pages``: activity, status, date and campaign filters
    plus result ordering, for requests made as ``self.user``.
    """

    def setUp(self):
        self.factory = RequestFactory()
        self.user = self.create_test_user()

        # Primary hierarchy: campaign -> project -> item
        self.campaign = create_campaign(slug="gp-camp", title="gp-camp")
        self.project = create_project(
            campaign=self.campaign, slug="gp-proj", title="gp-proj"
        )
        self.item = create_item(project=self.project, item_id="gp-item")

        # A pair of assets that share the primary item
        self.asset1 = create_asset(item=self.item, slug="gp-a1", sequence=1)
        self.asset2 = create_asset(item=self.item, slug="gp-a2", sequence=2)

        # Independent second hierarchy, used by the campaign filter test
        self.campaign2 = create_campaign(slug="gp-camp-2", title="gp-camp-2")
        self.project2 = create_project(
            campaign=self.campaign2, slug="gp-proj-2", title="gp-proj-2"
        )
        self.item2 = create_item(project=self.project2, item_id="gp-item-2")
        self.asset3_other_campaign = create_asset(
            item=self.item2, slug="gp-a3", sequence=1
        )

    def _request(self, params: dict[str, str]):
        """Build a GET request carrying ``params``, made as ``self.user``."""
        req = self.factory.get("/dummy", data=params)
        req.user = self.user
        return req

    def _page_ids(self, params):
        """Run ``_get_pages`` for ``params`` and return the ids as a list."""
        pages = _get_pages(self._request(params))
        return list(pages.values_list("id", flat=True))

    def _force_status(self, asset, status):
        """Set ``transcription_status`` on ``asset`` via a queryset update."""
        Asset.objects.filter(pk=asset.pk).update(transcription_status=status)

    def _touch_transcription_times(
        self,
        transcription: Transcription,
        *,
        created_on=None,
        updated_on=None,
        reviewer=None,
    ):
        """
        Assign whichever of reviewer / created_on / updated_on were given,
        then save those three fields.
        """
        # NOTE(review): if updated_on is an auto_now field, save() may
        # replace the value assigned here -- confirm against the model.
        overrides = {
            "reviewed_by": reviewer,
            "created_on": created_on,
            "updated_on": updated_on,
        }
        for field_name, value in overrides.items():
            if value is not None:
                setattr(transcription, field_name, value)
        transcription.save(update_fields=["reviewed_by", "created_on", "updated_on"])

    def test_activity_filters_transcribed_vs_reviewed_vs_default(self):
        reference = now()

        # asset1 has a transcription written by self.user
        authored = create_transcription(asset=self.asset1, user=self.user)
        self._touch_transcription_times(
            authored, created_on=reference - datetime.timedelta(hours=2)
        )

        # asset2 was transcribed by another user and reviewed by self.user
        other_user = self.create_test_user("transcriber")
        reviewed = create_transcription(asset=self.asset2, user=other_user)
        self._touch_transcription_times(
            reviewed,
            reviewer=self.user,
            updated_on=reference - datetime.timedelta(hours=1),
        )

        # No activity filter: both assets are returned
        self.assertCountEqual(
            self._page_ids({}),
            [self.asset1.id, self.asset2.id],
        )

        # "transcribed" keeps only the asset the user transcribed
        self.assertListEqual(
            self._page_ids({"activity": "transcribed"}),
            [self.asset1.id],
        )

        # "reviewed" keeps only the asset the user reviewed
        self.assertListEqual(
            self._page_ids({"activity": "reviewed"}),
            [self.asset2.id],
        )

    def test_status_filter_exclusions(self):
        # Tie the user to both base assets through transcriptions
        create_transcription(asset=self.asset1, user=self.user)
        create_transcription(asset=self.asset2, user=self.user, submitted=now())

        # Pin asset1 to IN_PROGRESS
        self._force_status(self.asset1, TranscriptionStatus.IN_PROGRESS)

        # A further asset with user activity, pinned to COMPLETED
        completed_asset = create_asset(item=self.item, slug="gp-a4", sequence=3)
        create_transcription(asset=completed_asset, user=self.user)
        self._force_status(completed_asset, TranscriptionStatus.COMPLETED)

        # Asking for "submitted" alone drops IN_PROGRESS and COMPLETED
        self.assertListEqual(self._page_ids({"status": "submitted"}), [self.asset2.id])

    def test_date_range_and_single_day_filters_and_ordering(self):
        today = now()

        def noon(days_ago):
            # Aware datetime at 12:00 on the date ``days_ago`` before today
            day = (today - datetime.timedelta(days=days_ago)).date()
            return make_aware(datetime.datetime.combine(day, datetime.time(12)))

        def iso_day(days_ago):
            # YYYY-MM-DD string for the date ``days_ago`` before today
            return (today - datetime.timedelta(days=days_ago)).strftime("%Y-%m-%d")

        day_minus_3 = noon(3)
        day_minus_1 = noon(1)

        # Two user transcriptions with distinct activity dates
        older = create_transcription(asset=self.asset1, user=self.user)
        self._touch_transcription_times(
            older, created_on=day_minus_3, updated_on=day_minus_3
        )

        newer = create_transcription(asset=self.asset2, user=self.user)
        self._touch_transcription_times(
            newer, created_on=day_minus_1, updated_on=day_minus_1
        )

        # Range of two days ago through today: asset2 (day minus one) is
        # inside it, asset1 (day minus three) is not
        self.assertListEqual(
            self._page_ids({"start": iso_day(2), "end": iso_day(0)}),
            [self.asset2.id],
        )

        # A start date on its own acts as a single-day filter: asset1 only
        self.assertListEqual(
            self._page_ids({"start": iso_day(3)}),
            [self.asset1.id],
        )

        # Explicit ascending order puts the older activity first ...
        self.assertEqual(
            self._page_ids({"order_by": "date-ascending"}),
            [self.asset1.id, self.asset2.id],
        )

        # ... while the default order is descending
        self.assertEqual(
            self._page_ids({}),
            [self.asset2.id, self.asset1.id],
        )

    def test_campaign_filter_and_six_month_cutoff(self):
        # User activity is spread over both campaigns
        recent_timestamp = now() - datetime.timedelta(days=5)
        old_timestamp = now() - datetime.timedelta(days=6 * 30 + 10)

        # Recent activity in the base campaign
        recent_base = create_transcription(asset=self.asset1, user=self.user)
        self._touch_transcription_times(
            recent_base, created_on=recent_timestamp, updated_on=recent_timestamp
        )

        # Recent activity in the other campaign
        recent_other = create_transcription(
            asset=self.asset3_other_campaign, user=self.user
        )
        self._touch_transcription_times(
            recent_other, created_on=recent_timestamp, updated_on=recent_timestamp
        )

        # Activity on asset2 that is older than the six month cutoff
        stale = create_transcription(asset=self.asset2, user=self.user)
        self._touch_transcription_times(
            stale, created_on=old_timestamp, updated_on=old_timestamp
        )

        # No campaign filter: both recent assets appear, the stale one
        # does not
        self.assertSetEqual(
            set(self._page_ids({})),
            {self.asset1.id, self.asset3_other_campaign.id},
        )

        # Filtering on the second campaign leaves only its asset
        self.assertListEqual(
            self._page_ids({"campaign": str(self.campaign2.pk)}),
            [self.asset3_other_campaign.id],
        )

    def test_status_filter_includes_completed_when_requested(self):
        """
        Requesting "completed" keeps completed assets and leaves out
        submitted and in progress ones.
        """
        # Three assets, each with activity from this user
        completed_asset = create_asset(
            item=self.item, slug="gp-a4-completed", sequence=4
        )
        create_transcription(asset=completed_asset, user=self.user)
        self._force_status(completed_asset, TranscriptionStatus.COMPLETED)

        create_transcription(asset=self.asset1, user=self.user)
        self._force_status(self.asset1, TranscriptionStatus.IN_PROGRESS)

        # asset2 gets a submitted transcription
        create_transcription(asset=self.asset2, user=self.user, submitted=now())

        # Only the completed asset survives the filter
        self.assertListEqual(
            self._page_ids({"status": "completed"}), [completed_asset.id]
        )

    def test_status_filter_includes_in_progress_and_excludes_submitted_not_requested(
        self,
    ):
        """
        Requesting "in_progress" keeps in progress assets; submitted assets
        are dropped because "submitted" was not requested.
        """
        # One in progress asset and one submitted asset for this user
        create_transcription(asset=self.asset1, user=self.user)
        self._force_status(self.asset1, TranscriptionStatus.IN_PROGRESS)

        # asset2 gets a submitted transcription
        create_transcription(asset=self.asset2, user=self.user, submitted=now())

        ids = self._page_ids({"status": "in_progress"})
        self.assertIn(self.asset1.id, ids)
        self.assertNotIn(self.asset2.id, ids)


class CalculateAssetStatsTests(CreateTestUsers, TestCase):
    """
    Tests for ``calculate_asset_stats``: contributor counting, per-status
    counts and percentages written into the supplied context dict.
    """

    def setUp(self):
        self.user = self.create_test_user()
        self.campaign = create_campaign(slug="cas-c", title="cas-c")
        self.project = create_project(
            campaign=self.campaign, slug="cas-p", title="cas-p"
        )
        self.item = create_item(project=self.project, item_id="cas-i")

    def _force_status(self, assets, status):
        """Set ``transcription_status`` on ``assets`` via a queryset update."""
        Asset.objects.filter(pk__in=[asset.pk for asset in assets]).update(
            transcription_status=status
        )

    def _stats_for(self, assets):
        """Run ``calculate_asset_stats`` over ``assets``; return the context."""
        context = {}
        calculate_asset_stats(
            Asset.objects.filter(pk__in=[asset.pk for asset in assets]),
            context,
        )
        return context

    def test_counts_percents_and_contributors_remove_none_branch(self):
        # Three assets, one per status under test
        asset_not_started = create_asset(item=self.item, slug="cas-ns", sequence=1)
        asset_in_progress = create_asset(item=self.item, slug="cas-ip", sequence=2)
        asset_submitted = create_asset(item=self.item, slug="cas-sub", sequence=3)

        # Write the wanted statuses straight to the database
        self._force_status([asset_not_started], TranscriptionStatus.NOT_STARTED)
        self._force_status([asset_in_progress], TranscriptionStatus.IN_PROGRESS)
        self._force_status([asset_submitted], TranscriptionStatus.SUBMITTED)

        # Only the assets that must not stay NOT_STARTED get transcriptions.
        # A plain transcription is meant to leave the asset in progress.
        transcription_in_progress = create_transcription(
            asset=asset_in_progress, user=self.user
        )
        # A submitted transcription is meant to keep the asset SUBMITTED
        # once the save signal has run.
        transcription_submitted = create_transcription(
            asset=asset_submitted, user=self.user, submitted=now()
        )
        # Guarantee a None among the reviewed_by values so that the
        # remove(None) path is taken.
        touched = [transcription_in_progress.pk, transcription_submitted.pk]
        Transcription.objects.filter(pk__in=touched).update(reviewed_by=None)

        context = self._stats_for(
            [asset_not_started, asset_in_progress, asset_submitted]
        )

        # Unique user_ids and reviewed_by values, with None discarded
        self.assertEqual(context["contributor_count"], 1)

        # One asset in each of the three statuses, none completed
        self.assertEqual(context["not_started_count"], 1)
        self.assertEqual(context["in_progress_count"], 1)
        self.assertEqual(context["submitted_count"], 1)
        self.assertEqual(context.get("completed_count", 0), 0)

        # One out of three, rounded
        one_third = round(100 * (1 / 3))
        self.assertEqual(context["not_started_percent"], one_third)
        self.assertEqual(context["in_progress_percent"], one_third)
        self.assertEqual(context["submitted_percent"], one_third)

        # The labeled list is filled in and mentions "not_started"
        has_not_started = any(
            status_key == "not_started"
            for status_key, _, _ in context["transcription_status_counts"]
        )
        self.assertTrue(has_not_started)

    def test_contributors_keyerror_branch_and_cap_99(self):
        # 100 assets: the first 99 NOT_STARTED, the last one IN_PROGRESS
        assets = [
            create_asset(item=self.item, slug=f"cas-bulk-{i}", sequence=i)
            for i in range(1, 101)
        ]
        in_progress_asset = assets[-1]

        self._force_status(assets[:99], TranscriptionStatus.NOT_STARTED)
        Asset.objects.filter(pk=in_progress_asset.pk).update(
            transcription_status=TranscriptionStatus.IN_PROGRESS
        )

        # The only transcription belongs to the IN_PROGRESS asset and has a
        # reviewer, so reviewed_by holds no None. That is intended to hit
        # the KeyError branch when calculate_asset_stats tries to
        # remove(None) from the contributor set.
        other_user = self.create_test_user(username="cas-reviewer")
        transcription = create_transcription(asset=in_progress_asset, user=self.user)
        transcription.reviewed_by = other_user
        transcription.save(update_fields=["reviewed_by"])

        context = self._stats_for(assets)

        # Creator (self.user) plus reviewer (other_user)
        self.assertEqual(context["contributor_count"], 2)

        # Percentages, including the cap at 99 percent
        self.assertEqual(context["not_started_percent"], 99)
        self.assertEqual(context["in_progress_percent"], 1)
        self.assertEqual(context.get("submitted_percent", 0), 0)
        self.assertEqual(context.get("completed_percent", 0), 0)

        # Raw counts confirm the intended distribution
        self.assertEqual(context["not_started_count"], 99)
        self.assertEqual(context["in_progress_count"], 1)
        self.assertEqual(context.get("submitted_count", 0), 0)
        self.assertEqual(context.get("completed_count", 0), 0)


class AnnotateChildrenProgressStatsTests(TestCase):
    """
    Tests for ``annotate_children_with_progress_stats`` using plain
    attribute-bag objects in place of model instances.
    """

    class Obj:
        pass

    def _annotated(self, **counts):
        """
        Create an ``Obj`` carrying ``counts`` as attributes, run it through
        ``annotate_children_with_progress_stats`` and return it.
        """
        obj = self.Obj()
        for attr, value in counts.items():
            setattr(obj, attr, value)
        annotate_children_with_progress_stats([obj])
        return obj

    def test_progress_stats_with_capping_and_lowest_status(self):
        # One bucket lands at ninety nine percent or more while still
        # being short of one hundred percent
        obj = self._annotated(
            not_started_count=99,
            in_progress_count=1,
            submitted_count=0,
            completed_count=0,
        )

        expected = {
            "total_count": 100,
            # Capped at ninety nine
            "not_started_percent": 99,
            "in_progress_percent": 1,
            "submitted_percent": 0,
            "completed_percent": 0,
        }
        for attr, value in expected.items():
            self.assertEqual(getattr(obj, attr), value)
        # Lowest is the first non-zero by CHOICES order; expect "not_started"
        self.assertEqual(obj.lowest_transcription_status, "not_started")

    def test_progress_stats_zero_total(self):
        obj = self._annotated(
            not_started_count=0,
            in_progress_count=0,
            submitted_count=0,
            completed_count=0,
        )

        # With nothing to count, the total and every percentage are zero
        for attr in (
            "total_count",
            "not_started_percent",
            "in_progress_percent",
            "submitted_percent",
            "completed_percent",
        ):
            self.assertEqual(getattr(obj, attr), 0)
        self.assertIsNone(obj.lowest_transcription_status)


class _BaseView:
    """
    Bare-bones parent class that supplies ``get_context_data`` so a mixin
    placed ahead of it in the MRO has something to reach via ``super()``.
    """

    def get_context_data(self, **kwargs):
        # Keyword arguments are accepted but ignored; every call hands
        # back a new, empty context.
        context = {}
        return context


class DummyTemplateView(AnonymousUserValidationCheckMixin, _BaseView):
    """
    Test-only view combining the mixin with ``_BaseView``.

    Because the mixin comes first in the MRO, its ``get_context_data`` is
    the one invoked; its ``super()`` call then lands on
    ``_BaseView.get_context_data``.
    """


class AnonymousUserValidationCheckMixinTests(CreateTestUsers, TestCase):
    """
    Checks the "anonymous_user_validation_required" context flag produced
    through DummyTemplateView for anonymous and authenticated requests.
    """

    def setUp(self):
        self.factory = RequestFactory()
        self.user = self.create_test_user()

    def _attach_session(self, request):
        # A plain dict stands in for the session so no middleware is needed.
        request.session = {}
        return request

    def _context_for(self, user, **session_values):
        # Build a GET request for the given user, seed its session with any
        # supplied values and return the context the dummy view produces.
        request = self._attach_session(self.factory.get("/dummy"))
        request.user = user
        request.session.update(session_values)
        view = DummyTemplateView()
        view.request = request
        return view.get_context_data()

    @override_settings(ANONYMOUS_USER_VALIDATION_INTERVAL=10)
    def test_unauthenticated_requires_validation_when_stale(self):
        # The session holds no prior validation timestamp, so validation
        # is expected to be required.
        context = self._context_for(AnonymousUser())
        self.assertTrue(context["anonymous_user_validation_required"])

    @override_settings(ANONYMOUS_USER_VALIDATION_INTERVAL=10)
    def test_unauthenticated_recent_validation_is_not_required(self):
        # A timestamp of "now" is within the configured interval.
        context = self._context_for(
            AnonymousUser(), turnstile_last_validated=int(time())
        )
        self.assertFalse(context["anonymous_user_validation_required"])

    @override_settings(ANONYMOUS_USER_VALIDATION_INTERVAL=10)
    def test_authenticated_never_requires_validation(self):
        context = self._context_for(self.user)
        self.assertFalse(context["anonymous_user_validation_required"])


================================================
FILE: concordia/tests/test_widgets.py
================================================
from django.test import TestCase, override_settings

from concordia.turnstile.widgets import TurnstileWidget
from concordia.widgets import EmailWidget


class TestWidgets(TestCase):
    """Rendering and helper-method checks for EmailWidget and TurnstileWidget."""

    def test_EmailWidget(self):
        email_widget = EmailWidget()

        # Rendering without a value.
        self.assertHTMLEqual(
            email_widget.render("email", None),
            '<input class="fst-italic form-control" name="email" type="email">',
        )

        # Rendering with a value: the expected markup carries a placeholder
        # and no value attribute.
        self.assertHTMLEqual(
            email_widget.render("email", "test@example.com"),
            '<input class="fst-italic form-control" name="email"'
            ' placeholder="Change your email address" type="email">',
        )

        # Extra attributes passed at render time appear on the element.
        self.assertHTMLEqual(
            email_widget.render("email", None, attrs={"display": "none;"}),
            '<input class="fst-italic form-control" display="none;"'
            ' name="email" type="email">',
        )

    @override_settings(TURNSTILE_SITEKEY="test-key", TURNSTILE_JS_API_URL="test-url")
    def test_TurnstileWidget(self):
        turnstile = TurnstileWidget()

        # Testing basic validation
        self.assertEqual(turnstile.value_from_datadict({}, None, None), None)

        # Testing validation with data
        submitted = {"cf-turnstile-response": "test-data"}
        self.assertEqual(
            turnstile.value_from_datadict(submitted, None, None), "test-data"
        )

        # Testing basic attrs
        self.assertEqual(turnstile.build_attrs({}), {"data-sitekey": "test-key"})

        # Testing with extra attrs
        merged_attrs = turnstile.build_attrs(
            {"id": "test-id"}, extra_attrs={"custom-attr": "test-attr"}
        )
        self.assertEqual(
            merged_attrs,
            {"data-sitekey": "test-key", "id": "test-id", "custom-attr": "test-attr"},
        )

        # The "widget" part of the context is the same in both cases below.
        expected_widget = {
            "name": "test-name",
            "is_hidden": False,
            "required": False,
            "value": "test value",
            "attrs": {"data-sitekey": "test-key"},
            "template_name": "forms/widgets/turnstile_widget.html",
        }

        # Testing basic context
        self.assertEqual(
            turnstile.get_context("test-name", "test value", {}),
            {"widget": expected_widget, "api_url": "test-url"},
        )

        # Testing with special context
        turnstile.extra_url = {
            "test-parameter1": "test-value1",
            "test-parameter2": "test-value2",
        }
        self.assertEqual(
            turnstile.get_context("test-name", "test value", {}),
            {
                "widget": expected_widget,
                "api_url": "test-url?test-parameter1=test-value1&"
                "test-parameter2=test-value2",
            },
        )


================================================
FILE: concordia/tests/utils.py
================================================
import json
from functools import wraps
from secrets import token_hex

from django.utils.text import slugify

from concordia.models import (
    Asset,
    Banner,
    Campaign,
    CampaignRetirementProgress,
    Card,
    CardFamily,
    CarouselSlide,
    ConcordiaFile,
    Guide,
    HelpfulLink,
    Item,
    MediaType,
    Project,
    ResearchCenter,
    SimplePage,
    SiteReport,
    Tag,
    Topic,
    Transcription,
    User,
    UserAssetTagCollection,
    UserProfileActivity,
)


def ensure_slug(original_function):
    """
    Decorator that fills in a missing ``slug`` keyword argument.

    When the wrapped function is called with a truthy ``title`` keyword and
    either no ``slug`` keyword or ``slug=None``, ``slug`` is set to
    ``slugify(title, allow_unicode=True)`` before the call is forwarded.
    Only explicitly passed keywords are inspected; defaults declared by the
    wrapped function are not visible here.
    """

    @wraps(original_function)
    def inner(*args, **kwargs):
        supplied_title = kwargs.get("title")
        slug_missing = kwargs.get("slug") is None
        if slug_missing and supplied_title:
            kwargs["slug"] = slugify(supplied_title, allow_unicode=True)
        return original_function(*args, **kwargs)

    return inner


@ensure_slug
def create_campaign(
    *,
    title="Test Campaign",
    slug="test-campaign",
    short_description="Short Description",
    description="Test Description",
    published=True,
    unlisted=False,
    status=Campaign.Status.ACTIVE,
    do_save=True,
    **kwargs,
):
    """
    Build a Campaign for tests, validate it and optionally save it.

    Args:
        title, slug, short_description, description, published, unlisted,
        status: Values assigned to the Campaign fields of the same name.
        do_save (bool): When true, the campaign is saved after validation.
        **kwargs: Additional field values passed to the Campaign constructor.

    Returns:
        Campaign: The validated (and, if requested, saved) instance.
    """
    campaign = Campaign(
        title=title,
        slug=slug,
        # Previously accepted by this helper but never forwarded, so any
        # value a caller supplied was silently dropped.
        short_description=short_description,
        description=description,
        unlisted=unlisted,
        published=published,
        status=status,
        **kwargs,
    )
    campaign.full_clean()
    if do_save:
        campaign.save()
    return campaign


def create_simple_page(*, do_save=True, **kwargs):
    """
    Instantiate a SimplePage from ``kwargs`` and save it unless ``do_save``
    is false. Returns the instance.
    """
    page = SimplePage(**kwargs)
    if not do_save:
        return page
    page.save()
    return page


def create_site_report(*, do_save=True, **kwargs):
    """
    Instantiate a SiteReport from ``kwargs`` and save it unless ``do_save``
    is false. Returns the instance.
    """
    report = SiteReport(**kwargs)
    if not do_save:
        return report
    report.save()
    return report


@ensure_slug
def create_topic(
    *,
    project=None,
    title="Test Topic",
    slug="test-topic",
    description="Test Description",
    published=True,
    unlisted=False,
    do_save=True,
    **kwargs,
):
    """
    Build a Topic for tests, validate it and optionally save and link it.

    Args:
        project: Project to attach to the topic. When omitted and the topic
            is being saved, one is created with ``create_project``.
        title, slug, description, published, unlisted: Values assigned to
            the Topic fields of the same name.
        do_save (bool): When true, the topic is saved and the project is
            added to ``topic.project_set``. When false, the unsaved topic
            is returned without any project link.
        **kwargs: Additional field values passed to the Topic constructor.

    Returns:
        Topic: The validated instance.
    """
    # A project is only needed for the many-to-many link, which in turn is
    # only possible once the topic has been saved.
    if project is None and do_save:
        project = create_project(published=published)

    topic = Topic(
        title=title,
        slug=slug,
        description=description,
        unlisted=unlisted,
        published=published,
        **kwargs,
    )
    topic.full_clean()

    if do_save:
        topic.save()
        # The related manager cannot be used on an unsaved instance, so the
        # link is made only on the saving path. Previously this ran
        # unconditionally and raised ValueError whenever do_save was false.
        topic.project_set.add(project)
        topic.save()
    return topic


@ensure_slug
def create_project(
    *,
    campaign=None,
    title="Test Project",
    slug="test-project",
    description="Test Description",
    published=True,
    do_save=True,
    **kwargs,
):
    """
    Build a Project for tests, validate it and optionally save it.

    Args:
        campaign: Owning campaign. When omitted, one is created with
            ``create_campaign(published=published)``.
        title, slug, description, published: Values assigned to the Project
            fields of the same name.
        do_save (bool): When true, the project is saved after validation.
        **kwargs: Additional field values passed to the Project constructor.

    Returns:
        Project: The validated (and, if requested, saved) instance.
    """
    if campaign is None:
        campaign = create_campaign(published=published)

    project = Project(
        campaign=campaign,
        title=title,
        slug=slug,
        # Previously accepted by this helper but never forwarded, so any
        # value a caller supplied was silently dropped.
        description=description,
        published=published,
        **kwargs,
    )
    project.full_clean()
    if do_save:
        project.save()
    return project


def create_item(
    *,
    project=None,
    title="Test Item",
    item_id="testitem.0123456789",
    item_url="http://example.com/item/testitem.0123456789/",
    published=True,
    do_save=True,
    **kwargs,
):
    """
    Build an Item for tests, validate it and optionally save it.

    When ``project`` is omitted, one is created with
    ``create_project(published=published)``. Extra ``kwargs`` are passed to
    the Item constructor. Returns the instance.
    """
    owning_project = (
        create_project(published=published) if project is None else project
    )

    field_values = {
        "project": owning_project,
        "title": title,
        "item_id": item_id,
        "item_url": item_url,
        "published": published,
        **kwargs,
    }
    new_item = Item(**field_values)
    new_item.full_clean()
    if do_save:
        new_item.save()
    return new_item


@ensure_slug
def create_asset(
    *,
    item=None,
    title="Test Asset",
    slug="test-asset",
    media_type=MediaType.IMAGE,
    published=True,
    storage_image="unittest1.jpg",
    do_save=True,
    **kwargs,
):
    """
    Build an Asset for tests, validate it and optionally save it.

    When ``item`` is omitted, one is created with
    ``create_item(published=published)``. The asset's campaign is taken
    from ``item.project.campaign``. Extra ``kwargs`` are passed to the
    Asset constructor. Returns the instance.
    """
    parent_item = create_item(published=published) if item is None else item

    field_values = {
        "item": parent_item,
        "campaign": parent_item.project.campaign,
        "title": title,
        "slug": slug,
        "media_type": media_type,
        "published": published,
        "storage_image": storage_image,
        **kwargs,
    }
    new_asset = Asset(**field_values)
    new_asset.full_clean()
    if do_save:
        new_asset.save()
    return new_asset


def create_transcription(*, asset=None, user=None, do_save=True, **kwargs):
    """
    Build a Transcription for tests, validate it and optionally save it.

    A missing ``asset`` is created with ``create_asset()``; a missing
    ``user`` is created with a username derived from the asset's id.
    Extra ``kwargs`` are passed to the Transcription constructor.
    """
    asset = create_asset() if asset is None else asset
    if user is None:
        user = CreateTestUsers.create_user(f"asset-{asset.id}-user")

    new_transcription = Transcription(asset=asset, user=user, **kwargs)
    new_transcription.full_clean()
    if not do_save:
        return new_transcription
    new_transcription.save()
    return new_transcription


def create_tag(*, value="tag-value", do_save=True, **kwargs):
    """
    Build a Tag with the given ``value``, validate it and save it unless
    ``do_save`` is false. Returns the instance.
    """
    new_tag = Tag(value=value, **kwargs)
    new_tag.full_clean()
    if not do_save:
        return new_tag
    new_tag.save()
    return new_tag


def create_tag_collection(*, tag=None, asset=None, user=None, **kwargs):
    """
    Build, validate and save a UserAssetTagCollection, then add ``tag`` to
    its ``tags``.

    There is no ``do_save`` switch here because ManyToMany fields don't
    work until the model is saved. Missing ``tag``, ``asset`` and ``user``
    values are created with the sibling helpers.
    """
    tag = create_tag() if tag is None else tag
    asset = create_asset() if asset is None else asset
    if user is None:
        user = CreateTestUsers.create_user("tag-user")

    collection = UserAssetTagCollection(asset=asset, user=user, **kwargs)
    collection.full_clean()
    collection.save()
    collection.tags.add(tag)
    return collection


def create_banner(*, slug="Test Banner", do_save=True, **kwargs):
    """
    Instantiate a Banner with the given ``slug`` and save it unless
    ``do_save`` is false. Returns the instance.
    """
    new_banner = Banner(slug=slug, **kwargs)
    if not do_save:
        return new_banner
    new_banner.save()
    return new_banner


def create_card(*, title="Test Card", do_save=True, **kwargs):
    """
    Instantiate a Card with the given ``title`` and save it unless
    ``do_save`` is false. Returns the instance.
    """
    new_card = Card(title=title, **kwargs)
    if not do_save:
        return new_card
    new_card.save()
    return new_card


def create_card_family(*, slug="test-card-family", do_save=True, **kwargs):
    """
    Instantiate a CardFamily with the given ``slug`` and save it unless
    ``do_save`` is false. Returns the instance.
    """
    family = CardFamily(slug=slug, **kwargs)
    if not do_save:
        return family
    family.save()
    return family


def create_carousel_slide(*, headline="Test Headline", do_save=True, **kwargs):
    """
    Instantiate a CarouselSlide for tests and optionally save it.

    Args:
        headline (str): Headline passed to the CarouselSlide constructor.
        do_save (bool): When true, the slide is saved before being returned.
        **kwargs: Additional field values passed to the constructor.

    Returns:
        CarouselSlide: The new instance.
    """
    # headline was previously accepted but never forwarded, so neither the
    # default nor a caller-supplied value reached the model.
    slide = CarouselSlide(headline=headline, **kwargs)
    if do_save:
        slide.save()
    return slide


def create_guide(*, do_save=True, **kwargs):
    """
    Instantiate a Guide from ``kwargs`` and save it unless ``do_save`` is
    false. Returns the instance.
    """
    new_guide = Guide(**kwargs)
    if not do_save:
        return new_guide
    new_guide.save()
    return new_guide


def create_helpful_link(*, title="Test Helpful Link", do_save=True, **kwargs):
    """
    Instantiate a HelpfulLink with the given ``title`` and save it unless
    ``do_save`` is false. Returns the instance.
    """
    helpful_link = HelpfulLink(title=title, **kwargs)
    if not do_save:
        return helpful_link
    helpful_link.save()
    return helpful_link


def create_concordia_file(
    *, name="Test Concordia File", uploaded_file="file.pdf", do_save=True, **kwargs
):
    """
    Instantiate a ConcordiaFile with the given ``name`` and
    ``uploaded_file`` and save it unless ``do_save`` is false.
    Returns the instance.
    """
    field_values = {"name": name, "uploaded_file": uploaded_file, **kwargs}
    stored_file = ConcordiaFile(**field_values)
    if not do_save:
        return stored_file
    stored_file.save()
    return stored_file


def create_user_profile_activity(
    *,
    campaign=None,
    user=None,
    do_save=True,
    **kwargs,
):
    """
    Instantiate a UserProfileActivity for tests and optionally save it.

    Args:
        campaign: Campaign for the activity. When omitted, one is created
            with ``create_campaign()``.
        user: User for the activity. When omitted, a user named
            "profile-user" is created.
        do_save (bool): When true, the activity is saved before returning.
        **kwargs: Additional field values passed to the constructor.

    Returns:
        UserProfileActivity: The new instance.
    """
    if campaign is None:
        campaign = create_campaign()
    if user is None:
        user = CreateTestUsers.create_user("profile-user")
    # kwargs were previously accepted and then discarded, so callers could
    # not set any field other than campaign and user through this helper.
    activity = UserProfileActivity(campaign=campaign, user=user, **kwargs)
    if do_save:
        activity.save()
    return activity


def create_campaign_retirement_progress(
    *,
    campaign=None,
    do_save=True,
    **kwargs,
):
    """
    Instantiate a CampaignRetirementProgress for tests and optionally save it.

    Args:
        campaign: Campaign the progress record belongs to. When omitted,
            one is created with ``create_campaign()``.
        do_save (bool): When true, the record is saved before returning.
        **kwargs: Additional field values passed to the constructor.

    Returns:
        CampaignRetirementProgress: The new instance.
    """
    if campaign is None:
        campaign = create_campaign()
    # kwargs were previously accepted and then discarded, so callers could
    # not set any field other than campaign through this helper.
    progress = CampaignRetirementProgress(campaign=campaign, **kwargs)
    if do_save:
        progress.save()
    return progress


def create_research_center(*, title="Test Research Center", do_save=True, **kwargs):
    """
    Instantiate a ResearchCenter with the given ``title`` and save it
    unless ``do_save`` is false. Returns the instance.
    """
    research_center = ResearchCenter(title=title, **kwargs)
    if not do_save:
        return research_center
    research_center.save()
    return research_center


class JSONAssertMixin(object):
    """Test-case mixin adding a JSON response assertion."""

    def assertValidJSON(self, response, expected_status=200):
        """
        Check the response status code, then decode the body as UTF-8 JSON.

        Fails the test when the status differs from ``expected_status`` or
        the body is not valid JSON; otherwise returns the decoded value.
        """
        self.assertEqual(response.status_code, expected_status)

        body_text = response.content.decode("utf-8")
        try:
            return json.loads(body_text)
        except json.JSONDecodeError as exc:
            self.fail(msg=f"response content failed to decode: {exc}")
            raise


class CreateTestUsers(object):
    """
    Mixin with helpers for creating users in tests and logging them in
    through ``self.client``.
    """

    def login_user(self, username="tester", **kwargs):
        """
        Log in ``self.user``, creating it first when it is unset or None.
        """
        if getattr(self, "user", None) is None:
            self.user = self.create_test_user(username, **kwargs)

        credentials = {
            "username": self.user.username,
            "password": self.user._password,
        }
        self.client.login(**credentials)

    def logout_user(self):
        """Log the client out and forget the stored user."""
        self.client.logout()
        self.user = None

    @classmethod
    def create_user(cls, username, is_active=True, **kwargs):
        """
        Create a user with a random password.

        The email defaults to ``<username>@example.com``. The plain-text
        password is kept on the returned object as ``_password`` so tests
        can log in with it.
        """
        kwargs.setdefault("email", f"{username}@example.com")

        account = User.objects.create_user(username=username, **kwargs)
        generated_password = token_hex(24)
        account.is_active = is_active
        account.set_password(generated_password)
        account.save()

        account._password = generated_password
        return account

    @classmethod
    def create_test_user(cls, username="testuser", **kwargs):
        """
        Create an active, non-staff user.
        """
        return cls.create_user(username, is_active=True, **kwargs)

    @classmethod
    def create_inactive_user(cls, username="testinactiveuser", **kwargs):
        """
        Create a user whose is_active flag is False.
        """
        return cls.create_user(username, is_active=False, **kwargs)

    @classmethod
    def create_staff_user(cls, username="teststaffuser", **kwargs):
        """
        Create an active user with is_staff set.
        """
        return cls.create_user(username, is_staff=True, is_active=True, **kwargs)

    @classmethod
    def create_super_user(cls, username="testsuperuser", **kwargs):
        """
        Create an active user with is_staff and is_superuser set.
        """
        return cls.create_user(
            username, is_staff=True, is_superuser=True, is_active=True, **kwargs
        )


class CacheControlAssertions(object):
    """Test-case mixin with assertions about the Cache-Control header."""

    def assertUncacheable(self, response):
        """Require a Cache-Control header containing no-cache and no-store."""
        self.assertIn("Cache-Control", response)
        header_value = response["Cache-Control"]
        self.assertIn("no-cache", header_value)
        self.assertIn("no-store", header_value)

    def assertCachePrivate(self, response):
        """Require a Cache-Control header containing private."""
        self.assertIn("Cache-Control", response)
        header_value = response["Cache-Control"]
        self.assertIn("private", header_value)


class StreamingTestMixin(object):
    """Test-case mixin for reading streaming responses."""

    def get_streaming_content(self, response):
        """
        Assert that the response is streaming and return all of its chunks
        joined into a single bytes object.
        """
        self.assertTrue(response.streaming)
        chunks = response.streaming_content
        return b"".join(chunks)


================================================
FILE: concordia/turnstile/LICENSE
================================================
MIT License

Copyright (c) 2022 Zhang Minghan

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.


================================================
FILE: concordia/turnstile/__init__.py
================================================


================================================
FILE: concordia/turnstile/context_processors.py
================================================
from typing import Any, Dict

from django.conf import settings
from django.http import HttpRequest


def turnstile_default_settings(request: "HttpRequest") -> "Dict[str, Any]":
    """
    Provide Turnstile-related settings to template context.

    Behavior:
        Mirrors a subset of Django settings into a dictionary for use in
        templates. Values are retrieved with `getattr` so that each key has a
        sensible default even if the corresponding setting is not defined.

    Args:
        request (HttpRequest): The current request. Included to satisfy the
            Django context processor signature; it is not used.

    Returns:
        Dict[str, Any]: Mapping of keys to values for template context. Keys:
            - "TURNSTILE_JS_API_URL" (str): Base URL for the Turnstile
              JavaScript API. Default:
              "https://challenges.cloudflare.com/turnstile/v0/api.js".
            - "TURNSTILE_VERIFY_URL" (str): Verification endpoint used by the
              server to validate tokens. Default:
              "https://challenges.cloudflare.com/turnstile/v0/siteverify".
            - "TURNSTILE_SITEKEY" (str): Public site key. Default:
              "1x00000000000000000000BB".
            - "TURNSTILE_SECRET" (str): Private secret key. Default:
              "1x0000000000000000000000000000000AA".
            - "TURNSTILE_TIMEOUT" (int): Timeout in seconds for verification
              requests. Default: 5.
            - "TURNSTILE_DEFAULT_CONFIG" (dict[str, Any]): Default widget
              configuration applied as `data-*` attributes. Default: {}.
            - "TURNSTILE_PROXIES" (dict[str, Any]): Proxy configuration for
              outbound verification requests. Default: {}.
    """
    return {
        # Read the same setting name that is exposed as the key. The lookup
        # previously used "TURN_JS_API_URL", which is never defined, so a
        # configured TURNSTILE_JS_API_URL was ignored in favor of the default.
        "TURNSTILE_JS_API_URL": getattr(
            settings,
            "TURNSTILE_JS_API_URL",
            "https://challenges.cloudflare.com/turnstile/v0/api.js",
        ),
        "TURNSTILE_VERIFY_URL": getattr(
            settings,
            "TURNSTILE_VERIFY_URL",
            "https://challenges.cloudflare.com/turnstile/v0/siteverify",
        ),
        "TURNSTILE_SITEKEY": getattr(
            settings, "TURNSTILE_SITEKEY", "1x00000000000000000000BB"
        ),
        "TURNSTILE_SECRET": getattr(
            settings,
            "TURNSTILE_SECRET",
            "1x0000000000000000000000000000000AA",  # nosec B106: test-only dummy secret
        ),
        "TURNSTILE_TIMEOUT": getattr(settings, "TURNSTILE_TIMEOUT", 5),
        "TURNSTILE_DEFAULT_CONFIG": getattr(settings, "TURNSTILE_DEFAULT_CONFIG", {}),
        "TURNSTILE_PROXIES": getattr(settings, "TURNSTILE_PROXIES", {}),
    }


================================================
FILE: concordia/turnstile/fields.py
================================================
# Originally from
# https://github.com/zmh-program/django-turnstile/blob/main/turnstile/fields.py

import inspect
import json
from logging import getLogger
from typing import Any, Dict
from urllib.error import HTTPError
from urllib.parse import urlencode
from urllib.request import ProxyHandler, Request, build_opener

from django import forms
from django.conf import settings
from django.utils.translation import gettext_lazy as _

from concordia.logging import ConcordiaLogger

from ..turnstile.widgets import TurnstileWidget

# Standard-library logger named after this module.
logger = getLogger(__name__)
# Project logger obtained from ConcordiaLogger; calls in this module pass
# event_code and other context as keyword arguments.
structured_logger = ConcordiaLogger.get_logger(__name__)


class TurnstileField(forms.Field):
    """
    Field that renders a Turnstile widget and validates its response token.

    Behavior:
        - Collects widget configuration from keyword arguments that are not
          consumed by `forms.Field.__init__` and stores them in
          `self.widget_settings`.
        - Extracts specific script URL options (`onload`, `render`, `hl`) from
          `self.widget_settings` and assigns them to
          `self.widget.extra_url` for query string construction.
        - Renders using `TurnstileWidget`.
        - Validates the submitted token by POSTing to the configured
          Turnstile verify endpoint and raises `forms.ValidationError` on
          failure.

    Args:
        **kwargs: Standard `forms.Field` keyword arguments plus any Turnstile
            configuration that should be emitted as `data-*` attributes on the
            widget. The following keys are treated as script URL parameters and
            moved to `self.widget.extra_url`:
            - `onload`
            - `render`
            - `hl`

    Attributes:
        widget (TurnstileWidget): The widget class used to render Turnstile.
        default_error_messages (dict[str, str]): Error messages for invalid or
            failed verification states.

    Requirements:
        The following Django settings must be defined:
        - `TURNSTILE_DEFAULT_CONFIG` (dict)
        - `TURNSTILE_JS_API_URL` (string)
        - `TURNSTILE_VERIFY_URL` (string)
        - `TURNSTILE_SECRET` (string)
        - `TURNSTILE_TIMEOUT` (float or int)
        - `TURNSTILE_PROXIES` (dict or None)

    Statuses and errors:
        - Raises `forms.ValidationError(code="error_turnstile")` when an HTTP
          error occurs while contacting the verify endpoint.
        - Raises `forms.ValidationError(code="invalid_turnstile")` when the
          verify endpoint returns a non-success response.
        - Uses the standard `required` message when no token is provided.
    """

    widget = TurnstileWidget
    default_error_messages = {
        "error_turnstile": _("Turnstile could not be verified."),
        "invalid_turnstile": _("Turnstile could not be verified."),
        "required": _("Please prove you are a human."),
    }

    def __init__(self, **kwargs: Any) -> None:
        """
        Initialize the field and partition keyword arguments.

        Behavior:
            - Splits `kwargs` into those accepted by `forms.Field.__init__`
              and those intended as Turnstile configuration.
            - Moves `onload`, `render`, and `hl` from the configuration into
              `self.widget.extra_url` so they are appended to the API script
              URL as a query string.
            - Retains the remaining configuration in `self.widget_settings` to
              be emitted as `data-*` attributes by `widget_attrs`.
        """
        superclass_parameters = inspect.signature(super().__init__).parameters
        superclass_kwargs: Dict[str, Any] = {}
        # Start from a copy so per-field overrides never mutate the setting.
        widget_settings = settings.TURNSTILE_DEFAULT_CONFIG.copy()
        for key, value in kwargs.items():
            if key in superclass_parameters:
                superclass_kwargs[key] = value
            else:
                widget_settings[key] = value

        widget_url_settings: Dict[str, Any] = {}
        for prop in filter(lambda p: p in widget_settings, ("onload", "render", "hl")):
            widget_url_settings[prop] = widget_settings[prop]
            del widget_settings[prop]
        # Must be set before super().__init__(), which calls widget_attrs().
        self.widget_settings = widget_settings

        super().__init__(**superclass_kwargs)

        self.widget.extra_url = widget_url_settings

    def widget_attrs(self, widget: forms.Widget) -> dict[str, Any]:
        """
        Extend `forms.Field.widget_attrs`.

        Behavior:
            Calls the base implementation to get default attributes, then adds
            one `data-*` attribute per key in `self.widget_settings`. Keys are
            used exactly as given (no case conversion) and prefixed with
            `data-`.

        Returns:
            dict[str, Any]: Combined widget attributes.
        """
        attrs = super().widget_attrs(widget)
        for key, value in self.widget_settings.items():
            attrs["data-%s" % key] = value
        return attrs

    def validate(self, value: str | None) -> None:
        """
        Validate the submitted Turnstile token against the verify endpoint.

        Behavior:
            - Calls `forms.Field.validate` for base required checks.
            - Issues a POST request to `settings.TURNSTILE_VERIFY_URL` using
              `urllib` with `TURNSTILE_PROXIES` and `TURNSTILE_TIMEOUT`.
            - Parses the JSON response and checks the `success` field.

        Args:
            value (str | None): The token returned by the Turnstile widget.

        Raises:
            forms.ValidationError: If Turnstile verification fails or if an HTTP
                error occurs while contacting the verify endpoint.
        """
        super().validate(value)

        structured_logger.debug(
            "Turnstile validation started.",
            event_code="turnstile_validate_start",
            has_token=bool(value),
            verify_url=settings.TURNSTILE_VERIFY_URL,
        )

        opener = build_opener(ProxyHandler(settings.TURNSTILE_PROXIES))
        post_data = urlencode(
            {
                "secret": settings.TURNSTILE_SECRET,
                "response": value,
            }
        ).encode()

        # Supplying a body makes urllib issue a POST.
        request = Request(settings.TURNSTILE_VERIFY_URL, post_data)

        try:
            structured_logger.debug(
                "Submitting token to Turnstile verify endpoint.",
                event_code="turnstile_request_submit",
                verify_url=settings.TURNSTILE_VERIFY_URL,
            )
            response = opener.open(request, timeout=settings.TURNSTILE_TIMEOUT)
            structured_logger.debug(
                "Received response from Turnstile verify endpoint.",
                event_code="turnstile_response_received",
                verify_url=settings.TURNSTILE_VERIFY_URL,
                http_status=getattr(response, "status", None),
            )
        except HTTPError as exc:
            logger.exception("HTTPError received from Turnstile: %s", exc, exc_info=exc)
            structured_logger.exception(
                "HTTPError received from Turnstile verify endpoint.",
                event_code="turnstile_http_error",
                reason="HTTP error while contacting Turnstile verify endpoint",
                reason_code="http_error",
                verify_url=settings.TURNSTILE_VERIFY_URL,
                http_status=getattr(exc, "code", None),
            )
            raise forms.ValidationError(
                self.error_messages["error_turnstile"], code="error_turnstile"
            ) from exc

        response_data = json.loads(response.read().decode("utf-8"))

        # Non-success responses from Turnstile.
        if not response_data.get("success"):
            # No exception is being handled here, so log at ERROR level with
            # logger.error; logger.exception would append an empty
            # "NoneType: None" traceback to the record.
            logger.error(
                "Failure received from Turnstile. Error codes: %s. Messages: %s",
                response_data.get("error-codes"),
                response_data.get("messages"),
            )
            structured_logger.info(
                "Turnstile verification failed.",
                event_code="turnstile_validate_failed",
                verify_url=settings.TURNSTILE_VERIFY_URL,
                error_codes=response_data.get("error-codes"),
                messages=response_data.get("messages"),
            )
            raise forms.ValidationError(
                self.error_messages["invalid_turnstile"], code="invalid_turnstile"
            )

        structured_logger.debug(
            "Turnstile verification succeeded.",
            event_code="turnstile_validate_success",
            verify_url=settings.TURNSTILE_VERIFY_URL,
        )


================================================
FILE: concordia/turnstile/widgets.py
================================================
# Originally from
# https://github.com/zmh-program/django-turnstile/blob/main/turnstile/widgets.py

from typing import Any, Dict, Mapping
from urllib.parse import urlencode

from django import forms
from django.conf import settings


class TurnstileWidget(forms.Widget):
    """
    Form widget that renders a Cloudflare Turnstile challenge.

    Behavior:
        Uses the `forms/widgets/turnstile_widget.html` template. On top of
        the base widget it adds the configured site key to the rendered
        attributes and the Turnstile script URL to the template context.
        Entries in `extra_url` are appended to that URL as a query string.

    Requirements:
        - `settings.TURNSTILE_SITEKEY` must be defined.
        - `settings.TURNSTILE_JS_API_URL` must be defined.

    Attributes:
        template_name (str): Template used to render the widget.
        extra_url (Dict[str, str]): Optional query parameters appended to the
            Turnstile JavaScript URL.
    """

    template_name = "forms/widgets/turnstile_widget.html"

    def __init__(self, *args, **kwargs) -> None:
        """
        Set up the widget with no extra script URL parameters.

        Args:
            *args (Any): Positional arguments forwarded to `forms.Widget`.
            **kwargs (Any): Keyword arguments forwarded to `forms.Widget`.
        """
        self.extra_url = {}
        super().__init__(*args, **kwargs)

    def value_from_datadict(
        self,
        data: "Mapping[str, Any]",
        files: "Mapping[str, Any]",
        name: str,
    ) -> "str | None":
        """
        Read the Turnstile response token out of submitted form data.

        Request Parameters:
            - `cf-turnstile-response` (str): The token provided by the
              Turnstile widget.

        Args:
            data (Mapping[str, Any]): The submitted data.
            files (Mapping[str, Any]): The file data (unused).
            name (str): The field name (unused; the token key is fixed).

        Returns:
            str | None: The token when the key is present, otherwise `None`.
        """
        token = data.get("cf-turnstile-response")
        return token

    def build_attrs(
        self,
        base_attrs: "Dict[str, Any]",
        extra_attrs: "Dict[str, Any] | None" = None,
    ) -> "Dict[str, Any]":
        """
        Override of `forms.Widget.build_attrs`.

        Difference from base:
            After the base method merges the attributes, `data-sitekey` is
            set from `settings.TURNSTILE_SITEKEY`.

        Args:
            base_attrs (Dict[str, Any]): Base HTML attributes.
            extra_attrs (Dict[str, Any] | None): Additional attributes to merge.

        Returns:
            Dict[str, Any]: The merged attributes with `data-sitekey` set.
        """
        merged = super().build_attrs(base_attrs, extra_attrs)
        merged.update({"data-sitekey": settings.TURNSTILE_SITEKEY})
        return merged

    def get_context(
        self,
        name: str,
        value: "Any",
        attrs: "Dict[str, Any] | None",
    ) -> "Dict[str, Any]":
        """
        Override of `forms.Widget.get_context`.

        Difference from base:
            Adds `api_url` to the base context, taken from
            `settings.TURNSTILE_JS_API_URL`. When `extra_url` is non-empty
            its entries are URL-encoded and appended after a `?`.

        Args:
            name (str): Field name.
            value (Any): Field value.
            attrs (Dict[str, Any] | None): HTML attributes for rendering.

        Returns:
            Dict[str, Any]: Template context including `api_url`.
        """
        context = super().get_context(name, value, attrs)
        script_url = settings.TURNSTILE_JS_API_URL
        if self.extra_url:
            script_url = script_url + "?" + urlencode(self.extra_url)
        context["api_url"] = script_url
        return context


================================================
FILE: concordia/urls.py
================================================
from django.conf import settings
from django.contrib import admin
from django.http import Http404, HttpResponseForbidden
from django.urls import include, path
from django.urls.converters import register_converter
from django.views.defaults import page_not_found, permission_denied, server_error
from django.views.generic import RedirectView

from exporter import views as exporter_views
from prometheus_metrics.views import MetricsView

from . import converters, views

# Register the custom path converters so that the `<uslug:...>` and
# `<item_id:...>` placeholders used in the routes below can be resolved.
register_converter(converters.UnicodeSlugConverter, "uslug")
register_converter(converters.ItemIdConverter, "item_id")

# Campaign, project, item and asset routes. This (patterns, app_name) pair is
# handed to `include()` in `urlpatterns`, where it is mounted under
# "campaigns/" with the "transcriptions" namespace.
#
# Django tries the patterns in the order listed and uses the first match, so
# routes ending in a literal segment (export, report, reviewable,
# next-*-asset) are listed ahead of the slug-only routes with the same number
# of segments.
tx_urlpatterns = (
    [
        # Campaign listings.
        path("", views.campaigns.CampaignListView.as_view(), name="campaign-list"),
        path(
            "completed/",
            views.campaigns.CompletedCampaignListView.as_view(),
            name="completed-campaign-list",
        ),
        # Single campaign: the "reviewable" variant comes before the plain
        # detail page.
        path(
            "<uslug:slug>/reviewable/",
            views.campaigns.FilteredCampaignDetailView.as_view(),
            name="filtered-campaign-detail",
        ),
        path(
            "<uslug:slug>/",
            views.campaigns.CampaignDetailView.as_view(),
            name="campaign-detail",
        ),
        # Exports at campaign, project and item level (served by the
        # `exporter` app's views).
        path(
            "<uslug:campaign_slug>/export/csv/",
            exporter_views.ExportCampaignToCSV.as_view(),
            name="campaign-export-csv",
        ),
        path(
            "<uslug:campaign_slug>/export/bagit/",
            exporter_views.ExportCampaignToBagIt.as_view(),
            name="campaign-export-bagit",
        ),
        path(
            "<uslug:campaign_slug>/<uslug:project_slug>/export/bagit/",
            exporter_views.ExportProjectToBagIt.as_view(),
            name="project-export-bagit",
        ),
        path(
            (
                "<uslug:campaign_slug>/<uslug:project_slug>/"
                "<item_id:item_id>/export/bagit/"
            ),
            exporter_views.ExportItemToBagIt.as_view(),
            name="item-export-bagit",
        ),
        path(
            "<uslug:campaign_slug>/report/",
            views.campaigns.ReportCampaignView.as_view(),
            name="campaign-report",
        ),
        # Listed before asset-detail, whose final `<uslug:slug>` segment sits
        # in the same position as the literal "reviewable" here.
        path(
            "<uslug:campaign_slug>/<uslug:project_slug>/<item_id:item_id>/reviewable/",
            views.items.FilteredItemDetailView.as_view(),
            name="filtered-item-detail",
        ),
        path(
            (
                "<uslug:campaign_slug>/<uslug:project_slug>/"
                "<item_id:item_id>/<uslug:slug>/"
            ),
            views.assets.AssetDetailView.as_view(),
            name="asset-detail",
        ),
        # n.b. this must be above project-detail to avoid being seen as a project slug:
        path(
            "<uslug:campaign_slug>/next-transcribable-asset/",
            views.assets.redirect_to_next_transcribable_campaign_asset,
            name="redirect-to-next-transcribable-campaign-asset",
        ),
        path(
            "<uslug:campaign_slug>/next-reviewable-asset/",
            views.assets.redirect_to_next_reviewable_campaign_asset,
            name="redirect-to-next-reviewable-campaign-asset",
        ),
        # Project pages: again the "reviewable" variant precedes the plain
        # detail route.
        path(
            "<uslug:campaign_slug>/<uslug:slug>/reviewable/",
            views.projects.FilteredProjectDetailView.as_view(),
            name="filtered-project-detail",
        ),
        path(
            "<uslug:campaign_slug>/<uslug:slug>/",
            views.projects.ProjectDetailView.as_view(),
            name="project-detail",
        ),
        # Item page: the last of the three-segment routes.
        path(
            "<uslug:campaign_slug>/<uslug:project_slug>/<item_id:item_id>/",
            views.items.ItemDetailView.as_view(),
            name="item-detail",
        ),
    ],
    "transcriptions",
)

# Site-wide URL configuration. Django walks this list from top to bottom and
# dispatches to the first pattern that matches, so the order of entries is
# significant. Each route is declared exactly once: a second, identical
# "help-center/" entry could never be matched and would only duplicate the
# "help-center" route name.
urlpatterns = [
    path("", views.HomeView.as_view(), name="homepage"),
    path("healthz", views.healthz, name="health-check"),
    path("letter", views.accounts.account_letter, name="user-letter"),
    path("about/", views.simple_pages.about_simple_page, name="about"),
    # These patterns are to make sure various links to help-center URLs don't break
    # when the URLs are changed to not include help-center and can be removed after
    # all links are updated.
    path(
        "help-center/",
        RedirectView.as_view(pattern_name="welcome-guide"),
        name="help-center",
    ),
    path(
        "help-center/welcome-guide/", RedirectView.as_view(pattern_name="welcome-guide")
    ),
    path(
        "help-center/welcome-guide-esp/",
        RedirectView.as_view(pattern_name="welcome-guide-spanish"),
    ),
    path(
        "help-center/<slug:page_slug>-esp/",
        views.simple_pages.HelpCenterSpanishRedirectView.as_view(),
    ),
    path(
        "help-center/<slug:page_slug>/",
        views.simple_pages.HelpCenterRedirectView.as_view(),
    ),
    # End of help-center patterns
    # Simple pages (English). The fixed slugs come before the catch-all
    # "get-started/<uslug:slug>/" route so they keep their own route names.
    path("get-started/", views.simple_pages.simple_page, name="welcome-guide"),
    path(
        "get-started/how-to-transcribe/",
        views.simple_pages.simple_page,
        name="transcription-basic-rules",
    ),
    path(
        "get-started/how-to-review/",
        views.simple_pages.simple_page,
        name="how-to-review",
    ),
    path("get-started/how-to-tag/", views.simple_pages.simple_page, name="how-to-tag"),
    path(
        "get-started/<uslug:slug>/", views.simple_pages.simple_page, name="simple-page"
    ),
    # Simple pages (Spanish), laid out the same way as the English ones.
    path(
        "get-started-esp/",
        views.simple_pages.simple_page,
        name="welcome-guide-spanish",
    ),
    path(
        "get-started-esp/how-to-transcribe-esp/",
        views.simple_pages.simple_page,
        name="how-to-transcribe-spanish",
    ),
    path(
        "get-started-esp/how-to-review-esp/",
        views.simple_pages.simple_page,
        name="how-to-review-spanish",
    ),
    path(
        "get-started-esp/how-to-tag-esp/",
        views.simple_pages.simple_page,
        name="how-to-tag-spanish",
    ),
    path(
        "get-started-esp/<uslug:slug>/",
        views.simple_pages.simple_page,
        name="simple-page-spanish",
    ),
    path(
        "for-educators/",
        views.simple_pages.simple_page,
        name="for-educators",
    ),
    path(
        "for-staff/",
        views.simple_pages.simple_page,
        name="for-staff",
    ),
    # Permanent redirect to "guidelines" that keeps the query string.
    path(
        "resources/",
        RedirectView.as_view(
            pattern_name="guidelines", permanent=True, query_string=True
        ),
        name="resources",
    ),
    path(
        "service/",
        views.simple_pages.simple_page,
        name="service",
    ),
    path(
        "guidelines/",
        views.simple_pages.simple_page,
        name="guidelines",
    ),
    path(
        "programs/",
        views.simple_pages.simple_page,
        name="programs",
    ),
    path(
        "latest/",
        RedirectView.as_view(pattern_name="about", permanent=True, query_string=True),
    ),
    path("questions/", views.simple_pages.simple_page, name="questions"),
    path(
        "contact/",
        RedirectView.as_view(url="https://ask.loc.gov/crowd"),
        name="contact",
    ),
    # Campaign/topic browsing and the "next asset" redirects.
    path(
        "campaigns-topics/",
        views.campaigns.CampaignTopicListView.as_view(),
        name="campaign-topic-list",
    ),
    path(
        "topics/<uslug:slug>/",
        views.topics.TopicDetailView.as_view(),
        name="topic-detail",
    ),
    path(
        "topics/<uslug:topic_slug>/next-transcribable-asset/",
        views.assets.redirect_to_next_transcribable_topic_asset,
        name="redirect-to-next-transcribable-topic-asset",
    ),
    path(
        "topics/<uslug:topic_slug>/next-reviewable-asset/",
        views.assets.redirect_to_next_reviewable_topic_asset,
        name="redirect-to-next-reviewable-topic-asset",
    ),
    path(
        "next-transcribable-asset/",
        views.assets.redirect_to_next_transcribable_asset,
        name="redirect-to-next-transcribable-asset",
    ),
    path(
        "next-reviewable-asset/",
        views.assets.redirect_to_next_reviewable_asset,
        name="redirect-to-next-reviewable-asset",
    ),
    # Everything in tx_urlpatterns lives under "campaigns/" in the
    # "transcriptions" namespace.
    path("campaigns/", include(tx_urlpatterns, namespace="transcriptions")),
    # Endpoints served by views.ajax.
    path(
        "reserve-asset/<int:asset_pk>/", views.ajax.reserve_asset, name="reserve-asset"
    ),
    path(
        "assets/<int:asset_pk>/transcriptions/save/",
        views.ajax.save_transcription,
        name="save-transcription",
    ),
    path(
        "transcriptions/<int:pk>/submit/",
        views.ajax.submit_transcription,
        name="submit-transcription",
    ),
    path(
        "transcriptions/<int:pk>/review/",
        views.ajax.review_transcription,
        name="review-transcription",
    ),
    path(
        "assets/<int:asset_pk>/transcriptions/generate-ocr/",
        views.ajax.generate_ocr_transcription,
        name="generate-ocr-transcription",
    ),
    path(
        "assets/<int:asset_pk>/transcriptions/rollback/",
        views.ajax.rollback_transcription,
        name="rollback-transcription",
    ),
    path(
        "assets/<int:asset_pk>/transcriptions/rollforward/",
        views.ajax.rollforward_transcription,
        name="rollforward-transcription",
    ),
    path(
        "assets/<int:asset_pk>/tags/submit/", views.ajax.submit_tags, name="submit-tags"
    ),
    path(
        "account/ajax-status/",
        views.ajax.ajax_session_status,
        name="ajax-session-status",
    ),
    path("account/ajax-messages/", views.ajax.ajax_messages, name="ajax-messages"),
    # Account routes. The project-specific views are listed before the
    # django_registration / django.contrib.auth includes, so they are tried
    # first for any path both would match.
    path(
        "account/register/",
        views.accounts.ConcordiaRegistrationView.as_view(),
        name="registration_register",
    ),
    path(
        "account/login/",
        views.accounts.ConcordiaLoginView.as_view(),
        name="registration_login",
    ),
    path("account/get_pages/", views.accounts.get_pages, name="get_pages"),
    path(
        "account/profile/",
        views.accounts.AccountProfileView.as_view(),
        name="user-profile",
    ),
    path(
        "account/password_reset/",
        views.accounts.ConcordiaPasswordResetRequestView.as_view(),
        name="password_reset",
    ),
    path(
        "account/reset/<uidb64>/<token>/",
        views.accounts.ConcordiaPasswordResetConfirmView.as_view(),
        name="password_reset_confirm",
    ),
    path("account/", include("django_registration.backends.activation.urls")),
    path("account/", include("django.contrib.auth.urls")),
    path(
        "account/email_confirmation/<str:confirmation_key>/",
        views.accounts.EmailReconfirmationView.as_view(),
        name="email-reconfirmation",
    ),
    path(
        "account/delete/",
        views.accounts.AccountDeletionView.as_view(),
        name="account-deletion",
    ),
    path(
        ".well-known/change-password",  # https://wicg.github.io/change-password-url/
        RedirectView.as_view(pattern_name="password_change"),
    ),
    path("admin/", admin.site.urls),
    # Internal support assists:
    path("error/500/", server_error),
    path("error/404/", page_not_found, {"exception": Http404()}),
    path("error/429/", views.rate_limit.ratelimit_view),
    path("error/403/", permission_denied, {"exception": HttpResponseForbidden()}),
    path("tinymce/", include("tinymce.urls")),
    path("metrics", MetricsView.as_view(), name="prometheus-django-metrics"),
    path("robots.txt", include("robots.urls")),
    path(
        "maintenance-mode/off/",
        views.maintenance_mode.maintenance_mode_off,
        name="maintenance_mode_off",
    ),
    path(
        "maintenance-mode/on/",
        views.maintenance_mode.maintenance_mode_on,
        name="maintenance_mode_on",
    ),
    path(
        "maintenance-mode/frontend/available",
        views.maintenance_mode.maintenance_mode_frontend_available,
        name="maintenance_mode_frontend_available",
    ),
    path(
        "maintenance-mode/frontend/unavailable",
        views.maintenance_mode.maintenance_mode_frontend_unavailable,
        name="maintenance_mode_frontend_unavailable",
    ),
    path(
        "api/visualization/<slug:name>/",
        views.visualizations.VisualizationDataView.as_view(),
        name="visualization",
    ),
]

if settings.DEBUG:
    # Development-only routes; the imports below are needed only when DEBUG
    # is enabled, so they stay inside this branch.
    import debug_toolbar
    from django.conf.urls.static import static
    from django.views.generic import TemplateView

    from concordia.api import api as concordia_api

    # The debug toolbar route is placed ahead of every other pattern.
    urlpatterns.insert(0, path("__debug__/", include(debug_toolbar.urls)))

    # Routes under MEDIA_URL backed by files in MEDIA_ROOT.
    urlpatterns.extend(static(settings.MEDIA_URL, document_root=settings.MEDIA_ROOT))

    # Template-only transcription page and the API routes.
    urlpatterns.extend(
        [
            path(
                "transcription/",
                TemplateView.as_view(
                    template_name="transcriptions/transcription.html"
                ),
                name="transcription",
            ),
            path("api/", concordia_api.urls, name="api"),
        ]
    )


================================================
FILE: concordia/utils/__init__.py
================================================
from secrets import token_hex

from django.contrib.auth.models import User

from concordia.logging import ConcordiaLogger
from concordia.templatetags.concordia_media_tags import asset_media_url

# Public names exported by `from concordia.utils import *`; each one is a
# function defined in this module.
__all__ = [
    "get_anonymous_user",
    "request_accepts_json",
    "get_or_create_reservation_token",
    "get_image_urls_from_asset",
]

# Module-level structured logger, named after this module; used by
# get_or_create_reservation_token to record token creation and reuse.
structured_logger = ConcordiaLogger.get_logger(__name__)


def get_anonymous_user():
    """
    Return the user named "anonymous", creating it if it does not exist yet.

    This is the default Concordia user for someone working on the site
    without logging in first.
    """
    anonymous_username = "anonymous"
    try:
        anonymous = User.objects.get(username=anonymous_username)
    except User.DoesNotExist:
        # First use: no such account exists yet, so create it now.
        anonymous = User.objects.create_user(username=anonymous_username)
    return anonymous


def request_accepts_json(request):
    """
    Report whether the request's Accept header mentions JSON.

    Returns True when the literal text "application/json" occurs anywhere in
    the `Accept` header. A missing header is treated as "*/*", which does not
    contain that text, so the result is False.
    """
    return "application/json" in request.headers.get("Accept", "*/*")


def get_or_create_reservation_token(request):
    """
    Return the session's reservation token, creating one if it is missing.

    A new token is 44 hex digits (22 random bytes). When the request has a
    `user` attribute, the user's database id is appended, left-padded with
    zeroes to at least 6 characters; a user without an id is given the id of
    the "anonymous" user. The token is stored in
    `request.session["reservation_token"]` and reused on later calls.
    """
    session = request.session

    if "reservation_token" in session:
        structured_logger.info(
            "Reservation token reused.",
            event_code="reservation_token_reused",
            reservation_token=session["reservation_token"],
        )
        return session["reservation_token"]

    session["reservation_token"] = token_hex(22)
    user = getattr(request, "user", None)
    if user is not None:
        uid = user.id
        if uid is None:
            # No id on the request's user: fall back to the shared account.
            uid = get_anonymous_user().id
        session["reservation_token"] += str(uid).zfill(6)
        structured_logger.info(
            "Reservation token created.",
            event_code="reservation_token_created",
            reservation_token=session["reservation_token"],
            user=user,
        )
    return session["reservation_token"]


def get_image_urls_from_asset(asset):
    """
    Return `(image_url, thumbnail_url)` for an Asset.

    `image_url` is whatever `asset_media_url` returns for the asset. The
    thumbnail is the asset's `download_url` when that URL contains "iiif",
    with an "http://tile.loc.gov" prefix upgraded to HTTPS; otherwise the
    thumbnail is the same as `image_url`.
    """
    full_size_url = asset_media_url(asset)
    download_url = asset.download_url

    if not (download_url and "iiif" in download_url):
        return full_size_url, full_size_url

    secure_download_url = download_url.replace(
        "http://tile.loc.gov", "https://tile.loc.gov"
    )
    return full_size_url, secure_download_url


================================================
FILE: concordia/utils/celery.py
================================================
from celery import Task

from concordia.celery import app as concordia_celery_app


def get_registered_task(name: str) -> Task:
    """
    Look up a Celery task in the app registry by its fully qualified name.

    This lets callers obtain a task object without importing the task's
    module directly, which helps avoid circular imports. It is also an
    alternative to `app.send_task`, which ignores settings such as
    `ALWAYS_EAGER`.

    Args:
        name (str): Fully qualified task name, for example
            "myapp.tasks.my_task".

    Returns:
        Task: The registered Celery task object.

    Raises:
        RuntimeError: If the task name is not found in the registry. The
            original `KeyError` is attached as the cause.
    """
    try:
        task = concordia_celery_app.tasks[name]
    except KeyError as missing:
        message = f"Task {name} is not registered. Did you typo it?"
        raise RuntimeError(message) from missing
    return task


================================================
FILE: concordia/utils/constants.py
================================================
from django.contrib import messages

# Page sizes for the asset, project and item listings.
ASSETS_PER_PAGE = 36
PROJECTS_PER_PAGE = 36
ITEMS_PER_PAGE = 36

# Pattern matching an "http://" or "https://" scheme prefix.
URL_REGEX = r"http[s]?://"

# Maps each message level value in `messages.DEFAULT_LEVELS` to its
# lower-cased level name.
MESSAGE_LEVEL_NAMES = {
    level: name.lower() for name, level in messages.DEFAULT_LEVELS.items()
}


================================================
FILE: concordia/utils/next_asset/__init__.py
================================================
from concordia.logging import ConcordiaLogger
from concordia.models import (
    NextReviewableCampaignAsset,
    NextReviewableTopicAsset,
    NextTranscribableCampaignAsset,
    NextTranscribableTopicAsset,
)

from .reviewable import (
    find_and_order_potential_reviewable_campaign_assets,
    find_and_order_potential_reviewable_topic_assets,
    find_invalid_next_reviewable_campaign_assets,
    find_invalid_next_reviewable_topic_assets,
    find_new_reviewable_campaign_assets,
    find_new_reviewable_topic_assets,
    find_next_reviewable_campaign_asset,
    find_next_reviewable_campaign_assets,
    find_next_reviewable_topic_asset,
    find_next_reviewable_topic_assets,
    find_reviewable_campaign_asset,
    find_reviewable_topic_asset,
)
from .transcribable import (
    find_and_order_potential_transcribable_campaign_assets,
    find_and_order_potential_transcribable_topic_assets,
    find_invalid_next_transcribable_campaign_assets,
    find_invalid_next_transcribable_topic_assets,
    find_new_transcribable_campaign_assets,
    find_new_transcribable_topic_assets,
    find_next_transcribable_campaign_asset,
    find_next_transcribable_campaign_assets,
    find_next_transcribable_topic_asset,
    find_next_transcribable_topic_assets,
    find_transcribable_campaign_asset,
    find_transcribable_topic_asset,
)

# Public API of the `next_asset` package. Every name except
# "remove_next_asset_objects" is re-exported from the `.transcribable` and
# `.reviewable` subpackages imported above; "remove_next_asset_objects" is
# defined in this module.
__all__ = [
    "find_and_order_potential_transcribable_campaign_assets",
    "find_and_order_potential_transcribable_topic_assets",
    "find_new_transcribable_campaign_assets",
    "find_new_transcribable_topic_assets",
    "find_next_transcribable_campaign_asset",
    "find_next_transcribable_topic_asset",
    "find_next_transcribable_campaign_assets",
    "find_next_transcribable_topic_assets",
    "find_transcribable_campaign_asset",
    "find_transcribable_topic_asset",
    "find_and_order_potential_reviewable_campaign_assets",
    "find_and_order_potential_reviewable_topic_assets",
    "find_new_reviewable_campaign_assets",
    "find_new_reviewable_topic_assets",
    "find_next_reviewable_campaign_assets",
    "find_next_reviewable_topic_assets",
    "find_next_reviewable_campaign_asset",
    "find_next_reviewable_topic_asset",
    "find_reviewable_campaign_asset",
    "find_reviewable_topic_asset",
    "remove_next_asset_objects",
    "find_invalid_next_reviewable_campaign_assets",
    "find_invalid_next_reviewable_topic_assets",
    "find_invalid_next_transcribable_campaign_assets",
    "find_invalid_next_transcribable_topic_assets",
]

# Module-level structured logger, named after this package.
structured_logger = ConcordiaLogger.get_logger(__name__)


def remove_next_asset_objects(asset_id):
    """
    Delete every next-asset row that refers to the given asset.

    Rows are removed, in this order, from:
    - NextTranscribableCampaignAsset
    - NextTranscribableTopicAsset
    - NextReviewableCampaignAsset
    - NextReviewableTopicAsset

    Typically used once an asset should no longer be offered from these
    tables (e.g., after its transcription or review status changes, or when
    a user reserves it).

    Args:
        asset_id (int): The ID of the asset to remove from next-asset tables.
    """
    structured_logger.info(
        "Removing next asset objects",
        event_code="remove_next_asset_objects",
        asset_id=asset_id,
    )
    next_asset_models = (
        NextTranscribableCampaignAsset,
        NextTranscribableTopicAsset,
        NextReviewableCampaignAsset,
        NextReviewableTopicAsset,
    )
    for next_asset_model in next_asset_models:
        next_asset_model.objects.filter(asset_id=asset_id).delete()


================================================
FILE: concordia/utils/next_asset/reviewable/__init__.py
================================================
from .campaign import (
    find_and_order_potential_reviewable_campaign_assets,
    find_invalid_next_reviewable_campaign_assets,
    find_new_reviewable_campaign_assets,
    find_next_reviewable_campaign_asset,
    find_next_reviewable_campaign_assets,
    find_reviewable_campaign_asset,
)
from .topic import (
    find_and_order_potential_reviewable_topic_assets,
    find_invalid_next_reviewable_topic_assets,
    find_new_reviewable_topic_assets,
    find_next_reviewable_topic_asset,
    find_next_reviewable_topic_assets,
    find_reviewable_topic_asset,
)

# Public API of the `reviewable` subpackage: the campaign-scoped and
# topic-scoped helpers re-exported from `.campaign` and `.topic` above.
__all__ = [
    "find_new_reviewable_campaign_assets",
    "find_next_reviewable_campaign_assets",
    "find_reviewable_campaign_asset",
    "find_and_order_potential_reviewable_campaign_assets",
    "find_next_reviewable_campaign_asset",
    "find_and_order_potential_reviewable_topic_assets",
    "find_new_reviewable_topic_assets",
    "find_next_reviewable_topic_asset",
    "find_next_reviewable_topic_assets",
    "find_reviewable_topic_asset",
    "find_invalid_next_reviewable_campaign_assets",
    "find_invalid_next_reviewable_topic_assets",
]


================================================
FILE: concordia/utils/next_asset/reviewable/campaign.py
================================================
from typing import Dict

from django.contrib.auth.models import User
from django.db import transaction
from django.db.models import Case, IntegerField, Q, QuerySet, Subquery, Value, When

from concordia import models as concordia_models
from concordia.logging import ConcordiaLogger
from concordia.utils.celery import get_registered_task

# Structured logger for this module; the short-circuit helpers below use it
# to record which asset, if any, was chosen.
structured_logger = ConcordiaLogger.get_logger(__name__)


def _reserved_asset_ids_subq(
    campaign: concordia_models.Campaign,
) -> "QuerySet[Dict[str, int]]":
    """
    Build a queryset of the asset ids that have a reservation in a campaign.

    Behavior:
        Selects every AssetTranscriptionReservation whose asset belongs to
        `campaign` and projects it down to `asset_id`. The result is meant to
        be wrapped in `Subquery(...)` inside an `exclude(pk__in=...)` clause.

    Args:
        campaign (concordia_models.Campaign): Campaign whose reserved
            assets should be excluded.

    Returns:
        QuerySet[Dict[str, int]]: A queryset of dictionaries with a single key
            "asset_id" corresponding to reserved assets.
    """
    campaign_reservations = (
        concordia_models.AssetTranscriptionReservation.objects.filter(
            asset__campaign=campaign
        )
    )
    return campaign_reservations.values("asset_id")


def _eligible_reviewable_base_qs(
    campaign: concordia_models.Campaign,
    user: User | None = None,
) -> "QuerySet[concordia_models.Asset]":
    """
    Return the base queryset of reviewable assets in a campaign.

    Behavior:
        Keeps assets of the campaign whose project, item and asset are all
        published and whose transcription status is `SUBMITTED`. When a
        truthy `user` is given, assets with a transcription by that user are
        excluded.

    Args:
        campaign (concordia_models.Campaign): Campaign scope for filtering.
        user (User | None): If provided, exclude assets transcribed by this user.

    Returns:
        QuerySet[concordia_models.Asset]: Reviewable assets, with `item` and
            `item__project` selected via `select_related`.
    """
    criteria = {
        "campaign_id": campaign.id,
        "item__project__published": True,
        "item__published": True,
        "published": True,
        "transcription_status": concordia_models.TranscriptionStatus.SUBMITTED,
    }
    reviewable = concordia_models.Asset.objects.filter(**criteria).select_related(
        "item", "item__project"
    )
    if not user:
        return reviewable
    return reviewable.exclude(transcription__user=user.id)


def _next_seq_after(pk: int | None) -> int | None:
    """
    Look up the `sequence` value of the asset with the given primary key.

    Behavior:
        Small helper for ordering logic that needs to know where an asset
        sits within its series.

    Args:
        pk (int | None): Asset primary key whose sequence to resolve.

    Returns:
        int | None: The asset's sequence number, or None if `pk` is falsy
            or the asset does not exist.
    """
    if pk:
        sequences = concordia_models.Asset.objects.filter(pk=pk).values_list(
            "sequence", flat=True
        )
        # `.first()` yields None when no asset has this primary key.
        return sequences.first()
    return None


@transaction.atomic
def _find_reviewable_in_item(
    campaign: concordia_models.Campaign,
    user: User,
    *,
    item_id: str,
    after_asset_pk: int | None,
) -> "concordia_models.Asset | None":
    """
    Pick the next reviewable asset from one item of a campaign.

    Behavior:
        Short-circuit that keeps the reviewer inside the item they are
        already working on, so review proceeds through neighbouring assets.

    Eligibility:
        - Asset, Item, and Project are published.
        - Asset transcription status is `SUBMITTED`.
        - Asset has no reservation.
        - Asset has no transcription by the current user.

    Ordering:
        - When `after_asset_pk` names an asset of this item and campaign,
          only assets whose (sequence, id) pair is strictly greater than that
          asset's pair are considered.
        - In every other case (no anchor, unknown anchor, or an anchor from a
          different item or campaign) all eligible assets are considered.
        - The first asset by (sequence, id) is returned.

    Args:
        campaign (concordia_models.Campaign): Campaign scope.
        user (User): Current user; used to exclude their own work.
        item_id (str): Identifier of the item to stay within.
        after_asset_pk (int | None): Asset primary key to advance from.

    Returns:
        concordia_models.Asset | None: The chosen asset, fetched with
            `select_for_update(skip_locked=True, of=("self",))`, or None if
            nothing matches.
    """
    item_reservations = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__item__item_id=item_id,
        asset__item__project__campaign=campaign,
    )
    reserved_ids = item_reservations.values("asset_id")

    candidates = concordia_models.Asset.objects.filter(
        item__item_id=item_id,
        item__project__campaign=campaign,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status=concordia_models.TranscriptionStatus.SUBMITTED,
    )
    candidates = candidates.exclude(pk__in=Subquery(reserved_ids))
    candidates = candidates.exclude(transcription__user=user.id)

    if after_asset_pk is not None:
        anchor_lookup = concordia_models.Asset.objects.only(
            "id", "sequence", "item_id", "item"
        ).select_related("item")
        try:
            anchor = anchor_lookup.get(pk=after_asset_pk)
            # The campaign comparison is only evaluated when the item matches.
            anchor_in_scope = (
                anchor.item.item_id == item_id
                and anchor.item.project.campaign_id == campaign.id
            )
            if anchor_in_scope:
                later_sequence = Q(sequence__gt=anchor.sequence)
                tie_break = Q(sequence=anchor.sequence) & Q(id__gt=after_asset_pk)
                candidates = candidates.filter(later_sequence | tie_break)
        except concordia_models.Asset.DoesNotExist:
            # Unknown anchor: fall back to the earliest eligible asset.
            pass

    chosen = (
        candidates.select_for_update(skip_locked=True, of=("self",))
        .select_related("item", "item__project")
        .order_by("sequence", "id")
        .first()
    )

    structured_logger.debug(
        "Item short-circuit (campaign reviewable) resolved.",
        event_code="reviewable_item_short_circuit_campaign",
        campaign=campaign,
        item_id=item_id,
        after_asset_pk=after_asset_pk,
        chosen_asset_id=getattr(chosen, "id", None),
    )
    return chosen


@transaction.atomic
def _find_reviewable_in_project(
    campaign: concordia_models.Campaign,
    user: User,
    *,
    project_slug: str,
    after_asset_pk: int | None,
) -> "concordia_models.Asset | None":
    """
    Pick the first eligible reviewable asset from one project of a campaign.

    Behavior:
        Short-circuit that keeps the reviewer inside a project. Because
        sequence numbers are per item, the result is simply the first
        eligible asset, not the one "after" a given asset.

    Eligibility:
        - Same campaign and project.
        - Asset, Item, and Project are published.
        - Asset transcription status is `SUBMITTED`.
        - Asset has no reservation.
        - Asset has no transcription by the current user.

    Ordering:
        Deterministic by (item__item_id, sequence, id).

    Args:
        campaign (concordia_models.Campaign): Campaign scope.
        user (User): Current user; used to exclude their own work.
        project_slug (str): Slug of the project to stay within.
        after_asset_pk (int | None): Accepted for parity with the item
            variant; it is only logged and does not affect the selection.

    Returns:
        concordia_models.Asset | None: The chosen asset, fetched with
            `select_for_update(skip_locked=True, of=("self",))`, or None if
            nothing matches.
    """
    project_reservations = (
        concordia_models.AssetTranscriptionReservation.objects.filter(
            asset__item__project__slug=project_slug,
            asset__item__project__campaign=campaign,
        )
    )
    reserved_ids = project_reservations.values("asset_id")

    candidates = concordia_models.Asset.objects.filter(
        item__project__campaign=campaign,
        item__project__slug=project_slug,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status=concordia_models.TranscriptionStatus.SUBMITTED,
    )
    candidates = candidates.exclude(pk__in=Subquery(reserved_ids))
    candidates = candidates.exclude(transcription__user=user.id)

    chosen = (
        candidates.select_for_update(skip_locked=True, of=("self",))
        .select_related("item", "item__project")
        .order_by("item__item_id", "sequence", "id")
        .first()
    )

    structured_logger.debug(
        "Project short-circuit (campaign reviewable) resolved.",
        event_code="reviewable_project_short_circuit_campaign",
        campaign=campaign,
        project_slug=project_slug,
        after_asset_pk=after_asset_pk,
        chosen_asset_id=getattr(chosen, "id", None),
    )
    return chosen


def find_new_reviewable_campaign_assets(
    campaign: concordia_models.Campaign,
    user: User | None = None,
) -> "QuerySet[concordia_models.Asset]":
    """
    Return the campaign's assets that could be added to the next-asset table.

    Behavior:
        Starts from published assets (with published item and project) in the
        campaign whose status is `SUBMITTED`, then drops assets that have a
        reservation and assets that already have a
        NextReviewableCampaignAsset row for this campaign. When a truthy
        `user` is given, assets with a transcription by that user are dropped
        as well.

    Args:
        campaign (concordia_models.Campaign): Campaign to filter by.
        user (User | None): If provided, exclude assets transcribed by this user.

    Returns:
        QuerySet[concordia_models.Asset]: Eligible assets ordered by sequence.
    """
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__campaign=campaign
    ).values("asset_id")
    already_queued_ids = concordia_models.NextReviewableCampaignAsset.objects.filter(
        campaign=campaign
    ).values("asset_id")

    published_assets = concordia_models.Asset.objects.filter(
        campaign_id=campaign.id,
        item__project__published=True,
        item__published=True,
        published=True,
    )
    submitted_assets = published_assets.filter(
        transcription_status=concordia_models.TranscriptionStatus.SUBMITTED
    )
    candidates = (
        submitted_assets.exclude(pk__in=Subquery(reserved_ids))
        .exclude(pk__in=Subquery(already_queued_ids))
        .order_by("sequence")
    )

    if not user:
        return candidates
    return candidates.exclude(transcription__user=user.id)


def find_next_reviewable_campaign_assets(
    campaign: concordia_models.Campaign,
    user: User,
) -> "QuerySet[concordia_models.NextReviewableCampaignAsset]":
    """
    List the campaign's cached reviewable rows that the user may review.

    Behavior:
        Selects NextReviewableCampaignAsset rows for the campaign and drops
        every row whose `transcriber_ids` contains the user's id.

    Args:
        campaign (concordia_models.Campaign): Campaign whose cache rows are
            read.
        user (User): Requesting user.

    Returns:
        QuerySet[concordia_models.NextReviewableCampaignAsset]: Cache rows
            usable by this user.
    """
    campaign_rows = concordia_models.NextReviewableCampaignAsset.objects.filter(
        campaign=campaign
    )
    return campaign_rows.exclude(transcriber_ids__contains=[user.id])


@transaction.atomic
def find_reviewable_campaign_asset(
    campaign: concordia_models.Campaign,
    user: User,
) -> "concordia_models.Asset | None":
    """
    Pick one asset in a campaign for the given user to review.

    Behavior:
        Looks for a usable row in the NextReviewableCampaignAsset cache first
        and loads the Asset it points at. When the cache yields nothing, the
        Asset table is queried directly through
        `find_new_reviewable_campaign_assets` and the cache population task
        is queued once that query has run.

    Concurrency:
        Both the cache lookup and the Asset lookup use
        `select_for_update(skip_locked=True, of=("self",))`, so each query
        locks only rows of the table it selects from and passes over rows
        that are already locked.

    Args:
        campaign (concordia_models.Campaign): Campaign to search within.
        user (User): Requesting user; assets they transcribed are excluded.

    Returns:
        concordia_models.Asset | None: The selected asset with `item` and
            `item__project` loaded, or None when no row could be selected.
    """
    cached_asset_id = (
        find_next_reviewable_campaign_assets(campaign, user)
        .select_for_update(skip_locked=True, of=("self",))
        .values_list("asset_id", flat=True)
        .first()
    )
    used_fallback = not cached_asset_id

    if used_fallback:
        # Nothing usable in the NextReviewableCampaignAsset table for this
        # campaign and user, so look the asset up directly.
        structured_logger.debug(
            "No cached assets available, falling back to manual lookup",
            event_code="reviewable_fallback_manual_lookup",
            campaign=campaign,
            user=user,
        )
        candidates = find_new_reviewable_campaign_assets(campaign, user)
    else:
        candidates = concordia_models.Asset.objects.filter(id=cached_asset_id)

    # of=("self",) restricts the row lock to the Asset table instead of also
    # locking the joined item/project rows.
    locked_candidates = candidates.select_for_update(skip_locked=True, of=("self",))
    asset = locked_candidates.select_related("item", "item__project").first()

    if used_fallback:
        # Queue the populate task only after our own query has run; otherwise
        # the task could claim every valid asset first and leave this request
        # with nothing.
        structured_logger.debug(
            "Spawned background task to populate cache",
            event_code="reviewable_cache_population_triggered",
            campaign=campaign,
            user=user,
        )
        task_name = (
            "concordia.tasks.next_asset.reviewable.populate_next_reviewable_for_campaign"
        )
        get_registered_task(task_name).delay(campaign.id)

    return asset


def find_and_order_potential_reviewable_campaign_assets(
    campaign: concordia_models.Campaign,
    user: User,
    project_slug: str,
    item_id: str,
    asset_pk: int | None,
) -> "QuerySet[concordia_models.NextReviewableCampaignAsset]":
    """
    Rank the user's cached reviewable rows by closeness to their position.

    Behavior:
        Takes the rows returned by `find_next_reviewable_campaign_assets` and
        annotates each with three integer flags, then sorts on them.

    Annotations (each 0 or 1):
        - next_asset: 1 when the row's `asset_id` is greater than `asset_pk`;
            always 0 when `asset_pk` is None.
        - same_project: 1 when the row's `project_slug` equals `project_slug`.
        - same_item: 1 when the row's `item_item_id` equals `item_id`.

    Ordering:
        `-next_asset`, `-same_project`, `-same_item`, then `sequence`
        ascending.

    Args:
        campaign (concordia_models.Campaign): Campaign to filter by.
        user (User): Requesting user.
        project_slug (str): Slug of the user's current project.
        item_id (str): Identifier of the user's current item.
        asset_pk (int | None): Identifier of the current asset, if any.

    Returns:
        QuerySet[concordia_models.NextReviewableCampaignAsset]: Annotated and
            ordered cache rows.
    """
    # Without a reference asset there is nothing to be "after", so the flag
    # is a constant 0.
    if asset_pk is None:
        next_asset_flag = Value(0, output_field=IntegerField())
    else:
        next_asset_flag = Case(
            When(asset_id__gt=asset_pk, then=1),
            default=0,
            output_field=IntegerField(),
        )

    # Rows in the same project or item as the original are favored.
    same_project_flag = Case(
        When(project_slug=project_slug, then=1),
        default=0,
        output_field=IntegerField(),
    )
    same_item_flag = Case(
        When(item_item_id=item_id, then=1),
        default=0,
        output_field=IntegerField(),
    )

    cached_rows = find_next_reviewable_campaign_assets(campaign, user)
    annotated_rows = cached_rows.annotate(
        same_project=same_project_flag,
        same_item=same_item_flag,
        next_asset=next_asset_flag,
    )
    return annotated_rows.order_by(
        "-next_asset", "-same_project", "-same_item", "sequence"
    )


@transaction.atomic
def find_next_reviewable_campaign_asset(
    campaign: concordia_models.Campaign,
    user: User,
    project_slug: str,
    item_id: str,
    original_asset_id: int | None,
) -> "concordia_models.Asset | None":
    """
    Choose the next asset for a user to review within a campaign.

    Strategy (each step runs only if the previous ones returned nothing):
        1. When `item_id` is truthy, ask `_find_reviewable_in_item` for an
           asset in that item, passing the normalized `original_asset_id`.
        2. When `project_slug` is truthy, ask `_find_reviewable_in_project`
           for an asset in that project.
        3. Take the first row of the prioritized cache
           (`find_and_order_potential_reviewable_campaign_assets`) and load
           its asset.
        4. If the cache had no row, rank the result of
           `find_new_reviewable_campaign_assets` with the same flags and
           queue the cache population task.

    Concurrency:
        The cache query and the final Asset query both use
        `select_for_update(skip_locked=True, of=("self",))`.

    Args:
        campaign (concordia_models.Campaign): Campaign to search within.
        user (User): Requesting user.
        project_slug (str): Slug of the user's current project.
        item_id (str): Identifier of the user's current item.
        original_asset_id (int | None): Identifier of the asset just
            reviewed; values that cannot be converted with `int()` are
            treated as None.

    Returns:
        concordia_models.Asset | None: The selected asset, or None when no
            row could be selected.
    """
    # Normalize the reference asset id; falsy or unparsable input means
    # "no reference".
    after_pk = None
    try:
        if original_asset_id:
            after_pk = int(original_asset_id)
    except (TypeError, ValueError):
        pass

    # Short-circuit: same item
    if item_id:
        in_item = _find_reviewable_in_item(
            campaign, user, item_id=item_id, after_asset_pk=after_pk
        )
        if in_item:
            return in_item

    # Short-circuit: same project
    if project_slug:
        in_project = _find_reviewable_in_project(
            campaign, user, project_slug=project_slug, after_asset_pk=after_pk
        )
        if in_project:
            return in_project

    # Cache-backed selection
    ranked_cache_rows = find_and_order_potential_reviewable_campaign_assets(
        campaign, user, project_slug, item_id, after_pk
    )
    cached_asset_id = (
        ranked_cache_rows.select_for_update(skip_locked=True, of=("self",))
        .values_list("asset_id", flat=True)
        .first()
    )
    used_fallback = not cached_asset_id

    if used_fallback:
        # The caching table had no candidate, so the asset table has to be
        # checked directly.
        structured_logger.debug(
            "No cached assets matched, falling back to manual lookup",
            event_code="reviewable_next_fallback_manual",
            campaign=campaign,
            user=user,
        )

        if after_pk is None:
            next_asset_flag = Value(0, output_field=IntegerField())
        else:
            next_asset_flag = Case(
                When(id__gt=after_pk, then=1),
                default=0,
                output_field=IntegerField(),
            )
        same_project_flag = Case(
            When(item__project__slug=project_slug, then=1),
            default=0,
            output_field=IntegerField(),
        )
        same_item_flag = Case(
            When(item__item_id=item_id, then=1),
            default=0,
            output_field=IntegerField(),
        )

        candidates = (
            find_new_reviewable_campaign_assets(campaign, user)
            .annotate(
                same_project=same_project_flag,
                same_item=same_item_flag,
                next_asset=next_asset_flag,
            )
            .order_by("-next_asset", "-same_project", "-same_item", "sequence")
        )
    else:
        candidates = concordia_models.Asset.objects.filter(id=cached_asset_id)

    locked_candidates = candidates.select_for_update(skip_locked=True, of=("self",))
    asset = locked_candidates.select_related("item", "item__project").first()

    if used_fallback:
        # Queue the populate task only after our own query has run; otherwise
        # the task could claim every valid asset first and leave this request
        # with nothing.
        structured_logger.debug(
            "Spawned background task to populate cache",
            event_code="reviewable_next_cache_population",
            campaign=campaign,
            user=user,
        )
        task_name = (
            "concordia.tasks.next_asset.reviewable.populate_next_reviewable_for_campaign"
        )
        get_registered_task(task_name).delay(campaign.id)

    return asset


def find_invalid_next_reviewable_campaign_assets(
    campaign_id: int,
) -> "QuerySet[concordia_models.NextReviewableCampaignAsset]":
    """
    Find cache rows of a campaign that should no longer be offered for review.

    Behavior:
        A NextReviewableCampaignAsset row is returned when its asset's
        transcription status is anything other than `SUBMITTED`, or when its
        asset has a reservation within the campaign. The two sets are OR-ed
        together and de-duplicated.

    Args:
        campaign_id (int): Identifier of the campaign.

    Returns:
        QuerySet[concordia_models.NextReviewableCampaignAsset]: Distinct
            invalid cache rows.
    """
    cache_rows = concordia_models.NextReviewableCampaignAsset.objects

    # Rows whose asset left the SUBMITTED state.
    wrong_status_rows = cache_rows.exclude(
        asset__transcription_status=concordia_models.TranscriptionStatus.SUBMITTED
    ).filter(campaign_id=campaign_id)

    # Rows whose asset is reserved within this campaign.
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__campaign_id=campaign_id
    ).values("asset_id")
    reserved_rows = cache_rows.filter(
        campaign_id=campaign_id, asset_id__in=Subquery(reserved_ids)
    )

    combined = wrong_status_rows | reserved_rows
    return combined.distinct()


================================================
FILE: concordia/utils/next_asset/reviewable/topic.py
================================================
from typing import Dict

from django.contrib.auth.models import User
from django.db import transaction
from django.db.models import Case, IntegerField, Q, QuerySet, Subquery, Value, When

from concordia import models as concordia_models
from concordia.logging import ConcordiaLogger
from concordia.utils.celery import get_registered_task

structured_logger = ConcordiaLogger.get_logger(__name__)


def _reserved_asset_ids_subq() -> "QuerySet[Dict[str, int]]":
    """
    Build a values-queryset of the asset ids of all reservations.

    Behavior:
        Selects `asset_id` from every AssetTranscriptionReservation row. The
        result is intended to be wrapped in `Subquery(...)` and used with
        `exclude(pk__in=...)`. No topic filter is applied, which keeps the
        subquery free of extra joins.

    Returns:
        QuerySet[Dict[str, int]]: Rows shaped as `{"asset_id": <id>}`.
    """
    reservations = concordia_models.AssetTranscriptionReservation.objects
    return reservations.values("asset_id")


def _eligible_reviewable_base_qs(
    topic: concordia_models.Topic,
    user: User | None = None,
) -> "QuerySet[concordia_models.Asset]":
    """
    Return the base set of reviewable assets belonging to a topic.

    Behavior:
        Keeps assets whose project is linked to the topic, whose project,
        item and asset are all published, and whose transcription status is
        `SUBMITTED`. When a user is given, assets with a transcription by
        that user are excluded.

    Args:
        topic (concordia_models.Topic): Topic scope for filtering.
        user (User | None): Optional user whose transcribed assets are
            excluded.

    Returns:
        QuerySet[concordia_models.Asset]: Matching assets with `item` and
            `item__project` joined through `select_related`.
    """
    reviewable = concordia_models.Asset.objects.filter(
        item__project__topics=topic.id,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status=concordia_models.TranscriptionStatus.SUBMITTED,
    ).select_related("item", "item__project")

    if not user:
        return reviewable
    return reviewable.exclude(transcription__user=user.id)


def _next_seq_after(pk: int | None) -> int | None:
    """
    Resolve the sequence number for a given asset primary key.

    Behavior:
        Convenience utility for ordering logic when advancing within a series
        of assets.

    Args:
        pk (int | None): Asset primary key whose sequence to resolve.

    Returns:
        int | None: The asset's sequence number, or None if `pk` is falsy
            or the asset does not exist.
    """
    if not pk:
        return None
    return (
        concordia_models.Asset.objects.filter(pk=pk)
        .values_list("sequence", flat=True)
        .first()
    )


@transaction.atomic
def _find_reviewable_in_item(
    topic: concordia_models.Topic,
    user: User,
    *,
    item_id: str,
    after_asset_pk: int | None,
) -> "concordia_models.Asset | None":
    """
    Pick the next reviewable asset that lives in the given item.

    Behavior:
        Same-item short-circuit used to keep a reviewer moving through one
        item in order.

    Eligibility:
        - The item's project is linked to `topic`.
        - Asset, item and project are published.
        - Asset transcription status is `SUBMITTED`.
        - Asset has no reservation (among reservations for this item and
          topic).
        - Asset has no transcription by `user`.

    Ordering:
        - When `after_asset_pk` names an existing asset that belongs to this
          item and whose project is linked to `topic`, only assets whose
          (sequence, id) pair is strictly greater than that asset's pair are
          considered.
        - In every other case all eligible assets are considered.
        - The first row by (sequence, id) is returned.

    Args:
        topic (concordia_models.Topic): Topic scope.
        user (User): Current user; their own transcriptions are excluded.
        item_id (str): Identifier of the item to stay within.
        after_asset_pk (int | None): Primary key of the asset to advance
            from, if any.

    Returns:
        concordia_models.Asset | None: The selected asset, fetched with
            `select_for_update(skip_locked=True, of=("self",))`, or None
            when nothing matches.
    """
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__item__item_id=item_id,
        asset__item__project__topics=topic,
    ).values("asset_id")

    candidates = concordia_models.Asset.objects.filter(
        item__item_id=item_id,
        item__project__topics=topic,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status=concordia_models.TranscriptionStatus.SUBMITTED,
    )
    candidates = candidates.exclude(pk__in=Subquery(reserved_ids))
    candidates = candidates.exclude(transcription__user=user.id)

    # Only advance past the reference asset when it really is part of this
    # item and topic; a missing reference asset is silently ignored.
    advance_filter = None
    if after_asset_pk is not None:
        try:
            reference = (
                concordia_models.Asset.objects.only("id", "sequence", "item_id", "item")
                .select_related("item", "item__project")
                .get(pk=after_asset_pk)
            )
            in_same_item = reference.item.item_id == item_id
            if (
                in_same_item
                and reference.item.project.topics.filter(pk=topic.pk).exists()
            ):
                # Strictly greater (sequence, id) pair than the reference.
                advance_filter = Q(sequence__gt=reference.sequence) | Q(
                    sequence=reference.sequence, id__gt=after_asset_pk
                )
        except concordia_models.Asset.DoesNotExist:
            pass

    if advance_filter is not None:
        candidates = candidates.filter(advance_filter)

    chosen = (
        candidates.order_by("sequence", "id")
        .select_related("item", "item__project")
        .select_for_update(skip_locked=True, of=("self",))
        .first()
    )

    structured_logger.debug(
        "Item short-circuit (topic reviewable) resolved.",
        event_code="reviewable_item_short_circuit_topic",
        topic=topic,
        item_id=item_id,
        after_asset_pk=after_asset_pk,
        chosen_asset_id=getattr(chosen, "id", None),
    )
    return chosen


@transaction.atomic
def _find_reviewable_in_project(
    topic: concordia_models.Topic,
    user: User,
    *,
    project_slug: str,
    after_asset_pk: int | None,
) -> "concordia_models.Asset | None":
    """
    Pick the first eligible reviewable asset inside the given project.

    Behavior:
        Same-project short-circuit. The first eligible asset of the project
        is returned; `after_asset_pk` does not influence the choice.

    Eligibility:
        - The project has slug `project_slug` and is linked to `topic`.
        - Asset, item and project are published.
        - Asset transcription status is `SUBMITTED`.
        - Asset has no reservation (among reservations for this project and
          topic).
        - Asset has no transcription by `user`.

    Ordering:
        (item__item_id, sequence, id), ascending.

    Args:
        topic (concordia_models.Topic): Topic scope.
        user (User): Current user; their own transcriptions are excluded.
        project_slug (str): Slug of the project to stay within.
        after_asset_pk (int | None): Only included in the debug log entry.

    Returns:
        concordia_models.Asset | None: The selected asset, fetched with
            `select_for_update(skip_locked=True, of=("self",))`, or None
            when nothing matches.
    """
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__item__project__slug=project_slug,
        asset__item__project__topics=topic,
    ).values("asset_id")

    candidates = concordia_models.Asset.objects.filter(
        item__project__topics=topic,
        item__project__slug=project_slug,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status=concordia_models.TranscriptionStatus.SUBMITTED,
    )
    candidates = candidates.exclude(pk__in=Subquery(reserved_ids))
    candidates = candidates.exclude(transcription__user=user.id)

    chosen = (
        candidates.order_by("item__item_id", "sequence", "id")
        .select_related("item", "item__project")
        .select_for_update(skip_locked=True, of=("self",))
        .first()
    )

    structured_logger.debug(
        "Project short-circuit (topic reviewable) resolved.",
        event_code="reviewable_project_short_circuit_topic",
        topic=topic,
        project_slug=project_slug,
        after_asset_pk=after_asset_pk,
        chosen_asset_id=getattr(chosen, "id", None),
    )
    return chosen


def find_new_reviewable_topic_assets(
    topic: concordia_models.Topic,
    user: User | None = None,
) -> "QuerySet[concordia_models.Asset]":
    """
    Build the queryset of topic assets that may be added to the cache.

    Behavior:
        Starts from published assets (with published item and project) whose
        project is linked to the topic and whose transcription status is
        `SUBMITTED`, then removes assets that have any reservation and assets
        that already have a `NextReviewableTopicAsset` row for this topic.
        When a user is supplied, assets with a transcription by that user
        are removed as well.

    Args:
        topic (concordia_models.Topic): Topic whose assets are considered.
        user (User | None): Optional user whose transcribed assets are
            excluded.

    Returns:
        QuerySet[concordia_models.Asset]: Candidate assets ordered by
            `sequence`.
    """
    # The reservation ids are deliberately not narrowed to the topic: doing
    # so would need asset -> item -> project -> topic joins, which in most
    # cases costs more than simply reading every reserved id.
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )
    # Asset ids that are already present in this topic's cache table.
    cached_ids = concordia_models.NextReviewableTopicAsset.objects.filter(
        topic=topic
    ).values("asset_id")

    candidates = concordia_models.Asset.objects.filter(
        item__project__topics=topic.id,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status=concordia_models.TranscriptionStatus.SUBMITTED,
    )
    candidates = candidates.exclude(pk__in=Subquery(reserved_ids))
    candidates = candidates.exclude(pk__in=Subquery(cached_ids))
    candidates = candidates.order_by("sequence")

    if not user:
        return candidates
    return candidates.exclude(transcription__user=user.id)


def find_next_reviewable_topic_assets(
    topic: concordia_models.Topic,
    user: User,
) -> "QuerySet[concordia_models.NextReviewableTopicAsset]":
    """
    List the topic's cached reviewable rows that the user may review.

    Behavior:
        Selects `NextReviewableTopicAsset` rows for the topic and drops every
        row whose `transcriber_ids` contains the user's id.

    Args:
        topic (concordia_models.Topic): Topic whose cache rows are read.
        user (User): Requesting user.

    Returns:
        QuerySet[concordia_models.NextReviewableTopicAsset]: Cache rows
            usable by this user.
    """
    topic_rows = concordia_models.NextReviewableTopicAsset.objects.filter(
        topic=topic
    )
    return topic_rows.exclude(transcriber_ids__contains=[user.id])


@transaction.atomic
def find_reviewable_topic_asset(
    topic: concordia_models.Topic,
    user: User,
) -> "concordia_models.Asset | None":
    """
    Pick one asset in a topic for the given user to review.

    Behavior:
        Looks for a usable row in the `NextReviewableTopicAsset` cache first
        and loads the Asset it points at. When the cache yields nothing, the
        Asset table is queried directly through
        `find_new_reviewable_topic_assets` and the cache population task is
        queued once that query has run.

    Concurrency:
        Both the cache lookup and the Asset lookup use
        `select_for_update(skip_locked=True, of=("self",))`, so each query
        locks only rows of the table it selects from and passes over rows
        that are already locked.

    Args:
        topic (concordia_models.Topic): Topic to search within.
        user (User): Requesting user; assets they transcribed are excluded.

    Returns:
        concordia_models.Asset | None: The selected asset with `item` and
            `item__project` loaded, or None when no row could be selected.
    """
    cached_asset_id = (
        find_next_reviewable_topic_assets(topic, user)
        .select_for_update(skip_locked=True, of=("self",))
        .values_list("asset_id", flat=True)
        .first()
    )
    used_fallback = not cached_asset_id

    if used_fallback:
        # Nothing usable in the NextReviewableTopicAsset table for this
        # topic, so look the asset up directly.
        structured_logger.debug(
            "No cached assets available, falling back to manual lookup",
            event_code="reviewable_fallback_manual_lookup",
            topic=topic,
            user=user,
        )
        candidates = find_new_reviewable_topic_assets(topic, user)
    else:
        candidates = concordia_models.Asset.objects.filter(id=cached_asset_id)

    # of=("self",) restricts the row lock to the Asset table instead of also
    # locking the joined item/project rows.
    locked_candidates = candidates.select_for_update(skip_locked=True, of=("self",))
    asset = locked_candidates.select_related("item", "item__project").first()

    if used_fallback:
        # Queue the populate task only after our own query has run; otherwise
        # the task could claim every valid asset first and leave this request
        # with nothing.
        structured_logger.debug(
            "Spawned background task to populate cache",
            event_code="reviewable_cache_population_triggered",
            topic=topic,
            user=user,
        )
        task_name = (
            "concordia.tasks.next_asset.reviewable.populate_next_reviewable_for_topic"
        )
        get_registered_task(task_name).delay(topic.id)

    return asset


def find_and_order_potential_reviewable_topic_assets(
    topic: concordia_models.Topic,
    user: User,
    project_slug: str,
    item_id: str,
    asset_pk: int | None,
) -> "QuerySet[concordia_models.NextReviewableTopicAsset]":
    """
    Rank the user's cached reviewable rows by closeness to their position.

    Behavior:
        Takes the rows returned by `find_next_reviewable_topic_assets` and
        annotates each with three integer flags, then sorts on them.

    Annotations (each 0 or 1):
        - next_asset: 1 when the row's `asset_id` is greater than `asset_pk`;
            always 0 when `asset_pk` is None.
        - same_project: 1 when the row's `project_slug` equals `project_slug`.
        - same_item: 1 when the row's `item_item_id` equals `item_id`.

    Ordering:
        `-next_asset`, `-same_project`, `-same_item`, then `sequence`
        ascending.

    Args:
        topic (concordia_models.Topic): Topic to filter by.
        user (User): Requesting user.
        project_slug (str): Slug of the user's current project.
        item_id (str): Identifier of the user's current item.
        asset_pk (int | None): Identifier of the current asset, if any.

    Returns:
        QuerySet[concordia_models.NextReviewableTopicAsset]: Annotated and
            ordered cache rows.
    """
    # Without a reference asset there is nothing to be "after", so the flag
    # is a constant 0.
    if asset_pk is None:
        next_asset_flag = Value(0, output_field=IntegerField())
    else:
        next_asset_flag = Case(
            When(asset_id__gt=asset_pk, then=1),
            default=0,
            output_field=IntegerField(),
        )

    # Rows in the same project or item as the original are favored.
    same_project_flag = Case(
        When(project_slug=project_slug, then=1),
        default=0,
        output_field=IntegerField(),
    )
    same_item_flag = Case(
        When(item_item_id=item_id, then=1),
        default=0,
        output_field=IntegerField(),
    )

    cached_rows = find_next_reviewable_topic_assets(topic, user)
    annotated_rows = cached_rows.annotate(
        same_project=same_project_flag,
        same_item=same_item_flag,
        next_asset=next_asset_flag,
    )
    return annotated_rows.order_by(
        "-next_asset", "-same_project", "-same_item", "sequence"
    )


@transaction.atomic
def find_next_reviewable_topic_asset(
    topic: concordia_models.Topic,
    user: User,
    project_slug: str,
    item_id: str,
    original_asset_id: int | None,
) -> "concordia_models.Asset | None":
    """
    Choose the next asset for a user to review within a topic.

    Strategy (each step runs only if the previous ones returned nothing):
        1. When `item_id` is truthy, ask `_find_reviewable_in_item` for an
           asset in that item, advancing past `original_asset_id` by
           (sequence, id) where applicable.
        2. When `project_slug` is truthy, ask `_find_reviewable_in_project`
           for the first eligible asset in that project.
        3. Take the first row of the prioritized cache
           (`find_and_order_potential_reviewable_topic_assets`) and load its
           asset.
        4. If the cache had no row, rank the result of
           `find_new_reviewable_topic_assets` with the same flags and queue
           the cache population task.

    Concurrency:
        The cache query and the final Asset query both use
        `select_for_update(skip_locked=True, of=("self",))`.

    Args:
        topic (concordia_models.Topic): Topic to search within.
        user (User): Requesting user.
        project_slug (str): Slug of the user's current project.
        item_id (str): Identifier of the user's current item.
        original_asset_id (int | None): Identifier of the asset just
            reviewed; values that cannot be converted with `int()` are
            treated as None.

    Returns:
        concordia_models.Asset | None: The selected asset, or None when no
            row could be selected.
    """
    # Normalize the reference asset id; falsy or unparsable input means
    # "no reference".
    after_pk = None
    try:
        if original_asset_id:
            after_pk = int(original_asset_id)
    except (TypeError, ValueError):
        pass

    # Short-circuit: same item
    if item_id:
        in_item = _find_reviewable_in_item(
            topic, user, item_id=item_id, after_asset_pk=after_pk
        )
        if in_item:
            return in_item

    # Short-circuit: same project
    if project_slug:
        in_project = _find_reviewable_in_project(
            topic, user, project_slug=project_slug, after_asset_pk=after_pk
        )
        if in_project:
            return in_project

    # Cache-backed selection
    ranked_cache_rows = find_and_order_potential_reviewable_topic_assets(
        topic, user, project_slug, item_id, after_pk
    )
    cached_asset_id = (
        ranked_cache_rows.select_for_update(skip_locked=True, of=("self",))
        .values_list("asset_id", flat=True)
        .first()
    )
    used_fallback = not cached_asset_id

    if used_fallback:
        # The caching table had no candidate, so the asset table has to be
        # checked directly.
        structured_logger.debug(
            "No cached assets matched, falling back to manual lookup",
            event_code="reviewable_next_fallback_manual",
            topic=topic,
            user=user,
        )

        if after_pk is None:
            next_asset_flag = Value(0, output_field=IntegerField())
        else:
            next_asset_flag = Case(
                When(id__gt=after_pk, then=1),
                default=0,
                output_field=IntegerField(),
            )
        same_project_flag = Case(
            When(item__project__slug=project_slug, then=1),
            default=0,
            output_field=IntegerField(),
        )
        same_item_flag = Case(
            When(item__item_id=item_id, then=1),
            default=0,
            output_field=IntegerField(),
        )

        candidates = (
            find_new_reviewable_topic_assets(topic, user)
            .annotate(
                same_project=same_project_flag,
                same_item=same_item_flag,
                next_asset=next_asset_flag,
            )
            .order_by("-next_asset", "-same_project", "-same_item", "sequence")
        )
    else:
        candidates = concordia_models.Asset.objects.filter(id=cached_asset_id)

    locked_candidates = candidates.select_for_update(skip_locked=True, of=("self",))
    asset = locked_candidates.select_related("item", "item__project").first()

    if used_fallback:
        # Queue the populate task only after our own query has run; otherwise
        # the task could claim every valid asset first and leave this request
        # with nothing.
        structured_logger.debug(
            "Spawned background task to populate cache",
            event_code="reviewable_next_cache_population",
            topic=topic,
            user=user,
        )
        task_name = (
            "concordia.tasks.next_asset.reviewable.populate_next_reviewable_for_topic"
        )
        get_registered_task(task_name).delay(topic.id)

    return asset


def find_invalid_next_reviewable_topic_assets(
    topic_id: int,
) -> "QuerySet[concordia_models.NextReviewableTopicAsset]":
    """
    Find cached reviewable rows for a topic that should no longer be served.

    Behavior:
        A `NextReviewableTopicAsset` row for the topic is treated as invalid
        when its asset's transcription status is anything other than
        `SUBMITTED`, or when its asset has an
        `AssetTranscriptionReservation` row.

    Args:
        topic_id (int): Identifier of the topic.

    Returns:
        QuerySet[concordia_models.NextReviewableTopicAsset]: Distinct invalid
            cache rows.
    """
    cache_rows = concordia_models.NextReviewableTopicAsset.objects
    submitted = concordia_models.TranscriptionStatus.SUBMITTED

    # Reservations held on assets whose project belongs to this topic.
    topic_reservations = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__item__project__topics=topic_id
    )

    # Cache rows whose asset has left the SUBMITTED state.
    wrong_status_rows = cache_rows.exclude(
        asset__transcription_status=submitted
    ).filter(topic_id=topic_id)

    # Cache rows whose asset is reserved.
    reserved_rows = cache_rows.filter(
        topic_id=topic_id,
        asset_id__in=Subquery(topic_reservations.values("asset_id")),
    )

    # OR-ing the querysets can yield duplicate rows, hence distinct().
    return (wrong_status_rows | reserved_rows).distinct()


================================================
FILE: concordia/utils/next_asset/transcribable/__init__.py
================================================
from .campaign import (
    find_and_order_potential_transcribable_campaign_assets,
    find_invalid_next_transcribable_campaign_assets,
    find_new_transcribable_campaign_assets,
    find_next_transcribable_campaign_asset,
    find_next_transcribable_campaign_assets,
    find_transcribable_campaign_asset,
)
from .topic import (
    find_and_order_potential_transcribable_topic_assets,
    find_invalid_next_transcribable_topic_assets,
    find_new_transcribable_topic_assets,
    find_next_transcribable_topic_asset,
    find_next_transcribable_topic_assets,
    find_transcribable_topic_asset,
)

# Public API of this package: exactly the names imported above from the
# `.campaign` and `.topic` submodules.
__all__ = [
    "find_new_transcribable_campaign_assets",
    "find_next_transcribable_campaign_assets",
    "find_transcribable_campaign_asset",
    "find_and_order_potential_transcribable_campaign_assets",
    "find_next_transcribable_campaign_asset",
    "find_and_order_potential_transcribable_topic_assets",
    "find_new_transcribable_topic_assets",
    "find_next_transcribable_topic_asset",
    "find_next_transcribable_topic_assets",
    "find_transcribable_topic_asset",
    "find_invalid_next_transcribable_campaign_assets",
    "find_invalid_next_transcribable_topic_assets",
]


================================================
FILE: concordia/utils/next_asset/transcribable/campaign.py
================================================
from typing import Dict

from django.db import transaction
from django.db.models import Case, IntegerField, Q, QuerySet, Subquery, When

from concordia import models as concordia_models
from concordia.logging import ConcordiaLogger
from concordia.utils.celery import get_registered_task

# Module-level structured logger, named after this module (`__name__`).
structured_logger = ConcordiaLogger.get_logger(__name__)


def _reserved_asset_ids_subq(
    campaign: concordia_models.Campaign,
) -> "QuerySet[Dict[str, int]]":
    """
    Build the queryset of reserved asset ids within a campaign.

    Behavior:
        Selects the `asset_id` of every `AssetTranscriptionReservation` whose
        asset belongs to `campaign`. The result is meant to be wrapped in
        `Subquery(...)` and used in `pk__in` filters or excludes.

    Args:
        campaign (concordia_models.Campaign): Campaign whose reservations
            should be collected.

    Returns:
        QuerySet[Dict[str, int]]: A values queryset whose rows carry a single
            "asset_id" key.
    """
    campaign_reservations = (
        concordia_models.AssetTranscriptionReservation.objects.filter(
            asset__campaign=campaign
        )
    )
    return campaign_reservations.values("asset_id")


def _eligible_transcribable_base_qs(
    campaign: concordia_models.Campaign,
) -> "QuerySet[concordia_models.Asset]":
    """
    Return the campaign's published assets that can still be transcribed.

    Behavior:
        Keeps assets of the campaign whose project, item, and the asset itself
        are published, and whose transcription status is `NOT_STARTED` or
        `IN_PROGRESS`.

    Args:
        campaign (concordia_models.Campaign): Campaign scope for filtering.

    Returns:
        QuerySet[concordia_models.Asset]: Matching assets with `item` and
            `item__project` joined through `select_related`.
    """
    transcribable_statuses = [
        concordia_models.TranscriptionStatus.NOT_STARTED,
        concordia_models.TranscriptionStatus.IN_PROGRESS,
    ]
    transcribable_assets = concordia_models.Asset.objects.filter(
        campaign_id=campaign.id,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status__in=transcribable_statuses,
    )
    return transcribable_assets.select_related("item", "item__project")


def _next_seq_after(pk: int | None) -> int | None:
    """
    Resolve the sequence number for a given asset primary key.

    Behavior:
        Convenience utility for ordering logic when advancing within a series
        of assets.

    Args:
        pk (int | None): Asset primary key whose sequence to resolve.

    Returns:
        int | None: The asset's sequence number, or None if `pk` is falsy
            or the asset does not exist.
    """
    if not pk:
        return None
    return (
        concordia_models.Asset.objects.filter(pk=pk)
        .values_list("sequence", flat=True)
        .first()
    )


def _order_unstarted_first(
    qs: "QuerySet[concordia_models.Asset]",
) -> "QuerySet[concordia_models.Asset]":
    """
    Order a queryset so `NOT_STARTED` assets come first, then by `sequence`.

    Args:
        qs (QuerySet[concordia_models.Asset]): Base queryset to annotate and sort.

    Returns:
        QuerySet[concordia_models.Asset]: The queryset annotated with a
            transient `unstarted` field (1 for `NOT_STARTED`, else 0) and
            ordered by `-unstarted`, `sequence`.
    """
    not_started = concordia_models.TranscriptionStatus.NOT_STARTED
    unstarted_flag = Case(
        When(transcription_status=not_started, then=1),
        default=0,
        output_field=IntegerField(),
    )
    flagged = qs.annotate(unstarted=unstarted_flag)
    return flagged.order_by("-unstarted", "sequence")


@transaction.atomic
def _find_transcribable_in_item(
    campaign: concordia_models.Campaign,
    *,
    item_id: str,
    after_asset_pk: int | None,
) -> "concordia_models.Asset | None":
    """
    Fast path: pick the next `NOT_STARTED` asset inside a single item.

    Behavior:
        - Returns None immediately when `item_id` is falsy.
        - Only considers assets of `campaign` within the given item whose
          project, item, and asset are all published.
        - Skips any asset that has an `AssetTranscriptionReservation` row.
        - When `after_asset_pk` is given and its sequence can be resolved,
          only assets later in `(sequence, id)` order are considered; if the
          sequence cannot be resolved, that asset is simply excluded.
        - Only `NOT_STARTED` assets are returned (`IN_PROGRESS` is left to
          later fallbacks).

    Args:
        campaign (concordia_models.Campaign): Campaign scope.
        item_id (str): Identifier of the item to stay within.
        after_asset_pk (int | None): Asset primary key to advance from.

    Returns:
        concordia_models.Asset | None: The next eligible asset, or None if none.
    """
    if not item_id:
        return None

    # Sequence of the asset we advance from; None when the pk is falsy or the
    # asset no longer exists.
    cur_seq = _next_seq_after(after_asset_pk)

    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )
    item_assets = concordia_models.Asset.objects.filter(
        campaign_id=campaign.id,
        item__item_id=item_id,
        item__project__published=True,
        item__published=True,
        published=True,
    )
    candidates = item_assets.exclude(pk__in=Subquery(reserved_ids))

    if after_asset_pk and cur_seq is None:
        # Unknown position: the best we can do is not hand back the same asset.
        candidates = candidates.exclude(id=after_asset_pk)
    elif after_asset_pk:
        # Strictly after the current asset in (sequence, id) order.
        later_sequence = Q(sequence__gt=cur_seq)
        same_sequence_later_id = Q(sequence=cur_seq) & Q(id__gt=after_asset_pk)
        candidates = candidates.filter(later_sequence | same_sequence_later_id)

    # ONLY NOT_STARTED in this short-circuit
    not_started = candidates.filter(
        transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED
    )
    return not_started.order_by("sequence", "id").first()


def _find_transcribable_not_started_in_project(
    campaign: concordia_models.Campaign,
    *,
    project_slug: str,
    exclude_item_id: str | None = None,
) -> "concordia_models.Asset | None":
    """
    Fast path: pick the first `NOT_STARTED` asset inside a single project.

    Behavior:
        Returns None immediately when `project_slug` is falsy. Otherwise
        searches published, unreserved `NOT_STARTED` assets of the campaign in
        that project, optionally leaving out one item, and returns the first
        one ordered by `(item__item_id, sequence, id)`.

    Args:
        campaign (concordia_models.Campaign): Campaign scope.
        project_slug (str): Slug of the project to stay within.
        exclude_item_id (str | None): If provided, exclude this item.

    Returns:
        concordia_models.Asset | None: The first eligible asset, or None if none.
    """
    if not project_slug:
        return None

    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )
    not_started = concordia_models.TranscriptionStatus.NOT_STARTED

    project_assets = concordia_models.Asset.objects.filter(
        transcription_status=not_started,
        published=True,
        item__published=True,
        item__project__published=True,
        item__project__slug=project_slug,
        campaign_id=campaign.id,
    )
    candidates = project_assets.exclude(pk__in=Subquery(reserved_ids))

    if exclude_item_id:
        # Leave out the given item so the caller is moved to a different one.
        candidates = candidates.exclude(item__item_id=exclude_item_id)

    return candidates.order_by("item__item_id", "sequence", "id").first()


def find_new_transcribable_campaign_assets(
    campaign: concordia_models.Campaign,
) -> "QuerySet[concordia_models.Asset]":
    """
    Return campaign assets that could be added to the transcribable cache.

    Behavior:
        Starts from the campaign's assets whose project, item, and asset are
        published, keeps those that are `NOT_STARTED` or `IN_PROGRESS`, and
        drops assets that are reserved or that already have a
        `NextTranscribableCampaignAsset` row for this campaign.

    Args:
        campaign (concordia_models.Campaign): Campaign to filter by.

    Returns:
        QuerySet[concordia_models.Asset]: Eligible assets ordered by `sequence`.
    """
    statuses = concordia_models.TranscriptionStatus
    not_started_or_in_progress = Q(transcription_status=statuses.NOT_STARTED) | Q(
        transcription_status=statuses.IN_PROGRESS
    )

    # Asset ids to leave out: currently reserved, or already in the cache table.
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__campaign=campaign
    ).values("asset_id")
    cached_ids = concordia_models.NextTranscribableCampaignAsset.objects.filter(
        campaign=campaign
    ).values("asset_id")

    published_assets = concordia_models.Asset.objects.filter(
        campaign_id=campaign.id,
        item__project__published=True,
        item__published=True,
        published=True,
    )
    candidates = published_assets.filter(not_started_or_in_progress)
    candidates = candidates.exclude(pk__in=Subquery(reserved_ids))
    candidates = candidates.exclude(pk__in=Subquery(cached_ids))
    return candidates.order_by("sequence")


def find_next_transcribable_campaign_assets(
    campaign: concordia_models.Campaign,
) -> "QuerySet[concordia_models.NextTranscribableCampaignAsset]":
    """
    Return every cached transcribable candidate for a campaign.

    Behavior:
        Filters the `NextTranscribableCampaignAsset` cache table down to the
        rows belonging to `campaign`; no ordering is applied.

    Args:
        campaign (concordia_models.Campaign): Campaign to retrieve cached assets for.

    Returns:
        QuerySet[concordia_models.NextTranscribableCampaignAsset]: Cached candidates.
    """
    cache_rows = concordia_models.NextTranscribableCampaignAsset.objects
    return cache_rows.filter(campaign=campaign)


@transaction.atomic
def find_transcribable_campaign_asset(
    campaign: concordia_models.Campaign,
) -> "concordia_models.Asset | None":
    """
    Pick one transcribable asset from a campaign.

    Behavior:
        Tries the `NextTranscribableCampaignAsset` cache first. On a cache
        miss it queries `Asset` directly through
        `find_new_transcribable_campaign_assets` and, once the asset has been
        fetched, queues the background task that repopulates the cache.

    Concurrency:
        Runs inside `transaction.atomic`. Both the cache lookup and the asset
        lookup use `select_for_update(skip_locked=True, of=("self",))`, so
        only the queried table's row is locked and rows locked by concurrent
        consumers are skipped.

    Args:
        campaign (concordia_models.Campaign): Campaign to search within.

    Returns:
        concordia_models.Asset | None: A locked eligible asset, or None if
            unavailable.
    """
    cached_rows = find_next_transcribable_campaign_assets(campaign)
    cached_asset_id = (
        cached_rows.select_for_update(skip_locked=True, of=("self",))
        .values_list("asset_id", flat=True)
        .first()
    )

    cache_miss = not cached_asset_id
    if cache_miss:
        # Nothing usable in the NextTranscribableCampaignAsset table for this
        # campaign, so fall back to finding an asset manually.
        structured_logger.debug(
            "No cached assets available, falling back to manual lookup",
            event_code="transcribable_fallback_manual_lookup",
            campaign=campaign,
        )
        asset_query = find_new_transcribable_campaign_assets(campaign)
    else:
        asset_query = concordia_models.Asset.objects.filter(id=cached_asset_id)

    # of=("self",) restricts row locking to the Asset table instead of also
    # locking the joined item/project rows.
    locked_query = asset_query.select_for_update(skip_locked=True, of=("self",))
    asset = locked_query.select_related("item", "item__project").first()

    if cache_miss:
        # Queue cache population for this campaign only after we have our own
        # asset; otherwise the task could grab every valid asset first and
        # leave the query above with nothing to return.
        structured_logger.debug(
            "Spawned background task to populate cache",
            event_code="transcribable_cache_population_triggered",
            campaign=campaign,
        )
        populate_task = get_registered_task(
            "concordia.tasks.next_asset.transcribable.populate_next_transcribable_for_campaign"
        )
        populate_task.delay(campaign.id)

    return asset


def find_and_order_potential_transcribable_campaign_assets(
    campaign: concordia_models.Campaign,
    project_slug: str,
    item_id: str,
    asset_pk: int,
) -> "QuerySet[concordia_models.NextTranscribableCampaignAsset]":
    """
    Rank a campaign's cached transcribable candidates by status and proximity.

    Behavior:
        Reads the campaign's rows from `NextTranscribableCampaignAsset` and
        orders them to prefer, in this order:
        - `NOT_STARTED` over any other status (via the `unstarted` flag),
        - rows in the same project,
        - rows in the same item,
        and finally by `sequence` and `asset_id`.

    Annotations added to each row (transient fields):
        - unstarted (int): 1 if transcription status is `NOT_STARTED`, else 0.
        - same_project (int): 1 if the candidate shares `project_slug`, else 0.
        - same_item (int): 1 if the candidate shares `item_id`, else 0.

    Args:
        campaign (concordia_models.Campaign): Campaign to filter by.
        project_slug (str): Slug of the original asset's project.
        item_id (str): Item identifier of the original asset.
        asset_pk (int): Primary key of the original asset. Accepted for
            interface compatibility; this function does not read it.

    Returns:
        QuerySet[concordia_models.NextTranscribableCampaignAsset]: Prioritized
            cached candidates.
    """
    not_started = concordia_models.TranscriptionStatus.NOT_STARTED

    def flag(condition):
        # 1 when `condition` matches the row, otherwise 0.
        return Case(condition, default=0, output_field=IntegerField())

    ranked = find_next_transcribable_campaign_assets(campaign).annotate(
        unstarted=flag(When(transcription_status=not_started, then=1)),
        same_project=flag(When(project_slug=project_slug, then=1)),
        same_item=flag(When(item_item_id=item_id, then=1)),
    )
    ordering = ("-unstarted", "-same_project", "-same_item", "sequence", "asset_id")
    return ranked.order_by(*ordering)


def _lock_first_asset(
    asset_query: "QuerySet[concordia_models.Asset]",
) -> "concordia_models.Asset | None":
    """
    Lock and fetch the first row of an `Asset` queryset.

    Behavior:
        Adds `select_for_update(skip_locked=True, of=("self",))` so that only
        the `Asset` row is locked and rows locked by other transactions are
        skipped, joins `item` and `item__project`, and returns the first row
        according to the queryset's existing ordering.

    Args:
        asset_query (QuerySet[concordia_models.Asset]): Candidate assets,
            already filtered and ordered by the caller.

    Returns:
        concordia_models.Asset | None: The first lockable asset, or None.
    """
    return (
        asset_query.select_for_update(skip_locked=True, of=("self",))
        .select_related("item", "item__project")
        .first()
    )


def _same_item_candidates(
    campaign: concordia_models.Campaign,
    *,
    item_id: str,
    status,
    reserved_asset_ids: "QuerySet[Dict[str, int]]",
    original_pk: int | None,
    after_seq: int | None,
) -> "QuerySet[concordia_models.Asset]":
    """
    Build the ordered same-item candidate queryset for one transcription status.

    Behavior:
        Selects published, unreserved assets of `campaign` in the given item
        that have exactly `status`, leaves out the original asset when known,
        and, when `after_seq` is known, keeps only assets strictly after the
        original in `(sequence, id)` order. Results are ordered by
        `(sequence, id)`.

    Args:
        campaign (concordia_models.Campaign): Campaign scope.
        item_id (str): Identifier of the item to stay within.
        status: `TranscriptionStatus` value the candidates must have.
        reserved_asset_ids (QuerySet[Dict[str, int]]): Values queryset of
            reserved "asset_id"s to exclude.
        original_pk (int | None): Primary key of the original asset.
        after_seq (int | None): Sequence of the original asset; callers only
            set it when `original_pk` is also set.

    Returns:
        QuerySet[concordia_models.Asset]: Ordered candidates (not yet locked).
    """
    qs = concordia_models.Asset.objects.filter(
        campaign_id=campaign.id,
        item__item_id=item_id,
        item__published=True,
        item__project__published=True,
        published=True,
        transcription_status=status,
    ).exclude(pk__in=Subquery(reserved_asset_ids))
    if original_pk is not None:
        qs = qs.exclude(pk=original_pk)
    if after_seq is not None:
        qs = qs.filter(
            Q(sequence__gt=after_seq)
            | (Q(sequence=after_seq) & Q(id__gt=original_pk))
        )
    return qs.order_by("sequence", "id")


@transaction.atomic
def find_next_transcribable_campaign_asset(
    campaign: concordia_models.Campaign,
    project_slug: str,
    item_id: str,
    original_asset_id: int | None,
) -> "concordia_models.Asset | None":
    """
    Retrieve the next best transcribable asset within a campaign.

    Priority for short-circuit selection (before cache and fallback):
        1) If `item_id` is provided, return the next `NOT_STARTED` asset in
           that item by sequence (strictly after the original asset when the
           original belongs to that item).
        2) If `project_slug` is provided, return the first `NOT_STARTED` asset
           in that project (ordered by item id, then sequence), excluding the
           current item to keep moving forward.

    If none of the above match, fall back to the cache-backed path:
        Attempts to retrieve a candidate from `NextTranscribableCampaignAsset`
        (never the original asset or the current item). If none is found,
        computes one from `Asset` with the same exclusions and, when that
        finds an asset, triggers cache population. Both of these paths order
        `NOT_STARTED` first but may return assets in other eligible statuses.

    After exhausting those options, consider `IN_PROGRESS` assets in the
    same item (strictly after the original when known).

    Concurrency:
        Runs inside `transaction.atomic` and uses
        `select_for_update(skip_locked=True, of=("self",))` to avoid
        double-assignments across concurrent consumers.

    Args:
        campaign (concordia_models.Campaign): Campaign to search within.
        project_slug (str): Slug of the current project.
        item_id (str): Identifier of the current item.
        original_asset_id (int | None): Identifier of the asset just
            transcribed. Values that cannot be converted to `int` are treated
            as None.

    Returns:
        concordia_models.Asset | None: A locked eligible asset, or None if
            unavailable.
    """
    # Normalize original_asset_id for safe use in filters/comparisons
    try:
        original_pk = int(original_asset_id) if original_asset_id is not None else None
    except (TypeError, ValueError):
        original_pk = None

    # Resolve "after sequence" only when the original asset belongs to the same item.
    after_seq = None
    if item_id and original_pk is not None:
        try:
            orig = (
                concordia_models.Asset.objects.select_related("item")
                .only("id", "sequence", "item__item_id")
                .get(pk=original_pk)
            )
            if getattr(orig.item, "item_id", None) == item_id:
                after_seq = orig.sequence
        except concordia_models.Asset.DoesNotExist:
            after_seq = None

    # Not scoped to the campaign: any reserved asset id is excluded.
    reserved_asset_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )

    # Short-circuit: same item and NOT_STARTED after current sequence
    if item_id:
        asset = _lock_first_asset(
            _same_item_candidates(
                campaign,
                item_id=item_id,
                status=concordia_models.TranscriptionStatus.NOT_STARTED,
                reserved_asset_ids=reserved_asset_ids,
                original_pk=original_pk,
                after_seq=after_seq,
            )
        )
        if asset:
            return asset

    # Short-circuit: same project and NOT_STARTED (avoid current item and original)
    if project_slug:
        candidate = concordia_models.Asset.objects.filter(
            campaign_id=campaign.id,
            item__project__slug=project_slug,
            item__published=True,
            item__project__published=True,
            published=True,
            transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED,
        ).exclude(pk__in=Subquery(reserved_asset_ids))
        if original_pk is not None:
            candidate = candidate.exclude(pk=original_pk)
        if item_id:
            candidate = candidate.exclude(item__item_id=item_id)

        asset = _lock_first_asset(
            candidate.order_by("item__item_id", "sequence", "id")
        )
        if asset:
            return asset

    # Cache-backed selection, then manual fallback. Both order NOT_STARTED
    # first but are not restricted to it.
    potential_next_assets = find_and_order_potential_transcribable_campaign_assets(
        campaign, project_slug, item_id, original_asset_id
    )
    if original_pk is not None:
        potential_next_assets = potential_next_assets.exclude(asset_id=original_pk)
    if item_id:
        # Keep moving forward: avoid bouncing to the same item
        potential_next_assets = potential_next_assets.exclude(item_item_id=item_id)

    # Locks the cache row (not the asset) while we resolve the asset id.
    asset_id = (
        potential_next_assets.select_for_update(skip_locked=True, of=("self",))
        .values_list("asset_id", flat=True)
        .first()
    )

    spawn_task = False
    if asset_id:
        asset_query = concordia_models.Asset.objects.filter(id=asset_id)
    else:
        structured_logger.debug(
            "No cached assets matched, falling back to manual lookup",
            event_code="transcribable_next_fallback_manual",
            campaign=campaign,
        )
        spawn_task = True
        asset_query = find_new_transcribable_campaign_assets(campaign)
        if original_pk is not None:
            asset_query = asset_query.exclude(pk=original_pk)
        if item_id:
            asset_query = asset_query.exclude(item__item_id=item_id)
        # Mirror the cache ordering: NOT_STARTED, same project, same item.
        asset_query = asset_query.annotate(
            unstarted=Case(
                When(
                    transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED,
                    then=1,
                ),
                default=0,
                output_field=IntegerField(),
            ),
            same_project=Case(
                When(item__project__slug=project_slug, then=1),
                default=0,
                output_field=IntegerField(),
            ),
            same_item=Case(
                When(item__item_id=item_id, then=1),
                default=0,
                output_field=IntegerField(),
            ),
        ).order_by(
            "-unstarted",
            "-same_project",
            "-same_item",
            "sequence",
            "id",
        )

    asset = _lock_first_asset(asset_query)
    if asset:
        if spawn_task:
            # The cache is only repopulated when the manual fallback actually
            # produced an asset.
            structured_logger.debug(
                "Spawned background task to populate cache",
                event_code="transcribable_next_cache_population",
                campaign=campaign,
            )
            populate_task = get_registered_task(
                "concordia.tasks.next_asset.transcribable.populate_next_transcribable_for_campaign"
            )
            populate_task.delay(campaign.id)
        return asset

    # Only now consider same-item IN_PROGRESS after current sequence
    if item_id:
        return _lock_first_asset(
            _same_item_candidates(
                campaign,
                item_id=item_id,
                status=concordia_models.TranscriptionStatus.IN_PROGRESS,
                reserved_asset_ids=reserved_asset_ids,
                original_pk=original_pk,
                after_seq=after_seq,
            )
        )

    return None


def find_invalid_next_transcribable_campaign_assets(
    campaign_id: int,
) -> "QuerySet[concordia_models.NextTranscribableCampaignAsset]":
    """
    Find cached transcribable rows for a campaign that should no longer be served.

    Behavior:
        A `NextTranscribableCampaignAsset` row for the campaign is treated as
        invalid when its asset's transcription status is neither
        `NOT_STARTED` nor `IN_PROGRESS`, or when its asset has an
        `AssetTranscriptionReservation` row.

    Args:
        campaign_id (int): Identifier of the campaign.

    Returns:
        QuerySet[concordia_models.NextTranscribableCampaignAsset]: Distinct invalid
            cache rows.
    """
    cache_rows = concordia_models.NextTranscribableCampaignAsset.objects
    transcribable_statuses = [
        concordia_models.TranscriptionStatus.NOT_STARTED,
        concordia_models.TranscriptionStatus.IN_PROGRESS,
    ]

    # Cache rows whose asset is no longer in a transcribable status.
    wrong_status_rows = cache_rows.filter(campaign_id=campaign_id).exclude(
        asset__transcription_status__in=transcribable_statuses
    )

    # Cache rows whose asset is reserved.
    campaign_reservations = (
        concordia_models.AssetTranscriptionReservation.objects.filter(
            asset__campaign_id=campaign_id
        )
    )
    reserved_rows = cache_rows.filter(
        campaign_id=campaign_id,
        asset_id__in=Subquery(campaign_reservations.values("asset_id")),
    )

    # OR-ing the querysets can yield duplicate rows, hence distinct().
    return (wrong_status_rows | reserved_rows).distinct()


================================================
FILE: concordia/utils/next_asset/transcribable/topic.py
================================================
from typing import Dict

from django.db import transaction
from django.db.models import Case, IntegerField, Q, QuerySet, Subquery, When

from concordia import models as concordia_models
from concordia.logging import ConcordiaLogger
from concordia.utils.celery import get_registered_task

# Module-level structured logger, named after this module (`__name__`).
structured_logger = ConcordiaLogger.get_logger(__name__)


def _reserved_asset_ids_subq() -> "QuerySet[Dict[str, int]]":
    """
    Build the queryset of all reserved asset ids.

    Behavior:
        Selects the `asset_id` of every `AssetTranscriptionReservation` row.
        It is not filtered to a topic, to avoid extra joins. The result is
        meant to be wrapped in `Subquery(...)` and used in `pk__in` filters
        or excludes.

    Returns:
        QuerySet[Dict[str, int]]: A values queryset whose rows carry a single
            "asset_id" key.
    """
    all_reservations = concordia_models.AssetTranscriptionReservation.objects
    return all_reservations.values("asset_id")


def _eligible_transcribable_base_qs(
    topic: "concordia_models.Topic",
) -> "QuerySet[concordia_models.Asset]":
    """
    Return the topic's published assets that can still be transcribed.

    Behavior:
        Keeps assets whose project is linked to the topic, whose project,
        item, and the asset itself are published, and whose transcription
        status is `NOT_STARTED` or `IN_PROGRESS`.

    Args:
        topic (concordia_models.Topic): Topic scope for filtering.

    Returns:
        QuerySet[concordia_models.Asset]: Matching assets with `item` and
            `item__project` joined through `select_related`.
    """
    transcribable_statuses = [
        concordia_models.TranscriptionStatus.NOT_STARTED,
        concordia_models.TranscriptionStatus.IN_PROGRESS,
    ]
    # All conditions stay in one filter() call so they apply to the same
    # project/topic join.
    transcribable_assets = concordia_models.Asset.objects.filter(
        item__project__topics=topic.id,
        item__project__published=True,
        item__published=True,
        published=True,
        transcription_status__in=transcribable_statuses,
    )
    return transcribable_assets.select_related("item", "item__project")


def _next_seq_after(pk: int | None) -> int | None:
    """
    Resolve the sequence number for a given asset primary key.

    Behavior:
        Convenience utility for ordering logic when advancing within a series
        of assets.

    Args:
        pk (int | None): Asset primary key whose sequence to resolve.

    Returns:
        int | None: The asset's sequence number, or None if `pk` is falsy
            or the asset does not exist.
    """
    if not pk:
        return None
    return (
        concordia_models.Asset.objects.filter(pk=pk)
        .values_list("sequence", flat=True)
        .first()
    )


def _order_unstarted_first(
    qs: "QuerySet[concordia_models.Asset]",
) -> "QuerySet[concordia_models.Asset]":
    """
    Order a queryset so `NOT_STARTED` assets come first, then by `sequence`.

    Args:
        qs (QuerySet[concordia_models.Asset]): Base queryset to annotate and sort.

    Returns:
        QuerySet[concordia_models.Asset]: The queryset annotated with a
            transient `unstarted` field (1 for `NOT_STARTED`, else 0) and
            ordered by `-unstarted`, `sequence`.
    """
    not_started = concordia_models.TranscriptionStatus.NOT_STARTED
    unstarted_flag = Case(
        When(transcription_status=not_started, then=1),
        default=0,
        output_field=IntegerField(),
    )
    flagged = qs.annotate(unstarted=unstarted_flag)
    return flagged.order_by("-unstarted", "sequence")


def _find_transcribable_in_item_for_topic(
    topic: "concordia_models.Topic",
    *,
    item_id: str,
    after_asset_pk: int | None,
) -> "concordia_models.Asset | None":
    """
    Fast path: find the next transcribable asset in the same item, constrained
    to the topic.

    Behavior:
        - Asset must belong to a project that is in this topic.
        - Exclude the current asset.
        - Advance by `(sequence, id)` within the item.
        - Return only `NOT_STARTED` here (defer `IN_PROGRESS` to later fallbacks).
        - Skip reserved assets.
        - Respect published flags.

    Args:
        topic (concordia_models.Topic): Topic scope.
        item_id (str): Identifier of the item to stay within.
        after_asset_pk (int | None): Asset primary key to advance from.

    Returns:
        concordia_models.Asset | None: The next eligible asset, or None if none.
    """
    if not item_id:
        return None

    cur_seq = None
    if after_asset_pk:
        cur_seq = (
            concordia_models.Asset.objects.filter(pk=after_asset_pk)
            .values_list("sequence", flat=True)
            .first()
        )

    reserved_asset_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )

    base = concordia_models.Asset.objects.filter(
        item__item_id=item_id,
        item__project__topics=topic.id,
        item__published=True,
        item__project__published=True,
        published=True,
    ).exclude(pk__in=Subquery(reserved_asset_ids))

    if after_asset_pk:
        if cur_seq is not None:
            base = base.filter(
                Q(sequence__gt=cur_seq)
                | (Q(sequence=cur_seq) & Q(id__gt=after_asset_pk))
            )
        else:
            base = base.exclude(id=after_asset_pk)

    # ONLY NOT_STARTED in this short-circuit
    return (
        base.filter(
            transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED
        )
        .order_by("sequence", "id")
        .first()
    )


def _find_transcribable_not_started_in_project_for_topic(
    topic: "concordia_models.Topic",
    *,
    project_slug: str,
    exclude_item_id: str | None = None,
) -> "concordia_models.Asset | None":
    """
    Look up the first unreserved `NOT_STARTED` asset of a project within a topic.

    Behavior:
        Considers only published assets whose item and project are published
        and whose project is linked to `topic`. Assets with a transcription
        reservation are skipped. Results are ordered by
        `(item__item_id, sequence, id)` and the first row is returned.

    Args:
        topic (concordia_models.Topic): Topic scope.
        project_slug (str): Slug of the project to stay within. A falsy value
            short-circuits to `None`.
        exclude_item_id (str | None): When truthy, assets of this item are
            left out.

    Returns:
        concordia_models.Asset | None: The first matching asset, or None when
            nothing matches.
    """
    if not project_slug:
        return None

    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )

    candidates = concordia_models.Asset.objects.filter(
        item__project__topics=topic.id,
        item__project__slug=project_slug,
        item__published=True,
        item__project__published=True,
        published=True,
        transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED,
    ).exclude(pk__in=Subquery(reserved_ids))

    if exclude_item_id:
        candidates = candidates.exclude(item__item_id=exclude_item_id)

    ordered = candidates.order_by("item__item_id", "sequence", "id")
    return ordered.first()


def find_new_transcribable_topic_assets(
    topic: "concordia_models.Topic",
) -> "QuerySet[concordia_models.Asset]":
    """
    Build the queryset of assets that could be added to the topic's cache.

    Behavior:
        Selects published assets (with published item and project) in
        projects linked to `topic` whose status is `NOT_STARTED` or
        `IN_PROGRESS`, then drops assets that are reserved or already present
        in `NextTranscribableTopicAsset` for this topic.

    Args:
        topic (concordia_models.Topic): Topic to filter by.

    Returns:
        QuerySet[concordia_models.Asset]: Eligible assets ordered by `sequence`.
    """
    statuses = concordia_models.TranscriptionStatus

    # The reservation subquery is intentionally not restricted to the topic:
    # doing so would require joining asset -> item -> project -> topic, which
    # is usually more expensive than simply selecting every reserved id.
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )
    already_cached_ids = concordia_models.NextTranscribableTopicAsset.objects.filter(
        topic=topic
    ).values("asset_id")

    published_in_topic = concordia_models.Asset.objects.filter(
        item__project__topics=topic.id,
        item__project__published=True,
        item__published=True,
        published=True,
    )
    workable_status = Q(transcription_status=statuses.NOT_STARTED) | Q(
        transcription_status=statuses.IN_PROGRESS
    )

    eligible = (
        published_in_topic.filter(workable_status)
        .exclude(pk__in=Subquery(reserved_ids))
        .exclude(pk__in=Subquery(already_cached_ids))
    )
    return eligible.order_by("sequence")


def find_next_transcribable_topic_assets(
    topic: "concordia_models.Topic",
) -> "QuerySet[concordia_models.NextTranscribableTopicAsset]":
    """
    Return the `NextTranscribableTopicAsset` cache rows belonging to a topic.

    Behavior:
        Filters the cache table by `topic` only; no status or reservation
        filtering is applied here.

    Args:
        topic (concordia_models.Topic): Topic whose cached rows are wanted.

    Returns:
        QuerySet[concordia_models.NextTranscribableTopicAsset]: Cached candidates.
    """
    cache_manager = concordia_models.NextTranscribableTopicAsset.objects
    return cache_manager.filter(topic=topic)


@transaction.atomic
def find_transcribable_topic_asset(
    topic: "concordia_models.Topic",
) -> "concordia_models.Asset | None":
    """
    Pick one transcribable asset for a topic.

    Behavior:
        Looks for a row in `NextTranscribableTopicAsset` first. When the cache
        yields nothing, the candidate set is computed directly from `Asset`
        and, after the asset lookup has run, a background task is queued to
        repopulate the cache for the topic (whether or not an asset was found).

    Concurrency:
        Both the cache lookup and the asset lookup use
        `select_for_update(skip_locked=True, of=("self",))`, so only rows of
        the queried table are locked and rows locked elsewhere are skipped.

    Args:
        topic (concordia_models.Topic): Topic to search within.

    Returns:
        concordia_models.Asset | None: A locked eligible asset, or None if
            unavailable.
    """
    # of=("self",) restricts row locking to the queried table instead of also
    # locking rows of joined tables (e.g. the item table).
    lock_options = {"skip_locked": True, "of": ("self",)}

    cached_asset_id = (
        find_next_transcribable_topic_assets(topic)
        .select_for_update(**lock_options)
        .values_list("asset_id", flat=True)
        .first()
    )

    cache_miss = not cached_asset_id
    if cache_miss:
        # Nothing cached for this topic, so compute candidates directly.
        structured_logger.debug(
            "No cached assets available, falling back to manual lookup",
            event_code="transcribable_fallback_manual_lookup",
            topic=topic,
        )
        candidates = find_new_transcribable_topic_assets(topic)
    else:
        candidates = concordia_models.Asset.objects.filter(id=cached_asset_id)

    asset = (
        candidates.select_for_update(**lock_options)
        .select_related("item", "item__project")
        .first()
    )

    if cache_miss:
        # The cache refresh is queued only after our own lookup; otherwise
        # there is a chance the task grabs every valid asset first and the
        # query above returns nothing.
        structured_logger.debug(
            "Spawned background task to populate cache",
            event_code="transcribable_cache_population_triggered",
            topic=topic,
        )
        refresh_task = get_registered_task(
            "concordia.tasks.next_asset.transcribable.populate_next_transcribable_for_topic"
        )
        refresh_task.delay(topic.id)

    return asset


def find_and_order_potential_transcribable_topic_assets(
    topic: "concordia_models.Topic",
    project_slug: str,
    item_id: str,
    asset_pk: int,
) -> "QuerySet[concordia_models.NextTranscribableTopicAsset]":
    """
    Return the topic's cached candidates ranked by status and proximity.

    Behavior:
        Annotates every `NextTranscribableTopicAsset` row of the topic with
        three 0/1 flags and sorts by them in descending order, so that
        `NOT_STARTED` rows come first, then rows of the same project, then
        rows of the same item. Ties are broken by `sequence` and `asset_id`.

    Annotations added to each row (transient fields):
        - unstarted (int): 1 if transcription status is `NOT_STARTED`, else 0.
        - same_project (int): 1 if the row's `project_slug` matches, else 0.
        - same_item (int): 1 if the row's `item_item_id` matches, else 0.

    Args:
        topic (concordia_models.Topic): Topic to filter by.
        project_slug (str): Slug of the original asset's project.
        item_id (str): Item identifier of the original asset.
        asset_pk (int): Primary key of the original asset. Accepted for
            interface compatibility; not used by this function.

    Returns:
        QuerySet[concordia_models.NextTranscribableTopicAsset]: Prioritized
            cached candidates.
    """

    def _flag(**lookup):
        # 1 when the row matches `lookup`, 0 otherwise.
        return Case(
            When(**lookup, then=1),
            default=0,
            output_field=IntegerField(),
        )

    cached_rows = find_next_transcribable_topic_assets(topic)
    flagged_rows = cached_rows.annotate(
        unstarted=_flag(
            transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED
        ),
        same_project=_flag(project_slug=project_slug),
        same_item=_flag(item_item_id=item_id),
    )
    return flagged_rows.order_by(
        "-unstarted",
        "-same_project",
        "-same_item",
        "sequence",
        "asset_id",
    )


@transaction.atomic
def find_next_transcribable_topic_asset(
    topic: "concordia_models.Topic",
    project_slug: str,
    item_id: str,
    original_asset_id: int | str | None,
) -> "concordia_models.Asset | None":
    """
    Retrieve the next best transcribable asset within a topic.

    Selection stages, tried in order until one yields an asset:
        1) Same item: if `item_id` is provided, the first unreserved
           `NOT_STARTED` asset in that item by `(sequence, id)`. When the
           original asset is known and belongs to `item_id`, only assets
           strictly after it are considered.
        2) Same project: if `project_slug` is provided, the first unreserved
           `NOT_STARTED` asset in that project ordered by
           `(item id, sequence, id)`, excluding the current item.
        3) Cache: the best-ranked `NextTranscribableTopicAsset` row for the
           topic (see `find_and_order_potential_transcribable_topic_assets`),
           excluding the original asset and the current item. Rows are ranked
           to prefer `NOT_STARTED`, but no status filter is applied here.
        4) Manual fallback (only when stage 3 produced no cached asset id):
           a ranked query over `find_new_transcribable_topic_assets`. If this
           stage returns an asset, the cache population task is queued.
        5) Same item, `IN_PROGRESS`: if `item_id` is provided, the first
           unreserved `IN_PROGRESS` asset in that item, with the same
           "strictly after the original" rule as stage 1. The cache
           population task is queued here too if stage 4 was attempted.

    Concurrency:
        Uses `select_for_update(skip_locked=True, of=("self",))` to avoid
        double-assignments across concurrent consumers.

    Args:
        topic (concordia_models.Topic): Topic to search within.
        project_slug (str): Slug of the current project.
        item_id (str): Identifier of the current item.
        original_asset_id (int | str | None): Identifier of the asset just
            transcribed. Integers and all-digit strings are used; any other
            value is treated as "no original asset".

    Returns:
        concordia_models.Asset | None: A locked eligible asset, or None if
            unavailable.
    """
    # Resolve original context safely (int or digit-string only)
    after_seq = None
    orig = None
    orig_item_id = None
    orig_id_valid = isinstance(original_asset_id, int) or (
        isinstance(original_asset_id, str) and original_asset_id.isdigit()
    )
    if orig_id_valid:
        try:
            # Load only the fields needed to position the original asset.
            orig = (
                concordia_models.Asset.objects.select_related("item")
                .only("id", "sequence", "item__item_id")
                .get(pk=original_asset_id)
            )
            orig_item_id = getattr(orig.item, "item_id", None)
            # Keep sequence handy for same-item gating in any path
            after_seq = orig.sequence
        except concordia_models.Asset.DoesNotExist:
            # Unknown original asset: continue without positional gating.
            orig = None
            orig_item_id = None
            after_seq = None

    # Ids of all reserved assets (not restricted to this topic); used as an
    # exclusion subquery by the direct Asset queries below.
    reserved_asset_ids = concordia_models.AssetTranscriptionReservation.objects.values(
        "asset_id"
    )

    # Short-circuit: same item and NOT_STARTED after current sequence
    if item_id:
        qs = concordia_models.Asset.objects.filter(
            item__project__topics=topic.id,
            item__item_id=item_id,
            item__published=True,
            item__project__published=True,
            published=True,
            transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED,
        ).exclude(pk__in=Subquery(reserved_asset_ids))
        if orig_id_valid:
            qs = qs.exclude(pk=original_asset_id)
        # Positional gating applies only when the original asset actually
        # belongs to the requested item.
        if after_seq is not None and orig_item_id == item_id:
            qs = qs.filter(
                Q(sequence__gt=after_seq)
                | (Q(sequence=after_seq) & Q(id__gt=int(original_asset_id)))
            )
        asset = (
            qs.order_by("sequence", "id")
            .select_for_update(skip_locked=True, of=("self",))
            .select_related("item", "item__project")
            .first()
        )
        if asset:
            return asset

    # Short-circuit: same project and NOT_STARTED (topic-constrained)
    if project_slug:
        candidate = concordia_models.Asset.objects.filter(
            item__project__topics=topic.id,
            item__project__slug=project_slug,
            item__published=True,
            item__project__published=True,
            published=True,
            transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED,
        ).exclude(pk__in=Subquery(reserved_asset_ids))
        if orig_id_valid:
            candidate = candidate.exclude(pk=original_asset_id)
        # The current item was already tried above; skip it to keep moving on.
        if item_id:
            candidate = candidate.exclude(item__item_id=item_id)

        asset = (
            candidate.order_by("item__item_id", "sequence", "id")
            .select_for_update(skip_locked=True, of=("self",))
            .select_related("item", "item__project")
            .first()
        )
        if asset:
            return asset

    # Cache-backed selection, then manual fallback. Cached rows are ranked to
    # prefer NOT_STARTED but are not filtered by status in this function.
    potential_next_assets = find_and_order_potential_transcribable_topic_assets(
        topic, project_slug, item_id, original_asset_id
    )
    if orig_id_valid:
        potential_next_assets = potential_next_assets.exclude(
            asset_id=original_asset_id
        )
    if item_id:
        potential_next_assets = potential_next_assets.exclude(item_item_id=item_id)

    # Lock and read the id of the best-ranked cache row, if any.
    asset_id = (
        potential_next_assets.select_for_update(skip_locked=True, of=("self",))
        .values_list("asset_id", flat=True)
        .first()
    )

    # spawn_task records that the cache had nothing usable, so the population
    # task should be queued once an asset has been selected.
    spawn_task = False
    if asset_id:
        asset_query = concordia_models.Asset.objects.filter(id=asset_id)
    else:
        structured_logger.debug(
            "No cached assets matched, falling back to manual lookup",
            event_code="transcribable_next_fallback_manual",
            topic=topic,
        )
        spawn_task = True
        asset_query = find_new_transcribable_topic_assets(topic)
        if orig_id_valid:
            asset_query = asset_query.exclude(pk=original_asset_id)
        if item_id:
            asset_query = asset_query.exclude(item__item_id=item_id)
        # If we know the original's item/seq, keep moving forward within that item
        if orig_item_id and after_seq is not None:
            asset_query = asset_query.exclude(
                Q(item__item_id=orig_item_id, sequence__lte=after_seq)
            )

        # Prefer same project and same item; if item_id is blank, prefer original's item
        ref_item_id = item_id or orig_item_id
        # Same ranking scheme as the cache path, expressed against Asset
        # fields instead of the denormalized cache columns.
        asset_query = asset_query.annotate(
            unstarted=Case(
                When(
                    transcription_status=concordia_models.TranscriptionStatus.NOT_STARTED,
                    then=1,
                ),
                default=0,
                output_field=IntegerField(),
            ),
            same_project=Case(
                When(item__project__slug=project_slug, then=1),
                default=0,
                output_field=IntegerField(),
            ),
            same_item=Case(
                When(item__item_id=ref_item_id, then=1),
                default=0,
                output_field=IntegerField(),
            ),
        ).order_by(
            "-unstarted",
            "-same_project",
            "-same_item",
            "sequence",
            "id",
        )

    # Fetch (and lock) the Asset row for whichever path was chosen above.
    asset = (
        asset_query.select_for_update(skip_locked=True, of=("self",))
        .select_related("item", "item__project")
        .first()
    )
    if asset:
        # The population task is queued only after an asset has been selected.
        if spawn_task:
            structured_logger.debug(
                "Spawned background task to populate cache",
                event_code="transcribable_next_cache_population",
                topic=topic,
            )
            populate_task = get_registered_task(
                "concordia.tasks.next_asset.transcribable.populate_next_transcribable_for_topic"
            )
            populate_task.delay(topic.id)
        return asset

    # Only now consider same-item IN_PROGRESS after current sequence
    if item_id:
        qs = concordia_models.Asset.objects.filter(
            item__project__topics=topic.id,
            item__item_id=item_id,
            item__published=True,
            item__project__published=True,
            published=True,
            transcription_status=concordia_models.TranscriptionStatus.IN_PROGRESS,
        ).exclude(pk__in=Subquery(reserved_asset_ids))
        if orig_id_valid:
            qs = qs.exclude(pk=original_asset_id)
        if after_seq is not None and orig_item_id == item_id:
            qs = qs.filter(
                Q(sequence__gt=after_seq)
                | (Q(sequence=after_seq) & Q(id__gt=int(original_asset_id)))
            )
        asset = (
            qs.order_by("sequence", "id")
            .select_for_update(skip_locked=True, of=("self",))
            .select_related("item", "item__project")
            .first()
        )
        if asset:
            # Same dispatch rule as above: queue the task only if the manual
            # fallback was attempted and an asset is being returned.
            if spawn_task:
                structured_logger.debug(
                    "Spawned background task to populate cache",
                    event_code="transcribable_next_cache_population",
                    topic=topic,
                )
                populate_task = get_registered_task(
                    "concordia.tasks.next_asset.transcribable.populate_next_transcribable_for_topic"
                )
                populate_task.delay(topic.id)
            return asset

    # Nothing eligible was found in any stage; no task is queued in this case.
    return None


def find_invalid_next_transcribable_topic_assets(
    topic_id: int,
) -> "QuerySet[concordia_models.NextTranscribableTopicAsset]":
    """
    Find cache rows of a topic that should no longer be offered.

    Behavior:
        A `NextTranscribableTopicAsset` row is considered invalid when its
        asset's status is neither `NOT_STARTED` nor `IN_PROGRESS`, or when its
        asset has a transcription reservation. The two sets are OR-combined
        and de-duplicated.

    Args:
        topic_id (int): Identifier of the topic.

    Returns:
        QuerySet[concordia_models.NextTranscribableTopicAsset]: Distinct invalid
            cache rows.
    """
    statuses = concordia_models.TranscriptionStatus
    cache_rows = concordia_models.NextTranscribableTopicAsset.objects.filter(
        topic_id=topic_id
    )

    # Rows whose asset has moved past the transcribable statuses.
    wrong_status_rows = cache_rows.exclude(
        asset__transcription_status__in=[
            statuses.NOT_STARTED,
            statuses.IN_PROGRESS,
        ]
    )

    # Rows whose asset is reserved (reservations limited to this topic).
    reserved_ids = concordia_models.AssetTranscriptionReservation.objects.filter(
        asset__item__project__topics=topic_id
    ).values("asset_id")
    reserved_rows = cache_rows.filter(asset_id__in=Subquery(reserved_ids))

    invalid_rows = wrong_status_rows | reserved_rows
    return invalid_rows.distinct()


================================================
FILE: concordia/validators.py
================================================
from django.conf import settings
from django.utils.translation import gettext_lazy as _

from .passwords.validators import ComplexityValidator


class DjangoPasswordsValidator:
    """
    Adapter exposing the complexity validator through Django's password
    validation API (Django 1.9+).

    django-passwords is not compatible with Django 4+, so its validator lives
    in the concordia.passwords module and is wrapped here.
    """

    code = "complexity"
    message = _("Must be more complex (%s)")

    def __init__(self):
        """Build the wrapped validator from `settings.PASSWORD_COMPLEXITY`."""
        complexity_rules = settings.PASSWORD_COMPLEXITY
        self.validator = ComplexityValidator(complexity_rules)

    def get_help_text(self):
        """Return the translated help text shown for this validator."""
        help_text = _("Your password fails to meet our complexity requirements.")
        return help_text

    def validate(self, value, user=None):
        """
        Run the wrapped complexity validator against `value`.

        `user` is accepted for API compatibility and is not used. Whatever the
        wrapped validator returns is passed through.
        """
        outcome = self.validator(value)
        return outcome


================================================
FILE: concordia/version.py
================================================
import functools

from setuptools_scm import get_version


@functools.lru_cache(maxsize=None)
def get_concordia_version():
    """
    Return the application version reported by `setuptools_scm.get_version`.

    The result is memoized, so `get_version` runs at most once per process.
    """
    version = get_version()
    return version


================================================
FILE: concordia/views/README.md
================================================
## \_\_init\_\_.py

Initializes the `views` module and re-exports submodules for chained attribute access
such as `views.campaigns`. Also includes some basic views.

### Class-based Views

-   **HomeView** - A `ListView` displaying featured campaigns on the homepage

### Function-based Views

-   **healthz** - Returns a JSON response with system and application status

## accounts.py

Views related to user account management, including login, registration and profile updates

### Class-based Views

-   **ConcordiaPasswordResetConfirmView** - Customized password reset confirmation
-   **ConcordiaPasswordResetRequestView** - Customized password reset requests
-   **ConcordiaRegistrationView** - Custom registration view with rate limiting
-   **ConcordiaLoginView** - Login view with Turnstile challenge validation
-   **AccountProfileView** - View for managing a user's profile and displaying contributions
-   **AccountDeletionView** - View for users to delete their account (or anonymize it)
-   **EmailReconfirmationView** - Handles confirming a user's changed email address

### Function-based Views

-   **account_letter** - Generates and returns a PDF letter summarizing contributions
-   **get_pages** - Renders a fragment of recent contributed pages

### Functions

-   **registration_rate** - Rate-limit for failed registration attempts

## ajax.py

AJAX endpoints for dynamic client interactions

### Function-based Views

-   **ajax_session_status** - Returns user-specific session data used by the frontend
-   **ajax_messages** - Returns any queued messages for the current user
-   **generate_ocr_transcription** - Generates a new transcription using OCR
-   **rollback_transcription** - Reverts transcription to the previous version
-   **rollforward_transcription** - Reverts the most recent transcription rollback
-   **save_transcription** - Saves a new transcription
-   **submit_transcription** - Marks a transcription as submitted for review
-   **review_transcription** - Accepts or rejects a submitted transcription
-   **submit_tags** - Updates the tag list for an asset
-   **reserve_asset** - Manages reservation of an asset to prevent conflicts

### Functions

-   **get_transcription_superseded** - Determines if the superseded transcription is valid
-   **update_reservation** - Updates the timestamp for a reservation
-   **obtain_reservation** - Creates a new reservation

## assets.py

Views for displaying asset detail pages and redirecting users to the next appropriate asset

### Class-based Views

-   **AssetDetailView** - Displays the transcription interface for a single asset

### Function-based Views

-   **redirect_to_next_asset** - Redirects to provided asset
-   **redirect_to_next_reviewable_asset** - Finds and redirects to a reviewable asset
-   **redirect_to_next_transcribable_asset** - Finds and redirects to a transcribable asset
-   **redirect_to_next_reviewable_campaign_asset** - Finds and redirects to a reviewable asset for a campaign
-   **redirect_to_next_transcribable_campaign_asset** - Finds and redirects to a transcribable asset for a campaign
-   **redirect_to_next_reviewable_topic_asset** - Finds and redirects to a reviewable asset for a topic
-   **redirect_to_next_transcribable_topic_asset** - Finds and redirects to a transcribable asset for a topic

## campaigns.py

Views for listing campaigns, rendering campaign details, showing reports and filtering by reviewable status

### Class-based Views

-   **CampaignListView** - Lists all active campaigns (unused)
-   **CompletedCampaignListView** - Lists all completed and retired campaigns
-   **CampaignTopicListView** - Primary active campaign list view; also includes active topics
-   **CampaignDetailView** - Shows full details about a single campaign
-   **FilteredCampaignDetailView** - Variant of `CampaignDetailView` that applies filtering based on the user
-   **ReportCampaignView** - Displays a campaign report summarizing stats such as asset counts and contributors

## decorators.py

Custom decorators used by views

### Functions

-   **default_cache_control** - Applies default public caching headers for pages that don't vary per user
-   **user_cache_control** - Applies public caching headers with variation for logged-in users
-   **validate_anonymous_user** - Validates anonymous users via Turnstile before processing requests
-   **reserve_rate** - Returns a rate-limit value for unauthenticated users for reserving assets
-   **next_asset_rate** - Returns a rate-limit value for unauthenticated users for next\_\*\_asset views

## items.py

Views for displaying individual item detail pages

### Class-based Views

-   **ItemDetailView** - Displays a paginated list of assets within an item
-   **FilteredItemDetailView** - Variant of `ItemDetailView` that applies filtering based on the user

## maintenance_mode.py

Views for toggling the site's maintenance mode. Only accessible to superusers

### Function-based Views

-   **maintenance_mode_off** - Disables maintenance mode
-   **maintenance_mode_on** - Enables maintenance mode
-   **maintenance_mode_frontend_available** - Enables access to the frontend for staff while in maintenance mode
-   **maintenance_mode_frontend_unavailable** - Disables access to the frontend for staff while in maintenance mode

## projects.py

Views for displaying project detail pages

### Class-based Views

-   **ProjectDetailView** - Displays a project and its items
-   **FilteredProjectDetailView** - Variant of `ProjectDetailView` that applies filtering based on the user

## rate_limit.py

Custom handler for responding to requests that exceed rate limits

### Function-based Views

-   **ratelimit_view** - Returns a 429 response when a user is rate-limited

## simple_pages.py

Views and redirects for rendering static pages stored in the database

### Function-based Views

-   **simple_page** - Renders a simple static page from the database
-   **about_simple_page** - Renders the "about" simple page, which includes some additional data

### Class-based Views

-   **HelpCenterRedirectView** - Redirects old help center URLs to new equivalents
-   **HelpCenterSpanishRedirectView** - Redirects old Spanish help center URLs to new equivalents

## topics.py

View for displaying a topic's detail page

### Class-based Views

-   **TopicDetailView** - Displays a topic's associated projects

## utils.py

Utility functions, constants and mixins used throughout the views module

### Constants

-   **ASSETS_PER_PAGE** - Default number of assets to show per page
-   **PROJECTS_PER_PAGE** - Default number of projects to show per page
-   **ITEMS_PER_PAGE** - Default number of items to show per page
-   **URL_REGEX** - Regular expression used to detect URLs in transcription text
-   **MESSAGE_LEVEL_NAMES** - Dictionary mapping Django message levels to lowercase names

### Functions

-   **\_get_pages** - Returns a queryset of assets a user has worked on
-   **calculate_asset_stats** - Adds contributor and transcription status to the provided assets
-   **annotate_children_with_progress_stats** - Annotates a list of objects with progress information

### Classes

-   **AnonymousUserValidationCheckMixin** - Requires anonymous users to pass Turnstile validation

## visualizations.py

Views for displaying visualizations

### Classes

-   **VisualizationDataView** - Returns JSON representing the visualization `name`


================================================
FILE: concordia/views/__init__.py
================================================
import json
import logging
import os
from time import time

from django.conf import settings
from django.http import HttpResponse
from django.utils.decorators import method_decorator
from django.views.decorators.cache import never_cache
from django.views.generic import ListView

from concordia.models import Banner, Campaign, CarouselSlide
from concordia.version import get_concordia_version

# These imports are required to make chained attribute access (e.g.,
# views.campaigns.CampaignDetailView) work correctly
from . import (
    accounts,  # noqa: F401
    ajax,  # noqa: F401
    assets,  # noqa: F401
    campaigns,  # noqa: F401
    items,  # noqa: F401
    maintenance_mode,  # noqa: F401
    projects,  # noqa: F401
    rate_limit,  # noqa: F401
    simple_pages,  # noqa: F401
    topics,  # noqa: F401
    visualizations,  # noqa: F401
)
from .decorators import default_cache_control

# Module-level standard-library logger, named after this module.
logger = logging.getLogger(__name__)


@never_cache
def healthz(request):
    """
    Return a JSON document describing basic system and application health.

    The response body contains:
        - current_time: current Unix timestamp from `time.time()`.
        - load_average: the system load averages from `os.getloadavg()`.
        - debug: the value of `settings.DEBUG`.
        - database_has_data: whether at least one `Campaign` row exists.
        - application_version: the value of `get_concordia_version()`.

    Args:
        request (HttpRequest): The incoming request (not inspected).

    Returns:
        HttpResponse: The status dictionary serialized as `application/json`.
    """
    status = {
        "current_time": time(),
        "load_average": os.getloadavg(),
        "debug": settings.DEBUG,
    }

    # We don't want to query a large table but we do want to hit the database
    # at least once. exists() lets the database stop at the first row instead
    # of counting every campaign.
    status["database_has_data"] = Campaign.objects.exists()

    status["application_version"] = get_concordia_version()

    return HttpResponse(content=json.dumps(status), content_type="application/json")


@method_decorator(default_cache_control, name="dispatch")
class HomeView(ListView):
    """
    Homepage view listing the campaigns flagged for homepage display.

    The template context exposes the campaigns as `campaigns`, and
    additionally `banner` (first active banner, if any), `slides` (published
    carousel slides by `ordering`) and `firstslide` (first slide, if any).
    """

    context_object_name = "campaigns"
    template_name = "home.html"

    queryset = (
        Campaign.objects.published()
        .listed()
        .filter(display_on_homepage=True)
        .order_by("ordering", "title")
    )

    def get_context_data(self, *args, **kwargs):
        """Extend the list context with the banner and carousel slides."""
        context = super().get_context_data(*args, **kwargs)

        active_banner = Banner.objects.filter(active=True).first()
        if active_banner is not None:
            context["banner"] = active_banner

        slides = CarouselSlide.objects.published().order_by("ordering")
        context["slides"] = slides
        # Truthiness evaluates the queryset; indexing then reuses that result.
        if slides:
            context["firstslide"] = slides[0]

        return context


================================================
FILE: concordia/views/accounts.py
================================================
import gc
import logging
import tracemalloc
import uuid
from smtplib import SMTPException
from typing import Any, Optional, Type

from django.conf import settings
from django.contrib import messages
from django.contrib.auth import logout
from django.contrib.auth.decorators import login_required
from django.contrib.auth.mixins import LoginRequiredMixin
from django.contrib.auth.views import (
    LoginView,
    PasswordResetConfirmView,
    PasswordResetView,
)
from django.contrib.sites.shortcuts import get_current_site
from django.core import signing
from django.core.exceptions import ValidationError
from django.core.mail import send_mail
from django.core.paginator import Paginator
from django.db.models import Sum
from django.forms import Form
from django.http import HttpRequest, HttpResponse, HttpResponseRedirect, JsonResponse
from django.shortcuts import redirect
from django.template import loader
from django.template.loader import render_to_string
from django.urls import reverse_lazy
from django.utils.decorators import method_decorator
from django.utils.translation import gettext_lazy as _
from django.views.decorators.cache import never_cache
from django.views.generic import FormView, ListView, TemplateView
from django_ratelimit.decorators import ratelimit
from django_registration.backends.activation.views import RegistrationView
from weasyprint import HTML

from concordia.forms import (
    AccountDeletionForm,
    ActivateAndSetPasswordForm,
    AllowInactivePasswordResetForm,
    TurnstileForm,
    UserLoginForm,
    UserNameForm,
    UserProfileForm,
    UserRegistrationForm,
)
from concordia.logging import ConcordiaLogger
from concordia.models import Campaign, ConcordiaUser, UserProfileActivity

from .utils import _get_pages

# Standard-library logger for this module.
logger = logging.getLogger(__name__)
# Logger obtained from the project's ConcordiaLogger (concordia.logging).
structured_logger = ConcordiaLogger.get_logger(__name__)


class ConcordiaPasswordResetConfirmView(PasswordResetConfirmView):
    """
    Password reset confirmation view that signs the user in afterwards.

    A thin subclass of Django's
    [PasswordResetConfirmView](https://docs.djangoproject.com/en/stable/topics/auth/default/#django.contrib.auth.views.PasswordResetConfirmView)
    which only overrides two class attributes; all request handling is
    inherited unchanged.

    Attributes:
        form_class (Form): Form presented to choose the new password. Set to
            `ActivateAndSetPasswordForm`.
        post_reset_login (bool): Enabled so that the parent view logs the user
            in once the password has been reset.

    Returns:
        response (HttpResponse): Whatever the parent view produces: the
            confirmation page, or a redirect once the reset has succeeded.
    """

    form_class: type[Form] = ActivateAndSetPasswordForm
    post_reset_login: bool = True


class ConcordiaPasswordResetRequestView(PasswordResetView):
    """
    Password reset request view that swaps in a custom reset form.

    A thin subclass of Django's
    [`PasswordResetView`](https://docs.djangoproject.com/en/stable/topics/auth/default/#django.contrib.auth.views.PasswordResetView).
    The only customization is the form class, `AllowInactivePasswordResetForm`,
    which is intended to let users whose accounts are still inactive request a
    reset (and thereby activate the account in the same flow).

    Attributes:
        form_class (Form): Form that validates and processes the reset
            request.

    Returns:
        response (HttpResponse): Whatever the parent view produces: the reset
            request form, or a redirect after a successful submission.
    """

    form_class: type[Form] = AllowInactivePasswordResetForm


def registration_rate(group: str, request: HttpRequest) -> Optional[str]:
    """
    Pick the rate limit to apply to a registration POST.

    Intended to be passed as the `rate` callable of the
    [ratelimit](https://django-ratelimit.readthedocs.io/en/stable/usage.html#ratelimit)
    decorator from `django-ratelimit`. The submitted data is bound to a
    `UserRegistrationForm`; only submissions that fail validation are
    throttled.

    Args:
        group (str): The rate limit group name. Example: `"registration"`.
            Not used by this function.
        request (HttpRequest): The request carrying the registration form
            data in `request.POST`.

    Returns:
        rate (str or None): `"10/h"` when the form does not validate, or
            `None` (no throttling) when it does.
    """
    candidate_form = UserRegistrationForm(request.POST)
    # Only read for logging; tolerate requests that carry no user attribute.
    requester = getattr(request, "user", None)

    if not candidate_form.is_valid():
        structured_logger.debug(
            "Registration form invalid, throttling.",
            event_code="registration_rate_throttle",
            user=requester,
        )
        return "10/h"

    structured_logger.debug(
        "Registration form valid.",
        event_code="registration_rate_ok",
        user=requester,
    )
    return None


@method_decorator(never_cache, name="dispatch")
@method_decorator(
    ratelimit(
        group="registration",
        key="header:cf-connecting-ip",
        rate=registration_rate,
        method="POST",
        block=settings.RATELIMIT_BLOCK,
    ),
    name="post",
)
class ConcordiaRegistrationView(RegistrationView):
    """
    Registration view whose POST handler is rate limited.

    Subclasses
    [django_registration.views.RegistrationView](https://django-registration.readthedocs.io/en/stable/views.html#django_registration.views.RegistrationView)
    and wraps `post` with the
    [django-ratelimit](https://django-ratelimit.readthedocs.io/en/stable/usage.html#ratelimit)
    decorator. Requests are keyed on the `cf-connecting-ip` header and the
    rate is chosen per request by `registration_rate`, so only invalid
    submissions count against the limit. Whether an over-limit request is
    blocked is controlled by `settings.RATELIMIT_BLOCK`. Responses are also
    marked as never cacheable.

    Attributes:
        form_class (Form): The form used to collect and validate registration
            data. Set to `UserRegistrationForm`.

    Returns:
        response (HttpResponse): Whatever the parent view produces: the
            registration form, or a redirect after successful registration.
    """

    form_class: Type[Form] = UserRegistrationForm


@method_decorator(never_cache, name="dispatch")
class ConcordiaLoginView(LoginView):
    """
    Login view that additionally requires a passing Turnstile challenge.

    Subclasses Django's
    [LoginView](https://docs.djangoproject.com/en/stable/topics/auth/default/#django.contrib.auth.views.LoginView)
    and overrides `post` so that a valid login form is only accepted when the
    accompanying `TurnstileForm` also validates.

    Attributes:
        form_class (Form): The login form used to authenticate users.

    Returns:
        response (HttpResponse): The rendered login form or a redirect,
            depending on the validation outcome.

    Return Behavior:
        - On GET: the login form is rendered with an unbound Turnstile form
          available in the context as `turnstile_form`.
        - On POST:
            - Login form invalid: the form is re-rendered with its errors;
              Turnstile is not checked.
            - Login form valid, Turnstile invalid: the form is re-rendered
              with a non-field error.
            - Both valid: the parent's `form_valid` handles the login.
    """

    form_class = UserLoginForm

    def post(self, request: HttpRequest, *args: Any, **kwargs: Any) -> HttpResponse:
        """
        Validate the login form first, then the Turnstile challenge.

        Args:
            request (HttpRequest): The incoming POST request.

        Returns:
            response (HttpResponse): Result of `form_valid` when both checks
                pass, otherwise the result of `form_invalid`.
        """
        structured_logger.debug(
            "Login POST received.",
            event_code="login_post_entry",
            user=request.user,
        )
        login_form = self.get_form()

        if not login_form.is_valid():
            structured_logger.debug(
                "Login form invalid.",
                event_code="login_form_invalid",
                user=request.user,
            )
            return self.form_invalid(login_form)

        # Credentials are fine; the challenge is only evaluated from here on.
        challenge_form = TurnstileForm(request.POST)
        if not challenge_form.is_valid():
            structured_logger.warning(
                "Turnstile failed for login.",
                event_code="login_turnstile_failed",
                reason="Turnstile validation failed",
                reason_code="turnstile_failed",
                user=request.user,
            )
            login_form.add_error(
                None, "Unable to validate. Please login or complete the challenge."
            )
            return self.form_invalid(login_form)

        structured_logger.debug(
            "Login and Turnstile ok.",
            event_code="login_success",
            user=request.user,
        )
        return self.form_valid(login_form)

    def get_context_data(self, **kwargs: Any) -> dict[str, Any]:
        """
        Extend the parent context with an unbound Turnstile form.

        Returns:
            context (dict[str, Any]): The parent context plus
                `turnstile_form`.
        """
        context = super().get_context_data(**kwargs)
        context["turnstile_form"] = TurnstileForm(auto_id=False)

        structured_logger.debug(
            "Added Turnstile form to context.",
            event_code="login_context_turnstile",
            user=self.request.user,
        )
        return context


@login_required
@never_cache
def account_letter(request: HttpRequest) -> HttpResponse:
    """
    Build a PDF service letter for the logged-in user.

    The user's `UserProfileActivity` rows are summed into review and
    transcription totals, the contributed assets are fetched via
    `_get_pages`, and both are rendered through the
    `documents/service_letter.html` template. The resulting HTML is converted
    to PDF with WeasyPrint using the `pdf/ua-1` variant.

    Requires the user to be authenticated.

    Args:
        request (HttpRequest): The request from the authenticated user.

    Returns:
        response (HttpResponse): A response with content type
            `application/pdf` and a `Content-Disposition` header that
            downloads the document as `letter.pdf`.

    Return Behavior:
        - The template context contains:
            - The user and their join date.
            - Total reviews and total transcriptions.
            - The list of assets the user contributed to.
            - A `file://` URL to the logo image.
    """
    member = request.user
    structured_logger.debug(
        "Building account letter.",
        event_code="account_letter_start",
        user=member,
    )

    logo_url = "file://{0}/{1}/img/logo.jpg".format(
        settings.SITE_ROOT_DIR, settings.STATIC_ROOT
    )
    totals = UserProfileActivity.objects.filter(user=member).aggregate(
        Sum("review_count"), Sum("transcribe_count")
    )
    review_total = totals["review_count__sum"]
    transcription_total = totals["transcribe_count__sum"]
    contributed_assets = _get_pages(request)

    letter_context = {
        "user": member,
        "join_date": member.date_joined,
        "total_reviews": review_total,
        "total_transcriptions": transcription_total,
        "image_url": logo_url,
        "asset_list": contributed_assets,
    }
    letter_template = loader.get_template("documents/service_letter.html")
    letter_markup = letter_template.render(letter_context)
    pdf_bytes = HTML(string=letter_markup).write_pdf(variant="pdf/ua-1")

    response = HttpResponse(content=pdf_bytes, content_type="application/pdf")
    response["Content-Disposition"] = "attachment; filename=letter.pdf"

    structured_logger.debug(
        "Account letter generated.",
        event_code="account_letter_success",
        user=member,
        total_reviews=review_total,
        total_transcriptions=transcription_total,
        asset_count=len(contributed_assets),
    )
    return response


@login_required
@never_cache
def get_pages(request: HttpRequest) -> JsonResponse:
    """
    Return a paginated and filtered list of the user's contributed assets as HTML.

    Retrieves assets the current user has worked on (via `_get_pages`, which
    receives the request and is expected to apply the filters), paginates
    them, and renders the results into a fragment of HTML for use in dynamic
    page updates. Memory usage during the request is measured with
    `tracemalloc` and included in the success log entry; tracing is always
    stopped again, even when rendering fails.

    Requires the user to be authenticated.

    Args:
        request (HttpRequest): The request from the authenticated user.

    Request Parameters:
        - `page` (int): Page number to display. Example: `2`. A value that is
          not an integer falls back to page `1`.
        - `campaign` (int): Filter by campaign ID. Example: `17`. A value that
          is not an integer, or that matches no campaign, is logged and left
          out of the template context.
        - `status` (list[str]): Filter by asset statuses. Example:
          `["in_progress", "submitted"]`
        - `activity` (str): Filter by activity type. Example: `"transcribe"`
        - `order_by` (str): Sort order. Example: `"date-descending"`
        - `start` (str): Start date in YYYY-MM-DD format. Example: `"2023-01-01"`
        - `end` (str): End date in YYYY-MM-DD format. Example: `"2023-12-31"`

    Returns:
        response (JsonResponse): A JSON object containing rendered HTML for recent
            contributed pages.

    Response Format - Success:
        - `content` (str): Rendered HTML for recent pages.

    Example:
        ```json
        {
            "content": "<div class='page-results'>...</div>"
        }
        ```
    """
    tracemalloc.start()
    try:
        gc.collect()

        structured_logger.debug(
            "Fetching recent pages.",
            event_code="recent_pages_entry",
            user=request.user,
            page=request.GET.get("page", "1"),
            campaign=request.GET.get("campaign"),
            activity=request.GET.get("activity"),
        )
        asset_list = _get_pages(request)

        paginator = Paginator(asset_list, 30)  # Show 30 assets per page.

        # `page` comes straight from the query string; a non-numeric value
        # must not turn into an unhandled ValueError. Out-of-range numbers
        # are already handled by Paginator.get_page().
        try:
            page_number = int(request.GET.get("page", "1"))
        except (TypeError, ValueError):
            page_number = 1

        context = {
            "paginator": paginator,
            "page_obj": paginator.get_page(page_number),
            "is_paginated": True,
            "recent_campaigns": Campaign.objects.filter(
                project__item__asset__in=asset_list.values("pk")
            )
            .distinct()
            .order_by("title")
            .values("pk", "title"),
        }
        for param in ("activity", "end", "order_by", "start"):
            context[param] = request.GET.get(param, None)
        # The template variable is `statuses`, the query parameter is the
        # repeatable `status`.
        context["statuses"] = request.GET.getlist("status")

        campaign = request.GET.get("campaign", None)
        if campaign is not None:
            try:
                context["campaign"] = Campaign.objects.get(pk=int(campaign))
            except (ValueError, Campaign.DoesNotExist):
                # Render without a selected campaign (the same context shape
                # as an unfiltered request) instead of failing the request.
                structured_logger.warning(
                    "Ignoring unknown campaign filter.",
                    event_code="recent_pages_campaign_invalid",
                    reason="Campaign filter did not match a campaign",
                    reason_code="campaign_not_found",
                    user=request.user,
                    campaign=campaign,
                )

        data = {}
        data["content"] = loader.render_to_string(
            "fragments/recent-pages.html", context, request=request
        )

        # Capture memory stats
        current, peak = tracemalloc.get_traced_memory()
        current_mb = current / 1024 / 1024
        peak_mb = peak / 1024 / 1024

        # For immediate visibility
        structured_logger.info(
            "Recent pages rendered.",
            event_code="recent_pages_success",
            user=request.user,
            assets=asset_list.count(),
            num_pages=paginator.num_pages,
            page=page_number,
            memory_current_mb=round(current_mb, 2),
            memory_peak_mb=round(peak_mb, 2),
        )

        return JsonResponse(data)
    finally:
        # Always pair start() with stop(); otherwise an exception above would
        # leave tracing enabled for the rest of the process.
        tracemalloc.stop()


@method_decorator(never_cache, name="dispatch")
class AccountProfileView(LoginRequiredMixin, FormView, ListView):
    """
    Display and update user account profile and contribution history.

    Combines functionality from:
    - [LoginRequiredMixin](https://docs.djangoproject.com/en/stable/topics/auth/default/#the-loginrequiredmixin-mixin)
    - [FormView](https://docs.djangoproject.com/en/stable/ref/class-based-views/generic-editing/#formview)
    - [ListView](https://docs.djangoproject.com/en/stable/ref/class-based-views/generic-display/#listview)

    Allows authenticated users to:
    - Update their email address and name
    - View a paginated list of assets they have contributed to
    - See aggregate statistics on their transcription and review activity

    Email changes require confirmation unless the setting
    `REQUIRE_EMAIL_RECONFIRMATION` is False.

    Attributes:
        template_name (str): Template used to render the profile page.
            Example: `"account/profile.html"`
        form_class (Form): Form used to update the user's email address.
            Example: `UserProfileForm`
        success_url (str): Redirect URL after successful form submission.
            Example: `"/accounts/profile/"`
        allow_empty (bool): Whether to render the page if the user has no
            contributions. Default is `True`
        paginate_by (int): Number of contributed assets to show per page.
            Default is `30`.
        reconfirmation_email_body_template (str): Path to the plain text email
            body template. Example: `"emails/email_reconfirmation_body.txt"`
        reconfirmation_email_subject_template (str): Path to the email subject
            template. Example: `"emails/email_reconfirmation_subject.txt"`

    Returns:
        response (HttpResponse): The rendered profile page with contribution data
            or a redirect to `#account` after successful form submission.

    Request Parameters:
        - `page` (int): Page number. Example: `1`
        - `campaign` (int): Campaign filter. Example: `42`
        - `activity` (str): Activity type filter. Example: `"transcribe"`
        - `status` (list[str]): Asset statuses. Example: `["completed"]`
        - `start` (str): Start date in YYYY-MM-DD format. Example: `"2023-01-01"`
        - `end` (str): End date in YYYY-MM-DD format. Example: `"2023-12-31"`
        - `order_by` (str): Sort field. Example: `"date-descending"`. When any
          filter parameter is present and `order_by` is omitted, the context
          reports `"date-descending"`.
        - `tab` (str): Selected tab. Example: `"account"`
    """

    template_name: str = "account/profile.html"
    form_class: Type[Form] = UserProfileForm
    success_url = reverse_lazy("user-profile")
    reconfirmation_email_body_template: str = "emails/email_reconfirmation_body.txt"
    reconfirmation_email_subject_template: str = (
        "emails/email_reconfirmation_subject.txt"
    )

    # This view will list the assets which the user has contributed to
    # along with their most recent action on each asset. This will be
    # presented in the template as a standard paginated list of Asset
    # instances with annotations
    allow_empty: bool = True
    paginate_by: int = 30

    def post(self, request: HttpRequest, *args: Any, **kwargs: Any) -> HttpResponse:
        """
        Handle a name update or delegate to the email form processing.

        When the POST data contains `submit_name`, the data is bound to a
        `UserNameForm`; a valid form updates the user's first and last name.
        The response is a redirect to the profile page whether or not the
        name form validated. Any other POST is handled by the parent class,
        which processes the email form (`form_class`).

        Args:
            request (HttpRequest): The incoming POST request.

        Returns:
            response (HttpResponse): A redirect to `user-profile` for name
                submissions, otherwise the parent's response.
        """
        structured_logger.debug(
            "Profile POST received.",
            event_code="profile_post_entry",
            user=request.user,
        )
        # The list-view context needs `object_list`, which is otherwise only
        # populated on GET.
        self.object_list = self.get_queryset()
        if "submit_name" in request.POST:
            form = UserNameForm(request.POST)
            if form.is_valid():
                user = ConcordiaUser.objects.get(id=request.user.id)
                user.first_name = form.cleaned_data["first_name"]
                user.last_name = form.cleaned_data["last_name"]
                user.save()
                structured_logger.debug(
                    "Updated profile name.",
                    event_code="profile_name_updated",
                    user=request.user,
                )
            return redirect("user-profile")
        else:
            return super().post(request, *args, **kwargs)

    def get_queryset(self) -> Any:
        """
        Return the assets to list, as produced by `_get_pages` for this request.
        """
        structured_logger.debug(
            "Fetching pages for profile.",
            event_code="profile_get_queryset",
            user=self.request.user,
        )
        return _get_pages(self.request)

    def get_context_data(self, *args: Any, **kwargs: Any) -> dict[str, Any]:
        """
        Build the template context for the profile page.

        Adds the active tab, the echoed filter parameters, the one-shot
        `valid` flag popped from the session, the user's per-campaign
        activity rows with their aggregate totals, any unconfirmed email
        address and an unbound `UserNameForm`.

        Returns:
            ctx (dict[str, Any]): The parent context extended as described.
        """
        ctx = super().get_context_data(*args, **kwargs)

        page = self.request.GET.get("page", None)
        campaign = self.request.GET.get("campaign", None)
        activity = self.request.GET.get("activity", None)
        status_list = self.request.GET.getlist("status")
        start = self.request.GET.get("start", None)
        end = self.request.GET.get("end", None)
        order_by = self.request.GET.get("order_by", None)

        # Any filter or paging parameter means the user is working with the
        # "recent" tab.
        filters_active = any(
            [activity, campaign, page, status_list, start, end, order_by]
        )
        if filters_active:
            ctx["active_tab"] = "recent"
            if status_list:
                ctx["status_list"] = status_list
        elif "active_tab" not in ctx:
            ctx["active_tab"] = self.request.GET.get("tab", "contributions")
        ctx["activity"] = activity
        if end is not None:
            ctx["end"] = end
        # Previously the "date-descending" default assigned for the filtered
        # case was unconditionally overwritten with the raw (possibly None)
        # query value, so the default never reached the template.
        if filters_active and order_by is None:
            ctx["order_by"] = "date-descending"
        else:
            ctx["order_by"] = order_by
        if start is not None:
            ctx["start"] = start

        # One-shot flag written by form_valid / form_invalid.
        ctx["valid"] = self.request.session.pop("valid", None)

        user = self.request.user
        concordia_user = ConcordiaUser.objects.get(id=user.id)
        user_profile_activity = UserProfileActivity.objects.filter(user=user).order_by(
            "campaign__title"
        )
        ctx["user_profile_activity"] = user_profile_activity

        aggregate_sums = user_profile_activity.aggregate(
            Sum("review_count"), Sum("transcribe_count"), Sum("asset_count")
        )
        ctx["totalReviews"] = aggregate_sums["review_count__sum"]
        ctx["totalTranscriptions"] = aggregate_sums["transcribe_count__sum"]
        ctx["pages_worked_on"] = aggregate_sums["asset_count__sum"]
        # The sums are None when the user has no activity rows; in that case
        # no combined total is provided.
        if ctx["totalReviews"] is not None:
            ctx["totalCount"] = ctx["totalReviews"] + ctx["totalTranscriptions"]
        ctx["unconfirmed_email"] = concordia_user.get_email_for_reconfirmation()
        ctx["name_form"] = UserNameForm()
        structured_logger.debug(
            "Profile context ready.",
            event_code="profile_context_ready",
            user=self.request.user,
            total_reviews=ctx["totalReviews"],
            total_transcriptions=ctx["totalTranscriptions"],
            pages_worked=ctx["pages_worked_on"],
        )
        return ctx

    def get_initial(self) -> dict[str, Any]:
        """
        Pre-populate the email form with the user's current email address.
        """
        initial = super().get_initial()
        initial["email"] = self.request.user.email
        return initial

    def get_form_kwargs(self) -> dict[str, Any]:
        """
        Pass the current request to the form in addition to the default kwargs.
        """
        # We'll expose the request object to the form so we can validate that an
        # email is not in use:
        kwargs = super().get_form_kwargs()
        kwargs["request"] = self.request
        return kwargs

    def form_valid(self, form: Form) -> HttpResponse:
        """
        Apply a validated email change.

        With `settings.REQUIRE_EMAIL_RECONFIRMATION` enabled, the new address
        is stored for reconfirmation and a confirmation email is sent.
        Otherwise the address is written to the user immediately and any
        pending reconfirmation address is deleted. In both cases the session
        flag `valid` is set to `True`.

        Args:
            form (Form): The validated email form.

        Returns:
            response (HttpResponse): The parent's success redirect.
        """
        user = self.request.user
        new_email = form.cleaned_data["email"]
        structured_logger.info(
            "Profile email update submitted.",
            event_code="profile_email_update",
            user=user,
            require_reconfirm=settings.REQUIRE_EMAIL_RECONFIRMATION,
        )
        # This is annoying, but there's no better way to get the proxy model here
        # without being hacky (changing user.__class__ directly.)
        # Every method (such as using a user profile) would incur the same
        # database request.
        concordia_user = ConcordiaUser.objects.get(id=user.id)
        if settings.REQUIRE_EMAIL_RECONFIRMATION:
            concordia_user.set_email_for_reconfirmation(new_email)
            structured_logger.debug(
                "Email set for reconfirmation.",
                event_code="email_reconfirm_set",
                user=user,
                new_email=new_email,
            )
            self.send_reconfirmation_email(concordia_user)
        else:
            concordia_user.email = new_email
            concordia_user.full_clean()
            concordia_user.save()
            concordia_user.delete_email_for_reconfirmation()
            structured_logger.debug(
                "Email updated without reconfirmation.",
                event_code="email_updated_no_reconfirm",
                user=user,
                new_email=new_email,
            )

        self.request.session["valid"] = True

        return super().form_valid(form)

    def form_invalid(self, form: Form) -> HttpResponse:
        """
        Re-render the profile page on the account tab with the form's errors.

        Also sets the session flag `valid` to `False`.
        """
        structured_logger.debug(
            "Profile form invalid.",
            event_code="profile_form_invalid",
            user=self.request.user,
        )
        self.request.session["valid"] = False
        return self.render_to_response(
            self.get_context_data(form=form, active_tab="account")
        )

    def get_success_url(self) -> str:
        """
        Return the success URL with the `#account` fragment appended.
        """
        # automatically open the Account Settings tab
        return "{}#account".format(super().get_success_url())

    def get_reconfirmation_email_context(self, confirmation_key: str) -> dict[str, Any]:
        """
        Build the template context shared by the reconfirmation email templates.

        Args:
            confirmation_key (str): The key to embed in the email.

        Returns:
            context (dict[str, Any]): The key, the expiration period from
                `settings.EMAIL_RECONFIRMATION_DAYS` and the current site.
        """
        return {
            "confirmation_key": confirmation_key,
            "expiration_days": settings.EMAIL_RECONFIRMATION_DAYS,
            "site": get_current_site(self.request),
        }

    def send_reconfirmation_email(self, user: ConcordiaUser) -> None:
        """
        Send the reconfirmation email to the user's pending email address.

        The subject and body are rendered from the configured templates. An
        `SMTPException` during sending is logged and reported to the user via
        the messages framework instead of being propagated.

        Args:
            user (ConcordiaUser): The user whose pending address should
                receive the email.
        """
        confirmation_key = user.get_email_reconfirmation_key()
        context = self.get_reconfirmation_email_context(confirmation_key)
        context["user"] = user
        subject = render_to_string(
            template_name=self.reconfirmation_email_subject_template,
            context=context,
            request=self.request,
        )
        # Ensure subject is a single line
        subject = "".join(subject.splitlines())
        message = render_to_string(
            template_name=self.reconfirmation_email_body_template,
            context=context,
            request=self.request,
        )
        try:
            structured_logger.info(
                "Sending reconfirmation email.",
                event_code="email_reconfirm_send_start",
                user=user,
                email=user.get_email_for_reconfirmation(),
            )
            send_mail(
                subject,
                message=message,
                from_email=settings.DEFAULT_FROM_EMAIL,
                recipient_list=[user.get_email_for_reconfirmation()],
            )
            structured_logger.debug(
                "Reconfirmation email sent.",
                event_code="email_reconfirm_send_success",
                user=user,
                email=user.get_email_for_reconfirmation(),
            )
        except SMTPException:
            logger.exception(
                "Unable to send email reconfirmation to %s",
                user.get_email_for_reconfirmation(),
            )
            structured_logger.exception(
                "Reconfirmation email send failed.",
                event_code="email_reconfirm_send_failed",
                reason="SMTPException",
                reason_code="smtp_error",
                user=user,
                email=user.get_email_for_reconfirmation(),
            )
            messages.error(
                self.request,
                _("Email confirmation could not be sent."),
            )


@method_decorator(never_cache, name="dispatch")
class AccountDeletionView(LoginRequiredMixin, FormView):
    """
    Let an authenticated user delete their own account.

    Extends:
        - [LoginRequiredMixin](https://docs.djangoproject.com/en/stable/topics/auth/default/#the-loginrequiredmixin-mixin)
        - [FormView](https://docs.djangoproject.com/en/stable/ref/class-based-views/generic-editing/#formview)

    Presents a confirmation form. Once it validates, the account is either
    anonymized (when the user has at least one transcription) or deleted
    outright. A notification email is then sent to the address the account
    had before the change, and the user is logged out.

    Attributes:
        template_name (str): Template used to render the confirmation form.
            Example: `"account/account_deletion.html"`
        form_class (Form): Form used to confirm account deletion.
            Example: `AccountDeletionForm`
        success_url (str): URL to redirect to after deletion; the reversed
            `homepage` route.
        email_body_template (str): Template for the body of the notification
            email. Example: `"emails/delete_account_body.txt"`
        email_subject_template (str): Template for the subject of the
            notification email. Example: `"emails/delete_account_subject.txt"`

    Returns:
        response (HttpResponse): A redirect to `success_url` after deletion,
            or the re-rendered form with errors if validation fails.

    Return Behavior:
        - Form valid, user has transcriptions: the account is anonymized and
          deactivated, then the user is logged out.
        - Form valid, user has no transcriptions: the account row is deleted,
          then the user is logged out.
        - Form invalid: the confirmation form is re-rendered with errors.
    """

    template_name: str = "account/account_deletion.html"
    form_class: Type[Form] = AccountDeletionForm
    success_url: str = reverse_lazy("homepage")
    email_body_template: str = "emails/delete_account_body.txt"
    email_subject_template: str = "emails/delete_account_subject.txt"

    def get_form_kwargs(self) -> dict[str, Any]:
        """
        Pass the current request to the form in addition to the default kwargs.
        """
        # The form carries the request so that form_valid can reach the user
        # (and the session to log out of) through it.
        form_kwargs = super().get_form_kwargs()
        form_kwargs["request"] = self.request
        return form_kwargs

    def form_valid(self, form: Form) -> HttpResponse:
        """
        Delete or anonymize the confirming user, then redirect.

        Args:
            form (Form): The validated confirmation form; its `request`
                attribute supplies the user.

        Returns:
            response (HttpResponse): The parent's success redirect.
        """
        structured_logger.info(
            "Account deletion confirmed.",
            event_code="account_delete_confirmed",
            user=form.request.user,
        )
        self.delete_user(form.request.user, form.request)
        return super().form_valid(form)

    def delete_user(self, user: ConcordiaUser, request: HttpRequest) -> None:
        """
        Remove or anonymize `user`, notify them by email and log them out.

        Args:
            user (ConcordiaUser): The account to remove.
            request (HttpRequest): The request whose session is logged out.
        """
        logger.info("Deletion request for %s", user)
        structured_logger.info(
            "Processing account deletion.",
            event_code="account_delete_start",
            user=user,
        )
        # Remember the address now; anonymizing blanks it out below.
        notification_address = user.email

        if not user.transcription_set.exists():
            logger.info("Deleting %s", user)
            structured_logger.info(
                "Deleting user account.",
                event_code="account_delete",
                user=user,
            )
            user.delete()
        else:
            # The account row is kept but stripped of identifying data,
            # privileges and the ability to log in.
            logger.info("Anonymizing %s", user)
            structured_logger.info(
                "Anonymizing user account.",
                event_code="account_anonymize",
                user=user,
            )
            user.username = "Anonymized %s" % uuid.uuid4()
            user.first_name = ""
            user.last_name = ""
            user.email = ""
            user.set_unusable_password()
            user.is_staff = False
            user.is_superuser = False
            user.is_active = False
            user.save()

        self.send_deletion_email(notification_address)
        logout(request)
        structured_logger.info(
            "Account deletion complete.",
            event_code="account_delete_complete",
            user=user,
        )

    def send_deletion_email(self, email: str) -> None:
        """
        Send the account deletion notification to `email`.

        The subject and body are rendered from the configured templates with
        an empty context. An `SMTPException` during sending is logged and
        reported through the messages framework instead of being propagated.

        Args:
            email (str): The recipient address.
        """
        template_context = {}
        rendered_subject = render_to_string(
            template_name=self.email_subject_template,
            context=template_context,
            request=self.request,
        )
        # Collapse the rendered subject onto a single line.
        subject_line = "".join(rendered_subject.splitlines())
        body = render_to_string(
            template_name=self.email_body_template,
            context=template_context,
            request=self.request,
        )
        try:
            structured_logger.info(
                "Sending deletion email.",
                event_code="account_delete_email_send_start",
                user=self.request.user,
                email=email,
            )
            send_mail(
                subject_line,
                message=body,
                from_email=settings.DEFAULT_FROM_EMAIL,
                recipient_list=[email],
            )
            structured_logger.debug(
                "Deletion email sent.",
                event_code="account_delete_email_send_success",
                user=self.request.user,
                email=email,
            )
        except SMTPException:
            logger.exception(
                "Unable to send account deletion email to %s",
                email,
            )
            structured_logger.exception(
                "Deletion email send failed.",
                event_code="account_delete_email_send_failed",
                reason="SMTPException",
                reason_code="smtp_error",
                user=self.request.user,
                email=email,
            )
            messages.error(
                self.request,
                _("Email confirmation of deletion could not be sent."),
            )


class EmailReconfirmationView(TemplateView):
    """
    Apply a pending email change when the user follows a signed link.

    Extends:
        - [TemplateView](https://docs.djangoproject.com/en/stable/ref/class-based-views/base/#templateview)

    The `confirmation_key` URL argument is a signed payload holding a username
    and an email address. The key must verify and be no older than
    `settings.EMAIL_RECONFIRMATION_TIMEOUT`, the user must exist, the address
    must pass the user's `validate_reconfirmation_email` check and the updated
    user must pass `full_clean()`. When all of that holds, the address is saved
    and the pending reconfirmation entry is removed.

    Attributes:
        template_name (str): Template rendered when confirmation fails.
        success_url (str): Profile URL; `#account` is appended on redirect.
        BAD_USERNAME_MESSAGE (str): Error used when no such user exists.
        BAD_EMAIL_MESSAGE (str): Error used when the email is rejected.
        EXPIRED_MESSAGE (str): Error used when the key is too old.
        INVALID_KEY_MESSAGE (str): Error used when the signature is invalid.

    Returns:
        response (HttpResponse): A redirect to the profile page on success, or
            the failure template rendered with HTTP status 403 and a
            `reconfirmation_error` context entry (`message`, `code`,
            `params`).

    Request Parameters:
        confirmation_key (str): The signed token taken from the URL.
    """

    success_url = reverse_lazy("user-profile")
    template_name = "account/email_reconfirmation_failed.html"

    BAD_USERNAME_MESSAGE: str = _("The account you attempted to confirm is invalid.")
    BAD_EMAIL_MESSAGE: str = _("The email you attempted to confirm is invalid.")
    EXPIRED_MESSAGE: str = _(
        "The confirmation key you provided is expired. Email confirmation links "
        "expire after 7 days. If your key is expired, you will need to re-enter "
        "your new email address"
    )
    INVALID_KEY_MESSAGE: str = _(
        "The confirmation key you provided is invalid. Email confirmation links "
        "expire after 7 days. If your key is expired, you will need to re-enter "
        "your new email address."
    )

    def get_success_url(self) -> str:
        """Return the success URL with the `#account` fragment appended."""
        return f"{self.success_url}#account"

    def get(self, *args: Any, **kwargs: Any) -> HttpResponse:
        """
        Run the confirmation and translate its outcome into a response.

        A `ValidationError` raised by `confirm` renders the failure template
        with status 403; otherwise the user is redirected to the success URL.
        """
        try:
            structured_logger.debug(
                "Email reconfirmation GET received.",
                event_code="email_reconfirm_entry",
            )
            self.confirm(*args, **kwargs)
        except ValidationError as error:
            structured_logger.warning(
                "Email reconfirmation failed.",
                event_code="email_reconfirm_failed",
                reason=str(error.message),
                reason_code=str(error.code),
            )
            error_details = {
                "message": error.message,
                "code": error.code,
                "params": error.params,
            }
            failure_context = self.get_context_data()
            failure_context["reconfirmation_error"] = error_details
            return self.render_to_response(failure_context, status=403)

        structured_logger.debug(
            "Email reconfirmation ok.",
            event_code="email_reconfirm_success",
        )
        return HttpResponseRedirect(self.get_success_url())

    def confirm(self, *args: Any, **kwargs: Any) -> ConcordiaUser:
        """
        Validate the key from `kwargs` and store the new email on the user.

        Returns:
            ConcordiaUser: The user whose email address was updated.

        Raises:
            ValidationError: If the key, the user or the email is rejected.
        """
        signed_key = kwargs.get("confirmation_key")
        username, new_email = self.validate_key(signed_key)
        account = self.get_user(username)

        if not account.validate_reconfirmation_email(new_email):
            raise ValidationError(self.BAD_EMAIL_MESSAGE, code="bad_email") from None

        try:
            account.email = new_email
            account.full_clean()
        except ValidationError:
            # Report any model validation failure as a bad email address.
            raise ValidationError(self.BAD_EMAIL_MESSAGE, code="bad_email") from None

        account.save()
        account.delete_email_for_reconfirmation()
        structured_logger.info(
            "Email reconfirmed and applied.",
            event_code="email_reconfirm_applied",
            user=account,
            new_email=new_email,
        )
        return account

    def validate_key(self, confirmation_key: str) -> tuple[str, str]:
        """
        Verify the signed key and return the `(username, email)` it carries.

        Raises:
            ValidationError: With code `expired` when the signature is too
                old, or `invalid_key` when the signature does not verify.
        """
        try:
            payload = signing.loads(
                confirmation_key, max_age=settings.EMAIL_RECONFIRMATION_TIMEOUT
            )
        except signing.SignatureExpired as exc:
            # Checked first: SignatureExpired is a subclass of BadSignature.
            raise ValidationError(self.EXPIRED_MESSAGE, code="expired") from exc
        except signing.BadSignature as exc:
            raise ValidationError(
                self.INVALID_KEY_MESSAGE,
                code="invalid_key",
                params={"confirmation_key": confirmation_key},
            ) from exc
        return payload["username"], payload["email"]

    def get_user(self, username: str) -> ConcordiaUser:
        """
        Look up the user named in the confirmation key.

        Raises:
            ValidationError: With code `bad_username` when no user matches.
        """
        try:
            account = ConcordiaUser.objects.get(username=username)
            structured_logger.debug(
                "Loaded user for reconfirmation.",
                event_code="email_reconfirm_user_loaded",
                user=account,
            )
            return account
        except ConcordiaUser.DoesNotExist as exc:
            structured_logger.warning(
                "User not found for reconfirmation.",
                event_code="email_reconfirm_user_missing",
                reason="User does not exist",
                reason_code="user_missing",
            )
            raise ValidationError(
                self.BAD_USERNAME_MESSAGE, code="bad_username"
            ) from exc


================================================
FILE: concordia/views/ajax.py
================================================
import logging
import re
from time import time
from typing import Union

from django.conf import settings
from django.contrib.auth.decorators import login_required
from django.contrib.messages import get_messages
from django.core.exceptions import ValidationError
from django.db import connection
from django.db.transaction import atomic
from django.http import HttpRequest, HttpResponse, JsonResponse
from django.shortcuts import get_object_or_404
from django.urls import reverse
from django.utils.timezone import now
from django.views.decorators.cache import cache_control, never_cache
from django.views.decorators.csrf import csrf_exempt
from django.views.decorators.http import require_POST
from django_ratelimit.decorators import ratelimit

from concordia.exceptions import RateLimitExceededError
from concordia.logging import ConcordiaLogger
from concordia.models import (
    Asset,
    AssetTranscriptionReservation,
    ConcordiaUser,
    Tag,
    Transcription,
    UserAssetTagCollection,
)
from concordia.signals.signals import (
    reservation_obtained,
    reservation_released,
)
from concordia.utils import (
    get_anonymous_user,
    get_or_create_reservation_token,
)
from concordia.utils.constants import MESSAGE_LEVEL_NAMES, URL_REGEX
from configuration.utils import configuration_value
from exporter.utils import remove_unacceptable_characters

from .decorators import reserve_rate, validate_anonymous_user

# Standard-library logger used for this module's plain-text log lines.
logger = logging.getLogger(__name__)
# Project logger used for the `event_code`-tagged entries emitted by the views
# in this module.
structured_logger = ConcordiaLogger.get_logger(__name__)


@cache_control(private=True, max_age=settings.DEFAULT_PAGE_TTL)
@csrf_exempt
def ajax_session_status(request: HttpRequest) -> JsonResponse:
    """
    Describe the current session as JSON for the page header.

    Anonymous users receive an empty object. Authenticated users receive a
    truncated username plus navigation entries for the profile page, the
    admin area (staff or superusers only) and logout, in that order.

    Args:
        request (HttpRequest): The request whose session is being described.

    Returns:
        response (JsonResponse): Session details, or `{}` for anonymous users.

    Response Format - Success:
        - `username` (str): The first 15 characters of the user's username.
        - `links` (list[dict]): Navigation entries for the user.
            - `title` (str): Label for the entry (e.g., "Profile", "Logout").
            - `type` (str): `"link"` for plain links, `"post"` for logout.
            - `url` (str): The absolute URL for the entry.
            - `fields` (dict): Only on the logout entry; `{"next": "/"}`.

    Example:
        ```json
        // If the user is authenticated:
        {
            "username": "johndoe",
            "links": [
                {
                    "title": "Profile",
                    "type": "link",
                    "url": "https://example.com/accounts/profile/"
                },
                {
                    "title": "Logout",
                    "type": "post",
                    "url": "https://example.com/accounts/logout/",
                    "fields": {"next": "/"}
                }
            ]
        }

        // If the user is anonymous:
        {}
        ```
    """
    user = request.user
    if user.is_anonymous:
        return JsonResponse({})

    def absolute_url(url_name):
        # Resolve a named route to an absolute URL for this request's host.
        return request.build_absolute_uri(reverse(url_name))

    links = [
        {"title": "Profile", "type": "link", "url": absolute_url("user-profile")}
    ]
    if user.is_superuser or user.is_staff:
        links.append(
            {"title": "Admin Area", "type": "link", "url": absolute_url("admin:index")}
        )
    links.append(
        {
            "title": "Logout",
            "type": "post",
            "url": absolute_url("logout"),
            "fields": {"next": "/"},
        }
    )

    return JsonResponse({"username": user.username[:15], "links": links})


@never_cache
@login_required
@csrf_exempt
def ajax_messages(request: HttpRequest) -> JsonResponse:
    """
    Return the messages queued for the current request as JSON.

    Each message from Django's messages framework is reported with its text
    and the level name looked up in `MESSAGE_LEVEL_NAMES`.

    Requires the user to be authenticated.

    Args:
        request (HttpRequest): The request from the authenticated user.

    Returns:
        response (JsonResponse): A dictionary with a single `messages` list.

    Response Format - Success:
        - `messages` (list[dict]): The user-visible messages.
            - `level` (str): The severity level name of the message
              (e.g., "info", "warning", "error").
            - `message` (str): The text content of the message.

    Example:
        ```json
        {
            "messages": [
                {"level": "info", "message": "You have been logged out."},
                {"level": "warning", "message": "Your session is about to expire."}
            ]
        }
        ```
    """
    queued = []
    for entry in get_messages(request):
        queued.append(
            {"level": MESSAGE_LEVEL_NAMES[entry.level], "message": entry.message}
        )
    return JsonResponse({"messages": queued})


def get_transcription_superseded(
    asset: Asset, supersedes_pk: Union[int, str, None]
) -> Union[Transcription, JsonResponse, None]:
    """
    Resolve which transcription, if any, a new transcription will supersede.

    Without a `supersedes_pk`, the asset must not already have a transcription
    whose `supersedes` is empty. With a `supersedes_pk`, the referenced
    transcription must belong to the asset and must not already be superseded
    by another transcription.

    Callers must check the result type: an error is returned as a ready-made
    `JsonResponse` rather than raised.

    Args:
        asset (Asset): The asset the new transcription belongs to.
        supersedes_pk (int or str or None): Primary key of the transcription
            being superseded, or a falsy value when there is none.

    Returns:
        response (Transcription or JsonResponse or None):
            - `Transcription`: the transcription to supersede.
            - `JsonResponse`: an error to hand straight back to the client.
            - `None`: nothing to supersede and no conflict.

    Response Format - Error:
        - `error` (str): Explanation of why the transcription cannot be created.
            - "An open transcription already exists" (409)
            - "This transcription has been superseded" (409)
            - "Invalid supersedes value" (400)

    Example:
        ```json
        {
            "error": "An open transcription already exists"
        }
        ```
    """

    def reject(log_message, reason, reason_code, error, status, **log_fields):
        # Log the failed check and build the matching JSON error response.
        structured_logger.warning(
            log_message,
            event_code="transcription_supersede_check_failed",
            reason=reason,
            reason_code=reason_code,
            asset=asset,
            **log_fields,
        )
        return JsonResponse({"error": error}, status=status)

    structured_logger.info(
        "Checking for superseded transcription.",
        event_code="transcription_supersede_check_start",
        asset=asset,
        supersedes_pk=supersedes_pk,
    )

    if not supersedes_pk:
        # No predecessor named: only a conflict with an existing open
        # transcription can make this fail.
        if asset.transcription_set.filter(supersedes=None).exists():
            return reject(
                "Open transcription already exists for asset.",
                "An open transcription already exists",
                "already_exists",
                "An open transcription already exists",
                409,
            )
        return None

    try:
        if asset.transcription_set.filter(supersedes=supersedes_pk).exists():
            return reject(
                "Transcription already superseded.",
                "This transcription has been superseded",
                "already_superseded",
                "This transcription has been superseded",
                409,
                supersedes_pk=supersedes_pk,
            )

        try:
            previous = asset.transcription_set.get(pk=supersedes_pk)
        except Transcription.DoesNotExist:
            return reject(
                "Supersedes transcription not found.",
                "Invalid supersedes value",
                "not_found",
                "Invalid supersedes value",
                400,
                supersedes_pk=supersedes_pk,
            )
    except ValueError:
        # A ValueError from the lookups above is treated as a malformed key.
        return reject(
            "Invalid supersedes value (non-integer).",
            "Supersedes value must be an integer",
            "invalid_pk_format",
            "Invalid supersedes value",
            400,
            supersedes_pk=supersedes_pk,
        )

    structured_logger.info(
        "Superseded transcription found.",
        event_code="transcription_supersede_check_success",
        asset=asset,
        supersedes_pk=supersedes_pk,
    )
    return previous


@require_POST
@login_required
@atomic
@ratelimit(key="header:cf-connecting-ip", rate="1/m", block=settings.RATELIMIT_BLOCK)
def generate_ocr_transcription(
    request: HttpRequest, *, asset_pk: Union[int, str]
) -> JsonResponse:
    """
    Replace an asset's current transcription with OCR-generated text.

    The OCR transcription always supersedes something: either the
    transcription named by `supersedes`, or, when the asset has none yet, an
    empty transcription created here and attributed to the anonymous user.

    Requires the user to be authenticated. Runs in a database transaction.

    Args:
        request (HttpRequest): The POST request asking for OCR.
        asset_pk (int or str): The primary key of the asset to run OCR on.

    Request Parameters:
        - `supersedes` (int or str, optional): The ID of the transcription being
          superseded.
        - `language` (str, optional): Passed to `asset.get_ocr_transcript`.

    Returns:
        response (JsonResponse): The new transcription and asset status with
            HTTP status 201, or the error response produced by
            `get_transcription_superseded`.

    Response Format - Success:
        - `id` (int): ID of the new transcription.
        - `sent` (float): UNIX timestamp of the response.
        - `submissionUrl` (str): URL to submit the transcription.
        - `text` (str): The OCR-generated transcription content.
        - `asset` (dict):
            - `id` (int): ID of the associated asset.
            - `status` (str): Current transcription status.
            - `contributors` (int): Number of users who have contributed.
        - `undo_available` (bool): Whether the transcription can be rolled back.
        - `redo_available` (bool): Whether a rollforward is possible.

    Example:
        ```json
        {
            "id": 123,
            "sent": 1716294920.927134,
            "submissionUrl": "/transcriptions/123/submit/",
            "text": "Detected OCR content...",
            "asset": {
                "id": 456,
                "status": "in_progress",
                "contributors": 2
            },
            "undo_available": true,
            "redo_available": false
        }
        ```
    """
    asset = get_object_or_404(Asset, pk=asset_pk)
    user = request.user

    supersedes_pk = request.POST.get("supersedes")
    language = request.POST.get("language", None)
    structured_logger.info(
        "Starting OCR transcription generation.",
        event_code="ocr_generation_start",
        user=user,
        asset=asset,
        supersedes_pk=supersedes_pk,
        language=language,
    )

    superseded = get_transcription_superseded(asset, supersedes_pk)

    if superseded and isinstance(superseded, HttpResponse):
        # The helper returned an error response (for example, the target has
        # already been superseded), so skip OCR and pass the error back.
        structured_logger.warning(
            "OCR generation aborted: superseded transcription is invalid.",
            event_code="ocr_generation_aborted",
            reason="Superseded transcription is invalid",
            reason_code="superseded_invalid",
            user=user,
            asset=asset,
        )
        return superseded

    if not superseded:
        # This is the first transcription on this asset. To make the OCR
        # transcription undoable, create an empty transcription for it to
        # supersede.
        structured_logger.info(
            "No existing transcription; creating empty one for OCR supersession.",
            event_code="ocr_blank_supersede",
            user=user,
            asset=asset,
        )
        superseded = Transcription(asset=asset, user=get_anonymous_user(), text="")
        superseded.full_clean()
        superseded.save()
        structured_logger.info(
            "Blank superseded transcription created for OCR.",
            event_code="ocr_blank_transcription_created",
            user=user,
            transcription=superseded,
        )

    ocr_text = asset.get_ocr_transcript(language)
    transcription = Transcription(
        asset=asset,
        user=user,
        supersedes=superseded,
        text=ocr_text,
        ocr_generated=True,
        ocr_originated=True,
    )
    transcription.full_clean()
    transcription.save()

    structured_logger.info(
        "OCR transcription successfully created.",
        event_code="ocr_generation_success",
        user=user,
        transcription=transcription,
    )

    payload = {
        "id": transcription.pk,
        "sent": time(),
        "submissionUrl": reverse("submit-transcription", args=(transcription.pk,)),
        "text": transcription.text,
        "asset": {
            "id": transcription.asset.id,
            "status": transcription.asset.transcription_status,
            "contributors": transcription.asset.get_contributor_count(),
        },
        "undo_available": asset.can_rollback()[0],
        "redo_available": asset.can_rollforward()[0],
    }
    return JsonResponse(payload, status=201)


@require_POST
@validate_anonymous_user
@atomic
@ratelimit(key="header:cf-connecting-ip", rate="1/m", block=settings.RATELIMIT_BLOCK)
def rollback_transcription(
    request: HttpRequest, *, asset_pk: Union[int, str]
) -> JsonResponse:
    """
    Undo the latest transcription change on an asset.

    Delegates to `asset.rollback_transcription`, acting as the anonymous user
    when the requester is not logged in. A `ValueError` from that call is
    reported to the client as a 400 error.

    Anonymous callers must pass the `validate_anonymous_user` check.

    Args:
        request (HttpRequest): The POST request to initiate rollback.
        asset_pk (int or str): The primary key of the asset being rolled back.

    Returns:
        response (JsonResponse): The resulting transcription and asset status
            with HTTP status 201, or an error response with status 400.

    Response Format - Success:
        - `id` (int): ID of the resulting transcription.
        - `sent` (float): UNIX timestamp of the response.
        - `submissionUrl` (str): URL to submit the transcription.
        - `text` (str): The resulting transcription text.
        - `asset` (dict):
            - `id` (int): ID of the asset.
            - `status` (str): Current transcription status.
            - `contributors` (int): Number of users who contributed.
        - `message` (str): Confirmation message.
        - `undo_available` (bool): Whether rollback is possible again.
        - `redo_available` (bool): Whether rollforward is now available.

    Response Format - Error:
        - `error` (str): Explanation of the failure.
            - "No previous transcription available"

    Example:
        ```json
        {
            "id": 123,
            "sent": 1716295121.113204,
            "submissionUrl": "/transcriptions/123/submit/",
            "text": "Previous transcription text",
            "asset": {
                "id": 456,
                "status": "in_progress",
                "contributors": 1
            },
            "message": "Successfully rolled back transcription to previous version",
            "undo_available": false,
            "redo_available": true
        }
        ```
    """
    asset = get_object_or_404(Asset, pk=asset_pk)

    # Anonymous requests act on behalf of the shared anonymous account.
    user = get_anonymous_user() if request.user.is_anonymous else request.user

    try:
        transcription = asset.rollback_transcription(user)
    except ValueError as error:
        logger.exception(
            "No previous transcription available for rollback", exc_info=error
        )
        structured_logger.warning(
            "Rollback failed: no previous transcription to revert to.",
            event_code="rollback_failed",
            reason_code="no_valid_target",
            reason=str(error),
            asset=asset,
            user=user,
        )
        return JsonResponse(
            {"error": "No previous transcription available"}, status=400
        )

    structured_logger.info(
        "Rollback successfully performed.",
        event_code="rollback_success",
        user=user,
        transcription=transcription,
    )

    payload = {
        "id": transcription.pk,
        "sent": time(),
        "submissionUrl": reverse("submit-transcription", args=(transcription.pk,)),
        "text": transcription.text,
        "asset": {
            "id": transcription.asset.id,
            "status": transcription.asset.transcription_status,
            "contributors": transcription.asset.get_contributor_count(),
        },
        "message": "Successfully rolled back transcription to previous version",
        "undo_available": transcription.asset.can_rollback()[0],
        "redo_available": transcription.asset.can_rollforward()[0],
    }
    return JsonResponse(payload, status=201)


@require_POST
@validate_anonymous_user
@atomic
@ratelimit(key="header:cf-connecting-ip", rate="1/m", block=settings.RATELIMIT_BLOCK)
def rollforward_transcription(
    request: HttpRequest, *, asset_pk: Union[int, str]
) -> JsonResponse:
    """
    Redo a transcription change that was previously rolled back.

    Delegates to `asset.rollforward_transcription`, acting as the anonymous
    user when the requester is not logged in. A `ValueError` from that call is
    reported to the client as a 400 error.

    Anonymous callers must pass the `validate_anonymous_user` check.

    Args:
        request (HttpRequest): The POST request to initiate rollforward.
        asset_pk (int or str): The primary key of the asset being rolled forward.

    Returns:
        response (JsonResponse): The resulting transcription and asset status
            with HTTP status 201, or an error response with status 400.

    Response Format - Success:
        - `id` (int): ID of the resulting transcription.
        - `sent` (float): UNIX timestamp of the response.
        - `submissionUrl` (str): URL to submit the transcription.
        - `text` (str): The resulting transcription text.
        - `asset` (dict):
            - `id` (int): ID of the asset.
            - `status` (str): Current transcription status.
            - `contributors` (int): Number of users who contributed.
        - `message` (str): Confirmation message.
        - `undo_available` (bool): Whether rollback is now possible.
        - `redo_available` (bool): Whether another rollforward is possible.

    Response Format - Error:
        - `error` (str): Explanation of the failure.
            - "No transcription to restore"

    Example:
        ```json
        {
            "id": 124,
            "sent": 1716295243.029184,
            "submissionUrl": "/transcriptions/124/submit/",
            "text": "Next transcription text",
            "asset": {
                "id": 456,
                "status": "in_progress",
                "contributors": 1
            },
            "message": "Successfully restored transcription to next version",
            "undo_available": true,
            "redo_available": false
        }
        ```
    """
    asset = get_object_or_404(Asset, pk=asset_pk)

    # Anonymous requests act on behalf of the shared anonymous account.
    user = get_anonymous_user() if request.user.is_anonymous else request.user

    try:
        transcription = asset.rollforward_transcription(user)
    except ValueError as error:
        logger.exception("No transcription available for rollforward", exc_info=error)
        structured_logger.warning(
            "Rollforward failed: no transcription available to restore.",
            event_code="rollforward_failed",
            reason_code="no_valid_target",
            reason=str(error),
            asset=asset,
            user=user,
        )
        return JsonResponse({"error": "No transcription to restore"}, status=400)

    structured_logger.info(
        "Rollforward successfully performed.",
        event_code="rollforward_success",
        user=user,
        transcription=transcription,
    )

    payload = {
        "id": transcription.pk,
        "sent": time(),
        "submissionUrl": reverse("submit-transcription", args=(transcription.pk,)),
        "text": transcription.text,
        "asset": {
            "id": transcription.asset.id,
            "status": transcription.asset.transcription_status,
            "contributors": transcription.asset.get_contributor_count(),
        },
        "message": "Successfully restored transcription to next version",
        "undo_available": transcription.asset.can_rollback()[0],
        "redo_available": transcription.asset.can_rollforward()[0],
    }
    return JsonResponse(payload, status=201)


@require_POST
@validate_anonymous_user
@atomic
def save_transcription(
    request: HttpRequest, *, asset_pk: Union[int, str]
) -> JsonResponse:
    """
    Save a transcription draft for a given asset.

    Validates the transcription text for disallowed content (e.g., URLs).
    Non-printable characters are automatically removed before saving,
    using the shared exporter sanitization utilities. The view also checks
    for supersession rules. If valid, it creates and saves a new
    transcription associated with the current or anonymous user.

    Anonymous callers must pass the `validate_anonymous_user` check. Runs in
    a database transaction.

    Args:
        request (HttpRequest): The POST request carrying the transcription.
        asset_pk (int or str): The primary key of the asset being transcribed.

    Request Parameters:
        - `text` (str): The transcription text. Required, but may be empty.
        - `supersedes` (int or str, optional): The ID of the transcription
          being superseded. Example: `"123"`

    Returns:
        response (JsonResponse): A dictionary describing the saved transcription
            and asset status with HTTP status 201, or an error response if
            validation fails.

    Response Format - Success:
        - `id` (int): ID of the saved transcription.
        - `sent` (float): UNIX timestamp of the response.
        - `submissionUrl` (str): URL to submit the transcription.
        - `text` (str): The transcription text as saved (after sanitization).
        - `asset` (dict):
            - `id` (int): ID of the associated asset.
            - `status` (str): Current transcription status.
            - `contributors` (int): Number of users who contributed.
        - `undo_available` (bool): Whether rollback is currently possible.
        - `redo_available` (bool): Whether rollforward is currently possible.

    Response Format - Error:
        - `error` (str): Explanation of the validation failure.
            - "No transcription text was provided."
            - "It looks like your text contains URLs."
            - "An open transcription already exists"
            - "This transcription has been superseded"
            - "Invalid supersedes value"
        - `error-code` (str): Present for the missing-text (`missing_text`)
          and URL (`url_detected`) errors only.

    Example:
        ```json
        {
            "id": 125,
            "sent": 1716295310.743182,
            "submissionUrl": "/transcriptions/125/submit/",
            "text" : "Transcription text\\r\\nSecond line",
            "asset": {
                "id": 456,
                "status": "in_progress",
                "contributors": 1
            },
            "undo_available": true,
            "redo_available": false
        }
        ```
    """
    asset = get_object_or_404(Asset, pk=asset_pk)
    logger.info("Saving transcription for %s (%s)", asset, asset.id)

    if request.user.is_anonymous:
        user = get_anonymous_user()
    else:
        user = request.user

    structured_logger.info(
        "Starting transcription save.",
        event_code="transcription_save_start",
        user=user,
        asset=asset,
    )

    # Indexing request.POST raises MultiValueDictKeyError when the field is
    # absent, which would surface as a server error. Treat a missing field as
    # a client error instead. An empty string is still accepted.
    transcription_text = request.POST.get("text")
    if transcription_text is None:
        structured_logger.warning(
            "Transcription save rejected due to missing text.",
            event_code="transcription_save_rejected",
            reason="Transcription text was not provided",
            reason_code="missing_text",
            user=user,
            asset=asset,
        )
        return JsonResponse(
            {
                "error": "No transcription text was provided.",
                "error-code": "missing_text",
            },
            status=400,
        )

    # Check whether this transcription text contains any URLs.
    # If so, ask the user to correct the transcription by removing the URLs.
    url_match = re.search(URL_REGEX, transcription_text)
    if url_match:
        structured_logger.warning(
            "Transcription save rejected due to URL in text.",
            event_code="transcription_save_rejected",
            reason="Transcription text contains URLs",
            reason_code="url_detected",
            user=user,
            asset=asset,
        )
        return JsonResponse(
            {
                "error": "It looks like your text contains URLs. "
                "Please remove the URLs and try again.",
                "error-code": "url_detected",
            },
            status=400,
        )

    # Sanitize the text by removing any unacceptable (non-printable) characters.
    # This leverages the shared exporter whitelist and logic so behavior remains
    # consistent across validation and export paths.
    transcription_text = remove_unacceptable_characters(transcription_text)

    supersedes_pk = request.POST.get("supersedes")
    superseded = get_transcription_superseded(asset, supersedes_pk)
    if superseded and isinstance(superseded, HttpResponse):
        # The helper produced an error response; hand it back unchanged.
        logger.info("Transcription superseded")
        structured_logger.warning(
            "Superseded transcription is invalid; aborting save.",
            event_code="transcription_save_aborted",
            reason="Superseded transcription is invalid",
            reason_code="superseded_invalid",
            user=user,
            asset=asset,
        )
        return superseded

    # OCR origin is inherited: text edited on top of OCR output (directly or
    # through earlier edits) stays flagged as OCR-originated.
    if superseded and (superseded.ocr_generated or superseded.ocr_originated):
        ocr_originated = True
    else:
        ocr_originated = False

    transcription = Transcription(
        asset=asset,
        user=user,
        supersedes=superseded,
        text=transcription_text,
        ocr_originated=ocr_originated,
    )
    transcription.full_clean()
    transcription.save()
    logger.info("Transcription %s saved", transcription.id)
    structured_logger.info(
        "Transcription saved successfully.",
        event_code="transcription_save_success",
        user=user,
        transcription=transcription,
    )

    return JsonResponse(
        {
            "id": transcription.pk,
            "sent": time(),
            "submissionUrl": reverse("submit-transcription", args=(transcription.pk,)),
            "text": transcription.text,
            "asset": {
                "id": transcription.asset.id,
                "status": transcription.asset.transcription_status,
                "contributors": transcription.asset.get_contributor_count(),
            },
            "undo_available": transcription.asset.can_rollback()[0],
            "redo_available": transcription.asset.can_rollforward()[0],
        },
        status=201,
    )


@require_POST
@validate_anonymous_user
def submit_transcription(request: HttpRequest, *, pk: Union[int, str]) -> JsonResponse:
    """
    Submit a transcription for review.

    Marks the transcription as submitted and clears any rejection state.
    Submission is refused when the transcription is currently submitted
    (submitted and not rejected) or when another transcription on the same
    asset supersedes it.

    The view only accepts POST requests and is wrapped by
    `validate_anonymous_user`.

    Args:
        request (HttpRequest): The POST request to submit the transcription.
        pk (int or str): The primary key of the transcription to submit.

    Returns:
        response (JsonResponse): A dictionary with the asset status and submission
            metadata (HTTP 200), or an error response (HTTP 400) if submission
            is not allowed.

    Raises:
        Http404: If no transcription with the given primary key exists.

    Response Format - Success:
        - `id` (int): ID of the submitted transcription.
        - `sent` (float): UNIX timestamp of the response.
        - `asset` (dict):
            - `id` (int): ID of the associated asset.
            - `status` (str): Current transcription status.
            - `contributors` (int): Number of users who contributed.
        - `undo_available` (bool): Always `false` after submission.
        - `redo_available` (bool): Always `false` after submission.

    Response Format - Error:
        - `error` (str): Explanation of the submission failure.
            - "This transcription has already been updated. Reload the
              current status before continuing."

    Example:
        ```json
        {
            "id": 126,
            "sent": 1716295421.019122,
            "asset": {
                "id": 456,
                "status": "submitted",
                "contributors": 1
            },
            "undo_available": false,
            "redo_available": false
        }
        ```
    """
    transcription = get_object_or_404(Transcription, pk=pk)
    asset = transcription.asset

    logger.info(
        "Transcription %s submitted for %s (%s)", transcription.id, asset, asset.id
    )

    # A transcription is superseded once any transcription on the same asset
    # points back at it through `supersedes`.
    is_superseded = transcription.asset.transcription_set.filter(supersedes=pk).exists()
    # A rejected transcription may be submitted again; one that is submitted
    # and not rejected may not.
    is_already_submitted = transcription.submitted and not transcription.rejected

    if is_already_submitted or is_superseded:
        # `pk` may be an int or a str, so it is formatted with %s; %d would
        # make the logging call fail to render for string keys.
        logger.warning(
            (
                "Submit for review was attempted for invalid transcription "
                "record: submitted: %s pk: %s"
            ),
            str(transcription.submitted),
            pk,
        )
        structured_logger.warning(
            "Submission rejected: transcription already submitted or superseded.",
            event_code="transcription_submit_rejected",
            reason="Transcription already submitted or superseded",
            reason_code="already_updated",
            user=request.user,
            transcription=transcription,
        )

        return JsonResponse(
            {
                "error": "This transcription has already been updated."
                " Reload the current status before continuing."
            },
            status=400,
        )

    transcription.submitted = now()
    transcription.rejected = None
    transcription.full_clean()
    transcription.save()

    logger.info("Transcription %s successfully submitted", transcription.id)
    structured_logger.info(
        "Transcription submitted successfully.",
        event_code="transcription_submit_success",
        user=request.user,
        transcription=transcription,
    )

    return JsonResponse(
        {
            "id": transcription.pk,
            "sent": time(),
            "asset": {
                "id": transcription.asset.id,
                "status": transcription.asset.transcription_status,
                "contributors": transcription.asset.get_contributor_count(),
            },
            "undo_available": False,
            "redo_available": False,
        },
        status=200,
    )


@require_POST
@login_required
@never_cache
def review_transcription(request: HttpRequest, *, pk: Union[int, str]) -> JsonResponse:
    """
    Accept or reject a transcription on behalf of the logged-in user.

    The POSTed `action` must be `"accept"` or `"reject"`. A transcription
    that already carries an accepted or rejected timestamp cannot be reviewed
    again, and a user may not accept a transcription they authored. Accepting
    is additionally subject to the per-user accept rate limit.

    Args:
        request (HttpRequest): The POST request containing the review action.
        pk (int or str): The primary key of the transcription to review.

    Returns:
        response (JsonResponse): The updated asset status and metadata on
            success, or an error payload when the review is refused.

    Response Format - Success:
        - `id` (int): ID of the reviewed transcription.
        - `sent` (float): UNIX timestamp of the response.
        - `asset` (dict):
            - `id` (int): ID of the associated asset.
            - `status` (str): Updated transcription status.
            - `contributors` (int): Number of users who contributed.

    Response Format - Error:
        - `error` (str): Explanation of the review failure.
            - "Invalid action" (HTTP 400)
            - "This transcription has already been reviewed" (HTTP 400)
            - "You cannot accept your own transcription" (HTTP 400)
            - Configuration-based rate limit message (HTTP 429), sent
              together with `popupTitle` and `popupError`.

    Example:
        ```json
        {
            "id": 127,
            "sent": 1716295502.642184,
            "asset": {
                "id": 456,
                "status": "completed",
                "contributors": 2
            }
        }
        ```
    """
    action = request.POST.get("action")
    reviewer = request.user
    structured_logger.info(
        "Starting transcription review.",
        event_code="transcription_review_start",
        user=reviewer,
        transcription_id=pk,
        action=action,
    )

    # Validate the action before touching the database.
    if action not in ("accept", "reject"):
        structured_logger.warning(
            "Transcription review failed: invalid action.",
            event_code="transcription_review_rejected",
            reason="Invalid review action",
            reason_code="invalid_action",
            user=reviewer,
            transcription_id=pk,
            action=action,
        )
        return JsonResponse({"error": "Invalid action"}, status=400)

    is_accept = action == "accept"

    transcription = get_object_or_404(Transcription, pk=pk)
    asset = transcription.asset

    logger.info(
        "Transcription %s reviewed (%s) for %s (%s)",
        transcription.id,
        action,
        asset,
        asset.id,
    )

    # Guard: a transcription can only be reviewed once.
    if transcription.accepted or transcription.rejected:
        structured_logger.warning(
            "Review rejected: transcription already reviewed.",
            event_code="transcription_review_rejected",
            reason="Transcription has already been reviewed",
            reason_code="already_reviewed",
            user=reviewer,
            transcription=transcription,
        )
        already_reviewed = {"error": "This transcription has already been reviewed"}
        return JsonResponse(already_reviewed, status=400)

    # Guard: authors may reject, but never accept, their own work.
    if transcription.user.pk == reviewer.pk and is_accept:
        logger.warning("Attempted self-acceptance for transcription %s", transcription)
        structured_logger.warning(
            "Review rejected: user attempted to accept their own transcription.",
            event_code="transcription_review_rejected",
            reason="User attempted to accept their own transcription",
            reason_code="self_accept",
            user=reviewer,
            transcription=transcription,
        )
        self_accept = {"error": "You cannot accept your own transcription"}
        return JsonResponse(self_accept, status=400)

    transcription.reviewed_by = reviewer

    if not is_accept:
        transcription.rejected = now()
    else:
        # The rate-limit helper lives on ConcordiaUser, so look the reviewer
        # up through that model.
        concordia_user = ConcordiaUser.objects.get(id=reviewer.id)
        try:
            concordia_user.check_and_track_accept_limit(transcription)
        except RateLimitExceededError:
            structured_logger.warning(
                "Review rejected: user exceeded review rate limit.",
                event_code="transcription_review_rejected",
                reason="User exceeded review rate limit",
                reason_code="rate_limit_exceeded",
                user=reviewer,
                transcription=transcription,
            )
            rate_limited = {
                "error": configuration_value("review_rate_limit_banner_message"),
                "popupTitle": configuration_value("review_rate_limit_popup_title"),
                "popupError": configuration_value("review_rate_limit_popup_message"),
            }
            return JsonResponse(rate_limited, status=429)
        transcription.accepted = now()

    transcription.full_clean()
    transcription.save()

    logger.info("Transcription %s successfully reviewed (%s)", transcription.id, action)
    structured_logger.info(
        "Transcription review successful.",
        event_code="transcription_review_success",
        user=reviewer,
        transcription=transcription,
        action=action,
    )

    payload = {
        "id": transcription.pk,
        "sent": time(),
        "asset": {
            "id": transcription.asset.id,
            "status": transcription.asset.transcription_status,
            "contributors": transcription.asset.get_contributor_count(),
        },
    }
    return JsonResponse(payload, status=200)


@require_POST
@login_required
@atomic
def submit_tags(request: HttpRequest, *, asset_pk: Union[int, str]) -> JsonResponse:
    """
    Apply the POSTed tag list to an asset on behalf of the current user.

    Tag values that do not exist yet are validated and created. Every
    submitted tag is added to the user's tag collection for the asset, and
    any tag attached to the asset that is missing from the submission is
    removed from every tag collection on that asset.

    Args:
        request (HttpRequest): The POST request; tag values are read from the
            `tags` list parameter.
        asset_pk (int or str): The primary key of the asset to tag.

    Returns:
        response (JsonResponse): The user's tags and the asset-wide tags after
            the update, or an HTTP 400 error payload if a new tag fails
            validation.

    Response Format - Success:
        - `user_tags` (list[str]): Tags currently assigned to the asset by this user.
        - `all_tags` (list[str]): All tags currently applied to the asset by any user.

    Response Format - Error:
        - `error` (list[str]): Validation error messages for the rejected tags.

    Example:
        ```json
        {
            "user_tags": ["map", "handwritten"],
            "all_tags": ["handwritten", "map", "note"]
        }
        ```
    """
    asset = get_object_or_404(Asset, pk=asset_pk)
    structured_logger.info(
        "Starting tag submission.",
        event_code="tag_submit_start",
        user=request.user,
        asset=asset,
    )

    user_collection, _ = UserAssetTagCollection.objects.get_or_create(
        asset=asset, user=request.user
    )

    submitted_values = set(request.POST.getlist("tags"))
    known_tags = Tag.objects.filter(value__in=submitted_values)
    unknown_values = submitted_values.difference(tag.value for tag in known_tags)
    tags_to_create = [Tag(value=value) for value in unknown_values]

    # Validate every new tag before writing any of them.
    try:
        for candidate in tags_to_create:
            candidate.full_clean()
    except ValidationError as exc:
        structured_logger.warning(
            "Tag submission rejected: validation error on new tags.",
            event_code="tag_submit_rejected",
            reason="Tag failed validation",
            reason_code="validation_error",
            user=request.user,
            asset=asset,
            errors=str(exc.messages),
        )
        return JsonResponse({"error": exc.messages}, status=400)

    Tag.objects.bulk_create(tags_to_create)

    # Every submitted value is now backed by a Tag object. Attach the ones the
    # user does not already have, then drop asset tags that were not submitted.
    submitted_tags = [*known_tags, *tags_to_create]
    current_user_tags = user_collection.tags.all()

    missing_from_user = [
        tag for tag in submitted_tags if tag not in current_user_tags
    ]
    for tag in missing_from_user:
        user_collection.tags.add(tag)

    asset_tags = Tag.objects.filter(userassettagcollection__asset__pk=asset_pk)

    for tag in asset_tags:
        if tag in submitted_tags:
            continue
        for collection in asset.userassettagcollection_set.all():
            collection.tags.remove(tag)

    # These querysets are lazy; they run when the response is built, after the
    # additions and removals above.
    user_tag_values = user_collection.tags.order_by("value").values_list(
        "value", flat=True
    )
    asset_tag_values = (
        asset_tags.order_by("value").values_list("value", flat=True).distinct()
    )

    structured_logger.info(
        "Tags submitted successfully.",
        event_code="tag_submit_success",
        user=request.user,
        asset=asset,
        user_tags=[tag.value for tag in user_collection.tags.all()],
    )

    return JsonResponse(
        {"user_tags": list(user_tag_values), "all_tags": list(asset_tag_values)}
    )


@ratelimit(
    key="header:cf-connecting-ip", rate=reserve_rate, block=settings.RATELIMIT_BLOCK
)
@require_POST
@never_cache
def reserve_asset(request: HttpRequest, *, asset_pk: Union[int, str]) -> JsonResponse:
    """
    Attempt to reserve an asset for transcription by the current session.

    If no reservation exists for the asset, creates a new one using the
    session's reservation token. If this session already holds an active
    reservation, refreshes it. If only tombstoned reservations from other
    sessions exist, creates a new reservation for this session. If the asset
    is actively reserved by another session, returns a conflict response.
    Handles reservation release if `release` is set in the request body.

    Refreshing and creating are mutually exclusive: a session that already
    holds an active reservation never gets a second row inserted, even when
    another session's tombstoned reservation is present.

    Request Parameters:
        - `release` (bool, optional): If present and true, releases the current
          reservation instead of acquiring or updating it. Example: `"true"`

    Returns:
        response (JsonResponse or HttpResponse): A dictionary indicating the
        reservation status and token, or an HTTP 408/409 response for timeout
        or conflict.

    Response Format - Success:
        - `asset_pk` (int): The ID of the reserved asset.
        - `reservation_token` (str): A unique identifier for the reservation session.

    Response Format - Error:
        - `408 Request Timeout`: The current session's reservation is tombstoned.
        - `409 Conflict`: The asset is actively reserved by another session.

    Example:
        ```json
        {
            "asset_pk": 789,
            "reservation_token": "abc123xyz"
        }
        ```
    """

    reservation_token = get_or_create_reservation_token(request)
    structured_logger.info(
        "Handling reservation request.",
        event_code="asset_reserve_start",
        asset_pk=asset_pk,
        reservation_token=reservation_token,
    )

    # If the browser is letting us know of a specific reservation release,
    # let it go even if it's within the grace period.
    if request.POST.get("release"):
        with connection.cursor() as cursor:
            cursor.execute(
                """
                DELETE FROM concordia_assettranscriptionreservation
                WHERE asset_id = %s and reservation_token = %s
                """,
                [asset_pk, reservation_token],
            )

        # We'll pass the message to the WebSocket listeners before returning it:
        msg = {"asset_pk": asset_pk, "reservation_token": reservation_token}
        logger.info("Releasing reservation with token %s", reservation_token)
        structured_logger.info(
            "Releasing asset reservation via client request.",
            event_code="asset_reserve_release",
            asset_pk=asset_pk,
            reservation_token=reservation_token,
        )
        reservation_released.send(sender="reserve_asset", **msg)
        return JsonResponse(msg)

    # We're relying on the database to meet our integrity requirements and since
    # this is called periodically we want to be fairly fast until we switch to
    # something like Redis.

    reservations = AssetTranscriptionReservation.objects.filter(
        asset_id__exact=asset_pk
    )

    # Default: pretend there is no activity on the asset
    is_it_already_mine = False
    am_i_tombstoned = False
    is_someone_else_tombstoned = False
    is_someone_else_active = False

    if reservations:
        # Classify every existing reservation for this asset. Any non-empty
        # result sets at least one of the four flags.
        for reservation in reservations:
            if reservation.tombstoned:
                if reservation.reservation_token == reservation_token:
                    am_i_tombstoned = True
                    logger.debug("I'm tombstoned %s", reservation_token)
                else:
                    is_someone_else_tombstoned = True
                    logger.debug(
                        "Someone else is tombstoned %s", reservation.reservation_token
                    )
            else:
                if reservation.reservation_token == reservation_token:
                    is_it_already_mine = True
                    logger.debug(
                        "I already have this active reservation %s", reservation_token
                    )
                if not is_it_already_mine:
                    is_someone_else_active = True
                    logger.info(
                        "Someone else has this active reservation %s",
                        reservation.reservation_token,
                    )

        if am_i_tombstoned:
            structured_logger.warning(
                "Reservation rejected: client is tombstoned.",
                event_code="asset_reserve_rejected",
                reason="Client reservation token is tombstoned",
                reason_code="tombstoned_self",
                asset_pk=asset_pk,
                reservation_token=reservation_token,
            )
            return HttpResponse(status=408)  # Request Timed Out

        if is_someone_else_active:
            structured_logger.warning(
                "Reservation rejected: asset is reserved by another client.",
                event_code="asset_reserve_rejected",
                reason="Asset is actively reserved by another session",
                reason_code="conflict_active_other",
                asset_pk=asset_pk,
                reservation_token=reservation_token,
            )
            return HttpResponse(status=409)  # Conflict

        if is_it_already_mine:
            # This user already has the reservation and it's not tombstoned.
            # Refresh it and do nothing else: inserting as well (because a
            # tombstoned row from another session also exists) would create
            # a duplicate reservation row and send the signal twice.
            structured_logger.info(
                "Reservation updated for client.",
                event_code="asset_reserve_updated",
                asset_pk=asset_pk,
                reservation_token=reservation_token,
            )
            msg = update_reservation(asset_pk, reservation_token)
            logger.debug("Updating reservation %s", reservation_token)
        else:
            # With the two rejections above ruled out and no active
            # reservation of our own, the only rows left are tombstoned
            # reservations from other sessions, so insert a new one.
            structured_logger.info(
                "Reservation acquired from tombstoned client.",
                event_code="asset_reserve_from_tombstone",
                asset_pk=asset_pk,
                reservation_token=reservation_token,
            )
            msg = obtain_reservation(asset_pk, reservation_token)
            logger.debug(
                "Obtaining reservation for %s from tombstoned user", reservation_token
            )
    else:
        # No reservations = no activity = go ahead and do an insert
        structured_logger.info(
            "Initial reservation acquired (no existing reservations).",
            event_code="asset_reserve_fresh",
            asset_pk=asset_pk,
            reservation_token=reservation_token,
        )
        msg = obtain_reservation(asset_pk, reservation_token)
        logger.debug("No activity, just get the reservation %s", reservation_token)

    return JsonResponse(msg)


def update_reservation(
    asset_pk: Union[int, str], reservation_token: str
) -> dict[str, Union[int, str]]:
    """
    Refresh the `updated_on` timestamp of a session's reservation on an asset.

    Runs a raw SQL `UPDATE` restricted to rows matching the asset and token
    whose `tombstoned` column is not `TRUE`, then sends the
    `reservation_obtained` signal with the reservation details.

    Args:
        asset_pk (int or str): The primary key of the reserved asset.
        reservation_token (str): The session's reservation token.

    Returns:
        response (dict): The message that was sent with the signal.

    Response Format - Success:
        - `asset_pk` (int): The ID of the reserved asset.
        - `reservation_token` (str): The reservation token used by the session.

    Example:
        ```json
        {
            "asset_pk": 789,
            "reservation_token": "abc123xyz"
        }
        ```
    """
    # Context fields attached to every structured log entry below.
    log_context = {"asset_pk": asset_pk, "reservation_token": reservation_token}

    refresh_sql = """
        UPDATE concordia_assettranscriptionreservation AS atr
            SET updated_on = current_timestamp
            WHERE (
                atr.asset_id = %s
                AND atr.reservation_token = %s
                AND atr.tombstoned != TRUE
                )
        """.strip()

    structured_logger.info(
        "Attempting to update reservation timestamp.",
        event_code="reservation_update_start",
        **log_context,
    )
    with connection.cursor() as cursor:
        cursor.execute(refresh_sql, [asset_pk, reservation_token])
    structured_logger.info(
        "Reservation update SQL executed.",
        event_code="reservation_update_sql_executed",
        **log_context,
    )

    # The same payload goes to the signal listeners and back to the caller.
    msg = dict(log_context)
    reservation_obtained.send(sender="reserve_asset", **msg)
    structured_logger.info(
        "Reservation update completed; signal dispatched.",
        event_code="reservation_update_success",
        **log_context,
    )
    return msg


def obtain_reservation(
    asset_pk: Union[int, str], reservation_token: str
) -> dict[str, Union[int, str]]:
    """
    Insert a new, non-tombstoned reservation row for an asset.

    Runs a raw SQL `INSERT` for the given asset and session token, with
    `created_on` and `updated_on` set to the current database timestamp, then
    sends the `reservation_obtained` signal with the reservation details.

    Args:
        asset_pk (int or str): The primary key of the asset to reserve.
        reservation_token (str): The session's reservation token.

    Returns:
        response (dict): The message that was sent with the signal.

    Response Format - Success:
        - `asset_pk` (int): The ID of the reserved asset.
        - `reservation_token` (str): The reservation token used by the session.

    Example:
        ```json
        {
            "asset_pk": 789,
            "reservation_token": "abc123xyz"
        }
        ```
    """
    # Context fields attached to every structured log entry below.
    log_context = {"asset_pk": asset_pk, "reservation_token": reservation_token}

    insert_sql = """
        INSERT INTO concordia_assettranscriptionreservation AS atr
            (asset_id, reservation_token, tombstoned, created_on,
            updated_on)
            VALUES (%s, %s, FALSE, current_timestamp,
            current_timestamp)
        """.strip()

    structured_logger.info(
        "Attempting to create new reservation.",
        event_code="reservation_obtain_start",
        **log_context,
    )
    with connection.cursor() as cursor:
        cursor.execute(insert_sql, [asset_pk, reservation_token])
    structured_logger.info(
        "Reservation INSERT executed successfully.",
        event_code="reservation_insert_success",
        **log_context,
    )

    # The same payload goes to the signal listeners and back to the caller.
    msg = dict(log_context)
    reservation_obtained.send(sender="reserve_asset", **msg)
    structured_logger.info(
        "Reservation successfully obtained; signal dispatched.",
        event_code="reservation_obtain_success",
        **log_context,
    )
    return msg


================================================
FILE: concordia/views/assets.py
================================================
import logging
import random
from typing import Any
from urllib.parse import urlencode

from django.conf import settings
from django.contrib import messages
from django.contrib.auth.models import User
from django.db.models import QuerySet
from django.db.transaction import atomic
from django.http import Http404, HttpRequest, HttpResponse, HttpResponseRedirect
from django.shortcuts import get_object_or_404, redirect
from django.urls import reverse
from django.utils.decorators import method_decorator
from django.views.decorators.cache import never_cache
from django_ratelimit.decorators import ratelimit

from concordia.api_views import APIDetailView
from concordia.forms import TurnstileForm
from concordia.logging import ConcordiaLogger
from concordia.models import (
    Asset,
    AssetTranscriptionReservation,
    Campaign,
    CardFamily,
    Guide,
    Topic,
    TranscriptionStatus,
    TutorialCard,
    UserAssetTagCollection,
)
from concordia.templatetags.concordia_media_tags import asset_media_url
from concordia.utils import (
    get_anonymous_user,
    get_or_create_reservation_token,
)
from concordia.utils.next_asset import (
    find_next_reviewable_campaign_asset,
    find_next_reviewable_topic_asset,
    find_next_transcribable_campaign_asset,
    find_next_transcribable_topic_asset,
    find_reviewable_campaign_asset,
    find_transcribable_campaign_asset,
    remove_next_asset_objects,
)

from .decorators import next_asset_rate
from .utils import AnonymousUserValidationCheckMixin

# Standard-library logger named after this module.
logger = logging.getLogger(__name__)
# Structured logger obtained from ConcordiaLogger; calls in this module pass an
# `event_code` plus context keyword arguments alongside the message.
structured_logger = ConcordiaLogger.get_logger(__name__)


@method_decorator(never_cache, name="dispatch")
class AssetDetailView(AnonymousUserValidationCheckMixin, APIDetailView):
    """
    Display details for a single asset and handle missing assets.

    This view handles `GET` and `POST` requests by retrieving the published
    `Asset` that matches the campaign, project and item.

    It uses `AnonymousUserValidationCheckMixin` for anonymous-user validation
    and `APIDetailView` for API-driven detail behavior. It overrides
    `dispatch` to log and redirect to the parent campaign page if the asset
    is not found.

    Attributes:
        template_name (str): Template used to render the asset detail page.
    """

    template_name = "transcriptions/asset_detail.html"

    def dispatch(
        self,
        request: HttpRequest,
        *args: Any,
        **kwargs: Any,
    ) -> HttpResponse:
        try:
            return super().dispatch(request, *args, **kwargs)
        except Http404:
            structured_logger.info(
                "AssetDetailView: asset not found, redirecting to campaign " "page.",
                event_code="asset_detail_not_found_redirect",
                user=request.user,
                campaign_slug=self.kwargs.get("campaign_slug"),
                project_slug=self.kwargs.get("project_slug"),
                item_id=self.kwargs.get("item_id"),
                asset_slug=self.kwargs.get("slug"),
            )
            campaign = get_object_or_404(
                Campaign.objects.published(), slug=self.kwargs["campaign_slug"]
            )
            return redirect(campaign)

    def get_queryset(self) -> QuerySet[Asset]:
        asset_qs = Asset.objects.published().filter(
            item__project__campaign__slug=self.kwargs["campaign_slug"],
            item__project__slug=self.kwargs["project_slug"],
            item__item_id=self.kwargs["item_id"],
            slug=self.kwargs["slug"],
        )
        asset_qs = asset_qs.select_related("item__project__campaign")

        return asset_qs

    def get_context_data(self, **kwargs: Any) -> dict[str, Any]:
        """
        Build the context for the asset detail template.

        Constructs a dictionary with the entries described in the context
        format.

        Context Format:
            - `asset` (Asset): Asset instance being viewed.
            - `item` (Item): Parent item of the asset.
            - `project` (Project): Parent project of the item.
            - `campaign` (Campaign): Campaign that contains the project.
            - `transcription` (Transcription | None): Latest transcription or
              `None`.
            - `next_open_asset_url` (str): URL to the next transcribable
              asset.
            - `next_review_asset_url` (str): URL to the next reviewable
              asset.
            - `transcription_status` (str): One of the keys from
              `TranscriptionStatus`.
            - `activity_mode` (str): `"transcribe"` or `"review"`, based on
              the transcription status.
            - `disable_ocr` (bool): Whether OCR should be disabled for this
              asset.
            - `previous_asset_url` (str | None): URL to the previous asset, if
              any.
            - `next_asset_url` (str | None): URL to the next asset, if any.
            - `asset_navigation` (list[tuple[int, str]]): Sequence and slug
              pairs for navigation.
            - `thumbnail_url` (str): URL of the asset thumbnail image.
            - `current_asset_url` (str): Absolute URL of this asset detail
              view.
            - `tags` (list[str]): Sorted tag values applied to the asset.
            - `registered_contributors` (int): Number of users who have
              contributed to the asset.
            - `cards` (list[Card]): Tutorial cards for the campaign or the
              default card set.
            - `guides` (QuerySet[dict[str, Any]] | None): Tutorial guide
              entries.
            - `languages` (list[tuple[str, str]]): Supported language
              code and name pairs.
            - `undo_available` (bool): Whether a rollback is possible.
            - `redo_available` (bool): Whether a rollforward is possible.
            - `turnstile_form` (TurnstileForm): Form for the Turnstile
              widget.

        Args:
            **kwargs (Any): Additional keyword arguments passed to the
                superclass implementation.

        Returns:
            dict[str, Any]: Context data for rendering the asset detail page.
        """

        ctx = super().get_context_data(**kwargs)
        asset = ctx["asset"]
        # Bind a new logger so asset and user are always included
        context_logger = structured_logger.bind(user=self.request.user, asset=asset)
        context_logger.info(
            "AssetDetailView: building context.",
            event_code="asset_detail_context_start",
        )
        ctx["item"] = item = asset.item
        ctx["project"] = project = item.project
        ctx["campaign"] = project.campaign

        transcription = asset.transcription_set.order_by("-pk").first()
        context_logger.debug(
            "AssetDetailView: latest transcription selected.",
            event_code="asset_detail_latest_transcription",
            transcription=transcription,
        )
        ctx["transcription"] = transcription

        ctx["next_open_asset_url"] = "%s?%s" % (
            reverse(
                "transcriptions:redirect-to-next-transcribable-campaign-asset",
                kwargs={"campaign_slug": project.campaign.slug},
            ),
            urlencode(
                {"project": project.slug, "item": item.item_id, "asset": asset.id}
            ),
        )

        ctx["next_review_asset_url"] = "%s?%s" % (
            reverse(
                "transcriptions:redirect-to-next-reviewable-campaign-asset",
                kwargs={"campaign_slug": project.campaign.slug},
            ),
            urlencode(
                {"project": project.slug, "item": item.item_id, "asset": asset.id}
            ),
        )

        # We handle the case where an item with no transcriptions should be
        # shown as status=not_started here so the logic does not need to be
        # repeated in templates.
        if transcription:
            for choice_key, choice_value in TranscriptionStatus.CHOICE_MAP.items():
                if choice_value == transcription.status:
                    transcription_status = choice_key
        else:
            transcription_status = TranscriptionStatus.NOT_STARTED
        ctx["transcription_status"] = transcription_status

        context_logger.debug(
            "AssetDetailView: computed transcription status.",
            event_code="asset_detail_transcription_status",
            computed_status=transcription_status,
            asset_status=asset.transcription_status,
        )

        if (
            transcription_status == TranscriptionStatus.NOT_STARTED
            or transcription_status == TranscriptionStatus.IN_PROGRESS
        ):
            ctx["activity_mode"] = "transcribe"
            ctx["disable_ocr"] = asset.turn_off_ocr()
        else:
            ctx["disable_ocr"] = True
        if transcription_status == TranscriptionStatus.SUBMITTED:
            ctx["activity_mode"] = "review"

        previous_asset = (
            item.asset_set.published()
            .filter(sequence__lt=asset.sequence)
            .order_by("sequence")
            .last()
        )
        next_asset = (
            item.asset_set.published()
            .filter(sequence__gt=asset.sequence)
            .order_by("sequence")
            .first()
        )
        context_logger.debug(
            "AssetDetailView: asset navigation resolved.",
            event_code="asset_detail_navigation",
            previous_asset_id=getattr(previous_asset, "pk", None),
            next_asset_id=getattr(next_asset, "pk", None),
        )
        if previous_asset:
            ctx["previous_asset_url"] = previous_asset.get_absolute_url()
        if next_asset:
            ctx["next_asset_url"] = next_asset.get_absolute_url()

        ctx["asset_navigation"] = (
            item.asset_set.published()
            .order_by("sequence")
            .values_list("sequence", "slug")
        )

        image_url = asset_media_url(asset)
        if asset.download_url and "iiif" in asset.download_url:
            thumbnail_url = asset.download_url.replace(
                "http://tile.loc.gov", "https://tile.loc.gov"
            )
            thumbnail_url = thumbnail_url.replace("/pct:100/", "/!512,512/")
        else:
            thumbnail_url = image_url
        context_logger.debug(
            "AssetDetailView: thumbnail URL determined.",
            event_code="asset_detail_thumbnail",
            thumbnail_url=thumbnail_url,
        )
        ctx["thumbnail_url"] = thumbnail_url

        ctx["current_asset_url"] = self.request.build_absolute_uri()

        tag_groups = UserAssetTagCollection.objects.filter(asset__slug=asset.slug)

        tags = set()

        for tag_group in tag_groups:
            for tag in tag_group.tags.all():
                tags.add(tag.value)

        ctx["tags"] = sorted(tags)

        ctx["registered_contributors"] = asset.get_contributor_count()

        if project.campaign.card_family:
            card_family = project.campaign.card_family
        else:
            card_family = CardFamily.objects.filter(default=True).first()
        if card_family is not None:
            unordered_cards = TutorialCard.objects.filter(tutorial=card_family)
            ordered_cards = unordered_cards.order_by("order")
            ctx["cards"] = [tutorial_card.card for tutorial_card in ordered_cards]

        guides = Guide.objects.order_by("order").values("title", "body")
        if guides.count() > 0:
            ctx["guides"] = guides

        ctx["languages"] = list(settings.LANGUAGE_CODES.items())

        ctx["undo_available"] = asset.can_rollback()[0] if transcription else False
        ctx["redo_available"] = asset.can_rollforward()[0] if transcription else False

        ctx["turnstile_form"] = TurnstileForm(auto_id=False)

        context_logger.info(
            "AssetDetailView: context ready.",
            event_code="asset_detail_context_ready",
            transcription=transcription,
            transcription_status=transcription_status,
        )
        return ctx


def redirect_to_next_asset(
    asset: Asset | None,
    mode: str,
    request: HttpRequest,
    user: User,
) -> HttpResponseRedirect:
    """
    Send the user either to an asset's detail page or to the homepage.

    A reservation token is obtained for the request in every case. When an
    asset is supplied, an `AssetTranscriptionReservation` is validated and
    saved for it, `remove_next_asset_objects` is called with the asset ID
    and the user is redirected to the asset detail view. When no asset is
    supplied, an informational message is queued on the request and the
    user is redirected to the homepage.

    Args:
        asset (Asset | None): Asset to redirect to, or `None` if no asset is
            available.
        mode (str): Either `"transcribe"` or `"review"`; interpolated into
            the "no remaining pages" message and included in log events.
        request (HttpRequest): Request that initiated the redirect.
        user (User): User being redirected; only used for logging here.

    Returns:
        HttpResponseRedirect: Redirect to the asset detail page or the
        homepage.
    """
    structured_logger.info(
        "Starting redirect to next asset.",
        event_code="redirect_next_asset_start",
        user=user,
        mode=mode,
        asset=asset,
    )
    token = get_or_create_reservation_token(request)

    if not asset:
        # Nothing to hand out: tell the user and fall back to the homepage.
        structured_logger.warning(
            "No available asset to redirect to.",
            event_code="redirect_next_asset_empty",
            reason=("There were no eligible assets found to assign to the user."),
            reason_code="no_asset_available",
            asset=asset,
            user=user,
            mode=mode,
        )
        messages.info(request, f"There are no remaining pages to {mode}.")
        return redirect("homepage")

    # Reservations are created for reviews as well as transcriptions.
    # Reserving only transcriptions used to leave a window in which the
    # unreserved asset could be put back into the next-asset cache table
    # after the redirect but before the user made their own reservation,
    # so the same asset could be handed to a second user.
    reservation = AssetTranscriptionReservation(
        asset=asset, reservation_token=token
    )
    reservation.full_clean()
    reservation.save()
    structured_logger.info(
        "Asset reserved and redirecting to asset detail view.",
        event_code="redirect_next_asset_success",
        asset=asset,
        user=user,
    )
    remove_next_asset_objects(asset.id)

    item = asset.item
    project = item.project
    return redirect(
        "transcriptions:asset-detail",
        project.campaign.slug,
        project.slug,
        item.item_id,
        asset.slug,
    )


@ratelimit(
    key="header:cf-connecting-ip",
    rate=next_asset_rate,
    group="next_asset",
    block=True,
)
@never_cache
@atomic
def redirect_to_next_reviewable_asset(
    request: HttpRequest,
) -> HttpResponseRedirect:
    """
    Redirect the user to a reviewable asset from any active reviewable
    campaign.

    Candidate campaigns are the IDs returned by
    `get_next_review_campaigns()` on the active, listed and published
    campaigns; they are tried in random order. If none of them yields an
    asset, the remaining active, listed and published campaigns are tried
    in ascending `launch_date` order. The first asset found (or `None`) is
    handed to `redirect_to_next_asset`.

    A candidate campaign that can no longer be loaded by ID is logged and
    skipped rather than aborting the request.

    Args:
        request (HttpRequest): Incoming HTTP request.

    Returns:
        HttpResponseRedirect: Redirect to the selected asset or the
        homepage.
    """
    structured_logger.info(
        "Entered redirect_to_next_reviewable_asset view.",
        event_code="redirect_reviewable_entry",
        user=request.user,
    )
    # Unauthenticated visitors are represented by the anonymous user.
    if not request.user.is_authenticated:
        user = get_anonymous_user()
    else:
        user = request.user

    campaign_ids = list(
        Campaign.objects.active()
        .listed()
        .published()
        .get_next_review_campaigns()
        .values_list("id", flat=True)
    )
    structured_logger.debug(
        "Fetched candidate campaign IDs for reviewable assets.",
        event_code="redirect_reviewable_campaign_ids",
        user=user,
        campaign_ids=campaign_ids,
    )
    asset = None
    if campaign_ids:
        # Randomize so that no single candidate campaign is always first.
        random.shuffle(campaign_ids)  # nosec
    else:
        logger.info("No configured reviewable campaigns")
        structured_logger.info(
            "No configured reviewable campaigns.",
            event_code="redirect_reviewable_no_campaigns",
            user=user,
        )

    for campaign_id in campaign_ids:
        try:
            campaign = Campaign.objects.get(id=campaign_id)
        except (Campaign.DoesNotExist, IndexError):
            # QuerySet.get() signals a missing row with DoesNotExist; the
            # previous IndexError-only handler could never fire, so a
            # campaign removed after the ID list was built crashed the view.
            # IndexError is still caught for backward compatibility.
            logger.error("Next reviewable campaign %s not found", campaign_id)
            structured_logger.error(
                "Failed to retrieve next reviewable campaign by ID.",
                event_code="redirect_reviewable_campaign_missing",
                reason=("Reviewable campaign with specified ID was not found."),
                reason_code="reviewable_campaign_not_found",
                user=user,
                campaign_id=campaign_id,
            )
            continue
        asset = find_reviewable_campaign_asset(campaign, user)
        if asset:
            break
        else:
            logger.info("No reviewable assets found in %s", campaign)
            structured_logger.info(
                "No reviewable assets found in campaign.",
                event_code="redirect_reviewable_campaign_empty_primary",
                user=user,
                campaign=campaign,
            )

    if not asset:
        # Fallback: every other active, listed, published campaign.
        for campaign in (
            Campaign.objects.active()
            .listed()
            .published()
            .exclude(id__in=campaign_ids)
            .order_by("launch_date")
        ):
            asset = find_reviewable_campaign_asset(campaign, user)
            if asset:
                break
            else:
                logger.info("No reviewable assets found in %s", campaign)
                structured_logger.info(
                    "No reviewable assets found in campaign.",
                    event_code="redirect_reviewable_campaign_empty_fallback",
                    user=user,
                    campaign=campaign,
                )
    structured_logger.info(
        "Redirecting to next reviewable asset.",
        event_code="redirect_reviewable_success",
        user=user,
        asset=asset,
    )
    return redirect_to_next_asset(asset, "review", request, user)


@ratelimit(
    key="header:cf-connecting-ip",
    rate=next_asset_rate,
    group="next_asset",
    block=True,
)
@never_cache
@atomic
def redirect_to_next_transcribable_asset(
    request: HttpRequest,
) -> HttpResponseRedirect:
    """
    Redirect the user to a transcribable asset from any active transcription
    campaign.

    Candidate campaigns are the IDs returned by
    `get_next_transcription_campaigns()` on the active, listed and
    published campaigns; they are tried in random order. If none of them
    yields an asset, the remaining active, listed and published campaigns
    are tried in descending `launch_date` order. The first asset found (or
    `None`) is handed to `redirect_to_next_asset`.

    A candidate campaign that can no longer be loaded by ID is logged and
    skipped rather than aborting the request.

    Args:
        request (HttpRequest): Incoming HTTP request.

    Returns:
        HttpResponseRedirect: Redirect to the selected asset or the
        homepage.
    """
    structured_logger.info(
        "Entered redirect_to_next_transcribable_asset view.",
        event_code="redirect_transcribable_entry",
        user=request.user,
    )
    campaign_ids = list(
        Campaign.objects.active()
        .listed()
        .published()
        .get_next_transcription_campaigns()
        .values_list("id", flat=True)
    )
    structured_logger.debug(
        "Fetched candidate campaign IDs for transcribable assets.",
        event_code="redirect_transcribable_campaign_ids",
        user=request.user,
        campaign_ids=campaign_ids,
    )
    asset = None
    if campaign_ids:
        # Randomize so that no single candidate campaign is always first.
        random.shuffle(campaign_ids)  # nosec
    else:
        logger.info("No configured transcribable campaigns")
        structured_logger.info(
            "No configured transcribable campaigns.",
            event_code="redirect_transcribable_no_campaigns",
            user=request.user,
        )

    for campaign_id in campaign_ids:
        try:
            campaign = Campaign.objects.get(id=campaign_id)
        except (Campaign.DoesNotExist, IndexError):
            # QuerySet.get() signals a missing row with DoesNotExist; the
            # previous IndexError-only handler could never fire, so a
            # campaign removed after the ID list was built crashed the view.
            # IndexError is still caught for backward compatibility.
            logger.error("Next transcribable campaign %s not found", campaign_id)
            structured_logger.error(
                "Next transcribable campaign ID not found.",
                event_code="redirect_transcribable_campaign_missing",
                reason=("Transcribable campaign with specified ID was not found."),
                reason_code="transcribable_campaign_not_found",
                user=request.user,
                campaign_id=campaign_id,
            )
            continue
        asset = find_transcribable_campaign_asset(campaign)
        if asset:
            break
        else:
            logger.info("No transcribable assets found in %s", campaign)
            structured_logger.info(
                "No transcribable assets found in campaign.",
                event_code="redirect_transcribable_campaign_empty_primary",
                user=request.user,
                campaign=campaign,
            )

    if not asset:
        # Fallback: every other active, listed, published campaign.
        for campaign in (
            Campaign.objects.active()
            .listed()
            .published()
            .exclude(id__in=campaign_ids)
            .order_by("-launch_date")
        ):
            asset = find_transcribable_campaign_asset(campaign)
            if asset:
                break
            else:
                logger.info("No transcribable assets found in %s", campaign)
                structured_logger.info(
                    "No transcribable assets found in campaign (fallback loop).",
                    event_code="redirect_transcribable_campaign_empty_fallback",
                    user=request.user,
                    campaign=campaign,
                )

    if not asset:
        logger.info("No transcribable assets found in any campaign")
        structured_logger.info(
            "No transcribable assets found in any campaign.",
            event_code="redirect_transcribable_no_assets_anywhere",
            user=request.user,
        )

    structured_logger.info(
        "Redirecting to next transcribable asset.",
        event_code="redirect_transcribable_success",
        user=request.user,
        asset=asset,
    )
    return redirect_to_next_asset(asset, "transcribe", request, request.user)


@ratelimit(
    key="header:cf-connecting-ip",
    rate=next_asset_rate,
    group="next_asset",
    block=True,
)
@never_cache
@atomic
def redirect_to_next_reviewable_campaign_asset(
    request: HttpRequest,
    *,
    campaign_slug: str,
) -> HttpResponseRedirect:
    """
    Send the user to the next asset awaiting review in one campaign.

    The campaign is looked up by slug among published campaigns, so it may
    be listed or unlisted; an unknown slug results in a 404. Optional query
    parameters describing the user's current position are forwarded to
    `find_next_reviewable_campaign_asset`.

    Request Parameters:
        project (str): Current project slug. Defaults to `""`.
        item (str): Current item identifier. This is `item_id`, not the item
            primary key. Defaults to `""`.
        asset (int): ID of the most recently reviewed asset. Forwarded as
            received from the query string; defaults to `0`.

    Args:
        request (HttpRequest): Incoming HTTP request.
        campaign_slug (str): Slug for the target campaign.

    Returns:
        HttpResponseRedirect: Redirect to the selected asset or the
        homepage.
    """
    structured_logger.info(
        "Entered redirect_to_next_reviewable_campaign_asset view.",
        event_code="redirect_reviewable_campaign_entry",
        user=request.user,
        campaign_slug=campaign_slug,
    )
    # Only "published" is required here, so unlisted campaigns qualify too.
    published_campaigns = Campaign.objects.published()
    campaign = get_object_or_404(published_campaigns, slug=campaign_slug)

    query = request.GET
    current_project = query.get("project", "")
    current_item = query.get("item", "")
    last_asset = query.get("asset", 0)
    structured_logger.debug(
        "Parsed query parameters for reviewable asset redirection.",
        event_code="redirect_reviewable_campaign_query_params",
        user=request.user,
        campaign=campaign,
        project_slug=current_project,
        item_id=current_item,
        asset_pk=last_asset,
    )

    # Unauthenticated visitors are represented by the anonymous user.
    user = request.user if request.user.is_authenticated else get_anonymous_user()

    # request.user (not the resolved `user`) is deliberately passed to the
    # finder to keep long-standing behavior, even though it is probably
    # unintended.
    # TODO: Re-evaluate whether we should pass in user instead.
    asset = find_next_reviewable_campaign_asset(
        campaign, request.user, current_project, current_item, last_asset
    )
    structured_logger.info(
        "Redirecting to next reviewable asset in campaign.",
        event_code="redirect_reviewable_campaign_success",
        user=user,
        request_user=request.user,
        asset=asset,
        campaign=campaign,  # Logged separately because asset might be None.
    )
    return redirect_to_next_asset(asset, "review", request, user)


@ratelimit(
    key="header:cf-connecting-ip",
    rate=next_asset_rate,
    group="next_asset",
    block=True,
)
@never_cache
@atomic
def redirect_to_next_transcribable_campaign_asset(
    request: HttpRequest,
    *,
    campaign_slug: str,
) -> HttpResponseRedirect:
    """
    Send the user to the next asset open for transcription in one campaign.

    The campaign is looked up by slug among published campaigns, so it may
    be listed or unlisted; an unknown slug results in a 404. Optional query
    parameters describing the user's current position are forwarded to
    `find_next_transcribable_campaign_asset`.

    Request Parameters:
        project (str): Current project slug. Defaults to `""`.
        item (str): Current item identifier. This is `item_id`, not the item
            primary key. Defaults to `""`.
        asset (int): ID of the most recently transcribed asset. Forwarded as
            received from the query string; defaults to `0`.

    Args:
        request (HttpRequest): Incoming HTTP request.
        campaign_slug (str): Slug for the target campaign.

    Returns:
        HttpResponseRedirect: Redirect to the selected asset or the
        homepage.
    """
    structured_logger.info(
        "Entered redirect_to_next_transcribable_campaign_asset view.",
        event_code="redirect_transcribable_campaign_entry",
        user=request.user,
        campaign_slug=campaign_slug,
    )
    # Only "published" is required here, so unlisted campaigns qualify too.
    published_campaigns = Campaign.objects.published()
    campaign = get_object_or_404(published_campaigns, slug=campaign_slug)

    query = request.GET
    current_project = query.get("project", "")
    current_item = query.get("item", "")
    last_asset = query.get("asset", 0)
    structured_logger.debug(
        "Parsed query parameters for transcribable asset redirection.",
        event_code="redirect_transcribable_campaign_query_params",
        user=request.user,
        campaign=campaign,
        project_slug=current_project,
        item_id=current_item,
        asset_pk=last_asset,
    )

    # Unauthenticated visitors are represented by the anonymous user.
    user = request.user if request.user.is_authenticated else get_anonymous_user()

    asset = find_next_transcribable_campaign_asset(
        campaign, current_project, current_item, last_asset
    )
    structured_logger.info(
        "Redirecting to next transcribable asset in campaign.",
        event_code="redirect_transcribable_campaign_success",
        user=user,
        asset=asset,
        campaign=campaign,  # Logged separately because asset may be None.
    )
    return redirect_to_next_asset(asset, "transcribe", request, user)


@ratelimit(
    key="header:cf-connecting-ip",
    rate=next_asset_rate,
    group="next_asset",
    block=True,
)
@never_cache
@atomic
def redirect_to_next_reviewable_topic_asset(
    request: HttpRequest,
    *,
    topic_slug: str,
) -> HttpResponseRedirect:
    """
    Send the user to the next asset awaiting review in one topic.

    The topic is looked up by slug among published topics, so it may be
    listed or unlisted; an unknown slug results in a 404. Optional query
    parameters describing the user's current position are forwarded to
    `find_next_reviewable_topic_asset`.

    Request Parameters:
        project (str): Current project slug. Defaults to `""`.
        item (str): Current item identifier. This is `item_id`, not the item
            primary key. Defaults to `""`.
        asset (int): ID of the most recently reviewed asset. Forwarded as
            received from the query string; defaults to `0`.

    Args:
        request (HttpRequest): Incoming HTTP request.
        topic_slug (str): Slug for the target topic.

    Returns:
        HttpResponseRedirect: Redirect to the selected asset or the
        homepage.
    """
    structured_logger.info(
        "Entered redirect_to_next_reviewable_topic_asset view.",
        event_code="redirect_reviewable_topic_entry",
        user=request.user,
        topic_slug=topic_slug,
    )
    # Only "published" is required here, so unlisted topics qualify too.
    published_topics = Topic.objects.published()
    topic = get_object_or_404(published_topics, slug=topic_slug)

    query = request.GET
    current_project = query.get("project", "")
    current_item = query.get("item", "")
    last_asset = query.get("asset", 0)
    structured_logger.debug(
        "Parsed query parameters for reviewable topic redirection.",
        event_code="redirect_reviewable_topic_query_params",
        user=request.user,
        topic=topic,
        project_slug=current_project,
        item_id=current_item,
        asset_pk=last_asset,
    )

    # Unauthenticated visitors are represented by the anonymous user.
    user = request.user if request.user.is_authenticated else get_anonymous_user()

    # request.user (not the resolved `user`) is deliberately passed to the
    # finder to keep long-standing behavior, even though it is probably
    # unintended.
    # TODO: Re-evaluate whether we should pass in user instead.
    asset = find_next_reviewable_topic_asset(
        topic, request.user, current_project, current_item, last_asset
    )
    structured_logger.info(
        "Redirecting to next reviewable asset in topic.",
        event_code="redirect_reviewable_topic_success",
        user=user,
        request_user=request.user,
        asset=asset,
        topic=topic,
    )

    return redirect_to_next_asset(asset, "review", request, user)


@ratelimit(
    key="header:cf-connecting-ip",
    rate=next_asset_rate,
    group="next_asset",
    block=True,
)
@never_cache
@atomic
def redirect_to_next_transcribable_topic_asset(
    request: HttpRequest,
    *,
    topic_slug: str,
) -> HttpResponseRedirect:
    """
    Send the user to the next asset open for transcription in one topic.

    The topic is looked up by slug among published topics, so it may be
    listed or unlisted; an unknown slug results in a 404. Optional query
    parameters describing the user's current position are forwarded to
    `find_next_transcribable_topic_asset`.

    Request Parameters:
        project (str): Current project slug. Defaults to `""`.
        item (str): Current item identifier. This is `item_id`, not the item
            primary key. Defaults to `""`.
        asset (int): ID of the most recently transcribed asset. Forwarded as
            received from the query string; defaults to `0`.

    Args:
        request (HttpRequest): Incoming HTTP request.
        topic_slug (str): Slug for the target topic.

    Returns:
        HttpResponseRedirect: Redirect to the selected asset or the
        homepage.
    """
    structured_logger.info(
        "Entered redirect_to_next_transcribable_topic_asset view.",
        event_code="redirect_transcribable_topic_entry",
        user=request.user,
        topic_slug=topic_slug,
    )
    # Only "published" is required here, so unlisted topics qualify too.
    published_topics = Topic.objects.published()
    topic = get_object_or_404(published_topics, slug=topic_slug)

    query = request.GET
    current_project = query.get("project", "")
    current_item = query.get("item", "")
    last_asset = query.get("asset", 0)
    structured_logger.debug(
        "Parsed query parameters for transcribable topic redirection.",
        event_code="redirect_transcribable_topic_query_params",
        user=request.user,
        topic=topic,
        project_slug=current_project,
        item_id=current_item,
        asset_pk=last_asset,
    )

    # Unauthenticated visitors are represented by the anonymous user.
    user = request.user if request.user.is_authenticated else get_anonymous_user()

    asset = find_next_transcribable_topic_asset(
        topic, current_project, current_item, last_asset
    )
    structured_logger.info(
        "Redirecting to next transcribable asset in topic.",
        event_code="redirect_transcribable_topic_success",
        user=user,
        asset=asset,
        topic=topic,
    )
    return redirect_to_next_asset(asset, "transcribe", request, user)


================================================
FILE: concordia/views/campaigns.py
================================================
from typing import Any, Iterable
from urllib.parse import urlencode

from django.core.paginator import Paginator
from django.db.models import Count, Q, QuerySet
from django.http import HttpResponse
from django.shortcuts import get_object_or_404, render
from django.utils.decorators import method_decorator
from django.views.generic import TemplateView

from concordia.api_views import APIDetailView, APIListView
from concordia.models import (
    STATUS_COUNT_KEYS,
    Asset,
    Campaign,
    Project,
    ResearchCenter,
    SiteReport,
    Topic,
    Transcription,
    TranscriptionStatus,
)
from concordia.utils.constants import ASSETS_PER_PAGE

from .decorators import default_cache_control, user_cache_control
from .utils import (
    annotate_children_with_progress_stats,
    calculate_asset_stats,
)


@method_decorator(default_cache_control, name="dispatch")
class CampaignListView(APIListView):
    """
    List the active campaigns.

    The base queryset holds published, listed campaigns whose status is
    ACTIVE, ordered by `ordering` and then `title`. The template context
    additionally carries the listed topics and the completed or retired
    campaigns.

    Built on APIListView; `serialize_context` extends the serialized
    output with per-campaign asset status counts.

    Attributes:
        template_name (str): Template used to render the campaign list.
        context_object_name (str): Name of the context variable holding
            the campaigns.
        queryset (QuerySet[Campaign]): Base queryset of campaigns.
    """

    template_name = "transcriptions/campaign_list.html"
    context_object_name = "campaigns"
    queryset = (
        Campaign.objects.published()
        .listed()
        .filter(status=Campaign.Status.ACTIVE)
        .order_by("ordering", "title")
    )

    def get_context_data(self, **kwargs: Any) -> dict[str, Any]:
        """
        Assemble the template context for the campaign list.

        On top of the superclass context this adds:
        - 'topics': Published, listed topics ordered by ordering and title.
        - 'completed_campaigns': Published, listed campaigns whose status is
          COMPLETED or RETIRED, ordered by ordering and title.

        Args:
            **kwargs: Forwarded to the superclass implementation.

        Returns:
            dict[str, Any]: Context data for rendering.
        """
        context = super().get_context_data(**kwargs)

        listed_topics = Topic.objects.published().listed()
        finished_statuses = [Campaign.Status.COMPLETED, Campaign.Status.RETIRED]
        finished_campaigns = (
            Campaign.objects.published().listed().filter(status__in=finished_statuses)
        )

        context["topics"] = listed_topics.order_by("ordering", "title")
        context["completed_campaigns"] = finished_campaigns.order_by(
            "ordering", "title"
        )
        return context

    def serialize_context(self, context: dict[str, Any]) -> dict[str, Any]:
        """
        Serialize the context and attach asset status counts.

        Each entry of the serialized `objects` list receives an
        `asset_stats` mapping. It contains one count per name in
        `STATUS_COUNT_KEYS`, counting published assets (under published
        projects and items) with the matching transcription status.

        Args:
            context (dict[str, Any]): The view context.

        Returns:
            dict[str, Any]: Serialized context data for API output.
        """
        data = super().serialize_context(context)
        serialized_campaigns = data["objects"]
        campaign_pks = [entry["id"] for entry in serialized_campaigns]

        # One conditional Count annotation per transcription status.
        status_annotations = {}
        for status, count_name in STATUS_COUNT_KEYS.items():
            status_annotations[count_name] = Count(
                "project__item__asset",
                filter=Q(
                    project__published=True,
                    project__item__published=True,
                    project__item__asset__published=True,
                    project__item__asset__transcription_status=status,
                ),
            )

        stats_rows = (
            Campaign.objects.filter(pk__in=campaign_pks)
            .annotate(**status_annotations)
            .values("pk", *STATUS_COUNT_KEYS.values())
        )

        # Index rows by primary key; "pk" is popped so only counts remain.
        stats_by_pk = {row.pop("pk"): row for row in stats_rows}

        for entry in serialized_campaigns:
            entry["asset_stats"] = stats_by_pk[entry["id"]]

        return data


@method_decorator(default_cache_control, name="dispatch")
class CompletedCampaignListView(APIListView):
    """
    List completed and/or retired campaigns.

    Works on published, listed campaigns. The `type` query parameter
    narrows the list to retired or completed campaigns, and the
    `research_center` query parameter narrows it to one research center.

    Attributes:
        model (Model): The Campaign model class.
        template_name (str): Template used to render the campaign list.
        context_object_name (str): Name of the context variable holding
            the campaigns.
    """

    model = Campaign
    template_name = "transcriptions/campaign_list_small_blocks.html"
    context_object_name = "campaigns"

    def _get_all_campaigns(self) -> QuerySet[Campaign]:
        """
        Return published, listed campaigns selected by the `type` parameter.

        Without a `type` query parameter both COMPLETED and RETIRED
        campaigns are returned. `type=retired` selects RETIRED campaigns;
        any other value selects COMPLETED campaigns.

        Returns:
            QuerySet[Campaign]: Filtered campaigns.
        """
        listed_campaigns = Campaign.objects.published().listed()
        campaign_type = self.request.GET.get("type", None)

        if campaign_type is None:
            both_statuses = [Campaign.Status.COMPLETED, Campaign.Status.RETIRED]
            return listed_campaigns.filter(status__in=both_statuses)

        wanted_status = (
            Campaign.Status.RETIRED
            if campaign_type == "retired"
            else Campaign.Status.COMPLETED
        )
        return listed_campaigns.filter(status=wanted_status)

    def get_queryset(self) -> QuerySet[Campaign]:
        """
        Build the queryset shown by this view.

        Starts from `_get_all_campaigns()`, applies the optional
        `research_center` filter and orders by `completed_date`, newest
        first.

        Returns:
            QuerySet[Campaign]: The queryset for completed campaigns.
        """
        selected = self._get_all_campaigns()
        center = self.request.GET.get("research_center", None)
        # NOTE(review): the raw query-string value goes straight into the
        # ORM filter; confirm whether it is validated anywhere upstream.
        if center is not None:
            selected = selected.filter(research_centers=center)
        return selected.order_by("-completed_date")

    def get_context_data(self, **kwargs: Any) -> dict[str, Any]:
        """
        Assemble the template context for the completed campaign list.

        On top of the superclass context this adds:
        - 'result_count': Number of campaigns in `self.object_list`.
        - 'research_centers': Distinct research centers linked to the
          campaigns from `_get_all_campaigns()`, i.e. before any
          `research_center` filter is applied.

        Args:
            **kwargs: Forwarded to the superclass implementation.

        Returns:
            dict[str, Any]: Context data for rendering.
        """
        context = super().get_context_data(**kwargs)
        unfiltered_campaigns = self._get_all_campaigns()
        centers = ResearchCenter.objects.filter(campaign__in=unfiltered_campaigns)

        context["result_count"] = self.object_list.count()
        context["research_centers"] = centers.distinct()
        return context


@method_decorator(default_cache_control, name="dispatch")
class CampaignTopicListView(TemplateView):
    """
    Show active campaigns, a few topics and finished campaigns together.

    The page combines three lists: active campaigns, the first five topics
    and the completed or retired campaigns.

    Attributes:
        template_name (str): Template used to render the campaign-topic
            list page.
    """

    template_name = "transcriptions/campaign_topic_list.html"

    def get(self, request, *args: Any, **kwargs: Any) -> HttpResponse:
        """
        Render the campaign-topic list page.

        The template receives:
        - 'campaigns': Published, listed, ACTIVE campaigns, annotated and
          ordered by ordering and title.
        - 'topics': The first 5 published, listed topics ordered by
          ordering and title.
        - 'completed_campaigns': Published, listed campaigns whose status is
          COMPLETED or RETIRED, ordered by ordering and title.

        Args:
            request (HttpRequest): The incoming HTTP request.
            *args: Additional positional arguments (unused).
            **kwargs: Additional keyword arguments (unused).

        Returns:
            HttpResponse: Rendered campaign topic list page.
        """
        sort_fields = ("ordering", "title")

        active_campaigns = (
            Campaign.objects.published()
            .listed()
            .filter(status=Campaign.Status.ACTIVE)
            .annotated()
            .order_by(*sort_fields)
        )
        leading_topics = Topic.objects.published().listed().order_by(*sort_fields)[:5]
        finished_statuses = [Campaign.Status.COMPLETED, Campaign.Status.RETIRED]
        finished_campaigns = (
            Campaign.objects.published()
            .listed()
            .filter(status__in=finished_statuses)
            .order_by(*sort_fields)
        )

        context = {
            "campaigns": active_campaigns,
            "topics": leading_topics,
            "completed_campaigns": finished_campaigns,
        }
        return render(request, self.template_name, context)


@method_decorator(default_cache_control, name="dispatch")
class CampaignDetailView(APIDetailView):
    """
    Display details for a single campaign.

    Renders campaign information, associated projects, and aggregated asset
    statistics. Selects different templates based on campaign status
    (active, completed, or retired).

    Attributes:
        template_name (str): Template for active campaigns.
        completed_template_name (str): Template for completed campaigns.
        retired_template_name (str): Template for retired campaigns.
        context_object_name (str): Context variable name for the campaign.
        queryset (QuerySet[Campaign]): Published campaigns ordered by title.

    Returns:
        HttpResponse: Renders the campaign detail template with context.
    """

    template_name = "transcriptions/campaign_detail.html"
    completed_template_name = "transcriptions/campaign_detail_completed.html"
    retired_template_name = "transcriptions/campaign_detail_retired.html"
    context_object_name = "campaign"
    queryset = Campaign.objects.published().order_by("title")

    def get_context_data(self, **kwargs: Any) -> dict[str, Any]:
        """
        Build context data for the campaign detail page.

        Adds:
        - For retired campaigns: 'completed_count' and 'contributor_count',
          read from the most recently created SiteReport for the campaign.
          When no report exists both values are 0 instead of the lookup
          raising `SiteReport.DoesNotExist`.
        - For all other campaigns: 'projects' annotated with per-status asset
          counts, 'filters', 'sublevel_querystring', 'transcription_status'
          and the values added by `calculate_asset_stats`. When
          `filter_by_reviewable` is passed in `kwargs`, 'filter_assets' is set
          and transcriptions by the current user are excluded.

        Args:
            **kwargs: Additional context arguments. `filter_by_reviewable`
                (bool) switches on the reviewable-only filtering.

        Returns:
            dict[str, Any]: Context data for rendering.
        """
        ctx = super().get_context_data(**kwargs)
        if self.object and self.object.status == Campaign.Status.RETIRED:
            try:
                latest_report = SiteReport.objects.filter(
                    campaign=ctx["campaign"]
                ).latest("created_on")
            except SiteReport.DoesNotExist:
                # A retired campaign without any stored report should still
                # render; fall back to zero counts instead of a server error.
                ctx["completed_count"] = 0
                ctx["contributor_count"] = 0
            else:
                ctx["completed_count"] = latest_report.assets_completed
                ctx["contributor_count"] = latest_report.registered_contributors
        else:
            projects = (
                ctx["campaign"].project_set.published().order_by("ordering", "title")
            )
            ctx["filters"] = filters = {}
            filter_by_reviewable = kwargs.get("filter_by_reviewable", False)
            if filter_by_reviewable:
                # Keep only projects that have at least one transcription
                # written by someone other than the current user.
                # NOTE(review): this filter joins through item/asset/
                # transcription; confirm the per-status counts annotated below
                # are not inflated by the extra join rows.
                projects = projects.filter(
                    item__asset__transcription__id__in=Transcription.objects.exclude(
                        user=self.request.user.id
                    ).values_list("id", flat=True)
                )
                ctx["filter_assets"] = True
            # One "<status>_count" annotation per transcription status,
            # counting only published assets on published items.
            projects = projects.annotate(
                **{
                    f"{key}_count": Count(
                        "item__asset",
                        filter=Q(
                            item__published=True,
                            item__asset__published=True,
                            item__asset__transcription_status=key,
                        ),
                    )
                    for key in TranscriptionStatus.CHOICE_MAP
                }
            )

            if filter_by_reviewable:
                status = TranscriptionStatus.SUBMITTED
            else:
                status = self.request.GET.get("transcription_status")
            if status in TranscriptionStatus.CHOICE_MAP:
                # Drop projects that have no assets in the requested status.
                projects = projects.exclude(**{f"{status}_count": 0})
                # We only want to pass specific QS parameters
                # to lower-level search pages:
                filters["transcription_status"] = status
            ctx["sublevel_querystring"] = urlencode(filters)

            # Helper from .utils; presumably attaches progress statistics to
            # each project in place (its return value is not used here).
            annotate_children_with_progress_stats(projects)
            ctx["projects"] = projects

            campaign_assets = Asset.objects.filter(
                item__project__campaign=self.object,
                item__project__published=True,
                item__published=True,
                published=True,
            )
            if filter_by_reviewable:
                campaign_assets = campaign_assets.exclude(
                    transcription__user=self.request.user.id
                )
                ctx["transcription_status"] = TranscriptionStatus.SUBMITTED
            else:
                ctx["transcription_status"] = status

            # Helper from .utils; receives the context dict, presumably to
            # store the computed asset statistics in it.
            calculate_asset_stats(campaign_assets, ctx)

        return ctx

    def serialize_context(self, context: dict[str, Any]) -> dict[str, Any]:
        """
        Serialize campaign context data for API responses.

        Adds:
        - 'related_links': A list of `{"title", "url"}` dicts under the
          serialized object, built from the campaign's `helpfullink_set`
          (`title` and `link_url` values).

        Args:
            context (dict[str, Any]): The view context.

        Returns:
            dict[str, Any]: Serialized context data for API output.
        """
        ctx = super().serialize_context(context)
        ctx["object"]["related_links"] = [
            {"title": title, "url": url}
            for title, url in self.object.helpfullink_set.values_list(
                "title", "link_url"
            )
        ]
        return ctx

    def get_template_names(self) -> list[str]:
        """
        Determine the template to use based on campaign status.

        Completed and retired campaigns use their dedicated templates; every
        other status defers to the parent class.

        Returns:
            list[str]: List containing the selected template name.
        """
        if self.object.status == Campaign.Status.COMPLETED:
            return [self.completed_template_name]
        elif self.object.status == Campaign.Status.RETIRED:
            return [self.retired_template_name]
        return super().get_template_names()


@method_decorator(user_cache_control, name="dispatch")
class FilteredCampaignDetailView(CampaignDetailView):
    """
    Campaign detail page restricted to reviewable content for staff.

    Behaves like CampaignDetailView, except that authenticated staff users get
    the `filter_by_reviewable` flag switched on when the context is built.
    Other users see the unfiltered page.

    Returns:
        HttpResponse: Renders the filtered campaign detail template with context.
    """

    def get_context_data(self, **kwargs: Any) -> dict[str, Any]:
        """
        Build the context, enabling reviewable filtering for staff users.

        `filter_by_reviewable=True` is added to the keyword arguments handed to
        the parent implementation only when the requesting user is both
        authenticated and staff.

        Args:
            **kwargs: Additional context arguments.

        Returns:
            dict[str, Any]: Context data for rendering.
        """
        requester = self.request.user
        staff_reviewer = requester.is_authenticated and requester.is_staff
        if staff_reviewer:
            kwargs.update(filter_by_reviewable=True)

        return super().get_context_data(**kwargs)


@method_decorator(default_cache_control, name="dispatch")
class ReportCampaignView(TemplateView):
    """
    Display a report summarizing campaign resources and status.

    Renders a paginated report including project-level asset counts, tag counts,
    contributor counts, reviewer counts and transcription status summaries.

    Attributes:
        template_name (str): Template used to render the campaign report page.

    Returns:
        HttpResponse: Renders the campaign report template with context.
    """

    template_name = "transcriptions/campaign_report.html"

    def get(
        self, request, campaign_slug: str, *args: Any, **kwargs: Any
    ) -> HttpResponse:
        """
        Handle GET requests for the campaign report page.

        Builds context containing:
        - 'title' and 'campaign_slug' of the campaign
        - 'total_asset_count': number of published assets in the campaign
        - 'paginator' and 'projects': published projects ordered by title,
          paginated, with asset, tag, transcriber and reviewer counts
        - a `transcription_statuses` attribute on each project of the page

        The `page` query parameter selects the page. A value that is not an
        integer, or that lies outside `1..num_pages` (including zero and
        negative numbers), falls back to the first page.

        Args:
            request (HttpRequest): The incoming HTTP request.
            campaign_slug (str): Slug for the campaign to report on.
            *args: Additional positional arguments.
            **kwargs: Additional keyword arguments.

        Returns:
            HttpResponse: Rendered campaign report page.

        Raises:
            Http404: If no published campaign has the given slug.
        """
        campaign = get_object_or_404(Campaign.objects.published(), slug=campaign_slug)

        try:
            page = int(self.request.GET.get("page", "1"))
        except ValueError:
            page = 1

        campaign_assets = Asset.objects.published().filter(
            item__project__campaign=campaign
        )

        ctx = {
            "title": campaign.title,
            "campaign_slug": campaign.slug,
            "total_asset_count": campaign_assets.count(),
        }

        projects_qs = campaign.project_set.published().order_by("title")

        # distinct=True on every Count keeps the several joins below from
        # multiplying each other's totals.
        projects_qs = projects_qs.annotate(
            asset_count=Count(
                "item__asset",
                filter=Q(item__published=True, item__asset__published=True),
                distinct=True,
            )
        )
        projects_qs = projects_qs.annotate(
            tag_count=Count("item__asset__userassettagcollection__tags", distinct=True)
        )
        projects_qs = projects_qs.annotate(
            transcriber_count=Count("item__asset__transcription__user", distinct=True),
            reviewer_count=Count(
                "item__asset__transcription__reviewed_by", distinct=True
            ),
        )

        paginator = Paginator(projects_qs, ASSETS_PER_PAGE)
        # Send every out-of-range request to the first page. Without the lower
        # bound, Paginator.get_page() would serve the *last* page for
        # ?page=0 or a negative page, unlike too-large page numbers.
        if not 1 <= page <= paginator.num_pages:
            page = 1
        projects_page = paginator.get_page(page)

        self.add_transcription_status_summary_to_projects(projects_page)

        ctx["paginator"] = paginator
        ctx["projects"] = projects_page

        return render(self.request, self.template_name, ctx)

    def add_transcription_status_summary_to_projects(
        self, projects: Iterable[Project]
    ) -> None:
        """
        Annotate each project with a summary of transcription statuses.

        Adds a 'transcription_statuses' attribute to each project: a list of
        `(status_name, count)` tuples covering the published assets of
        published items in that project, sorted in the order the statuses
        appear in `TranscriptionStatus.CHOICES`. Projects without matching
        assets get an empty list.

        Args:
            projects (Iterable): Projects to annotate. Iterated twice: once as
                the `__in` lookup value and once to attach the attribute.

        Returns:
            None
        """
        status_qs = Asset.objects.filter(
            item__published=True, item__project__in=projects, published=True
        )
        # Group by (project id, status) and count the assets in each group.
        status_qs = status_qs.values_list("item__project__id", "transcription_status")
        status_qs = status_qs.annotate(Count("transcription_status"))
        project_statuses = {}

        for project_id, status_value, count in status_qs:
            status_name = TranscriptionStatus.CHOICE_MAP[status_value]
            project_statuses.setdefault(project_id, []).append((status_name, count))

        # We'll sort the statuses in the same order they're presented in the choices
        # list so the display order will be both stable and consistent with the way
        # we talk about the workflow:
        sort_order = [j for i, j in TranscriptionStatus.CHOICES]

        for project in projects:
            statuses = project_statuses.get(project.id, [])
            statuses.sort(key=lambda i: sort_order.index(i[0]))
            project.transcription_statuses = statuses


================================================
FILE: concordia/views/decorators.py
================================================
from collections.abc import Callable
from functools import wraps
from time import time

from django.conf import settings
from django.core.exceptions import ObjectDoesNotExist, ValidationError
from django.http import HttpRequest, JsonResponse
from django.views.decorators.cache import cache_control, never_cache
from django.views.decorators.vary import vary_on_headers

from concordia.forms import TurnstileForm
from concordia.logging import ConcordiaLogger
from configuration.utils import configuration_value
from configuration.validation import validate_rate

# Module-level structured logger; next_asset_rate() uses it to report when it
# falls back to the default rate limit.
structured_logger = ConcordiaLogger.get_logger(__name__)


def default_cache_control(view_function: Callable) -> Callable:
    """
    Wrap a public-facing view with the site's default caching headers.

    The wrapped view is passed through `cache_control(public=True,
    max_age=settings.DEFAULT_PAGE_TTL)` and then through
    `vary_on_headers("Accept-Encoding")`. The TTL setting is read once, when
    the decorator is applied.

    Args:
        view_function (Callable): The view function to decorate.

    Returns:
        Callable: The wrapped view function with cache control headers applied.
    """

    @wraps(view_function)
    def passthrough(*args, **kwargs):
        return view_function(*args, **kwargs)

    # Same stacking as decorator syntax: cache_control innermost, Vary outermost.
    with_cache_headers = cache_control(
        public=True, max_age=settings.DEFAULT_PAGE_TTL
    )(passthrough)
    return vary_on_headers("Accept-Encoding")(with_cache_headers)


def user_cache_control(view_function: Callable) -> Callable:
    """
    Wrap a view whose output may differ per session with caching headers.

    The wrapped view is passed through `cache_control(public=True,
    max_age=settings.DEFAULT_PAGE_TTL)` and then through
    `vary_on_headers("Accept-Encoding", "Cookie")`, so the response varies by
    both headers. The TTL setting is read once, when the decorator is
    applied.

    Args:
        view_function (Callable): The view function to decorate.

    Returns:
        Callable: The wrapped view function with user-aware cache control
            headers.
    """

    @wraps(view_function)
    def passthrough(*args, **kwargs):
        return view_function(*args, **kwargs)

    # Same stacking as decorator syntax: cache_control innermost, Vary outermost.
    with_cache_headers = cache_control(
        public=True, max_age=settings.DEFAULT_PAGE_TTL
    )(passthrough)
    return vary_on_headers("Accept-Encoding", "Cookie")(with_cache_headers)


def validate_anonymous_user(view: Callable) -> Callable:
    """
    Require Turnstile validation for `POST` requests from anonymous users.

    For an unauthenticated `POST`, the session value
    `turnstile_last_validated` is compared with the current time. When it is
    older than `settings.ANONYMOUS_USER_VALIDATION_INTERVAL` (or missing), the
    request body is checked with `TurnstileForm`. A failed check returns a 401
    JSON response without calling the view; a successful one stores the
    current time in the session so later requests within the interval skip
    the check.

    All other requests go straight to the view. The wrapper is also marked
    with `never_cache`.

    Args:
        view (Callable): The view function to wrap.

    Returns:
        Callable: The wrapped view function with anonymous user validation
            logic.
    """

    session_key = "turnstile_last_validated"

    def guarded(request, *args, **kwargs):
        anonymous_post = not request.user.is_authenticated and request.method == "POST"
        if anonymous_post:
            # A recent successful validation lets the request through
            # without running Turnstile again.
            seconds_since_check = time() - request.session.get(session_key, 0)
            if seconds_since_check > settings.ANONYMOUS_USER_VALIDATION_INTERVAL:
                if not TurnstileForm(request.POST).is_valid():
                    return JsonResponse(
                        {"error": "Unable to validate. Please try again or login."},
                        status=401,
                    )
                # Remember when validation succeeded.
                request.session[session_key] = time()

        return view(request, *args, **kwargs)

    return wraps(view)(never_cache(guarded))


def reserve_rate(group: str, request: HttpRequest) -> str | None:
    """
    Determine the rate limit value for a request.

    This helper is used to control throttling behavior. If the user is
    anonymous, it returns a fixed rate limit string, for example "100/m".
    Authenticated users are not rate-limited and it returns `None`.

    The `group` parameter controls how rate limits are grouped. It defaults
    to the dotted name of the view so each view is treated as its own rate
    limit bucket unless explicitly overridden.

    Args:
        group (str): Group name used to bucket rate limits. Defaults to the
            dotted view name if not set manually.
        request (HttpRequest): The incoming HTTP request.

    Returns:
        str | None: A rate string such as "100/m" for anonymous users, or
            `None` otherwise.
    """
    return None if request.user.is_authenticated else "100/m"


def next_asset_rate(group: str, request: HttpRequest) -> str | None:
    """
    Determine the rate limit value for a next-asset request.

    If the user is anonymous, this helper returns a rate limit string from
    the `next_asset_rate_limit` configuration value, for example "4/m".
    Authenticated users are not rate-limited and it returns `None`.

    The `group` parameter controls how rate limits are grouped. It is used
    internally by `django-ratelimit`. It could be used to return different
    rate limits based on the group, but that is not needed currently.

    Args:
        group (str): Group name used to bucket rate limits. Defaults to the
            dotted view name if not set manually.
        request (HttpRequest): The incoming HTTP request.

    Returns:
        str | None: A rate string such as "4/m" for anonymous users, or
            `None` otherwise.
    """
    if request.user.is_authenticated:
        return None
    try:
        rate_limit = configuration_value("next_asset_rate_limit")
        return validate_rate(rate_limit)
    except (ObjectDoesNotExist, ValidationError) as exc:
        structured_logger.warning(
            "Falling back to default next-asset rate limit.",
            event_code="next_asset_rate_config_fallback",
            reason="Could not load or validate configured rate limit",
            reason_code="config_missing_or_invalid",
            group=group,
            default_rate="4/m",
            user=request.user,
            error_type=exc.__class__.__name__,
            error=str(exc),
        )
        return "4/m"


================================================
FILE: concordia/views/items.py
================================================
from urllib.parse import urlencode

from django.db.models import QuerySet
from django.http import Http404, HttpRequest, HttpResponse
from django.shortcuts import get_object_or_404, redirect
from django.utils.decorators import method_decorator

from concordia.api_views import APIListView
from concordia.models import Campaign, Item, TranscriptionStatus
from concordia.utils import get_image_urls_from_asset

from .decorators import default_cache_control, user_cache_control
from .utils import calculate_asset_stats


@method_decorator(default_cache_control, name="dispatch")
class ItemDetailView(APIListView):
    """
    Paginated listing of the assets that belong to one item.

    Serves the item detail page: the item's published assets, the filter
    state used to build links to lower-level pages, and transcription
    statistics for the item.

    Builds on `APIListView`, whose `serialize_context` hook is extended here
    to add image URLs and the serialized item.

    Attributes:
        template_name (str): Template used to render the asset list.
        context_object_name (str): The variable name for assets in the template.
        paginate_by (int): Number of assets to display per page.
        http_method_names (list[str]): HTTP methods supported by the view.
    """

    template_name = "transcriptions/item_detail.html"
    context_object_name = "assets"
    paginate_by = 10

    http_method_names = ["get", "options", "head"]

    def dispatch(self, request: HttpRequest, *args, **kwargs) -> HttpResponse:
        """
        Dispatch the request, redirecting to the campaign on a 404.

        If normal dispatch raises `Http404`, the published campaign named by
        the `campaign_slug` URL argument is looked up and the user is
        redirected to it. When that campaign does not exist either, the
        second lookup raises `Http404` itself.

        Args:
            request (HttpRequest): The HTTP request object.

        Returns:
            HttpResponse: The response for the view or a redirect to the campaign page.
        """
        try:
            response = super().dispatch(request, *args, **kwargs)
        except Http404:
            published_campaigns = Campaign.objects.published()
            parent_campaign = get_object_or_404(
                published_campaigns, slug=self.kwargs["campaign_slug"]
            )
            return redirect(parent_campaign)
        return response

    def _get_assets(self) -> QuerySet:
        """
        Return the published assets of the current item.

        When `filter_by_reviewable` is set in `self.kwargs`, assets with a
        transcription by the current user are excluded.

        Returns:
            QuerySet: The filtered set of published `Asset` objects for the item.
        """
        published_assets = self.item.asset_set.published()
        if not self.kwargs.get("filter_by_reviewable", False):
            return published_assets
        return published_assets.exclude(transcription__user=self.request.user.id)

    def get_queryset(self):
        """
        Load the item and return its assets, optionally filtered by status.

        The published `Item` is looked up from the `campaign_slug`,
        `project_slug` and `item_id` URL arguments and stored on `self.item`.
        Its assets (see `_get_assets`) are ordered by `sequence`.

        The status filter is SUBMITTED when `filter_by_reviewable` is set in
        `self.kwargs`; otherwise it is taken from the `transcription_status`
        query parameter. It is applied only when it is a key of
        `TranscriptionStatus.CHOICE_MAP`, in which case it is also recorded in
        `self.filters`.

        Returns:
            QuerySet: The filtered and ordered queryset of `Asset` objects.
        """
        url_kwargs = self.kwargs
        published_items = Item.objects.published().select_related("project__campaign")
        self.item = get_object_or_404(
            published_items,
            project__campaign__slug=url_kwargs["campaign_slug"],
            project__slug=url_kwargs["project_slug"],
            item_id=url_kwargs["item_id"],
        )

        assets = (
            self._get_assets()
            .order_by("sequence")
            .select_related("item__project__campaign", "item__project", "item")
        )

        reviewable_only = url_kwargs.get("filter_by_reviewable", False)
        wanted_status = (
            TranscriptionStatus.SUBMITTED
            if reviewable_only
            else self.request.GET.get("transcription_status")
        )

        self.filters = {}
        if wanted_status in TranscriptionStatus.CHOICE_MAP:
            assets = assets.filter(transcription_status=wanted_status)
            # Only these query-string parameters are forwarded to
            # lower-level pages, so they are recorded here.
            self.filters["transcription_status"] = wanted_status

        return assets

    def get_context_data(self, **kwargs):
        """
        Build the template context for the item detail page.

        Adds the campaign, project, item, the filters recorded by
        `get_queryset` and their urlencoded form. 'transcription_status' is
        SUBMITTED (with 'filter_assets' set) when review filtering is on,
        otherwise the raw `transcription_status` query parameter.

        Finally `calculate_asset_stats()` is called with the item's assets and
        the context.

        Returns:
            dict: The context data for the template rendering.
        """
        ctx = super().get_context_data(**kwargs)

        item = self.item
        project = item.project
        ctx.update(
            campaign=project.campaign,
            project=project,
            item=item,
            sublevel_querystring=urlencode(self.filters),
            filters=self.filters,
        )

        item_assets = self._get_assets()
        reviewable_only = self.kwargs.get("filter_by_reviewable", False)
        if reviewable_only:
            ctx.update(
                filter_assets=True,
                transcription_status=TranscriptionStatus.SUBMITTED,
            )
        else:
            ctx["transcription_status"] = self.request.GET.get("transcription_status")

        calculate_asset_stats(item_assets, ctx)

        return ctx

    def serialize_context(self, context: dict) -> dict:
        """
        Serialize the context for JSON responses.

        Each entry of the parent's serialized `objects` list gets the
        `image_url` and `thumbnail_url` of the asset at the same position in
        `context["object_list"]`. The serialized item is added under `item`.

        Args:
            context (dict): The original context data returned by `get_context_data()`.

        Returns:
            dict: The serialized version of the context suitable for API responses.
        """
        payload = super().serialize_context(context)

        for position, asset in enumerate(context["object_list"]):
            entry = payload["objects"][position]
            entry["image_url"], entry["thumbnail_url"] = get_image_urls_from_asset(
                asset
            )

        payload["item"] = self.serialize_object(context["item"])
        return payload


@method_decorator(user_cache_control, name="dispatch")
class FilteredItemDetailView(ItemDetailView):
    """
    Item detail page limited to reviewable assets.

    Same as `ItemDetailView`, but always switches on the
    `filter_by_reviewable` flag, so the parent excludes assets with a
    transcription by the current user and restricts the listing to the
    SUBMITTED status.
    """

    def get_queryset(self):
        """
        Return the parent's queryset with reviewable filtering enabled.

        Sets `filter_by_reviewable` in `self.kwargs` before delegating to the
        parent implementation.

        Returns:
            QuerySet: A filtered queryset of `Asset` objects for review.
        """
        self.kwargs.update(filter_by_reviewable=True)
        return super().get_queryset()

    def get_context_data(self, **kwargs):
        """
        Return the parent's context with reviewable filtering enabled.

        Sets `filter_by_reviewable` both in `self.kwargs` and in the keyword
        arguments passed to the parent implementation.

        Returns:
            dict: The context dictionary for rendering the filtered item detail view.
        """
        self.kwargs.update(filter_by_reviewable=True)
        forwarded = {**kwargs, "filter_by_reviewable": True}
        return super().get_context_data(**forwarded)


================================================
FILE: concordia/views/maintenance_mode.py
================================================
from time import time

from django.core.cache import cache
from django.http import HttpRequest, HttpResponseRedirect
from maintenance_mode.core import set_maintenance_mode


def maintenance_mode_off(request: HttpRequest) -> HttpResponseRedirect:
    """
    Turn maintenance mode off and redirect to the site root.

    `set_maintenance_mode(False)` is called only when the requesting user is
    a superuser. Every caller is redirected, whether or not the state changed.

    Returns:
        HttpResponseRedirect: Redirect to `/?t=<unix timestamp>`; the timestamp
        is a cache buster.
    """
    requester = request.user
    if requester.is_superuser:
        set_maintenance_mode(False)

    # The timestamp makes the URL unique so the maintenance mode banner is
    # always displayed/removed rather than served from a cache.
    cache_buster = int(time())
    return HttpResponseRedirect(f"/?t={cache_buster}")


def maintenance_mode_on(request: HttpRequest) -> HttpResponseRedirect:
    """
    Turn maintenance mode on and redirect to the site root.

    `set_maintenance_mode(True)` is called only when the requesting user is a
    superuser. Every caller is redirected, whether or not the state changed.

    Returns:
        HttpResponseRedirect: Redirect to `/?t=<unix timestamp>`; the timestamp
        is a cache buster.
    """
    requester = request.user
    if requester.is_superuser:
        set_maintenance_mode(True)

    # The timestamp makes the URL unique so the maintenance mode banner is
    # always displayed/removed rather than served from a cache.
    cache_buster = int(time())
    return HttpResponseRedirect(f"/?t={cache_buster}")


def maintenance_mode_frontend_available(request: HttpRequest) -> HttpResponseRedirect:
    """
    Mark the frontend as available during maintenance and redirect to the root.

    For superusers, stores `True` under the cache key
    `maintenance_mode_frontend_available` with no expiry (timeout `None`).
    Other users cause no change. How the flag is used is decided by whatever
    reads that key elsewhere.

    Returns:
        HttpResponseRedirect: Redirect to `/?t=<unix timestamp>`; the timestamp
        is a cache buster.
    """
    requester = request.user
    if requester.is_superuser:
        cache.set("maintenance_mode_frontend_available", True, None)

    cache_buster = int(time())
    return HttpResponseRedirect(f"/?t={cache_buster}")


def maintenance_mode_frontend_unavailable(request: HttpRequest) -> HttpResponseRedirect:
    """
    Mark the frontend as unavailable during maintenance and redirect to the root.

    For superusers, stores `False` under the cache key
    `maintenance_mode_frontend_available` with no expiry (timeout `None`); the
    key is overwritten, not deleted. Other users cause no change. How the
    flag is used is decided by whatever reads that key elsewhere.

    Returns:
        HttpResponseRedirect: Redirect to `/?t=<unix timestamp>`; the timestamp
        is a cache buster.
    """
    requester = request.user
    if requester.is_superuser:
        cache.set("maintenance_mode_frontend_available", False, None)

    cache_buster = int(time())
    return HttpResponseRedirect(f"/?t={cache_buster}")


================================================
FILE: concordia/views/projects.py
================================================
from urllib.parse import urlencode

from django.db.models import Count, Q, QuerySet
from django.http import Http404, HttpRequest, HttpResponse
from django.shortcuts import get_object_or_404, redirect
from django.utils.decorators import method_decorator

from concordia.api_views import APIListView
from concordia.models import Asset, Campaign, Project, TranscriptionStatus

from .decorators import default_cache_control, user_cache_control
from .utils import annotate_children_with_progress_stats, calculate_asset_stats


@method_decorator(default_cache_control, name="dispatch")
class ProjectDetailView(APIListView):
    """
    Paginated listing of the published items that belong to one project.

    The project is looked up from the `campaign_slug` and `slug` URL keyword
    arguments. Items may be narrowed by a `transcription_status` query
    parameter, and the context carries project/campaign objects together with
    the statistics computed by `calculate_asset_stats` and
    `annotate_children_with_progress_stats`.

    Attributes:
        template_name (str): Template rendered for the page.
        context_object_name (str): Context key holding the item list.
        paginate_by (int): Page size.
    """

    template_name = "transcriptions/project_detail.html"
    context_object_name = "items"
    paginate_by = 10

    def dispatch(self, request: HttpRequest, *args, **kwargs) -> HttpResponse:
        """
        Run the normal dispatch, falling back to a campaign redirect on 404.

        Args:
            request (HttpRequest): The incoming request.
            *args: Positional arguments forwarded to the superclass.
            **kwargs: Keyword arguments forwarded to the superclass.

        Returns:
            HttpResponse: The superclass response, or a redirect to the
                published campaign named by `campaign_slug` when the
                superclass raised `Http404`.

        Raises:
            Http404: If the fallback campaign lookup itself finds nothing.
        """
        try:
            response = super().dispatch(request, *args, **kwargs)
        except Http404:
            # The project (or page) was not found; send the visitor to the
            # campaign page instead, provided the campaign is published.
            published_campaigns = Campaign.objects.published()
            fallback_campaign = get_object_or_404(
                published_campaigns, slug=self.kwargs["campaign_slug"]
            )
            return redirect(fallback_campaign)
        else:
            return response

    def get_queryset(self, filter_by_reviewable: bool = False) -> QuerySet:
        """
        Build the item queryset for the current project.

        Side effects: stores the resolved project on `self.project` and the
        filters to propagate to sublevel links on `self.filters`.

        Request Parameters:
            - `transcription_status` (str, optional): Used only when
              `filter_by_reviewable` is false. If it is a key of
              `TranscriptionStatus.CHOICE_MAP`, items whose count for that
              status is zero are excluded.

        Args:
            filter_by_reviewable (bool): When true, items having an asset with
                a transcription by the requesting user are excluded and the
                status filter is forced to `TranscriptionStatus.SUBMITTED`.

        Returns:
            QuerySet: Published items ordered by `item_id`, each annotated
                with a `<status>_count` for every key of
                `TranscriptionStatus.CHOICE_MAP`.

        Raises:
            Http404: If no published project matches the URL slugs.
        """
        published_projects = Project.objects.published().select_related("campaign")
        self.project = get_object_or_404(
            published_projects,
            slug=self.kwargs["slug"],
            campaign__slug=self.kwargs["campaign_slug"],
        )

        items = self.project.item_set.published().order_by("item_id")
        if filter_by_reviewable:
            items = items.exclude(asset__transcription__user=self.request.user.id)

        # One conditional Count per transcription status.
        per_status_counts = {}
        for key in TranscriptionStatus.CHOICE_MAP:
            per_status_counts[f"{key}_count"] = Count(
                "asset", filter=Q(asset__transcription_status=key)
            )
        items = items.annotate(**per_status_counts)

        self.filters: dict[str, str] = {}

        status = (
            TranscriptionStatus.SUBMITTED
            if filter_by_reviewable
            else self.request.GET.get("transcription_status")
        )
        if status not in TranscriptionStatus.CHOICE_MAP:
            return items

        # Only specific query-string parameters are passed down to lower-level
        # pages, so the accepted one is recorded here.
        self.filters["transcription_status"] = status
        return items.exclude(**{f"{status}_count": 0})

    def get_context_data(self, **kws) -> dict[str, object]:
        """
        Assemble the template context for the project page.

        Context Format:
            - `project` (Project): The project resolved in `get_queryset`.
            - `campaign` (Campaign): `project.campaign`.
            - `filters` (dict[str, str]): Present only when a filter applies.
            - `sublevel_querystring` (str): URL-encoded `filters`; present
              only when a filter applies.
            - `transcription_status`: `TranscriptionStatus.SUBMITTED` in
              reviewable mode, otherwise the raw `transcription_status` query
              parameter (possibly `None`).
            - `filter_assets` (bool): Set to True only in reviewable mode.
            - Keys written by `calculate_asset_stats`: `contributor_count`,
              `transcription_status_counts`, and a `<status>_count` /
              `<status>_percent` pair per transcription status.
            - Each object in `items` additionally receives the attributes set
              by `annotate_children_with_progress_stats`.

        Args:
            **kws: Context keyword arguments. `filter_by_reviewable` (bool) is
                recognised; when true, assets transcribed by the requesting
                user are left out of the statistics.

        Returns:
            dict[str, object]: The populated context.
        """
        ctx = super().get_context_data(**kws)
        project = self.project
        ctx["project"] = project
        ctx["campaign"] = project.campaign

        if self.filters:
            ctx["sublevel_querystring"] = urlencode(self.filters)
            ctx["filters"] = self.filters

        project_assets = Asset.objects.filter(
            item__project=project, published=True, item__published=True
        )
        if kws.get("filter_by_reviewable", False):
            project_assets = project_assets.exclude(
                transcription__user=self.request.user.id
            )
            ctx["filter_assets"] = True
            ctx["transcription_status"] = TranscriptionStatus.SUBMITTED
        else:
            ctx["transcription_status"] = self.request.GET.get("transcription_status")

        calculate_asset_stats(project_assets, ctx)
        annotate_children_with_progress_stats(ctx["items"])

        return ctx

    def serialize_context(self, context: dict[str, object]) -> dict[str, object]:
        """
        Produce the API payload for this view.

        Args:
            context (dict[str, object]): The view context to serialize.

        Returns:
            dict[str, object]: The superclass payload with an added `project`
                entry holding `self.serialize_object(context["project"])`.
        """
        payload = super().serialize_context(context)
        payload["project"] = self.serialize_object(context["project"])
        return payload


@method_decorator(user_cache_control, name="dispatch")
class FilteredProjectDetailView(ProjectDetailView):
    """
    `ProjectDetailView` variant that always runs in reviewable mode.

    Both the queryset and the context are built with
    `filter_by_reviewable=True`, which (per the parent class) excludes content
    transcribed by the requesting user and fixes the status filter to
    `TranscriptionStatus.SUBMITTED`.
    """

    def get_queryset(self) -> QuerySet:
        """
        Return the parent queryset built in reviewable mode.

        Returns:
            QuerySet: Result of `ProjectDetailView.get_queryset` called with
                `filter_by_reviewable=True`.
        """
        reviewable_items = super().get_queryset(filter_by_reviewable=True)
        return reviewable_items

    def get_context_data(self, **kws) -> dict[str, object]:
        """
        Return the parent context built in reviewable mode.

        Any caller-supplied `filter_by_reviewable` value is overridden with
        True before delegating.

        Args:
            **kws: Context keyword arguments.

        Returns:
            dict[str, object]: Context produced by the parent implementation.
        """
        kws.update(filter_by_reviewable=True)
        return super().get_context_data(**kws)


================================================
FILE: concordia/views/rate_limit.py
================================================
from django.http import HttpRequest, HttpResponse, JsonResponse
from django.shortcuts import render

from concordia.utils import request_accepts_json


def ratelimit_view(
    request: HttpRequest, exception: Exception | None = None
) -> HttpResponse:
    """
    Build the HTTP 429 response returned to rate-limited clients.

    A JSON body is returned when the request carries
    `X-Requested-With: XMLHttpRequest` or when `request_accepts_json` reports
    that the client accepts JSON; otherwise the `429.html` template is
    rendered. The response always carries a `Retry-After` header of 900
    (15 * 60).

    Args:
        request (HttpRequest): The request that was rate-limited.
        exception (Exception | None): The triggering exception, if any. Its
            string form is included in the payload under `exception`.

    Returns:
        HttpResponse: JSON or HTML response with status 429.
    """
    status_code = 429

    ctx = {
        "error": "You have been rate-limited. Please try again later.",
        "status": status_code,
    }
    if exception is not None:
        ctx["exception"] = str(exception)

    # The header check comes first so the helper is only consulted when the
    # request is not flagged as an XHR.
    is_xhr = request.headers.get("x-requested-with") == "XMLHttpRequest"
    wants_json = is_xhr or request_accepts_json(request)

    if wants_json:
        response = JsonResponse(ctx, status=status_code)
    else:
        response = render(request, "429.html", context=ctx, status=status_code)

    response["Retry-After"] = 15 * 60
    return response


================================================
FILE: concordia/views/simple_pages.py
================================================
import datetime
from typing import Any

import markdown
from django.core.cache import cache
from django.http import HttpRequest, HttpResponse
from django.shortcuts import get_object_or_404, render
from django.template import Context, Template
from django.utils.http import http_date
from django.utils.timezone import now
from django.views.generic import RedirectView

from concordia.models import Guide, SimplePage, SiteReport
from concordia.parser import paginate_blog_posts

from .decorators import default_cache_control


@default_cache_control
def simple_page(
    request: HttpRequest,
    path: str | None = None,
    slug: str | None = None,
    body_ctx: dict[str, Any] | None = None,
    template: str = "static-page.html",
) -> HttpResponse:
    """
    Render a `SimplePage` record whose body is Markdown.

    The page body (followed by the body of the first related guide, if one
    exists) is converted from Markdown, then rendered as a Django template
    using `body_ctx`. Breadcrumbs are derived from the segments of
    `request.path`, and the language code is `es` when the path, with slashes
    removed, ends in `-esp` (otherwise `en`).

    Request Parameters:
        path (str, optional): Value matched against `SimplePage.path`.
            Falls back to `request.path` when empty or missing.
        slug (str, optional): Not used by this function.
        body_ctx (dict[str, Any], optional): Variables available while the
            page body is rendered. They are also merged into the outer
            template context, overriding same-named keys.
        template (str): Template used for the final render.

    Returns:
        HttpResponse: The rendered page, with a `Created` header formatted
        from `page.created_on`.

    Raises:
        Http404: If no `SimplePage` has the requested path.
    """
    path = path or request.path
    body_ctx = {} if body_ctx is None else body_ctx

    page = get_object_or_404(SimplePage, path=path)

    converter = markdown.Markdown(extensions=["meta"])

    # One breadcrumb per ancestor path segment, then the page itself.
    segments = request.path.strip("/").split("/")
    breadcrumbs = [
        ("/%s/" % "/".join(segments[0:depth]), segment.replace("-", " ").title())
        for depth, segment in enumerate(segments[:-1], start=1)
    ]
    breadcrumbs.append((request.path, page.title))

    is_spanish = request.path.replace("/", "").endswith("-esp")

    ctx = {
        "language_code": "es" if is_spanish else "en",
        "title": page.title,
        "breadcrumbs": breadcrumbs,
    }

    guide = page.guide_set.all().first()
    if guide is None:
        html = page.body
    else:
        html = "".join((page.body, guide.body))
        # Pages with a guide also get the guide navigation list.
        ctx["add_navigation"] = True
        ctx["guides"] = Guide.objects.order_by("order")

    body_template = Template(converter.convert(html))
    ctx["body"] = body_template.render(Context(body_ctx))
    ctx.update(body_ctx)

    response = render(request, template, ctx)
    response["Created"] = http_date(page.created_on.timestamp())
    return response


@default_cache_control
def about_simple_page(
    request: HttpRequest, path: str | None = None, slug: str | None = None
) -> HttpResponse:
    """
    Render the "about" page through `simple_page` with site statistics.

    The extra context is cached under `about_simple_page-about_context` for
    one hour (60 * 60 seconds) and rebuilt when the cached value is missing
    or falsy. It is built from the latest `TOTAL` and `RETIRED_TOTAL`
    `SiteReport` rows; when either is absent, an unsaved `SiteReport` with
    zeroed counters stands in for it.

    Context keys passed as `body_ctx`:
        - `report_date` (datetime): The current time minus one day.
        - `campaigns_published`: From the `TOTAL` report.
        - `assets_published`: `TOTAL` + `RETIRED_TOTAL`.
        - `assets_completed`: `TOTAL` + `RETIRED_TOTAL`.
        - `assets_waiting_review`: `TOTAL` + `RETIRED_TOTAL`.
        - `users_activated`: From the `TOTAL` report.
        - `blog_posts`: The value returned by `paginate_blog_posts()`.
        - `about_page` (bool): Always True.

    Returns:
        HttpResponse: The response produced by `simple_page`.
    """
    context_cache_key = "about_simple_page-about_context"

    about_context = cache.get(context_cache_key)
    if about_context:
        return simple_page(request, path, slug, about_context)

    try:
        active_report = SiteReport.objects.filter(
            report_name=SiteReport.ReportName.TOTAL
        ).latest()
    except SiteReport.DoesNotExist:
        active_report = SiteReport(
            campaigns_published=0,
            assets_published=0,
            assets_completed=0,
            assets_waiting_review=0,
            users_activated=0,
        )

    try:
        retired_report = SiteReport.objects.filter(
            report_name=SiteReport.ReportName.RETIRED_TOTAL
        ).latest()
    except SiteReport.DoesNotExist:
        retired_report = SiteReport(
            assets_published=0,
            assets_completed=0,
            assets_waiting_review=0,
        )

    # Asset counters are reported as active + retired.
    combined_asset_totals = {
        field: getattr(active_report, field) + getattr(retired_report, field)
        for field in ("assets_published", "assets_completed", "assets_waiting_review")
    }

    about_context = {
        "report_date": now() - datetime.timedelta(days=1),
        "campaigns_published": active_report.campaigns_published,
        **combined_asset_totals,
        "users_activated": active_report.users_activated,
        "blog_posts": paginate_blog_posts(),
        "about_page": True,
    }
    cache.set(context_cache_key, about_context, 60 * 60)

    return simple_page(request, path, slug, about_context)


# These views keep existing links to help-center URLs working now that the
# URLs no longer include "help-center". They can be removed once all links
# have been updated.


class HelpCenterRedirectView(RedirectView):
    """Redirect a help-center page URL to the matching `/get-started/` URL."""

    def get_redirect_url(self, *args, **kwargs):
        """
        Build the redirect target from the `page_slug` URL keyword argument.

        Returns:
            str: `/get-started/<page_slug>/`.
        """
        page_slug = kwargs["page_slug"]
        return "".join(("/get-started/", page_slug, "/"))


class HelpCenterSpanishRedirectView(RedirectView):
    """Redirect a help-center page URL to the matching `/get-started-esp/` URL."""

    def get_redirect_url(self, *args, **kwargs):
        """
        Build the redirect target from the `page_slug` URL keyword argument.

        Returns:
            str: `/get-started-esp/<page_slug>-esp/`.
        """
        page_slug = kwargs["page_slug"]
        return "".join(("/get-started-esp/", page_slug, "-esp/"))


# End of help-center views


================================================
FILE: concordia/views/topics.py
================================================
from typing import Any
from urllib.parse import urlencode

from django.db.models import Count, F, FilteredRelation, Q
from django.utils.decorators import method_decorator
from django.views.decorators.cache import cache_page

from concordia.api_views import APIDetailView
from concordia.models import Asset, Topic, TranscriptionStatus

from .decorators import default_cache_control
from .utils import annotate_children_with_progress_stats, calculate_asset_stats


@method_decorator(default_cache_control, name="dispatch")
@method_decorator(cache_page(60 * 60, cache="view_cache"), name="dispatch")
class TopicDetailView(APIDetailView):
    """
    Display a topic and its projects with aggregated progress stats.

    Renders the topic detail page with a list of published projects tied to
    the topic, annotated with per-status asset counts. Supports an optional
    transcription-status filter which narrows projects to those containing
    assets in that status and respects per-topic URL filter overrides.

    Attributes:
        template_name (str): Template used for topic detail.
        context_object_name (str): Context key for the main object (`topic`).
        queryset (QuerySet[Topic]): Base queryset for lookup and ordering.
    """

    template_name = "transcriptions/topic_detail.html"
    context_object_name = "topic"
    queryset = Topic.objects.published().order_by("title")

    def get_context_data(self, **kwargs: Any) -> dict[str, object]:
        """
        Build context for the topic detail template.

        Computes project-level progress annotations and applies an optional
        status filter. Also computes topic-wide asset statistics and prepares
        sublevel querystring parameters for downstream pages.

        Request Parameters:
            - `transcription_status` (str, optional): When present and a key
              of `TranscriptionStatus.CHOICE_MAP`, filters projects to those
              that:
                * have at least one asset in the given status, and
                * have a null, empty, or matching `url_filter` on their
                  through relation to this topic.

        Context Format:
            - `topic` (Topic): The topic being viewed.
            - `projects` (QuerySet): Topic projects with:
                * per-status counts (e.g., `submitted_count`),
                * `topic_ordering` and `topic_url_filter` from the through
                  relation, and
                * the attributes set by
                  `annotate_children_with_progress_stats`.
            - `filters` (dict[str, str]): Applied filter parameters (may be
              empty).
            - `sublevel_querystring` (str): URL-encoded `filters` for links.
            - `transcription_status` (str): The status filter; set only when
              the requested status is valid.
            - Keys written by `calculate_asset_stats` for the topic's
              published assets: `contributor_count`,
              `transcription_status_counts`, and a `<status>_count` /
              `<status>_percent` pair per transcription status.

        Args:
            **kwargs: Additional context arguments passed by the base class.

        Returns:
            dict[str, object]: Context for rendering the topic detail page.
        """
        ctx = super().get_context_data(**kwargs)
        topic = ctx["topic"]

        status = self.request.GET.get("transcription_status")
        status_valid = status in TranscriptionStatus.CHOICE_MAP

        projects = (
            topic.project_set.published().annotate(
                **{
                    f"{key}_count": Count(
                        "item__asset",
                        filter=Q(
                            item__published=True,
                            item__asset__published=True,
                            item__asset__transcription_status=key,
                        ),
                    )
                    for key in TranscriptionStatus.CHOICE_MAP.keys()
                }
            )
            # Pin the through relation to THIS topic, otherwise it will annotate for
            # each ProjectTopic the project is part of
            .annotate(
                pt=FilteredRelation(
                    "projecttopic", condition=Q(projecttopic__topic=topic)
                )
            )
            # Pull fields from the pinned alias
            .annotate(
                topic_ordering=F("pt__ordering"),
                topic_url_filter=F("pt__url_filter"),
            )
        )

        # If there's a status filter, we want to exclude any projects that
        # don't have assets in that status, as well as any that have a URL
        # filter that's different from the status filter
        if status_valid:
            ctx["transcription_status"] = status
            projects = projects.filter(
                Q(pt__url_filter__isnull=True)
                | Q(pt__url_filter="")
                | Q(pt__url_filter=status)
            ).exclude(**{f"{status}_count": 0})

        projects = projects.order_by("topic_ordering", "campaign__title", "title")

        ctx["filters"] = filters = {}
        if status_valid:
            # We only want to pass specific QS parameters to lower-level search pages:
            filters["transcription_status"] = status
        ctx["sublevel_querystring"] = urlencode(filters)

        annotate_children_with_progress_stats(projects)
        ctx["projects"] = projects

        topic_assets = Asset.objects.filter(
            item__project__topics=self.object,
            item__project__published=True,
            item__published=True,
            published=True,
        )

        calculate_asset_stats(topic_assets, ctx)

        return ctx

    def serialize_context(self, context: dict[str, object]) -> dict[str, object]:
        """
        Serialize context for API consumers.

        Extends the base serializer with a `related_links` list derived from the
        topic's associated helpful links.

        Args:
            context (dict[str, object]): Fully built template context.

        Returns:
            dict[str, object]: JSON-serializable payload that includes the base
                fields from `APIDetailView.serialize_context` and:
                - `object.related_links` (list[dict]): Each with:
                    * `title` (str)
                    * `url` (str)
        """
        ctx = super().serialize_context(context)
        # values_list() is given exactly two fields, so every row is a
        # 2-tuple; unpack exactly two names to match.
        ctx["object"]["related_links"] = [
            {"title": title, "url": url}
            for title, url in self.object.helpfullink_set.values_list(
                "title", "link_url"
            )
        ]
        return ctx


================================================
FILE: concordia/views/utils.py
================================================
import datetime
from collections.abc import Iterable
from time import time

from django.conf import settings
from django.db.models import Count, Max, Q, QuerySet
from django.db.models.functions import Greatest
from django.http import HttpRequest
from django.utils import timezone
from django.utils.timezone import now

from concordia.models import Asset, Transcription, TranscriptionStatus


def _get_pages(request: HttpRequest) -> QuerySet:
    """
    Build the queryset of assets the requesting user has worked on.

    Query parameters read from `request.GET`:
      - `activity`: `transcribed` or `reviewed` restricts to that kind of
        activity; any other value matches either.
      - `status` (repeatable): when at least one value is given, every one of
        `completed`, `submitted` and `in_progress` that is NOT listed is
        excluded.
      - `start` / `end` (`YYYY-MM-DD`): with both, a range from `start` up to
        the day after `end`; with only one, activity on exactly that day.
      - `order_by`: `date-ascending` sorts oldest first; anything else sorts
        newest first. Ties are broken by descending id.
      - `campaign`: restricts to assets of that campaign primary key.

    Regardless of parameters, only assets whose latest activity falls within
    the last 180 days (6 * 30) are returned.

    Annotations added: `last_transcribed`, `last_reviewed` and
    `latest_activity`.

    Args:
        request (HttpRequest): The incoming request; `user` and `GET` are read.

    Returns:
        QuerySet: Filtered, annotated and ordered `Asset` queryset.

    Raises:
        ValueError: If `start` or `end` is non-empty but does not match
            `%Y-%m-%d` (raised by `strptime`).
    """
    user = request.user

    activity = request.GET.get("activity", None)
    if activity == "transcribed":
        activity_filter = Q(transcription__user=user)
    elif activity == "reviewed":
        activity_filter = Q(transcription__reviewed_by=user)
    else:
        activity_filter = Q(transcription__user=user) | Q(
            transcription__reviewed_by=user
        )
    assets = Asset.objects.filter(activity_filter)

    requested_statuses = request.GET.getlist("status")
    if requested_statuses:
        # Drop every status the caller did not ask for.
        selectable_statuses = (
            ("completed", TranscriptionStatus.COMPLETED),
            ("submitted", TranscriptionStatus.SUBMITTED),
            ("in_progress", TranscriptionStatus.IN_PROGRESS),
        )
        for param_value, status in selectable_statuses:
            if param_value not in requested_statuses:
                assets = assets.exclude(transcription_status=status)

    assets = assets.select_related("item", "item__project", "item__project__campaign")

    # NOTE(review): `filter` is passed to Greatest exactly as before; it is
    # unclear whether Greatest makes any use of it. Confirm before relying on it.
    assets = assets.annotate(
        last_transcribed=Max(
            "transcription__created_on",
            filter=Q(transcription__user=user),
        ),
        last_reviewed=Max(
            "transcription__updated_on",
            filter=Q(transcription__reviewed_by=user),
        ),
        latest_activity=Greatest(
            "last_transcribed",
            "last_reviewed",
            filter=Q(transcription__user=user) | Q(transcription__reviewed_by=user),
        ),
    )

    fmt = "%Y-%m-%d"

    start = request.GET.get("start", None)
    start_date = (
        timezone.make_aware(datetime.datetime.strptime(start, fmt)) if start else None
    )

    end = request.GET.get("end", None)
    end_date = (
        timezone.make_aware(datetime.datetime.strptime(end, fmt)) if end else None
    )

    has_start = start_date is not None
    has_end = end_date is not None
    if has_start and has_end:
        # Make the end of the range inclusive of the whole end day.
        end_date += datetime.timedelta(days=1)
        end = end_date.strftime(fmt)
        assets = assets.filter(latest_activity__range=[start, end])
    elif has_start or has_end:
        single_day = start_date or end_date
        assets = assets.filter(
            latest_activity__year=single_day.year,
            latest_activity__month=single_day.month,
            latest_activity__day=single_day.day,
        )

    # CONCD-189 only show pages from the last 6 months
    # This should be an aware datetime, not a date. A date is cast
    # to a naive datetime when it's compared to a datetime
    # field, as is being done here
    six_months_ago = now() - datetime.timedelta(days=6 * 30)
    assets = assets.filter(latest_activity__gte=six_months_ago)

    order_by = request.GET.get("order_by", "date-descending")
    activity_ordering = (
        "latest_activity" if order_by == "date-ascending" else "-latest_activity"
    )
    assets = assets.order_by(activity_ordering, "-id")

    campaign_id = request.GET.get("campaign", None)
    if campaign_id is not None:
        assets = assets.filter(item__project__campaign__pk=campaign_id)

    return assets


def calculate_asset_stats(asset_qs: QuerySet, ctx: dict) -> None:
    """
    Populate `ctx` with contributor and per-status statistics for `asset_qs`.

    Keys written to `ctx`:
      - `contributor_count`: Number of distinct non-null `user_id` /
        `reviewed_by` values across transcriptions of the given assets.
      - `transcription_status_counts`: List of
        `(status_key, status_label, count)` tuples, one per entry of
        `TranscriptionStatus.CHOICES`, in that order.
      - `<status_key>_count` and `<status_key>_percent` for every status.

    A percentage in the range [99, 100) is reported as 99 rather than being
    rounded up; all other values are rounded with `round()`. A status with no
    assets gets 0.

    Args:
        asset_qs (QuerySet): The `Asset` queryset to summarise.
        ctx (dict): Context dictionary, modified in place.

    Returns:
        None
    """
    asset_count = asset_qs.count()

    contributor_rows = Transcription.objects.filter(asset__in=asset_qs).values_list(
        "user_id", "reviewed_by"
    )
    user_ids = set()
    for transcriber_id, reviewer_id in contributor_rows.iterator():
        user_ids.update((transcriber_id, reviewer_id))
    # A null transcriber or reviewer is not a contributor.
    user_ids.discard(None)

    ctx["contributor_count"] = len(user_ids)

    # order_by() clears any ordering so it cannot affect the grouping.
    status_counts_by_key = dict(
        asset_qs.values_list("transcription_status")
        .annotate(Count("transcription_status"))
        .order_by()
    )

    labeled_status_counts = []
    ctx["transcription_status_counts"] = labeled_status_counts

    for status_key, status_label in TranscriptionStatus.CHOICES:
        value = status_counts_by_key.get(status_key, 0)
        if not value:
            pct = 0
        else:
            pct_raw = 100 * (value / asset_count)
            pct = 99 if 99 <= pct_raw < 100 else round(pct_raw)

        ctx[f"{status_key}_percent"] = pct
        ctx[f"{status_key}_count"] = value
        labeled_status_counts.append((status_key, status_label, value))


def annotate_children_with_progress_stats(children: Iterable) -> None:
    """
    Attach progress attributes to every object in `children`.

    For each status key in `TranscriptionStatus.CHOICES`, the object's
    `<status>_count` attribute is read (a missing attribute counts as 0).
    The following attributes are then set on the object:

      - `total_count`: Sum of all per-status counts.
      - `<status>_percent`: Share of the total for that status; 0 when the
        total is 0. Values in the range [99, 100) are reported as 99 rather
        than rounded up; everything else goes through `round()`.
      - `lowest_transcription_status`: The first status, in `CHOICES` order,
        with a count above zero, or None when every count is zero.

    Args:
        children (Iterable): Objects to annotate in place.

    Returns:
        None
    """
    status_keys = [key for key, __ in TranscriptionStatus.CHOICES]

    for child in children:
        counts = {key: getattr(child, f"{key}_count", 0) for key in status_keys}

        total = sum(counts.values())
        child.total_count = total

        lowest_status = None
        for key in status_keys:
            count = counts[key]

            pct = 0
            if total > 0:
                pct_raw = 100 * (count / total)
                pct = 99 if 99 <= pct_raw < 100 else round(pct_raw)
            setattr(child, f"{key}_percent", pct)

            if count > 0 and lowest_status is None:
                lowest_status = key

        child.lowest_transcription_status = lowest_status


class AnonymousUserValidationCheckMixin:
    """
    Class-based-view mixin exposing `anonymous_user_validation_required`.

    The flag is added to the context returned by the next
    `get_context_data()` in the MRO, so the mixin must be combined with a
    view class that provides that method and a `request` attribute.
    """

    def get_context_data(self, *args, **kwargs) -> dict:
        """
        Extend the parent context with the anonymous validation flag.

        For authenticated users the flag is always False. For anonymous
        users it is True when the time elapsed since the session's
        `turnstile_last_validated` value (0 when absent) exceeds
        `settings.ANONYMOUS_USER_VALIDATION_INTERVAL`.

        Positional arguments are accepted but not forwarded to the parent.

        Returns:
            dict: The parent context plus `anonymous_user_validation_required`.
        """
        context = super().get_context_data(**kwargs)

        validation_required = False
        if not self.request.user.is_authenticated:
            last_validated = self.request.session.get("turnstile_last_validated", 0)
            elapsed = time() - last_validated
            validation_required = elapsed > settings.ANONYMOUS_USER_VALIDATION_INTERVAL

        context["anonymous_user_validation_required"] = validation_required
        return context


================================================
FILE: concordia/views/visualizations.py
================================================
from django.core.cache import caches
from django.http import JsonResponse
from django.utils.decorators import method_decorator
from django.views import View
from django.views.decorators.cache import never_cache


@method_decorator(never_cache, name="dispatch")
class VisualizationDataView(View):
    """
    Serve cached visualization data as JSON, returning a 404 JSON error if missing.

    A single endpoint that, given a `name` slug in the URL, looks up exactly
    that key in the 'visualization_cache' and returns its contents as JSON.
    If no entry exists under that key, responds with a 404 and a JSON error message.

    Responses are marked as never cacheable via `never_cache` on `dispatch`.

    Attributes:
        cache (BaseCache): The Django cache used to retrieve data.

    URL Parameters:
        name (str): The slug identifying which visualization data to return.
            Example: "daily-transcription-activity-by-campaign".

    Returns:
        JsonResponse:
            - On success: the cached data (any JSON-serializable structure,
              including lists and other non-dict top-level values).
            - On failure: a JSON object {"error": "..."} with HTTP status 404.
    """

    cache = caches["visualization_cache"]

    def get(self, request, name):
        """
        Return the cached entry stored under `name` as a JSON response.

        Args:
            request (HttpRequest): The current request.
            name (str): Cache key of the visualization data set.

        Returns:
            JsonResponse: The cached data, or a 404 error object when the cache
                has no entry (or a `None` entry) for `name`.
        """
        data = self.cache.get(name)
        if data is None:
            return JsonResponse(
                {"error": f"No visualization data found for '{name}'"}, status=404
            )

        # safe=False is required for the documented contract: with the default
        # safe=True, JsonResponse raises TypeError for any top-level value that
        # is not a dict (for example a list of data points).
        return JsonResponse(data, safe=False)


================================================
FILE: concordia/widgets.py
================================================
from django import forms


class EmailWidget(forms.EmailInput):
    """Email input widget rendered with the `forms/widgets/email.html` template."""

    template_name = "forms/widgets/email.html"


================================================
FILE: concordia/wsgi.py
================================================
"""
WSGI config for concordia project.

It exposes the WSGI callable as a module-level variable named ``application``.

For more information on this file, see
https://docs.djangoproject.com/en/2.0/howto/deployment/wsgi/
"""

from django.core.wsgi import get_wsgi_application

# Module-level WSGI callable, exposed under the name ``application``.
application = get_wsgi_application()


================================================
FILE: configuration/__init__.py
================================================


================================================
FILE: configuration/admin.py
================================================
from typing import Any

from django.contrib import admin, messages
from django.http import HttpRequest, HttpResponse
from django.template.response import TemplateResponse
from django.utils.html import format_html

from configuration.models import Configuration


@admin.register(Configuration)
class ConfigurationAdmin(admin.ModelAdmin):
    """
    Admin configuration for the `Configuration` model.

    Behavior:
        - Displays the key, raw value, and description in the changelist.
        - Provides a read-only `validated_value` field on the change form that
          shows the interpreted value as returned by `Configuration.get_value`.
        - Overrides `changeform_view` to add a two-step confirmation flow when
          saving changes to an existing object, including a preview of the
          parsed value. An explicit cancel action re-renders the change form
          with the submitted data instead of saving it.
        - Every request that is not a POST against an existing object by a
          user holding change permission (GET requests, the add view, unknown
          objects, users without change permission) is handled by the stock
          `ModelAdmin` implementation, including its permission errors.
    """

    list_display = ("key", "value", "description")
    readonly_fields = ("validated_value",)

    def validated_value(self, obj: Configuration) -> str:
        """
        Render the parsed configuration value and explanatory text.

        Notes:
            This method does not alter the base `ModelAdmin` behavior. It is a
            helper used by the change form to display both the interpreted
            value from `Configuration.get_value()` and a short explanation
            that this parsed value is what application code will consume.

            If `get_value()` raises, an error note is rendered instead so that
            the form needed to correct the value can still be displayed.

        Args:
            obj (Configuration): The instance being edited.

        Returns:
            str: HTML-safe string produced by `format_html` containing the
                parsed value and explanatory note, or an error note when the
                value cannot be parsed.
        """
        try:
            parsed_value = obj.get_value()
        except Exception as e:
            # A value that cannot be parsed must not break rendering of the
            # very form that is used to fix it.
            return format_html(
                "<div style='color: #ba2121;'>Unable to interpret value: {}</div>",
                e,
            )
        return format_html(
            "<div>{}</div><div style='color: #777; font-size: 0.9em;'>{}</div>",
            parsed_value,
            "This is the interpreted value based on the selected data type. "
            "This value is what will be seen by the code that uses this "
            "configuration.",
        )

    def _render_bound_change_form(
        self,
        request: HttpRequest,
        obj: Configuration,
        form: Any,
        object_id: str | None,
        form_url: str,
        extra_context: dict[str, Any] | None = None,
    ) -> HttpResponse:
        """
        Re-render the change form for `obj` from an already bound form.

        The context is built manually because delegating a POST request to the
        base `changeform_view` would validate and save the submitted data.

        Args:
            request (HttpRequest): The current request.
            obj (Configuration): The existing object being edited.
            form: Model form bound to the submitted data.
            object_id (str | None): Primary key of the object being edited.
            form_url (str): Form action URL.
            extra_context (dict[str, Any] | None): Extra template context,
                applied on top of the generated context.

        Returns:
            HttpResponse: The rendered change form; nothing is saved.
        """
        admin_form = admin.helpers.AdminForm(
            form,
            list(self.get_fieldsets(request, obj)),
            self.get_prepopulated_fields(request, obj),
            self.get_readonly_fields(request, obj),
            model_admin=self,
        )
        context = {
            **self.admin_site.each_context(request),
            "title": f"Edit Configuration: {obj.key}",
            "adminform": admin_form,
            "inline_admin_formsets": [],
            "media": self.media + form.media,
            "object_id": object_id,
            "original": obj,
            "opts": self.model._meta,
            "add": False,
            "change": True,
            "is_popup": False,
            "save_as": self.save_as,
            "has_view_permission": self.has_view_permission(request, obj),
            "has_add_permission": self.has_add_permission(request),
            "has_change_permission": self.has_change_permission(request, obj),
            "has_delete_permission": self.has_delete_permission(request, obj),
            "form_url": form_url,
            "to_field": None,
            "has_editable_inline_admin_formsets": False,
            **(extra_context or {}),
        }
        return self.render_change_form(
            request,
            context=context,
            add=False,
            change=True,
            form_url=form_url,
            obj=obj,
        )

    def changeform_view(
        self,
        request: HttpRequest,
        object_id: str | None = None,
        form_url: str = "",
        extra_context: dict[str, Any] | None = None,
    ) -> HttpResponse:
        """
        Override the base change form view to add a confirmation step.

        Differences from the base implementation (these apply only to POST
        requests against an existing object made by a user who holds change
        permission; everything else is delegated to the base view, which also
        produces the usual permission and missing-object responses):
            - On initial POST, validate the form and, if valid, render a
              confirmation template that previews the parsed value produced by
              `Configuration.get_value()`. If parsing fails, show an error and
              re-render the change form without saving.
            - On confirmation POST (`_confirm_update`), save the instance and
              show a success message.
            - On cancel POST (`cancel_update`), rebuild the standard change
              form context manually and re-render the change form instead of
              delegating to the base method (which would otherwise proceed with
              the change because it is a POST).

        Args:
            request (HttpRequest): The current request.
            object_id (str | None): Primary key of the object being edited.
            form_url (str): Form action URL.
            extra_context (dict[str, Any] | None): Extra template context.

        Returns:
            HttpResponse: Either the confirmation screen, the re-rendered
                change form, or the default response from the base view.
        """
        obj = self.get_object(request, object_id)

        # The confirmation flow needs an existing object (it reads obj.pk and
        # obj.key) and must never save on behalf of a user without change
        # permission. In every other situation the base view is the right
        # handler: it serves GETs, the add view and unknown ids, and raises
        # PermissionDenied for unauthorized POSTs.
        if (
            request.method != "POST"
            or obj is None
            or not self.has_change_permission(request, obj)
        ):
            return super().changeform_view(request, object_id, form_url, extra_context)

        form = self.get_form(request, obj)(request.POST, instance=obj)

        if "_confirm_update" in request.POST:
            # Second POST: confirmation of update
            if form.is_valid():
                form.save()
                self.message_user(request, "Configuration updated and cached.")
                return self.response_post_save_change(request, form.instance)
            self.message_user(
                request, "Invalid data on confirmation.", level=messages.ERROR
            )
            # The form is invalid, so the base view re-renders it with errors.
            return super().changeform_view(request, object_id, form_url, extra_context)

        if "cancel_update" in request.POST:
            return self._render_bound_change_form(
                request, obj, form, object_id, form_url, extra_context
            )

        # First POST: validate and show confirmation screen
        if not form.is_valid():
            return super().changeform_view(request, object_id, form_url, extra_context)

        new_instance = form.save(commit=False)
        try:
            parsed_value = new_instance.get_value()
        except Exception as e:
            self.message_user(request, f"Validation failed: {e}", level=messages.ERROR)
            # Do not delegate to the base view here: the form itself is valid,
            # so the base view would save the value that just failed parsing.
            return self._render_bound_change_form(
                request, obj, form, object_id, form_url, extra_context
            )

        context = {
            "title": f"Confirm Update of Configuration '{new_instance.key}'",
            # Form validation has already copied the submitted values onto
            # `obj`, so the stored state is re-read from the database.
            "original": self.model._default_manager.get(pk=obj.pk),
            "new_instance": new_instance,
            "parsed_value": parsed_value,
            "opts": self.model._meta,
            "object_id": object_id,
            "form_url": form_url,
            "request": request,
        }
        return TemplateResponse(
            request, "admin/configuration_confirm_update.html", context
        )


================================================
FILE: configuration/apps.py
================================================
from django.apps import AppConfig


class ConfigurationConfig(AppConfig):
    """Application config for the `configuration` app."""

    name = "configuration"
    default_auto_field = "django.db.models.BigAutoField"

    def ready(self):
        """Import the app's signals module when the app is ready."""
        from configuration import signals  # NOQA


================================================
FILE: configuration/management/__init__.py
================================================


================================================
FILE: configuration/management/commands/__init__.py
================================================


================================================
FILE: configuration/management/commands/configcache.py
================================================
from django.core.cache import caches
from django.core.management.base import BaseCommand


class Command(BaseCommand):
    """Management command that prints one entry of the configuration cache."""

    help = "Fetch a value from the configuration cache by key."  # NOQA: A003

    def add_arguments(self, parser):
        """Register the single positional `key` argument."""
        parser.add_argument("key", type=str, help="The cache key to retrieve")

    def handle(self, *args, **options):
        """
        Look up `config_<key>` in the 'configuration_cache' and report the result.

        Writes a warning when the cache returns None for the key; otherwise
        writes a success line followed by the string form of the cached value.
        """
        backend = caches["configuration_cache"]
        requested_key = options["key"]
        cached = backend.get(f"config_{requested_key}")

        if cached is not None:
            self.stdout.write(self.style.SUCCESS(f"Key '{requested_key}' found:"))
            self.stdout.write(str(cached))
            return

        self.stdout.write(
            self.style.WARNING(f"Key '{requested_key}' not found in cache.")
        )


================================================
FILE: configuration/migrations/0001_initial.py
================================================
# Generated by Django 4.2.16 on 2025-02-25 19:21

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Initial migration for the configuration app.

    Creates the `Configuration` model with the fields `id`, `key` (unique),
    `value`, `data_type` (choice field defaulting to "text") and `description`.
    """

    initial = True

    dependencies = []

    operations = [
        migrations.CreateModel(
            name="Configuration",
            fields=[
                (
                    "id",
                    models.BigAutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                (
                    "key",
                    models.CharField(
                        help_text="Unique identifier for the configuration setting",
                        max_length=255,
                        unique=True,
                    ),
                ),
                (
                    "value",
                    models.TextField(help_text="Value of the configuration setting"),
                ),
                (
                    "data_type",
                    models.CharField(
                        choices=[
                            ("text", "Plain text"),
                            ("number", "Number"),
                            ("boolean", "Boolean"),
                            ("json", "JSON"),
                            ("html", "HTML"),
                        ],
                        default="text",
                        help_text="Data type of the value",
                        max_length=10,
                    ),
                ),
                (
                    "description",
                    models.TextField(
                        blank=True,
                        help_text="Optional description of the configuration setting",
                    ),
                ),
            ],
        ),
    ]


================================================
FILE: configuration/migrations/0002_populate_configurations.py
================================================
# Generated by Django 4.2.16 on 2025-02-25 20:15

from django.db import migrations


def populate_configuration(apps, schema_editor):
    """
    Seed the review rate limit configuration entries.

    For each seeded setting, calls `update_or_create` on the historical
    `Configuration` model, matching on `key` and passing the complete entry
    (key included) as `defaults`.

    Args:
        apps: Migration app registry used to look up the historical model.
        schema_editor: Unused.
    """
    config_model = apps.get_model("configuration", "Configuration")

    # Column order of every row in `seed_rows`
    field_names = ("key", "data_type", "value", "description")
    seed_rows = (
        (
            "review_rate_limit_popup_message",
            "html",
            "<p>Volunteers can only accept {% configuration_value 'review_rate_limit' %} pages per minute.</p>\r\n<p>Please read all transcriptions completely to ensure they are whole and accurate. <a href=\"{% url 'how-to-review' %}\">See review instructions.</a></p>",
            "Message shown in the pop-up when a user exceeds the review rate limit",
        ),
        (
            "review_rate_limit_popup_title",
            "html",
            "You cannot yet accept this page",
            "Title of the error pop-up displayed when a user exceeds the review rate limit",
        ),
        (
            "review_rate_limit",
            "number",
            "4",
            "Number of reviews allowed per minute",
        ),
        (
            "review_rate_limit_banner_message",
            "html",
            "You cannot yet accept this page. Volunteers can only accept {% configuration_value 'review_rate_limit' %} pages per minute. See <a href=\"{% url 'how-to-review' %}\">review instructions</a>.",
            "Message to display on the banner when a user exceeds the review rate limit",
        ),
    )

    for row in seed_rows:
        defaults = dict(zip(field_names, row))
        config_model.objects.update_or_create(key=defaults["key"], defaults=defaults)


def revert_populate_configuration(apps, schema_editor):
    """
    Reverse step for the data migration; intentionally does nothing.

    The data cannot be restored to its previous state and there is no need
    to, but a reverse callable is required for the migration to be reversible.
    """


class Migration(migrations.Migration):
    """
    Data migration that runs `populate_configuration` when applied.

    The reverse callable, `revert_populate_configuration`, is a no-op.
    """

    dependencies = [
        ("configuration", "0001_initial"),
    ]

    operations = [
        migrations.RunPython(populate_configuration, revert_populate_configuration),
    ]


================================================
FILE: configuration/migrations/0003_populate_retry_configurations.py
================================================
# Generated by Django 4.2.16 on 2025-03-03 20:51

from django.db import migrations


def populate_retry_configuration(apps, schema_editor):
    """
    Seed the asset image import retry configuration entries.

    For each seeded setting, calls `update_or_create` on the historical
    `Configuration` model, matching on `key` and passing the complete entry
    (key included) as `defaults`.

    Args:
        apps: Migration app registry used to look up the historical model.
        schema_editor: Unused.
    """
    config_model = apps.get_model("configuration", "Configuration")

    # Column order of every row in `seed_rows`
    field_names = ("key", "data_type", "value", "description")
    seed_rows = (
        (
            "asset_image_import_max_retries",
            "number",
            "3",
            "The maximum number of times to retry downloading "
            "an asset image during import",
        ),
        (
            "asset_image_import_max_retry_delay",
            "number",
            "10",
            "The number of minutes to wait before retrying downloading "
            "an image during import. A non-positive number will disable retries. Should "
            "not be greater than around 45 to avoid the system duplicating the task.",
        ),
    )

    for row in seed_rows:
        defaults = dict(zip(field_names, row))
        config_model.objects.update_or_create(key=defaults["key"], defaults=defaults)


def revert_populate_retry_configuration(apps, schema_editor):
    """
    Reverse step for the data migration; intentionally does nothing.

    The data cannot be restored to its previous state and there is no need
    to, but a reverse callable is required for the migration to be reversible.
    """


class Migration(migrations.Migration):
    """
    Data migration that runs `populate_retry_configuration` when applied.

    The reverse callable, `revert_populate_retry_configuration`, is a no-op.
    """

    dependencies = [
        ("configuration", "0002_populate_configurations"),
    ]

    operations = [
        migrations.RunPython(
            populate_retry_configuration, revert_populate_retry_configuration
        ),
    ]


================================================
FILE: configuration/migrations/0004_alter_configuration_options.py
================================================
# Generated by Django 4.2.16 on 2025-03-18 20:01

from django.db import migrations


class Migration(migrations.Migration):
    """Set the model options of `Configuration` to order by `key`."""

    dependencies = [
        ("configuration", "0003_populate_retry_configurations"),
    ]

    operations = [
        migrations.AlterModelOptions(
            name="configuration",
            options={"ordering": ["key"]},
        ),
    ]


================================================
FILE: configuration/migrations/0005_alter_configuration_data_type.py
================================================
# Generated by Django 4.2.22 on 2025-07-29 17:28

from django.db import migrations, models


class Migration(migrations.Migration):
    """Alter `Configuration.data_type` so its choices include "rate"."""

    dependencies = [
        ("configuration", "0004_alter_configuration_options"),
    ]

    operations = [
        migrations.AlterField(
            model_name="configuration",
            name="data_type",
            field=models.CharField(
                choices=[
                    ("text", "Plain text"),
                    ("number", "Number"),
                    ("boolean", "Boolean"),
                    ("json", "JSON"),
                    ("html", "HTML"),
                    ("rate", "Rate"),
                ],
                default="text",
                help_text="Data type of the value",
                max_length=10,
            ),
        ),
    ]


================================================
FILE: configuration/migrations/0006_populate_next_asset_rate_limit.py
================================================
from django.db import migrations


def populate_configuration(apps, schema_editor):
    """
    Seed the `next_asset_rate_limit` configuration entry.

    Calls `update_or_create` on the historical `Configuration` model, matching
    on `key` and passing the complete entry (key included) as `defaults`.

    Args:
        apps: Migration app registry used to look up the historical model.
        schema_editor: Unused.
    """
    config_model = apps.get_model("configuration", "Configuration")

    rate_limit_entry = dict(
        key="next_asset_rate_limit",
        data_type="rate",
        value="4/m",
        description="Rate limit of anonymous users for the next_*_asset views. Format is 'X/u', where 'X' is the number of requests and 'u' is 's', 'm', 'h' or'd' (second, minute, hour or day). '5/s' means 'five per second'.",
    )

    config_model.objects.update_or_create(
        key=rate_limit_entry["key"], defaults=rate_limit_entry
    )


def revert_populate_configuration(apps, schema_editor):
    """
    Reverse step for the data migration; intentionally does nothing.

    The data cannot be restored to its previous state and there is no need
    to, but a reverse callable is required for the migration to be reversible.
    """


class Migration(migrations.Migration):
    """
    Data migration that runs `populate_configuration` when applied.

    The reverse callable, `revert_populate_configuration`, is a no-op.
    """

    dependencies = [
        ("configuration", "0005_alter_configuration_data_type"),
    ]

    operations = [
        migrations.RunPython(populate_configuration, revert_populate_configuration),
    ]


================================================
FILE: configuration/migrations/__init__.py
================================================


================================================
FILE: configuration/models.py
================================================
import json
from typing import Any

from django import template
from django.core.exceptions import ValidationError
from django.db import models

from configuration.validation import validate_rate


class Configuration(models.Model):
    """
    Typed key/value store for site configuration.

    Every setting is persisted as text in `value`; `data_type` records how
    that text should be interpreted, and `get_value()` performs the
    conversion to a Python object.

    Fields:
        key (models.CharField): Unique identifier for the setting.
        data_type (models.CharField): One of the `DataType` choices; selects
            the decoding applied by `get_value()`.
        value (models.TextField): Raw text representation of the value.
        description (models.TextField): Optional human-readable description.

    Meta:
        ordering: Sorted by `key`.
    """

    class DataType(models.TextChoices):
        """
        Data types that `get_value` knows how to decode.
        """

        TEXT = "text", "Plain text"
        NUMBER = "number", "Number"
        BOOLEAN = "boolean", "Boolean"
        JSON = "json", "JSON"
        HTML = "html", "HTML"
        RATE = "rate", "Rate"

    key = models.CharField(
        max_length=255,
        unique=True,
        help_text="Unique identifier for the configuration setting",
    )
    data_type = models.CharField(
        max_length=10,
        choices=DataType.choices,
        default=DataType.TEXT,
        help_text="Data type of the value",
    )
    value = models.TextField(help_text="Value of the configuration setting")
    description = models.TextField(
        blank=True, help_text="Optional description of the configuration setting"
    )

    class Meta:
        ordering = ["key"]

    def __str__(self) -> str:
        """
        Use the configuration key as the display name.
        """
        return self.key

    def get_value(self) -> "Any":
        """
        Convert the stored text in `value` to the type named by `data_type`.

        Behavior:
            - `NUMBER`: `int(value)` if that parses, otherwise `float(value)`
              if that parses, otherwise 0.
            - `BOOLEAN`: True only when `value.lower()` equals "true".
            - `JSON`: The result of `json.loads(value)`.
            - `HTML`: `value` compiled as a Django template and rendered with
              an empty context.
            - `RATE`: The result of `validate_rate(value)`, or an empty string
              when that raises `ValidationError`.
            - `TEXT` or any unrecognized type: `value` unchanged.

        Returns:
            Any: The decoded value; its concrete type depends on `data_type`.

        Raises:
            json.JSONDecodeError: If `data_type` is `JSON` and `value` is not
            valid JSON. Errors raised while compiling or rendering an `HTML`
            value are not caught here either.
        """
        kinds = Configuration.DataType
        kind = self.data_type

        if kind == kinds.NUMBER:
            # Prefer an integer; fall back to a float, then to 0.
            for cast in (int, float):
                try:
                    return cast(self.value)
                except ValueError:
                    continue
            return 0

        if kind == kinds.BOOLEAN:
            return self.value.lower() == "true"

        if kind == kinds.JSON:
            return json.loads(self.value)

        if kind == kinds.HTML:
            compiled = template.Template(self.value)
            return compiled.render(template.Context({}))

        if kind == kinds.RATE:
            try:
                return validate_rate(self.value)
            except ValidationError:
                return ""

        # DataType.TEXT or an unknown type: hand back the raw text
        return self.value


================================================
FILE: configuration/signals.py
================================================
from django.db.models.signals import post_save
from django.dispatch import receiver

from configuration.models import Configuration
from configuration.utils import cache_configuration_value


@receiver(post_save, sender=Configuration)
def update_cached_configuration_value(
    sender: type[Configuration], *, instance: Configuration, **kwargs
) -> None:
    """
    Refresh the cached value of a configuration entry after it is saved.

    Behavior:
        - Decode the saved instance with `Configuration.get_value()`.
        - When decoding succeeds, pass the instance key and the decoded value
          to `cache_configuration_value`.
        - When decoding raises any exception, do nothing, so that an invalid
          value is never written to the cache.

    Signals:
        Registered for `django.db.models.signals.post_save` sent by
        `configuration.models.Configuration`.

    Args:
        sender (type[Configuration]): The model class that sent the signal.
        instance (Configuration): The instance that was just saved.

    Returns:
        None
    """
    try:
        parsed = instance.get_value()
    except Exception:
        # An unparseable value must not reach the cache
        return
    else:
        cache_configuration_value(instance.key, parsed)


================================================
FILE: configuration/templates/admin/configuration_confirm_update.html
================================================
{% extends "admin/base_site.html" %}
{% load i18n %}

{% block content %}
  {# Confirmation screen for a Configuration edit: shows the original, new raw and interpreted values. #}
  {# Confirm form: re-posts the submitted field values together with the "_confirm_update" marker. #}
  <form method="post">
    {% csrf_token %}
    <input type="hidden" name="_confirm_update" value="1">
    <input type="hidden" name="key" value="{{ new_instance.key }}">
    <input type="hidden" name="data_type" value="{{ new_instance.data_type }}">
    <input type="hidden" name="value" value="{{ new_instance.value }}">
    <input type="hidden" name="description" value="{{ new_instance.description }}">

    <table class="admin-confirmation-table">
      <tr>
        <th>Key</th>
        <td>{{ new_instance.key }}</td>
      </tr>
      <tr>
        <th>Original Value</th>
        <td>{{ original.value }}</td>
      </tr>
      <tr>
        <th>New Raw Value</th>
        <td>{{ new_instance.value }}</td>
      </tr>
      <tr>
        <th>Interpreted Value</th>
        <td><pre>{{ parsed_value }}</pre></td>
      </tr>
    </table>

    <div class="submit-row">
      <input type="submit" value="{% trans "Confirm Save" %}" class="default">
      {# The Cancel link submits the separate "cancel-form" below through its onclick handler. #}
      <a href="#" class="button cancel-link" onclick="document.getElementById('cancel-form').submit(); return false;">
        {% trans "Cancel" %}
      </a>
    </div>
  </form>

  {# Cancel form: re-posts the same field values together with the "cancel_update" marker. #}
  <form id="cancel-form" method="post">
    {% csrf_token %}
    <input type="hidden" name="cancel_update" value="1">
    <input type="hidden" name="key" value="{{ new_instance.key }}">
    <input type="hidden" name="data_type" value="{{ new_instance.data_type }}">
    <input type="hidden" name="value" value="{{ new_instance.value }}">
    <input type="hidden" name="description" value="{{ new_instance.description }}">
  </form>
{% endblock %}


================================================
FILE: configuration/templatetags/__init__.py
================================================


================================================
FILE: configuration/templatetags/configuration_tags.py
================================================
from typing import Any

from django import template

from configuration.models import Configuration
from configuration.utils import configuration_value as _configuration_value

register = template.Library()


@register.simple_tag
def configuration_value(key: str) -> Any:
    """
    Template tag returning the parsed configuration value stored under `key`.

    Behavior:
        The lookup and parsing are delegated to
        `configuration.utils.configuration_value`. Any exception raised by
        that call, including `Configuration.DoesNotExist` for a missing key,
        is swallowed and an empty string is returned instead, so a bad or
        missing setting does not break template rendering.

    Args:
        key (str): The unique configuration key.

    Returns:
        Any: The parsed value on success; an empty string on any failure.
    """
    try:
        parsed = _configuration_value(key)
    except Configuration.DoesNotExist:
        # The key is not defined
        return ""
    except Exception:
        # Fetching or parsing the value failed
        return ""
    return parsed


================================================
FILE: configuration/tests/__init__.py
================================================


================================================
FILE: configuration/tests/test_admin.py
================================================
from django.contrib.auth import get_user_model
from django.test import TestCase
from django.urls import reverse

from configuration.models import Configuration


class TestConfigurationAdmin(TestCase):
    """
    Admin change-view tests for Configuration: the initial form, the
    confirmation page, confirming, cancelling and the validation failures.
    """

    CONFIRM_TEMPLATE = "admin/configuration_confirm_update.html"

    def setUp(self):
        user_model = get_user_model()
        self.superuser = user_model.objects.create_superuser(
            username="admin",
            email="admin@example.com",
            password="adminpass",  # nosec
        )
        self.client.force_login(self.superuser)

        self.config = Configuration.objects.create(
            key="test-key",
            value="Initial value",
            data_type=Configuration.DataType.TEXT,
            description="Initial description",
        )
        self.url = reverse(
            "admin:configuration_configuration_change", args=[self.config.pk]
        )

    def _form_data(self, value, description, **extra):
        """
        Build change-form POST data for ``self.config`` with a TEXT data type.

        Keyword arguments are merged last, so they can add fields or override
        the defaults.
        """
        data = {
            "key": self.config.key,
            "value": value,
            "data_type": Configuration.DataType.TEXT,
            "description": description,
        }
        data.update(extra)
        return data

    def test_change_view_initial_get(self):
        response = self.client.get(self.url)
        self.assertEqual(response.status_code, 200)
        for expected_text in ("test-key", "Initial value"):
            self.assertContains(response, expected_text)

    def test_save_triggers_confirmation(self):
        form_data = self._form_data("Updated value", "Updated description")
        response = self.client.post(self.url, form_data)

        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, self.CONFIRM_TEMPLATE)
        self.assertContains(response, "Confirm Update of Configuration")

    def test_confirm_save_updates_object(self):
        form_data = self._form_data("Updated value", "Updated description")

        # First submission: expect the confirmation page
        confirmation_response = self.client.post(self.url, form_data)
        self.assertEqual(confirmation_response.status_code, 200)
        self.assertTemplateUsed(confirmation_response, self.CONFIRM_TEMPLATE)

        # Second submission: same data plus the confirmation flag
        confirm_response = self.client.post(
            self.url,
            {"_confirm_update": "1", **form_data},
            follow=True,
        )

        self.assertRedirects(
            confirm_response,
            reverse("admin:configuration_configuration_changelist"),
        )
        self.assertContains(confirm_response, "Configuration updated and cached.")
        self.config.refresh_from_db()
        self.assertEqual(self.config.value, "Updated value")
        self.assertEqual(self.config.description, "Updated description")

    def test_cancel_preserves_input(self):
        form_data = self._form_data("New value", "Changed description")

        # First submission: expect the confirmation page
        confirmation_response = self.client.post(self.url, form_data)
        self.assertEqual(confirmation_response.status_code, 200)

        # Second submission: simulate "Cancel" by posting with cancel_update
        cancel_response = self.client.post(
            self.url,
            {"cancel_update": "1", **form_data},
        )

        self.assertEqual(cancel_response.status_code, 200)
        self.assertContains(cancel_response, "Changed description")
        self.assertContains(cancel_response, "New value")

        # Nothing may have been written to the database
        self.config.refresh_from_db()
        self.assertEqual(self.config.value, "Initial value")
        self.assertEqual(self.config.description, "Initial description")

    def test_confirm_save_with_invalid_form(self):
        form_data = self._form_data("value", "desc")

        # First submission: valid data to reach the confirmation step
        self.client.post(self.url, form_data)

        # Second submission: confirm while omitting 'key', which is required
        incomplete = {
            name: field_value
            for name, field_value in form_data.items()
            if name != "key"
        }
        incomplete["_confirm_update"] = "1"
        response = self.client.post(self.url, incomplete, follow=True)

        self.assertEqual(response.status_code, 200)
        self.assertContains(response, "Invalid data on confirmation.")
        self.config.refresh_from_db()
        self.assertEqual(self.config.value, "Initial value")  # unchanged

    def test_get_value_failure_on_confirmation(self):
        # A JSON-typed configuration whose stored value is not valid JSON
        bad_config = Configuration.objects.create(
            key="bad-json-key",
            value="Not JSON",
            data_type=Configuration.DataType.JSON,
            description="desc",
        )
        bad_url = reverse(
            "admin:configuration_configuration_change", args=[bad_config.pk]
        )

        # Posting another invalid JSON value makes get_value fail
        invalid_json_data = {
            "key": bad_config.key,
            "value": "Still not JSON",
            "data_type": Configuration.DataType.JSON,
            "description": "desc",
        }
        response = self.client.post(bad_url, invalid_json_data, follow=True)

        self.assertEqual(response.status_code, 200)
        self.assertContains(response, "Validation failed:")

    def test_first_post_invalid_form(self):
        # key is required, so an empty key makes the form invalid
        form_data = self._form_data("Some value", "Bad post", key="")
        response = self.client.post(self.url, form_data)

        self.assertEqual(response.status_code, 200)
        self.assertTemplateUsed(response, "admin/change_form.html")
        self.assertContains(response, "This field is required.")


================================================
FILE: configuration/tests/test_models.py
================================================
import json

from django.core.cache import caches
from django.test import TestCase

from configuration.models import Configuration


class TestConfiguration(TestCase):
    """Check ``str()`` and ``get_value()`` of Configuration per data type."""

    def setUp(self):
        caches["configuration_cache"].clear()

    def _create(self, key, value, data_type):
        """Create and return a Configuration row."""
        return Configuration.objects.create(key=key, value=value, data_type=data_type)

    def _check_values(self, data_type, cases):
        """
        Walk ``(key, raw value, expected)`` cases in order, creating each
        configuration and asserting its cast value right after creation.
        """
        for key, raw_value, expected in cases:
            config = self._create(key, raw_value, data_type)
            self.assertEqual(config.get_value(), expected)

    def test_str(self):
        config = self._create("test-key", "Test value", Configuration.DataType.TEXT)
        self.assertEqual(str(config), "test-key")

    def test_text(self):
        self._check_values(
            Configuration.DataType.TEXT,
            [
                ("test-key", "Test value", "Test value"),
                ("test-key2", "", ""),
                ("test-key3", '{"key" : "value"}', '{"key" : "value"}'),
            ],
        )

    def test_number(self):
        self._check_values(
            Configuration.DataType.NUMBER,
            [
                ("test-key", "100", 100),
                ("test-key2", "100.12", 100.12),
                ("test-key3", "Test value", 0),
                ("test-key4", "", 0),
            ],
        )

    def test_boolean(self):
        self._check_values(
            Configuration.DataType.BOOLEAN,
            [
                ("test-key", "True", True),
                ("test-key2", "true", True),
                ("test-key3", "TrUe", True),
                ("test-key4", "", False),
                ("test-key5", "1", False),
                ("test-key6", "Test value", False),
            ],
        )

    def test_json(self):
        # Marker for cases where get_value() is expected to raise
        must_raise = object()
        cases = [
            ("test-key", "true", True),
            ("test-key2", "True", must_raise),
            ("test-key3", '{"key" : "value"}', {"key": "value"}),
            ("test-key4", "", must_raise),
            ("test-key5", "1", 1),
            ("test-key6", "Test value", must_raise),
        ]
        for key, raw_value, expected in cases:
            config = self._create(key, raw_value, Configuration.DataType.JSON)
            if expected is must_raise:
                self.assertRaises(json.decoder.JSONDecodeError, config.get_value)
            else:
                self.assertEqual(config.get_value(), expected)

    def test_html(self):
        # The 'test-key5' case refers to 'test-key', so the order matters
        self._check_values(
            Configuration.DataType.HTML,
            [
                ("test-key", "Test value", "Test value"),
                ("test-key2", "", ""),
                ("test-key3", '{"key" : "value"}', '{"key" : "value"}'),
                ("test-key4", "<p>Test value</p>", "<p>Test value</p>"),
                (
                    "test-key5",
                    "<p>{% configuration_value 'test-key' %}</p>",
                    "<p>Test value</p>",
                ),
                ("test-key6", "{% url 'homepage' %}", "/"),
            ],
        )

    def test_rate(self):
        valid_rates = [
            ("test-key1", "1/s", "1/s"),
            ("test-key2", "100/m", "100/m"),
            ("test-key3", "50/h", "50/h"),
            ("test-key4", "1000/d", "1000/d"),
        ]
        invalid_formats = [
            ("test-key5", "5/hour", ""),
            ("test-key6", "ten/m", ""),
            ("test-key7", "10", ""),
            ("test-key8", "10/", ""),
            ("test-key9", "/m", ""),
        ]
        zero_and_negative = [
            ("test-key10", "0/s", ""),
            ("test-key11", "-5/m", ""),
        ]
        empty_value = [
            ("test-key12", "", ""),
        ]
        self._check_values(
            Configuration.DataType.RATE,
            valid_rates + invalid_formats + zero_and_negative + empty_value,
        )


================================================
FILE: configuration/tests/test_signals.py
================================================
from django.core.cache import caches
from django.test import TestCase

from configuration.models import Configuration


class TestConfigurationSignal(TestCase):
    """Check what creating a Configuration leaves in ``configuration_cache``."""

    def setUp(self):
        self.cache = caches["configuration_cache"]
        self.cache.clear()

    def test_signal_caches_valid_value(self):
        Configuration.objects.create(
            key="signal-key",
            value="42",
            data_type=Configuration.DataType.NUMBER,
        )
        cached = self.cache.get("config_signal-key")
        self.assertEqual(cached, 42)

    def test_signal_does_not_cache_invalid_json(self):
        # Creating the row should not raise, but nothing should be cached
        Configuration.objects.create(
            key="signal-json-invalid",
            value="not valid json",
            data_type=Configuration.DataType.JSON,
        )
        cached = self.cache.get("config_signal-json-invalid")
        self.assertIsNone(cached)


================================================
FILE: configuration/tests/test_templatetags.py
================================================
from django.test import TestCase

from configuration.models import Configuration
from configuration.templatetags.configuration_tags import configuration_value


class TestTemplatetags(TestCase):
    """Check the ``configuration_value`` template tag for each data type."""

    def setUp(self):
        # The tag reads through "configuration_cache" and the keys used here
        # are reused by other test classes, so start every test from an empty
        # cache to avoid picking up stale entries.
        from django.core.cache import caches

        caches["configuration_cache"].clear()

    def test_configuration_value(self):
        Configuration.objects.create(
            key="test-key", value="Test value", data_type=Configuration.DataType.TEXT
        )
        self.assertEqual(configuration_value("test-key"), "Test value")

        Configuration.objects.create(
            key="test-key2", value="100", data_type=Configuration.DataType.NUMBER
        )
        self.assertEqual(configuration_value("test-key2"), 100)

        Configuration.objects.create(
            key="test-key3", value="TrUe", data_type=Configuration.DataType.BOOLEAN
        )
        self.assertEqual(configuration_value("test-key3"), True)

        Configuration.objects.create(
            key="test-key4", value="Test value", data_type=Configuration.DataType.JSON
        )
        # This raises an exception due to invalid JSON, but the template tag should
        # catch and return a blank string instead
        self.assertEqual(configuration_value("test-key4"), "")

        Configuration.objects.create(
            key="test-key5",
            value='{"key" : "value"}',
            data_type=Configuration.DataType.JSON,
        )
        self.assertEqual(configuration_value("test-key5"), {"key": "value"})

        # HTML values are rendered, so the nested tag resolves 'test-key'
        Configuration.objects.create(
            key="test-key6",
            value="<p>{% configuration_value 'test-key' %}</p>",
            data_type=Configuration.DataType.HTML,
        )
        self.assertEqual(configuration_value("test-key6"), "<p>Test value</p>")


================================================
FILE: configuration/tests/test_utils.py
================================================
import json

from django.core.cache import caches
from django.test import TestCase

from configuration.models import Configuration
from configuration.utils import (
    CONFIGURATION_KEY_PREFIX,
    cache_configuration_value,
    configuration_value,
)


class TestConfigurationUtils(TestCase):
    """Check ``configuration.utils.configuration_value`` for each data type."""

    def setUp(self):
        self.cache = caches["configuration_cache"]
        self.cache.clear()

    def test_configuration_value(self):
        # Marker for the case where the lookup is expected to raise
        must_raise = object()
        data_types = Configuration.DataType
        cases = [
            ("test-key", "Test value", data_types.TEXT, "Test value"),
            ("test-key2", "100", data_types.NUMBER, 100),
            ("test-key3", "TrUe", data_types.BOOLEAN, True),
            ("test-key4", "", data_types.JSON, must_raise),
            ("test-key5", '{"key" : "value"}', data_types.JSON, {"key": "value"}),
            (
                "test-key6",
                "<p>{% configuration_value 'test-key' %}</p>",
                data_types.HTML,
                "<p>Test value</p>",
            ),
        ]

        # Each row is created and checked before the next one is created;
        # 'test-key6' refers to 'test-key', so the order matters
        for key, raw_value, data_type, expected in cases:
            Configuration.objects.create(
                key=key, value=raw_value, data_type=data_type
            )
            if expected is must_raise:
                self.assertRaises(
                    json.decoder.JSONDecodeError, configuration_value, key
                )
            else:
                self.assertEqual(configuration_value(key), expected)


class TestCacheConfigurationValue(TestCase):
    """Check both ways ``cache_configuration_value`` obtains its value."""

    def setUp(self):
        self.cache = caches["configuration_cache"]
        self.cache.clear()

    def _cached(self, key):
        """Read the raw cache entry stored for a configuration key."""
        return self.cache.get(f"{CONFIGURATION_KEY_PREFIX}_{key}")

    def test_explicit_value_is_cached(self):
        key = "explicit-key"
        returned = cache_configuration_value(key, 123)
        self.assertEqual(returned, 123)
        self.assertEqual(self._cached(key), 123)

    def test_value_is_fetched_from_model_if_not_supplied(self):
        Configuration.objects.create(
            key="fetched-key", value="true", data_type=Configuration.DataType.BOOLEAN
        )
        returned = cache_configuration_value("fetched-key")
        self.assertEqual(returned, True)
        self.assertEqual(self._cached("fetched-key"), True)


================================================
FILE: configuration/tests/test_validation.py
================================================
from django.core.exceptions import ValidationError
from django.test import TestCase

from configuration.validation import validate_rate


class TestValidation(TestCase):
    """Check which inputs ``validate_rate`` accepts, cleans or rejects."""

    def _assert_all_rejected(self, candidates):
        """Assert that every candidate makes ``validate_rate`` raise."""
        for candidate in candidates:
            with self.assertRaises(ValidationError):
                validate_rate(candidate)

    def test_valid_rates(self):
        for rate in ("1/s", "10/m", "100/h", "1000/d"):
            self.assertEqual(validate_rate(rate), rate)

    def test_rate_stripping_whitespace(self):
        # Leading/trailing whitespace is removed
        padded_rates = (" 10/m ", "\t10/m", "10/m\t", "\n10/m\n", " \n\t10/m\t\n ")
        for padded in padded_rates:
            self.assertEqual(validate_rate(padded), "10/m")

        # Internal whitespace is not allowed and should still raise
        self._assert_all_rejected(["10 /m", "10/ m", "10 / m"])

    def test_non_string_input(self):
        self._assert_all_rejected([10, None, ["5/m"]])

    def test_invalid_format(self):
        self._assert_all_rejected(
            [
                "10",  # no unit
                "10/min",  # full word
                "ten/m",  # non-numeric
                "10/",  # missing unit
                "/m",  # missing number
                "10/m/extra",  # too many parts
            ]
        )

        # A trailing newline is valid because the input is stripped
        self.assertEqual(validate_rate("10/m\n"), "10/m")

    def test_zero_or_negative_values(self):
        self._assert_all_rejected(["0/s", "-5/m"])

    def test_invalid_unit(self):
        self._assert_all_rejected(
            [
                "10/w",  # unsupported unit
                "10/ms",  # unsupported unit
                "10/seconds",  # full unit
            ]
        )


================================================
FILE: configuration/utils.py
================================================
from typing import Any

from django.conf import settings
from django.core.cache import caches

from configuration.models import Configuration

CONFIGURATION_KEY_PREFIX = "config"


def configuration_value(key: str) -> Any:
    """
    Retrieve a configuration value by key with caching and type casting.

    Behavior:
        - Look up the value in the ``configuration_cache`` using a namespaced
          cache key.
        - If nothing is cached for the key, delegate to
          ``cache_configuration_value(key)`` to fetch, cast, cache, and return
          the value.
        - A cached ``None`` (for example a JSON ``null`` value) counts as a
          hit and is returned as is, instead of triggering a database lookup
          on every call.
        - Casting is performed by ``Configuration.get_value()`` based on the
          instance's ``data_type``.

    Caching:
        - Values are stored in the cache alias ``configuration_cache``.
        - Cache entries expire according to
          ``settings.CONFIGURATION_CACHE_TIMEOUT``.

    Args:
        key (str): The configuration key to resolve.

    Returns:
        Any: The resolved and type-cast configuration value.

    Raises:
        Configuration.DoesNotExist: If the key is not present in the database
            when attempting to populate the cache.
        Exception: Any error raised by ``Configuration.get_value()`` while
            casting (for example ``json.JSONDecodeError`` for invalid JSON)
            propagates to the caller.
    """
    config_cache = caches["configuration_cache"]
    cache_key = f"{CONFIGURATION_KEY_PREFIX}_{key}"

    # A unique sentinel tells "nothing cached" apart from a cached ``None``
    missing = object()
    value = config_cache.get(cache_key, missing)

    if value is missing:
        value = cache_configuration_value(key)

    return value


def cache_configuration_value(key: str, value: Any | None = None) -> Any:
    """
    Write the value for a configuration key into ``configuration_cache``.

    Behavior:
        - With an explicit ``value``, that value is cached as given.
        - With ``value`` left as ``None``, the ``Configuration`` row for
          ``key`` is loaded and its ``get_value()`` result is cached instead.
        - The entry is stored under the namespaced cache key and expires
          after ``settings.CONFIGURATION_CACHE_TIMEOUT``.

    Args:
        key (str): The configuration key to cache.
        value (Any | None): The value to cache, or ``None`` to load it from
            the database and cast it via ``get_value()``.

    Returns:
        Any: The value that was written to the cache.

    Raises:
        Configuration.DoesNotExist: If ``value`` is ``None`` and no
            ``Configuration`` row exists for the given key.
    """
    store = caches["configuration_cache"]

    if value is None:
        # Nothing supplied: load the row and let the model cast it
        value = Configuration.objects.get(key=key).get_value()

    store.set(
        f"{CONFIGURATION_KEY_PREFIX}_{key}",
        value,
        timeout=settings.CONFIGURATION_CACHE_TIMEOUT,
    )
    return value


================================================
FILE: configuration/validation.py
================================================
import re

from django.core.exceptions import ValidationError

# ``re.ASCII`` restricts ``\d`` to the ASCII digits 0-9. Without it, a str
# pattern also accepts every other Unicode decimal digit.
RATE_LIMIT_PATTERN = re.compile(r"^\d+/(s|m|h|d)$", re.ASCII)


def validate_rate(rate: str) -> str:
    """
    Validate that a rate string matches the expected pattern like '10/m'.

    Behavior:
        - Strip leading and trailing whitespace.
        - Require the format '<positive integer>/<unit>' where the integer is
          written with ASCII digits and unit is one of 's', 'm', 'h', or 'd'
          (seconds, minutes, hours, days).
        - Return the cleaned string unchanged if valid.

    Args:
        rate (str): The candidate rate string to validate.

    Returns:
        str: The cleaned rate string if valid.

    Raises:
        ValidationError: If the input is not a string, if the format does not
            match the required pattern, or if the integer portion is less than
            or equal to zero.
    """
    if not isinstance(rate, str):
        raise ValidationError("Rate limit must be a string.")

    rate = rate.strip()

    if not RATE_LIMIT_PATTERN.match(rate):
        raise ValidationError("Invalid rate limit format. Use '<number>/<s|m|h|d>'.")

    # The pattern guarantees a single "/", so the count is everything before it.
    # A sign can never match, which leaves zero ("0", "000", ...) to reject here.
    count = rate.partition("/")[0]
    if int(count) <= 0:
        raise ValidationError("Rate limit count must be greater than 0.")

    return rate


================================================
FILE: configuration/views.py
================================================
# Create your views here.


================================================
FILE: db_scripts/Dockerfile
================================================
# Multi-stage build with one shared tooling stage ("base") and two final
# targets ("dump" and "restore"); the target chosen at build time decides
# which script the image runs.

# Base layer with all tools
FROM public.ecr.aws/amazonlinux/amazonlinux:2023-minimal AS base

# Trusted CA for proxy
# Download the LOC root CA certificate into the system trust anchors
# (-f: fail on HTTP errors, -s: silent, -O: keep the remote file name) and
# rebuild the trust store so that later commands trust it.
RUN curl -fsO --output-dir /etc/pki/ca-trust/source/anchors/ http://crl.loc.gov/LOC-ROOT-CA-1.crt \
    && update-ca-trust

# Install tools once
# Upgrade the OS packages, then install the PostgreSQL 15 and AWS CLI v2
# packages. dump.sh calls pg_dump and aws; restore.sh calls psql, pg_restore
# and aws. Cleaning the dnf cache in the same layer keeps it out of the image.
RUN dnf -y upgrade && \
    dnf -y install postgresql15.x86_64 awscli-2.noarch && \
    dnf -y clean all

# Logic for Dump
# Target "dump": copy dump.sh into the image's working directory, make it
# executable and run it by default.
FROM base AS dump
COPY dump.sh .
RUN chmod +x dump.sh
CMD ["./dump.sh"]

# Logic for Restore
# Target "restore": same layout as "dump", but running restore.sh.
FROM base AS restore
COPY restore.sh .
RUN chmod +x restore.sh
CMD ["./restore.sh"]


================================================
FILE: db_scripts/dump.sh
================================================
#!/bin/bash
#
# Dump the production concordia database and upload it to S3.
#
# Steps:
#   1. Refuse to run unless ENV_NAME is set to "prod".
#   2. Read the database password from Secrets Manager and the database host
#      from SSM Parameter Store.
#   3. Run pg_dump (custom format) into a local file.
#   4. Upload the file to s3://crowd-deployment/database-dumps/ twice: under a
#      dated key and under concordia.latest.dmp.
#   5. Tag both objects with "first-dmp-of-quarter" = true|false, where true
#      means today is January 1, April 1, July 1 or October 1.
#
# Exit status: 0 when the dump was uploaded and tagged; non-zero when any
# command fails or when pg_dump leaves an empty dump file.

set -eu -o pipefail

# Use a default expansion so that an unset ENV_NAME reaches the message below
# instead of aborting on `set -u` with an "unbound variable" error.
if [[ -z "${ENV_NAME:-}" ]]; then
    echo "ENV_NAME must be set prior to running this script."
    exit 1
fi

if [ "${ENV_NAME}" != "prod" ]; then
    echo "This script should only be run in the production environment."
    exit 1
fi

# TODAY is YYYYMMDD, so matching the trailing MMDD identifies quarter starts.
TODAY=$(date +%Y%m%d)
if [[ "$TODAY" =~ (0101|0401|0701|1001)$ ]]; then
    TAGVALUE="true"
else
    TAGVALUE="false"
fi
POSTGRESQL_PW="$(aws secretsmanager get-secret-value --region us-east-1 --secret-id "crowd/${ENV_NAME}/DB/MasterUserPassword" | python3 -c 'import json,sys;Secret=json.load(sys.stdin);SecretString=json.loads(Secret["SecretString"]);print(SecretString["password"])')"
POSTGRESQL_HOST="$(aws ssm get-parameter --region us-east-1 --name "/concordia/${ENV_NAME}/db.url" | python3 -c 'import json,sys;ParameterInput=json.load(sys.stdin);Parameter=ParameterInput["Parameter"];print(Parameter["Value"])')"
DUMP_FILE=concordia.dmp
S3_BUCKET='crowd-deployment'
DATED_KEY="database-dumps/concordia.${TODAY}.dmp"
LATEST_KEY="database-dumps/concordia.latest.dmp"

# In a .pgpass entry a literal backslash or colon must be escaped with a
# backslash, otherwise a password containing either is read incorrectly.
# Backslashes are escaped first so the ones added for colons stay single.
PGPASS_PW="${POSTGRESQL_PW//\\/\\\\}"
PGPASS_PW="${PGPASS_PW//:/\\:}"
printf '%s\n' "${POSTGRESQL_HOST}:5432:*:concordia:${PGPASS_PW}" > ~/.pgpass
chmod 600 ~/.pgpass

pg_dump -Fc --no-acl -U concordia -h "${POSTGRESQL_HOST}" concordia -f "${DUMP_FILE}"

# An empty dump must not look like a successful backup.
if [ ! -s "${DUMP_FILE}" ]; then
    echo "pg_dump produced an empty ${DUMP_FILE}; nothing was uploaded." >&2
    exit 1
fi

TAGGING='{"TagSet": [{ "Key": "first-dmp-of-quarter", "Value": "'"${TAGVALUE}"'" }]}'

aws s3 cp "${DUMP_FILE}" "s3://${S3_BUCKET}/${DATED_KEY}"
aws s3 cp "${DUMP_FILE}" "s3://${S3_BUCKET}/${LATEST_KEY}"
aws s3api put-object-tagging --bucket "${S3_BUCKET}" --key "${DATED_KEY}" --tagging "${TAGGING}"
aws s3api put-object-tagging --bucket "${S3_BUCKET}" --key "${LATEST_KEY}" --tagging "${TAGGING}"

# With `set -e`, reaching this line means every step above succeeded.
echo "Database dump uploaded to s3://${S3_BUCKET}/${DATED_KEY} and s3://${S3_BUCKET}/${LATEST_KEY}."


================================================
FILE: db_scripts/restore.sh
================================================
#!/bin/bash
#
# Restore the latest production database dump into a non-production
# environment:
#   1. download concordia.latest.dmp from the crowd-deployment bucket,
#   2. sync s3://crowd-content into the environment's content bucket,
#   3. drop and re-create the concordia database from the dump,
#   4. force a new deployment of the environment's ECS service(s).
#
# Requires ENV_NAME to be set to anything other than "prod".

set -eu -o pipefail

export PATH=$HOME/.local/bin:$PATH

# ${ENV_NAME:-} keeps `set -u` from aborting with "unbound variable" before the
# explanatory message below can be printed.
if [[ -z "${ENV_NAME:-}" ]]; then
    echo "ENV_NAME must be set prior to running this script."
    exit 1
fi

if [ "${ENV_NAME}" = "prod" ]; then
    echo "This script should not be run in the production environment."
    exit 1
fi

# Print the short name (third "/"-separated component of the ARN) of the
# service at index $1 in the list returned for this environment's ECS cluster.
ecs_service_name() {
    aws ecs list-services --region us-east-1 --cluster "crowd-${ENV_NAME}" \
        | python3 -c 'import json,sys;Parameter=json.load(sys.stdin)["serviceArns"];print(Parameter[int(sys.argv[1])].split("/")[2])' "$1"
}

# Force a new deployment of the service named $1 in this environment's cluster.
redeploy_service() {
    aws ecs update-service --region us-east-1 --force-new-deployment --cluster "crowd-${ENV_NAME}" --service "$1"
}

POSTGRESQL_PW="$(aws secretsmanager get-secret-value --region us-east-1 --secret-id "crowd/${ENV_NAME}/DB/MasterUserPassword" | python3 -c 'import json,sys;Secret=json.load(sys.stdin);SecretString=json.loads(Secret["SecretString"]);print(SecretString["password"])')"
POSTGRESQL_HOST="$(aws ssm get-parameter --region us-east-1 --name "/concordia/${ENV_NAME}/db.url" | python3 -c 'import json,sys;ParameterInput=json.load(sys.stdin);Parameter=ParameterInput["Parameter"];print(Parameter["Value"])')"
DUMP_FILE=concordia.dmp

aws s3 cp s3://crowd-deployment/database-dumps/concordia.latest.dmp "${DUMP_FILE}"

# Fields in .pgpass are colon-separated, so a literal ':' or '\' inside the
# password has to be backslash-escaped or the entry will not match.
PGPASS_PW="${POSTGRESQL_PW//\\/\\\\}"
PGPASS_PW="${PGPASS_PW//:/\\:}"

# Create the file with owner-only permissions from the start; the chmod covers
# the case where ~/.pgpass already existed with wider permissions.
(umask 077 && printf '%s\n' "${POSTGRESQL_HOST}:5432:*:concordia:${PGPASS_PW}" > ~/.pgpass)
chmod 600 ~/.pgpass

aws s3 sync s3://crowd-content "s3://crowd-${ENV_NAME}-content" --delete

psql -U concordia -h "$POSTGRESQL_HOST" -d postgres -c "select pg_terminate_backend(pid) from pg_stat_activity where datname='concordia';"
# IF EXISTS lets the restore proceed on an environment where the database has
# not been created yet instead of aborting under `set -e`.
psql -U concordia -h "$POSTGRESQL_HOST" -d postgres -c "drop database if exists concordia with (force);"

# Capture the status with `||` so that `set -e` does not end the script before
# the return code can be reported.
RETURNCODE=0
pg_restore --create -U concordia -h "${POSTGRESQL_HOST}" -Fc --dbname=postgres --no-owner --no-acl "${DUMP_FILE}" || RETURNCODE=$?
echo $RETURNCODE

# A failed restore must not trigger a redeploy, and must still fail the script.
if [ "$RETURNCODE" != 0 ]; then
    exit "$RETURNCODE"
fi

ECS_SERVICE="$(ecs_service_name 0)"

if [ "${ENV_NAME}" = "test" ]; then
    # If a feature branch env is running the number of services in the test cluster increases.
    NUMBER_OF_SERVICES="$(aws ecs list-services --region us-east-1 --cluster "crowd-${ENV_NAME}" | python3 -c 'import json,sys;ParameterInput=json.load(sys.stdin);Parameter=ParameterInput["serviceArns"];print(len(Parameter))')"
    if [ "$NUMBER_OF_SERVICES" = 3 ]; then
        # Normal
        ECS_SERVICE_2="$(ecs_service_name 2)"
    else
        # Feature branch env exists.
        ECS_SERVICE_2="$(ecs_service_name 3)"
    fi

    redeploy_service "${ECS_SERVICE}"
    redeploy_service "${ECS_SERVICE_2}"
else
    redeploy_service "${ECS_SERVICE}"
fi


================================================
FILE: development/Containerfile
================================================
# Development image for Concordia: Python 3.12 plus Node.js, the system
# libraries the project needs, and a non-root user matching the host account.
# The container starts an interactive bash shell rather than the app server.
FROM python:3.12-slim-bookworm

# Major Node.js version to install (e.g., 20, 22). This is used to select the
# NodeSource APT repository "node_<major>.x".
ARG NODE_MAJOR=20

# Define build-time arguments for UID and GID
ARG USERNAME
ARG UID
ARG GID

ENV DEBIAN_FRONTEND="noninteractive"

# Create the group and user with specified UID/GID
RUN groupadd -g $GID $USERNAME && \
    useradd -m -u $UID -g $GID -s /bin/bash $USERNAME

# Bootstrap minimal tooling needed later in the build:
# - curl: download files/keys
# - ca-certificates: validate HTTPS endpoints
# - gnupg: import and dearmor APT repository signing keys
RUN apt-get update -qy && apt-get install -qy curl ca-certificates gnupg

# Ensure that the Library's certificate authority is trusted so the tampering
# proxy will not break TLS validation. See
# https://staff.loc.gov/wikis/display/SE/Configuring+HTTPS+clients+for+the+HTTPS+tampering+proxy.

RUN curl -fso /etc/ssl/certs/LOC-ROOT-CA-1.crt http://crl.loc.gov/LOC-ROOT-CA-1.crt && openssl x509 -inform der -in /etc/ssl/certs/LOC-ROOT-CA-1.crt -outform pem -out /etc/ssl/certs/LOC-ROOT-CA-1.pem && c_rehash

# Install Node.js via the NodeSource APT repository (manual setup; no setup
# script). Debian bookworm ships Node 18; adding this repo allows installing a
# newer major version (e.g., Node 20) via apt.
#
# This step:
# - creates a dedicated keyring directory under /etc/apt/keyrings
# - downloads and installs the NodeSource signing key into a keyring file
# - registers the NodeSource repository for the selected Node.js major line
#
# Note: When installing Node.js from NodeSource, the `nodejs` package includes
# npm (and npm comes with node-gyp), so there is no separate `npm` or
# `node-gyp` APT package to install here.
#
# References: NodeSource "Repository Manual Installation" guide. https://github.com/nodesource/distributions/wiki/Repository-Manual-Installation
RUN \
    # Create a dedicated directory for third-party APT keyrings.
    mkdir -p /etc/apt/keyrings && \
    # Download the NodeSource repository signing key and store it as a keyring
    # file that apt can use to verify NodeSource packages.
    curl -fsSL https://deb.nodesource.com/gpgkey/nodesource-repo.gpg.key \
        | gpg --dearmor -o /etc/apt/keyrings/nodesource.gpg && \
    # Register the NodeSource repository for the selected Node.js major version.
    # The "signed-by=" option scopes trust to just this repository entry.
    echo "deb [signed-by=/etc/apt/keyrings/nodesource.gpg] https://deb.nodesource.com/node_${NODE_MAJOR}.x nodistro main" \
        > /etc/apt/sources.list.d/nodesource.list

RUN apt-get update -qy && apt-get dist-upgrade -qy && apt-get install -o Dpkg::Options::='--force-confnew' -qy \
    build-essential \
    git \
    libmemcached-dev \
    # Pillow/Imaging: https://pillow.readthedocs.io/en/latest/installation.html#external-libraries
    libz-dev libfreetype6-dev \
    libtiff-dev libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev \
    # Postgres client library to build psycopg
    libpq-dev \
    locales \
    # Weasyprint requirements
    libpango-1.0-0 libharfbuzz0b libpangoft2-1.0-0 \
    # Tesseract
    tesseract-ocr tesseract-ocr-all \
    # Selenium/Chrome/chromedriver requirements
    libnss3 libnspr4 libatk1.0-0 libatk-bridge2.0-0 libcups2 libxdamage1 libxkbcommon0 libasound2 libatspi2.0-0 \
    # Additional tools for development
    nano bash-completion \
    nodejs && apt-get -qy autoremove && apt-get -qy autoclean

RUN locale-gen en_US.UTF-8
ENV LC_ALL=en_US.UTF-8
ENV LANG=en_US.UTF-8
ENV LANGUAGE=en_US.UTF-8

# Use the key=value form of ENV throughout; the whitespace-separated form is a
# legacy syntax.
ENV PYTHONUNBUFFERED=1
ENV PYTHONPATH=/workspace

# No earlier ARG or ENV in this file defines DJANGO_SETTINGS_MODULE, so this
# resolves to the default at build time; it can still be overridden when the
# container is run.
ENV DJANGO_SETTINGS_MODULE=${DJANGO_SETTINGS_MODULE:-concordia.settings_docker}

RUN pip install --upgrade pip
RUN pip install --no-cache-dir pre-commit
RUN pip install --no-cache-dir pipenv

# Update npm to a known major version
RUN npm install --silent --global npm@10

# Set the working directory and permissions
WORKDIR /workspace
COPY . /workspace
RUN chown -R $USERNAME:$USERNAME /workspace

# Switch to the new user
USER $USERNAME

# Set user's path to include local bin, which is where Python libraries will be installed
ENV PATH="/home/${USERNAME}/.local/bin:$PATH"

RUN mkdir -p /workspace/logs
RUN touch /workspace/logs/concordia.log

# Front-end build and asset pipeline:
# - install the JS dependencies declared by the project
RUN npm install --silent
# Additional JS build step for Vite - compile scss, bundle, hash, and compress js files.
RUN npm run build

RUN pipenv install --system --dev --deploy && rm -rf ~/.cache/

RUN pre-commit install-hooks

EXPOSE 80

CMD ["bash"]


================================================
FILE: development/README.md
================================================
# Concordia Development Containers

The files in this directory, `compose.yml` and `Containerfile`, have been created to better facilitate developing Concordia in a containerized environment. The files are compatible with both Docker and Podman, using docker-compose or podman-compose.

Though newer versions of docker-compose and podman-compose support combining compose files and compose file overriding, the versions of these tools available on some current distributions (such as Red Hat Enterprise Linux 9) do not, so a singular compose file (`compose.yml`) with all the necessary settings is provided here.

## Purpose

The intention of these files is to provide a usable development environment purely in containers.

The default configuration (`../docker-compose.yml`) creates a container environment that's not suitable for development. Primarily, it creates containers for OpenSearch, which is rarely used except in production, and the `app` container is not configured well for development. It runs as root, which causes file permission issues, and runs the daphne asgi server, which can't be restarted without restarting the entire container (manually killing and starting daphne does not work, either, because that causes the container to shut down).

In addition, the default container file for the `app` container (`../Dockerfile`) runs `../entrypoint.sh`, which does several things that are undesirable in a development environment that involves restarting containers regularly. It automatically generates and applies migrations, runs collectstatic and launches daphne. The development Containerfile instead simply launches a bash shell.

## Configuration

In order to use `compose.yml` with your compose CLI tool of choice, you'll need to pass in the path, either through an environment variable or a command-line switch.

```bash
podman-compose -f development/compose.yml
```

```dotenv
COMPOSE_FILE=development/compose.yml
```

Your CLI tool should be executed in the concordia directory (`..`).

### .env caveat

Note that some versions of the tools (notably, podman-compose<=1.0.6) do not use .env files. If you wish to use environment variables, you'll need to inject those variables manually, such as by using a script that sources your .env file before executing podman-compose.

## Development

Configuring for your environment when using containers follows the process in the [For Developers](../docs/for-developers.md) page, except that most of the work is done for you by `compose.yml` and `Containerfile`. Notably, you do not need to install any dependencies (except git and your compose CLI) on your host. You will still need to configure your .env file, but otherwise simply running `podman-compose up -d` or `docker-compose up -d`, with the proper COMPOSE_FILE configuration (and other additions to .env, see below), will create an app container with everything you need for development.

### Additions to .env

There are a few additions to your .env file required to properly use the provided `compose.yml` and `Containerfile`:

```dotenv
COMPOSE_FILE=development/compose.yml
HOME_DIR=/home/<username>/
AWS_SHARED_CREDENTIALS_FILE=/home/<username>/.aws/credentials
CONTAINER_UID=<uid>
CONTAINER_GID=<gid>
CONTAINER_USERNAME=<username>
```

These values should be for the user account that you'll be doing development with, the same one that owns your local repository. This information is used to mount various necessary directories in the container, as well as configure the user account inside the container (to avoid running as root).

The last three settings can automatically be added to your .env file with the following script (executed in the directory with the .env):

```bash
#!/bin/bash
#
# Add or update CONTAINER_UID, CONTAINER_GID and CONTAINER_USERNAME in the
# .env file of the current directory, using the invoking user's identity.

ENV_FILE=".env"
BACKUP_FILE=".env.bak"

# Create the .env file if it doesn't exist
touch "$ENV_FILE"

# Backup the original .env once: an existing backup is kept, so re-running
# this script does not replace it with an already-modified .env
if [ ! -e "$BACKUP_FILE" ]; then
    cp "$ENV_FILE" "$BACKUP_FILE"
fi

# Set the values
NEW_UID=$(id -u)
NEW_GID=$(id -g)
NEW_USERNAME=$(whoami)

# Function to add or update a key in the .env file
#   $1 - variable name
#   $2 - value to store
update_env_var() {
    local key="$1"
    local value="$2"
    if grep -qE "^${key}=" "$ENV_FILE"; then
        # Key already present: rewrite that line in place
        sed -i "s/^${key}=.*/${key}=${value}/" "$ENV_FILE"
    else
        # Key missing: append it
        echo "${key}=${value}" >> "$ENV_FILE"
    fi
}

# Update the values
update_env_var "CONTAINER_UID" "$NEW_UID"
update_env_var "CONTAINER_GID" "$NEW_GID"
update_env_var "CONTAINER_USERNAME" "$NEW_USERNAME"

echo "Backup saved as $BACKUP_FILE"
echo ".env updated with CONTAINER_UID=$NEW_UID, CONTAINER_GID=$NEW_GID, CONTAINER_USERNAME=$NEW_USERNAME"
```

### Attaching to the app container

Once you've launched your containers, you can attach to a shell in the app container to perform development. Your compose CLI tool should provide a method for doing this.

```bash
sudo docker-compose exec -it app bash
```

Note that older versions of podman-compose do not properly pass switches to the underlying command, meaning the above won't work with those versions of podman-compose. You can instead run it without the switches:

```bash
sudo podman-compose exec app bash
```

However, this has the disadvantage of not creating an interactive shell, which can cause issues with bash functionality. If you have a version of podman-compose with this limitation, the workaround is to use podman directly instead:

```bash
sudo podman exec -it concordia_app bash
```

You have to use the full container name because compose.yml is not referenced when using podman directly.

### Configuring for development

You will need to manually collect the static files before running the development server. This only needs to be done once after building the app container (and when changing static files in the future).

```bash
npx vite build
python manage.py collectstatic --no-post-process
```

### Launch the development server

Launching the development server is identical to launching it outside a container. The app container is configured to map port 8000 in the container to port 80 on the host:

```bash
python manage.py runserver 0.0.0.0:8000
```

### Committing changes

Git and the Concordia pre-commit hooks are included in the app container. You can simply use git commands as normal inside /workspace in the container.


================================================
FILE: development/compose.yml
================================================
version: '3.6'
services:
    # Redis service with its data directory kept on the redis_volume named volume.
    redis:
        container_name: concordia_redis
        restart: unless-stopped
        image: redis:latest
        hostname: redis
        ports:
            # Host port 63791 -> container port 6379
            - 63791:6379
        volumes:
            - redis_volume:/data

    # PostgreSQL 15 database; the password comes from POSTGRESQL_PW in the
    # environment used to run compose.
    db:
        container_name: concordia_db
        restart: unless-stopped
        image: postgres:15
        environment:
            POSTGRES_PASSWORD: ${POSTGRESQL_PW}
            POSTGRES_USER: concordia
            # NOTE(review): presumably read by an init script under
            # ../postgresql to create the extra database - confirm.
            POSTGRES_MULTIPLE_DATABASES: test_concordia
        ports:
            # Host port 54323 -> container port 5432
            - 54323:5432
        volumes:
            # The repository's postgresql directory is mounted as the image's
            # init-script directory.
            - ../postgresql:/docker-entrypoint-initdb.d:z
            - db_volume:/var/lib/postgresql/data/

    # Development application container, built from development/Containerfile
    # with the repository root as build context.
    app:
        container_name: concordia_app
        hostname: app
        restart: unless-stopped
        build:
            context: ..
            dockerfile: development/Containerfile
            # Supplied to the Containerfile's UID / GID / USERNAME build
            # arguments, which it uses to create the in-container user.
            args:
                UID: ${CONTAINER_UID}
                GID: ${CONTAINER_GID}
                USERNAME: ${CONTAINER_USERNAME}
        # Anchored so the importer and celerybeat services can reuse the same
        # environment through the *django-environment alias.
        environment: &django-environment
            WAIT_HOSTS: db:5432, redis:6379
            POSTGRESQL_HOST: db
            POSTGRESQL_PW: ${POSTGRESQL_PW}
            CONCORDIA_ENVIRONMENT: development
            DJANGO_SETTINGS_MODULE: ${DJANGO_SETTINGS_MODULE:-concordia.settings_template}
            DEBUG: ${DEBUG:-}
            REDIS_ADDRESS: redis
            REDIS_PORT: 6379
            AWS_PROFILE: ${AWS_PROFILE}
            AWS_SHARED_CREDENTIALS_FILE: ${AWS_SHARED_CREDENTIALS_FILE}
            # Defaults used when the variables are not set in the environment.
            TURNSTILE_SITEKEY: ${TURNSTILE_SITEKEY:-1x00000000000000000000AA}
            TURNSTILE_SECRET: ${TURNSTILE_SECRET:-1x0000000000000000000000000000000AA}
        depends_on:
            - redis
            - db
        volumes:
            # Repository root, mounted at the Containerfile's WORKDIR.
            - ..:/workspace:z
            # Host AWS, git and SSH configuration, mounted at the same paths
            # inside the container.
            - ${HOME_DIR}/.aws:${HOME_DIR}/.aws:z
            - ${HOME_DIR}/.gitconfig:${HOME_DIR}/.gitconfig:z
            - ${HOME_DIR}/.ssh:${HOME_DIR}/.ssh:z
            - images_volume:/concordia_images
        networks:
            - default
        ports:
            # Host port 80 -> container port 8000
            - 80:8000
        # Keep stdin open and allocate a TTY for the service's container.
        stdin_open: true
        tty: true

    # Importer container, built from importer/Dockerfile; shares the app
    # service's environment via the django-environment anchor.
    importer:
        container_name: concordia_importer
        hostname: importer
        restart: unless-stopped
        build:
            context: ..
            dockerfile: importer/Dockerfile
        environment: *django-environment
        depends_on:
            - redis
            - db
        networks:
            - default
        volumes:
            - ..:/app:z
            # NOTE(review): the shared environment passes
            # AWS_SHARED_CREDENTIALS_FILE through unchanged, while this mount
            # places the credentials under /root/.aws - confirm the path in
            # that variable resolves inside this container.
            - ${HOME_DIR}/.aws:/root/.aws:z
            - images_volume:/concordia_images

    # Celery beat container, built from celerybeat/Dockerfile; shares the app
    # service's environment via the django-environment anchor and mounts no
    # volumes.
    celerybeat:
        container_name: concordia_celerybeat
        hostname: celerybeat
        restart: unless-stopped
        build:
            context: ..
            dockerfile: celerybeat/Dockerfile
        environment: *django-environment
        depends_on:
            - redis
            - db
        networks:
            - default

volumes:
    db_volume:
    images_volume:
    redis_volume:

networks:
    default:


================================================
FILE: docker-compose.yml
================================================
version: '3.6'
services:
    # Single-node OpenSearch instance with the security plugin disabled.
    opensearch-node:
        image: public.ecr.aws/opensearchproject/opensearch:1
        container_name: opensearch-node
        environment:
            - cluster.name=opensearch-cluster
            - node.name=opensearch-node
            - discovery.type=single-node
            - bootstrap.memory_lock=true # along with the memlock settings below, disables swapping
            - OPENSEARCH_JAVA_OPTS=-Xms512m -Xmx512m # minimum and maximum Java heap size, recommend setting both to 50% of system RAM
            - 'DISABLE_INSTALL_DEMO_CONFIG=true' # Prevents execution of bundled demo script which installs demo certificates and security configurations to OpenSearch
            - 'DISABLE_SECURITY_PLUGIN=true' # initial local setup - Disables security plugin
        ulimits:
            # -1 removes the locked-memory limit (soft and hard).
            memlock:
                soft: -1
                hard: -1
            nofile:
                soft: 65536 # maximum number of open files for the OpenSearch user, set to at least 65536 on modern systems
                hard: 65536
        volumes:
            - opensearch-data:/usr/share/opensearch/data
        ports:
            - 9200:9200 # REST API
            - 9600:9600 # Performance Analyzer
        networks:
            - default

    # OpenSearch Dashboards UI, pointed at the opensearch-node service.
    opensearch-dashboards:
        image: public.ecr.aws/opensearchproject/opensearch-dashboards:1
        container_name: opensearch-dashboards
        ports:
            # Host port 5601 -> container port 5601
            - 5601:5601
        expose:
            - '5601'
        environment:
            - 'OPENSEARCH_HOSTS=http://opensearch-node:9200'
            - 'DISABLE_SECURITY_DASHBOARDS_PLUGIN=true' # disables security dashboards plugin in OpenSearch Dashboards
        networks:
            - default

    # Redis service with its data directory kept on the redis_volume named volume.
    redis:
        restart: unless-stopped
        image: redis:latest
        hostname: redis
        ports:
            # Host port 6379 -> container port 6379
            - 6379:6379
        volumes:
            - redis_volume:/data

    # PostgreSQL 15 database; the password comes from POSTGRESQL_PW in the
    # environment used to run compose.
    db:
        restart: unless-stopped
        image: postgres:15
        environment:
            POSTGRES_PASSWORD: ${POSTGRESQL_PW}
            POSTGRES_USER: concordia
            # NOTE(review): presumably read by an init script under
            # ./postgresql to create the extra database - confirm.
            POSTGRES_MULTIPLE_DATABASES: test_concordia
        ports:
            # Host port 5432 -> container port 5432
            - 5432:5432
        volumes:
            # The repository's postgresql directory is mounted as the image's
            # init-script directory.
            - ./postgresql:/docker-entrypoint-initdb.d
            - db_volume:/var/lib/postgresql/data/

    # Application container, built from the Dockerfile in the repository root.
    app:
        restart: unless-stopped
        build: .
        # Variables from .env are loaded into the container in addition to the
        # explicit environment entries below.
        env_file:
            - .env
        # Anchored so the importer and celerybeat services can reuse the same
        # environment through the *django-environment alias.
        environment: &django-environment
            WAIT_HOSTS: db:5432, redis:6379
            POSTGRESQL_HOST: db
            POSTGRESQL_PW: ${POSTGRESQL_PW}
            CONCORDIA_ENVIRONMENT: development
            DJANGO_SETTINGS_MODULE: ${DJANGO_SETTINGS_MODULE:-concordia.settings_docker}
            DEBUG: ${DEBUG:-}
            REDIS_ADDRESS: redis
            REDIS_PORT: 6379
        depends_on:
            - redis
            - db
        volumes:
            # Repository root mounted at /app inside the container.
            - .:/app
            - images_volume:/concordia_images
        networks:
            - default
        ports: # if running locally use 80:80, if running in local container use 8000:80
            - 80:80

    # Importer container, built from importer/Dockerfile; shares the app
    # service's environment via the django-environment anchor.
    importer:
        restart: unless-stopped
        build:
            context: .
            dockerfile: importer/Dockerfile
        environment: *django-environment
        depends_on:
            - redis
            - db
        networks:
            - default
        volumes:
            # Same named volume the app service mounts at /concordia_images.
            - images_volume:/concordia_images

    # Celery beat container, built from celerybeat/Dockerfile; shares the app
    # service's environment via the django-environment anchor and mounts no
    # volumes.
    celerybeat:
        restart: unless-stopped
        build:
            context: .
            dockerfile: celerybeat/Dockerfile
        environment: *django-environment
        depends_on:
            - redis
            - db
        networks:
            - default

volumes:
    db_volume:
    images_volume:
    redis_volume:
    opensearch-data:

networks:
    default:


================================================
FILE: docs/accessibility-goals.md
================================================
# Accessibility Goals

## Background Information

-   Microsoft has a site with a number of resources detailing their “Inclusive Design” strategy: https://www.microsoft.com/design/inclusive/

    Of note is the [“Inclusive 101” PDF](https://download.microsoft.com/download/b/0/d/b0d4bf87-09ce-4417-8f28-d60703d672ed/inclusive_toolkit_manual_final.pdf) covering the range of factors which designs should take into account and common strategies.

    [Kill Your Personas: How persona spectrums champion real user needs](https://medium.com/microsoft-design/kill-your-personas-1c332d4908cc)
    has a longer discussion about avoiding binary thinking when designing

## Desired Outcomes by Activity

We have desired goals for each category of activity on the site

### Transcription

-   Users with mobility restrictions should be able to complete the process
-   Users with color vision impairments should be able to complete the process except for specific pages where the content is inherently inaccessible until https://github.com/LibraryOfCongress/concordia/issues/666 is complete
-   Users with significant vision impairments should be able to learn the nature of the task and why it is difficult to continue

### Review

-   Users with mobility restrictions should be able to complete the process
-   Users with color vision impairments should be able to complete the process except for specific pages where the content is inherently inaccessible until https://github.com/LibraryOfCongress/concordia/issues/666 is complete
-   Users with significant vision impairments should be able to learn the nature of the task and why it is difficult to continue

### Final results

-   The transcribed text should be accessible to everyone

### Project Information

-   Information about the project should be accessible to everyone
-   Users should be able to easily learn the level of difficulty for their participation in particular activities


================================================
FILE: docs/accessibility-techniques.md
================================================
# Accessibility Techniques

## Background Information

-   18F has a detailed U.S. government-focused guide: https://accessibility.18f.gov/
-   The BBC has their comprehensive guide: https://bbc.github.io/accessibility-news-and-you/

## Assistive Technology Categories

### Screen Readers

#### Background information

-   https://webaim.org/techniques/screenreader/
-   The BBC has some guides for testing: https://bbc.github.io/accessibility-news-and-you/accessibility-and-testing-with-assistive-technology

#### Resources for common screen readers

##### JAWS

-   Freedom Scientific has a detailed [JAWS HTML and ARIA support matrix](https://freedomscientific.github.io/VFO-standards-support/) and [a downloadable version](https://www.freedomscientific.com/Downloads/JAWS) which may be used for up to 40 minutes without a license
-   https://bbc.github.io/accessibility-news-and-you/accessibility-and-testing-with-jaws

##### Windows Narrator

-   https://support.microsoft.com/en-us/help/17173/windows-10-hear-text-read-aloud

##### Apple (macOS and iOS) VoiceOver

-   https://help.apple.com/voiceover/info/guide/
-   https://bbc.github.io/accessibility-news-and-you/accessibility-and-testing-with-voiceover-ios
-   https://bbc.github.io/accessibility-news-and-you/accessibility-and-testing-with-voiceover-os


================================================
FILE: docs/design-principles.md
================================================
## Design Principles for System Features &amp; Capabilities

We are collaborating across the Library of Congress to support this vision: _creating new pathways of engagement, scholarship, and serving the public—while making history with people, staff, collections and systems—by inviting public participation in a transformative project that improves discovery of the treasures of the Library of Congress._

Two principles guide these proposed features and the ways we can launch, manage, and sustain a crowdsourced transcription and tagging platform at the Library of Congress:

**Trust** and **Approachability**

The system features and capabilities envisioned below will support a user-centered crowdsourcing initiative through functionality and a program of engagement.

## **ENGAGE**

### Participation by many audiences in the same place, at the same time

We have a unique opportunity to support many audiences including, but not limited to, a curious public, researchers, teachers, students, those seeking volunteer opportunities, and staff. This crowdsourcing platform presents a digital space in which audiences with different, but possibly overlapping interests, skill levels, and familiarity with the Library of Congress may gather together. This vision builds on the work Library of Congress staff have invested in crafting programs that serve a range of audiences based on their specific needs. We are likely to have a dynamic and constantly changing atmosphere of participants and collections; here are some essential approaches and features to accommodate many participants in the same place, at the same time.

#### Lowest barrier to entry: No accounts necessary (but possible)

To ensure that every visitor can contribute and begin their Library of Congress crowdsourcing experience immediately, it would be best that accounts are not required to participate. Accounts may still be possible but not set as a prerequisite to contribute. Entries by &quot;anonymous&quot; users can be assessed separately or in a wider pool of contributions. As discussed below, it will be important to understand activity on the site; therefore, care should be taken to inform even anonymous users about the ways their behavior is captured. It is essential that these details are explained with clear language about the need for and use of that information.

#### Accessibility

Library of Congress audiences and visitors have a range of needs. This project should at all times meet the needs of all audiences. Examples of ways to create a welcoming and accommodating space include making it clear how to customize font sizes, interface adjustments, font styles and color choices, and plain language for instructions and project contexts. There are opportunities to invite participation in the system and use of the collections in many ways including reviewing and integrating voice to text capabilities, particularly for tagging. By meeting and thoughtfully surpassing compliance standards, the Library of Congress can create pathways for increased accessibility within the transcription workflow - such as the simple addition of a field to create alt text for the images. Captioned video content to support collections contexts, blog posts about discoveries and activity updates, and other featured content would also foreground that all audiences, even those who are not directly transcribing or tagging, are invited.

#### Multiple entry points

We should anticipate visitors entering from many different paths: whether a visitor is routed through the homepage into a collection and then selects an individual page to transcribe and tag; or referred by a post on a social network; or uncovered in internet search engine results; or introduced via [https://loc.gov](https://loc.gov) or simply word of mouth; or returning to transcribe and tag again via their own account page. It should always be clear how a visitor would navigate to the instructions, to an overview of the crowdsourcing program, to move to one&#39;s account pages (if one has created an account), and to navigate &quot;up&quot; to the project or campaign page(s), if entering on an individual transcription or tagging page from a persistent unique URL.

#### Many Paths through Digital Collections

Heterogeneous subjects, forms, stories, and tasks are key to sustaining a long-term and representative crowdsourcing project. It is likely that many visitors will follow the sequential presentation of images, just as if they were reading a diary or letter, or following other documentation as it unfolds. However, other visitors may wish to explore pages across collections with minimal reorientation to the home or collection-level pages. Still other volunteers may wish to change tasks between transcribing and tagging, or performing review passes, while participating. Community managers may also wish to lead visitors to targeted activity. There are unique opportunities to use the tool with prepared and simultaneous programming around the collections and campaigns. It may be helpful to have &quot;tracks&quot; for the multiple audiences interacting in this dynamic space.

#### Make Sense Quickly: Invitations to Contribute through Information Architecture

Upon entering the platform, a visitor should understand what tasks are requested and the goals of the program. It should be easy to explore featured collections by tags identified by community managers and curators; it should also be possible to explore collections based on community or self-created tags. Some tag categories that might connect to audience interests include location, era, and event. It should also be easy to understand the historical contexts of the collections, including difficult topics and subject matter.

#### Make it Easy to Participate

From entry into the site, volunteers should feel welcomed and within only a few steps of getting started with contributing. Clear instructions that incorporate illustrative examples should be accessible from many different points, perhaps even with instruction or participation support in varying formats, such as video. Helpful tips about material culture and practice, such as handwriting or paleography resources, may further help. Technical features that support accuracy and ease of contribution include annotation tools and editors. Providing a mechanism for volunteers to elect to receive timely feedback on their efforts, and to provide similar feedback to others, is just one community management approach that can support accuracy and ease of contribution.

#### Serving Completed Data in Multiple Formats

Text and tags that are created by volunteers as they participate will be used to improve the ways collections can be found and connected. These forms of data should also be made available as project level JSON, CSV, and XML files, as well as a full corpus of completed transcription text. Ideally, these forms of data would be presented within the site on a &quot;data&quot; or research page. It should also be made clear the ways in which visitors might use the loc.gov interface to download individual images; and the loc.gov JSON API to download images and data from digital collections.

#### Responsibly Share Code

Thoroughly documenting and sharing the design decisions that inform the crafting of the codebase will ensure that other libraries, cultural heritage organizations, and educational bodies can best decide if this tool is appropriate for their needs and matches the skills and resources they have to apply to a web-application based participatory project. We should appropriately document and make available the source code for the tool, as well as other technical considerations and design decisions. Furthermore, lessons learned in the process of developing and improving the underlying tool, as well as the program(s) of engagement made possible by the affordances of the tool, should be shared openly as supporting documentation and stand-alone considerations.

#### Foregrounding Collaboration

There are many ways to signal respect for the contributions of volunteers while making the experience of participating most rewarding. One way is to maximize the extent of collaboration by better integrating opportunities to &quot;positively compound&quot; participation within the process of transcription, tagging, and review. Most existing tools use a blend of asynchronous transcription and either algorithmic review (matching) or volunteer review. Showcasing interpretation and activity by other volunteers can help participants craft a shared, agreed upon, and quality version of transcribed text. Displaying tags as categorization in the form of arranged and connected knowledge allows participants to crosswalk understanding, opening possibilities of new discovery and connection to the project mission and one another.

## **UNDERSTAND**

### Analyze activity &amp; assess participant motivations to improve experiences

It will be imperative to responsibly gather, analyze, and share information about activity in the crowdsourcing platform. This information will be used to best communicate, improve upon existing capabilities, and extend future possibilities of the tool and program of engagement. This section discusses features and capabilities to support better experiences for all participants, from volunteers to staff.

#### Privacy &amp; Ethical Use of Data

It is imperative that we responsibly and carefully define the need to collect data - whether that is about activity, location, or other forms of information - and connect that explicitly to intended uses of that data to understand audience needs and improve service. However, it should not be required or possible to track users through their visits. Furthermore, it should be possible for users to have their accounts deleted and account information purged from the site, while retaining their anonymized contributions.

#### No Accounts Necessary... but also creating an Account is possible

As noted above, it should be as easy as possible for visitors to become volunteers. However, creating an account within the system will allow participants to recall their activity, customize their experience, and fulfill needs for reporting should their motivations relate to formal volunteering or school assignments. We should explain to volunteers that creating an account affords additional possibilities including estimating participation. Accounts would also allow volunteers to experience other benefits: invitations to webinars with curators, alerts about new or related collections, and notifications of completion of projects or subjects of interest perhaps based on tags and other self-selection.

#### Understanding for Community Management

For the health and future of the crowdsourcing initiative, gathering information about the efforts and communication of volunteers is imperative. Presenting a clear snapshot of activity, recent discussion, possible roadblocks, and upcoming campaigns or communication would aid community management through quick assessment of the ecosystem&#39;s state. Easy access to &quot;live data,&quot; rapidly gathering the pulse on high traffic projects or energetic discussion, and performance of ongoing campaigns are key needs for community managers. This scope of activity information would also be useful for community managers in discreetly and sparingly offering volunteers opportunities to re-engage with new collections.

#### Motivations meet Behavior

We can help identify needed capabilities or features by surfacing the reasons people wish to participate and mapping patterns of activity in the system to these goals. The experience of participating in this project will be dynamic. Our visitors will not cleanly map onto single personas because their reasons for participating may change from visit to visit and over time. Common motivations include pursuing personal learning objectives, contributing to something greater and access to open knowledge, and to fulfill course or volunteer requirements. In 2014, researchers and project managers from the Zooniverse described the benefits of designing digital citizen science projects for participants with limited time and commitment; Eveleigh et al termed this approach &quot;designing for dabblers.&quot; Crafting workflows that support bite-sized or small targeted tasks can meet the needs of this type of volunteer who may fit in participation in the crowdsourcing platform amid their other interests and activities. Other volunteers may seek more immersive experiences. Furthermore, students and other volunteers may have participation targets to meet during their time on site.

#### Enabling Immersion

From user interfaces to tracks, there are opportunities to design a site that enables immersive, deep engagement with stories in the collections, and to find flow in serialized tasks; yet also makes it possible to step out of the workflow quickly and with confidence that one&#39;s contributions will be retained and valued. Success may not always mean pace of transcription but rather the attainment of a visitor&#39;s goals, whether to learn, fulfill volunteering hours, or make a meaningful contribution to the Library of Congress.

#### Volunteers with accounts should be able to understand their own activity

Participants in the crowdsourcing program who have created accounts should be able to quickly access, understand, filter or scope, print or download summaries of their activity. This information should be presented to them in a visually dynamic and customizable (or filtered) manner. It should also represent their cumulative activity as well as recent tasks, allow them to pick up where they left off, share or engage others with their own contributions, and perhaps suggest related content via tags or campaigns.

#### Ability to gather feedback from participants about their needs

Responses, questions, feedback, and other means of communication between participants and community managers will be essential to the health of the project. Beyond a feedback button or comment form, community managers will want to be able to assess participation activity data as feedback on complexities of the collections, spot barriers and drop offs, identify stickiness, and sight opportunities in content and behavior.

#### Tell a Public Story by Displaying Activity

Presenting information about system-wide activity, as well as individual activity, creates opportunities for shared understanding of the progress toward collective goals, as well as individualized approaches. This information can also be presented on an About or Homepage to quickly convey a sense of participation--via dynamic and perhaps interactive charts, torque maps, timelines, and more--and encourage visitors to join the activity.

#### Reporting for Staff and Organization

Being able to provide reporting that integrates with or corresponds to staff workflows will help this project become more closely connected to regular activity in the organization. Information gathered about project performance might include the number of pages per collection, the number of volunteers that contributed, the number of views and engagement with the object in loc.gov/Project One, and details about visits including generalized time on site and return visits that engage with collections they&#39;ve shared. It should be possible to query this data for custom reports, and include filters or other bounding options for specific time frames. Careful consideration should be taken around visitor information; never achieving tracking of users, and at all times generalized and disconnected from any cross-walkable search.

## **CONNECT**

### Manage &amp; Match Collections to Tasks to Data and more

These activities focus on engaging audiences with Library of Congress collections. Simultaneously, we strive to design a series of tasks and support that result in data that may be applied to improve access to those Library collections. This section recommends tasks, design decisions, and processes to achieve these goals.

#### Tasks: Transcription AND Tagging

Of a range of possible tasks, we&#39;ve identified transcription and tagging to be most relevant to our goals to improve search and identification within Library of Congress collections. These two tasks can be mapped to the digital content lifecycle in the description phase. These tasks are envisioned as a means of creating asset or page level text that can enhance discovery of and access to the Library of Congress digital collections.

#### Transcription

Based on the goals of engaging audiences and creating useful text for discovery, legibility, and access, the recommended transcription process is one that facilitates asynchronous but rapid access transcription; asks for minimal interaction with the collection asset image; situates the transcription window adjacent to the collection asset image; offers an adjustable and immersive presentation, if desired; &quot;positively compounds&quot; the efforts of participants; honors the time and contributions of participants; visually supports identification of possible errors or areas needing additional work; and connects to the context of the object in focus, whether smooth transition between pages before and after or to the catalog information and project description.

#### Tagging

The goals of tagging are to classify or categorize the content in such a way as to make it discoverable for future use. It is recommended that the tagging feature be built to accommodate set(s) of collection level and platform-wide controlled vocabularies, as well as to accept crowd-generated tags. The former set of tags would allow the platform to leverage existing subject headings, known and popular loc.gov search terms, and other forms of metadata already associated with the collections. The latter tagging capability would allow volunteers to customize their experiences with collections once these tags were made available to search or surface content across the platform; it would also allow community managers to organize campaigns at the point of import and feature this content both on the homepage and highlighted throughout the experience of transcription and tagging. Finally, a visual coding of the tags would offer an opportunity for a subtle contextualization of staff and Library of Congress generated tags and those created by participants.

#### Task Ecosystem: Tasks in the Workflow

Projects and pilots including [Beyond Words](https://labs.loc.gov/experiments/beyond-words/) have demonstrated that the transcription and tagging tasks may successfully be presented together in the crowdsourced workflow; however it should be possible for participants to elect to only complete one task, if they prefer. It is also possible that these tasks might be best presented in separate interfaces or as distinct workflows. The tasks should also be introduced to participants by describing the goals of the information that is being created, examples of how and where it will be discoverable after volunteers have contributed. Specifically, care should be taken to communicate the ways that the information created will be used—whether for search, for research, for publication and display, or to improve the features of the system—as these details will shape the ways the tasks are undertaken by volunteers.

#### Reaching Agreement

Agreement around the final version of transcription text will be a process that should be achieved through displaying the work of volunteers and facilitating a process in which they can negotiate to reach consensus of the completeness and quality of the text. The collections we will ask the public to transcribe will be of varying format, even changing in format from asset image to asset image. Therefore, there are likely to be many points at which interpretation will occur. As a result, workflows that allow participants to work together and create a shared understanding of the asset image (at object/collection level) are most likely to be successful when the opportunity to exchange interpretations is presented throughout the transcription and tagging processes. Features in support of negotiated consensus include an ability to see, mark, report, and/or correct errors in the text; to discuss an asset image or page in a forum; and generalized discussion at the collection level. Another way to permit negotiated consensus is to allow for a peer-review workflow.

#### Complete the Cycle

It is imperative that the crowd-generated transcription text be returned and served with the [loc.gov](https://loc.gov) presentation of the object and at the asset image level. It may be possible to marry this information as metadata or perhaps as data supporting the collection or object. This urgency and responsibility in completing the cycle connects to a user-centered design; building trust with public participants by meeting motivations that relate to contributing to greater access to knowledge, while honoring their time and contribution.

#### Connect Activity to Collections

At all times it should be possible to navigate from the crowdsourcing project, campaign, or transcription and tagging page to the source object. In the volunteer&#39;s account view, it should be possible to navigate from the project to which they contributed to the record of that collection in [loc.gov](https://loc.gov). Furthermore, there are opportunities to connect volunteers to the [Ask a Librarian](https://www.loc.gov/rr/askalib/) service from the crowdsourcing platform, such as in the discussion section, the project and collection pages, the homepage, and even in the footer.

#### Managing Projects

These key features and approaches should be available for the long-term sustainability of the project:

-   Continuity with existing staff workflows, including work within CTS (content transfer system)
-   A pipeline for the queue of projects, as well as a monthly mechanism for proposing, identifying, and planning new collections for transcription including a recurring forum for nominating projects - perhaps even a sandbox or test space in which details of nominated collections may be stored or prepared
-   Collections management in bulk to support creating an extensive queue; storing offline in advance of campaign, collection, or other programming needs
-   Enabling Community Managers to post, launch and queue projects and campaigns via an administrative interface. Over time, this functionality can be expanded with a permissions-based self-service mechanism for curators and collections staff to identify, flag, or queue projects for transcription. This will likely require coherence with Library of Congress web services, Design &amp; Development, as well as the CTS workflow

#### Applying our APIs

As with other features recommended here, it would be best to seize and map to existing workflows and technologies. A goal for the platform should be to identify and deliver collections via [loc.gov](https://loc.gov) API to become transcription projects. Furthermore, allowing the transcription results to be queried via the [loc.gov JSON API](https://libraryofcongress.github.io/data-exploration/) once associated with the source images or record would be valuable.

#### Transparent Development

The greatest opportunity exists to develop this tool and platform in the open, as open source with appropriate licensing. Documenting development in a repository like GitHub is advisable.

#### Identify, Articulate, Acknowledge Content Created by Volunteers

Identify content created by participants within loc.gov as volunteer-created. Allow volunteers with an account to retain a pointer to the work they created, with a persistent URL or URI. Actively acknowledge the contributions of volunteers in publications, presentations, social media, and communications outreach. License for content created in the transcription and tagging workflow should be public domain or CC0; it should also be explicitly stated and incorporated as metadata when presented as a dataset and in loc.gov. These contexts should be clearly communicated to volunteers contributing the content as well as researchers engaging with the content.

#### Data Available for Download

To complement research and exploration at the object and collection level, providing transcription and tagging results as a bulk data set would allow researchers in a range of disciplines to explore patterns and connections across collections. The transcription text and tags should be licensed as openly as possible and volunteers should be kept informed of the ways their efforts support discovery in the Library of Congress systems, as well as the role their work plays in other scholarly inquiry.

#### Navigating options to get started

Visitors and volunteers should be able to navigate the available collections in several ways. For example, presenting available projects as a list or set of tiles and incorporating filtering and sorting capability would allow volunteers to swiftly make sense of the active opportunities. Incorporating existing metadata offers other ways to orient volunteers to opportunities. For example, offering selection based on the object time period or era, location metadata, or subject heading. Finally, as participation increases, it may be possible to estimate time to complete a project based on participation data. This approach serves the needs of visitors who wish to dedicate a specific amount of time to their visit to the project.

## **GROW**

### Sustaining and Improving through Workflows and Spaces of Participation

Once the system has been designed, developed, and launched and once visitors become volunteers, there are endless opportunities to improve and sustain the platform and the program based on the ways people use it, their needs and challenges, and information gathered in the process of participation.

#### Show the Work!

Displaying the work of others in the system allows participants, whether new or seasoned, to more quickly understand that others are contributing to shared goals. The visibility of content &amp; contribution also signals active collaboration. Furthermore, visual indications of collaboration, whether intended or even in conflict, can be reflected in an interface that shows the efforts of editing. Allowing content to be editable, then marking out those edits—with font, size or other indicator—allows individuals to better understand who and what has come before them on the page.

#### Create an Atmosphere

Creating a shared understanding of expectations around behavior and communication can help shape expectations of respect and civility in this space. Inviting participants to acknowledge and commit to a Code of Conduct provides them the opportunity to reflect on how they will engage with others, as well as offers them support for framing communication they receive. Examples of public community codes of conduct include those of the Coral Project and Airbnb; the former articulates acceptable and unacceptable behavior and expectations, while the latter asks customers (guests) to sign a code of conduct pledge as part of the booking process.

#### Clear Examples

As participants create transcription and tagged content and more collections are added, plenty of examples to best represent what is needed when encountering decision-making moments will emerge. In the interim, creating clear and annotated examples may be useful to those who are just getting started with transcription and tagging.

#### Collate and Connect Extraneous Knowledge

As volunteers participate in the crowdsourcing initiative, they will acquire, recall, and perhaps seek to share information and knowledge with others; perhaps to be helpful to other volunteers and, at other times, as an expression of their interest and engagement with Library of Congress collections. They may wish to share examples and further non-Library of Congress resources. A discussion board or forum can help volunteers achieve their motivations of learning, contributing to wider knowledge (a greater good), and to build community or a sense of shared purpose through discussion. It may also be useful to create an asset level discussion for specific or nuanced questions about the asset image or page that is receiving transcription and tagging activity. Impressive examples of discussion spaces in crowdsourcing projects include the Zooniverse talk pages and the Discourse implementation in use by In the Spotlight at the British Library.

#### Sustain Interest and Increase the Capability of Participants

As described above, visitors may have many different motivations when they first arrive at the crowdsourcing platform; they may also have different motivations each time they arrive on site. Their movement to becoming volunteers may be catalyzed by offering a range of tasks, heterogeneous collections, and oscillating levels of complexity. Furthermore, the system may be built with tracks that prompt a participant to continue in the next step, or asks them to contribute to a new task. It is also possible to blend these approaches and particularly helpful if these are cyclical or distributed opportunities - either naturally based on variety in the collections or designed by community management approaches. Furthermore, offering opportunities to problem-solve, support other volunteers in other roles, level up in transcription and tagging tasks, or self-select for more complex (or pilot) tasks can create a dynamic experience that is rewarding to volunteers and the program ecosystem.

#### Build Knowledge for Outcomes

It is recommended that Community Managers and staff with collections expertise work together closely to build programming and engagement in relation to the transcription and tagging tasks. This programming could take the shape of essays, webinars, edited video content, chats hosted in discussion pages or social networks, and in-person events. In these activities, persistent URLs for the page, collection, and campaign (or collection of tags) would be required. In the previous section, recommendations were shared for connecting activity to collections. It is also possible to connect collections to catalyze activity; for example, a prompt or pathway from the collection or object Project One page to the crowdsourcing platform.

#### Practice

One way to encourage activity is to offer a low risk point of entry in which a volunteer might practice and keep notes, such as in a sandbox. This space may also make it possible for a volunteer to elect to receive feedback that can increase their confidence, coherence and consistency in transcription and tagging, and connection between their goals and those of the program. Another means of training could be a practice page, potentially offered after a volunteer has made a few contributions or after they have created an account.

#### Piloting

The Library of Congress Labs team is well-situated to partner with staff in the Office of the Chief Information Officer and Library Services to continue to run crowdsourcing experiments focused on tasks, cataloging and metadata, and machine learning. Examples include working with Optical Character Recognition (OCR) and Handwritten Text Recognition (HTR) outputs to assess quality of transcription &amp; assistance with tagging; parsing task workflows; repeated passes on the same material for thematic, semantic, or other tagging; named entity recognition and more. Furthermore, there are opportunities to integrate other collections and materials into a crowdsourced workflow including audio-visual and time-based media objects. Creating an extensible tool or system into which features that emerge from experiments could be added would support the evolution of the project, as well as create opportunities for volunteers to grow their skills and knowledge.


================================================
FILE: docs/for-developers.md
================================================
# For Developers

## Prerequisites

This application can run on a single Docker host using docker-compose
(recommended for development environments). See the [development Readme](../development/README.md) for more information. Note that the instructions below assume you'll be developing on your host rather than in a container. The development Readme provides instructions on performing development in a purely containerized environment, without installing any dependencies (outside of git and your container tool of choice) on the host.

For production, see the
[cloudformation](https://github.com/LibraryOfCongress/concordia/tree/master/cloudformation) directory for AWS Elastic Container Service
stack templates.

## Running Concordia

### Docker Compose

```bash
git clone https://github.com/LibraryOfCongress/concordia.git
```

If you're intending to edit static resources, templates, etc. and would like to
enable Django's DEBUG mode, ensure that your environment has `DEBUG=true` set
before you run `docker-compose up` for the `app` container. The easiest way to
do this permanently is to add it to the `.env` file:

```bash
echo DEBUG=true >> .env
```

##### Install the application virtual environment

These steps only need to be performed the first time you set up a fresh
virtualenv environment:

1. Ensure that you have the necessary C library dependencies available:

    - `libmemcached`
    - `postgresql`
    - `node` & `npm` for the front-end tools

1. Ensure that you have Python 3.8 or later installed

1. Install [pipenv](https://docs.pipenv.org/) either using a tool like
   [Homebrew](https://brew.sh) (`brew install pipenv`) or using `pip`:

    ```bash
    pip3 install pipenv
    ```

1. If you encounter errors installing psycopg, you may need to set LDFLAGS in your environment variables.

1. Let Pipenv create the virtual environment and install all of the packages,
   including our developer tools:

    ```bash
    pipenv install --dev
    ```

    n.b. if `libmemcached` is installed using Homebrew you will need to [set the CFLAGS long enough to build it](https://stackoverflow.com/questions/14803310/error-when-install-pylibmc-using-pip#comment94853072_19432949):

    ```bash
    CFLAGS=$(pkg-config --cflags libmemcached) LDFLAGS=$(pkg-config --libs libmemcached) pipenv install --dev
    ```

    Once it has been installed you will not need to repeat this process unless
    you upgrade the version of libmemcached or Python installed on your system.

1. Configure the Django settings module in the `.env` file which Pipenv will use
   to automatically populate the environment for every command it runs:

    ```bash
    echo DJANGO_SETTINGS_MODULE="concordia.settings_dev" >> .env
    ```

    You can use this to set any other values you want to customize, such as
    `POSTGRESQL_PW` or `POSTGRESQL_HOST`.

    n.b. to allow a local server to connect to the dockerized db, set `POSTGRESQL_PORT=54323` - the db container's external Postgres port.

1. Make sure that [redis](https://redis.io/docs/getting-started/) is installed and
   running.

1. Configure Turnstile in your `.env` file. Unless specifically testing Turnstile,
   you'll probably want the following settings:

    ```bash
    echo TURNSTILE_SITEKEY=1x00000000000000000000BB >> .env
    echo TURNSTILE_SECRET=1x0000000000000000000000000000000AA >> .env
    ```

    Those two settings ensure all Turnstile tests pass. See [Turnstile Testing](https://developers.cloudflare.com/turnstile/troubleshooting/testing/) for other options.

### Local Development Environment

You will likely want to run the Django development server on your localhost
instead of within a Docker container if you are working on the backend. This is
best done using the same `pipenv`-based toolchain as the Docker deployments:

#### Python Dependencies

Python dependencies and virtual environment creation are handled by
[pipenv](https://docs.pipenv.org/).

If you want to add a new Python package requirement to the application
environment, it must be added to the Pipfile and the Pipfile.lock file.
This can be done with the command:

```bash
pipenv install <package>
```

If the dependency you are installing is only of use for developers, mark it as
such using `--dev` so it will not be deployed to servers — for example:

```bash
pipenv install --dev django-debug-toolbar
```

Both the `Pipfile` and the `Pipfile.lock` files must be committed to the source
code repository any time you change them to ensure that all testing uses the
same package versions which you used during development.

#### Launching the environment

In order to successfully launch the environment, the environment variables
`POSTGRESQL_PW` and `DJANGO_SETTINGS_MODULE` must be set. `POSTGRESQL_PW`
may be set to any value (which will become the database password for the
environment), but `DJANGO_SETTINGS_MODULE` should be set to
`concordia.settings_dev` to use the development settings file.

```bash
export POSTGRESQL_PW=password
export DJANGO_SETTINGS_MODULE=concordia.settings_dev
```

```bash
cd concordia
docker-compose up
```

Browse to [localhost](http://localhost)

#### Setting up a local development server

##### See section - [Ensuring your work follows the Library's coding standards](https://github.com/LibraryOfCongress/concordia/blob/master/docs/how-we-work.md#ensuring-your-work-follows-the-librarys-coding-standards) in How We Work

##### Start the support services

Instead of running `docker-compose up` as above, start everything except the app:

```bash
docker-compose up -d db redis importer celerybeat
```

This will run the database in a container to ensure that it always matches the
expected version and configuration. If you want to reset the database, simply
delete the local container so it will be rebuilt the next time you run
`docker-compose up`: `docker-compose rm --stop db`.

##### Install front end

1. Install Node 20. If you're on MacOS, you can install it using brew:

    ```bash
    brew install node@20
    ```

1. Use NPM to install our development tools:

    ```bash
    npm install
    ```

1. In another terminal, start Vite to watch for changes to the SCSS files and
   compile them to CSS, and for changes in the bundled, hashed and compressed JS files:

    ```bash
    npx vite
    ```

    If you only want to build, bundle, and compress them a single time without live updates:

    ```bash
    npx vite build
    ```

1) You may need to manually create a logs directory.

    ```bash
    mkdir logs
    ```

1) Collect Django static files:

    ```bash
    pipenv run ./manage.py collectstatic --no-post-process
    ```

##### Start the application server

1. Apply any database migrations:

    ```bash
    pipenv run ./manage.py migrate
    ```

1. Start the development server:

    ```bash
    pipenv run ./manage.py runserver
    ```

#### Running the unit tests

Use the `settings_local_test` Django settings in your environment. Your `.env` file should look something like:

```bash
POSTGRESQL_PW=password
DJANGO_SETTINGS_MODULE=concordia.settings_local_test
```

Bring up the docker database and redis servers:

```bash
docker-compose up -d db redis
```

Then execute the tests:

```bash
pipenv run ./manage.py test
```

#### Import Data

Once the database, redis service, importer and the application
are running, you're ready to import data.
First, [create a Django admin user](https://docs.djangoproject.com/en/2.1/intro/tutorial02/#creating-an-admin-user)
and log in as that user.
Then, go to the Admin area (under Account) and click "Bulk Import Items".
Upload a spreadsheet populated according to the instructions. Once all the import
jobs are complete, publish the Campaigns, Projects, Items and Assets that you
wish to make available.

#### Data Model Graph

To generate a model graph, make sure that you have [GraphViz](https://graphviz.org/doc/info/command.html) installed (e.g.
`brew install graphviz` or `apt-get install graphviz`) and use the
[django-extensions `graph_models`](https://django-extensions.readthedocs.io/en/latest/graph_models.html) command:

```bash
dot -Tsvg <(pipenv run ./manage.py graph_models concordia importer) -o concordia.svg
```

## Other Front-End Tools

### Public-facing URLs

1. If you need a list of public-facing URLs for testing, there's a management
   command which may be helpful:

    ```bash
    pipenv run ./manage.py print_frontend_test_urls
    ```

### Accessibility testing using aXe

Automated tools such as [aXe](https://www.deque.com/axe/) are useful for
catching low-hanging fruit and regressions. You run aXe against a development
server by giving it one or more URLs:

```bash
npx axe-cli --show-errors http://localhost:8000/
pipenv run ./manage.py print_frontend_test_urls | xargs npx axe-cli --show-errors
```

### Static Image Compression

When you update any of the files under `concordia/static/img`, please use an
optimizer such as [ImageOptim](https://imageoptim.com) or [Caesium](https://caesium.app/)
to **losslessly** compress JPEG, PNG, SVG, etc. files.

```bash
brew install --cask imageoptim
open -a ImageOptim concordia/static/img/
```


================================================
FILE: docs/how-we-work.md
================================================
# How We Work

## Principles

Our basic principles are:

-   We produce open source software, shared in repositories where it may be inspected by the public who places their trust in it and copied for use by other agencies or institutions.
-   We adhere to the basic practices of agile software development, using the Scrum development framework.
-   We practice human-centered design. Everything that we produce is highly accessible, per [WCAG 2.1](https://www.w3.org/TR/WCAG21/).
-   Finally, we believe in having the relevant decision-makers at the table during all meetings, to maximize efficiency and maintain momentum.

## Product Team

This is a cross functional product team for Concordia made up of members across the Library who are working together. This product team will be comprised of the following roles:

-   Product owner
-   Product manager (Scrum master)
-   Technical lead
-   User Experience designer
-   Developers (Front-end, Back-end, Full-stack)
-   QA Tester
-   Community Managers (content writers, administrators)

This team participates in stand ups, product alignment, backlog grooming and retrospectives in service of prioritizing, defining and delivering value to the department and the public it serves.

## Sprint Organization and Meetings

Each sprint is three weeks long. We have a sprint kick off the first day of the new sprint. There are five basic meeting rhythms:

-   **Backlog grooming and Sprint Planning, every 2 weeks**
    -   Structure: tickets in the backlog are sorted by priority, the team adds acceptance criteria, estimates size, and assigns the tasks to a team member.
-   **Demo and retrospectives, every 2 weeks**
    -   At the end of each sprint, Developers or content writers demo completed work in the sprint for the larger library stakeholders. During demo, we will confirm if the user acceptance criteria is met and moved to be tested. Following the demo, the team will go through a retrospective. These are held back-to-back, on the same day

## Definition of Done

So that we can work more efficiently and be confident in the quality of the work we are delivering, we have a clear definition of what it means for a user story to be done, or production-ready.

**For delivering a user story to the product team:**

-   Story needs to be written in a way that is clear from both a development and a testing standpoint. Stories will need to be reviewed by the product team during creation.
-   Acceptance criteria should include the relevant tests needed (unit, security, performance, acceptance, etc)
-   Acceptance criteria should include the objective of the story, for use in approval by PO or tech team or both
-   The delivered functionality should match the acceptance criteria of the user story

**For product team to accept the user story and ship it:**

-   The functionality meets the acceptance criteria
-   The product team has verified the functionality in staging
-   All tests must pass in the stage environment (unit, integration, feature)
-   The delivered functionality should be 508 compliant
-   Security requirements must be met
-   All documentation must be up to date (diagrams, training documentation, API documentation, help text, etc)
-   The delivered functionality should be compatible with the latest versions of Firefox, Chrome and Safari

## Processes

### Testing Strategy

We practice testing at three levels: unit tests, integration tests, and feature tests. The requirements for creating and maintaining each kind of test are:

-   Unit - Unit tests must be created for all new code, during the sprint in which the code is written, with coverage of at least 90%.
-   Integration - Code must include tests that verify that interfaces are functioning as designed.
-   Feature - New features must have functional definitions of the thing that they are to perform, and a description of human-performable actions to verify that they perform that thing.

#### Testing new code

Each ticket will include acceptance tests, especially for new user facing functionality. When the developer signals that the ticket is ready for test, they will move it to the `Needs test` column and ping the tester in a comment on the ticket.

Testers will identify issues - HIGH, LOW, or NONE. Here are the criteria for each of the levels:

-   FAIL: Does not meet the acceptance criteria and cannot complete the acceptance test.
-   PASS: Meets both the acceptance criteria and the acceptance tests. When a ticket passes but there are noticeable opportunities for improvements or enhancements, close the ticket, create a new ticket, and add it to the backlog.

If all user acceptance criteria has been met, the ticket will be closed and moved to Done column.

Final step: Technical lead will create a release with all tickets that are done.

**How to provide feedback**

If feature testers find issues to address:

-   FAIL: comment and @ the developer in the feature ticket
-   Enhancements or Improvements: open a new FEATURE ticket. This ticket will be added to the backlog and be up for prioritization in the alignment meeting and backlog grooming. Link to the related ticket by adding the issue #.

If a FAIL issue needs to be addressed, tester should expect to be available to respond to developers questions and retest until acceptance criteria is met.

### Ticket Movement in a Sprint

**For a new feature ticket:**

1. Ticket is generated as an issue and placed in the backlog
2. Product owner will place priority tickets in a sprint
3. Product Manager will ensure all acceptance criteria has been articulated and assign developer
4. Developer will move to In Progress when ticket is being worked on
5. When Developer has completed the initial code, they will move the code into crowd-test.loc.gov
6. Developer moves ticket into test and assigns it to the Product Owner to review feature needs
7. Product Owner tests the feature against the Acceptance Criteria and provides feedback to devs if needed
8. Product Owner approves feature then assigns to QA
9. QA will affirm AC and test broader functionality and accessibility. Will pass/fail ticket. Outcome of testing will be written in comments.
    - If pass, QA will close ticket and move to Done.
    - If fail, QA will move ticket back into In Progress and assigned back to developer
10. If additional issues are found in testing that are not related to the feature of functionality, new tickets will be written by QA and added to the backlog. Ticket will be assigned to PO for further ticket development and grooming.

**For system wide upgrades**

1. Ticket is generated as an issue and placed in the backlog in GitHub
2. Technical Lead will place priority tickets in a sprint
3. Product Manager will ensure all acceptance criteria has been articulated and assign developer
4. Developer will move to In Progress when ticket is being worked on
5. Unit testing incorporated into the code pipeline
    - Manually run unit tests
    - CI/CD integration
6. Move ticket into test and assign peer review testing by developer
    - If fail, developer provides feedback, moves ticket back to In Progress and assigns to the original dev
    - If pass, assign to QA for regression testing
7. Tester will copy the [Regression Testing Checklist](https://staff.loc.gov/wikis/x/UomCBQ) as a comment in the ticket
8. Tester will go through all the functionality described in the checklist
    - If fail, provides feedback in the comments, moves ticket back to In Progress and assigns to dev
    - If pass, checks boxes to show that all main functionality are working and moves ticket to done

### Branch strategy and Pull Request Process

#### Git branching strategy

We have two long-lived git branches, `master` and `release`.

The `master` branch continuously deploys to our development environment.

The `release` branch continuously deploys to our staging environment.
Our development and staging environments are on AWS and only accessible through the Library's network.

##### Starting new work

When someone begins new work, they cut a new branch from `master` and name it after their work, perhaps `feature1`. New changes are pushed to the feature branch origin.

##### Merging to `master`

When new work is complete, we set up a Pull Request (PR) from `feature1` to `master`. Discussion about, and approval of changes by either the Technical Lead, Product Owner or both happens in the PR interface in GitHub.

Once this new work is approved we merge the code, which closes the PR.
From here, our CI pipeline will build the new changes on the `master` branch. Next, our CD pipeline will deploy the new work to our development environment.

##### Merging to `release`

Once the development work on a sprint is completed, we set up a PR from `master` to `release`.

This constitutes a new release candidate. Any last-minute discussion, as well as approval happens in the PR interface. Once approved by the Technical Lead, Product Owner or both and merged, CI runs for `release` branch to the staging environment.

##### Tagging and deploying to production

When the `release` branch has been fully tested in the staging environment, we create a GitHub release with a tag on the `release` branch.

Either trigger a Jenkins build manually or wait for continuous integration for the `release` branch to kick in. This will build a cleanly tagged versioned release candidate and upload the docker images to Amazon Elastic Container Registry.

To deploy to production, create a new task revision for the `concordia-prod` task which updates the version numbers of the docker containers to match the recently built cleanly tagged release candidate. Update the production service to use the new task definition revision. Monitor the health check endpoint to ensure the service is updated to the proper version.

##### Patching production mid-sprint

If a problem is identified in production that needs a quick fix, we code the fix to production in a new branch cut from `release`, maybe called `prod_fix`. We set up a PR against `release` for review and discussion.

Any QA or manual testing will take place in the staging environment deployed from the `release` branch. Once the release is tagged and deployed to production, we have to bring those new changes in release back into master. We use rebase again: `git rebase master release`.

### Code quality and review process

Code reviews are about keeping code clean and limiting technical debt. We will look for things that increase technical debt or create an environment where technical debt can be introduced easily later. Each pull request will be reviewed by the technical lead or an assigned reviewer. The reviewer will look closely for untested code, check that any tests actually test what they are supposed to, and confirm that the changes follow the Library's coding standards.

### Ensuring your work follows the Library's coding standards

The project extends the standard Django settings model for project configuration and the Django test framework for unit tests.

#### Configuring your virtual env

The easiest way to install the site is using [Pipenv](https://pipenv.readthedocs.io/) to manage the virtual environment and install dependencies.

#### Configure your local checkout with code-quality hooks

1.  Install [pre-commit](https://pre-commit.com/)
1.  Run `pre-commit install`

Now every time you make a commit in Git the various tools listed in the next
section will automatically run and report any problems.

n.b. Each time you check out a new copy of this Git repository, run `pre-commit install`.

#### Configure your editor with helpful tools:

[setup.cfg](https://github.com/LibraryOfCongress/concordia/blob/master/setup.cfg) contains configuration for [pycodestyle](https://pypi.org/project/pycodestyle/), [isort](https://pypi.org/project/isort/) and [flake8](https://pypi.org/project/flake8/).

Configure your editor to run black and isort on each file at save time.

1.  Install [black](https://pypi.org/project/black/) and integrate it with your editor of choice.
2.  Run [flake8](http://flake8.pycqa.org/en/latest/) to ensure you don't increase the warning count or introduce errors with your commits.
3.  This project uses [EditorConfig](https://editorconfig.org) for code consistency.

If you can't modify your editor, here is how to run the code quality
tools manually:

```
    $ black .
    $ isort --recursive
```

Black should be run prior to isort. It's recommended to commit your code
before running black, after running black, and after running isort so
the changes from each step are visible.

## Tools we use

-   GitHub - We use our GitHub organization for storing both software and collaboratively-maintained text.
-   Slack - We use Slack for communication that falls outside of the structure of Jira or GitHub, but that doesn’t rise to the level of email, or for communication that it’s helpful for everybody else to be able to observe.
-   WebEx - We use WebEx for video conferencing in all our meetings


================================================
FILE: entrypoint.sh
================================================
#!/bin/bash
# Container entrypoint: prepares the log file, brings the database schema and
# the base site configuration up to date, optionally sends a Sentry test
# event, and finally starts the Daphne ASGI server on port 80.

set -e -u # Exit immediately for unhandled errors or undefined variables

# Make sure the log directory and log file exist before any manage.py command
# runs (presumably the logging configuration writes here; confirm in settings).
mkdir -p /app/logs
touch /app/logs/concordia.log

# Generate merge migrations non-interactively so that diverged migration
# branches do not block the `migrate` step below.
echo "Running makemigrations"
./manage.py makemigrations --merge --noinput

echo "Running migrations"
./manage.py migrate

echo "Ensuring our base configuration is present in the database"
./manage.py ensure_initial_site_configuration

# `-v` tests whether the variable is set at all, so this check is safe under
# `set -u` even when SENTRY_BACKEND_DSN is not defined.
if [ -v SENTRY_BACKEND_DSN ]; then
    echo "Testing Sentry configuration"
    echo "from sentry_sdk import capture_message;capture_message('This is a test event');" | ./manage.py shell
fi

# NOTE(review): daphne is started as a child of this shell (no `exec`), so
# signals delivered to the container's main process reach bash first. Confirm
# that shutdown behavior is acceptable for the deployment.
echo "Running Django ASGI server"
daphne -b 0.0.0.0 -p 80 concordia.asgi:application


================================================
FILE: exporter/__init__.py
================================================


================================================
FILE: exporter/admin.py
================================================
# Register your models here.


================================================
FILE: exporter/apps.py
================================================
from django.apps import AppConfig


class ExporterConfig(AppConfig):
    """Django application configuration for the ``exporter`` app."""

    # Python path of the application this configuration applies to.
    name = "exporter"


================================================
FILE: exporter/exceptions.py
================================================
from typing import List, Tuple


class UnacceptableCharacterError(ValueError):
    """
    Signals that text slated for export contains disallowed characters.

    The complete list of offending positions is kept on the instance (as
    ``violations``) so callers can report exactly where each character was
    found.

    Args:
        violations: `(line, column, character)` triples, one per disallowed
            character.  Line and column numbers are both **1-based** so they
            can be shown to users as-is.
    """

    def __init__(self, violations: List[Tuple[int, int, str]]):
        self.violations: List[Tuple[int, int, str]] = violations

        # Describe each violation as "line L col C -> 'x'"; the character is
        # rendered with repr() so whitespace and control characters are visible.
        described = []
        for line_no, column_no, character in violations:
            described.append(f"line {line_no} col {column_no} -> {character!r}")

        summary = ", ".join(described)
        super().__init__(f"Unacceptable characters found: {summary}")


================================================
FILE: exporter/migrations/__init__.py
================================================


================================================
FILE: exporter/models.py
================================================
# Create your models here.


================================================
FILE: exporter/tabular_export/admin.py
================================================
# encoding: utf-8
"""
Helpers for exporting Django admin querysets as Excel or CSV files.

Usage in a ModelAdmin:

    actions = (export_to_excel_action, export_to_csv_action)

These actions take the current queryset and export it using the same field
selection you would get from `values()` by default. The download filename is
derived from the `ModelAdmin.model._meta.verbose_name_plural` unless a custom
filename is passed.

These helpers are adapted from the original django-tabular-export implementation:
https://github.com/LibraryOfCongress/django-tabular-export/blob/master/tabular_export/admin.py
"""

from functools import wraps
from typing import Any, Callable, Iterable

from django.contrib.admin import ModelAdmin
from django.db.models import QuerySet
from django.http import HttpRequest, HttpResponse
from django.utils.encoding import force_str as force_text
from django.utils.translation import gettext_lazy as _

from .core import (
    export_to_csv_response,
    export_to_excel_response,
    flatten_queryset,
)


def ensure_filename(suffix: str) -> Callable[[Callable[..., Any]], Callable[..., Any]]:
    """
    Decorator factory to ensure a default filename for export admin actions.

    If the wrapped action is called with ``filename=None``, the filename is
    built from ``modeladmin.model._meta.verbose_name_plural`` plus the given
    suffix.

    Args:
        suffix (str): File extension to append (for example, ``"csv"`` or
            ``"xlsx"``).

    Returns:
        Callable[[Callable[..., Any]], Callable[..., Any]]: A decorator that
        wraps an admin action and injects a default filename when needed.
    """

    def outer(f: Callable[..., Any]) -> Callable[..., Any]:
        @wraps(f)
        def inner(
            modeladmin: ModelAdmin,
            request: HttpRequest,
            queryset: QuerySet[Any],
            filename: str | None = None,
            *args: Any,
            **kwargs: Any,
        ) -> HttpResponse:
            if filename is None:
                filename = "%s.%s" % (
                    force_text(modeladmin.model._meta.verbose_name_plural),
                    suffix,
                )
            return f(
                modeladmin,
                request,
                queryset,
                *args,
                filename=filename,
                **kwargs,
            )

        return inner

    return outer


@ensure_filename("xlsx")
def export_to_excel_action(
    modeladmin: ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[Any],
    filename: str | None = None,
    field_names: Iterable[str] | None = None,
    extra_verbose_names: dict[str, str] | None = None,
) -> HttpResponse:
    """
    Admin action: download the selected records as an Excel XLSX file.

    The queryset is passed through :func:`flatten_queryset` together with
    the optional ``field_names`` and ``extra_verbose_names``; the resulting
    headers and rows are handed to :func:`export_to_excel_response`.

    Args:
        modeladmin (ModelAdmin): The Django admin class that owns this action.
        request (HttpRequest): The current admin request.
        queryset (QuerySet[Any]): The selected objects to export.
        filename (str | None): Optional download filename. When omitted, the
            ``ensure_filename("xlsx")`` decorator builds one from the model's
            ``verbose_name_plural`` and the ``"xlsx"`` suffix.
        field_names (Iterable[str] | None): Optional field names to include
            in the export. When omitted, :func:`flatten_queryset` chooses
            the fields.
        extra_verbose_names (dict[str, str] | None): Optional mapping of
            field names to custom column headers.

    Returns:
        HttpResponse: The response produced by
        :func:`export_to_excel_response`.
    """
    flatten_options = {
        "field_names": field_names,
        "extra_verbose_names": extra_verbose_names,
    }
    column_labels, data_rows = flatten_queryset(queryset, **flatten_options)
    return export_to_excel_response(filename, column_labels, data_rows)


export_to_excel_action.short_description = _("Export to Excel")


@ensure_filename("csv")
def export_to_csv_action(
    modeladmin: ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[Any],
    filename: str | None = None,
    field_names: Iterable[str] | None = None,
    extra_verbose_names: dict[str, str] | None = None,
) -> HttpResponse:
    """
    Admin action: download the selected records as a CSV file.

    The queryset is passed through :func:`flatten_queryset` together with
    the optional ``field_names`` and ``extra_verbose_names``; the resulting
    headers and rows are handed to :func:`export_to_csv_response`.

    Args:
        modeladmin (ModelAdmin): The Django admin class that owns this action.
        request (HttpRequest): The current admin request.
        queryset (QuerySet[Any]): The selected objects to export.
        filename (str | None): Optional download filename. When omitted, the
            ``ensure_filename("csv")`` decorator builds one from the model's
            ``verbose_name_plural`` and the ``"csv"`` suffix.
        field_names (Iterable[str] | None): Optional field names to include
            in the export. When omitted, :func:`flatten_queryset` chooses
            the fields.
        extra_verbose_names (dict[str, str] | None): Optional mapping of
            field names to custom column headers.

    Returns:
        HttpResponse: The response produced by
        :func:`export_to_csv_response`.
    """
    flatten_options = {
        "field_names": field_names,
        "extra_verbose_names": extra_verbose_names,
    }
    column_labels, data_rows = flatten_queryset(queryset, **flatten_options)
    return export_to_csv_response(filename, column_labels, data_rows)


export_to_csv_action.short_description = _("Export to CSV")


================================================
FILE: exporter/tabular_export/core.py
================================================
# encoding: utf-8
"""Exports to tabular (2D) formats

This module contains functions which take (headers, rows) pairs and return
HttpResponses with either XLSX or CSV downloads

The ``export_to_FORMAT_response`` functions accept a ``filename``, and
``headers`` and ``rows``. This allows full control over the data using
non-database data-sources, the Django ORM's various aggregations and
optimization methods, generators for large responses, control over the
column names, or post-processing using methods like ``get_FOO_display()``
to format the data for display.

The ``flatten_queryset`` utility used to generate lists from QuerySets
intentionally does not attempt to handle foreign-key fields to avoid
performance issues. If you need to include such data, prepare it in advance
using whatever optimizations are possible and pass the data in directly.

If your Django settings module sets ``TABULAR_RESPONSE_DEBUG`` to ``True``
the data will be dumped as an HTML table and will not be delivered as a
download.

Originally from
https://github.com/LibraryOfCongress/django-tabular-export/blob/master/tabular_export/core.py
"""

import csv
import datetime
from functools import wraps
from itertools import chain
from typing import Any, Callable, Iterable, Mapping, Sequence
from urllib.parse import quote

import xlsxwriter
from django.conf import settings
from django.db.models import QuerySet
from django.http import HttpResponse, StreamingHttpResponse
from django.utils.encoding import force_str

ResponseType = HttpResponse | StreamingHttpResponse


def get_field_names_from_queryset(qs: QuerySet[Any]) -> list[str]:
    """
    List the column names a ``values()`` version of ``qs`` would produce.

    The queryset is converted with ``values()`` first so that extra selects
    and annotations are reported under the same names Django uses for
    ``values()`` results.

    Args:
        qs: QuerySet to introspect.

    Returns:
        Names taken, in this order, from the query's ``select`` entries
        (each entry's ``target.name``), its ``extra_select`` keys, and its
        ``annotation_select`` keys.
    """

    # Work from the values() queryset so calculated aggregates are included
    # under the names a values() queryset would return.
    values_query = qs.values().query

    return [
        *(column.target.name for column in values_query.select),
        *values_query.extra_select.keys(),
        *values_query.annotation_select.keys(),
    ]


def flatten_queryset(
    qs: QuerySet[Any],
    field_names: Iterable[str] | None = None,
    extra_verbose_names: Mapping[str, str] | None = None,
) -> tuple[list[str], Iterable[Sequence[Any]]]:
    """
    Convert a queryset into headers and row tuples for tabular export.

    By default the column headers are derived from the queryset's field
    names (as returned by ``get_field_names_from_queryset``) and the rows
    use ``values_list()`` for efficient iteration.

    If ``field_names`` is provided, only those fields are included and they
    are used to order both headers and row values.

    The ``extra_verbose_names`` mapping can override the verbose names for
    specific fields, including related lookups or calculated values.

    Args:
        qs: Base queryset to flatten.
        field_names: Optional explicit list of field names to include.
        extra_verbose_names: Optional mapping of field names to friendly
            column labels. This can be used to provide proper names for
            related lookups (for example,
            ``{"institution__title": "Institution"}``) or calculated values
            (for example, ``{"items__count": "Item Count"}``).

    Returns:
        A 2-tuple of ``(headers, rows)`` where ``headers`` is a list of
        column labels and ``rows`` is an iterable of sequences of values.
    """

    if field_names is None:
        field_names = get_field_names_from_queryset(qs)

    # Headers will use the verbose names where available and fall back to the
    # field name if not (e.g. custom aggregate or extra fields):
    verbose_names = {i.name: i.verbose_name for i in qs.model._meta.fields}
    if extra_verbose_names is not None:
        verbose_names.update(extra_verbose_names)

    headers = [verbose_names.get(i, i) for i in field_names]

    return headers, qs.values_list(*field_names)


def convert_value_to_unicode(v: Any) -> str:
    """
    Turn a single cell value into the string used in tabular exports.

    The rules are applied in order:

    * ``None`` becomes the empty string.
    * Any object exposing an ``isoformat`` attribute (such as ``date`` and
      ``datetime`` instances) is rendered by calling ``isoformat()``.
    * Everything else is coerced with ``force_str``.

    Args:
        v: Value to convert.

    Returns:
        String representation of ``v`` following the rules above.
    """

    if v is None:
        return ""

    # Duck-typed check: anything with isoformat() is rendered through it.
    if hasattr(v, "isoformat"):
        return v.isoformat()

    return force_str(v)


def set_content_disposition(
    f: Callable[..., ResponseType],
) -> Callable[..., ResponseType]:
    """
    Decorator that stamps a download ``Content-Disposition`` on a response.

    The wrapped callable receives ``filename`` as its first positional
    argument and must return an object supporting item assignment for
    headers (an ``HttpResponse`` or subclass). After it returns, the header
    is set to an ``attachment`` disposition whose ``filename*`` parameter
    carries the percent-encoded filename (RFC 5987 style).

    Args:
        f: Callable that builds the HTTP response for a given filename.

    Returns:
        Wrapped callable that sets ``Content-Disposition`` on every response
        it returns.
    """

    @wraps(f)
    def inner(filename: str, *args: Any, **kwargs: Any) -> ResponseType:
        built_response = f(filename, *args, **kwargs)

        # See RFC 5987 for the filename* spec:
        encoded_filename = quote(filename)
        disposition = "attachment; filename*=UTF-8''%s" % encoded_filename
        built_response["Content-Disposition"] = disposition

        return built_response

    return inner


def return_debug_reponse(
    f: Callable[..., ResponseType],
) -> Callable[..., ResponseType]:
    """
    Decorator that can replace an export response with an HTML debug table.

    The ``TABULAR_RESPONSE_DEBUG`` setting is read on every call (missing
    means disabled). When it is truthy the wrapped function is skipped and
    the same arguments are passed to ``export_to_debug_html_response``;
    any ``Content-Disposition`` header is then deleted from that response.
    Otherwise the wrapped function is called normally.

    Args:
        f: Export callable to wrap.

    Returns:
        Wrapped callable returning either the original export response or
        the HTML debug response.
    """

    @wraps(f)
    def inner(filename: str, *args: Any, **kwargs: Any) -> ResponseType:
        debug_enabled = getattr(settings, "TABULAR_RESPONSE_DEBUG", False)

        if debug_enabled:
            debug_response = export_to_debug_html_response(filename, *args, **kwargs)
            # No attachment header, so the table is not offered as a download.
            del debug_response["Content-Disposition"]
            return debug_response

        return f(filename, *args, **kwargs)

    return inner


def export_to_debug_html_response(
    filename: str,
    headers: Iterable[Any],
    rows: Iterable[Sequence[Any]],
) -> StreamingHttpResponse:
    """
    Build an HTML table response for inspection of tabular export data.

    This is used when ``TABULAR_RESPONSE_DEBUG`` is enabled. It renders the
    headers and rows into a simple Bootstrap-styled HTML table and returns a
    ``StreamingHttpResponse``.

    Header labels and cell values are converted with
    ``convert_value_to_unicode`` and then HTML-escaped, so characters such
    as ``<``, ``>`` and ``&`` in the exported data are displayed literally
    instead of being interpreted as markup. Newlines inside row cells are
    rendered as ``<br>``.

    Args:
        filename: Suggested filename for the export (kept for API parity;
            not used when building the document).
        headers: Iterable of header labels.
        rows: Iterable of row sequences.

    Returns:
        StreamingHttpResponse streaming the HTML document.
    """

    # Function-scope import: ``html`` is part of the standard library and is
    # only needed by this debug helper.
    from html import escape

    def render_text(value: Any) -> str:
        # Escape *after* conversion so the final text is what gets escaped.
        return escape(convert_value_to_unicode(value))

    def output_generator():
        # Static markup is emitted as bytestrings; only the data is encoded.
        yield b"<!DOCTYPE html><html>"
        yield b'<head><meta charset="utf-8"><title>TABULAR DEBUG</title>'
        yield b'<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.3/dist/css/bootstrap.min.css">'  # noqa
        yield b"</head>"
        yield b'<body class="container-fluid"><div class="table-responsive"><table class="table table-striped">'  # noqa
        yield b"<thead><tr><th>"
        yield b"</th><th>".join(render_text(i).encode("utf-8") for i in headers)
        yield b"</th></tr></thead>"

        yield b"<tbody>"
        for row in rows:
            # The <br> substitution happens after escaping so the inserted
            # tag itself is not escaped.
            values = [
                render_text(i).replace("\n", "<br>").encode("utf-8") for i in row
            ]
            yield b"<tr><td>%s</td></tr>" % b"</td><td>".join(values)
        yield b"</tbody>"
        yield b"</table></div></body></html>"

    return StreamingHttpResponse(
        output_generator(), content_type="text/html; charset=UTF-8"
    )


@return_debug_reponse
@set_content_disposition
def export_to_excel_response(
    filename: str,
    headers: Iterable[Any],
    rows: Iterable[Sequence[Any]],
) -> HttpResponse:
    """
    Build an XLSX download from the given headers and rows.

    The workbook is written by ``xlsxwriter`` directly into the
    ``HttpResponse``, with the ``constant_memory`` and ``in_memory`` options
    both enabled and ``yyyy-mm-dd`` as the default date format. The header
    labels form the first worksheet row and are written with the same rules
    as data cells:

    * ``datetime`` values have their ``tzinfo`` dropped and are written as
      dates using the ``yyyy-mm-dd`` format;
    * ``date`` values are written as dates using the same format;
    * every other value is passed through
      ``force_str(value, strings_only=True)`` and written with the
      worksheet's generic ``write`` method.

    Args:
        filename: Download filename used in the ``Content-Disposition``
            header.
        headers: Iterable of header labels for the first row.
        rows: Iterable of row sequences.

    Returns:
        HttpResponse containing the XLSX file.
    """

    # XLSX is a zip container that is finalised when the workbook is closed,
    # so a plain (non-streaming) response is used as the output target.
    # See http://technet.microsoft.com/en-us/library/ee309278%28office.12%29.aspx
    resp = HttpResponse(
        content_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"
    )

    workbook_options = {
        "constant_memory": True,
        "in_memory": True,
        "default_date_format": "yyyy-mm-dd",
    }
    workbook = xlsxwriter.Workbook(resp, workbook_options)
    date_format = workbook.add_format({"num_format": "yyyy-mm-dd"})
    worksheet = workbook.add_worksheet()

    def write_cell(row_index: int, col_index: int, value: Any) -> None:
        # ``datetime`` must be tested first because it subclasses ``date``.
        if isinstance(value, datetime.datetime):
            # xlsxwriter cannot handle timezones:
            naive_value = value.replace(tzinfo=None)
            worksheet.write_datetime(row_index, col_index, naive_value, date_format)
            return
        if isinstance(value, datetime.date):
            worksheet.write_datetime(row_index, col_index, value, date_format)
            return
        worksheet.write(row_index, col_index, force_str(value, strings_only=True))

    # The header labels are simply the first record of the sheet.
    for row_index, record in enumerate(chain((headers,), rows)):
        for col_index, value in enumerate(record):
            write_cell(row_index, col_index, value)

    workbook.close()

    return resp


class Echo:
    """
    Minimal file-like object whose ``write`` hands the value straight back.

    This follows the pseudo-buffer approach from Django's "streaming CSV
    files" how-to:
    https://docs.djangoproject.com/en/1.8/howto/outputting-csv/#streaming-csv-files
    """

    def write(self, value: str) -> str:
        """Return ``value`` unchanged instead of storing it."""
        return value


@return_debug_reponse
@set_content_disposition
def export_to_csv_response(
    filename: str,
    headers: Iterable[Any],
    rows: Iterable[Sequence[Any]],
) -> StreamingHttpResponse:
    """
    Build a streaming CSV download from the given headers and rows.

    Every header label and cell is converted with
    ``convert_value_to_unicode`` and formatted by the standard library
    ``csv`` writer. Lines are produced lazily, one per iteration of the
    response, so the full CSV is never assembled in memory here.

    Args:
        filename: Download filename used in the ``Content-Disposition``
            header.
        headers: Iterable of header labels for the header row.
        rows: Iterable of row sequences.

    Returns:
        StreamingHttpResponse streaming the CSV content.
    """
    # ``csv.writer.writerow`` returns whatever the underlying ``write``
    # returns, and ``Echo.write`` returns the formatted line itself. That
    # lets each line be yielded directly. The same approach is not
    # available for Excel because xlsxwriter has no way to emit chunks
    # from ZipFile and StreamingHttpResponse does not offer a file-like
    # handle.
    writer = csv.writer(Echo())

    def csv_lines():
        yield writer.writerow([convert_value_to_unicode(label) for label in headers])

        for record in rows:
            yield writer.writerow([convert_value_to_unicode(cell) for cell in record])

    return StreamingHttpResponse(
        csv_lines(),
        content_type="text/csv; charset=utf-8",
    )


def force_utf8_encoding(
    f: Callable[[], Iterable[Sequence[Any]]],
) -> Callable[[], Iterable[Sequence[bytes]]]:
    """
    Decorator that UTF-8 encodes every value produced by a row generator.

    The wrapped callable takes no arguments and returns an iterable of
    rows. The decorated callable is a generator: for each source row it
    yields a new list holding ``value.encode("utf-8")`` for every value in
    that row.

    Args:
        f: Zero-argument callable returning an iterable of rows.

    Returns:
        Zero-argument callable yielding lists of UTF-8 encoded values.
    """

    @wraps(f)
    def inner() -> Iterable[Sequence[bytes]]:
        for source_row in f():
            encoded_row = []
            for value in source_row:
                encoded_row.append(value.encode("utf-8"))
            yield encoded_row

    return inner


================================================
FILE: exporter/templates/admin/exporter/unacceptable_character_report.html
================================================
{% extends "admin/base.html" %}

{% load concordia_text_tags %}

{% comment %}
Displays per-asset lists of unacceptable characters detected during export.
Each error entry provides a link to the asset's admin change page.
{% endcomment %}

{% block messages %}
    {# Messages are rendered elsewhere in the admin; suppress duplicate view #}
{% endblock messages %}

{% block extrahead %}
    {{ block.super }}
    <style>
        .char-error-table th {
            text-align: left;
        }

        .char-error-table td,
        .char-error-table th {
            padding: 0.25rem 0.75rem;
        }

        .char-error-table tr:nth-child(even) {
            background: #f9f9f9;
        }

        .char-error-table code {
            font-weight: bold;
            color: #dc3545; /* bootstrap danger */
            background: transparent;
        }
    </style>
{% endblock extrahead %}

{% block content %}
    <div id="content-main">
        <h2>Unacceptable Characters Report</h2>

        {% if errors %}
            <table class="char-error-table">
                <thead>
                    <tr>
                        <th>Asset</th>
                        <th>Violations&nbsp;(line, column, char)</th>
                    </tr>
                </thead>
                <tbody>
                    {% for entry in errors %}
                        <tr>
                            <td>
                                <a href="{% url 'admin:concordia_asset_change' entry.asset.pk %}">
                                    {{ entry.asset }}
                                </a>
                            </td>
                            <td>
                                <ul>
                                    {% for v in entry.violations %}
                                        <li>
                                            Line&nbsp;{{ v.0 }},&nbsp;Col&nbsp;{{ v.1 }}:
                                            <code>{{ v.2|reprchar }}</code>
                                        </li>
                                    {% endfor %}
                                </ul>
                            </td>
                        </tr>
                    {% endfor %}
                </tbody>
            </table>
        {% else %}
            <p>No unacceptable characters were found.</p>
        {% endif %}
    </div>
{% endblock content %}


================================================
FILE: exporter/tests/__init__.py
================================================


================================================
FILE: exporter/tests/test_exceptions.py
================================================
from django.test import TestCase

from exporter.exceptions import UnacceptableCharacterError


class UnacceptableCharacterErrorTests(TestCase):
    """Checks what ``UnacceptableCharacterError`` stores and reports."""

    def test_violations_are_stored(self):
        """The `violations` list given to the constructor is kept as-is."""
        expected = [(2, 3, "\u200b"), (4, 1, "\x00")]
        self.assertEqual(UnacceptableCharacterError(expected).violations, expected)

    def test_message_contains_formatted_details(self):
        """The exception text includes the position and the escaped character."""
        message = str(UnacceptableCharacterError([(1, 1, "\x00")]))
        self.assertIn("line 1 col 1", message)
        # The message is expected to show the character in escaped form,
        # i.e. a literal backslash followed by "x00". In this source file
        # that four-character text is spelled "\\x00".
        escaped_nul = "\\x00"
        self.assertIn(escaped_nul, message)


================================================
FILE: exporter/tests/test_tabular_export.py
================================================
import datetime
from unittest.mock import Mock

from django.db import models
from django.http import HttpResponse, StreamingHttpResponse
from django.test import TestCase, override_settings

from exporter.tabular_export.admin import (
    export_to_csv_action,
    export_to_excel_action,
)
from exporter.tabular_export.core import (
    Echo,
    convert_value_to_unicode,
    export_to_csv_response,
    export_to_debug_html_response,
    export_to_excel_response,
    flatten_queryset,
    force_utf8_encoding,
    get_field_names_from_queryset,
    set_content_disposition,
)


class DummyModel(models.Model):
    """
    Small model used as the ``model`` of the stub queryset and mock
    ``ModelAdmin`` in this test module.
    """

    # The explicit verbose names are what the ``flatten_queryset`` tests
    # expect to see as column headers ("Name", "Created").
    name = models.CharField(max_length=255, verbose_name="Name")
    created = models.DateField(null=True, verbose_name="Created")

    class Meta:
        # NOTE(review): presumably set explicitly because this test module is
        # not the models module of an installed app - confirm.
        app_label = "tests"


class DummyQuerySet:
    """
    Stand-in for a queryset, exposing only what these tests touch.

    ``values_list`` ignores its arguments and returns the canned rows,
    ``values`` returns the stub itself, and ``query`` exposes ``select``,
    ``extra_select`` and ``annotation_select`` attributes built from the
    configured field names.
    """

    def __init__(self, data, field_names):
        self.model = DummyModel
        self._field_names = field_names
        self._data = data

    def values_list(self, *args):
        # The requested field names are irrelevant for the stub.
        return self._data

    def values(self):
        return self

    @property
    def query(self):
        def make_field(field_name):
            # A "Field" class whose ``target`` attribute is an object with a
            # ``name`` attribute holding the field name.
            target = type("Target", (), {"name": field_name})()
            return type("Field", (), {"target": target})

        query_attributes = {
            "select": [make_field(field_name) for field_name in self._field_names],
            "extra_select": {"extra": "value"},
            "annotation_select": {"annotate": "value"},
        }
        return type("Query", (), query_attributes)()


class CoreTests(TestCase):
    """Tests for the helpers imported from ``exporter.tabular_export.core``."""

    XLSX_CONTENT_TYPE = (
        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"
    )

    @staticmethod
    def _read_stream(resp):
        """Join the chunks of a streaming response into one bytestring."""
        return b"".join(resp.streaming_content)

    def _assert_xlsx_attachment(self, resp, filename):
        """Check the response type, XLSX content type and download header."""
        self.assertIsInstance(resp, HttpResponse)
        self.assertEqual(resp["Content-Type"], self.XLSX_CONTENT_TYPE)
        self.assertEqual(
            "attachment; filename*=UTF-8''%s" % filename,
            resp["Content-Disposition"],
        )

    def test_convert_value_to_unicode(self):
        expectations = [
            (None, ""),
            ("abc", "abc"),
            (datetime.datetime(2020, 1, 1, 12, 0), "2020-01-01T12:00:00"),
            (datetime.date(2020, 1, 1), "2020-01-01"),
        ]
        for raw_value, rendered in expectations:
            self.assertEqual(convert_value_to_unicode(raw_value), rendered)

    def test_echo_write(self):
        self.assertEqual(Echo().write("abc"), "abc")

    def test_get_field_names_from_queryset(self):
        queryset = DummyQuerySet([], ["name", "created"])
        names = get_field_names_from_queryset(queryset)
        self.assertEqual(names, ["name", "created", "extra", "annotate"])

    def test_flatten_queryset_defaults(self):
        record = ("abc", datetime.date(2020, 1, 1))
        queryset = DummyQuerySet([record], ["name", "created"])
        headers, rows = flatten_queryset(queryset)
        self.assertEqual(headers, ["Name", "Created", "extra", "annotate"])
        self.assertEqual(list(rows), [("abc", datetime.date(2020, 1, 1))])

    def test_flatten_queryset_with_custom_headers(self):
        queryset = DummyQuerySet([("abc",)], ["name"])
        headers, rows = flatten_queryset(
            queryset,
            field_names=["name"],
            extra_verbose_names={"name": "Full Name"},
        )
        self.assertEqual(headers, ["Full Name"])
        self.assertEqual(list(rows), [("abc",)])

    def test_force_utf8_encoding(self):
        def text_rows():
            yield ["ü", "æ"]

        encoded_rows = force_utf8_encoding(text_rows)
        self.assertEqual(list(encoded_rows()), [[b"\xc3\xbc", b"\xc3\xa6"]])

    def test_set_content_disposition(self):
        def build_response(filename):
            return StreamingHttpResponse()

        resp = set_content_disposition(build_response)("test.csv")
        self.assertIn(
            "attachment; filename*=UTF-8''test.csv", resp["Content-Disposition"]
        )

    def test_export_to_debug_html_response(self):
        resp = export_to_debug_html_response(
            "test.html", ["h1", "h2"], [["val1", "val2"], ["val3", "val4"]]
        )
        self.assertIsInstance(resp, StreamingHttpResponse)
        document = self._read_stream(resp)
        for fragment in (b"<table", b"val1", b"val4"):
            self.assertIn(fragment, document)

    @override_settings(TABULAR_RESPONSE_DEBUG=False)
    def test_export_to_csv_response(self):
        resp = export_to_csv_response("test.csv", ["h1", "h2"], [["a", "b"]])
        self.assertIsInstance(resp, StreamingHttpResponse)
        self.assertIn(b"a", self._read_stream(resp))

    @override_settings(TABULAR_RESPONSE_DEBUG=True)
    def test_export_to_csv_response_debug(self):
        # With debug enabled the CSV export is swapped for the HTML table
        # and carries no download header.
        resp = export_to_csv_response("debug.csv", ["h1"], [["b"]])
        self.assertIsInstance(resp, StreamingHttpResponse)
        self.assertIn(b"<table", self._read_stream(resp))
        self.assertNotIn("Content-Disposition", resp)

    @override_settings(TABULAR_RESPONSE_DEBUG=False)
    def test_export_to_excel_response(self):
        data = [["x", datetime.date(2022, 1, 1)]]
        resp = export_to_excel_response("file.xlsx", ["h1", "h2"], data)
        self._assert_xlsx_attachment(resp, "file.xlsx")

    @override_settings(TABULAR_RESPONSE_DEBUG=False)
    def test_export_to_excel_response_with_datetime(self):
        data = [[datetime.datetime(2022, 1, 1, 12, 0)]]
        resp = export_to_excel_response("datetime.xlsx", ["h1"], data)
        self._assert_xlsx_attachment(resp, "datetime.xlsx")

    @override_settings(TABULAR_RESPONSE_DEBUG=True)
    def test_export_to_excel_response_debug(self):
        resp = export_to_excel_response("debug.xlsx", ["h1"], [["x"]])
        self.assertIsInstance(resp, StreamingHttpResponse)
        self.assertIn(b"<table", self._read_stream(resp))


class AdminTests(TestCase):
    """Tests for the admin export actions, driven by stub collaborators."""

    def setUp(self):
        # A mock ModelAdmin/request pair plus a canned two-row queryset.
        self.modeladmin = Mock()
        self.modeladmin.model = DummyModel
        self.request = Mock()
        self.queryset = DummyQuerySet(
            data=[("val1", "val2"), ("val3", "val4")],
            field_names=["name", "created"],
        )

    def _run_action(self, action, **options):
        """Invoke an admin action with the shared stub arguments."""
        return action(self.modeladmin, self.request, self.queryset, **options)

    def _assert_xlsx_download(self, response, encoded_filename):
        """Check the response type, content type prefix and download header."""
        self.assertIsInstance(response, HttpResponse)
        self.assertIn(
            "application/vnd.openxmlformats-officedocument", response["Content-Type"]
        )
        self.assertEqual(
            "attachment; filename*=UTF-8''%s" % encoded_filename,
            response["Content-Disposition"],
        )

    def test_export_to_excel_action_default_filename(self):
        response = self._run_action(export_to_excel_action)
        # Without an explicit filename the download is expected to be named
        # "dummy models.xlsx" (percent-encoded in the header).
        self._assert_xlsx_download(response, "dummy%20models.xlsx")

    def test_export_to_excel_action_with_custom_filename_and_fields(self):
        response = self._run_action(
            export_to_excel_action,
            filename="custom.xlsx",
            field_names=["name"],
            extra_verbose_names={"name": "Custom Name"},
        )
        self._assert_xlsx_download(response, "custom.xlsx")

    def test_export_to_csv_action_default_filename(self):
        response = self._run_action(export_to_csv_action)
        self.assertIsInstance(response, StreamingHttpResponse)
        body = b"".join(response.streaming_content)
        for expected_value in (b"val1", b"val4"):
            self.assertIn(expected_value, body)

    def test_export_to_csv_action_with_custom_filename_and_fields(self):
        response = self._run_action(
            export_to_csv_action,
            filename="custom.csv",
            field_names=["name"],
            extra_verbose_names={"name": "Custom Name"},
        )
        self.assertIsInstance(response, StreamingHttpResponse)
        body = b"".join(response.streaming_content)
        self.assertIn(b"val1", body)


================================================
FILE: exporter/tests/test_utils.py
================================================
from django.test import TestCase

from exporter.exceptions import UnacceptableCharacterError
from exporter.utils import (
    find_unacceptable_characters,
    is_acceptable_character,
    remove_unacceptable_characters,
    validate_text_for_export,
)


class UtilsValidationTests(TestCase):
    """Tests for the character validation and clean-up helpers."""

    def _assert_cleaned(self, dirty, expected):
        """Assert that cleaning ``dirty`` yields exactly ``expected``."""
        self.assertEqual(remove_unacceptable_characters(dirty), expected)

    def test_printable_ascii_is_acceptable(self):
        for char in ("A", "9", " "):
            self.assertTrue(is_acceptable_character(char))

    def test_whitelisted_nonprintable_is_acceptable(self):
        # Tab (\t) and NBSP (\xa0) are explicitly whitelisted
        for char in ("\t", "\xa0"):
            self.assertTrue(is_acceptable_character(char))

    def test_control_char_is_rejected(self):
        for char in ("\x00", "\x1f"):
            self.assertFalse(is_acceptable_character(char))

    def test_find_unacceptable_characters_returns_positions(self):
        text = "ok\nBad\x00line\nnext\tgood"
        # The only offender is the null byte at line 2, column 4 (1-based).
        self.assertEqual(find_unacceptable_characters(text), [(2, 4, "\x00")])

    def test_duplicate_violations_are_recorded(self):
        # Two null bytes on the same line are both reported.
        found = find_unacceptable_characters("a\x00b\x00")
        self.assertEqual(found, [(1, 2, "\x00"), (1, 4, "\x00")])

    def test_validate_text_for_export_passes_clean_text(self):
        # \u3000 (ideographic space) is whitelisted
        self.assertTrue(validate_text_for_export("Hello world!\nThis\u3000is ok."))

    def test_validate_text_for_export_raises_on_bad_text(self):
        # A zero-width space is not allowed.
        with self.assertRaises(UnacceptableCharacterError) as caught:
            validate_text_for_export("Bad\u200bText")
        self.assertEqual(caught.exception.violations, [(1, 4, "\u200b")])

    def test_remove_unacceptable_characters_removes_disallowed_chars(self):
        # Disallowed characters at the start, in the middle and at the end.
        self._assert_cleaned("\x00Start\u200bMiddleEnd\x1f", "StartMiddleEnd")

    def test_remove_unacceptable_characters_keeps_whitelisted_chars(self):
        # Whitelist must be honored: \t, NBSP, ideographic space, em space.
        text = "A\tB\xa0C\u3000D\u2003E"
        self._assert_cleaned(text, text)

    def test_remove_unacceptable_characters_preserves_newlines_and_crlf(self):
        # Newline forms stay exactly as they are while bad characters inside
        # the lines are dropped: a zero-width space inside "two" and a NUL
        # at the end of "three".
        self._assert_cleaned(
            "one\r\nt\u200bwo\nthree\x00\rfour",
            "one\r\ntwo\nthree\rfour",
        )

    def test_remove_unacceptable_characters_noop_on_clean_text(self):
        text = "Line 1\nLine 2\tTabbed\u3000Ideographic\u2003Em"
        self._assert_cleaned(text, text)

    def test_remove_unacceptable_characters_handles_multiple_lines(self):
        # Several unacceptable characters per line, across multiple lines.
        dirty_lines = [
            "ok line",
            "bad\x00line\x00with\x00many",
            "zero\u200bwidth\u200bspaces",
            "\x00\x00start and end\u200b",
        ]
        clean_lines = [
            "ok line",
            "badlinewithmany",
            "zerowidthspaces",
            "start and end",
        ]
        self._assert_cleaned("\n".join(dirty_lines), "\n".join(clean_lines))

    def test_remove_unacceptable_characters_preserves_carriage_return_alone(self):
        # Bare '\r' may appear in input (classic Mac, copy/paste artifacts).
        # Only the disallowed characters around it should be dropped.
        self._assert_cleaned("a\x00\rb\u200b\rc\x1f", "a\rb\rc")


================================================
FILE: exporter/tests/test_views.py
================================================
import io
import tempfile
import zipfile
from pathlib import Path
from unittest.mock import patch

from django.http import HttpResponse, HttpResponseRedirect
from django.test import TestCase, override_settings
from django.urls import reverse
from django.utils import timezone

from concordia.models import (
    Asset,
    Item,
    MediaType,
    Transcription,
    TranscriptionStatus,
    User,
)
from concordia.tests.utils import (
    create_asset,
    create_campaign,
    create_item,
    create_project,
)
from exporter.views import (
    ExportProjectToCSV,
    do_bagit_export,
    get_latest_transcription_data,
    get_original_asset_id,
    get_tag_values,
    remove_incomplete_items,
    write_distinct_asset_resource_file,
)

# Image URL passed as ``download_url`` for the asset built in
# ``ViewTests.setUp``.
DOWNLOAD_URL = (
    "http://tile.loc.gov/image-services/iiif/"
    "service:mss:mal:003:0036300:002/full/pct:25/0/default.jpg"
)

# URL passed as ``resource_url`` for the same asset.
RESOURCE_URL = "https://www.loc.gov/resource/mal.0043300/"


class ViewTests(TestCase):
    """
    Exercise the exporter views and the helper functions behind them.

    Every test starts from the fixture built in ``setUp``: a logged-in staff
    user plus one published campaign, project, item and asset, where the asset
    carries a single transcription with the text ``"Sample"``.
    """

    def setUp(self):
        """Create and log in a staff user and build the shared fixture data."""
        self.user = User.objects.create(
            username="tester", email="tester@example.com", is_staff=True
        )
        self.user.set_password("top_secret")
        self.user.save()
        self.assertTrue(
            self.client.login(username="tester", password="top_secret")  # nosec
        )

        self.campaign = create_campaign(published=True)
        self.project = create_project(campaign=self.campaign, published=True)
        self.item = create_item(project=self.project, published=True)

        self.asset = create_asset(
            item=self.item,
            title="TestAsset",
            description="Asset Description",
            download_url=DOWNLOAD_URL,
            resource_url=RESOURCE_URL,
            media_type=MediaType.IMAGE,
            sequence=1,
        )

        transcription = Transcription(
            asset=self.asset,
            user=self.user,
            text="Sample",
            submitted=timezone.now(),
            accepted=timezone.now(),
        )
        transcription.full_clean()
        transcription.save()

        # Create another project with the same slug in a different campaign
        # to ensure this does not cause issues with any exports
        campaign2 = create_campaign(published=True, slug="test-campaign-2")
        create_project(campaign=campaign2, published=True, slug=self.project.slug)

    def test_csv_export(self):
        """The campaign CSV export contains the header row and asset data."""
        response = self.client.get(
            reverse("transcriptions:campaign-export-csv", args=(self.campaign.slug,))
        )
        self.assertEqual(response.status_code, 200)
        # Decode the streamed bytes (instead of joining their ``repr``) so the
        # assertions run against the real CSV text.
        response_content = b"".join(response.streaming_content).decode()
        self.assertIn(
            "Campaign,Project,Item,ItemId,Asset,AssetId,AssetStatus", response_content
        )
        self.assertIn("TestAsset", response_content)
        self.assertIn("Sample", response_content)

    def test_campaign_bagit_export(self):
        """The campaign BagIt export returns a zip with the transcription."""
        response = self.client.get(
            reverse("transcriptions:campaign-export-bagit", args=(self.campaign.slug,))
        )
        self.assertEqual(response.status_code, 200)
        self.assertIn("Content-Disposition", response)

        # Use the archive as a context manager so the handle is always closed.
        with zipfile.ZipFile(io.BytesIO(response.content), "r") as zipped:
            names = zipped.namelist()
        self.assertIn("bagit.txt", names)
        self.assertIn("data/mss/mal/003/0036300/002.txt", names)

    def test_project_bagit_export(self):
        """The project BagIt export returns a zip with the transcription."""
        response = self.client.get(
            reverse(
                "transcriptions:project-export-bagit",
                args=(self.campaign.slug, self.project.slug),
            )
        )
        self.assertEqual(response.status_code, 200)
        self.assertIn("Content-Disposition", response)

        with zipfile.ZipFile(io.BytesIO(response.content), "r") as zipped:
            names = zipped.namelist()
        self.assertIn("bagit.txt", names)
        self.assertIn("data/mss/mal/003/0036300/002.txt", names)

    def test_project_csv_export(self):
        """Calling the project CSV view directly streams the asset data."""
        request = self.client.get("/").wsgi_request
        request.user = self.user
        request.user.is_staff = True

        response = ExportProjectToCSV.as_view()(
            request, campaign_slug=self.campaign.slug, project_slug=self.project.slug
        )

        self.assertEqual(response.status_code, 200)
        response_content = b"".join(response.streaming_content).decode()
        self.assertIn("TestAsset", response_content)
        self.assertIn("Sample", response_content)

    def test_item_bagit_export(self):
        """The item BagIt export returns a zip with the transcription."""
        response = self.client.get(
            reverse(
                "transcriptions:item-export-bagit",
                args=(self.campaign.slug, self.project.slug, self.item.item_id),
            )
        )
        self.assertEqual(response.status_code, 200)
        self.assertIn("Content-Disposition", response)

        with zipfile.ZipFile(io.BytesIO(response.content), "r") as zipped:
            names = zipped.namelist()
        self.assertIn("bagit.txt", names)
        self.assertIn("data/mss/mal/003/0036300/002.txt", names)

    def test_get_original_asset_id_fallback(self):
        """A URL on another host is handed back as the identifier."""
        fallback_url = "http://example.com/image.jpg"
        self.assertEqual(get_original_asset_id(fallback_url), fallback_url)

    def test_get_original_asset_id_service_match(self):
        """The ``service:`` URL form yields the colon-separated identifier."""
        url = "http://tile.loc.gov/image-services/iiif/service:mss:mss38299:mss38299_016:0588/full/pct:100/0/default.jpg"
        result = get_original_asset_id(url)
        self.assertEqual(result, "mss:mss38299:mss38299_016:0588")

    def test_get_original_asset_id_master_match(self):
        """The ``master/`` URL form yields the path without its suffix."""
        # This is a made-up URL because no current Assets
        # have a "master" URL to test against
        url = "http://tile.loc.gov/image-services/iiif/master/mus/123/456/mus123456.002/full/pct:100/0/default.jpg"
        result = get_original_asset_id(url)
        self.assertEqual(result, "mus/123/456/mus123456")

    def test_get_original_asset_id_public_match(self):
        """The ``public:`` URL form (over https) yields the identifier."""
        url = "https://tile.loc.gov/image-services/iiif/public:music:musbernstein-100020080:musbernstein-100020080.0021/full/pct:100.0/0/default.jpg"
        result = get_original_asset_id(url)
        self.assertEqual(result, "musbernstein-100020080:musbernstein-100020080.0021")

    def test_get_original_asset_id_failure(self):
        """A tile.loc.gov URL matching no known pattern raises ValueError."""
        # This tests if a URL doesn't match any of the patterns
        invalid_url = "http://tile.loc.gov/image-services/iiif/master/foo/bar/baz/full/pct:100/0/default.jpg"
        with self.assertRaises(ValueError):
            get_original_asset_id(invalid_url)

    def test_write_distinct_asset_resource_file_missing_url(self):
        """An asset without a resource URL aborts the resource file write."""
        self.asset.resource_url = ""
        self.asset.save()

        with tempfile.TemporaryDirectory() as tmpdir:
            with self.assertRaises(AssertionError):
                write_distinct_asset_resource_file([self.asset.pk], tmpdir)

    @override_settings(EXPORT_S3_BUCKET_NAME=None)
    @patch("exporter.views.logger")
    def test_do_bagit_export_no_s3(self, mock_logger):
        """Without an S3 bucket the archive is returned as a zip download."""
        assets = get_latest_transcription_data(Asset.objects.filter(pk=self.asset.pk))

        with tempfile.TemporaryDirectory() as tmpdir:
            response = do_bagit_export(assets, tmpdir, "sample-bagit")
            self.assertEqual(response.status_code, 200)
            self.assertIn("application/zip", response["Content-Type"])

    def test_remove_incomplete_items(self):
        """Assets of items that still have unfinished assets are dropped."""
        item2 = create_item(
            project=self.project, published=True, item_id="different-id"
        )
        create_asset(item=item2, transcription_status=TranscriptionStatus.NOT_STARTED)

        asset_qs = remove_incomplete_items(Item.objects.filter(project=self.project))
        self.assertEqual(asset_qs.count(), 1)
        self.assertEqual(asset_qs.first(), self.asset)

    def test_get_tag_values_empty(self):
        """An asset without tags is annotated with an empty string."""
        assets = get_tag_values(Asset.objects.filter(pk=self.asset.pk))
        self.assertEqual(list(assets.values_list("tag_values", flat=True))[0], "")

    def test_get_latest_transcription_data(self):
        """The annotation exposes the text of the newest transcription."""
        assets = get_latest_transcription_data(Asset.objects.filter(pk=self.asset.pk))
        self.assertEqual(list(assets)[0].latest_transcription, "Sample")

    @override_settings(EXPORT_S3_BUCKET_NAME="fake-bucket")
    @patch("exporter.views.boto3.resource")
    @patch("exporter.views.logger")
    def test_do_bagit_export_with_s3(self, mock_logger, mock_boto):
        """With an S3 bucket configured the archive is uploaded and redirected."""
        assets = get_latest_transcription_data(Asset.objects.filter(pk=self.asset.pk))

        with tempfile.TemporaryDirectory() as tmpdir:
            response = do_bagit_export(assets, tmpdir, "sample-bagit")
            self.assertIsInstance(response, HttpResponseRedirect)
            self.assertIn("fake-bucket.s3.amazonaws.com", response["Location"])
            mock_boto().Bucket().upload_file.assert_called()

    @override_settings(EXPORT_S3_BUCKET_NAME=None)
    @patch("exporter.views.logger")
    def test_do_bagit_export_without_transcription(self, mock_logger):
        """An asset with no transcription produces no payload text file."""
        asset = create_asset(
            item=self.item,
            sequence=99,
            title="No Transcription",
            download_url=DOWNLOAD_URL,
            resource_url=RESOURCE_URL,
        )

        with tempfile.TemporaryDirectory() as tmpdir:
            assets = get_latest_transcription_data(Asset.objects.filter(pk=asset.pk))
            response = do_bagit_export(assets, tmpdir, "sample-bagit-no-txt")

            self.assertEqual(response.status_code, 200)
            self.assertIn("application/zip", response["Content-Type"])

            # Read contents of the zip
            zip_bytes = io.BytesIO(response.content)
            with zipfile.ZipFile(zip_bytes, "r") as zip_file:
                file_list = zip_file.namelist()

            # There should be no .txt transcription files
            transcription_files = [
                f
                for f in file_list
                if f.endswith(".txt")
                and f.startswith("data/")
                and not f.endswith("item-resource-urls.txt")
            ]
            self.assertEqual(
                transcription_files,
                [],
                f"Unexpected transcription files: {transcription_files}",
            )

    @override_settings(EXPORT_S3_BUCKET_NAME=None)
    @patch("exporter.views.render")  # <- patch render itself
    @patch("exporter.views.shutil.rmtree")
    def test_do_bagit_export_validation_errors_render(self, mock_rmtree, mock_render):
        """With a request, validation errors are rendered via the template."""
        bad_asset = create_asset(
            item=self.item,
            sequence=42,
            title="BadAsset",
            download_url=DOWNLOAD_URL,
            resource_url=RESOURCE_URL,
        )
        Transcription.objects.create(
            asset=bad_asset,
            user=self.user,
            text="Bad\u200bText",  # invalid char
            submitted=timezone.now(),
        )
        assets = get_latest_transcription_data(
            Asset.objects.filter(pk__in=[self.asset.pk, bad_asset.pk])
        )

        request = self.client.get("/dummy").wsgi_request
        request.user = self.user
        request.user.is_staff = True

        # make render return a simple HttpResponse we can ignore
        mock_render.return_value = HttpResponse("dummy")

        # NOTE(review): ``exporter.views.shutil`` is the shared ``shutil``
        # module, so while this patch is active TemporaryDirectory's own
        # cleanup presumably also hits the mock and the directory may be left
        # on disk -- confirm and narrow the patch if that matters.
        with tempfile.TemporaryDirectory() as tmpdir:
            response = do_bagit_export(
                assets,
                tmpdir,
                "bad-bagit",
                request=request,
            )

            mock_render.assert_called_once()
            args, kwargs = mock_render.call_args
            template_name = args[1]  # args[0] is the request
            context = args[2]  # third positional arg
            self.assertEqual(
                template_name,
                "admin/exporter/unacceptable_character_report.html",
            )
            self.assertIn("errors", context)
            self.assertEqual(len(context["errors"]), 1)
            self.assertEqual(context["errors"][0]["asset"], bad_asset)

            mock_rmtree.assert_called_once_with(Path(tmpdir), ignore_errors=True)

            self.assertEqual(response.content, b"dummy")

    @override_settings(EXPORT_S3_BUCKET_NAME=None)
    @patch("exporter.views.shutil.rmtree")
    def test_do_bagit_export_validation_errors_no_request(self, mock_rmtree):
        """
        When called without a request, do_bagit_export should return the raw
        error list.
        """
        bad_asset = create_asset(
            item=self.item,
            sequence=99,
            title="BadAssetNoRequest",
            download_url=DOWNLOAD_URL,
            resource_url=RESOURCE_URL,
        )
        Transcription.objects.create(
            asset=bad_asset,
            user=self.user,
            text="Invisible\u200eText",  # LEFT-TO-RIGHT MARK -> invalid
            submitted=timezone.now(),
        )

        assets = get_latest_transcription_data(
            Asset.objects.filter(pk__in=[self.asset.pk, bad_asset.pk])
        )

        with tempfile.TemporaryDirectory() as tmpdir:
            errors = do_bagit_export(assets, tmpdir, "bad-bagit-no-request")

            # helper should return a list, not an HttpResponse
            self.assertIsInstance(errors, list)
            self.assertEqual(len(errors), 1)
            self.assertEqual(errors[0]["asset"], bad_asset)

            # directory should have been removed
            mock_rmtree.assert_called_once_with(Path(tmpdir), ignore_errors=True)

    @override_settings(EXPORT_S3_BUCKET_NAME=None)
    @patch("exporter.views.shutil.rmtree")
    @patch(
        "pathlib.Path.exists", return_value=False
    )  # force the exists() check to fail
    def test_do_bagit_export_validation_errors_no_export_dir(
        self,
        mock_exists,
        mock_rmtree,
    ):
        """
        If validation fails and the export directory no longer exists,
        do_bagit_export should NOT attempt to call shutil.rmtree.
        """
        bad_asset = create_asset(
            item=self.item,
            sequence=77,
            title="BadAssetNoDir",
            download_url=DOWNLOAD_URL,
            resource_url=RESOURCE_URL,
        )
        Transcription.objects.create(
            asset=bad_asset,
            user=self.user,
            text="Oops\u200b",  # zero-width space -> invalid
            submitted=timezone.now(),
        )

        assets = get_latest_transcription_data(
            Asset.objects.filter(pk__in=[self.asset.pk, bad_asset.pk])
        )

        with tempfile.TemporaryDirectory() as tmpdir:
            # invoke without request -> should return raw errors list
            errors = do_bagit_export(assets, tmpdir, "bad-bagit-no-dir")

            # exists() forced to False -> rmtree must not be called
            mock_rmtree.assert_not_called()
            self.assertIsInstance(errors, list)
            self.assertEqual(len(errors), 1)


================================================
FILE: exporter/utils.py
================================================
"""
Utility helpers for validating outgoing text.

The primary public entry-point is `exporter.utils.validate_text_for_export`,
which raises an `exporter.exceptions.UnacceptableCharacterError` when any
non-printable Unicode character outside the module's small whitelist of
spacing characters is detected.  Validation is performed per line so the
caller receives the exact location of every problem character.
"""

from typing import List, Tuple

from exporter.exceptions import UnacceptableCharacterError

# Characters that `str.isprintable()` rejects but that are nevertheless
# allowed in exported text.
_WHITELIST = [
    "\t",  # Tab
    "\xa0",  # Non-breaking space
    "\u3000",  # Ideographic space; used in Chinese/Japanese/Korean
    "\u2003",  # em space (space the width of the 'm' character)
]


def is_acceptable_character(character: str) -> bool:
    """
    Return `True` when `character` may appear in exported text.

    A character is acceptable when `str.isprintable()` reports it as
    printable, or when it is one of the explicitly whitelisted spacing
    characters in `_WHITELIST` (which `str.isprintable()` would reject).

    Args:
        character: A single Unicode character.

    Returns:
        `True` if the character is printable or whitelisted; otherwise
        `False`.
    """

    return character.isprintable() or character in _WHITELIST


def find_unacceptable_characters(text: str) -> List[Tuple[int, int, str]]:
    """
    Locate every unacceptable character in *text*.

    The scan is performed line by line so that the exact position (line and
    column) of each offending character can be fed back to the caller.  Only
    line feed, carriage return and the carriage-return/line-feed pair are
    treated as line breaks; every other character, including the additional
    separators recognised by `str.splitlines()` (vertical tab, form feed,
    U+001C to U+001E, U+0085, U+2028 and U+2029), is checked with
    `is_acceptable_character()`.

    Args:
        text: The string to validate.

    Returns:
        A list of `(line_number, column_number, character)` triples, both
        numbers 1-based.  The list may contain duplicates because each
        instance of an invalid character is recorded individually.
    """

    violations: List[Tuple[int, int, str]] = []

    # Do not use ``str.splitlines()`` here: it splits on (and throws away)
    # several non-printable separators such as "\x0c", "\x1c" or "\u2028",
    # which would then never be reported even though
    # ``remove_unacceptable_characters()`` treats them as unacceptable.
    # "\r\n" is collapsed first so it counts as a single line break.
    lines = text.replace("\r\n", "\n").replace("\r", "\n").split("\n")

    for line_no, line in enumerate(lines, start=1):
        for col_no, ch in enumerate(line, start=1):
            if not is_acceptable_character(ch):
                violations.append((line_no, col_no, ch))

    return violations


def validate_text_for_export(text: str) -> bool:
    """
    Check that `text` is safe to export, raising when it is not.

    Args:
        text: The text destined for export.

    Returns:
        `True` when `find_unacceptable_characters()` reports nothing.

    Raises:
        UnacceptableCharacterError: If at least one unacceptable character is
        found.  The exception is constructed with the full list of
        violations.
    """

    problems = find_unacceptable_characters(text)
    if not problems:
        return True
    raise UnacceptableCharacterError(problems)


def remove_unacceptable_characters(text: str) -> str:
    """
    Return `text` with every unacceptable character stripped out.

    A character is kept when it is a line feed or carriage return, or when
    `is_acceptable_character()` accepts it (printable or whitelisted).
    Everything else is silently dropped; unlike validation, no error is
    raised.

    Args:
        text: The input string to sanitize.

    Returns:
        A new string containing only the characters that were kept, in their
        original order, so the line structure of the input is preserved.
    """

    line_breaks = ("\n", "\r")
    # A single pass over the characters is enough: the keep/drop decision for
    # each character does not depend on which line it belongs to.
    return "".join(
        ch for ch in text if ch in line_breaks or is_acceptable_character(ch)
    )


================================================
FILE: exporter/views.py
================================================
import os
import re
import shutil
import tempfile
from collections.abc import Iterable
from logging import getLogger
from pathlib import Path
from typing import Any, List

import bagit
import boto3
from django.conf import settings
from django.contrib.admin.views.decorators import staff_member_required
from django.contrib.postgres.aggregates.general import StringAgg
from django.db.models import OuterRef, Subquery, TextField, Value
from django.db.models.functions import Coalesce
from django.db.models.query import QuerySet
from django.http import (
    HttpRequest,
    HttpResponse,
    HttpResponseRedirect,
)
from django.shortcuts import render
from django.utils.decorators import method_decorator
from django.views.generic import TemplateView

from concordia.models import (
    Asset,
    Campaign,
    Item,
    Project,
    Transcription,
    TranscriptionStatus,
)
from exporter.exceptions import UnacceptableCharacterError
from exporter.tabular_export.core import export_to_csv_response, flatten_queryset
from exporter.utils import validate_text_for_export

# Module-level logger used by the export helpers and views in this module.
logger = getLogger(__name__)


def get_latest_transcription_data(
    asset_qs: QuerySet[Asset],
) -> QuerySet[Asset]:
    """
    Add a ``latest_transcription`` annotation to every asset.

    The value is the ``text`` of the asset's ``Transcription`` with the
    highest primary key, or an empty string when the asset has no
    transcriptions at all.

    Args:
        asset_qs:
            QuerySet[Asset] to annotate.

    Returns:
        QuerySet[Asset]: The input queryset annotated with
        ``latest_transcription``.
    """
    # Correlated subquery: this asset's transcription texts, newest pk first,
    # limited to a single row.
    newest_text = (
        Transcription.objects.filter(asset=OuterRef("pk"))
        .order_by("-pk")
        .values("text")[:1]
    )
    # Fallback used when the subquery yields no row.
    empty_text = Value("", output_field=TextField())

    return asset_qs.annotate(
        latest_transcription=Coalesce(Subquery(newest_text), empty_text)
    )


def get_tag_values(asset_qs: QuerySet[Asset]) -> QuerySet[Asset]:
    """
    Add a ``tag_values`` annotation holding each asset's tags as one string.

    Tag text is read from ``userassettagcollection__tags__value`` and joined
    with ``"; "``.  Assets without tags receive an empty string.

    Args:
        asset_qs:
            QuerySet[Asset] to annotate.

    Returns:
        QuerySet[Asset]: The input queryset annotated with ``tag_values``.
    """
    joined_tags = StringAgg(
        "userassettagcollection__tags__value",
        "; ",
        default=Value("", output_field=TextField()),
    )
    return asset_qs.annotate(tag_values=joined_tags)


def remove_incomplete_items(item_qs: QuerySet[Item]) -> QuerySet[Asset]:
    """
    Return the assets of those items in ``item_qs`` that are fully completed.

    An item counts as incomplete as soon as one of its assets has the status
    NOT_STARTED, IN_PROGRESS or SUBMITTED; all assets of such an item are
    left out of the result.

    Args:
        item_qs:
            QuerySet[Item] to check for completeness.

    Returns:
        QuerySet[Asset]: Assets belonging to completed items, ordered by
        project, item and sequence.
    """
    unfinished_statuses = (
        TranscriptionStatus.NOT_STARTED,
        TranscriptionStatus.IN_PROGRESS,
        TranscriptionStatus.SUBMITTED,
    )
    unfinished_assets = Asset.objects.filter(
        item__in=item_qs, transcription_status__in=unfinished_statuses
    )
    # Drop every item that owns at least one unfinished asset.
    completed_items = item_qs.exclude(asset__in=unfinished_assets)

    return Asset.objects.filter(item__in=completed_items).order_by(
        "item__project", "item", "sequence"
    )


def get_original_asset_id(download_url: str) -> str:
    """
    Derive a stable external asset identifier from a LOC download URL.

    An ``https://`` scheme is first normalised to ``http://``.  For
    ``tile.loc.gov`` URLs a best-effort pattern is then used to extract the
    identifier from the ``service:``, ``master/`` or ``public:`` segment.
    URLs on any other host are returned as they are after the scheme
    normalisation.

    Args:
        download_url:
            The asset's download URL.

    Returns:
        str: Identifier suitable for naming files inside the BagIt payload.

    Raises:
        ValueError: If the URL looks like ``tile.loc.gov`` but no ID is found.
    """
    # Normalise the scheme only.  A blanket ``replace("https", "http")`` would
    # also rewrite any later occurrence of "https" in the path or identifier.
    if download_url.startswith("https://"):
        download_url = "http://" + download_url[len("https://") :]

    if download_url.startswith("http://tile.loc.gov/"):
        pattern = (
            r"/service:([A-Za-z0-9:.\-\_]+)/"
            + r"|/master/([A-Za-z0-9/]+)([0-9.]+)"
            + r"|/public:[A-Za-z0-9]+:([A-Za-z0-9:.\-_]+?)/"
        )
        asset_id = re.search(pattern, download_url)
        if not asset_id:
            logger.error(
                "Could not find a matching asset ID in download URL %s",
                download_url,
            )
            raise ValueError(
                f"Could not find a matching asset ID in download URL {download_url}"
            )
        # Only the groups of the alternative that matched are non-empty; the
        # first of them is the identifier.
        matching_asset_id = next(group for group in asset_id.groups() if group)
        logger.debug(
            "Found asset ID %s in download URL %s",
            matching_asset_id,
            download_url,
        )
        return matching_asset_id

    logger.warning(
        "Download URL does not start with tile.loc.gov: %s",
        download_url,
    )
    return download_url


def write_distinct_asset_resource_file(
    assets: Iterable[Any], export_base_dir: str | Path
) -> None:
    """
    Write a unique list of resource URLs for the provided assets.

    The file is named ``item-resource-urls.txt`` and written (in append mode,
    UTF-8 encoded) at the export root. Each line contains one distinct
    ``Asset.resource_url``.

    Args:
        assets:
            Iterable of asset identifiers or a QuerySet[Asset]. Passed to
            ``Asset.objects.filter(pk__in=assets)``.
        export_base_dir:
            Directory where the file should be created.

    Raises:
        AssertionError: If an asset has no ``resource_url``. The message
            names the affected asset's title.
    """
    asset_resource_file = os.path.join(export_base_dir, "item-resource-urls.txt")

    # One row per distinct resource URL; the title is only needed for the
    # error report below.
    distinct_resource_urls = (
        Asset.objects.filter(pk__in=assets)
        .order_by("resource_url")
        .values_list("resource_url", "title")
        .distinct("resource_url")
    )

    # Explicit encoding so the output does not depend on the host locale.
    with open(asset_resource_file, "a", encoding="utf-8") as f:
        for url, title in distinct_resource_urls:
            if not url:
                logger.error("No resource URL found for asset %s", title)
                raise AssertionError(f"No resource URL found for asset {title}")
            f.write(url)
            f.write("\n")


def do_bagit_export(
    assets: Iterable[Asset] | QuerySet[Asset],
    export_base_dir: str | Path,
    export_filename_base: str,
    request: HttpRequest | None = None,
) -> HttpResponse | HttpResponseRedirect | List[dict[str, Any]]:
    """
    Build and deliver a BagIt package for ``assets`` or report invalid chars.

    The function validates every asset's ``latest_transcription``. For each
    unacceptable character it records:
    - the asset ID
    - the 1-based line number
    - the 1-based column number
    - the offending character

    Behaviour:
    1. Validation pass: files are written (UTF-8 encoded) only after a
       transcription passes validation.
    2. Failure(s): any files already written are removed. If ``request`` is
       supplied a template is rendered, otherwise the raw error list is
       returned.
    3. All clear: a BagIt structure is created, zipped and either returned as a
       download or uploaded to S3. The temporary zip file is deleted once it
       has been delivered.

    Args:
        assets:
            Iterable or QuerySet of ``Asset`` to export. Each must have
            ``download_url`` and ``latest_transcription``.
        export_base_dir:
            Temporary directory into which the BagIt hierarchy is built.
        export_filename_base:
            Base name (without ``.zip``) for the archive.
        request:
            Current request. If provided, an error template will be rendered
            when validation fails.

    Returns:
        HttpResponse | HttpResponseRedirect | list[dict[str, Any]]:

        - a download response when packaging locally
        - a redirect to the uploaded archive when S3 is configured
        - a list of validation errors when ``request`` is ``None`` and errors
          were found
    """
    export_base_dir = Path(export_base_dir)
    errors: List[dict[str, Any]] = []

    # Validate each transcription; only valid ones are written to disk
    for asset in assets:
        asset_id = get_original_asset_id(asset.download_url)
        asset_id = asset_id.replace(":", "/")  # BagIt-safe path fragment

        transcription = asset.latest_transcription or ""
        try:
            validate_text_for_export(transcription)
        except UnacceptableCharacterError as err:
            errors.append({"asset": asset, "violations": err.violations})
            continue

        # Passed validation -> write the transcription file
        asset_path, asset_filename = os.path.split(asset_id)
        asset_dest_path = export_base_dir / asset_path
        asset_dest_path.mkdir(parents=True, exist_ok=True)

        if transcription:
            # Transcriptions may legitimately contain non-ASCII characters,
            # so do not rely on the host's locale encoding.
            with open(
                asset_dest_path / f"{asset_filename}.txt", "w", encoding="utf-8"
            ) as fp:
                fp.write(transcription)

    # If any errors -> cleanup and report
    if errors:
        if export_base_dir.exists():
            shutil.rmtree(export_base_dir, ignore_errors=True)

        if request is not None:
            return render(
                request,
                "admin/exporter/unacceptable_character_report.html",
                {"errors": errors},
            )
        return errors

    # All assets valid -> create BagIt, zip, upload / return
    write_distinct_asset_resource_file(assets, export_base_dir)

    bagit.make_bag(
        export_base_dir,
        {
            "Content-Access": "web",
            "Content-Custodian": "dcms",
            "Content-Process": "crowdsourced",
            "Content-Type": "textual",
            "LC-Bag-Id": export_filename_base,
            "LC-Items": f"{len(assets)} transcriptions",
            "LC-Project": "gdccrowd",
            "License-Information": "Public domain",
        },
    )

    # The archive is created as ``<export_base_dir>.zip``, i.e. next to the
    # export directory rather than inside it, so removing the export
    # directory does not remove the archive.
    archive_name = shutil.make_archive(
        str(export_base_dir), "zip", root_dir=export_base_dir
    )
    export_filename = f"{export_filename_base}.zip"

    try:
        s3_bucket = getattr(settings, "EXPORT_S3_BUCKET_NAME", None)
        if s3_bucket:
            logger.debug("Uploading exported bag to S3 bucket %s", s3_bucket)
            s3 = boto3.resource("s3")
            s3.Bucket(s3_bucket).upload_file(archive_name, export_filename)

            return HttpResponseRedirect(
                f"https://{s3_bucket}.s3.amazonaws.com/{export_filename}"
            )

        # Local download: the whole archive is read into the response body
        # before the file is closed and removed.
        with open(archive_name, "rb") as zip_file:
            response = HttpResponse(zip_file.read(), content_type="application/zip")
        response["Content-Disposition"] = f"attachment; filename={export_filename}"
        return response
    finally:
        # Best-effort removal of the temporary archive so repeated exports do
        # not accumulate zip files on disk.
        try:
            os.remove(archive_name)
        except OSError:
            logger.warning("Could not remove temporary archive %s", archive_name)


class ExportCampaignToCSV(TemplateView):
    """
    Export one campaign's assets as CSV, one row per asset.

    Each row carries the asset's latest transcription text and its tag
    values joined into a single semicolon-delimited string.
    """

    @method_decorator(staff_member_required)
    def get(self, request: HttpRequest, *args, **kwargs) -> HttpResponse:
        """
        Build the CSV response for the campaign named in the URL.

        Args:
            request: Current HTTP request.

        Returns:
            HttpResponse: CSV content for the campaign.
        """
        campaign_slug = self.kwargs["campaign_slug"]

        campaign_assets: QuerySet[Asset] = Asset.objects.filter(
            item__project__campaign__slug=campaign_slug
        )
        assets: QuerySet[Asset] = get_tag_values(
            get_latest_transcription_data(campaign_assets)
        )

        # Exported columns, in output order.
        exported_fields = [
            "item__project__campaign__title",
            "item__project__title",
            "item__title",
            "item__item_id",
            "title",
            "id",
            "transcription_status",
            "download_url",
            "latest_transcription",
            "tag_values",
        ]
        # Header label for each field.
        column_labels = {
            "item__project__campaign__title": "Campaign",
            "item__project__title": "Project",
            "item__title": "Item",
            "item__item_id": "ItemId",
            "item_id": "ItemId",
            "title": "Asset",
            "id": "AssetId",
            "transcription_status": "AssetStatus",
            "download_url": "DownloadUrl",
            "latest_transcription": "Transcription",
            "tag_values": "Tags",
        }

        headers, data = flatten_queryset(
            assets,
            field_names=exported_fields,
            extra_verbose_names=column_labels,
        )

        logger.info("Exporting %s to csv", campaign_slug)
        return export_to_csv_response("%s.csv" % campaign_slug, headers, data)


class ExportItemToBagIt(TemplateView):
    """
    Build a BagIt archive for a single item consisting of completed assets.

    Only assets with ``TranscriptionStatus.COMPLETED`` are included.
    """

    @method_decorator(staff_member_required)
    def get(
        self, request: HttpRequest, *args, **kwargs
    ) -> HttpResponse | HttpResponseRedirect:
        """
        Create and return a BagIt archive for the requested item.

        Args:
            request: Current HTTP request.

        Returns:
            HttpResponse | HttpResponseRedirect: Local zip download or redirect
            to S3. If a transcription fails validation, the rendered error
            report produced by ``do_bagit_export`` is returned instead.

        Raises:
            Campaign.DoesNotExist, Project.DoesNotExist, Item.DoesNotExist:
                If the URL does not identify an existing campaign, a project
                in that campaign, or an item in that project.
        """
        campaign_slug = self.kwargs["campaign_slug"]
        project_slug = self.kwargs["project_slug"]
        item_id = self.kwargs["item_id"]

        asset_qs: QuerySet[Asset] = Asset.objects.filter(
            item__project__campaign__slug=campaign_slug,
            item__project__slug=project_slug,
            item__item_id=item_id,
            transcription_status=TranscriptionStatus.COMPLETED,
        ).order_by("sequence")

        assets: QuerySet[Asset] = get_latest_transcription_data(asset_qs)

        # The file name is built from values read back from the database
        # rather than from the raw URL kwargs.
        campaign = Campaign.objects.get(slug__exact=campaign_slug)
        campaign_slug_dbv = campaign.slug
        project = Project.objects.get(campaign=campaign, slug__exact=project_slug)
        project_slug_dbv = project.slug
        # Scope the item lookup to the project, matching the asset filter
        # above. An unscoped ``item_id`` lookup could pick up an item from a
        # different project or raise ``MultipleObjectsReturned``.
        # NOTE(review): assumes item IDs are only unique per project -- confirm
        # against the ``Item`` model constraints.
        item_id_dbv = Item.objects.get(project=project, item_id__exact=item_id).item_id

        export_filename_base = "%s-%s-%s" % (
            campaign_slug_dbv,
            project_slug_dbv,
            item_id_dbv,
        )

        with tempfile.TemporaryDirectory(
            prefix=export_filename_base
        ) as export_base_dir:
            return do_bagit_export(
                assets, export_base_dir, export_filename_base, request
            )


class ExportProjectToBagIt(TemplateView):
    """
    Export one project as a BagIt archive, restricted to completed items.
    """

    @method_decorator(staff_member_required)
    def get(
        self, request: HttpRequest, *args, **kwargs
    ) -> HttpResponse | HttpResponseRedirect:
        """
        Assemble the BagIt archive for the project named in the URL.

        The campaign and project slugs come from the URL keyword arguments;
        the archive name is derived from the slugs stored in the database.

        Args:
            request: Current HTTP request.

        Returns:
            HttpResponse | HttpResponseRedirect: Local zip download or redirect
            to S3.
        """
        url_campaign = self.kwargs["campaign_slug"]
        url_project = self.kwargs["project_slug"]

        project_items: QuerySet[Item] = Item.objects.filter(
            project__campaign__slug=url_campaign,
            project__slug=url_project,
        )
        # Drop incomplete items first, then attach the latest transcription
        # data to the remaining assets.
        exportable: QuerySet[Asset] = get_latest_transcription_data(
            remove_incomplete_items(project_items)
        )

        campaign = Campaign.objects.get(slug__exact=url_campaign)
        project = Project.objects.get(campaign=campaign, slug__exact=url_project)
        archive_name = "%s-%s" % (campaign.slug, project.slug)

        # The working directory only lives for the duration of the export.
        with tempfile.TemporaryDirectory(prefix=archive_name) as work_dir:
            return do_bagit_export(exportable, work_dir, archive_name, request)


class ExportCampaignToBagIt(TemplateView):
    """
    Export a whole campaign as a BagIt archive, restricted to completed items.
    """

    @method_decorator(staff_member_required)
    def get(
        self, request: HttpRequest, *args, **kwargs
    ) -> HttpResponse | HttpResponseRedirect:
        """
        Assemble the BagIt archive for the campaign named in the URL.

        The campaign slug comes from the URL keyword arguments; the archive
        name is derived from the slug stored in the database.

        Args:
            request: Current HTTP request.

        Returns:
            HttpResponse | HttpResponseRedirect: Local zip download or redirect
            to S3.
        """
        url_campaign = self.kwargs["campaign_slug"]

        campaign_items: QuerySet[Item] = Item.objects.filter(
            project__campaign__slug=url_campaign
        )
        # Drop incomplete items first, then attach the latest transcription
        # data to the remaining assets.
        exportable: QuerySet[Asset] = get_latest_transcription_data(
            remove_incomplete_items(campaign_items)
        )

        campaign = Campaign.objects.get(slug__exact=url_campaign)
        archive_name = "%s" % (campaign.slug,)

        # The working directory only lives for the duration of the export.
        with tempfile.TemporaryDirectory(prefix=archive_name) as work_dir:
            return do_bagit_export(exportable, work_dir, archive_name, request)


class ExportProjectToCSV(TemplateView):
    """
    Stream a CSV of the most recent transcription for each asset in a project.

    Only the latest transcription text per asset is included. Tag values
    are aggregated into a semicolon-delimited string.

    The view is wrapped in ``staff_member_required``, so only staff users
    reach the export logic.
    """

    @method_decorator(staff_member_required)
    def get(self, request: HttpRequest, *args, **kwargs) -> HttpResponse:
        """
        Return a CSV response for the requested project.

        Args:
            request: Current HTTP request.

        Returns:
            HttpResponse: CSV content for the project.

        Raises:
            Http404: If the ``campaign_slug`` / ``project_slug`` URL kwargs do
                not identify an existing campaign and project.
        """
        # Local import keeps this block self-contained regardless of what the
        # module-level import block already provides.
        from django.shortcuts import get_object_or_404

        campaign_slug = self.kwargs["campaign_slug"]
        project_slug = self.kwargs["project_slug"]

        # Unknown slugs become a 404 instead of an unhandled DoesNotExist
        # (HTTP 500).
        campaign = get_object_or_404(Campaign, slug__exact=campaign_slug)
        project = get_object_or_404(
            Project, campaign=campaign, slug__exact=project_slug
        )

        asset_qs: QuerySet[Asset] = Asset.objects.filter(item__project=project)
        assets: QuerySet[Asset] = get_latest_transcription_data(asset_qs)
        assets = get_tag_values(assets)

        headers, data = flatten_queryset(
            assets,
            field_names=[
                "item__project__campaign__title",
                "item__project__title",
                "item__title",
                "item__item_id",
                "title",
                "id",
                "transcription_status",
                "download_url",
                "latest_transcription",
                "tag_values",
            ],
            extra_verbose_names={
                "item__project__campaign__title": "Campaign",
                "item__project__title": "Project",
                "item__title": "Item",
                "item__item_id": "ItemId",
                "item_id": "ItemId",
                "title": "Asset",
                "id": "AssetId",
                "transcription_status": "AssetStatus",
                "download_url": "DownloadUrl",
                "latest_transcription": "Transcription",
                "tag_values": "Tags",
            },
        )

        # Log the database-backed slug (the same value used for the filename)
        # rather than echoing the raw URL kwarg into the log.
        logger.info("Exporting %s to csv", project.slug)
        return export_to_csv_response(
            f"{campaign.slug}-{project.slug}.csv", headers, data
        )


================================================
FILE: fixtures/original-static-pages.json
================================================
[
    {
        "fields": {
            "body": "crowd.loc.gov provides students of all ages with opportunities to explore unique historical documents from the collections of the Library of Congress.\n\nDeciphering and transcribing these documents can build students\u2019 skills in close reading, examining historical context, and building interpretive consensus.\n\n## Teaching Ideas\n\n- As students transcribe a document, urge them to pay close attention to the language used in the document. What does that language tell them about who the audience for the document was? Was it a close friend or family member? A powerful person? A complete stranger? If the document is a letter, what clues can they find in the greeting and closing?\n\n- Prompt students to speculate about what the document\u2019s author was trying to accomplish. What strategies, persuasive or otherwise, did the author use to accomplish their goal?\n\n- Challenge students to recreate the document in their own words, using today\u2019s communication tools. What did your students say differently? What did they say that was the same?\n\n- Ask students to identify clues about the time and place in which the document was created. What do they know about what was going on at the time? How can they find out more? \n\n- Ask students to research and describe what happened as a result of this document being created. If they can\u2019t identify what happened, ask them to speculate about what might have happened as a result of the document.\n\n- As students complete the transcription-reconciliation process, encourage them to take note of the ways they compared the differences between different transcriptions of the same document. What similarities and differences can they find between this process and the process of evaluating sources for a class project or research paper?\n\n## Primary Source Analysis\n\nThe documents in crowd.loc.gov are _primary sources_ \u2014 the raw materials of history and culture. 
Analyzing primary sources like these can give students a powerful sense of the complexity of the past, and can guide them toward higher-order thinking and better critical thinking skills.\n\nUse the Library\u2019s [primary source analysis tool and teacher\u2019s guide to analyzing manuscripts](http://www.loc.gov/teachers/usingprimarysources/guides.html) to guide your students through an analysis of any of the documents in crowd.loc.gov.\n\n**A note about content**: The historical documents in the Library\u2019s collections may include language or topics that aren\u2019t appropriate for your students, or that your students might find especially difficult to engage with. You may want to review documents before assigning them, or to use some of the strategies explored here.\n\n## Campaign Specific Resources\n\n### Letters to Lincoln (Featured Challenge for 2018!)\n\n- [\"I Do Solemnly Swear...\"  Presidential Inaugurations](https://www.loc.gov/rr/program/bib/inaugurations/index.html)\n- [The Library of Congress Celebrates the Songs of America](https://www.loc.gov/collections/songs-of-america/about-this-collection/)\n- [Additional Primary Materials](http://www.loc.gov/teachers/classroommaterials/primarysourcesets/lincoln/)\n\n### Branch Rickey: Changing the Game\n\n- Lesson Plan: [Baseball, Race and Ethnicity: Rounding the Bases](http://www.loc.gov/teachers/classroommaterials/lessons/bases/)\n- Lesson Plan: [Baseball, Race Relations and Jackie Robinson](http://www.loc.gov/teachers/classroommaterials/lessons/robinson/)\n- Primary Source Set: [Baseball Across a Divided Society](http://www.loc.gov/teachers/classroommaterials/primarysourcesets/baseball/)\n\n### Civil War Soldiers: \"Disabled but not disheartened\"\n\n- Lesson plan: [The Civil War Through a Child's Eye](http://www.loc.gov/teachers/classroommaterials/lessons/childs-eye/)\n- Teacher's guide: [The Civil War: The Nation Moves Towards War, 
1850-61](http://www.loc.gov/teachers/classroommaterials/primarysourcesets/civil-war-approach/)\n\n### Clara Barton: \"Angel of the Battlefield\"\n\n- [Clara Barton Missing Soldiers Office Museum External additional resources](http://www.clarabartonmuseum.org/learn/studentresearch/)\n\n### Mary Church Terrell: Advocate for African Americans and Women\n\n- Lesson plan: [Suffrage Strategies: Voices for Votes](http://www.loc.gov/teachers/classroommaterials/lessons/suffrage/)\n- [http://www.loc.gov/teachers/classroommaterials/lessons/strivings/](http://www.loc.gov/teachers/classroommaterials/lessons/strivings/)\n- [Votes for Women: Selections from the National American Woman Suffrage Association Collection, 1848 to 1921](https://www.loc.gov/teachers/classroommaterials/connections/votes-women/)\n- [Civil Rights, information for Students](http://www.loc.gov/teachers/classroommaterials/themes/civil-rights/students.html)\n- [From Slavery to Civil Rights: A Timeline of African American History](https://www.loc.gov/teachers/classroommaterials/presentationsandactivities/presentations/civil-rights/) \n- [Segregation: From Jim Crow to Linda Brown](http://www.loc.gov/teachers/classroommaterials/lessons/jimcrow/)",
            "created_on": "2018-11-26T22:00:43.688Z",
            "path": "/for-educators/",
            "title": "Resources for Educators",
            "updated_on": "2018-11-26T22:00:43.696Z"
        },
        "model": "concordia.simplepage",
        "pk": 1
    },
    {
        "fields": {
            "body": "## Join us at the Library for the 155th Anniversary of the Gettysburg Address\n\n---\n\nOn November 19, 1863, Abraham Lincoln delivered the Gettysburg Address in Gettysburg, Pennsylvania. The Library of Congress will mark the 155th anniversary of this historic speech with a one-day celebration, featuring an exhibition of the earliest known draft of the speech, and a Letters to Lincoln Challenge transcribe-a-thon for volunteers on and off site!\n\n### Schedule\n\n-   08:30am Jefferson Building doors open!\n-   10:00am Welcome remarks by Dr. Carla Hayden, 14th Librarian of Congress\n-   10:05am Special talk about the background of the Gettysburg Address by historian and curator Michelle Krowl\n-   10:15am Gettysburg Address delivered by student orator Christian Melgar\n-   10:25am Details of the Letters to Lincoln Challenge for onsite and remote participants\n-   10:30am Nicolay copy of the Gettysburg Address unveiled \n-   10:35am Letters to Lincoln Challenge transcribe-a-thon begins \n-   10:35am-1:30pm Letters to Lincoln Challenge Transcribe-a-thon\n-   4:30pm Jefferson Building doors close for the day \n\n#### In the area on November 19th?\n\nJoin us in the Great Hall of the Jefferson Building (Library of Congress) to have the rare opportunity to see the Nicolay copy of the Gettysburg Address in person. Dr. Hayden will kick things off at 10am, followed by a reading of the Address by a student orator, and a special talk about Lincoln and the Gettysburg Address, by historian and curator Michelle Krowl. After the Gettysburg Address is revealed at 10:30 various hands on transcription and learning opportunities will be available. \n\n#### Off site but online?\n\nWe\u2019ll livestream the Librarian and curator\u2019s talks, and the reading of the Gettysburg address from 10:00-10:30 [via this link](https://www.youtube.com/loc). 
After that people at the Library and online can participate in the #LettersToLincoln challenge right here on [crowd.loc.gov](/campaigns/letters-to-lincoln/)! Choose an item from the Letters to Lincoln Campaign to transcribe, review, and/or tag. So far we've made material from the 1830s through 1850s available, but for our transcribe-a-thon we'll release materials from 1860, 1861, and 1862, spanning part of the Civil War and important moments in Lincoln's career and the history of the nation. Join in the discussion on [History Hub](https://historyhub.history.gov/community/crowd-loc) and [Twitter](https://twitter.com/Crowd_LOC)! \n\nYou can [check in live](https://historyhub.history.gov/community/crowd-loc/blog/2018/11/14/transcribe-with-us-nov-19-the-155th-anniversary-of-the-gettysburg-address) with a Community Manager on History Hub throughout the transcribe-a-thon from 10:30am to 1:30pm EST. \n\n#### Opportunities for students near and far\n\nTune in at 10:00am for the livestream or join us in person to see the Gettysburg address, hear talks, and do some hands on activities and online transcriptions. Students onsite or in their own classrooms will be invited to transcribe, tag, and review documents received by Abraham Lincoln throughout his career. You can transcribe as a group or challenge your students to transcribe on their own or in pairs. All transcriptions are reviewed by at least one other volunteer, so don't be shy to try! If you or your students are finding it hard to read something, try finding something to review first. This is a great way to \"get your eye in\" and learn from others how to read these original documents.\n\nTo confirm participation for your class or students, please e-mail the Community Managers at [crowd@loc.gov](mailto:crowd@loc.gov) for further instructions. 
[Visit History Hub](https://historyhub.history.gov/community/crowd-loc/blog/2018/11/14/transcribe-with-us-nov-19-the-155th-anniversary-of-the-gettysburg-address) for your transcribe-a-thon pack including details on how to take part. \n\n## Letters to Lincoln Challenge\n\n---\n\n![Cover of yellow envelope with drawn portrait of Lincoln in the top left corner and a depiction of Lincoln chopping wood in the middle](/static/img/LincolnCampaign.jpg)\n\n### Help us transcribe 10,000+ items from the Abraham Lincoln Papers by the end of 2018!\n\n#### A grand challenge: why we're asking you to join us\n\nAround half of the digitized Abraham Lincoln Papers, primarily materials written by Lincoln, have been transcribed by other volunteers at Knox College and elsewhere, and are already keyword searchable at loc.gov. However, there remain 10,000+ items including letters and other materials sent to him that are not yet keyword searchable. Completing the [Letters to Lincoln Challenge](https://crowd.loc.gov/campaigns/letters-to-lincoln/) will make all of the digital Lincoln Papers word-searchable and accessible to future readers. Just imagine the possibilities--from new research to local connections--that will be possible once we've achieved this goal. Thank you in advance for sharing your time with us. Your Community Managers, reference librarians and curatorial staff here at the Library of Congress will be cheering you on with bonus historical context and resources all along the way, as well as some special rewards for goals met!\n\n#### So, what’s the challenge?\n\nOur first milestone was completion of all the material in the first three Campaign projects: \"1830-1839, first forays in politics and law,\" \"1840-1849, marriage, election to Congress,\" and \"1850-1857: death and birth of children, and re-entry to politics\" by November 1st. 
Our next *updated* challenge to you is to transcribe and review all 646 pages in the \"1858-1859 Presidential Nomination\" project by midnight on November 6th, election day!\n\nCan you transcribe even just one letter and share the challenge with one friend to help push toward our goal?  When the project completes we’ll move onto the next exciting decade of Lincoln's life, the 1850s when he returned to politics.\n\n#### What are the Letters to Lincoln?\n\nYou might guess that the Abraham Lincoln Papers include materials written in his own hand, but did you know the collection contains correspondence sent to Abraham Lincoln throughout his life and political career? Here's a taste of what you'll find: a range of materials by writers ranging from friends and associates from Lincoln’s Springfield days, well-known political figures and reformers, constituents writing to their President, and even the occasional document in Lincoln's own hand. Read the concerns and requests of nineteenth-century Americans and international correspondents.\n\n## Library of Congress News\n\n---\n\nEnabling Discovery of unique treasures at the Library of Congress [Press release](https://www.loc.gov/item/prn-18-134/crowdsourcing-tool-enables-discovery-of-unique-treasures-at-the-library-of-congress/2018-10-24/)\n\nAnnouncing crowd.loc.gov: [Here we go!](https://blogs.loc.gov/thesignal/2018/10/lets-go-explore-transcribe-and-tag-at-crowd-loc-gov/)\n\n[Connecting crowdsourcing](https://blogs.loc.gov/thesignal/2018/10/new-strategy-new-crowd-new-team/) to the new Library of Congress 2019-2023 Strategic Plan and Digital Strategy\n\n## Press coverage\n\n---\n\nMental Floss - 28 October 2018 - [The Library of Congress Needs Help Transcribing Lincoln's Letters and Other Historic Documents](http://mentalfloss.com/article/561842/library-congress-needs-help-transcribing-lincolns-letters-and-other-historic)",
            "created_on": "2018-11-26T22:00:43.700Z",
            "path": "/latest/",
            "title": "Latest News",
            "updated_on": "2018-11-26T22:00:43.702Z"
        },
        "model": "concordia.simplepage",
        "pk": 2
    },
    {
        "fields": {
            "body": "<div class=\"row my-default\">\n    <div class=\"col-sm-12\">\n        <div class=\"card bg-dark text-white text center mx-default\">\n        <img src=\"/static/img/help-center.jpg\" alt=\"Spread of Branch Rickey papers\">\n          <div class=\"card-body pxy-default card-img-overlay\">\n            <h2 class=\"card-title text-white\">Welcome to crowd.loc.gov</h2>\n            <h5 class=\"card-text\"> Here you will find a guide to help you get started. </h5>\n            <a href=\"welcome-guide/\" class=\"btn btn-primary\">Learn more &raquo;</a>\n          </div>\n        </div>\n    </div>\n</div>\n\n# Guides\n\n<div class=\"help-center-cards text-white row my-default\">\n  <div class=\"col-sm-4\">\n    <div class=\"help-center-card card text center mx-default\">\n      <div class=\"card-body pxy-default\">\n        <h4 class=\"card-title\"><a href=\"how-to-transcribe/\">How to Transcribe &raquo;</a></h4>\n      </div>\n    </div>\n  </div>\n  <div class=\"col-sm-4\">\n    <div class=\"help-center-card card text center mx-default\">\n      <div class=\"card-body pxy-default\">\n        <h4 class=\"card-title\"><a href=\"how-to-review/\">How to Review &raquo;</a></h4>\n      </div>\n    </div>\n  </div>\n  <div class=\"col-sm-4\">\n    <div class=\"help-center-card card text center mx-default\">\n      <div class=\"card-body pxy-default\">\n        <h4 class=\"card-title\"><a href=\"how-to-tag/\">How to Tag &raquo;</a></h4>\n      </div>\n    </div>\n  </div>\n</div>\n\n# FAQs\n\n<div class=\"accordion\" id=\"faqAccordion\">\n  <div class=\"card\">\n    <div class=\"card-header\" id=\"whatIsCrowdHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#whatIsCrowd\" aria-expanded=\"false\" aria-controls=\"whatIsCrowd\">\n          What is crowd.loc.gov and what is crowdsourcing?\n        </button>\n      </h5>\n    </div>\n\n    <div id=\"whatIsCrowd\" 
class=\"collapse\" aria-labelledby=\"whatIsCrowdHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n      <p>\n       crowd.loc.gov is an online transcription platform where anyone with an internet connection can transcribe documents from the Library of Congress\u2019 digitized collections. We welcome anyone interested in making non-machine readable resources fully word searchable to contribute.\n      </p>\n      <p>\n      Crowdsourcing invites members of the public, non-specialists and specialists alike, to help make data more usable and discoverable. Crowdsourcing at the Library of Congress invites unpaid volunteers to explore collections while gaining new skills, for example, learning to read older forms of handwriting such as cursive.\n      </p>\n      </div>\n    </div>\n\n  </div>\n  <div class=\"card\">\n    <div class=\"card-header\" id=\"takePartHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#takePart\" aria-expanded=\"false\" aria-controls=\"takePart\">\n          Who can take part?\n        </button>\n      </h5>\n    </div>\n    <div id=\"takePart\" class=\"collapse\" aria-labelledby=\"takePartHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n        Anyone who wants to help the Library make its collections more discoverable online. Anyone who is interested in history, cultural heritage, literature, languages, art, sciences, and much more. Anyone who wants to be a virtual volunteer, exploring collections and transcribing at their own pace and at times that are convenient for them. 
Students of all ages who want to help the Library and learn new skills.\n\n      </div>\n    </div>\n\n  </div>\n  <div class=\"card\">\n    <div class=\"card-header\" id=\"volunteersHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#volunteersTogether\" aria-expanded=\"false\" aria-controls=\"volunteersTogether\">\n          How do volunteers work together?\n        </button>\n      </h5>\n    </div>\n    <div id=\"volunteersTogether\" class=\"collapse\" aria-labelledby=\"volunteersHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n       You'll collaborate with other volunteers to transcribe and review collections. We ask for at least one person to transcribe and a different person to review each transcription. If you find that a transcription needs a few corrections while you're reviewing, you can edit that page. Another person will then review your new edits. Sometimes more than one person will contribute to transcribe an image; such as if you find an image with a transcription that needs more work. 
We think of this negotiated editing process as a way to get the best version of a transcription and help solve different challenges for each image.\n\n      </div>\n    </div>\n\n  </div>\n\n <div class=\"card\">\n    <div class=\"card-header\" id=\"materialsHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#materials\" aria-expanded=\"false\" aria-controls=\"materials\">\n          What kinds of materials can I transcribe?\n        </button>\n      </h5>\n    </div>\n    <div id=\"materials\" class=\"collapse\" aria-labelledby=\"materialsHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n       Materials in crowd.loc.gov represent the diversity of the Library\u2019s collections and are selected from across the Library of Congress\u2019s curatorial divisions. You\u2019ll encounter presidential papers, materials from the women's suffrage, abolition and other movements, the work of American poets, such as Walt Whitman, and much more. We will add new content regularly: <a href=\"https://updates.loc.gov/accounts/USLOC/subscriber/new?topic_id=USLOC_175\">sign up for our newsletter</a> to hear about new Campaigns and Challenges.\n\n      </div>\n    </div>\n\n  </div>\n\n <div class=\"card\">\n    <div class=\"card-header\" id=\"transcriptionGoalsHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#transcriptionGoals\" aria-expanded=\"false\" aria-controls=\"transcriptionGoals\">\n          How do I know if I\u2019m transcribing, tagging or reviewing correctly?\n        </button>\n      </h5>\n    </div>\n    <div id=\"transcriptionGoals\" class=\"collapse\" aria-labelledby=\"transcriptionGoalsHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n       Follow the transcribe, review, or tag links at the top of the page. 
Our goal is to make transcriptions that are readable to computers and humans, with minimal markup, not attempting to recreate the layout of the original images. Quick tips are available within the transcription interface.\n\n      </div>\n    </div>\n\n  </div>\n <div class=\"card\">\n    <div class=\"card-header\" id=\"registerHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#register\" aria-expanded=\"false\" aria-controls=\"register\">\n          Do I have to register for an account to participate or join in the discussion?\n        </button>\n      </h5>\n    </div>\n    <div id=\"register\" class=\"collapse\" aria-labelledby=\"registerHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n      \nRegistering for an account is optional, but gives you access to the tagging and reviewing features of crowd.loc.gov. Go to Register at the top of the homepage to make an account. Create a username, which will be visible to other volunteers and users of the site. Enter your email address in the \u201cEmail\u201d field (this will not be visible to or shared with other users), and in the password field create a unique password with a combination of capital and lowercase letters, numbers and special characters such as #, $, !, or %.\n\nYou can also register for a separate account on the <a href=\"https://historyhub.history.gov/community/crowd-loc\">History Hub discussion forum</a>, where you can discuss the material you are transcribing or your experience of encountering primary sources. Feel free to raise questions or concerns, especially if you think other volunteers might be able to respond or benefit from your post. History Hub is a moderated forum. The Community Managers will check in regularly to approve comments and engage in discussion, and will try to answer questions about the project or the collections within 3-5 business days. 
Reference Librarians and curators will also answer some questions.\n\n</div>\n</div>\n\n  </div>\n <div class=\"card\">\n    <div class=\"card-header\" id=\"forgotPasswordHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#forgotPassword\" aria-expanded=\"false\" aria-controls=\"forgotPassword\">\n          What if I forget my password?\n        </button>\n      </h5>\n    </div>\n    <div id=\"forgotPassword\" class=\"collapse\" aria-labelledby=\"forgotPasswordHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n      \nIf you've forgotten your password click Login, then \"Forgot my password\". You will receive an email with a link asking you to reset your password. You may also change your password within your profile.\n      </div>\n    </div>\n  </div>\n <div class=\"card\">\n    <div class=\"card-header\" id=\"whyEmailHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#whyEmail\" aria-expanded=\"false\" aria-controls=\"whyEmail\">\n          Why do we ask for your email?\n        </button>\n      </h5>\n    </div>\n    <div id=\"whyEmail\" class=\"collapse\" aria-labelledby=\"whyEmailHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n      \nYour email address gives us the ability to support you. Community managers are here to help with account administration like changes to your profile, troubleshooting any issues with contributing to a transcription, or to answer general questions. We will never share your information with other institutions or individuals. 
At registration you can opt in to receive email updates on crowd.loc.gov campaigns and features \u2013 you can also <a href=\"https://updates.loc.gov/accounts/USLOC/subscriber/new?topic_id=USLOC_175\">register for emails from us here</a>.\n      </div>\n    </div>\n  </div>\n <div class=\"card\">\n    <div class=\"card-header\" id=\"transcriptionUseHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#transcriptionUse\" aria-expanded=\"false\" aria-controls=\"transcriptionUse\">\n          How will the transcriptions I create be used?\n        </button>\n      </h5>\n    </div>\n    <div id=\"transcriptionUse\" class=\"collapse\" aria-labelledby=\"transcriptionUseHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n      \nThe data contributed by volunteers like you can be used in many different ways. We are giving back to our community by making this data public. All contributions to this application are released into the public domain. Anyone is free to use this data set in any way they want. The data produced by volunteers is also free to reuse. If you need help accessing the data or want to share news of your research with the crowd.loc.gov community, please contact the Community Managers at <a href=\"mailto:crowd@loc.gov\">crowd@loc.gov</a>. The transcriptions produced on crowd.loc.gov will typically be published in the Library catalog on loc.gov within a year of a Campaign's completion. 
\n      </div>\n    </div>\n  </div>\n <div class=\"card\">\n    <div class=\"card-header\" id=\"tagUseHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#tagUse\" aria-expanded=\"false\" aria-controls=\"tagUse\">\n          What are tags for?\n        </button>\n      </h5>\n    </div>\n    <div id=\"tagUse\" class=\"collapse\" aria-labelledby=\"tagUseHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n Tags are an experimental feature. Tags can be used to identify people, places or things in documents that are not already identified in the page or asset\u2019s metadata on <a href=\"https://loc.gov\">loc.gov</a>. We want to understand how volunteers like to use tags. We also want to understand whether tags can someday be included in the metadata on the Library catalog to make items discoverable through search terms that are not represented in the existing metadata or the transcriptions we will produce on crowd.loc.gov.\n\n      </div>\n    </div>\n\n  </div>\n <div class=\"card\">\n    <div class=\"card-header\" id=\"offensiveContentHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#offensiveContent\" aria-expanded=\"false\" aria-controls=\"offensiveContent\">\n          What if I find offensive content while I\u2019m transcribing and reviewing?\n        </button>\n      </h5>\n    </div>\n    <div id=\"offensiveContent\" class=\"collapse\" aria-labelledby=\"offensiveContentHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\nThe language and terminology used in the historical materials on this site reflect the context and culture of their creators, and may include words, phrases, and attitudes that would now be deemed insensitive, inappropriate or factually inaccurate, or may not be appropriate for all ages. 
Views expressed in historical documents do not reflect the views of the Library of Congress. Because the purpose of crowd.loc.gov is to make the Library\u2019s collections searchable, we ask that all original content be transcribed as it appears in the original material. If you find some material offensive or upsetting, please choose something else to transcribe. If you have questions or comments regarding the material you encounter during your participation here, please contact a Community Manager via <a href=\"mailto:crowd.loc.gov@loc.gov\">crowd.loc.gov@loc.gov</a>, the <a href=\"/contact/\">Contact Us</a> or join and start a new conversation on the <a href=\"https://historyhub.history.gov/community/crowd-loc\">History Hub discussion forum</a>.\n\n      </div>\n    </div>\n\n  </div>\n\n <div class=\"card\">\n    <div class=\"card-header\" id=\"browserSupportHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#browserSupport\" aria-expanded=\"false\" aria-controls=\"browserSupport\">\n         What devices and browsers are supported by crowd.loc.gov?\n        </button>\n      </h5>\n    </div>\n    <div id=\"browserSupport\" class=\"collapse\" aria-labelledby=\"browserSupportHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\nBecause crowd.loc.gov invites you to transcribe documents, it is best experienced on a device with a large or full sized keyboard. A desktop computer or laptop is best; a tablet with keyboard should work. Unfortunately, phones are not yet supported. We recommend an external mouse for most precise zoom. We support the two most recent versions of major browsers. You\u2019ll have the best experience if you use Chrome, Firefox, Edge, and Safari browsers. 
The site will not work as designed on the Internet Explorer browser.\n\n      </div>\n    </div>\n\n  </div>\n  <div class=\"card\">\n    <div class=\"card-header\" id=\"technologyHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#technology\" aria-expanded=\"false\" aria-controls=\"technology\">\n         What is the technology behind crowd.loc.gov?\n        </button>\n      </h5>\n    </div>\n    <div id=\"technology\" class=\"collapse\" aria-labelledby=\"technologyHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\nCrowd.loc.gov runs on Concordia, new open source software developed by the Library of Congress to power crowdsourced transcription projects. The code is visible and free to reuse: <a href=\"https://github.com/LibraryOfCongress/concordia\">Visit our Github repository</a> for more information. The platform was built utilizing user-centered design principles based around building trust and approachability. This project is a partnership between the Library and a growing community of volunteers who help us to iteratively improve the platform. Everyone is welcome to take part in transcription and tagging and to give feedback about how we can improve the code base and the project itself. 
Be in touch!\n\n      </div>\n    </div>\n\n  </div>\n  <div class=\"card\">\n    <div class=\"card-header\" id=\"privacyHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#privacy\" aria-expanded=\"false\" aria-controls=\"privacy\">\n         How do you protect my privacy?\n        </button>\n      </h5>\n    </div>\n    <div id=\"privacy\" class=\"collapse\" aria-labelledby=\"privacyHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\n<p>\nA detailed explanation of the Library\u2019s <a href=\"https://www.loc.gov/legal/\">Privacy Policy</a> including what kinds of data we collect and store, and what we use to track your session while you are on a Library website is available at this link, and in the footer of this page under the \u201cLegal\u201d link button.\n</p>\n<p>\nYou do not have to register an account on crowd.loc.gov in order to transcribe, but you can register if you would like to review or tag. In order to make sure a transcription is submitted by a real human, anonymous users will be prompted to fill in a captcha before their first submission will be accepted. The Library\u2019s captcha is an image of a few letters and numbers that you need to transcribe into the box below the image.\n</p>\n<p>\nA session cookie will be used in your browser while you are transcribing so that you do not need to enter a captcha every time you work on a page. Session cookies for anonymous users are limited to 24 hours, so you will only be prompted to enter a captcha once a session.\n</p>\n<p>\nSession cookies are used for registered users too, so that your contributions can be saved to your account. Check out your user profile to see how many pages you have transcribed, tagged and reviewed. 
Registered user session cookies last two weeks.\n</p>\n</div>\n</div>\n\n  </div>\n    <div class=\"card\">\n    <div class=\"card-header\" id=\"pastProjectsHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#pastProjects\" aria-expanded=\"false\" aria-controls=\"pastProjects\">\n         What are past crowdsourcing projects at the Library?\n        </button>\n      </h5>\n    </div>\n    <div id=\"pastProjects\" class=\"collapse\" aria-labelledby=\"pastProjectsHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\nThe Library of Congress has long invested in building digitized collections and making them searchable. The Library\u2019s first attempt recruiting members of the public to increase findability on our website began in 2008 when the Photography and Prints Division published thousands of photographs on <a href=\"https://www.flickr.com/photos/library_of_congress\">Flickr Commons</a>. This long-running project invites visitors to help identify people and places in the photographs and, once verified, this rich information is used to enhance the online catalog and improve access for all users. 
Two additional crowdsourcing efforts within the Library include <a href=\"https://www.zooniverse.org/projects/sroosa/roll-the-credits\">Roll the Credits</a> and <a href=\"http://beyondwords.labs.loc.gov/\">Beyond Words</a>, projects that invited people to transcribe credit captions from television programs, and identify cartoons and photographs in the Library's historic newspaper collections respectively.\n\n      </div>\n    </div>\n\n  </div>\n    <div class=\"card\">\n    <div class=\"card-header\" id=\"otherProjectsHeader\">\n      <h5 class=\"mb-0\">\n        <button class=\"btn btn-link collapsed\" type=\"button\" data-toggle=\"collapse\" data-target=\"#otherProjects\" aria-expanded=\"false\" aria-controls=\"otherProjects\">\n         Do other libraries and cultural institutions have crowdsourcing projects?\n        </button>\n      </h5>\n    </div>\n    <div id=\"otherProjects\" class=\"collapse\" aria-labelledby=\"otherProjectsHeader\" data-parent=\"#faqAccordion\">\n      <div class=\"card-body\">\nIn addition to the Library of Congress\u2019 own history of varied participatory projects, other cultural heritage institutions with established transcription programs have paved the way for crowd.loc.gov. Projects at the National Archives and Records Administration (NARA), the Smithsonian, the New York Public Library, Zooniverse.org, From the Page, and others have developed workflows and user engagement strategies that this platform leverages and builds upon. Concordia deploys a different architecture to these existing models of crowdsourced transcription, and aims to provide simple data structures and easier project implementation for cultural heritage institutions and other people who want to set up their own crowdsourced transcription projects.\n      </div>\n    </div>\n  </div>\n</div>\n\n_Concordia and crowd.loc.gov are supported by the National Digital Library Trust Fund. 
They are the result of collaboration between numerous divisions, expertise, and teams at the Library of Congress._",
            "created_on": "2018-11-26T22:00:43.705Z",
            "path": "/help-center/",
            "title": "Help Center",
            "updated_on": "2018-11-26T22:00:43.708Z"
        },
        "model": "concordia.simplepage",
        "pk": 3
    },
    {
        "fields": {
            "body": "<div class=\"help-center-cards text-white row my-default\">\n<div class=\"col-sm-4\">\n    <div class=\"help-center-card card text-center mx-default\">\n      <div class=\"card-body pxy-default\">\n        <h3 class=\"card-title\"><a href=\"/help-center/\">Help Center &raquo;</a></h3>\n        <h5 class=\"card-text\">Find guides to help you tag, transcribe, and review.</h5>\n      </div>\n    </div>\n  </div>\n  <div class=\"col-sm-4\">\n    <div class=\"help-center-card card text-center mx-default\">\n      <div class=\"card-body pxy-default\">\n        <h4 class=\"card-title\"><a target=\"_blank\" href=\"https://historyhub.history.gov/community/crowd-loc\">Discuss &raquo;</a></h4>\n        <h5 class=\"card-text\"> Join the conversation on History Hub. We'll take you there in a new tab.</h5>\n      </div>\n    </div>\n  </div>\n  <div class=\"col-sm-4\">\n    <div class=\"help-center-card card text-center mx-default\">\n      <div class=\"card-body pxy-default\">\n        <h4 class=\"card-title\"><a href=\"/contact/\">Technical issue? &raquo;</a></h4>\n        <h5 class=\"card-text\"> Have a problem with a page or an image? Want to see a new feature? Send us a message.</h5>\n      </div>\n    </div>\n  </div>\n</div>",
            "created_on": "2018-11-26T22:00:43.712Z",
            "path": "/questions/",
            "title": "Have a question? We're here to help!",
            "updated_on": "2018-11-26T22:00:43.715Z"
        },
        "model": "concordia.simplepage",
        "pk": 4
    },
    {
        "fields": {
            "body": "The Library of Congress launched crowd.loc.gov in the autumn of 2018. The application asks people to transcribe and tag digitized images of manuscripts and typed materials from the Library\u2019s collections. Everyone is welcome to take part! You don't even need to create an account, but if you do you'll have access to additional features such as tagging and reviewing other people's transcriptions. All transcriptions are made by volunteers and reviewed by volunteers before they are returned to [loc.gov](https://loc.gov/), the Library's catalog. These transcriptions will improve search, readability, and access to handwritten and typed documents for those who are not fully sighted or cannot read the handwriting of the original documents. Check out the [FAQs section](/help-center/) in our Help Center for more detailed information.\n\nCrowd.loc.gov runs on Concordia, new open source software developed by the Library of Congress to power crowdsourced transcription projects. The code is visible and free to reuse: [visit our Github repository](https://github.com/LibraryOfCongress/concordia) for more information. The platform was built utilizing user-centered design principles based around building trust and approachability. This project is a partnership between the Library and a growing community of volunteers who help us to iteratively improve the platform. Everyone is welcome to take part in transcription and tagging and to give feedback about how we can improve the code base and the project itself. Be in touch!\n\nThis program is generously supported by the National Digital Library Trust Fund. This application is the result of collaboration between numerous divisions and teams at the Library of Congress.",
            "created_on": "2018-11-26T22:00:43.718Z",
            "path": "/about/",
            "title": "About crowd.loc.gov",
            "updated_on": "2018-11-26T22:00:43.720Z"
        },
        "model": "concordia.simplepage",
        "pk": 5
    },
    {
        "fields": {
            "body": "<div class=\"row\">\n  <div class=\"col-3\">\n    <div class=\"nav flex-column help-center\">\n    <h4>Instructions</h4>\n     <a class=\"nav-link\" href=\"/help-center/welcome-guide/\">Welcome to crowd.loc.gov</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-transcribe/\">How to transcribe</a>\n  <a class=\"nav-link active\" href=\"/help-center/how-to-review/\">How to review</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-tag\">How to tag</a>\n    </div>\n  </div>\n  <div class=\"col-9\">\n\n  <p>\nIn addition to transcribing, you can review and edit transcriptions created by your fellow volunteers. A reviewer\u2019s task is to read the entire transcription and carefully compare it against the image of the document. If you want to become a reviewer, please register an account.\n</p>\n\n<h2>A good transcription:</h2>\n\n<p>\nWhen a transcription is accurate and you do not need to make any changes, click the \"Approve\" button to mark the page as complete. The page will no longer be available for transcription, but you and other volunteers can still read the document and add tags.\n</p>\n\n<h2>\nA transcription that needs more work:\n</h2>\n<p>\nWhile reviewing, you can change a transcription to fix errors or add missing material. Remember, do not edit the spelling and grammar of the original document, but do correct any spelling errors or misreadings created by the transcriber. When you’re done, click the \"Save\" and \"Submit\" buttons. Another volunteer will then need to review the page. A page is complete when a reviewer clicks \"Accept\" without making changes.\n</p>\n  </div>\n</div>",
            "created_on": "2018-11-26T22:00:43.723Z",
            "path": "/help-center/how-to-review/",
            "title": "How to Review",
            "updated_on": "2018-11-26T22:00:43.725Z"
        },
        "model": "concordia.simplepage",
        "pk": 6
    },
    {
        "fields": {
            "body": "<div class=\"row\">\n  <div class=\"col-3\">\n    <div class=\"nav flex-column help-center\">\n   <h4>Instructions</h4>\n        <a class=\"nav-link\" href=\"/help-center/welcome-guide/\">Welcome to crowd.loc.gov</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-transcribe/\">How to transcribe</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-review/\">How to review</a>\n  <a class=\"nav-link active\" href=\"/help-center/how-to-tag\">How to tag</a>\n\n    </div>\n\n  </div>\n  <div class=\"col-9\">\n<p>\nYou can use tags however you like, so long as you avoid using offensive, degrading or hurtful language about other individuals or groups of people. Read the <a href=\"https://www.loc.gov/legal/comment-and-posting-policy/\">Library\u2019s commenting policy here</a>. Here are some ways you might consider tagging:\n<p>\n<ul>\n<li>If you transcribe an important word in a document, such as somebody\u2019s name, and the original author spelled the name incorrectly, you can add a tag to provide the correct name using the \u201cTag\u201d button.</li>\n<li>\nSometimes writers use nicknames or code words. If you know or can correctly identify the full name or subject using contextual information from the larger document or collection, please tag this information using the \u201cTag\u201d button.\n</li>\n<li>  Are you interested in documents mentioning cats? Use the \u201cTag\u201d button to tag all pages that mention cats. Other examples include \u201cCivil War\u201d, \u201cCooking\u201d, \u201cSports\u201d. You can apply whatever tags you like. </li>\n<li>  Keep tags as short as you can and use whole words instead of abbreviations. This will make it easier for other people to understand your tags and to reuse them elsewhere in the collection. </li>\n<li> Tagging is an experimental feature. 
Tags might one day go back into the Library website, but for now they will only be used as a method to explore items within crowd.loc.gov.\n</li>\n</ul>\n</div>\n</div>",
            "created_on": "2018-11-26T22:00:43.728Z",
            "path": "/help-center/how-to-tag/",
            "title": "How to Tag",
            "updated_on": "2018-11-26T22:00:43.731Z"
        },
        "model": "concordia.simplepage",
        "pk": 7
    },
    {
        "fields": {
            "body": "<div class=\"row\">\n  <div class=\"col-3\">\n    <div class=\"nav flex-column help-center\">\n   <h4>Instructions</h4>\n  <a class=\"nav-link active\" href=\"/help-center/welcome-guide/\">Welcome to crowd.loc.gov</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-transcribe/\">How to transcribe</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-review/\">How to review</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-tag\">How to tag</a>\n    </div>\n  </div>\n  <div class=\"col-9\">\n<p>\nWelcome to crowd.loc.gov! Our goal is to make documents word-searchable in the Library of Congress catalog. Help us transcribe original items, many of which have never been transcribed before. Anyone can transcribe, you don\u2019t need an account, but registered volunteers can access the review and tag features. You can choose which tasks you want to do, and what pages you want to work on. To create an account, <a href=\"/account/register/\">go to our registration page</a>. Let's get started!\n</p>\n<ol>\n<li>Choose what to transcribe. You can either click the \"Let's Go\" button on the <a href=\"/\">homepage</a> or <a href=\"/campaigns/\">explore our various campaigns</a>.\n</li>\n<li>\nTranscribe what you can into the white box on the right. Transcribe lines in the order they appear and preserve line breaks. This will make the transcriptions useful for researchers. If you see multiple pages, such as an open notebook with two pages, just transcribe the content in the order it appears.\n</li>\n<li>\nDon\u2019t reproduce features such as underlining, bold text, line breaks or indentation in your transcription. Only words will be searchable in these transcriptions--not formatting. See the <a href=\"../how-to-transcribe/\">How to transcribe</a> section for more information.\n</li>\n<li>\nClick \u201cSave\u201d as you go to save your work in progress. 
Always click \u201cSave\u201d before you move from transcribing to tagging or moving to another page.\n</li>\n<li>\nClick \"Save\" and \u201cSubmit for review\u201d when you are done transcribing and are ready to move on to the next page or to reviewing or tagging. Anonymous users will be prompted to submit a captcha.\n</li>\n<li>\nYou can explore collections by clicking the <a href=\"/campaigns/\">Campaigns</a> link at the top of the screen.\n</li>\n<li>\n<a href=\"/account/register\">Registered volunteers</a> can review other people\u2019s transcriptions. To start reviewing pages, select an item and click an image titled \u201cReview\u201d or filter the images by \"Review\". Read a page carefully and decide if the transcription looks correct. When a transcription is accurate and you do not need to make any changes, click the \"Approve\" button. The page will now be marked as complete. If you need to make changes start editing the page by clicking \"Edit\". Be sure to click \u201cSave\u201d periodically, and then click \u201cFinish\u201d. Changes you submit will be reviewed by another volunteer. You cannot review your own work. This process continues until someone Completes a transcription by clicking \u201cApprove\u201d without making changes.\n</li>\n<li>\nIf you have a question or comment about how crowd.loc.gov works, or about a Campaign, item or page, connect with our team and other volunteers on <a href=\"https://historyhub.history.gov/community/crowd-loc\">History Hub</a>, a public online forum where everyone can join in the discussion. If you would prefer to email a Community Manager send us a message on our <a href=\"/contact/\">Contact Us</a> page. \n</li>\n</ol>\n</div>\n</div>",
            "created_on": "2018-11-26T22:00:43.734Z",
            "path": "/help-center/welcome-guide/",
            "title": "Welcome Guide",
            "updated_on": "2018-11-26T22:00:43.736Z"
        },
        "model": "concordia.simplepage",
        "pk": 8
    },
    {
        "fields": {
            "body": "<div class=\"row\">\n  <div class=\"col-3\">\n    <div class=\"nav flex-column help-center\">\n      <h4>Instructions</h4>\n     <a class=\"nav-link\" href=\"/help-center/welcome-guide/\">Welcome to crowd.loc.gov</a>\n  <a class=\"nav-link active\" href=\"/help-center/how-to-transcribe/\">How to transcribe</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-review/\">How to review</a>\n  <a class=\"nav-link\" href=\"/help-center/how-to-tag\">How to tag</a>\n    </div>\n  </div>\n  <div class=\"col-9\">\n<p>\nWe transcribe to improve search functionality. Our goal is to make documents word-searchable in the Library of Congress catalog, which means typing transcriptions that can be read by that computer system, as well as by humans. Most handwriting and some typed text cannot be automatically and accurately translated into machine-readable text using current technologies -- that\u2019s why we need your help!\n</p>\n<p>\nWe ask you to transcribe a document roughly as it appears on the page. Preserve line breaks, except in cases where words are broken over two lines. Our main goal is to capture all of the words on these pages, so broken words are not helpful for search. Using line breaks to roughly capture the layout of the page helps reviewers (other volunteers) check transcriptions. These will be viewable beside the original images in the catalog, so anyone who is interested in the physical layout of the original document will be able to see it.\n</p>\n\n<h3>All in order:</h3>\n<p>\nTranscribe text in the order it appears.\n</p>\n<h3>\nSpelling:\n</h3>\n<p>\nPreserve original spelling unless the author seems to have made a minor error, such as writing \u201cteh\u201d instead of \u201cthe\u201d. If a misspelling will impact the searchability of the document, use a tag to add the correct spelling. Example:\n<ul>\n<li>  An author wrote \u201cWilla Kather\u201d instead of \u201cWilla Cather\u201d. 
Transcribe Willa Kather, and tag \u201cWilla Cather\u201d. </li>\n</ul>\n</p>\n\n<h3>Insertions:</h3>\n<p>\nWhen text has been inserted or added later, but should be read as part of a sentence, bring it down into the line and type it in the order you would read it aloud.\n</p>\n<h3>\nLine-breaks:</h3>\n<p>\nDo not reproduce words broken between two lines. Write library rather than li-brary, kitten rather than kit-ten. Otherwise hit \"enter\" or \"return\" at the end of a line, to roughly mirror the layout of the original document. This will help reviewers in crowd.loc.gov to easily compare your transcription with the image.\n</p>\n<h3>\nEmphasis:\n</h3>\n<p>\nThe Library catalog cannot search for bold, italic, underlined or superscript text, so even when you see these features please transcribe the words without any styling.\n</p>\n<h3>\nIllegible:\n</h3>\n<p>\nIllegible text is anything you can\u2019t read because a page is damaged, text is heavily crossed out or you can\u2019t tell what the author has written. If there is a word or a string of words you cannot read use a pair of square brackets around an empty space [ ]. Example:\n</p>\n<ul>\n<li>  \"I have [ ] loved coffee ice cream\" </li>\n</ul>\n<p>\nIf you can read any letters or parts of words transcribe what you can and use question marks for the remaining letters or words. Examples:\n</p>\n<ul>\n<li>  \"I have [a?????] loved coffee ice cream\"</li>\n<li>   \"I have [a?] loved coffee ice cream\"</li>\n</ul>\n<p>\nIf you cannot read a word or phrase that\u2019s ok. Another volunteer may be able to identify the missing letters and update your transcription. If there is a lot of text you cannot read consider looking for another page that you can decipher better.\n</p>\n<h3>Deletions:</h3>\n<p>\nIf you can read crossed out or otherwise deleted text, transcribe the deleted words within a pair of square brackets. 
Example:\n</p>\n<ul><li>  \u201cI have always loved [vanilla] coffee ice cream.\u201d </li></ul>\n\n<h3>Marginalia:</h3>\n\n<p>\nMarginalia is text written in the space around the main block of text. It is usually a comment on the main body text but can also be unrelated. It is different from an insertion, because it cannot be directly inserted into the main text and still make sense when read aloud. Use a pair of square brackets and asterisk [*] around marginalia text and order it within the transcription where it makes the most sense (or at the end of the transcription if it appears unrelated). Example:\n</p>\n<ul><li>\n   I have always loved coffee ice cream. Last summer I made my own using a recipe from the 1970s. It was the creamiest coffee ice cream I ever ate. No one else in my family likes that flavor. Oh well, more for me! [*Brazil was the largest coffee producing country in the world in 2017*]</li>\n</ul>\n\n<h3>Printed and typed text:</h3>\n<p>\nSome material in crowd.loc.gov was created on a typewriter or printed. If we have included it here it is because the text is not machine-readable. A computer using Optical Character Recognition (OCR) technology cannot create an accurate word-searchable transcription. Examples include the scouting reports of Branch Rickey, which are typed on thin paper and are often too fuzzy for successful OCR. Similarly, mixed materials containing manuscript and print have not been run through OCR, so please transcribe letterhead and any other printed features that will shed light on where a document was created.\n</p>\n\n<h3>When not to transcribe printed text:</h3>\n<p>\nSome calendars and diaries contain many pages of pre-printed almanacs or other text that is probably machine-readable and therefore should not be transcribed as part of this project. It might be interesting to copy the first page from a repeating template in a diary or journal, but this is not the core text we are aiming to capture. 
However, if you want to transcribe it, feel free. Alternatively, click \"Nothing to transcribe\". This button should also be used for archival folders, blank pages, and pictorial images.\n</p>\n    \n<h3>Tables, graphics, images:</h3>\n<p>\nSome documents will contain tables. Transcribe these in a way that will make them relatively easy for a reviewer to check over, but don't try to capture the exact layout of the data. The material will go back into the catalog without styling. Don't include notes or descriptions of visual features. If you would like to describe images, watermarks, stamps, or any other non-text features, feel free to use the tagging function. Register for an account if you want to add tags!\n    </p>\n</div>\n</div>",
            "created_on": "2018-11-26T22:00:43.740Z",
            "path": "/help-center/how-to-transcribe/",
            "title": "How to transcribe",
            "updated_on": "2018-11-26T22:00:43.742Z"
        },
        "model": "concordia.simplepage",
        "pk": 9
    }
]


================================================
FILE: frontend/.gitignore
================================================
# Logs
logs
*.log
npm-debug.log*
yarn-debug.log*
yarn-error.log*
pnpm-debug.log*
lerna-debug.log*

node_modules
dist
dist-ssr
*.local

# Editor directories and files
.vscode/*
!.vscode/extensions.json
.idea
.DS_Store
*.suo
*.ntvs*
*.njsproj
*.sln
*.sw?


================================================
FILE: frontend/README.md
================================================
# Frontend

This is the React frontend for the transcription page.

## Building

To build the app, run `npm run build` in this directory. The app will then be available at /transcription/ (if you have DEBUG=True).


================================================
FILE: frontend/eslint.config.js
================================================
import js from '@eslint/js';
import globals from 'globals';
import reactHooks from 'eslint-plugin-react-hooks';
import reactRefresh from 'eslint-plugin-react-refresh';

// Build output is generated, so it is excluded from linting entirely.
const ignoredPaths = {ignores: ['dist']};

// Parser setup for application sources: browser globals, ES modules, JSX.
const sourceLanguageOptions = {
    ecmaVersion: 2020,
    globals: globals.browser,
    parserOptions: {
        ecmaVersion: 'latest',
        ecmaFeatures: {jsx: true},
        sourceType: 'module',
    },
};

// Recommended rule sets first, then the project-specific overrides, so the
// overrides take precedence when the objects are spread together.
const sourceRules = {
    ...js.configs.recommended.rules,
    ...reactHooks.configs.recommended.rules,
    'no-unused-vars': ['error', {varsIgnorePattern: '^[A-Z_]'}],
    'react-refresh/only-export-components': [
        'warn',
        {allowConstantExport: true},
    ],
};

// Configuration applied to every .js / .jsx file in the project.
const sourceConfig = {
    files: ['**/*.{js,jsx}'],
    languageOptions: sourceLanguageOptions,
    plugins: {
        'react-hooks': reactHooks,
        'react-refresh': reactRefresh,
    },
    rules: sourceRules,
};

export default [ignoredPaths, sourceConfig];


================================================
FILE: frontend/index.html
================================================
<!doctype html>
<html lang="en">
  <head>
    <meta charset="UTF-8" />
    <link rel="icon" type="image/svg+xml" href="/vite.svg" />
    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
    <title>Vite + React</title>
  </head>
  <body>
    <div id="root"></div>
    <script type="module" src="/src/main.jsx"></script>
  </body>
</html>


================================================
FILE: frontend/package.json
================================================
{
    "name": "frontend",
    "private": true,
    "version": "0.0.0",
    "type": "module",
    "scripts": {
        "dev": "vite",
        "build": "vite build",
        "lint": "eslint .",
        "preview": "vite preview"
    },
    "dependencies": {
        "@reduxjs/toolkit": "^2.8.2",
        "lodash.debounce": "^4.0.8",
        "openseadragon": "^5.0.1",
        "openseadragon-filters": "^2.2.0",
        "react": "^19.1.0",
        "react-bootstrap": "^2.10.10",
        "react-dom": "^19.1.0",
        "react-redux": "^9.2.0",
        "react-router-dom": "^6.30.3",
        "screenfull": "^6.0.2",
        "split.js": "^1.6.5"
    },
    "devDependencies": {
        "@eslint/js": "^9.25.0",
        "@types/react": "^19.1.2",
        "@types/react-dom": "^19.1.2",
        "@vitejs/plugin-react": "^4.4.1",
        "eslint": "^9.25.0",
        "eslint-plugin-react-hooks": "^5.2.0",
        "eslint-plugin-react-refresh": "^0.4.19",
        "globals": "^16.0.0",
        "vite": "^7.3.2",
        "vite-plugin-static-copy": "^3.1.2"
    }
}


================================================
FILE: frontend/src/App.jsx
================================================
import React, {useEffect, useState} from 'react';
import {HashRouter, Routes, Route, Link, useParams} from 'react-router-dom';
import ViewerSplit from './ViewerSplit';

/**
 * Fetches a JSON endpoint and displays the response.
 *
 * Useful as a temporary inspector while APIs and UI are evolving.
 *
 * @param {Object} props
 * @param {string} props.endpoint
 *   Relative or absolute API URL to request.
 * @param {string} [props.method="GET"]
 *   HTTP method to use.
 * @returns {JSX.Element}
 */
function FetchAndDisplay({endpoint, method = 'GET'}) {
    const [data, setData] = useState(null);
    const [error, setError] = useState(null);

    useEffect(() => {
        fetch(endpoint, {
            method,
            headers: {'Content-Type': 'application/json'},
        })
            .then((response) => {
                if (!response.ok) throw new Error(response.statusText);
                return response.json();
            })
            .then(setData)
            .catch((err) => setError(err.toString()));
    }, [endpoint, method]);

    return (
        <div>
            <h2>
                {method} {endpoint}
            </h2>
            {error && <div style={{color: 'red'}}>Error: {error}</div>}
            <pre>{JSON.stringify(data, null, 2)}</pre>
        </div>
    );
}

/**
 * Loads asset JSON by id or by slugs, then renders children with the data.
 *
 * Route params are read from the current URL. If params describe either
 * `/assets/:assetId` or the slug form, the component fetches the asset
 * from the API and passes results to a render prop.
 *
 * While no asset has been loaded a loading message is rendered; if the
 * params are incomplete or the request fails, an error message is rendered
 * instead. The error is cleared when a new request starts, so a later
 * successful load is not masked by an earlier failure.
 *
 * Children receive an object with:
 *   - `assetData`: the latest asset payload
 *   - `handleTranscriptionUpdate`: callback to merge a server response from
 *     a transcription action back into `assetData`
 *
 * @param {Object} props
 * @param {Function} props.children
 *   Render prop called as `children({ assetData, handleTranscriptionUpdate })`.
 * @returns {JSX.Element}
 */
function AssetLoader({children}) {
    const params = useParams();
    const [assetData, setAssetData] = useState(null);
    const [error, setError] = useState(null);

    useEffect(() => {
        const {assetId, campaignSlug, projectSlug, itemId, assetSlug} = params;

        // Route params are inserted into a URL path, so each segment is
        // percent-encoded before use.
        let endpoint;
        if (assetId) {
            endpoint = `/api/assets/${encodeURIComponent(assetId)}`;
        } else if (campaignSlug && projectSlug && itemId && assetSlug) {
            const path = [campaignSlug, projectSlug, itemId, assetSlug]
                .map((segment) => encodeURIComponent(segment))
                .join('/');
            endpoint = `/api/assets/${path}/`;
        } else {
            setError('Missing asset parameters');
            return;
        }

        // Set by the cleanup function; guards against applying the result of
        // a request that has been superseded or whose component unmounted.
        let ignore = false;

        // A previous failure must not hide the outcome of this request.
        // `assetData` is intentionally left in place so already-rendered
        // children stay mounted while the refresh is in flight.
        setError(null);

        fetch(endpoint, {
            method: 'GET',
            headers: {'Content-Type': 'application/json'},
        })
            .then((response) => {
                if (!response.ok) {
                    // statusText may be empty (e.g. over HTTP/2), so always
                    // include the numeric status code in the message.
                    throw new Error(
                        `${response.status} ${response.statusText}`.trim(),
                    );
                }
                return response.json();
            })
            .then((payload) => {
                if (!ignore) setAssetData(payload);
            })
            .catch((err) => {
                if (!ignore) setError(err.toString());
            });

        return () => {
            ignore = true;
        };
        // Keyed on the params object itself (not its individual values) so
        // the refetch timing matches the original implementation.
    }, [params]);

    /**
     * Merge a transcription API response back into local asset state.
     *
     * Expects the server to return `{ id, text, ..., asset: <AssetOut> }`.
     * If the response is missing `asset`, the update is skipped.
     *
     * @param {Object} updatedTranscription
     */
    const handleTranscriptionUpdate = (updatedTranscription) => {
        if (!updatedTranscription?.asset) {
            console.error(
                'Missing asset on updatedTranscription:',
                updatedTranscription,
            );
            return;
        }

        setAssetData({
            ...updatedTranscription.asset,
            transcription: updatedTranscription,
            transcriptionStatus: updatedTranscription.asset.transcriptionStatus,
        });
    };

    if (error) return <div style={{color: 'red'}}>Error: {error}</div>;
    if (!assetData) return <div>Loading asset data...</div>;

    return children({assetData, handleTranscriptionUpdate});
}

/**
 * Defines nested routes for a single asset view.
 *
 * Renders the split viewer by default and wires routes for supporting
 * actions like OCR, rollback, rollforward, submit and review.
 *
 * @param {Object} props
 * @param {Object} props.assetData
 * @param {Function} props.handleTranscriptionUpdate
 * @returns {JSX.Element}
 */
function AssetRoutes({assetData, handleTranscriptionUpdate}) {
    return (
        <>
            <NavLinks assetData={assetData} />
            <Routes>
                <Route
                    path=""
                    element={
                        <ViewerSplit
                            assetData={assetData}
                            onTranscriptionUpdate={handleTranscriptionUpdate}
                        />
                    }
                />
                <Route path="transcriptions" element={<Transcriptions />} />
                <Route path="ocr" element={<OCRTranscription />} />
                <Route path="rollback" element={<Rollback />} />
                <Route path="rollforward" element={<Rollforward />} />
                <Route path="submit/:transcriptionId" element={<Submit />} />
                <Route path="review/:transcriptionId" element={<Review />} />
                <Route path="*" element={<NotFound />} />
            </Routes>
        </>
    );
}

/**
 * Renders navigation links for the current asset and optional
 * links for a specific transcription.
 *
 * @param {Object} props
 * @param {Object} props.assetData
 * @returns {JSX.Element|null}
 */
function NavLinks({assetData}) {
    if (!assetData) return null;

    const currentAssetId = assetData.id;
    const transcriptionId = assetData.transcription?.id;

    return (
        <nav>
            <Link to={`/${currentAssetId}`}>Asset</Link> |{' '}
            <Link to={`/${currentAssetId}/transcriptions`}>Transcriptions</Link>{' '}
            | <Link to={`/${currentAssetId}/ocr`}>OCR</Link> |{' '}
            <Link to={`/${currentAssetId}/rollback`}>Rollback</Link> |{' '}
            <Link to={`/${currentAssetId}/rollforward`}>Rollforward</Link>
            {transcriptionId && (
                <>
                    {' | '}
                    <Link to={`/${currentAssetId}/submit/${transcriptionId}`}>
                        Submit
                    </Link>{' '}
                    |{' '}
                    <Link to={`/${currentAssetId}/review/${transcriptionId}`}>
                        Review
                    </Link>
                </>
            )}
        </nav>
    );
}

/**
 * Fallback route for unknown paths.
 *
 * @returns {JSX.Element}
 */
function NotFound() {
    return <h2 style={{color: 'red'}}>404 Not Found</h2>;
}

/**
 * Debug route: show transcriptions list payload for an asset.
 *
 * @returns {JSX.Element}
 */
function Transcriptions() {
    const {assetId} = useParams();
    const endpoint = `/api/assets/${assetId}/transcriptions`;
    return <FetchAndDisplay endpoint={endpoint} />;
}

/**
 * Debug route: trigger OCR transcription endpoint for an asset.
 *
 * @returns {JSX.Element}
 */
function OCRTranscription() {
    const {assetId} = useParams();
    const endpoint = `/api/assets/${assetId}/transcriptions/ocr`;
    return <FetchAndDisplay endpoint={endpoint} />;
}

/**
 * Debug route: call rollback endpoint for an asset.
 *
 * @returns {JSX.Element}
 */
function Rollback() {
    const {assetId} = useParams();
    const endpoint = `/api/assets/${assetId}/transcriptions/rollback`;
    return <FetchAndDisplay endpoint={endpoint} />;
}

/**
 * Debug route: call rollforward endpoint for an asset.
 *
 * @returns {JSX.Element}
 */
function Rollforward() {
    const {assetId} = useParams();
    const endpoint = `/api/assets/${assetId}/transcriptions/rollforward`;
    return <FetchAndDisplay endpoint={endpoint} />;
}

/**
 * Debug route: submit a transcription by id.
 *
 * @returns {JSX.Element}
 */
function Submit() {
    const {transcriptionId} = useParams();
    const endpoint = `/api/transcriptions/${transcriptionId}/submit`;
    return <FetchAndDisplay endpoint={endpoint} />;
}

/**
 * Debug route: review a transcription by id.
 *
 * @returns {JSX.Element}
 */
function Review() {
    const {transcriptionId} = useParams();
    const endpoint = `/api/transcriptions/${transcriptionId}/review`;
    return <FetchAndDisplay endpoint={endpoint} />;
}

/**
 * Application router for the React transcription UI.
 *
 * Supports two entry patterns:
 *   1) `/:assetId/*` -- load by numeric id
 *   2) `/:campaignSlug/:projectSlug/:itemId/:assetSlug/*` -- load by slugs
 *
 * Both patterns use `AssetLoader`, which fetches JSON then renders nested
 * routes with `AssetRoutes`.
 *
 * @returns {JSX.Element}
 */
export default function App() {
    return (
        <HashRouter>
            <Routes>
                <Route
                    path="/:assetId/*"
                    element={
                        <AssetLoader>
                            {({assetData, handleTranscriptionUpdate}) => (
                                <AssetRoutes
                                    assetData={assetData}
                                    handleTranscriptionUpdate={
                                        handleTranscriptionUpdate
                                    }
                                />
                            )}
                        </AssetLoader>
                    }
                />
                <Route
                    path="/:campaignSlug/:projectSlug/:itemId/:assetSlug/*"
                    element={
                        <AssetLoader>
                            {({assetData, handleTranscriptionUpdate}) => (
                                <AssetRoutes
                                    assetData={assetData}
                                    handleTranscriptionUpdate={
                                        handleTranscriptionUpdate
                                    }
                                />
                            )}
                        </AssetLoader>
                    }
                />
                <Route path="*" element={<NotFound />} />
            </Routes>
        </HashRouter>
    );
}


================================================
FILE: frontend/src/ViewerSplit.jsx
================================================
import React, {useLayoutEffect, useRef, useState} from 'react';
import Split from 'split.js';

import Editor from './editor/Editor';
import Viewer from './viewer/Viewer';
import OcrSection from './ocr/Section';

/**
 * @typedef {Object} AssetData
 * @property {number} id
 * @property {string} imageUrl
 * @property {Object} [transcription]
 *   Latest transcription object for the asset, or null if none.
 * @property {string} transcriptionStatus
 *   One of the server statuses used to choose UI state.
 * @property {number} registeredContributors
 * @property {Array<[string,string]>} languages
 *   Array of [isoCode, languageName] pairs used by OCR.
 * @property {boolean} undoAvailable
 * @property {boolean} redoAvailable
 */

/**
 * Split-pane layout for the transcription UI.
 *
 * Renders the image viewer on one side and the editor on the other,
 * with a draggable gutter. The split direction and pane sizes persist
 * to localStorage. When the direction changes, the viewer is nudged to
 * re-fit the image.
 *
 * Local storage keys:
 * - "transcription-split-sizes-vertical" for vertical sizes
 * - "transcription-split-sizes-horizontal" for horizontal sizes
 * - "transcription-split-direction" for the active direction
 *
 * @param {{assetData: AssetData, onTranscriptionUpdate?: (t: Object) => void}} props
 *   assetData: Data for the current asset.
 *   onTranscriptionUpdate: Callback when a new transcription is saved
 *   or loaded.
 */
export default function ViewerSplit({assetData, onTranscriptionUpdate}) {
    const contributeContainerRef = useRef(null);
    const editorColumnRef = useRef(null);

    const verticalKey = 'transcription-split-sizes-vertical';
    const horizontalKey = 'transcription-split-sizes-horizontal';
    const directionKey = 'transcription-split-direction';

    const [splitDirection, setSplitDirection] = useState(
        JSON.parse(localStorage.getItem(directionKey)) || 'h',
    );

    const [transcription, setTranscription] = useState(assetData.transcription);

    /**
     * Handle an updated transcription payload from child components.
     * Updates local state and forwards to the optional parent callback.
     *
     * @param {Object} updated
     */
    const handleTranscriptionUpdate = (updated) => {
        if (!updated?.text) {
            console.warn(
                'handleTranscriptionUpdate called with malformed object:',
                updated,
            );
            return;
        }
        setTranscription(updated);
        if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
    };

    /**
     * Update only the transcription text field as the user types.
     *
     * @param {string} newText
     */
    const handleTranscriptionTextChange = (newText) => {
        setTranscription((prev) => ({
            ...prev,
            text: newText,
        }));
    };

    /**
     * Read persisted Split.js sizes or return the provided defaults.
     *
     * @param {string} key
     * @param {number[]} defaultSizes
     * @returns {number[]}
     */
    const getSizes = (key, defaultSizes) => {
        const sizes = localStorage.getItem(key);
        return sizes ? JSON.parse(sizes) : defaultSizes;
    };

    /**
     * Persist pane sizes for the current direction.
     *
     * @param {number[]} sizes
     */
    const saveSizes = (sizes) => {
        const key = splitDirection === 'h' ? horizontalKey : verticalKey;
        localStorage.setItem(key, JSON.stringify(sizes));
    };

    /**
     * Persist the active split direction.
     *
     * @param {'h'|'v'} dir
     */
    const saveDirection = (dir) => {
        localStorage.setItem(directionKey, JSON.stringify(dir));
    };

    /**
     * Create or recreate the Split.js instance whenever direction changes.
     * Cleans up on unmount. Uses flex-basis so panes respect the gutter size.
     */
    useLayoutEffect(() => {
        const sizes =
            splitDirection === 'h'
                ? getSizes(horizontalKey, [50, 50])
                : getSizes(verticalKey, [50, 50]);

        const splitInstance = Split(['#viewer-column', '#editor-column'], {
            sizes,
            minSize: 100,
            gutterSize: 8,
            direction: splitDirection === 'h' ? 'horizontal' : 'vertical',
            elementStyle: (dimension, size, gutterSize) => ({
                flexBasis: `calc(${size}% - ${gutterSize}px)`,
            }),
            gutterStyle: (dimension, gutterSize) => ({
                flexBasis: `${gutterSize}px`,
            }),
            onDragEnd: saveSizes,
        });

        return () => {
            splitInstance.destroy();
        };
    }, [splitDirection]);

    /**
     * Toggle between horizontal and vertical layouts.
     * Saves direction then requests the OpenSeadragon viewer to re-fit.
     *
     * @param {'h'|'v'} dir
     */
    const handleToggle = (dir) => {
        if (dir !== splitDirection) {
            setSplitDirection(dir);
            saveDirection(dir);
            setTimeout(() => {
                if (window.seadragonViewer?.viewport) {
                    window.seadragonViewer.viewport.zoomTo(1, undefined, true);
                }
            }, 10);
        }
    };

    return (
        <div className="viewer-split">
            <div
                id="contribute-container"
                ref={contributeContainerRef}
                className={`d-flex ${
                    splitDirection === 'h' ? 'flex-row' : 'flex-column'
                }`}
                style={{height: '100vh'}}
            >
                <div
                    id="viewer-column"
                    className="ps-0 d-flex align-items-stretch bg-dark d-print-block flex-column"
                >
                    <Viewer
                        imageUrl={assetData.imageUrl}
                        onLayoutHorizontal={() => handleToggle('h')}
                        onLayoutVertical={() => handleToggle('v')}
                    />
                    <OcrSection
                        assetId={assetData.id}
                        transcription={transcription}
                        onTranscriptionUpdate={handleTranscriptionUpdate}
                        languages={assetData.languages}
                    />
                </div>
                <div id="editor-column" ref={editorColumnRef}>
                    <Editor
                        assetId={assetData.id}
                        transcription={transcription}
                        transcriptionStatus={assetData.transcriptionStatus}
                        registeredContributors={
                            assetData.registeredContributors
                        }
                        undoAvailable={assetData.undoAvailable}
                        redoAvailable={assetData.redoAvailable}
                        onTranscriptionUpdate={handleTranscriptionUpdate}
                        onTranscriptionTextChange={
                            handleTranscriptionTextChange
                        }
                    />
                </div>
            </div>
        </div>
    );
}


================================================
FILE: frontend/src/config.js
================================================
/**
 * Viewer configuration helpers for the React transcription UI.
 *
 * Reads optional values from a DOM element with id "viewer-data" and exposes
 * resolved settings as named exports. Falls back to safe defaults when the
 * element is missing or its dataset values are empty.
 *
 * Expected dataset attributes on #viewer-data:
 *   - data-prefix-url: string URL prefix for OpenSeadragon control images
 *   - data-contact-url: string URL for the "contact us" link
 *
 * No runtime side effects beyond a DOM lookup and a console warning when the
 * element is not present.
 */

/**
 * Fallback OpenSeadragon image prefix, used when #viewer-data is missing
 * or its `data-prefix-url` value is empty.
 */
const DEFAULT_PREFIX_URL = '/static/openseadragon-images/';

/**
 * Fallback contact URL, used when #viewer-data is missing or its
 * `data-contact-url` value is empty.
 */
const DEFAULT_CONTACT_URL = 'https://ask.loc.gov/crowd';

/**
 * Shape of the viewer configuration object.
 *
 * @typedef {Object} ViewerConfig
 * @property {string} prefixUrl
 *   Base URL where OpenSeadragon looks for its control images.
 * @property {string} contactUrl
 *   Absolute URL used by "contact us" or help links.
 */

/**
 * Build the viewer configuration, preferring values found in the DOM.
 *
 * The element with id "viewer-data" is looked up once. When it is absent
 * a warning is logged and both defaults are returned. Otherwise its
 * `data-prefix-url` and `data-contact-url` values are used, with any
 * falsy value (including the empty string) replaced by the matching
 * default.
 *
 * @returns {ViewerConfig}
 */
function getViewerConfig() {
    const config = {
        prefixUrl: DEFAULT_PREFIX_URL,
        contactUrl: DEFAULT_CONTACT_URL,
    };

    const holder = document.getElementById('viewer-data');
    if (!holder) {
        console.warn('viewer-data element not found');
        return config;
    }

    const data = holder.dataset;
    const fromDomPrefix = data.prefixUrl;
    const fromDomContact = data.contactUrl;

    // Only truthy dataset values override the defaults.
    if (fromDomPrefix) {
        config.prefixUrl = fromDomPrefix;
    }
    if (fromDomContact) {
        config.contactUrl = fromDomContact;
    }
    return config;
}

/**
 * Resolved configuration values for consumers.
 *
 * Both exports are strings, computed once when this module is first
 * evaluated by calling `getViewerConfig()`:
 *
 * - `prefixUrl`: base URL OpenSeadragon uses for its control images.
 * - `contactUrl`: URL used by UI links that route users to support.
 */
export const {prefixUrl, contactUrl} = getViewerConfig();


================================================
FILE: frontend/src/editor/Buttons.jsx
================================================
import React from 'react';
import EditableButtons from './buttons/Editable';
import SubmitButton from './buttons/Submit';
import ReviewButton from './buttons/Review';

/**
 * Render the editor button row.
 *
 * Shows:
 * - <EditableButtons> when `isEditable` is true
 * - <SubmitButton> when `submitVisible` is true
 * - <ReviewButton> when `inReview` is true
 *
 * If none of the sections are visible, the component returns null.
 *
 * Layout: a centered flex container with wrap to handle narrow viewports.
 *
 * @param {Object} props
 * @param {boolean} props.isEditable
 *   Whether the draft editing controls should be shown.
 * @param {boolean} props.submitVisible
 *   Whether the submit control should be shown.
 * @param {boolean} props.inReview
 *   Whether accept and reject controls should be shown.
 * @param {boolean} props.undoAvailable
 *   Whether undo is available for the current asset.
 * @param {boolean} props.redoAvailable
 *   Whether redo is available for the current asset.
 * @param {string} props.text
 *   Current transcription text, passed to <EditableButtons>.
 * @param {boolean} props.isSaving
 *   True while a save is in flight.
 * @param {boolean} props.isSubmitting
 *   True while a submit is in flight.
 * @param {boolean} props.isReviewing
 *   True while a review action is in flight.
 * @param {boolean} props.submitEnabled
 *   Whether the submit button should be enabled.
 * @param {() => void} props.onSave
 *   Handler for saving a draft transcription.
 * @param {() => void} props.onSubmit
 *   Handler for submitting a transcription for review.
 * @param {() => void} props.onAccept
 *   Handler for accepting a submitted transcription.
 * @param {() => void} props.onReject
 *   Handler for rejecting a submitted transcription.
 * @param {() => void} props.onUndo
 *   Handler to trigger an undo action.
 * @param {() => void} props.onRedo
 *   Handler to trigger a redo action.
 */
export default function EditorButtons({
    isEditable,
    submitVisible,
    inReview,
    undoAvailable,
    redoAvailable,
    text,
    isSaving,
    isSubmitting,
    isReviewing,
    submitEnabled,
    onSave,
    onSubmit,
    onAccept,
    onReject,
    onUndo,
    onRedo,
}) {
    if (!isEditable && !submitVisible && !inReview) return null;

    return (
        <div className="d-flex justify-content-center mt-3 flex-wrap">
            {isEditable && (
                <EditableButtons
                    onSave={onSave}
                    isSaving={isSaving}
                    text={text}
                    undoAvailable={undoAvailable}
                    redoAvailable={redoAvailable}
                    onUndo={onUndo}
                    onRedo={onRedo}
                />
            )}
            {submitVisible && (
                <SubmitButton
                    onSubmit={onSubmit}
                    isSubmitting={isSubmitting}
                    submitEnabled={submitEnabled}
                />
            )}
            {inReview && (
                <ReviewButton
                    onAccept={onAccept}
                    onReject={onReject}
                    isReviewing={isReviewing}
                />
            )}
        </div>
    );
}


================================================
FILE: frontend/src/editor/Editor.jsx
================================================
import React from 'react';
import EditorHeader from './Header';
import TranscriptionTextarea from './TranscriptionTextarea';
import EditorStatusMessages from './StatusMessages';
import EditorButtons from './Buttons';

/**
 * Editor panel for the React transcription page.
 *
 * Renders the header, textarea and action buttons. Manages save, submit,
 * accept, reject, undo and redo flows against the API, then emits updates
 * to the parent via `onTranscriptionUpdate`.
 *
 * Status mapping:
 * - "not_started" or "in_progress" -> editable with submit option visible
 * - "submitted" -> review controls visible
 *
 * This code is functional but not final. The API surface and UX may change.
 */

/**
 * Submit a draft transcription for review.
 *
 * Sends a POST to `/api/transcriptions/<id>/submit`.
 *
 * @param {number} transcriptionId
 * @returns {Promise<Object>} JSON payload from the API
 * @throws {Error} when the response is not OK. The message is the
 *   `detail` field of the JSON error body when present, otherwise
 *   "Failed to submit transcription".
 */
async function submitTranscription(transcriptionId) {
    const response = await fetch(
        `/api/transcriptions/${transcriptionId}/submit`,
        {
            method: 'POST',
            headers: {'Content-Type': 'application/json'},
        },
    );
    if (!response.ok) {
        // An error body is not guaranteed to be JSON (for example an HTML
        // error page). Swallow the parse failure so the caller sees the
        // intended message instead of a JSON syntax error.
        const error = await response.json().catch(() => null);
        throw new Error(error?.detail || 'Failed to submit transcription');
    }
    return await response.json();
}

/**
 * Review a submitted transcription.
 *
 * Sends a PATCH to `/api/transcriptions/<id>/review` with a JSON body of
 * `{action}`.
 *
 * @param {number} transcriptionId
 * @param {'accept'|'reject'} action
 * @returns {Promise<Object>} JSON payload from the API
 * @throws {Error} when the response is not OK. The message is the
 *   `detail` field of the JSON error body when present, otherwise
 *   "Failed to review transcription".
 */
async function reviewTranscription(transcriptionId, action) {
    const response = await fetch(
        `/api/transcriptions/${transcriptionId}/review`,
        {
            method: 'PATCH',
            headers: {'Content-Type': 'application/json'},
            body: JSON.stringify({action}),
        },
    );
    if (!response.ok) {
        // An error body is not guaranteed to be JSON (for example an HTML
        // error page). Swallow the parse failure so the caller sees the
        // intended message instead of a JSON syntax error.
        const error = await response.json().catch(() => null);
        throw new Error(error?.detail || 'Failed to review transcription');
    }
    return await response.json();
}

/**
 * Accept a submitted transcription.
 *
 * Shorthand for `reviewTranscription(transcriptionId, 'accept')`.
 *
 * @param {number} transcriptionId
 * @returns {Promise<Object>} Whatever `reviewTranscription` resolves to.
 */
async function acceptTranscription(transcriptionId) {
    const action = 'accept';
    return reviewTranscription(transcriptionId, action);
}

/**
 * Reject a submitted transcription.
 *
 * Shorthand for `reviewTranscription(transcriptionId, 'reject')`.
 *
 * @param {number} transcriptionId
 * @returns {Promise<Object>} Whatever `reviewTranscription` resolves to.
 */
async function rejectTranscription(transcriptionId) {
    const action = 'reject';
    return reviewTranscription(transcriptionId, action);
}

/**
 * Editor container component.
 *
 * Orchestrates UI state, calls API endpoints for save, submit, accept,
 * reject, undo and redo, then forwards the updated payload upstream.
 *
 * @param {Object} props
 * @param {number} props.assetId
 *   Asset id used for API calls.
 * @param {Object|null} props.transcription
 *   Current transcription object, or null when none exists.
 * @param {'not_started'|'in_progress'|'submitted'} props.transcriptionStatus
 *   Current workflow status for the asset.
 * @param {number} props.registeredContributors
 *   Count of registered contributors for the asset.
 * @param {boolean} props.undoAvailable
 *   Whether an undo target exists.
 * @param {boolean} props.redoAvailable
 *   Whether a redo target exists.
 * @param {(updated:Object) => void} props.onTranscriptionUpdate
 *   Callback fired with the API response after any change.
 * @param {(text:string) => void} props.onTranscriptionTextChange
 *   Callback fired when the textarea value changes.
 */
export default function Editor(props) {
    const {
        assetId,
        transcription,
        transcriptionStatus,
        registeredContributors,
        undoAvailable,
        redoAvailable,
        onTranscriptionUpdate,
        onTranscriptionTextChange,
    } = props;

    const [isSaving, setIsSaving] = React.useState(false);
    const [isSubmitting, setIsSubmitting] = React.useState(false);
    const [isReviewing, setIsReviewing] = React.useState(false);
    const [error, setError] = React.useState(null);
    const [success, setSuccess] = React.useState(false);
    const [submitSuccess, setSubmitSuccess] = React.useState(false);

    const status = transcriptionStatus;
    const isEditable = ['not_started', 'in_progress'].includes(status);
    const submitVisible = ['not_started', 'in_progress'].includes(status);
    const submitEnabled = status === 'in_progress' && transcription?.id;
    const inReview = status === 'submitted';
    const supersedes = transcription?.id;
    const text = transcription?.text || '';

    const handleSave = async () => {
        setIsSaving(true);
        setError(null);
        setSuccess(false);

        try {
            const response = await fetch(
                `/api/assets/${assetId}/transcriptions`,
                {
                    method: 'POST',
                    headers: {'Content-Type': 'application/json'},
                    body: JSON.stringify({
                        text,
                        ...(supersedes ? {supersedes} : {}),
                    }),
                },
            );

            if (!response.ok) {
                const data = await response.json();
                throw new Error(data.error || response.statusText);
            }

            const updated = await response.json();
            setSuccess(true);
            if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
        } catch (err) {
            setError(err.message);
        } finally {
            setIsSaving(false);
        }
    };

    const handleSubmit = async () => {
        if (!transcription?.id) return;
        setIsSubmitting(true);
        setError(null);
        setSubmitSuccess(false);

        try {
            const updated = await submitTranscription(transcription.id);
            setSubmitSuccess(true);
            if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
        } catch (err) {
            setError(err.message);
        } finally {
            setIsSubmitting(false);
        }
    };

    const handleAccept = async () => {
        if (!transcription?.id) return;
        setIsReviewing(true);
        setError(null);

        try {
            const updated = await acceptTranscription(transcription.id);
            if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
        } catch (err) {
            setError(err.message);
        } finally {
            setIsReviewing(false);
        }
    };

    const handleReject = async () => {
        if (!transcription?.id) return;
        setIsReviewing(true);
        setError(null);

        try {
            const updated = await rejectTranscription(transcription.id);
            if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
        } catch (err) {
            setError(err.message);
        } finally {
            setIsReviewing(false);
        }
    };

    const handleUndo = async () => {
        setIsSaving(true);
        setError(null);
        try {
            const response = await fetch(
                `/api/assets/${assetId}/transcriptions/rollback`,
                {
                    method: 'POST',
                    headers: {'Content-Type': 'application/json'},
                },
            );
            if (!response.ok) {
                const data = await response.json();
                throw new Error(data.detail || data.error || 'Undo failed');
            }
            const updated = await response.json();
            if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
        } catch (err) {
            setError(err.message);
        } finally {
            setIsSaving(false);
        }
    };

    const handleRedo = async () => {
        setIsSaving(true);
        setError(null);
        try {
            const response = await fetch(
                `/api/assets/${assetId}/transcriptions/rollforward`,
                {
                    method: 'POST',
                    headers: {'Content-Type': 'application/json'},
                },
            );
            if (!response.ok) {
                const data = await response.json();
                throw new Error(data.detail || data.error || 'Redo failed');
            }
            const updated = await response.json();
            if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
        } catch (err) {
            setError(err.message);
        } finally {
            setIsSaving(false);
        }
    };

    return (
        <div className="editor p-3 d-flex flex-column flex-grow-1">
            <EditorHeader
                status={status}
                registeredContributors={registeredContributors}
            />

            <TranscriptionTextarea
                value={text}
                onChange={onTranscriptionTextChange}
                editable={isEditable}
            />

            <EditorStatusMessages
                error={error}
                success={success}
                submitSuccess={submitSuccess}
            />

            <EditorButtons
                isEditable={isEditable}
                submitVisible={submitVisible}
                inReview={inReview}
                undoAvailable={undoAvailable}
                redoAvailable={redoAvailable}
                text={text}
                isSaving={isSaving}
                isSubmitting={isSubmitting}
                isReviewing={isReviewing}
                submitEnabled={submitEnabled}
                onSave={handleSave}
                onSubmit={handleSubmit}
                onAccept={handleAccept}
                onReject={handleReject}
                onUndo={handleUndo}
                onRedo={handleRedo}
            />
        </div>
    );
}


================================================
FILE: frontend/src/editor/Header.jsx
================================================
import React from 'react';

/**
 * Editor header for the React transcription page.
 *
 * Shows a human friendly status label, task instructions and, when applicable,
 * the count of registered contributors. This module is functional but in flux.
 * It is part of the React transcription UI and may change as the API and UX
 * are refined.
 */

/**
 * Display label for each workflow status code, listed in workflow order.
 * Keys must match backend status values.
 * @type {Record<'not_started'|'in_progress'|'submitted'|'completed', string>}
 */
const statusMap = {
    not_started: 'Not started',
    in_progress: 'In progress',
    submitted: 'Needs review',
    completed: 'Completed',
};

/**
 * Short user-facing instruction for each workflow status code, listed in
 * workflow order. Copy is provisional and may change.
 * @type {Record<'not_started'|'in_progress'|'submitted'|'completed', string>}
 */
const instructionsMap = {
    not_started: 'Transcribe this page.',
    in_progress: 'Someone started this transcription. Can you finish it?',
    submitted: 'Check this transcription thoroughly. Accept if correct!',
    completed: 'This transcription is finished! You can read and add tags.',
};

/**
 * Header section for the editor column.
 *
 * @param {Object} props
 * @param {'not_started'|'in_progress'|'submitted'|'completed'} props.status
 *   Current workflow status for the asset.
 * @param {number} props.registeredContributors
 *   Count of registered contributors. Shown for all states except not_started.
 */
export default function EditorHeader({status, registeredContributors}) {
    const statusLabel = statusMap[status] || 'Unknown status';
    const instructions = instructionsMap[status] || '';

    return (
        <div className="mb-2">
            <h2>{statusLabel}</h2>
            {status !== 'not_started' && (
                <h2>
                    Registered Contributors:{' '}
                    <span className="fw-normal">{registeredContributors}</span>
                </h2>
            )}
            <p>{instructions}</p>
        </div>
    );
}


================================================
FILE: frontend/src/editor/StatusMessages.jsx
================================================
import React from 'react';

/**
 * Status message area for the React transcription editor.
 *
 * Displays inline feedback for error, save success and submit success.
 * This module is part of the transcription UI and is in flux as the app
 * evolves.
 *
 * @param {Object} props
 * @param {string|null} props.error
 *   Error message to display. When truthy shows "Error: <message>".
 * @param {boolean} props.success
 *   When true shows "Transcription saved."
 * @param {boolean} props.submitSuccess
 *   When true shows "Transcription submitted."
 */
export default function EditorStatusMessages({error, success, submitSuccess}) {
    return (
        <>
            {error && <div className="text-danger">Error: {error}</div>}
            {success && (
                <div className="text-success">Transcription saved.</div>
            )}
            {submitSuccess && (
                <div className="text-success">Transcription submitted.</div>
            )}
        </>
    );
}


================================================
FILE: frontend/src/editor/TranscriptionTextarea.jsx
================================================
import React from 'react';

/**
 * Multiline textarea for transcription input.
 *
 * Renders a Bootstrap styled `<textarea>` bound to `value`, `onChange` and
 * an `editable` flag. When `editable` is false the field is readOnly and a
 * non editing placeholder is shown.
 *
 * @param {Object} props
 * @param {string} props.value
 *   Current transcription text.
 * @param {(value: string) => void} props.onChange
 *   Callback invoked with the updated text.
 * @param {boolean} props.editable
 *   When true the textarea is editable, otherwise it is readOnly.
 */
export default function TranscriptionTextarea({value, onChange, editable}) {
    return (
        <textarea
            className="form-control flex-grow-1 mb-3"
            value={value}
            onChange={(e) => onChange(e.target.value)}
            readOnly={!editable}
            placeholder={
                editable
                    ? 'Go ahead, start typing. You got this!'
                    : 'Nothing to transcribe'
            }
            aria-label="Transcription input"
            style={{minHeight: '200px'}}
        />
    );
}


================================================
FILE: frontend/src/editor/buttons/Editable.jsx
================================================
import React from 'react';
import EditorButtonSave from './Save';
import EditorButtonUndo from './Undo';
import EditorButtonRedo from './Redo';

/**
 * Button cluster for editable transcription state.
 *
 * Renders Save, Undo and Redo controls. Each child button receives only
 * the props it needs. This component does not manage any state.
 *
 * @param {Object} props
 * @param {boolean} props.isSaving
 *   True while a save request is in flight.
 * @param {string} props.text
 *   Current transcription text to validate save availability.
 * @param {boolean} props.undoAvailable
 *   True when an undo operation is possible.
 * @param {boolean} props.redoAvailable
 *   True when a redo operation is possible.
 * @param {() => void} props.onSave
 *   Called when the Save button is clicked.
 * @param {() => void} props.onUndo
 *   Called when the Undo button is clicked.
 * @param {() => void} props.onRedo
 *   Called when the Redo button is clicked.
 */
export default function EditorButtonsEditable({
    isSaving,
    text,
    undoAvailable,
    redoAvailable,
    onSave,
    onUndo,
    onRedo,
}) {
    return (
        <>
            <EditorButtonSave isSaving={isSaving} text={text} onSave={onSave} />
            <EditorButtonUndo undoAvailable={undoAvailable} onClick={onUndo} />
            <EditorButtonRedo redoAvailable={redoAvailable} onClick={onRedo} />
        </>
    );
}


================================================
FILE: frontend/src/editor/buttons/Redo.jsx
================================================
import React from 'react';

/**
 * Redo button for the transcription editor.
 *
 * Presentational only. Disabled when no redo is available.
 *
 * @param {Object} props
 * @param {boolean} props.redoAvailable
 *   True when a redo operation can be performed.
 * @param {() => void} props.onClick
 *   Click handler invoked to trigger redo.
 */
export default function EditorButtonRedo({redoAvailable, onClick}) {
    return (
        <button
            className="btn btn-outline-primary mx-1 mb-2"
            disabled={!redoAvailable}
            onClick={onClick}
        >
            Redo <span className="fas fa-redo"></span>
        </button>
    );
}


================================================
FILE: frontend/src/editor/buttons/Review.jsx
================================================
import React from 'react';

/**
 * Review action buttons for the transcription editor.
 *
 * Renders two primary buttons:
 * - "Edit" triggers the reject flow so a reviewer can make changes
 * - "Accept" confirms the transcription is accurate
 *
 * @param {Object} props
 * @param {boolean} props.isReviewing
 *   True while a review API call is active which disables the buttons.
 * @param {() => void} props.onAccept
 *   Handler to accept the current transcription.
 * @param {() => void} props.onReject
 *   Handler to send the transcription back for edits.
 */
export default function EditorButtonsReview({isReviewing, onAccept, onReject}) {
    return (
        <>
            <button
                className="btn btn-primary mx-1 mb-2"
                onClick={onReject}
                disabled={isReviewing}
                title="Correct errors you see in the text"
            >
                Edit
            </button>
            <button
                className="btn btn-primary mx-1 mb-2"
                onClick={onAccept}
                disabled={isReviewing}
                title="Confirm that the text is accurately transcribed"
            >
                Accept
            </button>
        </>
    );
}


================================================
FILE: frontend/src/editor/buttons/Save.jsx
================================================
import React from 'react';

/**
 * Save button for the transcription editor.
 *
 * Renders a primary button that calls `onSave`. The button is disabled while a
 * save is in progress or when the current text is empty after trimming.
 *
 * @param {Object} props
 * @param {() => void} props.onSave - Click handler to persist the draft.
 * @param {boolean} props.isSaving - True while a save request is in flight.
 * @param {string} props.text - Current transcription text used to gate enable state.
 * @returns {JSX.Element}
 */
export default function EditorButtonSave({onSave, isSaving, text}) {
    return (
        <button
            className="btn btn-primary mx-1 mb-2"
            onClick={onSave}
            disabled={isSaving || !text.trim()}
        >
            Save
        </button>
    );
}


================================================
FILE: frontend/src/editor/buttons/Submit.jsx
================================================
import React from 'react';

/**
 * Submit button for the transcription editor.
 *
 * Renders a primary button that calls `onSubmit`. The button is disabled
 * while a submit request is in flight or when submission is not allowed.
 *
 * @param {Object} props
 * @param {() => void} props.onSubmit - Click handler to submit the draft for review.
 * @param {boolean} props.isSubmitting - True while a submit request is in flight.
 * @param {boolean} props.submitEnabled - True when the current draft can be submitted.
 * @returns {JSX.Element}
 */
export default function EditorButtonSubmit({
    onSubmit,
    isSubmitting,
    submitEnabled,
}) {
    return (
        <button
            className="btn btn-primary mx-1 mb-2"
            onClick={onSubmit}
            disabled={!submitEnabled || isSubmitting}
            title="Request another volunteer to review the text you entered above"
        >
            {isSubmitting ? 'Submitting...' : 'Submit for Review'}
        </button>
    );
}


================================================
FILE: frontend/src/editor/buttons/Undo.jsx
================================================
import React from 'react';

/**
 * Undo button for the transcription editor.
 *
 * Renders an outline button that calls `onClick`. The button is disabled
 * when `undoAvailable` is false.
 *
 * @param {Object} props
 * @param {boolean} props.undoAvailable - True if a prior version exists to undo to.
 * @param {() => void} props.onClick - Click handler to perform the undo action.
 * @returns {JSX.Element}
 */
export default function EditorButtonUndo({undoAvailable, onClick}) {
    return (
        <button
            className="btn btn-outline-primary mx-1 mb-2"
            disabled={!undoAvailable}
            onClick={onClick}
        >
            <span className="fas fa-undo"></span> Undo
        </button>
    );
}


================================================
FILE: frontend/src/main.jsx
================================================
/**
 * Application entry point for the React transcription UI.
 *
 * Mounts <App /> into the DOM element with id "app" and enables React
 * StrictMode.
 *
 * Behavior notes:
 * - StrictMode turns on extra checks in development and may invoke some
 *   render effects twice -- this is expected.
 * - No globals are exported. Side effects are limited to mounting React.
 */

import React from 'react';
import ReactDOM from 'react-dom/client';
import App from './App';

ReactDOM.createRoot(document.getElementById('app')).render(
    <React.StrictMode>
        <App />
    </React.StrictMode>,
);


================================================
FILE: frontend/src/ocr/Button.jsx
================================================
import React from 'react';
import Button from 'react-bootstrap/Button';

/**
 * OCR action UI: a help link that opens the OCR help modal
 * and a primary button that starts OCR transcription.
 *
 * Notes:
 * - The help link triggers the Bootstrap modal with id "#ocr-help-modal"
 *   via data attributes. Ensure that modal exists in the DOM.
 * - Requires Bootstrap's modal JavaScript to be loaded.
 *
 * @param {Object} props
 * @param {() => void} props.onClick - Handler to begin the OCR flow.
 * @returns {JSX.Element}
 */
export default function OcrButton({onClick}) {
    return (
        <div className="d-flex flex-row align-items-center justify-content-end mt-1">
            <a
                tabIndex={0}
                className="btn btn-link d-inline p-0"
                role="button"
                data-bs-placement="top"
                data-bs-trigger="focus click hover"
                title="When to use OCR"
                data-bs-toggle="modal"
                data-bs-target="#ocr-help-modal"
            >
                <span className="underline-link fw-bold">What is OCR</span>{' '}
                <span
                    className="fas fa-question-circle"
                    aria-label="When to use OCR"
                ></span>
            </a>
            <Button className="mx-1" variant="primary" onClick={onClick}>
                Transcribe with OCR
            </Button>
        </div>
    );
}


================================================
FILE: frontend/src/ocr/ConfirmModal.jsx
================================================
import React from 'react';
import Modal from 'react-bootstrap/Modal';
import Button from 'react-bootstrap/Button';

/**
 * Confirmation modal shown before running OCR that would replace the current
 * transcription text with machine generated text.
 *
 * Behavior:
 * - Appears when `show` is true. Hides when the backdrop or close button is
 *   activated or when `onClose` is called.
 * - Clicking "Yes, Select Language" calls `onConfirm`, which should advance to
 *   language selection and OCR.
 * - Uses react-bootstrap Modal. Ensure Bootstrap's JS bundle is loaded.
 *
 * Accessibility:
 * - Modal is centered and managed by react-bootstrap which handles focus trap
 *   and aria attributes.
 *
 * Design note:
 * - The potential destructive action is on a link styled as a button for visual
 *   prominence while "Cancel" is a primary button.
 *
 * @param {Object} props
 * @param {boolean} props.show - Whether the modal is visible.
 * @param {() => void} props.onClose - Called when the user cancels or closes.
 * @param {() => void} props.onConfirm - Called to proceed to OCR language select.
 * @returns {JSX.Element}
 */
export default function OcrConfirmModal({show, onClose, onConfirm}) {
    return (
        <Modal show={show} onHide={onClose} centered>
            <Modal.Header closeButton />
            <Modal.Body>
                <div className="bg-light p-3">
                    <h5 className="modal-title mb-3">Are you sure?</h5>
                    <p>
                        Clicking "Transcribe with OCR" will remove all existing
                        transcription text and replace it with automatically
                        generated text. Use the "Undo" button to restore
                        previous text.
                    </p>
                </div>
            </Modal.Body>
            <Modal.Footer>
                <Button variant="primary" onClick={onClose}>
                    Cancel
                </Button>
                <Button
                    variant="link"
                    className="underline-link fw-bold"
                    onClick={onConfirm}
                >
                    Yes, Select Language
                </Button>
            </Modal.Footer>
        </Modal>
    );
}


================================================
FILE: frontend/src/ocr/Handler.jsx
================================================
import React, {useState} from 'react';

import OcrButton from './Button';
import OcrConfirmModal from './ConfirmModal';
import OcrLanguageModal from './LanguageModal';
import OcrHelpModal from './HelpModal';

/**
 * Orchestrates the OCR flow for the transcription editor.
 *
 * Flow:
 * 1) User clicks "Transcribe with OCR" button which opens a confirm modal.
 * 2) Confirm opens a language selection modal.
 * 3) Submit posts to `/api/assets/{assetId}/transcriptions/ocr` with
 *    `{language, supersedes}` then calls `onTranscriptionUpdate` with
 *    the server response.
 *
 * State:
 * - showConfirm: controls the confirm modal.
 * - showLanguage: controls the language modal.
 * - selectedLang: ISO 639-3 code, defaults to "eng".
 * - isSubmitting: disables inputs during the request.
 * - error: displays server or network errors in the language modal.
 *
 * Notes:
 * - OCR replaces existing text.
 * - Expects the API to return a TranscriptionOut payload with an `asset`
 *   object used to refresh editor state.
 *
 * Accessibility:
 * - Modals come from react-bootstrap which handles focus and aria attributes.
 *
 * @param {Object} props
 * @param {number} props.assetId - Asset primary key for API calls.
 * @param {Object|null} props.transcription - Current transcription or null.
 * @param {Array<[string,string]>} props.languages - OCR languages as
 *   `[code, label]`.
 * @param {(updated: Object) => void} props.onTranscriptionUpdate - Called with
 *   the API response after a successful OCR request.
 * @returns {JSX.Element}
 */
export default function OcrHandler({
    assetId,
    transcription,
    languages,
    onTranscriptionUpdate,
}) {
    const [showConfirm, setShowConfirm] = useState(false);
    const [showLanguage, setShowLanguage] = useState(false);
    const [selectedLang, setSelectedLang] = useState('eng');
    const [isSubmitting, setIsSubmitting] = useState(false);
    const [error, setError] = useState(null);

    const handleOcrClick = () => {
        setShowConfirm(true);
    };

    const handleConfirm = () => {
        setShowConfirm(false);
        setShowLanguage(true);
    };

    const handleCancelLanguage = () => {
        setShowLanguage(false);
        setSelectedLang('eng');
    };

    const handleLanguageChange = (lang) => {
        setSelectedLang(lang);
    };

    const handleLanguageSubmit = async () => {
        setIsSubmitting(true);
        setError(null);
        try {
            const response = await fetch(
                `/api/assets/${assetId}/transcriptions/ocr`,
                {
                    method: 'POST',
                    headers: {'Content-Type': 'application/json'},
                    body: JSON.stringify({
                        language: selectedLang,
                        supersedes: transcription?.id || null,
                    }),
                },
            );

            if (!response.ok) {
                const data = await response.json();
                throw new Error(data.detail || data.error || 'OCR failed');
            }

            const updated = await response.json();
            setShowLanguage(false);
            if (onTranscriptionUpdate) onTranscriptionUpdate(updated);
        } catch (err) {
            setError(err.message);
        } finally {
            setIsSubmitting(false);
        }
    };

    return (
        <>
            <OcrHelpModal />
            <OcrButton onClick={handleOcrClick} />
            <OcrConfirmModal
                show={showConfirm}
                onClose={() => setShowConfirm(false)}
                onConfirm={handleConfirm}
            />
            <OcrLanguageModal
                show={showLanguage}
                selectedLang={selectedLang}
                onChange={handleLanguageChange}
                onClose={handleCancelLanguage}
                onSubmit={handleLanguageSubmit}
                disabled={isSubmitting}
                error={error}
                languages={languages}
            />
        </>
    );
}


================================================
FILE: frontend/src/ocr/HelpModal.jsx
================================================
import React from 'react';

/**
 * Bootstrap modal explaining the "Transcribe with OCR" feature.
 *
 * Behavior:
 * - Static content only. Shown and hidden by Bootstrap via data attributes.
 * - Triggered by an element using `data-bs-target="#ocr-help-modal"`.
 *
 * Accessibility:
 * - Uses Bootstrap modal roles and close button. Container has `role="dialog"`.
 *
 * @returns {JSX.Element}
 */
export default function OcrHelpModal() {
    return (
        <div id="ocr-help-modal" className="modal" tabIndex={-1} role="dialog">
            <div className="modal-dialog modal-dialog-centered" role="document">
                <div className="modal-content">
                    <div className="modal-header">
                        <h5 className="modal-title">
                            About Transcribe with OCR
                        </h5>
                        <button
                            type="button"
                            className="btn-close"
                            data-bs-dismiss="modal"
                            aria-label="Close"
                        ></button>
                    </div>
                    <div className="modal-body">
                        <h6 className="modal-title">What is OCR?</h6>
                        <p>
                            OCR stands for Optical Character Recognition. OCR is
                            a software tool that can extract print text from
                            some documents.
                        </p>

                        <h6>When will OCR work well?</h6>
                        <p>
                            OCR does not work on handwriting. It only works for
                            printed or typed text, meaning text created by a
                            typewriter, printing press or other mechanical
                            means. OCR will do best on consistent and clear
                            images of modern typefaces.
                        </p>

                        <h6>
                            Do I still need to review pages started with OCR?
                        </h6>
                        <p>
                            Yes. OCR is imperfect. It may not work well for some
                            or all parts of a typed page, but it can be a great
                            starting point. If you start a page with OCR you
                            should read the text closely before submitting. If
                            you are reviewing an OCR-ed page you still need to
                            review.
                        </p>

                        <h6>Who can use "Transcribe with OCR"?</h6>
                        <p>
                            <a href="/account/register/">
                                Register for an account
                            </a>{' '}
                            and <a href="/account/login/">log in</a> to use this
                            feature.
                        </p>

                        <h6>
                            Why does{' '}
                            <span className="fst-italic">By the People</span>{' '}
                            have this feature?
                        </h6>
                        <p>
                            We always want to use volunteer time effectively.
                            When the Library of Congress digitizes a large group
                            of printed pages it will usually OCR them. The
                            materials in By the People campaigns are not good
                            candidates for applying OCR at scale either because
                            they are handwritten, a mixed collection of
                            handwritten and print materials or printed on paper
                            or in a typeface that does not produce accurate OCR
                            results. However, OCR can still be a useful starting
                            point for some typed pages. Use it if you like it or
                            skip it if you do not.
                        </p>
                    </div>
                    <div className="modal-footer justify-content-center">
                        <button
                            type="button"
                            className="btn btn-primary"
                            data-bs-dismiss="modal"
                        >
                            Close
                        </button>
                    </div>
                </div>
            </div>
        </div>
    );
}


================================================
FILE: frontend/src/ocr/LanguageModal.jsx
================================================
import React, {useState} from 'react';
import Modal from 'react-bootstrap/Modal';
import Button from 'react-bootstrap/Button';

/**
 * Language picker modal for OCR.
 *
 * Behavior:
 * - Presents a scrollable list of languages from `languages`.
 * - Calls `onSubmit({ language, supersedes })` when the user confirms.
 *
 * Accessibility:
 * - Uses react-bootstrap Modal roles. The select has an associated label.
 *
 * Props:
 * @param {boolean} show
 *   Whether the modal is visible.
 * @param {function} onClose
 *   Called to dismiss the modal.
 * @param {function} onSubmit
 *   Called on confirmation. Receives `{ language, supersedes }`.
 * @param {Array<[string,string]>} languages
 *   Array of `[code, label]` tuples, e.g. `[["eng","English"], ...]`.
 * @param {string} [supersedes]
 *   Transcription id that the OCR result will supersede.
 * @param {string} [selectedLang]
 *   Controlled selected language code.
 * @param {function} [onChange]
 *   Controlled change handler: `onChange(code)`.
 * @param {boolean} [disabled]
 *   Disable the confirm button while submitting.
 * @param {string|null} [error]
 *   Optional error message to display.
 *
 * Usage:
 * <OcrLanguageModal
 *   show={show}
 *   languages={languages}
 *   selectedLang={selectedLang}
 *   onChange={setSelectedLang}
 *   onClose={handleClose}
 *   onSubmit={handleSubmit}
 *   disabled={isSubmitting}
 *   error={error}
 * />
 */
export default function OcrLanguageModal({
    show,
    onClose,
    onSubmit,
    languages,
    supersedes,
    selectedLang,
    onChange,
    disabled = false,
    error = null,
}) {
    // Uncontrolled fallback state
    const [localLang, setLocalLang] = useState(() => {
        const eng = languages.find(([code]) => code === 'eng')?.[0];
        return eng || languages[0]?.[0] || '';
    });

    const isControlled =
        typeof selectedLang === 'string' && typeof onChange === 'function';
    const value = isControlled ? selectedLang : localLang;

    const handleChange = (e) => {
        const code = e.target.value;
        if (isControlled) {
            onChange(code);
        } else {
            setLocalLang(code);
        }
    };

    const handleSubmit = () => {
        if (!value) return;
        onSubmit({language: value, supersedes});
    };

    return (
        <Modal show={show} onHide={onClose} centered>
            <Modal.Header closeButton />
            <Modal.Body>
                <div className="bg-light p-3">
                    <h5 className="modal-title mb-3">Select language</h5>
                    <p>
                        Select the language of the transcription from the list
                        below.
                    </p>

                    {error && (
                        <div className="alert alert-danger" role="alert">
                            {error}
                        </div>
                    )}

                    <div className="text-center pb-1">
                        <label htmlFor="language" className="form-label">
                            Language
                        </label>
                        <select
                            id="language"
                            name="language"
                            size={7}
                            className="form-select"
                            value={value}
                            onChange={handleChange}
                            aria-label="Select OCR language"
                        >
                            {languages.map(([code, label]) => (
                                <option key={code} value={code}>
                                    {label}
                                </option>
                            ))}
                        </select>
                    </div>
                </div>
            </Modal.Body>
            <Modal.Footer>
                <Button variant="primary" onClick={onClose}>
                    Cancel
                </Button>
                <Button
                    className="underline-link fw-bold"
                    variant="link"
                    disabled={!value || disabled}
                    onClick={handleSubmit}
                >
                    Replace Text
                </Button>
            </Modal.Footer>
        </Modal>
    );
}


================================================
FILE: frontend/src/ocr/Section.jsx
================================================
/**
 * OCR section wrapper for the viewer column.
 *
 * Purpose:
 * - Hosts the OCR entrypoint UI.
 * - Forwards asset context and handlers to the OCR flow.
 *
 * Integration:
 * - Rendered by ViewerSplit alongside the image viewer.
 * - Delegates all OCR actions to OcrHandler.
 *
 * Usage:
 * <OcrSection
 *   assetId={asset.id}
 *   transcription={asset.transcription}
 *   onTranscriptionUpdate={handleTranscriptionUpdate}
 *   languages={asset.languages}
 * />
 */

import React from 'react';

import OcrHandler from './Handler';

/**
 * Lightweight container that places the OCR controls in the viewer column.
 *
 * Props:
 * @param {Object} props
 * @param {number} props.assetId
 *   The current asset id used by API calls.
 * @param {{ id?: number, text?: string } | null} props.transcription
 *   The current transcription object or null if none exists.
 * @param {function(Object):void} props.onTranscriptionUpdate
 *   Callback invoked with the API response after OCR creates a transcription.
 * @param {Array<[string,string]>} props.languages
 *   Array of [code, label] language tuples for OCR selection.
 *
 * Returns:
 * @returns {JSX.Element}
 */
export default function OcrSection({
    assetId,
    transcription,
    onTranscriptionUpdate,
    languages,
}) {
    return (
        <div id="ocr-section" className="row ps-3 pb-4 bg-white print-none">
            <div className="d-flex flex-row align-items-center justify-content-end mt-1">
                <OcrHandler
                    assetId={assetId}
                    transcription={transcription}
                    onTranscriptionUpdate={onTranscriptionUpdate}
                    languages={languages}
                />
            </div>
        </div>
    );
}


================================================
FILE: frontend/src/viewer/Controls.jsx
================================================
/**
 * Viewer toolbar with layout, zoom, rotate, flip, filters, help and fullscreen.
 *
 * Purpose:
 * - Provide a consistent control strip for the image viewer.
 * - Emit layout events to the parent container.
 * - Expose stable button ids so external code can bind OpenSeadragon actions.
 *
 * Integration:
 * - The parent supplies handlers for layout changes and fullscreen:
 *   onLayoutHorizontal, onLayoutVertical, toggleFullscreen.
 * - Other buttons are bound by id at runtime by OpenSeadragon:
 *   #viewer-home, #viewer-zoom-in, #viewer-zoom-out,
 *   #viewer-rotate-left, #viewer-rotate-right, #viewer-flip.
 * - Bootstrap attributes handle the filters collapse and keyboard help modal.
 *
 * Accessibility:
 * - Buttons include title text. Icons add aria-label where needed.
 *
 * Usage:
 * <ViewerControls
 *   onLayoutHorizontal={() => setLayout('h')}
 *   onLayoutVertical={() => setLayout('v')}
 *   toggleFullscreen={handleFullscreen}
 * />
 */

import React from 'react';

/**
 * @param {Object} props
 * @param {function():void} props.onLayoutHorizontal
 *   Switch to horizontal layout.
 * @param {function():void} props.onLayoutVertical
 *   Switch to vertical layout.
 * @param {function():void} props.toggleFullscreen
 *   Enter or exit fullscreen mode for the viewer.
 * @returns {JSX.Element}
 */
export default function ViewerControls({
    onLayoutHorizontal,
    onLayoutVertical,
    toggleFullscreen,
}) {
    return (
        <div id="viewer-controls" className="m-1 text-center d-print-none">
            <div className="d-inline-flex justify-content-between">
                <div className="d-flex btn-group m-1">
                    <button
                        id="viewer-layout-vertical"
                        className="btn btn-dark viewer-control-button"
                        title="Vertical Layout"
                        onClick={onLayoutVertical}
                    >
                        <span className="fas fa-grip-lines"></span>
                    </button>
                    <button
                        id="viewer-layout-horizontal"
                        className="btn btn-dark"
                        title="Horizontal Layout"
                        onClick={onLayoutHorizontal}
                    >
                        <span className="fas fa-grip-lines-vertical"></span>
                    </button>
                </div>

                <div className="d-flex btn-group m-1">
                    <button
                        type="button"
                        id="viewer-home"
                        className="btn btn-dark viewer-control-button"
                        title="Fit Image to Viewport"
                    >
                        <span className="fas fa-compress"></span>
                    </button>
                </div>

                <div className="d-flex btn-group m-1">
                    <button
                        id="viewer-zoom-in"
                        className="btn btn-dark viewer-control-button"
                        title="Zoom In"
                    >
                        <span className="fas fa-search-plus"></span>
                    </button>
                    <button
                        id="viewer-zoom-out"
                        className="btn btn-dark"
                        title="Zoom Out"
                    >
                        <span className="fas fa-search-minus"></span>
                    </button>
                </div>

                <div className="d-flex btn-group m-1">
                    <button
                        id="viewer-rotate-left"
                        className="btn btn-dark viewer-control-button"
                        title="Rotate Left"
                    >
                        <span className="fas fa-undo"></span>
                    </button>
                    <button
                        id="viewer-rotate-right"
                        className="btn btn-dark viewer-control-button"
                        title="Rotate Right"
                    >
                        <span className="fas fa-redo"></span>
                    </button>
                </div>

                <div className="d-flex btn-group m-1">
                    <button
                        id="viewer-flip"
                        className="btn btn-dark viewer-control-button"
                        title="Flip"
                    >
                        <span className="fas fa-exchange-alt"></span>
                    </button>
                </div>

                <div className="d-flex btn-group m-1">
                    <button
                        type="button"
                        className="btn btn-dark extra-control-button"
                        title="Image Filters"
                        data-bs-toggle="collapse"
                        data-bs-target="#image-filters"
                    >
                        <span
                            className="fas fa-sliders-h"
                            aria-label="Image Filters"
                        ></span>
                    </button>
                </div>

                <div className="d-flex btn-group m-1">
                    <button
                        type="button"
                        id="viewer-fullscreen"
                        className="btn btn-dark extra-control-button"
                        title="View Full Screen"
                        onClick={toggleFullscreen}
                    >
                        <span className="fas fa-expand"></span>
                    </button>
                </div>

                <div className="d-flex btn-group m-1">
                    <button
                        type="button"
                        className="btn btn-dark extra-control-button"
                        title="Viewer keyboard shortcuts"
                        data-bs-toggle="modal"
                        data-bs-target="#keyboard-help-modal"
                    >
                        <span
                            className="fas fa-question-circle"
                            aria-label="Viewer keyboard shortcuts"
                        ></span>
                    </button>
                </div>
            </div>
        </div>
    );
}


================================================
FILE: frontend/src/viewer/FilterTabNav.jsx
================================================
/**
 * Tab navigation for image filters: Brightness, Invert, Contrast.
 *
 * Purpose:
 * - Provide three Bootstrap tab buttons that toggle filter panes.
 * - Expose stable button ids for external binding:
 *   #viewer-gamma, #viewer-invert, #viewer-threshold.
 *
 * Integration:
 * - Buttons use data-bs-toggle="tab" and data-bs-target to switch panes:
 *   #gamma-filter, #invert-filter, #threshold-filter.
 * - Parent markup must include a .tab-content with matching pane ids.
 *
 * Accessibility:
 * - role="tablist" on the <ul>, role="presentation" on list items, role="tab" on
 *   buttons.
 * - The first tab is marked active by default.
 *
 * Usage:
 * <FilterTabNav />
 */

/**
 * @returns {JSX.Element}
 */
export default function FilterTabNav() {
    return (
        <ul
            className="d-inline-flex mt-1 btn-group nav nav-tabs"
            role="tablist"
        >
            <li className="nav-item" role="presentation">
                <button
                    id="viewer-gamma"
                    className="btn btn-dark nav-link active"
                    title="Adjust gamma"
                    data-bs-toggle="tab"
                    data-bs-target="#gamma-filter"
                    role="tab"
                >
                    Brightness
                </button>
            </li>
            <li className="nav-item" role="presentation">
                <button
                    id="viewer-invert"
                    className="btn btn-dark nav-link"
                    title="Invert colors"
                    data-bs-toggle="tab"
                    data-bs-target="#invert-filter"
                    role="tab"
                >
                    Invert
                </button>
            </li>
            <li className="nav-item" role="presentation">
                <button
                    id="viewer-threshold"
                    className="btn btn-dark nav-link"
                    title="Adjust threshold"
                    data-bs-toggle="tab"
                    data-bs-target="#threshold-filter"
                    role="tab"
                >
                    Contrast
                </button>
            </li>
        </ul>
    );
}


================================================
FILE: frontend/src/viewer/GammaFilterForm.jsx
================================================
/**
 * Gamma filter controls for the viewer.
 *
 * Purpose:
 * - Provide synchronized number and range inputs to adjust gamma.
 * - Offer step up/down buttons and a Reset filter control.
 *
 * Behavior:
 * - Value is clamped to [0, 5] and rounded to two decimals.
 * - onSubmit is prevented; onReset sets gamma to 1.0.
 * - Exposed ids for external hooks:
 *   #gamma-filter, #gamma-form, #gamma, #gamma-range, #gamma-up, #gamma-down.
 *
 * Accessibility:
 * - Visually hidden labels for inputs.
 * - Buttons include hidden Increase and Decrease text.
 *
 * Props:
 * @param {number} gamma - Current gamma value.
 * @param {(value:number)=>void} setGamma - Setter invoked on change.
 * @returns {JSX.Element}
 */
export default function GammaFilterForm({gamma, setGamma}) {
    const handleNumberChange = (e) => {
        const value = parseFloat(e.target.value);
        if (!isNaN(value)) setGamma(value);
    };

    const handleRangeChange = (e) => {
        const value = parseFloat(e.target.value);
        if (!isNaN(value)) setGamma(value);
    };

    const stepUp = () => {
        const newValue = Math.min(5, gamma + 0.01);
        setGamma(parseFloat(newValue.toFixed(2)));
    };

    const stepDown = () => {
        const newValue = Math.max(0, gamma - 0.01);
        setGamma(parseFloat(newValue.toFixed(2)));
    };

    const handleReset = () => {
        setGamma(1.0);
    };

    return (
        <div
            id="gamma-filter"
            className="tab-pane pt-1 ps-3 show active"
            role="tabpanel"
        >
            <form
                id="gamma-form"
                className="d-flex align-items-center"
                onSubmit={(e) => e.preventDefault()}
                onReset={handleReset}
            >
                <div className="row ms-0 me-3 number-input">
                    <div className="col p-1">
                        <input
                            type="number"
                            id="gamma"
                            name="gamma"
                            min="0"
                            max="5"
                            step="0.01"
                            value={gamma}
                            onChange={handleNumberChange}
                        />
                        <label className="visually-hidden" htmlFor="gamma">
                            Gamma
                        </label>
                    </div>
                    <div className="col p-0 filter-buttons">
                        <div className="row m-0">
                            <button
                                id="gamma-up"
                                type="button"
                                className="arrow-button"
                                onClick={stepUp}
                            >
                                <span className="fas fa-chevron-up" />
                                <span className="visually-hidden">
                                    Increase
                                </span>
                            </button>
                        </div>
                        <div className="row m-0">
                            <button
                                id="gamma-down"
                                type="button"
                                className="arrow-button"
                                onClick={stepDown}
                            >
                                <span className="fas fa-chevron-down" />
                                <span className="visually-hidden">
                                    Decrease
                                </span>
                            </button>
                        </div>
                    </div>
                </div>
                <input
                    type="range"
                    id="gamma-range"
                    name="gamma-range"
                    min="0"
                    max="5"
                    step="0.01"
                    value={gamma}
                    onChange={handleRangeChange}
                    className="filter-slider flex-grow-1"
                />
                <label className="visually-hidden" htmlFor="gamma-range">
                    Gamma
                </label>
                <input
                    type="reset"
                    className="btn btn-link underline-link fw-bold"
                    value="Reset filter"
                />
            </form>
        </div>
    );
}


================================================
FILE: frontend/src/viewer/ImageFilters.jsx
================================================
/**
 * UI for per-viewer image filters backed by OpenSeadragon. Exposes gamma,
 * invert and threshold controls, and applies them to the active viewer via
 * `setFilterOptions`. Updates are debounced to reduce reflow and redraw churn.
 *
 * Dependencies: OpenSeadragon Filters, lodash.debounce, Bootstrap.
 *
 * Behavior:
 * - Builds a processors array from the current control values and sends it to
 *   the viewer with `setFilterOptions({ filters: { processors } })`.
 * - Debounces updates by 100ms.
 * - Resets all filters to defaults with the "Reset All" button.
 *
 * Side effects:
 * - Reads `filterPluginRef.current` and calls `setFilterOptions` if present.
 * - Cancels the debounced updater on unmount or dependency change.
 */

import {useState, useEffect} from 'react';
import OpenSeadragon from 'openseadragon';
import {GAMMA, INVERT, THRESHOLDING} from 'openseadragon-filters';
import debounce from 'lodash.debounce';

import FilterTabNav from './FilterTabNav';
import GammaFilterForm from './GammaFilterForm';
import InvertFilterForm from './InvertFilterForm';
import ThresholdFilterForm from './ThresholdFilterForm';

/**
 * ImageFilters
 *
 * Controls gamma, invert and threshold, and pushes changes to an
 * OpenSeadragon viewer instance.
 *
 * @component
 * @param {Object} props
 * @param {React.MutableRefObject<OpenSeadragon.Viewer|null>} props.osdViewerRef
 *   A ref to the active OpenSeadragon viewer. Must expose `setFilterOptions`.
 *
 * @example
 *   <ImageFilters filterPluginRef={viewerRef} />
 */
export default function ImageFilters({filterPluginRef}) {
    const [gamma, setGamma] = useState(1.0);
    const [invert, setInvert] = useState(false);
    const [threshold, setThreshold] = useState(0);

    // Debounced bridge to OSD filter pipeline
    const updateFilters = debounce(() => {
        // Get the plugin instance from the ref
        const plugin = filterPluginRef.current;
        if (!plugin) return;

        const processors = [];

        if (gamma !== 1 && gamma >= 0 && gamma <= 5) {
            processors.push(GAMMA(gamma));
        }
        if (invert) {
            processors.push(INVERT());
        }
        if (threshold > 0 && threshold <= 255) {
            processors.push(THRESHOLDING(threshold));
        }

        //Call setFilterOptions on the PLUGIN
        plugin.setFilterOptions({
            filters: {processors},
        });
    }, 100);

    // Apply filters when any control changes
    useEffect(() => {
        updateFilters();
        return updateFilters.cancel; // cleanup debounce
    }, [gamma, invert, threshold]); // eslint-disable-line react-hooks/exhaustive-deps

    const handleReset = () => {
        setGamma(1.0);
        setInvert(false);
        setThreshold(0);
    };

    return (
        <div
            id="image-filters"
            className="m-1 text-center d-print-none collapse"
        >
            <hr className="m-0" />
            <FilterTabNav />
            <div className="btn-group m-1">
                <button
                    id="viewer-reset"
                    className="btn"
                    title="Reset all filters"
                    onClick={handleReset}
                >
                    Reset All
                </button>
            </div>
            <div id="filter-tabs" className="tab-content">
                <GammaFilterForm gamma={gamma} setGamma={setGamma} />
                <InvertFilterForm invert={invert} setInvert={setInvert} />
                <ThresholdFilterForm
                    threshold={threshold}
                    setThreshold={setThreshold}
                />
            </div>
        </div>
    );
}


================================================
FILE: frontend/src/viewer/InvertFilterForm.jsx
================================================
/**
 * InvertFilterForm
 *
 * Simple on/off control for an invert color filter. Parent manages state and
 * passes the current value plus a setter.
 *
 * @component
 * @param {Object} props
 * @param {boolean} props.invert - Current invert state
 * @param {(value: boolean) => void} props.setInvert - Setter for invert state
 */
export default function InvertFilterForm({invert, setInvert}) {
    const handleChange = (e) => {
        setInvert(e.target.checked);
    };

    const handleReset = () => {
        setInvert(false);
    };

    return (
        <div
            id="invert-filter"
            className="tab-pane pt-2"
            role="tabpanel"
            style={{backgroundColor: 'white'}}
        >
            <form
                id="invert-form"
                onSubmit={(e) => e.preventDefault()}
                onReset={handleReset}
                className="d-flex justify-content-center"
            >
                <label className="ms-2 align-middle">Off</label>
                <div className="form-check form-switch custom-control-inline">
                    <input
                        type="checkbox"
                        id="invert"
                        name="invert"
                        className="form-check-input"
                        role="switch"
                        checked={invert}
                        onChange={handleChange}
                    />
                    <label className="form-check-label" htmlFor="invert">
                        <span className="visually-hidden">Invert</span>
                    </label>
                </div>
                <label className="align-middle">On</label>
            </form>
        </div>
    );
}


================================================
FILE: frontend/src/viewer/KeyboardHelpModal.jsx
================================================
import KeyboardShortcutRow from './KeyboardShortcutRow';

/*
KeyboardHelpModal

Bootstrap modal that lists viewer keyboard shortcuts. Rows are rendered
with KeyboardShortcutRow.

Usage:
- Trigger with data-bs-target="#keyboard-help-modal"
- Presentational only

Accessibility:
- Uses role="dialog" and Bootstrap aria attributes
- Close button has aria-label
*/
export default function KeyboardHelpModal() {
    return (
        <div
            id="keyboard-help-modal"
            className="modal"
            tabIndex={-1}
            role="dialog"
        >
            <div className="modal-dialog modal-dialog-centered" role="document">
                <div className="modal-content">
                    <div className="modal-header">
                        <h5 className="modal-title">Keyboard Shortcuts</h5>
                        <button
                            type="button"
                            className="btn-close"
                            data-bs-dismiss="modal"
                            aria-label="Close"
                        ></button>
                    </div>
                    <div className="modal-body">
                        <h6>Viewer Shortcuts</h6>
                        <table className="table table-compact table-responsive">
                            <tbody>
                                <KeyboardShortcutRow
                                    keys={[
                                        {text: 'w', wrap: true},
                                        {text: 'up arrow', wrap: false},
                                    ]}
                                    description="Scroll the viewport up"
                                />
                                <KeyboardShortcutRow
                                    keys={[
                                        {text: 's', wrap: true},
                                        {text: 'down arrow', wrap: false},
                                    ]}
                                    description="Scroll the viewport down"
                                />
                                <KeyboardShortcutRow
                                    keys={[
                                        {text: 'a', wrap: true},
                                        {text: 'left arrow', wrap: false},
                                    ]}
                                    description="Scroll the viewport left"
                                />
                                <KeyboardShortcutRow
                                    keys={[
                                        {text: 'd', wrap: true},
                                        {text: 'right arrow', wrap: false},
                                    ]}
                                    description="Scroll the viewport right"
                                />
                                <KeyboardShortcutRow
                                    keys={[{text: '0', wrap: true}]}
                                    description="Fit the entire image to the viewport"
                                />
                                <KeyboardShortcutRow
                                    keys={[
                                        {text: '-', wrap: true},
                                        {text: '_', wrap: true},
                                        {text: 'Shift+W', wrap: false},
                                        {text: 'Shift+Up arrow', wrap: false},
                                    ]}
                                    description="Zoom the viewport out"
                                />
                                <KeyboardShortcutRow
                                    keys={[
                                        {text: '=', wrap: true},
                                        {text: '+', wrap: true},
                                        {text: 'Shift+S', wrap: false},
                                        {text: 'Shift+Down arrow', wrap: false},
                                    ]}
                                    description="Zoom the viewport in"
                                />
                                <KeyboardShortcutRow
                                    keys={[{text: 'r', wrap: true}]}
                                    description="Rotate the viewport clockwise"
                                />
                                <KeyboardShortcutRow
                                    keys={[{text: 'R', wrap: true}]}
                                    description="Rotate the viewport counterclockwise"
                                />
                                <KeyboardShortcutRow
                                    keys={[{text: 'f', wrap: true}]}
                                    description="Flip the viewport horizontally"
                                />
                            </tbody>
                        </table>
                    </div>
                    <div className="modal-footer">
                        <button
                            type="button"
                            className="btn btn-primary"
                            data-bs-dismiss="modal"
                        >
                            Close
                        </button>
                    </div>
                </div>
            </div>
        </div>
    );
}


================================================
FILE: frontend/src/viewer/KeyboardShortcutRow.jsx
================================================
import React from 'react';

/**
 * KeyboardShortcutRow
 *
 * Renders one table row for a keyboard shortcut. Shows the key sequence in a
 * row header cell and the action description in an adjacent cell.
 *
 * Rendering:
 * - Keys are comma separated with a space
 * - Keys are placed in a <th>, description in a <td>
 *
 * Accessibility:
 * - <kbd> provides semantic markup for key names
 * - Consumers should ensure the surrounding table has proper headers or caption
 *
 * @param {Array<{text: string, wrap: boolean}>} keys - Ordered keys to display.
 *   When wrap is true the key is wrapped in <kbd>, otherwise rendered as plain
 *   text.
 * @param {string} description - Human readable description of the shortcut
 *   action.
 * @returns {JSX.Element}
 */
export default function KeyboardShortcutRow({keys, description}) {
    return (
        <tr>
            <th>
                {keys.map((key, i) => (
                    <React.Fragment key={i}>
                        {key.wrap ? <kbd>{key.text}</kbd> : key.text}
                        {i < keys.length - 1 && ', '}
                    </React.Fragment>
                ))}
            </th>
            <td>{description}</td>
        </tr>
    );
}


================================================
FILE: frontend/src/viewer/ThresholdFilterForm.jsx
================================================
/**
 * Controls the binarization threshold used by the image viewer filter.
 *
 * Behavior:
 * - Number input and range slider stay in sync.
 * - Up and down arrow buttons change the value by 1 within 0-255.
 * - Reset sets the threshold to 0.
 *
 * Accessibility:
 * - Inputs have associated labels with visually hidden text.
 * - Increment and decrement buttons include hidden text for screen readers.
 *
 * @param {number} threshold - Current threshold value in the range 0-255.
 * @param {Function} setThreshold - Setter to update the threshold.
 * @returns {JSX.Element}
 */
export default function ThresholdFilterForm({threshold, setThreshold}) {
    const handleNumberChange = (e) => {
        setThreshold(parseInt(e.target.value, 10));
    };

    const handleRangeChange = (e) => {
        setThreshold(parseInt(e.target.value, 10));
    };

    const handleReset = () => {
        setThreshold(0);
    };

    const stepUp = () => {
        setThreshold((prev) => Math.min(prev + 1, 255));
    };

    const stepDown = () => {
        setThreshold((prev) => Math.max(prev - 1, 0));
    };

    return (
        <div
            id="threshold-filter"
            className="tab-pane pt-1 ps-3"
            role="tabpanel"
        >
            <form
                id="threshold-form"
                className="d-flex align-items-center"
                onSubmit={(e) => e.preventDefault()}
                onReset={handleReset}
            >
                <div className="row ms-0 me-3 number-input">
                    <div className="col p-1">
                        <input
                            type="number"
                            id="threshold"
                            name="threshold"
                            min="0"
                            max="255"
                            step="1"
                            value={threshold}
                            onChange={handleNumberChange}
                        />
                        <label className="visually-hidden" htmlFor="threshold">
                            Threshold
                        </label>
                    </div>
                    <div className="col p-0 filter-buttons">
                        <div className="row m-0">
                            <button
                                id="threshold-up"
                                type="button"
                                className="arrow-button"
                                onClick={stepUp}
                            >
                                <span className="fas fa-chevron-up" />
                                <span className="visually-hidden">
                                    Increase
                                </span>
                            </button>
                        </div>
                        <div className="row m-0">
                            <button
                                id="threshold-down"
                                type="button"
                                className="arrow-button"
                                onClick={stepDown}
                            >
                                <span className="fas fa-chevron-down" />
                                <span className="visually-hidden">
                                    Decrease
                                </span>
                            </button>
                        </div>
                    </div>
                </div>
                <input
                    type="range"
                    id="threshold-range"
                    name="threshold-range"
                    min="0"
                    max="255"
                    step="1"
                    value={threshold}
                    onChange={handleRangeChange}
                    className="filter-slider flex-grow-1"
                />
                <label className="visually-hidden" htmlFor="threshold-range">
                    Threshold
                </label>
                <input
                    type="reset"
                    className="btn btn-link underline-link fw-bold"
                    value="Reset filter"
                />
            </form>
        </div>
    );
}


================================================
FILE: frontend/src/viewer/Viewer.jsx
================================================
import React, {useEffect, useRef, useState} from 'react';
import OpenSeadragon from 'openseadragon';
import {initializeFiltering} from 'openseadragon-filters';
import screenfull from 'screenfull';

import {prefixUrl, contactUrl} from '../config.js';
import ViewerControls from './Controls';
import ImageFilters from './ImageFilters';
import KeyboardHelpModal from './KeyboardHelpModal';

/**
 * Viewer
 *
 * Mounts an OpenSeadragon instance, wires up UI controls and filter panels,
 * and exposes a fullscreen toggle. Cleans up the viewer on unmount.
 *
 * Behavior:
 * - Initializes OpenSeadragon with filtering support and common UI buttons
 * - On "open" event, recenters via viewport.goHome(true)
 * - On "open-failed", logs an error and shows an alert with a contact URL
 * - Stores the live OSD instance on window.seadragonViewer for external use
 * - Destroys the OSD instance during cleanup to avoid leaks
 *
 * Dependencies:
 * - Requires the "openseadragon-filters" plugin to be imported once
 * - Uses the "screenfull" library for fullscreen where available
 *
 * @param {string} imageUrl - Source image URL used by OpenSeadragon.
 * @param {Function} onLayoutHorizontal - Callback to switch to horizontal layout.
 * @param {Function} onLayoutVertical - Callback to switch to vertical layout.
 * @returns {JSX.Element}
 */
export default function Viewer({
    imageUrl,
    onLayoutHorizontal,
    onLayoutVertical,
}) {
    const viewerRef = useRef(null); // For OSD
    const containerRef = useRef(null); // For Fullscreen wrapper
    const osdViewerRef = useRef(null);
    const filterPluginRef = useRef(null);

    // State to track fullscreen changes
    const [isFullscreen, setIsFullscreen] = useState(false);

    // Add listener for fullscreen changes
    useEffect(() => {
        const handler = () => {
            setIsFullscreen(screenfull.isFullscreen);
        };

        if (screenfull.isEnabled) {
            screenfull.on('change', handler);
        }

        return () => {
            if (screenfull.isEnabled) {
                screenfull.off('change', handler);
            }
        };
    }, []);

    useEffect(() => {
        if (!viewerRef.current || !imageUrl) return;

        osdViewerRef.current = OpenSeadragon({
            element: viewerRef.current,
            prefixUrl: prefixUrl,
            tileSources: {
                type: 'image',
                url: `${imageUrl}?canvas`,
            },
            gestureSettingsTouch: {
                pinchRotate: true,
            },
            showNavigator: true,
            showRotationControl: true,
            showFlipControl: true,
            zoomInButton: 'viewer-zoom-in',
            zoomOutButton: 'viewer-zoom-out',
            homeButton: 'viewer-home',
            rotateLeftButton: 'viewer-rotate-left',
            rotateRightButton: 'viewer-rotate-right',
            flipButton: 'viewer-flip',
            crossOriginPolicy: 'Anonymous',
            drawer: 'canvas',
            defaultZoomLevel: 0,
            homeFillsView: false,
        });

        window.seadragonViewer = osdViewerRef.current;

        osdViewerRef.current.addHandler('open', () => {
            setTimeout(() => {
                osdViewerRef.current.viewport.goHome(true);
            }, 0);
        });

        osdViewerRef.current.addHandler('open-failed', () => {
            console.error('Unable to display image');
            alert(`Unable to display image. Contact us at ${contactUrl}`);
        });

        // Initialize the plugin instance - filtering using the ESM method
        filterPluginRef.current = initializeFiltering(osdViewerRef.current);

        return () => {
            if (osdViewerRef.current) {
                osdViewerRef.current.destroy();
                osdViewerRef.current = null;
            }
            // Clear the plugin ref on unmount
            filterPluginRef.current = null;
        };
    }, [imageUrl]);

    const toggleFullscreen = (e) => {
        e.preventDefault();
        if (!screenfull.isEnabled) return;
        if (screenfull.isFullscreen) {
            screenfull.exit();
        } else {
            // Request fullscreen on the wrapper, not just the image
            screenfull.request(containerRef.current);
        }
    };

    return (
        <div
            ref={containerRef}
            className={`d-flex flex-column h-100 w-100 ${
                isFullscreen ? 'is-fullscreen' : ''
            }`}
            style={isFullscreen ? {backgroundColor: '#212529'} : {}}
        >
            <ViewerControls
                onLayoutHorizontal={onLayoutHorizontal}
                onLayoutVertical={onLayoutVertical}
                toggleFullscreen={toggleFullscreen}
            />
            <ImageFilters filterPluginRef={filterPluginRef} />
            <KeyboardHelpModal />
            <div
                id="asset-image"
                ref={viewerRef}
                className="flex-grow-1 bg-dark d-print-none w-100"
            ></div>
        </div>
    );
}


================================================
FILE: frontend/vite.config.js
================================================
import {defineConfig} from 'vite';
import react from '@vitejs/plugin-react';
import {viteStaticCopy} from 'vite-plugin-static-copy';

// OpenSeadragon's bundled UI images, copied into the build output.
const openSeadragonImages = {
    src: 'node_modules/openseadragon/build/openseadragon/images/*',
    dest: 'openseadragon-images',
};

/**
 * Choose the output path pattern for an emitted asset: stylesheets go under
 * css/, everything else (including assets without a name) under assets/.
 */
function assetFileNames({name}) {
    const isStylesheet = Boolean(name) && name.endsWith('.css');
    return isStylesheet ? 'css/[name][extname]' : 'assets/[name][extname]';
}

// Un-hashed, predictable file names for entries, chunks and assets.
const rollupOutput = {
    entryFileNames: 'js/[name].js',
    chunkFileNames: 'js/[name].js',
    assetFileNames,
};

export default defineConfig({
    base: '/static/frontend/',
    plugins: [react(), viteStaticCopy({targets: [openSeadragonImages]})],
    build: {
        outDir: '../static/frontend',
        minify: false,
        emptyOutDir: true,
        rollupOptions: {output: rollupOutput},
    },
});


================================================
FILE: importer/Dockerfile
================================================
# Image for the importer's Celery worker (see importer/entrypoint.sh, run by CMD).
FROM python:3.12-slim-bookworm

## Add the wait script to the image
# CMD below runs /wait before handing over to the entrypoint script.
# NOTE(review): the download is pinned to release 2.2.1 but carries no checksum.
ADD https://github.com/ufoscout/docker-compose-wait/releases/download/2.2.1/wait /wait
RUN chmod +x /wait

ENV DEBIAN_FRONTEND="noninteractive"

# curl is needed by the certificate download in the next RUN step.
RUN apt-get update -qy && apt-get install -qy curl

# Ensure that the Library's certificate authority is trusted so the tampering
# proxy will not break TLS validation. See
# https://staff.loc.gov/wikis/display/SE/Configuring+HTTPS+clients+for+the+HTTPS+tampering+proxy.
# The certificate is fetched in DER form, converted to PEM, and c_rehash is run
# afterwards.
# NOTE(review): the CA certificate is retrieved over plain HTTP - confirm this
# is acceptable for the build environment.

RUN curl -fso /etc/ssl/certs/LOC-ROOT-CA-1.crt http://crl.loc.gov/LOC-ROOT-CA-1.crt && openssl x509 -inform der -in /etc/ssl/certs/LOC-ROOT-CA-1.crt -outform pem -out /etc/ssl/certs/LOC-ROOT-CA-1.pem && c_rehash

# Upgrade the base system and install the build/runtime libraries listed below,
# then drop packages that are no longer required.
RUN apt-get update -qy && apt-get dist-upgrade -qy && apt-get install -o Dpkg::Options::='--force-confnew' -qy \
    git \
    libmemcached-dev \
    # Pillow/Imaging: https://pillow.readthedocs.io/en/latest/installation.html#external-libraries
    libz-dev libfreetype6-dev \
    libtiff-dev libjpeg-dev libopenjp2-7-dev libwebp-dev zlib1g-dev \
    # Postgres client library to build psycopg
    libpq-dev \
    locales \
    # Weasyprint requirements
    libpango-1.0-0 libharfbuzz0b libpangoft2-1.0-0 \
    gcc && apt-get -qy autoremove && apt-get -qy autoclean

# Generate and select the en_US.UTF-8 locale for everything that runs in the image.
RUN locale-gen en_US.UTF-8
ENV LC_ALL=en_US.UTF-8
ENV LANG=en_US.UTF-8
ENV LANGUAGE=en_US.UTF-8

# Unbuffered Python output; /app (the WORKDIR below) is put on the import path.
ENV PYTHONUNBUFFERED=1 \
    PYTHONPATH=/app

# Defaults the settings module to concordia.settings_docker.
# NOTE(review): Dockerfile variable substitution is resolved at build time, so
# this presumably always yields the default unless an earlier ARG/ENV defines
# DJANGO_SETTINGS_MODULE - confirm that is the intent.
ENV DJANGO_SETTINGS_MODULE=${DJANGO_SETTINGS_MODULE:-concordia.settings_docker}

RUN pip install --upgrade pip
RUN pip install --no-cache-dir pipenv

# The whole build context is copied, so it must contain the Pipfile used below.
WORKDIR /app
COPY . /app

# Install into the system interpreter (no virtualenv); --dev also pulls in the
# development packages and --deploy is passed to pipenv as well.
RUN pipenv install --system --dev --deploy && rm -rf ~/.cache/

# Shell-form CMD: run the wait script first, then the importer entrypoint.
CMD /wait && ./importer/entrypoint.sh


================================================
FILE: importer/README.md
================================================
# Importer

This is a Django app which uses Celery to download images from a
collection on loc.gov. It also uploads those images to an S3 bucket.

## Prerequisites

1. If uploading to an S3 bucket: the bucket has been created and your environment is configured for the awscli tool
1. If running in dev mode, HTTP access to tile-dev.loc.gov and dev.loc.gov

## Usage

1. Start the Python shell:

    ```bash
    $ docker-compose up
    $ docker exec -it concordia_importer_1 bash
    root@62e3ebef4de2:/app# python3 ./manage.py shell
    ```

1. Run some test imports:

    ```Python console
    Python 3.6.5rc1 (default, Mar 14 2018, 06:54:23) [GCC 7.3.0] on linux
    Type "help", "copyright", "credits" or "license" for more information.
    >>> from importer.importer.tasks import download_async_campaign, check_completeness
    >>> result = download_async_campaign.delay("https://www.loc.gov/collections/clara-barton-papers/?fa=partof:clara+barton+papers:++diaries+and+journals,+1849-1911")
    >>> result.ready()
    >>> result.get()
    >>> result2 = check_completeness.delay()
    >>> result2.ready()
    >>> result2.get()
    ```

To count the files and check disk usage in `/concordia_images` after download is
complete:

```console
$ docker exec -it concordia_app_1 bash
$ find /concordia_images -type f | wc -l
$ df -kh
```

## Integration

After the images have been downloaded in the docker environment:

1. Copy the images from the docker volume to the running docker app container.

    ```bash
    $ ubuntu@ip-172-31-94-65:~/concordia$ sudo docker exec -it concordia_app_1 bash
    $ root@6eca4f3cd16d:/app# cp -R /concordia_images/mss* concordia/static/img/
    ```

1. Run the migrations in the docker app to load the Clara Barton Diaries and
   Branch Rickey collections into Concordia.

    ```bash
    $ root@6eca4f3cd16d:/app# python3 ./manage.py migrate
    ```


================================================
FILE: importer/__init__.py
================================================
"""
Design
======

The importer currently only supports loading items from www.loc.gov.

General goals:

* All state is stored in the database and visible for reporting
* Celery tasks are ephemeral and while they may be configured to retry they will
  always check the database to avoid conflicts and use transactions to prevent
  race conditions

The import process works like this:

1. A user submits a request to import a URL. This can be an item page, a
   collection page, or an arbitrary search result set.
2. An ImportJob is created which records that request and a background Celery
   task is launched to determine what items it contains (this can potentially be
   well into the thousands)
3. For collection and search URLs (which share a common data format) the task
   loads the JSON representation and queues item import tasks for each item. For
   item URLs, the item import task is directly queued.
4. When the item import task runs it creates an ImportItem record, loads the
   item metadata, and creates ImportItem and ImportItemAsset records to track
   subsequent import work. It creates the Item and Asset records which will hold
   the actual item data as well because this allows review while a large import
   is in progress and our community managers quality review items before making
   them visible to the community. The asset import tasks are queued at the end
   of this step.
5. When the asset import task runs, it downloads the remote file and saves it in
   Concordia's working storage. Each asset is processed independently so
   completed downloads will not consume local storage until the [potentially
   very large] item has completely downloaded, which could potentially take
   hours or days if there are service availability issues requiring retries.
6. When all of the asset tasks are completed the item will be marked as
   completed.
7. When all of the item tasks are completed the job will be marked as completed.
"""


================================================
FILE: importer/admin.py
================================================
from django.contrib import admin, messages
from django.contrib.humanize.templatetags.humanize import naturaltime
from django.db.models import Count, F, Max, Q, QuerySet
from django.http import HttpRequest
from django.utils.translation import gettext_lazy as _

from concordia.admin.filters import (
    CampaignListFilter,
    CampaignProjectListFilter,
    NullableTimestampFilter,
)
from concordia.models import Campaign
from importer.tasks.assets import download_asset_task

from .models import (
    DownloadAssetImageJob,
    ImportItem,
    ImportItemAsset,
    ImportJob,
    VerifyAssetImageJob,
)


@admin.action(description="Retry import")
def retry_download_task(
    modeladmin: admin.ModelAdmin,
    request: HttpRequest,
    queryset: QuerySet[ImportItemAsset],
) -> None:
    """
    Admin action: re-queue the asset download task for every selected row.

    One `download_asset_task` is dispatched per selected primary key and an
    informational message reporting the number of queued tasks is attached
    to the request.

    Args:
        modeladmin (admin.ModelAdmin): Admin class invoking the action.
        request (HttpRequest): Current admin request.
        queryset (QuerySet[ImportItemAsset]): Selected ImportItemAsset rows.

    Returns:
        None
    """
    # Evaluate the selection once; the same list drives dispatch and the count.
    selected_pks = list(queryset.values_list("pk", flat=True))
    for asset_pk in selected_pks:
        download_asset_task.delay(asset_pk)

    summary = "Queued %d tasks" % len(selected_pks)
    messages.add_message(request, messages.INFO, summary)


class LastStartedFilter(NullableTimestampFilter):
    """Filter by whether a task has a 'last_started' timestamp."""

    # Heading and query-string parameter for this filter.
    title = "Last Started"
    parameter_name = "last_started"
    # Presumably (label for rows without a timestamp, label for rows with one);
    # the ordering contract lives in NullableTimestampFilter - confirm there.
    lookup_labels = ("Unstarted", "Started")


class CompletedFilter(NullableTimestampFilter):
    """Filter by whether a task has a 'completed' timestamp."""

    # Heading and query-string parameter for this filter.
    title = "Completed"
    parameter_name = "completed"
    # Presumably (label for rows without a timestamp, label for rows with one);
    # the ordering contract lives in NullableTimestampFilter - confirm there.
    lookup_labels = ("Incomplete", "Completed")


class FailedFilter(NullableTimestampFilter):
    """Filter by whether a task has a 'failed' timestamp."""

    # Heading and query-string parameter for this filter.
    title = "Failed"
    parameter_name = "failed"
    # Presumably (label for rows without a timestamp, label for rows with one);
    # the ordering contract lives in NullableTimestampFilter - confirm there.
    lookup_labels = ("Has not failed", "Has failed")


class ImportJobProjectListFilter(CampaignProjectListFilter):
    """Project filter for ImportJob rows."""

    # Lookup paths are relative to ImportJob, which references the project
    # directly. How each attribute is consumed is defined by
    # CampaignProjectListFilter (not shown here) - confirm there.
    parameter_name = "project__in"
    related_filter_parameter = "project__campaign__id__exact"
    project_ref = "project_id"


class ImportJobItemProjectListFilter(CampaignProjectListFilter):
    """Project filter for ImportItem rows (via job)."""

    # Same three settings as the ImportJob variant, with every lookup path
    # prefixed by "job__" because the project is reached through the job.
    parameter_name = "job__project__in"
    related_filter_parameter = "job__project__campaign__id__exact"
    project_ref = "job__project_id"


class ImportJobAssetProjectListFilter(CampaignProjectListFilter):
    """Project filter for ImportItemAsset rows (via job)."""

    # Same three settings as the ImportJob variant, with every lookup path
    # prefixed by "import_item__job__" because the project is reached through
    # the import item and its job.
    parameter_name = "import_item__job__project__in"
    related_filter_parameter = "import_item__job__project__campaign__id__exact"
    project_ref = "import_item__job__project_id"


class ImportCampaignListFilter(CampaignListFilter):
    """Campaign list filter whose choices leave out retired campaigns."""

    def lookups(
        self,
        request: HttpRequest,
        model_admin: admin.ModelAdmin,
    ) -> list[tuple[int | str, str]]:
        """
        Build the filter choices from every campaign that is not retired.

        Args:
            request (HttpRequest): Current admin request.
            model_admin (admin.ModelAdmin): Admin class in use.

        Returns:
            list[tuple[int | str, str]]: (id, title) pairs sorted by title.
        """
        active_campaigns = Campaign.objects.exclude(status=Campaign.Status.RETIRED)
        choices = active_campaigns.order_by("title").values_list("id", "title")
        return list(choices)


class ImportJobCampaignListFilter(ImportCampaignListFilter):
    """Campaign filter for ImportJob rows."""

    # Lookup paths from ImportJob to its campaign and the campaign's status.
    # How status_filter_parameter is used is defined by the CampaignListFilter
    # base class (not shown here) - confirm there.
    parameter_name = "project__campaign"
    status_filter_parameter = "project__campaign__status"


class ImportItemCampaignListFilter(ImportCampaignListFilter):
    """Campaign filter for ImportItem rows (via job)."""

    # Same settings as the ImportJob variant, prefixed with "job__" because the
    # campaign is reached through the item's job.
    parameter_name = "job__project__campaign"
    status_filter_parameter = "job__project__campaign__status"


class ImportItemAssetCampaignListFilter(ImportCampaignListFilter):
    """Campaign filter for ImportItemAsset rows (via job)."""

    # Same settings as the ImportJob variant, prefixed with
    # "import_item__job__" because the campaign is reached through the import
    # item and its job.
    parameter_name = "import_item__job__project__campaign"
    status_filter_parameter = "import_item__job__project__campaign__status"


class BatchFilter(admin.SimpleListFilter):
    """Compact batch filter showing recent/incomplete and last complete batches."""

    title = _("Batch")
    parameter_name = "batch"

    # Maximum number of incomplete batches listed, and the number of choices
    # that completed batches are used to pad up to.
    max_batches = 5

    @staticmethod
    def _fully_completed_batches(queryset: QuerySet) -> QuerySet:
        """
        Group rows by batch and keep batches in which every job is completed.

        Args:
            queryset (QuerySet): Rows to aggregate; callers pre-filter it.

        Returns:
            QuerySet: `values("batch")` rows annotated with `latest_created`,
            `total_jobs` and `completed_jobs`, newest batch first.
        """
        return (
            queryset.values("batch")
            .annotate(
                latest_created=Max("created"),
                total_jobs=Count("id"),
                completed_jobs=Count("id", filter=Q(completed__isnull=False)),
            )
            .filter(total_jobs=F("completed_jobs"))  # Only fully completed batches
            .order_by("-latest_created")
        )

    def lookups(
        self,
        request: HttpRequest,
        model_admin: admin.ModelAdmin,
    ) -> list[tuple[str, str]]:
        """
        Show up to five batches with incomplete jobs, plus the currently filtered
        batch, and the most recent fully complete batch. Fill with more completed
        batches if there are fewer than five batches shown.

        Choices are returned in a stable order: incomplete batches (most
        recently created first), then the currently selected batch, then
        completed batches (most recent first). Each batch appears once.

        Args:
            request (HttpRequest): Current admin request.
            model_admin (admin.ModelAdmin): Admin class in use.

        Returns:
            list[tuple[str, str]]: (value, label) pairs for batch selection.
        """
        queryset = model_admin.get_queryset(request)

        incomplete_batches = (
            queryset.filter(completed__isnull=True)
            .exclude(batch__isnull=True)
            .values("batch")
            .annotate(latest_created=Max("created"))
            .order_by("-latest_created")[: self.max_batches]
        )

        # A dict is used as an insertion-ordered set so the sidebar order is
        # deterministic; a plain set made it vary from process to process.
        batch_choices: dict[str, None] = dict.fromkeys(
            str(row["batch"]) for row in incomplete_batches
        )

        # Ensure the currently filtered batch is included.
        # NOTE(review): this value comes straight from the query string and is
        # not validated here - confirm how malformed values should be handled.
        current_batch = self.value()
        if current_batch:
            batch_choices.setdefault(current_batch, None)

        # Always offer the most recent fully completed batch.
        most_recent_complete_batch = self._fully_completed_batches(
            queryset.filter(batch__isnull=False)
        ).first()
        if most_recent_complete_batch:
            batch_choices.setdefault(str(most_recent_complete_batch["batch"]), None)

        # If we still have fewer than the cap, add more completed batches.
        if len(batch_choices) < self.max_batches:
            additional_complete_batches = self._fully_completed_batches(
                queryset.filter(
                    ~Q(batch__in=list(batch_choices)), batch__isnull=False
                )
            )
            for row in additional_complete_batches:
                if len(batch_choices) >= self.max_batches:
                    break
                batch_choices.setdefault(str(row["batch"]), None)

        # The label is the first 12 characters of the batch id plus an ellipsis.
        return [(batch, batch[:12] + "...") for batch in batch_choices]

    def queryset(
        self,
        request: HttpRequest,
        queryset: QuerySet,
    ) -> QuerySet:
        """
        Filter the queryset to a specific batch when a value is selected.

        Args:
            request (HttpRequest): Current admin request.
            queryset (QuerySet): Base queryset for the changelist.

        Returns:
            QuerySet: Filtered queryset limited to the chosen batch, or the
            unmodified queryset when no batch is selected.
        """
        batch_value = self.value()
        if batch_value:
            return queryset.filter(batch=batch_value)
        return queryset


class TaskStatusModelAdmin(admin.ModelAdmin):
    """
    Shared ModelAdmin base for task-tracking models.

    Declares the lifecycle/status fields as read-only and gives every admin
    instance `display_<field>` callables that render timestamps as relative
    times (e.g., "3 minutes ago").
    """

    readonly_fields = (
        "created",
        "modified",
        "last_started",
        "completed",
        "failed",
        "status",
        "task_id",
        "failure_reason",
        "retry_count",
        "failure_history",
        "status_history",
    )

    @staticmethod
    def generate_natural_timestamp_display_property(field_name: str):
        """
        Create a `list_display`-compatible callable for one timestamp field.

        The callable carries `short_description` (the title-cased field name)
        and `admin_order_field` (the field itself).

        Args:
            field_name (str): Name of the timestamp field on the model.

        Returns:
            callable: Takes a model instance and returns the `naturaltime`
            rendering of the field. A falsy value is returned unchanged, and
            `None` is returned when the attribute does not exist.
        """

        def render_relative_time(obj):
            # A missing attribute behaves like an unset timestamp.
            timestamp = getattr(obj, field_name, None)
            return naturaltime(timestamp) if timestamp else timestamp

        render_relative_time.short_description = field_name.replace("_", " ").title()
        render_relative_time.admin_order_field = field_name
        return render_relative_time

    def __init__(self, *args, **kwargs):
        """
        Attach the `display_<field>` helpers, then run the normal initializer.

        One helper is created per known timestamp field so subclasses can
        reference e.g. `display_created` in `list_display`.
        """
        timestamp_fields = (
            "created",
            "modified",
            "last_started",
            "completed",
            "failed",
        )
        for name in timestamp_fields:
            helper = self.generate_natural_timestamp_display_property(name)
            setattr(self, f"display_{name}", helper)

        super().__init__(*args, **kwargs)


@admin.register(ImportJob)
class ImportJobAdmin(TaskStatusModelAdmin):
    """Admin configuration for `ImportJob`."""

    # Base task fields plus the job's own fields are read-only in the form.
    readonly_fields = TaskStatusModelAdmin.readonly_fields + (
        "project",
        "created_by",
        "url",
    )
    # The display_* columns are the relative-time helpers that
    # TaskStatusModelAdmin.__init__ attaches to each admin instance.
    list_display = (
        "display_created",
        "display_modified",
        "display_last_started",
        "display_completed",
        "url",
        "status",
    )
    list_filter = (
        LastStartedFilter,
        CompletedFilter,
        FailedFilter,
        ("created_by", admin.RelatedOnlyFieldListFilter),
        ImportJobCampaignListFilter,
        ImportJobProjectListFilter,
    )
    search_fields = ("url", "status")


@admin.register(ImportItem)
class ImportItemAdmin(TaskStatusModelAdmin):
    """Admin configuration for `ImportItem`."""

    # Base task fields plus the links to the job and the item are read-only.
    readonly_fields = TaskStatusModelAdmin.readonly_fields + ("job", "item")

    # The display_* columns are the relative-time helpers that
    # TaskStatusModelAdmin.__init__ attaches to each admin instance.
    list_display = (
        "display_created",
        "display_modified",
        "display_last_started",
        "display_completed",
        "url",
        "status",
    )
    # Creator, campaign and project are all reached through the item's job.
    list_filter = (
        LastStartedFilter,
        CompletedFilter,
        FailedFilter,
        ("job__created_by", admin.RelatedOnlyFieldListFilter),
        ImportItemCampaignListFilter,
        ImportJobItemProjectListFilter,
    )
    search_fields = ("url", "status")


@admin.register(ImportItemAsset)
class ImportItemAssetAdmin(TaskStatusModelAdmin):
    """Admin configuration for `ImportItemAsset`."""

    # Base task fields plus the asset's own identifying fields are read-only.
    readonly_fields = TaskStatusModelAdmin.readonly_fields + (
        "import_item",
        "asset",
        "sequence_number",
    )

    # The display_* columns are the relative-time helpers that
    # TaskStatusModelAdmin.__init__ attaches to each admin instance.
    list_display = (
        "display_created",
        "display_last_started",
        "display_completed",
        "url",
        "failure_reason",
        "status",
    )
    # Creator, campaign and project are reached through import_item -> job.
    list_filter = (
        LastStartedFilter,
        CompletedFilter,
        FailedFilter,
        "failure_reason",
        ("import_item__job__created_by", admin.RelatedOnlyFieldListFilter),
        ImportItemAssetCampaignListFilter,
        ImportJobAssetProjectListFilter,
    )
    search_fields = ("url", "status")
    # Bulk action that re-queues the download task for the selected rows.
    actions = (retry_download_task,)


@admin.register(VerifyAssetImageJob)
class VerifyAssetImageJobAdmin(TaskStatusModelAdmin):
    """Admin configuration for `VerifyAssetImageJob`."""

    # Base task fields plus the asset and batch references are read-only.
    readonly_fields = TaskStatusModelAdmin.readonly_fields + ("asset", "batch")
    # The display_* columns are the relative-time helpers that
    # TaskStatusModelAdmin.__init__ attaches to each admin instance.
    list_display = (
        "display_created",
        "display_last_started",
        "asset",
        "batch",
        "failure_reason",
        "status",
    )
    # BatchFilter narrows the changelist to a single batch of jobs.
    list_filter = (
        LastStartedFilter,
        CompletedFilter,
        FailedFilter,
        "failure_reason",
        BatchFilter,
    )
    search_fields = ("status",)


@admin.register(DownloadAssetImageJob)
class DownloadAssetImageJobAdmin(TaskStatusModelAdmin):
    """Admin configuration for `DownloadAssetImageJob`."""

    # Base task fields plus the asset and batch references are read-only.
    readonly_fields = TaskStatusModelAdmin.readonly_fields + ("asset", "batch")
    # The display_* columns are the relative-time helpers that
    # TaskStatusModelAdmin.__init__ attaches to each admin instance.
    list_display = (
        "display_created",
        "display_last_started",
        "asset",
        "batch",
        "failure_reason",
        "status",
    )
    # BatchFilter narrows the changelist to a single batch of jobs.
    list_filter = (
        LastStartedFilter,
        CompletedFilter,
        FailedFilter,
        "failure_reason",
        BatchFilter,
    )
    search_fields = ("status",)


================================================
FILE: importer/apps.py
================================================
from django.apps import AppConfig


class ImporterAppConfig(AppConfig):
    """Django application configuration for the `importer` app."""

    # Python path of the application this configuration applies to.
    name = "importer"


================================================
FILE: importer/celery.py
================================================
import importlib
import pkgutil

from celery import Celery

# Celery application object for this module, named "importer".
app = Celery("importer")

# Using a string here means the worker doesn't have to serialize
# the configuration object to child processes.
# - namespace='CELERY' means all celery-related configuration keys
#   should have a `CELERY_` prefix.
app.config_from_object("django.conf:settings", namespace="CELERY")

# Load task modules from all registered Django app configs.
# Modules that autodiscovery does not pick up are imported separately by the
# on_after_finalize handler defined further down in this module.
app.autodiscover_tasks()


def import_all_submodules(package_name: str):
    """
    Import `package_name` and then every module found beneath it.

    Sub-packages are walked recursively. When the imported object is a plain
    module (it has no `__path__`), only that module is imported.
    Used sparingly at Celery startup to ensure all task modules are loaded.

    Args:
        package_name (str): Dotted name of the package to import.

    Returns:
        None
    """
    package = importlib.import_module(package_name)
    try:
        search_path = package.__path__
    except AttributeError:
        # Plain module: there is nothing below it to walk.
        return

    dotted_prefix = f"{package.__name__}."
    for module_info in pkgutil.walk_packages(search_path, dotted_prefix):
        importlib.import_module(module_info.name)


# Celery autodiscovery only finds tasks.py or tasks/__init__.py, so every
# other module inside the task packages has to be imported explicitly.
# This is deferred until the app is finalized so Django is fully loaded.
@app.on_after_finalize.connect
def _load_all_task_modules(sender, **kwargs):
    """Import every submodule of the task packages once the app is finalized."""
    for task_package in ("concordia.tasks", "importer.tasks"):
        import_all_submodules(task_package)


================================================
FILE: importer/config.py
================================================


================================================
FILE: importer/entrypoint.sh
================================================
#!/bin/bash

set -e -u # Exit immediately for unhandled errors or undefined variables

# Make sure the log directory and log file exist before the worker starts.
mkdir -p /app/logs
touch /app/logs/concordia.log

#  To avoid trace and reporting of errors in the X-Ray SDK
export AWS_XRAY_CONTEXT_MISSING=LOG_ERROR

echo "Running celery worker"
# exec replaces this bash process with the worker instead of leaving bash as
# an idle parent, so signals sent to the script's PID reach celery directly.
# Worker options: app "concordia", info-level logging, concurrency of 10.
exec celery -A concordia worker -l info -c 10


================================================
FILE: importer/exceptions.py
================================================
class ImageImportFailure(Exception):
    """
    Error type for a failed image import.

    Raise this when importing or downloading an asset image does not succeed.
    Pass a short, human-readable reason as the exception message so that logs
    and debugging output explain what went wrong.
    """


================================================
FILE: importer/migrations/0001_initial.py
================================================
# Generated by Django 2.0.7 on 2018-07-09 08:02

from django.db import migrations, models


class Migration(migrations.Migration):
    # First migration of the importer app: it has no dependencies and creates
    # the CampaignItemAssetCount and CampaignTaskDetails models.
    initial = True

    dependencies = []

    operations = [
        # Holds an asset count together with a campaign slug and an item
        # identifier.
        migrations.CreateModel(
            name="CampaignItemAssetCount",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("campaign_slug", models.SlugField()),
                ("campaign_item_identifier", models.CharField(max_length=50)),
                ("campaign_item_asset_count", models.IntegerField()),
            ],
        ),
        # Holds page/item/asset counts and a task id per campaign; the slug is
        # unique, so there is at most one row per campaign slug.
        migrations.CreateModel(
            name="CampaignTaskDetails",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("campaign_name", models.CharField(max_length=50)),
                ("campaign_slug", models.SlugField(unique=True)),
                ("campaign_page_count", models.IntegerField()),
                ("campaign_item_count", models.IntegerField()),
                ("campaign_asset_count", models.IntegerField()),
                ("campaign_task_id", models.CharField(max_length=100)),
            ],
        ),
    ]


================================================
FILE: importer/migrations/0001_squashed_0015_auto_20180925_1851.py
================================================
# Generated by Django 2.0.9 on 2018-10-04 15:00

import django.core.validators
import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Squashed replacement for importer migrations 0001 through 0015.

    The net schema it produces consists of three models -- ``ImportItem``,
    ``ImportItemAsset`` and ``ImportJob`` -- plus their ``unique_together``
    constraints. No ``Campaign*`` models are created here.

    ``ImportItemAsset`` and ``ImportJob`` are created directly with
    ``help_text``-style field definitions, whereas ``ImportItem`` is created
    with ``verbose_name``-style definitions and then brought in line through
    the ``AlterField`` operations that follow.
    """

    # Migrations that this single file stands in for. Databases that already
    # applied all of them are treated as having applied this one.
    replaces = [
        ("importer", "0001_initial"),
        ("importer", "0002_auto_20180709_0833"),
        ("importer", "0003_auto_20180709_0933"),
        ("importer", "0004_auto_20180812_1007"),
        ("importer", "0005_auto_20180816_1702"),
        ("importer", "0006_auto_20180912_0229"),
        ("importer", "0007_auto_20180917_1654"),
        ("importer", "0008_campaigntaskdetails_project"),
        ("importer", "0009_convert_project_text_to_keys"),
        ("importer", "0010_auto_20180920_2013"),
        ("importer", "0011_auto_20180922_0208"),
        ("importer", "0012_auto_20180923_0231"),
        ("importer", "0013_auto_20180924_1318"),
        ("importer", "0014_auto_20180924_1943"),
        ("importer", "0015_auto_20180925_1851"),
    ]

    initial = True

    # The concordia migrations listed here plus the (swappable) user model
    # must be applied first; the operations below reference concordia.Item,
    # concordia.Asset, concordia.Project and settings.AUTH_USER_MODEL.
    dependencies = [
        ("concordia", "0019_auto_20180920_1503"),
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("concordia", "0021_auto_20180922_0202"),
        ("concordia", "0024_auto_20180924_1529"),
    ]

    operations = [
        # ImportItem is created without its ``job`` foreign key because
        # ImportJob does not exist yet; the key is added by AddField below.
        migrations.CreateModel(
            name="ImportItem",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created", models.DateTimeField(auto_now_add=True)),
                ("modified", models.DateTimeField(auto_now=True)),
                (
                    "last_started",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Last time when a worker started processing this job",  # NOQA
                    ),
                ),
                (
                    "completed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job completed processing",
                    ),
                ),
                (
                    "failed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job failed and will not be restarted",  # NOQA
                    ),
                ),
                (
                    "status",
                    models.TextField(
                        blank=True,
                        null=True,
                        verbose_name="Status message, if any, from the last worker",
                    ),
                ),
                (
                    "task_id",
                    models.UUIDField(
                        blank=True,
                        null=True,
                        verbose_name="UUID of the last Celery task to process this record",  # NOQA
                    ),
                ),
                ("url", models.URLField()),
                (
                    "item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE, to="concordia.Item"
                    ),
                ),
            ],
            options={"abstract": False},
        ),
        # ImportItemAsset: one row per asset within an ImportItem, with a
        # sequence number validated to be at least 1.
        migrations.CreateModel(
            name="ImportItemAsset",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created", models.DateTimeField(auto_now_add=True)),
                ("modified", models.DateTimeField(auto_now=True)),
                (
                    "last_started",
                    models.DateTimeField(
                        blank=True,
                        help_text="Last time when a worker started processing this job",
                        null=True,
                    ),
                ),
                (
                    "completed",
                    models.DateTimeField(
                        blank=True,
                        help_text="Time when the job completed without error",
                        null=True,
                    ),
                ),
                (
                    "failed",
                    models.DateTimeField(
                        blank=True,
                        help_text="Time when the job failed due to an error",
                        null=True,
                    ),
                ),
                (
                    "status",
                    models.TextField(
                        blank=True,
                        default="",
                        help_text="Status message, if any, from the last worker",
                    ),
                ),
                (
                    "task_id",
                    models.UUIDField(
                        blank=True,
                        help_text="UUID of the last Celery task to process this record",
                        null=True,
                    ),
                ),
                ("url", models.URLField()),
                (
                    "sequence_number",
                    models.PositiveIntegerField(
                        validators=[django.core.validators.MinValueValidator(1)]
                    ),
                ),
                (
                    "asset",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Asset",
                    ),
                ),
                (
                    "import_item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        related_name="assets",
                        to="importer.ImportItem",
                    ),
                ),
            ],
            options={"abstract": False},
        ),
        # ImportJob: the top-level job, tied to a concordia.Project and
        # optionally to the user who created it.
        migrations.CreateModel(
            name="ImportJob",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created", models.DateTimeField(auto_now_add=True)),
                ("modified", models.DateTimeField(auto_now=True)),
                (
                    "last_started",
                    models.DateTimeField(
                        blank=True,
                        help_text="Last time when a worker started processing this job",
                        null=True,
                    ),
                ),
                (
                    "completed",
                    models.DateTimeField(
                        blank=True,
                        help_text="Time when the job completed without error",
                        null=True,
                    ),
                ),
                (
                    "failed",
                    models.DateTimeField(
                        blank=True,
                        help_text="Time when the job failed due to an error",
                        null=True,
                    ),
                ),
                (
                    "status",
                    models.TextField(
                        blank=True,
                        default="",
                        help_text="Status message, if any, from the last worker",
                    ),
                ),
                (
                    "task_id",
                    models.UUIDField(
                        blank=True,
                        help_text="UUID of the last Celery task to process this record",
                        null=True,
                    ),
                ),
                ("url", models.URLField(verbose_name="Source URL for the entire job")),
                (
                    "created_by",
                    # SET_NULL keeps the job row when the creating user is deleted.
                    models.ForeignKey(
                        null=True,
                        on_delete=django.db.models.deletion.SET_NULL,
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
                (
                    "project",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Project",
                    ),
                ),
            ],
            options={"abstract": False},
        ),
        # Now that ImportJob exists, link each ImportItem to its job.
        migrations.AddField(
            model_name="importitem",
            name="job",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE,
                related_name="items",
                to="importer.ImportJob",
            ),
        ),
        # ImportItem.status: drop null=True in favour of default="".
        # (It is altered once more further down to switch verbose_name to
        # help_text.)
        migrations.AlterField(
            model_name="importitem",
            name="status",
            field=models.TextField(
                blank=True,
                default="",
                verbose_name="Status message, if any, from the last worker",
            ),
        ),
        # The remaining AlterField operations move ImportItem's descriptive
        # text from verbose_name to help_text, matching the definitions used
        # for ImportItemAsset and ImportJob above.
        migrations.AlterField(
            model_name="importitem",
            name="completed",
            field=models.DateTimeField(
                blank=True,
                help_text="Time when the job completed without error",
                null=True,
            ),
        ),
        migrations.AlterField(
            model_name="importitem",
            name="failed",
            field=models.DateTimeField(
                blank=True,
                help_text="Time when the job failed due to an error",
                null=True,
            ),
        ),
        migrations.AlterField(
            model_name="importitem",
            name="last_started",
            field=models.DateTimeField(
                blank=True,
                help_text="Last time when a worker started processing this job",
                null=True,
            ),
        ),
        migrations.AlterField(
            model_name="importitem",
            name="status",
            field=models.TextField(
                blank=True,
                default="",
                help_text="Status message, if any, from the last worker",
            ),
        ),
        migrations.AlterField(
            model_name="importitem",
            name="task_id",
            field=models.UUIDField(
                blank=True,
                help_text="UUID of the last Celery task to process this record",
                null=True,
            ),
        ),
        # A given item may appear at most once per job.
        migrations.AlterUniqueTogether(
            name="importitem", unique_together={("job", "item")}
        ),
        # Within one import item, both the asset and the sequence number must
        # be unique.
        migrations.AlterUniqueTogether(
            name="importitemasset",
            unique_together={
                ("import_item", "asset"),
                ("import_item", "sequence_number"),
            },
        ),
    ]


================================================
FILE: importer/migrations/0002_auto_20180709_0833.py
================================================
# Generated by Django 2.0.7 on 2018-07-09 08:33

from django.db import migrations, models


class Migration(migrations.Migration):
    """Relax the count and task-id columns so they may be left empty.

    Every field touched here is redefined with ``blank=True, null=True``.
    """

    dependencies = [("importer", "0001_initial")]

    operations = [
        # CampaignItemAssetCount: the asset count becomes optional.
        migrations.AlterField(
            model_name="campaignitemassetcount",
            name="campaign_item_asset_count",
            field=models.IntegerField(blank=True, null=True),
        ),
        # CampaignTaskDetails: all three counters become optional.
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_asset_count",
            field=models.IntegerField(blank=True, null=True),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_item_count",
            field=models.IntegerField(blank=True, null=True),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_page_count",
            field=models.IntegerField(blank=True, null=True),
        ),
        # The task id keeps its 100-character limit but may now be NULL.
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_task_id",
            field=models.CharField(blank=True, max_length=100, null=True),
        ),
    ]


================================================
FILE: importer/migrations/0003_auto_20180709_0933.py
================================================
# Generated by Django 2.0.7 on 2018-07-09 09:33

from django.db import migrations, models


class Migration(migrations.Migration):
    """Give the four integer count columns a default of ``0``.

    The fields remain ``blank=True, null=True``; only ``default=0`` is added.
    """

    dependencies = [("importer", "0002_auto_20180709_0833")]

    operations = [
        migrations.AlterField(
            model_name="campaignitemassetcount",
            name="campaign_item_asset_count",
            field=models.IntegerField(blank=True, default=0, null=True),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_asset_count",
            field=models.IntegerField(blank=True, default=0, null=True),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_item_count",
            field=models.IntegerField(blank=True, default=0, null=True),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_page_count",
            field=models.IntegerField(blank=True, default=0, null=True),
        ),
    ]


================================================
FILE: importer/migrations/0004_auto_20180812_1007.py
================================================
# Generated by Django 2.0.8 on 2018-08-12 10:07

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Link asset counts to their task row and add project name/slug columns.

    ``CampaignItemAssetCount`` loses its ``campaign_slug`` column and gains a
    foreign key to ``CampaignTaskDetails`` plus an ``item_task_id`` string.
    ``CampaignTaskDetails`` gains ``project_name`` / ``project_slug``, loses
    ``campaign_page_count`` and becomes unique on
    ``(campaign_slug, project_slug)``.
    """

    dependencies = [("importer", "0003_auto_20180709_0933")]

    operations = [
        migrations.RemoveField(
            model_name="campaignitemassetcount", name="campaign_slug"
        ),
        # ``default=1`` with ``preserve_default=False`` is a one-off value used
        # only while adding the column; it is not kept on the field afterwards.
        # NOTE(review): presumably this requires a CampaignTaskDetails row with
        # pk=1 if CampaignItemAssetCount already has rows -- confirm.
        migrations.AddField(
            model_name="campaignitemassetcount",
            name="campaign_task",
            field=models.ForeignKey(
                default=1,
                on_delete=django.db.models.deletion.CASCADE,
                to="importer.CampaignTaskDetails",
            ),
            preserve_default=False,
        ),
        migrations.AddField(
            model_name="campaignitemassetcount",
            name="item_task_id",
            field=models.CharField(blank=True, max_length=100, null=True),
        ),
        # One-off default again; note that the integer 1 is supplied for a
        # character column.
        migrations.AddField(
            model_name="campaigntaskdetails",
            name="project_name",
            field=models.CharField(default=1, max_length=250),
            preserve_default=False,
        ),
        # NOTE(review): a unique column populated from a single one-off default
        # looks like it would conflict if the table held more than one row when
        # this ran -- confirm against the deployment history.
        migrations.AddField(
            model_name="campaigntaskdetails",
            name="project_slug",
            field=models.SlugField(default=1, max_length=250, unique=True),
            preserve_default=False,
        ),
        migrations.RemoveField(
            model_name="campaigntaskdetails", name="campaign_page_count"
        ),
        # Composite uniqueness on the campaign/project slug pair.
        migrations.AlterUniqueTogether(
            name="campaigntaskdetails",
            unique_together={("campaign_slug", "project_slug")},
        ),
    ]


================================================
FILE: importer/migrations/0005_auto_20180816_1702.py
================================================
# Generated by Django 2.0.8 on 2018-08-16 17:02

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine both ``CampaignTaskDetails`` slug fields without ``unique=True``.

    The preceding migration added ``project_slug`` with ``unique=True``; here
    both slug fields are declared as plain ``SlugField`` columns with no
    per-column uniqueness flag.
    """

    dependencies = [("importer", "0004_auto_20180812_1007")]

    operations = [
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_slug",
            field=models.SlugField(),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="project_slug",
            field=models.SlugField(max_length=250),
        ),
    ]


================================================
FILE: importer/migrations/0006_auto_20180912_0229.py
================================================
# Generated by Django 2.0.8 on 2018-09-12 02:29

from django.db import migrations, models


class Migration(migrations.Migration):
    """Set ``max_length=500`` on the identifier, name and slug columns."""

    dependencies = [("importer", "0005_auto_20180816_1702")]

    operations = [
        migrations.AlterField(
            model_name="campaignitemassetcount",
            name="campaign_item_identifier",
            field=models.CharField(max_length=500),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_name",
            field=models.CharField(max_length=500),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_slug",
            field=models.SlugField(max_length=500),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="project_name",
            field=models.CharField(max_length=500),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="project_slug",
            field=models.SlugField(max_length=500),
        ),
    ]


================================================
FILE: importer/migrations/0007_auto_20180917_1654.py
================================================
# Generated by Django 2.0.8 on 2018-09-17 16:54

from django.db import migrations, models


class Migration(migrations.Migration):
    """Shrink the 500-character columns set by the previous migration.

    Campaign identifier/name/slug go to 80 characters; project name/slug go
    to 250.

    NOTE(review): reducing ``max_length`` on populated columns may fail or
    truncate depending on the database backend -- confirm existing data fit.
    """

    dependencies = [("importer", "0006_auto_20180912_0229")]

    operations = [
        # Campaign-level columns: 500 -> 80.
        migrations.AlterField(
            model_name="campaignitemassetcount",
            name="campaign_item_identifier",
            field=models.CharField(max_length=80),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_name",
            field=models.CharField(max_length=80),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="campaign_slug",
            field=models.SlugField(max_length=80),
        ),
        # Project-level columns: 500 -> 250.
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="project_name",
            field=models.CharField(max_length=250),
        ),
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="project_slug",
            field=models.SlugField(max_length=250),
        ),
    ]


================================================
FILE: importer/migrations/0008_campaigntaskdetails_project.py
================================================
# Generated by Django 2.0.8 on 2018-09-20 20:05

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Add a nullable ``project`` foreign key to ``CampaignTaskDetails``.

    The key points at ``concordia.Project`` and is created with ``null=True``,
    so existing rows are accepted without a value.
    """

    dependencies = [("importer", "0007_auto_20180917_1654")]

    operations = [
        migrations.AddField(
            model_name="campaigntaskdetails",
            name="project",
            field=models.ForeignKey(
                null=True,
                on_delete=django.db.models.deletion.CASCADE,
                to="concordia.Project",
            ),
        )
    ]


================================================
FILE: importer/migrations/0009_convert_project_text_to_keys.py
================================================
# Generated by Django 2.0.8 on 2018-09-20 20:06
import logging

from django.db import migrations


def convert_slugs_to_references(apps, schema_editor):
    """Populate ``CampaignTaskDetails.project`` from the stored slug pair.

    For every ``CampaignTaskDetails`` row, look up the ``concordia.Project``
    whose ``slug`` equals the row's ``project_slug`` and whose campaign slug
    equals the row's ``campaign_slug``. On a match the project is assigned and
    the row saved; when no such project exists the row is logged and deleted.

    Args:
        apps: Historical app registry passed in by ``RunPython``.
        schema_editor: Supplied by ``RunPython``; not used here.
    """
    # Resolve the historical model classes rather than importing the live ones.
    project_model = apps.get_model("concordia", "Project")
    task_details_model = apps.get_model("importer", "CampaignTaskDetails")

    for task_details in task_details_model.objects.all():
        lookup = {
            "slug": task_details.project_slug,
            "campaign__slug": task_details.campaign_slug,
        }
        try:
            task_details.project = project_model.objects.get(**lookup)
            task_details.save()
        except project_model.DoesNotExist:
            # Orphaned row: nothing to link it to, so it is removed.
            logging.error(
                "%s references a non-existent project! Deleting it!", task_details
            )
            task_details.delete()


class Migration(migrations.Migration):
    """Data migration: fill ``CampaignTaskDetails.project`` from slug columns.

    Runs ``convert_slugs_to_references`` between the migration that adds the
    nullable ``project`` foreign key and the one that makes it mandatory.
    """

    dependencies = [("importer", "0008_campaigntaskdetails_project")]

    operations = [
        migrations.RunPython(
            convert_slugs_to_references,
            # Without a reverse callable Django treats the migration as
            # irreversible and refuses to migrate backwards past it. Nothing
            # needs undoing on the way back: the slug columns are still
            # present at this point and the ``project`` column is dropped by
            # reversing the previous migration.
            reverse_code=migrations.RunPython.noop,
        )
    ]


================================================
FILE: importer/migrations/0010_auto_20180920_2013.py
================================================
# Generated by Django 2.0.8 on 2018-09-20 20:13

import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """Make ``project`` mandatory and drop the text columns it replaces.

    Runs after the data migration that populates ``project``; the foreign key
    is redefined without ``null=True`` and the name/slug columns are removed.
    """

    dependencies = [("importer", "0009_convert_project_text_to_keys")]

    operations = [
        # Same foreign key as before, now without null=True.
        migrations.AlterField(
            model_name="campaigntaskdetails",
            name="project",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE, to="concordia.Project"
            ),
        ),
        # Clear the composite constraint before removing the slug columns below.
        migrations.AlterUniqueTogether(
            name="campaigntaskdetails", unique_together=set()
        ),
        migrations.RemoveField(model_name="campaigntaskdetails", name="campaign_name"),
        migrations.RemoveField(model_name="campaigntaskdetails", name="campaign_slug"),
        migrations.RemoveField(model_name="campaigntaskdetails", name="project_name"),
        migrations.RemoveField(model_name="campaigntaskdetails", name="project_slug"),
    ]


================================================
FILE: importer/migrations/0011_auto_20180922_0208.py
================================================
# Generated by Django 2.0.8 on 2018-09-22 02:08

import django.core.validators
import django.db.models.deletion
from django.conf import settings
from django.db import migrations, models


class Migration(migrations.Migration):
    """Replace the ``Campaign*`` models with the ``Import*`` models.

    Creates ``ImportItem``, ``ImportItemAsset`` and ``ImportJob``, then removes
    the foreign keys on the two ``Campaign*`` models and deletes those models.
    No rows are copied from the old tables to the new ones by this migration.
    """

    dependencies = [
        ("concordia", "0021_auto_20180922_0202"),
        migrations.swappable_dependency(settings.AUTH_USER_MODEL),
        ("importer", "0010_auto_20180920_2013"),
    ]

    operations = [
        # ImportItem is created first, without its ``job`` key: ImportJob does
        # not exist yet, so the key is added by the final AddField operation.
        migrations.CreateModel(
            name="ImportItem",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created", models.DateTimeField(auto_now_add=True)),
                ("modified", models.DateTimeField(auto_now=True)),
                (
                    "last_started",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Last time when a worker started processing this job",  # NOQA
                    ),
                ),
                (
                    "completed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job completed processing",
                    ),
                ),
                (
                    "failed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job failed and will not be restarted",  # NOQA
                    ),
                ),
                (
                    "status",
                    models.TextField(
                        blank=True,
                        null=True,
                        verbose_name="Status message, if any, from the last worker",
                    ),
                ),
                (
                    "task_id",
                    models.UUIDField(
                        blank=True,
                        null=True,
                        verbose_name="UUID of the last Celery task to process this record",  # NOQA
                    ),
                ),
                ("url", models.URLField()),
                (
                    "item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE, to="concordia.Item"
                    ),
                ),
            ],
            options={"abstract": False},
        ),
        # ImportItemAsset: same timestamp/status columns, plus a sequence
        # number (validated >= 1) and links to the asset and its import item.
        migrations.CreateModel(
            name="ImportItemAsset",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created", models.DateTimeField(auto_now_add=True)),
                ("modified", models.DateTimeField(auto_now=True)),
                (
                    "last_started",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Last time when a worker started processing this job",  # NOQA
                    ),
                ),
                (
                    "completed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job completed processing",
                    ),
                ),
                (
                    "failed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job failed and will not be restarted",  # NOQA
                    ),
                ),
                (
                    "status",
                    models.TextField(
                        blank=True,
                        null=True,
                        verbose_name="Status message, if any, from the last worker",
                    ),
                ),
                (
                    "task_id",
                    models.UUIDField(
                        blank=True,
                        null=True,
                        verbose_name="UUID of the last Celery task to process this record",  # NOQA
                    ),
                ),
                ("url", models.URLField()),
                (
                    "sequence_number",
                    models.PositiveIntegerField(
                        validators=[django.core.validators.MinValueValidator(1)]
                    ),
                ),
                (
                    "asset",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Asset",
                    ),
                ),
                (
                    "import_item",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        related_name="assets",
                        to="importer.ImportItem",
                    ),
                ),
            ],
            options={"abstract": False},
        ),
        # ImportJob: the top-level job. Its URL column is named ``source_url``
        # at this point in the history.
        migrations.CreateModel(
            name="ImportJob",
            fields=[
                (
                    "id",
                    models.AutoField(
                        auto_created=True,
                        primary_key=True,
                        serialize=False,
                        verbose_name="ID",
                    ),
                ),
                ("created", models.DateTimeField(auto_now_add=True)),
                ("modified", models.DateTimeField(auto_now=True)),
                (
                    "last_started",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Last time when a worker started processing this job",  # NOQA
                    ),
                ),
                (
                    "completed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job completed processing",
                    ),
                ),
                (
                    "failed",
                    models.DateTimeField(
                        blank=True,
                        null=True,
                        verbose_name="Time when the job failed and will not be restarted",  # NOQA
                    ),
                ),
                (
                    "status",
                    models.TextField(
                        blank=True,
                        null=True,
                        verbose_name="Status message, if any, from the last worker",
                    ),
                ),
                (
                    "task_id",
                    models.UUIDField(
                        blank=True,
                        null=True,
                        verbose_name="UUID of the last Celery task to process this record",  # NOQA
                    ),
                ),
                (
                    "source_url",
                    models.URLField(verbose_name="Source URL for the entire job"),
                ),
                (
                    "created_by",
                    # SET_NULL keeps the job row when the creating user is deleted.
                    models.ForeignKey(
                        null=True,
                        on_delete=django.db.models.deletion.SET_NULL,
                        to=settings.AUTH_USER_MODEL,
                    ),
                ),
                (
                    "project",
                    models.ForeignKey(
                        on_delete=django.db.models.deletion.CASCADE,
                        to="concordia.Project",
                    ),
                ),
            ],
            options={"abstract": False},
        ),
        # Drop the foreign keys on the old models first, then the models.
        migrations.RemoveField(
            model_name="campaignitemassetcount", name="campaign_task"
        ),
        migrations.RemoveField(model_name="campaigntaskdetails", name="project"),
        migrations.DeleteModel(name="CampaignItemAssetCount"),
        migrations.DeleteModel(name="CampaignTaskDetails"),
        # Finally link ImportItem to the ImportJob model created above.
        migrations.AddField(
            model_name="importitem",
            name="job",
            field=models.ForeignKey(
                on_delete=django.db.models.deletion.CASCADE,
                related_name="items",
                to="importer.ImportJob",
            ),
        ),
    ]


================================================
FILE: importer/migrations/0012_auto_20180923_0231.py
================================================
# Generated by Django 2.0.8 on 2018-09-23 02:31

from django.db import migrations, models


class Migration(migrations.Migration):
    """Redefine ``status`` on all three ``Import*`` models.

    Each ``status`` field was created with ``null=True``; here it is declared
    with ``default=""`` and no ``null=True``. The ``verbose_name`` text is
    unchanged.
    """

    dependencies = [("importer", "0011_auto_20180922_0208")]

    operations = [
        migrations.AlterField(
            model_name="importitem",
            name="status",
            field=models.TextField(
                blank=True,
                default="",
                verbose_name="Status message, if any, from the last worker",
            ),
        ),
        migrations.AlterField(
            model_name="importitemasset",
            name="status",
            field=models.TextField(
                blank=True,
                default="",
                verbose_name="Status message, if any, from the last worker",
            ),
        ),
        migrations.AlterField(
            model_name="importjob",
            name="status",
            field=models.TextField(
                blank=True,
                default="",
                verbose_name="Status message, if any, from the last worker",
            ),
        ),
    ]


================================================
FILE: importer/migrations/0013_auto_20180924_1318.py
================================================
# Generated by Django 2.0.8 on 2018-09-24 13:18

from django.db import migrations


class Migration(migrations.Migration):
    """Rename the ``source_url`` field of the ``importjob`` model to ``url``."""

    dependencies = [
        ("importer", "0012_auto_20180923_0231"),
    ]

    operations = [
        migrations.RenameField(
            model_name="importjob",
            old_name="source_url",
            new_name="url",
        ),
    ]


================================================
FILE: importer/migrations/0014_auto_20180924_1943.py
================================================
# Generated by Django 2.0.8 on 2018-09-24 19:43

from django.db import migrations


class Migration(migrations.Migration):
    """
    Set the ``unique_together`` constraints on the import tracking models.

    ``importitem`` becomes unique per (job, item); ``importitemasset``
    becomes unique per (import_item, sequence_number) and per
    (import_item, asset).
    """

    dependencies = [
        ("concordia", "0024_auto_20180924_1529"),
        ("importer", "0013_auto_20180924_1318"),
    ]

    # Table of (model, constraint set), applied in the listed order.
    operations = [
        migrations.AlterUniqueTogether(
            name=constrained_model,
            unique_together=unique_sets,
        )
        for constrained_model, unique_sets in (
            ("importitem", {("job", "item")}),
            (
                "importitemasset",
                {
                    ("import_item", "sequence_number"),
                    ("import_item", "asset"),
                },
            ),
        )
    ]


================================================
FILE: importer/migrations/0015_auto_20180925_1851.py
================================================
# Generated by Django 2.0.8 on 2018-09-25 18:51

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Redefine the task bookkeeping fields with ``help_text`` descriptions.

    For each of ``importitem``, ``importitemasset`` and ``importjob`` (in
    that order) the ``completed``, ``failed``, ``last_started``, ``status``
    and ``task_id`` fields are altered (in that order).
    """

    dependencies = [
        ("importer", "0014_auto_20180924_1943"),
    ]

    # Model-major ordering: every field of one model is altered before moving
    # on to the next model. The field is constructed inside the comprehension
    # so that each operation receives its own field instance.
    operations = [
        migrations.AlterField(
            model_name=task_model,
            name=field_name,
            field=field_class(**field_options),
        )
        for task_model in ("importitem", "importitemasset", "importjob")
        for field_name, field_class, field_options in (
            (
                "completed",
                models.DateTimeField,
                {
                    "blank": True,
                    "help_text": "Time when the job completed without error",
                    "null": True,
                },
            ),
            (
                "failed",
                models.DateTimeField,
                {
                    "blank": True,
                    "help_text": "Time when the job failed due to an error",
                    "null": True,
                },
            ),
            (
                "last_started",
                models.DateTimeField,
                {
                    "blank": True,
                    "help_text": "Last time when a worker started processing this job",
                    "null": True,
                },
            ),
            (
                "status",
                models.TextField,
                {
                    "blank": True,
                    "default": "",
                    "help_text": "Status message, if any, from the last worker",
                },
            ),
            (
                "task_id",
                models.UUIDField,
                {
                    "blank": True,
                    "help_text": "UUID of the last Celery task to process this record",
                    "null": True,
                },
            ),
        )
    ]


================================================
FILE: importer/migrations/0016_importitem_failure_reason_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-02-20 16:30

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Add a ``failure_reason`` field to the importer task models.

    The field is an optional 50-character choice field whose only choice is
    ``"Image"``; it is added to ``importitem``, ``importitemasset`` and
    ``importjob``, in that order.
    """

    dependencies = [
        ("importer", "0001_squashed_0015_auto_20180925_1851"),
    ]

    # One AddField per model; each iteration builds its own field instance.
    operations = [
        migrations.AddField(
            model_name=task_model,
            name="failure_reason",
            field=models.CharField(
                max_length=50,
                choices=[("Image", "Image")],
                default="",
                blank=True,
            ),
        )
        for task_model in ("importitem", "importitemasset", "importjob")
    ]


================================================
FILE: importer/migrations/0017_importitem_failure_history_importitem_retry_count_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-03-03 20:49

import django.core.serializers.json
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Add retry bookkeeping to the importer task models.

    Operations, in order:

    1. For each of ``importitem``, ``importitemasset`` and ``importjob``,
       add ``failure_history`` (JSON list) and then ``retry_count``
       (integer, default 0).
    2. Redefine ``failure_reason`` on those same models, extending the
       choices with ``"Retries"`` and adding help text.
    """

    dependencies = [
        ("importer", "0016_importitem_failure_reason_and_more"),
    ]

    # Fields are constructed inside the comprehensions so that every operation
    # receives its own field instance.
    operations = [
        migrations.AddField(
            model_name=task_model,
            name=field_name,
            field=field_class(**field_options),
        )
        for task_model in ("importitem", "importitemasset", "importjob")
        for field_name, field_class, field_options in (
            (
                "failure_history",
                models.JSONField,
                {
                    "default": list,
                    "encoder": django.core.serializers.json.DjangoJSONEncoder,
                    "help_text": "Information about previous failures of the task, if any",
                },
            ),
            (
                "retry_count",
                models.IntegerField,
                {
                    "default": 0,
                    "help_text": "Number of times the task was retried",
                },
            ),
        )
    ] + [
        migrations.AlterField(
            model_name=task_model,
            name="failure_reason",
            field=models.CharField(
                max_length=50,
                choices=[("Image", "Image"), ("Retries", "Retries")],
                default="",
                blank=True,
                help_text="Reason the task failed, if one was provided",
            ),
        )
        for task_model in ("importitem", "importitemasset", "importjob")
    ]


================================================
FILE: importer/migrations/0018_importitem_status_history_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-03-06 16:04

import django.core.serializers.json
import django.db.models.deletion
from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Add status history tracking and create the asset image job models.

    Operations, in order:

    1. Add a ``status_history`` JSON field to ``importitem``,
       ``importitemasset`` and ``importjob``.
    2. For each of those models, redefine ``failure_history`` and then
       ``retry_count`` with ``blank=True``.
    3. Create ``VerifyAssetImageJob`` and then ``DownloadAssetImageJob``;
       both are given the same set of columns.
    """

    dependencies = [
        ("concordia", "0103_alter_item_title"),
        ("importer", "0017_importitem_failure_history_importitem_retry_count_and_more"),
    ]

    # All fields are constructed inside the comprehensions so that every
    # operation (and every created model) receives its own field instances.
    operations = (
        [
            migrations.AddField(
                model_name=task_model,
                name="status_history",
                field=models.JSONField(
                    help_text="Previous statuses on the task, if any",
                    encoder=django.core.serializers.json.DjangoJSONEncoder,
                    default=list,
                    blank=True,
                ),
            )
            for task_model in ("importitem", "importitemasset", "importjob")
        ]
        + [
            migrations.AlterField(
                model_name=task_model,
                name=field_name,
                field=field_class(**field_options),
            )
            for task_model in ("importitem", "importitemasset", "importjob")
            for field_name, field_class, field_options in (
                (
                    "failure_history",
                    models.JSONField,
                    {
                        "blank": True,
                        "default": list,
                        "encoder": django.core.serializers.json.DjangoJSONEncoder,
                        "help_text": "Information about previous failures of the task, if any",
                    },
                ),
                (
                    "retry_count",
                    models.IntegerField,
                    {
                        "blank": True,
                        "default": 0,
                        "help_text": "Number of times the task was retried",
                    },
                ),
            )
        ]
        + [
            migrations.CreateModel(
                name=job_model,
                fields=[
                    (
                        "id",
                        models.AutoField(
                            verbose_name="ID",
                            serialize=False,
                            primary_key=True,
                            auto_created=True,
                        ),
                    ),
                    ("created", models.DateTimeField(auto_now_add=True)),
                    ("modified", models.DateTimeField(auto_now=True)),
                    (
                        "last_started",
                        models.DateTimeField(
                            help_text="Last time when a worker started processing this job",
                            null=True,
                            blank=True,
                        ),
                    ),
                    (
                        "completed",
                        models.DateTimeField(
                            help_text="Time when the job completed without error",
                            null=True,
                            blank=True,
                        ),
                    ),
                    (
                        "failed",
                        models.DateTimeField(
                            help_text="Time when the job failed due to an error",
                            null=True,
                            blank=True,
                        ),
                    ),
                    (
                        "status",
                        models.TextField(
                            help_text="Status message, if any, from the last worker",
                            default="",
                            blank=True,
                        ),
                    ),
                    (
                        "task_id",
                        models.UUIDField(
                            help_text="UUID of the last Celery task to process this record",
                            null=True,
                            blank=True,
                        ),
                    ),
                    (
                        "failure_reason",
                        models.CharField(
                            help_text="Reason the task failed, if one was provided",
                            max_length=50,
                            choices=[("Image", "Image"), ("Retries", "Retries")],
                            default="",
                            blank=True,
                        ),
                    ),
                    (
                        "retry_count",
                        models.IntegerField(
                            help_text="Number of times the task was retried",
                            default=0,
                            blank=True,
                        ),
                    ),
                    (
                        "failure_history",
                        models.JSONField(
                            help_text="Information about previous failures of the task, if any",
                            encoder=django.core.serializers.json.DjangoJSONEncoder,
                            default=list,
                            blank=True,
                        ),
                    ),
                    (
                        "status_history",
                        models.JSONField(
                            help_text="Previous statuses on the task, if any",
                            encoder=django.core.serializers.json.DjangoJSONEncoder,
                            default=list,
                            blank=True,
                        ),
                    ),
                    ("batch", models.UUIDField(editable=False, blank=True)),
                    (
                        "asset",
                        models.ForeignKey(
                            to="concordia.asset",
                            on_delete=django.db.models.deletion.CASCADE,
                        ),
                    ),
                ],
                options={
                    "abstract": False,
                },
            )
            for job_model in ("VerifyAssetImageJob", "DownloadAssetImageJob")
        ]
    )


================================================
FILE: importer/migrations/0019_alter_downloadassetimagejob_batch_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-03-07 19:19

from django.db import migrations, models


class Migration(migrations.Migration):
    """
    Redefine ``batch`` on the asset image job models.

    On ``downloadassetimagejob`` and then ``verifyassetimagejob`` the field
    is set to a non-editable UUID field that allows blank and NULL values.
    """

    dependencies = [
        ("importer", "0018_importitem_status_history_and_more"),
    ]

    # One AlterField per model; each iteration builds its own field instance.
    operations = [
        migrations.AlterField(
            model_name=job_model,
            name="batch",
            field=models.UUIDField(null=True, blank=True, editable=False),
        )
        for job_model in ("downloadassetimagejob", "verifyassetimagejob")
    ]


================================================
FILE: importer/migrations/0020_alter_downloadassetimagejob_unique_together_and_more.py
================================================
# Generated by Django 4.2.16 on 2025-03-18 20:01

from django.db import migrations


class Migration(migrations.Migration):
    """
    Make (asset, batch) unique together on the asset image job models.

    The constraint is applied to ``downloadassetimagejob`` and then to
    ``verifyassetimagejob``.
    """

    dependencies = [
        ("concordia", "0103_alter_item_title"),
        ("importer", "0019_alter_downloadassetimagejob_batch_and_more"),
    ]

    operations = [
        migrations.AlterUniqueTogether(
            name=job_model,
            unique_together={("asset", "batch")},
        )
        for job_model in ("downloadassetimagejob", "verifyassetimagejob")
    ]


================================================
FILE: importer/migrations/__init__.py
================================================


================================================
FILE: importer/models.py
================================================
from logging import getLogger
from uuid import UUID

from django.core.serializers.json import DjangoJSONEncoder
from django.core.validators import MinValueValidator
from django.db import models
from django.urls import reverse
from django.utils import timezone

from configuration.utils import configuration_value
from importer import tasks

logger = getLogger(__name__)


class TaskStatusModel(models.Model):
    """
    Abstract model holding the shared bookkeeping for task records.

    It supplies created/modified timestamps, start/completion/failure
    timestamps, a free-text status with a history list, failure details
    (reason, history and retry count) and the UUID of the last Celery task
    that processed the record.
    """

    class FailureReason(models.TextChoices):
        IMAGE = "Image"
        RETRIES = "Retries"

    created = models.DateTimeField(auto_now_add=True)
    modified = models.DateTimeField(auto_now=True)

    last_started = models.DateTimeField(
        blank=True,
        null=True,
        help_text="Last time when a worker started processing this job",
    )
    completed = models.DateTimeField(
        blank=True,
        null=True,
        help_text="Time when the job completed without error",
    )
    failed = models.DateTimeField(
        blank=True,
        null=True,
        help_text="Time when the job failed due to an error",
    )

    status = models.TextField(
        blank=True,
        default="",
        help_text="Status message, if any, from the last worker",
    )

    task_id = models.UUIDField(
        blank=True,
        null=True,
        help_text="UUID of the last Celery task to process this record",
    )

    failure_reason = models.CharField(
        blank=True,
        default="",
        max_length=50,
        choices=FailureReason.choices,
        help_text="Reason the task failed, if one was provided",
    )

    retry_count = models.IntegerField(
        blank=True,
        default=0,
        help_text="Number of times the task was retried",
    )

    failure_history = models.JSONField(
        blank=True,
        default=list,
        encoder=DjangoJSONEncoder,
        help_text="Information about previous failures of the task, if any",
    )

    status_history = models.JSONField(
        blank=True,
        default=list,
        encoder=DjangoJSONEncoder,
        help_text="Previous statuses on the task, if any",
    )

    class Meta:
        abstract = True

    def retry_if_possible(self) -> bool:
        """
        Hook for scheduling a retry of this task.

        The base implementation never schedules anything; subclasses that
        support retries are expected to override it.

        Returns:
            bool: True if a retry was scheduled, otherwise False. Always
            False here.
        """
        return False

    def update_failure_history(self, do_save: bool = True) -> None:
        """
        Record the current failure state as a new failure history entry.

        The entry captures the `failed` timestamp, the `failure_reason` and
        the current `status`.

        Args:
            do_save (bool): If True, save the model after appending.
        """
        failure_entry = {
            "failed": self.failed,
            "failure_reason": self.failure_reason,
            "status": self.status,
        }
        self.failure_history.append(failure_entry)
        if do_save:
            self.save()

    def update_status(self, status: str, do_save: bool = True) -> None:
        """
        Replace the status, archiving the outgoing one in the history.

        The archived entry pairs the outgoing status with the current value
        of `modified`.

        Args:
            status (str): The new status value to set.
            do_save (bool): If True, save the model after updating.
        """
        outgoing_entry = {
            "status": self.status,
            "timestamp": self.modified,
        }
        self.status_history.append(outgoing_entry)
        self.status = status
        if do_save:
            self.save()

    def reset_for_retry(self) -> bool:
        """
        Clear the failure state so the task can be run again.

        Only records currently marked as failed are reset: their failure
        details are archived, the failure markers are cleared, the retry
        count is incremented and the status becomes "Retrying", all
        persisted with a single save. Records that are not failed only get
        an explanatory status (saved immediately) and a logged warning.

        Returns:
            bool: True if the record was reset, otherwise False.
        """
        if not self.failed:
            # Nothing to reset; note why on the record itself and in the log.
            self.update_status(
                "Task was not marked as failed, "
                "so it will not be reset for retrying."
            )
            logger.warning(
                "Task %s was not marked as failed, "
                "so it will not be reset for retrying",
                self,
            )
            return False

        logger.info("Resetting task %s for retrying", self)
        # Archive the failure before its markers are wiped below.
        self.update_failure_history(do_save=False)
        self.failed = None
        self.failure_reason = ""
        self.retry_count += 1
        self.update_status("Retrying", do_save=False)
        self.save()
        return True


class BatchedJob(TaskStatusModel):
    """
    Abstract task model whose records can be grouped by a batch UUID.

    `get_batch_admin_url` (class level) and `batch_admin_url` (instance
    level) produce the admin changelist URL filtered to a single batch.
    """

    # Optional grouping key. The task system uses it to run jobs in smaller
    # groups instead of spawning an arbitrarily large number at once, and the
    # admin uses it to show every job spawned by a particular action.
    batch = models.UUIDField(editable=False, null=True, blank=True)

    class Meta:
        abstract = True

    @classmethod
    def get_batch_admin_url(cls, batch: UUID | str | None) -> str:
        """
        Return this model's admin changelist URL filtered by `batch`.

        Args:
            batch (UUID | str | None): Batch identifier to filter by. A
                truthy value is required.

        Returns:
            str: The changelist URL followed by a `?batch=<batch>` query
            string.

        Raises:
            ValueError: If `batch` is falsy.
        """
        if not batch:
            raise ValueError("A batch value must be provided.")

        meta = cls._meta
        changelist_url = reverse(
            f"admin:{meta.app_label}_{meta.model_name}_changelist"
        )
        return f"{changelist_url}?batch={batch}"

    @property
    def batch_admin_url(self) -> str | None:
        """
        Admin changelist URL filtered to this instance's own batch.

        Saves callers holding an instance from invoking the class method
        with `self.batch` themselves.

        Returns:
            str | None: The filtered admin URL, or None when the instance
            has no batch.
        """
        if not self.batch:
            return None
        return self.__class__.get_batch_admin_url(self.batch)


class ImportJob(TaskStatusModel):
    """
    A user's request to import item(s) from a remote URL into a project.
    """

    created_by = models.ForeignKey("auth.User", on_delete=models.SET_NULL, null=True)

    project = models.ForeignKey("concordia.Project", on_delete=models.CASCADE)

    url = models.URLField(verbose_name="Source URL for the entire job")

    def __str__(self) -> str:
        # created_by is nullable, so the username falls back to None.
        creator_name = self.created_by.username if self.created_by else None
        project_title = self.project.title
        return "ImportJob(created_by=%s, project=%s, url=%s)" % (
            creator_name,
            project_title,
            self.url,
        )


class ImportItem(TaskStatusModel):
    """
    Task status record for a single Item imported as part of an ImportJob.
    """

    job = models.ForeignKey(ImportJob, related_name="items", on_delete=models.CASCADE)

    url = models.URLField()

    item = models.ForeignKey("concordia.Item", on_delete=models.CASCADE)

    class Meta:
        # A given item may appear only once within a given job.
        unique_together = (("job", "item"),)

    def __str__(self) -> str:
        parent_job, source_url = self.job, self.url
        return "ImportItem(job=%s, url=%s)" % (parent_job, source_url)


class ImportItemAsset(TaskStatusModel):
    """
    Tracks the task status of a single Asset imported for an ImportItem.

    Within one import item both the sequence number and the asset are
    declared unique.
    """

    import_item = models.ForeignKey(
        ImportItem, on_delete=models.CASCADE, related_name="assets"
    )

    url = models.URLField()
    sequence_number = models.PositiveIntegerField(validators=[MinValueValidator(1)])

    asset = models.ForeignKey("concordia.Asset", on_delete=models.CASCADE)

    class Meta:
        unique_together = (("import_item", "sequence_number"), ("import_item", "asset"))

    def __str__(self) -> str:
        parent, source_url = self.import_item, self.url
        return "ImportItemAsset(import_item=%s, url=%s)" % (parent, source_url)

    def retry_if_possible(self) -> bool:
        """
        Schedule another download attempt if this task failed on its image.

        Only failures whose ``failure_reason`` is ``FailureReason.IMAGE`` are
        considered. Two configuration values drive the decision:

        - `asset_image_import_max_retries`: upper bound compared against
          ``retry_count``.
        - `asset_image_import_max_retry_delay`: delay in minutes; it is
          multiplied by 60 and passed as the Celery ``countdown``.

        When the task is eligible and ``reset_for_retry()`` succeeds, a new
        ``download_asset_task`` is queued with ``apply_async``. When it is
        not eligible, the task is marked failed with
        ``FailureReason.RETRIES`` and saved.

        Returns:
            bool: True if a retry was scheduled, otherwise False.
        """
        if self.failure_reason != TaskStatusModel.FailureReason.IMAGE:
            # Only image failures are retried here.
            return False

        max_retries = configuration_value("asset_image_import_max_retries")
        retry_delay = configuration_value("asset_image_import_max_retry_delay")

        if self.retry_count < max_retries and retry_delay > 0:
            if not self.reset_for_retry():
                logger.warning(
                    "Task %s was not reset for retrying, so it will not be retried",
                    self,
                )
                return False

            scheduled = tasks.assets.download_asset_task.apply_async(
                (self.pk,), countdown=retry_delay * 60
            )
            return bool(scheduled)

        # Not eligible for another attempt: record the terminal failure.
        logger.warning(
            "Task %s has reached the maximum number of retries (%s) "
            "and will not be repeated",
            self,
            max_retries,
        )
        self.update_failure_history(do_save=False)
        self.failed = timezone.now()
        # Built before failure_reason is overwritten so the message reports
        # the reason and status that led here.
        new_status = (
            "Maximum number of retries reached while retrying "
            "image download for asset. The failure reason before retrying "
            f"was {self.failure_reason} and the status was {self.status}"
        )
        self.update_status(new_status, do_save=False)
        self.failure_reason = TaskStatusModel.FailureReason.RETRIES
        self.save()
        return False


class VerifyAssetImageJob(BatchedJob):
    """
    Batched job that checks an asset image which was downloaded earlier.

    The ``(asset, batch)`` pair is declared unique.
    """

    asset = models.ForeignKey("concordia.Asset", on_delete=models.CASCADE)

    class Meta:
        unique_together = (("asset", "batch"),)

    def __str__(self) -> str:
        return f"VerifyAssetImageJob for {self.asset}"


class DownloadAssetImageJob(BatchedJob):
    """
    Batched job that fetches an asset image so it can be verified later.

    The ``(asset, batch)`` pair is declared unique.
    """

    asset = models.ForeignKey("concordia.Asset", on_delete=models.CASCADE)

    class Meta:
        unique_together = (("asset", "batch"),)

    def __str__(self) -> str:
        return f"DownloadAssetImageJob for {self.asset}"


================================================
FILE: importer/setup.py
================================================
#!/usr/bin/env python
from setuptools import find_packages, setup

# The version is read from the importer package so it is defined in one place.
VERSION = __import__("importer").get_version()
INSTALL_REQUIREMENTS = ["boto3", "celery", "requests", "Django>=2.1.5", "Pillow"]
DESCRIPTION = "Download collections of images from loc.gov"
# strip() removes the newline that follows the opening quotes; without it
# splitlines() produces an empty first entry, which is not a valid classifier.
CLASSIFIERS = """
Environment :: Web Environment
Framework :: Django :: 2.0
Development Status :: 2 - Pre-Alpha
Programming Language :: Python
Programming Language :: Python :: 3.12
""".strip().splitlines()

# Decode explicitly as UTF-8 so the build does not depend on the platform's
# default locale encoding.
with open("README.rst", "r", encoding="utf-8") as f:
    LONG_DESCRIPTION = f.read()


setup(
    name="importer",
    version=VERSION,
    description=DESCRIPTION,
    long_description=LONG_DESCRIPTION,
    packages=find_packages(),
    include_package_data=True,
    install_requires=INSTALL_REQUIREMENTS,
    classifiers=CLASSIFIERS,
)


================================================
FILE: importer/tasks/__init__.py
================================================
import concurrent.futures
from logging import getLogger
from typing import Iterable

from .items import import_item_count_from_url

logger = getLogger(__name__)


def fetch_all_urls(items: Iterable[str]) -> tuple[list[str], int]:
    """
    Look up every item URL concurrently and combine the outcomes.

    Each URL is handed to ``import_item_count_from_url`` on a pool of up to
    25 worker threads. Every call is unpacked as a ``(value, score)`` pair.

    Args:
        items: Iterable of item URLs.

    Returns:
        A 2-tuple ``(values, total)``:
            - ``values``: the first element of each pair, in input order
            - ``total``: the sum of the second elements
    """
    with concurrent.futures.ThreadPoolExecutor(max_workers=25) as pool:
        outcomes = pool.map(import_item_count_from_url, items)

    # Leaving the ``with`` block waits for the workers, so the lazy map
    # result can be drained here.
    pairs = list(outcomes)

    finals: list[str] = [value for value, _ in pairs]
    totals: int = sum(score for _, score in pairs)

    return finals, totals


================================================
FILE: importer/tasks/assets.py
================================================
import hashlib
import os
from logging import getLogger
from tempfile import NamedTemporaryFile
from urllib.parse import urlparse

import boto3
import requests
from celery import Task
from django.conf import settings
from flags.state import flag_enabled
from requests.exceptions import HTTPError

from concordia.storage import ASSET_STORAGE
from importer import models
from importer.celery import app
from importer.exceptions import ImageImportFailure

from .decorators import update_task_status

logger = getLogger(__name__)


@app.task(
    bind=True,
    autoretry_for=(HTTPError,),
    retry_backoff=60 * 60,
    retry_backoff_max=8 * 60 * 60,
    retry_jitter=True,
    retry_kwargs={"max_retries": 3},
    rate_limit=1,
)
def download_asset_task(self: Task, import_asset_pk: int) -> None:
    """
    Celery entry point that downloads the image for one ImportItemAsset.

    Loads the ImportItemAsset together with its item, project and campaign,
    then hands it to ``download_asset``. The task is configured to retry
    automatically on ``HTTPError``.

    Args:
        import_asset_pk: Primary key of the ImportItemAsset to process.

    Raises:
        models.ImportItemAsset.DoesNotExist: If no row has that primary key
            (logged, then re-raised).
    """
    try:
        # Slugs of the containing objects form the storage path, so fetch
        # them in the same query.
        import_asset = models.ImportItemAsset.objects.select_related(
            "import_item__item__project__campaign"
        ).get(pk=import_asset_pk)
    except models.ImportItemAsset.DoesNotExist:
        logger.exception(
            "ImportItemAsset %s could not be found while attempting to "
            "spawn download_asset task",
            import_asset_pk,
        )
        raise

    download_asset(self, import_asset)


@update_task_status
def download_asset(self: Task, job: "models.ImportItemAsset") -> None:
    """
    Fetch the image for ``job.asset`` and record where it was stored.

    The source URL is ``job.url`` when the job object has a ``url``
    attribute, otherwise ``job.asset.download_url``. The file extension is
    taken from the URL path, lower-cased, and falls back to ``jpg`` when it
    is missing or ``jpeg``. After a successful download the asset's
    ``storage_image`` is set and the asset is saved.

    Args:
        job: Job object carrying the target ``asset`` and optionally a
            ``url``.

    Raises:
        ImageImportFailure: Propagated from
            ``download_and_store_asset_image``.
    """
    asset = job.asset

    if hasattr(job, "url"):
        download_url: str = job.url
    else:
        download_url = asset.download_url

    url_path = urlparse(download_url).path
    _, dotted_extension = os.path.splitext(url_path)
    file_extension = dotted_extension.lstrip(".").lower()
    if file_extension in ("", "jpeg"):
        file_extension = "jpg"

    asset_image_filename = asset.get_asset_image_filename(file_extension)
    storage_image = download_and_store_asset_image(download_url, asset_image_filename)

    logger.info(
        "Download and storage of asset image %s complete. Setting "
        "storage_image on asset %s (%s)",
        storage_image,
        asset,
        asset.id,
    )
    asset.storage_image = storage_image
    asset.save()


def download_and_store_asset_image(download_url: str, asset_image_filename: str) -> str:
    """
    Stream a remote image to a temp file, upload it to storage, then verify.

    The file is streamed in 256 KiB chunks and hashed with MD5, uploaded to
    ``ASSET_STORAGE``, then the object metadata is fetched via S3
    ``head_object`` and the ETag is compared to the computed MD5. When the
    ``IMPORT_IMAGE_CHECKSUM`` flag is enabled a mismatch raises
    ``ImageImportFailure``. When disabled a warning is logged.

    Args:
        download_url: HTTP(S) URL of the image to fetch.
        asset_image_filename: Destination key or path in storage.

    Returns:
        The storage key that was written (``asset_image_filename``).

    Raises:
        ImageImportFailure: If any exception occurs while downloading or
            uploading, or on checksum mismatch while the flag is enabled.
            Errors raised by the ``head_object`` call itself are not wrapped
            and propagate unchanged.
    """
    try:
        hasher = hashlib.md5(usedforsecurity=False)
        # Download the remote file to a temp file then upload to storage.
        with NamedTemporaryFile(mode="x+b") as temp_file:
            resp = requests.get(download_url, stream=True, timeout=30)
            try:
                resp.raise_for_status()

                for chunk in resp.iter_content(chunk_size=256 * 1024):
                    temp_file.write(chunk)
                    hasher.update(chunk)
            finally:
                # A streamed response keeps its connection open until the
                # body is fully read or the response is closed. Close it
                # explicitly so an HTTP error or a failure mid-stream does
                # not leave the socket open.
                resp.close()

            temp_file.flush()
            temp_file.seek(0)
            ASSET_STORAGE.save(asset_image_filename, temp_file)
    except Exception as exc:
        logger.exception(
            "Unable to download %s to %s", download_url, asset_image_filename
        )
        raise ImageImportFailure(
            f"Unable to download {download_url} to {asset_image_filename}"
        ) from exc

    filehash = hasher.hexdigest()
    response = boto3.client("s3").head_object(
        Bucket=settings.AWS_STORAGE_BUCKET_NAME, Key=asset_image_filename
    )
    etag = response.get("ETag")[1:-1]  # trim quotes around hash

    if filehash != etag:
        if flag_enabled("IMPORT_IMAGE_CHECKSUM"):
            logger.error(
                "ETag (%s) for %s did not match calculated md5 hash (%s) and "
                "the IMPORT_IMAGE_CHECKSUM flag is enabled",
                etag,
                asset_image_filename,
                filehash,
            )
            raise ImageImportFailure(
                f"ETag {etag} for {asset_image_filename} did not match "
                f"calculated md5 hash {filehash}"
            )
        else:
            logger.warning(
                "ETag (%s) for %s did not match calculated md5 hash (%s) but "
                "the IMPORT_IMAGE_CHECKSUM flag is disabled",
                etag,
                asset_image_filename,
                filehash,
            )
    else:
        logger.info(
            "Checksums for %s matched. Upload successful.",
            asset_image_filename,
        )

    return asset_image_filename


================================================
FILE: importer/tasks/collections.py
================================================
from logging import getLogger
from typing import Optional
from urllib.parse import parse_qsl, urlencode, urlsplit, urlunsplit

import requests
from celery import Task
from django.core.cache import cache
from requests import Session
from requests.adapters import HTTPAdapter
from requests.packages.urllib3.util.retry import Retry

from importer import models
from importer.celery import app

from .decorators import update_task_status
from .items import create_item_import_task, get_item_info_from_result

logger = getLogger(__name__)

# Tasks


@app.task(bind=True)
def import_collection_task(
    self: Task, import_job_pk: int, redownload: bool = False
) -> None:
    """
    Celery entry point for importing every item behind an ImportJob's URL.

    Fetches the ``ImportJob`` by primary key and passes it, together with
    ``redownload``, to ``import_collection``.

    Args:
        import_job_pk: Primary key of the ImportJob.
        redownload: Forwarded unchanged to ``import_collection``.
    """
    job = models.ImportJob.objects.get(pk=import_job_pk)
    import_collection(self, job, redownload)


@update_task_status
def import_collection(
    self: Task, import_job: models.ImportJob, redownload: bool = False
) -> None:
    """
    Queue one item import task per item found at the job's collection URL.

    The job URL is normalized, the collection is walked, and
    ``create_item_import_task`` is queued for each discovered item URL.

    Args:
        import_job: The ImportJob that initiated the collection import.
        redownload: Forwarded unchanged to each ``create_item_import_task``.
    """
    normalized_url = normalize_collection_url(import_job.url)
    # Only the URL of each (item_id, item_url) pair is needed here.
    for _item_id, item_url in get_collection_items(normalized_url):
        create_item_import_task.delay(import_job.pk, item_url, redownload)


# End tasks


def requests_retry_session(
    retries: int = 3,
    backoff_factor: float = 60 * 60,
    status_forcelist: tuple[int, ...] = (429, 500, 502, 503, 504),
    session: Optional[Session] = None,
) -> Session:
    """
    Return a ``requests.Session`` whose HTTP and HTTPS adapters retry.

    Args:
        retries: Used as the ``total``, ``read`` and ``connect`` limits of
            the ``Retry`` policy.
        backoff_factor: Passed to ``Retry`` as ``backoff_factor``.
        status_forcelist: Passed to ``Retry`` as ``status_forcelist``.
        session: Existing session to configure; a new one is created when
            this is omitted or falsy.

    Returns:
        The configured session (the one passed in, when given).
    """
    sess = session or requests.Session()

    retry_policy = Retry(
        total=retries,
        read=retries,
        connect=retries,
        backoff_factor=backoff_factor,
        status_forcelist=status_forcelist,
    )
    adapter = HTTPAdapter(max_retries=retry_policy)

    # The same adapter instance serves both URL schemes.
    for scheme_prefix in ("http://", "https://"):
        sess.mount(scheme_prefix, adapter)

    return sess


def normalize_collection_url(original_url: str) -> str:
    """
    Rewrite a collection or search URL so it requests JSON output.

    ``fo=json`` is placed first in the query string. Any existing ``fo``,
    ``at`` and ``sp`` parameters are dropped; all other parameters keep
    their original order. The URL fragment is discarded.

    Args:
        original_url: The source collection or search URL.

    Returns:
        The rebuilt URL with the adjusted query string.
    """
    parts = urlsplit(original_url)
    replaced_keys = ("fo", "at", "sp")

    kept_params = [
        (key, value)
        for key, value in parse_qsl(parts.query)
        if key not in replaced_keys
    ]
    query_string = urlencode([("fo", "json"), *kept_params])

    return urlunsplit((parts.scheme, parts.netloc, parts.path, query_string, None))


def get_collection_items(collection_url: str) -> list[tuple[str, str]]:
    """
    Walk a P1 collection or search endpoint and collect item IDs and URLs.

    Pages are followed through ``pagination.next`` until no next URL is
    given. Each successfully fetched page response is cached for 48 hours to
    reduce repeated network calls; non-OK responses are never cached, so a
    transient error page is fetched again on the next attempt.

    Args:
        collection_url: URL of a loc.gov collection or search results page.

    Returns:
        A list of ``(item_id, item_url)`` tuples discovered across pages.
        Results that ``get_item_info_from_result`` rejects or fails on are
        skipped with a warning.
    """
    items: list[tuple[str, str]] = []
    current_page_url: Optional[str] = collection_url

    while current_page_url:
        resp = cache.get(current_page_url)
        if resp is None:
            resp = requests_retry_session().get(current_page_url)
            # Only keep successful responses. Caching an error page would
            # make every import of this URL fail for the next 48 hours.
            if resp.ok:
                # 48-hour timeout
                cache.set(current_page_url, resp, timeout=(3600 * 48))

        data = resp.json()

        results = data.get("results", None)
        if results:
            for result in results:
                try:
                    item_info = get_item_info_from_result(result)
                    if item_info:
                        items.append(item_info)
                except Exception:
                    logger.warning(
                        "Skipping result from %s which did not match expected format:",
                        current_page_url,
                        exc_info=True,
                        extra={"data": {"result": result, "url": current_page_url}},
                    )
        else:
            logger.error('Expected URL %s to include "results"', current_page_url)

        # "pagination" may be absent or explicitly null; both end the walk.
        current_page_url = (data.get("pagination") or {}).get("next", None)

    if not items:
        logger.warning("No valid items found for collection url: %s", collection_url)

    return items


================================================
FILE: importer/tasks/decorators.py
================================================
from functools import wraps
from logging import getLogger
from typing import Any, Callable, Concatenate, ParamSpec, TypeVar

from celery import Task
from django.utils.timezone import now

from importer import models
from importer.exceptions import ImageImportFailure

logger = getLogger(__name__)

P = ParamSpec("P")
R = TypeVar("R")


def update_task_status(
    f: Callable[Concatenate[Task, Any, P], R],
) -> Callable[Concatenate[Task, Any, P], R]:
    """
    Decorator to track lifecycle and failure state for a task-like function.

    The wrapped function must take the Celery task self as the first argument
    and a TaskStatusModel instance as the second argument. On entry records
    last_started and task_id. On success sets completed and clears failure
    fields. On exception updates status, marks failed, sets failure_reason for
    known error types, saves the model, then attempts retry_if_possible before
    re-raising the original exception.

    Also guards against re-running a task already marked completed; in that
    case the wrapped function is not called and None is returned.

    Args:
        f: The function to wrap. Must accept
           ``(self, task_status_object, *args, **kwargs)``.

    Returns:
        A callable with the same signature as ``f``.
    """

    @wraps(f)
    def inner(
        self: Task, task_status_object: Any, *args: P.args, **kwargs: P.kwargs
    ) -> R:
        # Sanity guard: if another worker already completed this task, skip work.
        guard_qs = task_status_object.__class__._default_manager.filter(
            pk=task_status_object.pk, completed__isnull=False
        )
        if guard_qs.exists():
            logger.warning(
                "Task %s was already completed and will not be repeated",
                task_status_object,
                extra={
                    "data": {
                        "object": task_status_object,
                        "args": args,
                        "kwargs": kwargs,
                    }
                },
            )
            return  # noqa: RET504

        task_status_object.last_started = now()
        task_status_object.task_id = self.request.id
        task_status_object.save()
        try:
            result = f(self, task_status_object, *args, **kwargs)
            task_status_object.completed = now()
            task_status_object.failed = None
            task_status_object.failure_reason = ""
            task_status_object.update_status("Completed")
            return result
        except Exception as exc:
            new_status = "{}\n\nUnhandled exception: {}".format(
                task_status_object.status, exc
            ).strip()
            task_status_object.update_status(new_status, do_save=False)
            task_status_object.failed = now()
            if isinstance(exc, ImageImportFailure):
                task_status_object.failure_reason = (
                    models.TaskStatusModel.FailureReason.IMAGE
                )
            task_status_object.save()

            retry_result = task_status_object.retry_if_possible()
            if retry_result:
                task_status_object.last_started = now()
                # retry_if_possible() may return a plain bool instead of a
                # Celery result object (ImportItemAsset is annotated to
                # return bool). Reading ``.id`` unconditionally would raise
                # AttributeError here and mask the original exception. When
                # no id is available the current task_id is kept; the
                # retried task records its own id on entry to this wrapper.
                retry_task_id = getattr(retry_result, "id", None)
                if retry_task_id is not None:
                    task_status_object.task_id = retry_task_id
                task_status_object.save()
            else:
                logger.info("Retrying task %s was not possible", task_status_object)
            raise

    return inner


================================================
FILE: importer/tasks/images.py
================================================
from logging import getLogger
from typing import Any, Optional, Sequence
from uuid import UUID

from celery import Task, chord
from PIL import Image
from requests.exceptions import HTTPError

from concordia.models import Asset
from concordia.storage import ASSET_STORAGE
from importer import models
from importer.celery import app

from .assets import download_asset
from .decorators import update_task_status

logger = getLogger(__name__)


@app.task(
    bind=True,
    autoretry_for=(HTTPError,),
    retry_backoff=60 * 60,
    retry_backoff_max=8 * 60 * 60,
    retry_jitter=True,
    retry_kwargs={"max_retries": 3},
    rate_limit=1,
)
def redownload_image_task(self: Task, asset_pk: int) -> None:
    """
    Download an asset's image again and store it.

    Fetches the Asset, creates a batch-less DownloadAssetImageJob to track
    the work, and passes that job to ``download_asset``.

    Args:
        asset_pk: Primary key of the Asset to re-download.
    """
    asset = Asset.objects.get(pk=asset_pk)
    logger.info("Redownloading %s to %s", asset.download_url, asset.get_absolute_url())

    # download_asset runs under update_task_status, which needs a job object
    # to record progress on.
    tracking_job = models.DownloadAssetImageJob.objects.create(
        asset=asset, batch=None
    )
    download_asset(self, tracking_job)


@app.task()
def batch_verify_asset_images_task_callback(
    results: Sequence[bool],
    batch: UUID,
    concurrency: int,
    failures_detected: bool,
) -> None:
    """
    Chord callback that runs after a group of verification tasks finishes.

    Marks failures as detected when none was recorded before and at least
    one result in this group is exactly ``False``. The next verification
    group is then queued in every case.

    Args:
        results: Verification outcomes for this chord (True or False).
        batch: Identifier for the active batch.
        concurrency: Number of jobs to run in the next batch.
        failures_detected: Whether a failure was already seen.
    """
    # Only the existence of a failure matters, not which jobs failed or how
    # many: a DownloadAssetImageJob is already created for each failure. Once
    # one failure is known, the results need no further inspection.
    if not failures_detected and any(result is False for result in results):
        logger.info("At least one verification failure detected for batch %s", batch)
        failures_detected = True

    batch_verify_asset_images_task.delay(batch, concurrency, failures_detected)


@app.task(bind=True)
def batch_verify_asset_images_task(
    self: Task, batch: UUID, concurrency: int = 2, failures_detected: bool = False
) -> None:
    """
    Run the next group of pending VerifyAssetImageJobs for a batch.

    Pending jobs are those in the batch with neither ``completed`` nor
    ``failed`` set, oldest first. Up to ``concurrency`` of them are started
    as a chord whose callback re-invokes this task. When none are pending:

    - if a failure was detected, the DownloadAssetImageJob batch is started;
    - otherwise the task ends.

    Args:
        batch: Identifier for the batch to process.
        concurrency: Number of jobs to process at once. Defaults to 2.
        failures_detected: Whether earlier groups reported a failure.
            Defaults to False.
    """
    logger.info(
        "Processing next %s VerifyAssetImageJobs for batch %s", concurrency, batch
    )

    pending_jobs = models.VerifyAssetImageJob.objects.filter(
        batch=batch, completed__isnull=True, failed__isnull=True
    ).order_by("created")

    if pending_jobs.exists():
        signatures = [
            verify_asset_image_task.s(pending.asset_id, batch)
            for pending in pending_jobs[:concurrency]
        ]
        chord(signatures)(
            batch_verify_asset_images_task_callback.s(
                batch, concurrency, failures_detected
            )
        )
        return

    logger.info("No VerifyAssetImageJobs remain for batch %s", batch)
    if not failures_detected:
        logger.info("No failures in VerifyAssetImageJob batch %s. Ending task.", batch)
        return

    logger.info(
        "Failures in VerifyAssetImageJobs in batch %s detected, so "
        "starting DownloadAssetImageJob batch",
        batch,
    )
    # Invoked directly rather than through .delay().
    batch_download_asset_images_task(batch, concurrency)


@app.task(
    bind=True,
    autoretry_for=(HTTPError,),
    retry_backoff=60 * 60,
    retry_backoff_max=8 * 60 * 60,
    retry_jitter=True,
    retry_kwargs={"max_retries": 3},
    rate_limit=1,
)
def verify_asset_image_task(
    self: Task, asset_pk: int, batch: Optional[UUID] = None, create_job: bool = False
) -> bool:
    """
    Celery entry point that verifies one asset's storage image.

    Resolves the Asset, then either creates a VerifyAssetImageJob or looks
    up the uncompleted one for this asset and batch, and runs
    ``verify_asset_image`` on it. The task is configured to retry
    automatically on ``HTTPError``.

    Args:
        asset_pk: Primary key of the Asset to verify.
        batch: Identifier for the verification batch, if any.
        create_job: If True, create a new job; otherwise fetch an existing one.

    Returns:
        The result of ``verify_asset_image``. When it is exactly True the
        job status is set to "Storage image verified" first.

    Raises:
        Asset.DoesNotExist: When the Asset cannot be found.
        models.VerifyAssetImageJob.DoesNotExist: When fetching a job that does
            not exist.
    """
    try:
        asset = Asset.objects.get(pk=asset_pk)
    except Asset.DoesNotExist:
        logger.exception(
            "Asset %s could not be found while attempting to "
            "spawn verify_asset_image task",
            asset_pk,
        )
        raise

    if not create_job:
        try:
            job = models.VerifyAssetImageJob.objects.get(
                asset=asset, batch=batch, completed=None
            )
        except models.VerifyAssetImageJob.DoesNotExist:
            logger.exception(
                "Uncompleted VerifyAssetImageJob for asset %s and batch %s could not "
                "be found while attempting to spawn verify_asset_image task",
                asset,
                batch,
            )
            raise
    else:
        job = models.VerifyAssetImageJob.objects.create(asset=asset, batch=batch)

    outcome = verify_asset_image(self, job)
    if outcome is True:
        job.update_status("Storage image verified")
    return outcome


def create_download_asset_image_job(asset: Asset, batch: Optional[UUID]) -> None:
    """
    Create a DownloadAssetImageJob for the asset and batch unless one exists.

    Args:
        asset: Asset to download.
        batch: Batch identifier or None.
    """
    job_manager = models.DownloadAssetImageJob.objects

    already_queued = job_manager.filter(asset=asset, batch=batch).first()
    if already_queued:
        # A job for this asset and batch is already present.
        return

    job_manager.create(asset=asset, batch=batch)


@update_task_status
def verify_asset_image(task: Task, job: Any) -> bool:
    """
    Check that the job's asset has a usable image in storage.

    Three checks run in order: a storage image name is set on the asset, the
    object exists in ``ASSET_STORAGE``, and Pillow's ``Image.verify()``
    accepts the file. The first failing check logs a status message, stores
    it on the job, makes sure a DownloadAssetImageJob exists for the asset
    and batch, and ends the verification.

    Args:
        task: Celery task instance.
        job: VerifyAssetImageJob instance.

    Returns:
        True if all checks pass, False otherwise.
    """
    asset = job.asset

    def report_failure(status: str) -> bool:
        # Shared handling for every failed check.
        logger.info(status)
        job.update_status(status)
        create_download_asset_image_job(asset, job.batch)
        return False

    if not asset.storage_image or not asset.storage_image.name:
        return report_failure(f"No storage image set on {asset} ({asset.id})")
    logger.info("Storage image set on %s (%s)", asset, asset.id)

    if not ASSET_STORAGE.exists(asset.storage_image.name):
        return report_failure(
            f"Storage image for {asset} ({asset.id}) missing from storage"
        )
    logger.info("Storage image for %s (%s) found in storage", asset, asset.id)

    try:
        with (
            ASSET_STORAGE.open(asset.storage_image.name, "rb") as image_file,
            Image.open(image_file) as image,
        ):
            image.verify()
        logger.info("Storage image for %s (%s) is not corrupt", asset, asset.id)
    except Exception as exc:
        return report_failure(
            f"Storage image for {asset} ({asset.id}), {asset.storage_image.name}, "
            f"is corrupt. The exception raised was Type: {type(exc).__name__}, "
            f"Message: {exc}"
        )

    logger.info(
        "Storage image for %s (%s), %s, verified successfully",
        asset,
        asset.id,
        asset.storage_image.name,
    )
    return True


@app.task()
def batch_download_asset_images_task_callback(
    results: Sequence[Any], batch: UUID, concurrency: int
) -> None:
    """
    Chord callback that runs after a group of download tasks finishes.

    The chord results are not inspected; the batch download task is simply
    queued again with the same arguments.

    Args:
        results: Chord results (unused).
        batch: Identifier for the batch.
        concurrency: Number of jobs to run in the next batch.
    """
    # Outcomes of the individual downloads are irrelevant here. Re-queue the
    # batch task so it picks up whatever jobs are still pending.
    batch_download_asset_images_task.delay(batch, concurrency)


@app.task(bind=True)
def batch_download_asset_images_task(
    self: Task, batch: UUID, concurrency: int = 10
) -> None:
    """
    Process DownloadAssetImageJobs in groups of size concurrency.

    Retrieves the batch's jobs that have neither ``completed`` nor ``failed``
    set (oldest first), runs up to concurrency tasks, then schedules the next
    group via a chord callback until none remain.

    Args:
        batch: Identifier for the batch to process.
        concurrency: Number of concurrent tasks per group. Defaults to 10.
    """
    logger.info(
        "Processing next %s DownloadAssetImageJobs for batch %s", concurrency, batch
    )

    jobs_to_process = models.DownloadAssetImageJob.objects.filter(
        batch=batch, completed__isnull=True, failed__isnull=True
    ).order_by("created")

    if not jobs_to_process.exists():
        logger.info("No DownloadAssetImageJobs found for batch %s", batch)
        return

    # Read the foreign key column directly. ``job.asset.pk`` would load every
    # Asset with its own query just to obtain the same value, and the
    # verification batch task already uses ``asset_id``.
    task_groups = [
        download_asset_image_task.s(job.asset_id, batch)
        for job in jobs_to_process[:concurrency]
    ]

    # Use a chord so when the tasks finish it calls the callback to start the
    # remaining jobs until no more remain. The callback just re-invokes this
    # task with the same batch and concurrency.
    chord(task_groups)(batch_download_asset_images_task_callback.s(batch, concurrency))


@app.task(
    bind=True,
    autoretry_for=(HTTPError,),
    retry_backoff=60 * 60,
    retry_backoff_max=8 * 60 * 60,
    retry_jitter=True,
    retry_kwargs={"max_retries": 3},
    rate_limit=1,
)
def download_asset_image_task(
    self: Task, asset_pk: int, batch: Optional[UUID] = None, create_job: bool = False
) -> None:
    """
    Download an asset's image and track it via DownloadAssetImageJob.

    Creates a job, or retrieves the uncompleted one for this asset and batch,
    and delegates to download_asset. The task is configured to retry
    automatically on HTTPError.

    Args:
        asset_pk: Primary key of the Asset to download.
        batch: Identifier for the batch, if any.
        create_job: If True, create a new job; otherwise fetch an existing one.

    Raises:
        Asset.DoesNotExist: When the Asset cannot be found.
        models.DownloadAssetImageJob.DoesNotExist: When fetching a job that
            does not exist.
    """
    try:
        asset = Asset.objects.get(pk=asset_pk)
    except Asset.DoesNotExist:
        # Name this task in the message; it previously named the
        # verify_asset_image task, which pointed log readers at the wrong one.
        logger.exception(
            "Asset %s could not be found while attempting to "
            "spawn download_asset_image task",
            asset_pk,
        )
        raise

    if create_job:
        job = models.DownloadAssetImageJob.objects.create(asset=asset, batch=batch)
    else:
        try:
            job = models.DownloadAssetImageJob.objects.get(
                asset=asset, batch=batch, completed=None
            )
        except models.DownloadAssetImageJob.DoesNotExist:
            logger.exception(
                "Uncompleted DownloadAssetImageJob for asset %s and batch %s could not "
                "be found while attempting to spawn download_asset_image task",
                asset,
                batch,
            )
            raise

    return download_asset(self, job)


================================================
FILE: importer/tasks/items.py
================================================
import io
import mimetypes
import os
import re
from logging import getLogger
from typing import Any, List, Optional, Tuple
from urllib.parse import urljoin, urlparse

import requests
from celery import Task, group
from django.core.exceptions import ValidationError
from django.core.files.base import ContentFile
from django.db import transaction
from django.utils.text import slugify
from django.utils.timezone import now
from PIL import Image, UnidentifiedImageError
from requests.exceptions import HTTPError

from concordia.models import Asset, Item, MediaType
from importer import models
from importer.celery import app

from .assets import download_asset_task
from .decorators import update_task_status

#: First path segments that ``import_items_into_project_from_url`` accepts.
#: A URL under ``item`` is imported as a single item; a URL under any other
#: prefix is handed to the collection import task.
#:
#: P1 has generic search / item pages and a number of top-level format-specific
#: "context portals" which expose the same JSON interface.
#: jq 'to_entries[] | select(.value.type == "context-portal") | .key' < manifest.json
ACCEPTED_P1_URL_PREFIXES = [
    "collections",
    "search",
    "item",
    "audio",
    "books",
    "film-and-videos",
    "manuscripts",
    "maps",
    "newspapers",
    "notated-music",
    "photos",
    "websites",
]

# Module-level logger shared by the tasks and helpers in this file.
logger = getLogger(__name__)

# Tasks


@app.task(
    bind=True,
    autoretry_for=(HTTPError,),
    retry_backoff=60 * 60,
    retry_backoff_max=8 * 60 * 60,
    retry_jitter=True,
    retry_kwargs={"max_retries": 3},
    rate_limit=2,
)
def create_item_import_task(
    self: Task, import_job_pk: int, item_url: str, redownload: bool = False
) -> Any:
    """
    Create an ImportItem for the given job and item URL, then enqueue its
    import.

    Fetches item metadata from the remote URL, ensures the Item and
    ImportItem exist, skips fully-imported items when not redownloading, and
    finally schedules ``import_item_task``. The task is automatically retried
    on HTTPError with jittered exponential backoff (up to 3 retries).

    Args:
        import_job_pk: Primary key of the ImportJob.
        item_url: Absolute item URL on loc.gov.
        redownload: Reprocess an existing item even if it has all assets.

    Returns:
        The AsyncResult returned by ``import_item_task.delay``, or None when
        the item already has all of its assets and is skipped.
    """
    import_job = models.ImportJob.objects.get(pk=import_job_pk)

    # Load the Item record with metadata from the remote URL:
    resp = requests.get(item_url, params={"fo": "json"}, timeout=30)
    resp.raise_for_status()
    item_data = resp.json()

    item, item_created = Item.objects.get_or_create(
        item_id=get_item_id_from_item_url(item_data["item"]["id"]),
        defaults={"item_url": item_url, "project": import_job.project},
    )

    import_item, _ = import_job.items.get_or_create(url=item_url, item=item)

    if not item_created and redownload is False:
        # Item has already been imported and we are not redownloading all items.
        asset_urls, item_resource_url = get_asset_urls_from_item_resources(
            item.metadata.get("resources", [])
        )
        if item.asset_set.count() >= len(asset_urls):
            # The item has all of its assets, so we can skip it.
            logger.warning("Not reprocessing existing item with all assets: %s", item)
            import_item.update_status(
                f"Not reprocessing existing item with all assets: {item}",
                do_save=False,
            )
            import_item.completed = import_item.last_started = now()
            import_item.task_id = self.request.id
            import_item.full_clean()
            import_item.save()
            return
        else:
            # The item is missing one or more of its assets, so reprocess it.
            logger.warning("Reprocessing existing item %s that is missing assets", item)

    # Mutate the very instance that is validated and saved below. When the
    # ImportItem was fetched rather than created, ``import_item.item`` may be
    # a separately loaded Item instance, so changes made through it would not
    # be persisted by ``item.save()``.
    item.metadata.update(item_data)
    thumbnail_url = populate_item_from_data(item, item_data["item"])

    try:
        item.full_clean()
        item.save()
    except Exception as exc:
        # We create the import jobs here, so we cannot rely on the decorator to
        # update status. Update the ImportItem status manually then re-raise.
        logger.exception("Unhandled exception when importing item %s", item)
        new_status = "{}\n\nUnhandled exception: {}".format(
            import_item.status, exc
        ).strip()
        import_item.update_status(new_status, do_save=False)
        import_item.failed = now()
        import_item.task_id = self.request.id
        import_item.save()
        raise

    # populate_item_from_data returns None when the item has no usable
    # thumbnail; there is nothing to download in that case and the asset
    # import must still be scheduled.
    if thumbnail_url:
        download_and_set_item_thumbnail(item, thumbnail_url)

    return import_item_task.delay(import_item.pk)


@app.task(bind=True)
def import_item_task(self: Task, import_item_pk: int) -> Any:
    """
    Load an ImportItem by primary key and hand it to ``import_item``.

    The ImportItem is fetched together with its related Item.

    Args:
        import_item_pk: Primary key of the ImportItem to process.

    Returns:
        Whatever ``import_item`` returns for the loaded ImportItem.
    """
    import_items_with_item = models.ImportItem.objects.select_related("item")
    loaded_import_item = import_items_with_item.get(pk=import_item_pk)
    return import_item(self, loaded_import_item)


@update_task_status
def import_item(self: Task, import_item: Any) -> Any:
    """
    Build and persist the Assets for an ImportItem, then queue their downloads.

    One Asset and one matching ImportItemAsset are created for every asset URL
    found in the item's ``resources`` metadata. A validation failure on any
    Asset aborts the whole import. Wrapped with ``update_task_status``.

    Args:
        self: Celery Task instance.
        import_item: ImportItem instance being processed.

    Returns:
        The result of invoking the celery group of download tasks.
    """
    # All rows are written inside one atomic block so they are committed
    # before any download_asset_task is dispatched; otherwise a worker could
    # pick up a task whose rows are not visible yet and fail.
    with transaction.atomic():
        item = import_item.item

        asset_urls, item_resource_url = get_asset_urls_from_item_resources(
            item.metadata.get("resources", [])
        )

        campaign = item.project.campaign
        storage_prefix = "/".join([campaign.slug, item.project.slug, item.item_id])

        item_assets: List[Asset] = []
        for sequence, asset_url in enumerate(asset_urls, start=1):
            title = f"{item.item_id}-{sequence}"
            _, dotted_extension = os.path.splitext(urlparse(asset_url).path)
            extension = dotted_extension.lstrip(".").lower()

            new_asset = Asset(
                item=item,
                campaign=campaign,
                title=title,
                slug=slugify(title, allow_unicode=True),
                sequence=sequence,
                media_type=MediaType.IMAGE,
                download_url=asset_url,
                resource_url=item_resource_url,
                storage_image=f"{storage_prefix}/{sequence}.{extension}",
            )

            # Validation errors are not skipped: they fail the import, with
            # enough context in the message to identify the offending asset.
            try:
                new_asset.full_clean()
            except ValidationError as exc:
                raise ValidationError(
                    f"Importing asset with slug '{new_asset.slug}' for "
                    f"item '{new_asset.item}' with resource URL "
                    f"'{new_asset.resource_url}' failed with the following "
                    f"exception: {exc}"
                ) from exc

            item_assets.append(new_asset)

        Asset.objects.bulk_create(item_assets)

        import_assets: List[Any] = []
        for created_asset in item_assets:
            tracking_row = models.ImportItemAsset(
                import_item=import_item,
                asset=created_asset,
                url=created_asset.download_url,
                sequence_number=created_asset.sequence,
            )
            tracking_row.full_clean()
            import_assets.append(tracking_row)

        import_item.assets.bulk_create(import_assets)

        import_item.full_clean()
        import_item.save()

    downloads = group(download_asset_task.s(entry.pk) for entry in import_assets)
    return downloads()


# End tasks


def import_item_count_from_url(import_url: str) -> Tuple[str, int]:
    """
    Report how many files the first resource of a loc.gov item exposes.

    Requests the item's JSON (``fo=json``) and counts the entries in
    ``resources[0]["files"]``. Any exception raised along the way is caught
    and reported in the returned message instead of being raised.

    Args:
        import_url: Absolute item URL.

    Returns:
        ``(status_message, count)``; on any error the count is 0 and the
        message describes the exception.
    """
    try:
        response = requests.get(import_url, params={"fo": "json"}, timeout=30)
        response.raise_for_status()
        first_resource_files = response.json()["resources"][0]["files"]
        asset_count = len(first_resource_files)
    except Exception as exc:
        return f"Unhandled exception importing {import_url} {exc}", 0

    return f"{import_url} - Asset Count: {asset_count}", asset_count


def get_item_info_from_result(
    result: dict,
) -> Optional[Tuple[str, str]]:
    """
    Extract an item_id and item_url from a P1 search result.

    Skips results with unsupported formats, without an image_url, or whose
    URL is not a ``loc.gov/item/<id>`` URL. Every skip is logged at INFO
    level.

    Args:
        result: A single result object from the P1 JSON response. Must
            contain ``id``, ``original_format`` and ``url``.

    Returns:
        ``(item_id, item_url)`` when supported, otherwise None.
    """
    ignored_formats = {"collection", "web page"}

    item_id = result["id"]
    original_format = result["original_format"]

    if ignored_formats.intersection(original_format):
        logger.info(
            "Skipping result %s because it contains an unsupported format: %s",
            item_id,
            original_format,
            extra={"data": {"result": result}},
        )
        return None

    image_url = result.get("image_url")
    if not image_url:
        logger.info(
            "Skipping result %s because it lacks an image_url",
            item_id,
            extra={"data": {"result": result}},
        )
        return None

    item_url = result["url"]

    # The dot is escaped so only a literal "loc.gov" host matches; an
    # unescaped "." would accept any character in that position.
    m = re.search(r"loc\.gov/item/([^/]+)", item_url)
    if not m:
        logger.info(
            "Skipping %s because the URL %s doesn't appear to be an item!",
            item_id,
            item_url,
            extra={"data": {"result": result}},
        )
        return None

    return m.group(1), item_url


def get_item_id_from_item_url(item_url: str) -> str:
    """
    Return the last path segment of an item URL as its item_id.

    A single trailing slash is tolerated: for a URL ending in ``/`` the
    segment just before that slash is returned.

    Args:
        item_url: Absolute item URL.

    Returns:
        The item_id string.
    """
    segments = item_url.split("/")
    # A trailing slash leaves an empty final segment, so step back one.
    return segments[-2] if item_url.endswith("/") else segments[-1]


def import_items_into_project_from_url(
    requesting_user: Any, project: Any, import_url: str, redownload: bool = False
) -> Any:
    """
    Validate an import URL, record an ImportJob and queue the matching task.

    The first path segment of the URL must be one of
    ``ACCEPTED_P1_URL_PREFIXES``. ``item`` URLs are queued with
    ``create_item_import_task``; every other accepted prefix is queued with
    ``import_collection_task``.

    Args:
        requesting_user: User creating the ImportJob.
        project: Project that will own the imported Items.
        import_url: loc.gov item or collection/search URL.
        redownload: Reprocess existing items even if they have all assets.

    Returns:
        The created ImportJob instance.

    Raises:
        ValueError: If the URL path does not start with an accepted prefix.
    """
    url_path = urlparse(import_url).path

    prefix_alternatives = "|".join(
        re.escape(prefix) for prefix in ACCEPTED_P1_URL_PREFIXES
    )
    prefix_match = re.match(r"^/(%s)/" % prefix_alternatives, url_path)
    if prefix_match is None:
        raise ValueError(
            f"{import_url} doesn't match one of the known importable patterns"
        )

    import_job = models.ImportJob(
        project=project, created_by=requesting_user, url=import_url
    )
    import_job.full_clean()
    import_job.save()

    if prefix_match.group(1) != "item":
        # Collections and search results share one JSON format, so a single
        # task handles both.
        from .collections import import_collection_task

        import_collection_task.delay(import_job.pk, redownload)
    else:
        create_item_import_task.delay(import_job.pk, import_url, redownload)

    return import_job


def populate_item_from_data(item: Item, item_info: dict) -> Optional[str]:
    """
    Populate an Item from a loc.gov item JSON fragment.

    Sets title and description when present. Picks the first ``image_url``
    entry containing ``.jpg`` as the thumbnail, resolves it against
    ``item.item_url``, stores it on the Item, and returns it. A missing,
    empty or malformed ``image_url`` is treated as "no thumbnail" rather
    than an error.

    Args:
        item: The Item instance to update.
        item_info: The ``item`` object from the P1 response.

    Returns:
        The resolved thumbnail URL when found, otherwise None.
    """
    for k in ("title", "description"):
        v = item_info.get(k)
        if v:
            setattr(item, k, v)

    # FIXME: this was never set before so we do not have selection logic.
    # ``image_url`` is read with .get() so that a missing or null value falls
    # through to "no thumbnail" instead of raising.
    try:
        image_urls = item_info.get("image_url") or []
        thumb_urls = [u for u in image_urls if ".jpg" in u]
    except Exception:
        # Deliberate best-effort: a malformed image_url must not fail the
        # import, it only means no thumbnail is selected.
        thumb_urls = []

    if thumb_urls:
        resolved = urljoin(item.item_url, thumb_urls[0])
        # TODO: remove setting thumbnail_url once field is removed.
        item.thumbnail_url = resolved
        return resolved
    return None


def get_asset_urls_from_item_resources(
    resources: List[dict],
) -> Tuple[List[str], str]:
    """
    Choose one download URL per file from a P1 ``resources`` list.

    Every file is a list of variants. Among the variants that carry ``url``,
    ``height`` and ``width``, the JPEG with the largest pixel area wins; when
    a file has no JPEG variant the largest GIF is used instead. Files with
    neither contribute nothing. The ``url`` of the first resource is returned
    alongside, or an empty string when it is unavailable.

    Args:
        resources: The ``resources`` array from the P1 response.

    Returns:
        A tuple of ``(asset_urls, item_resource_url)``.
    """
    try:
        item_resource_url = resources[0]["url"] or ""
    except (IndexError, KeyError):
        item_resource_url = ""

    required_keys = ("url", "height", "width")
    selected_urls: List[str] = []

    for resource in resources:
        for file_variants in resource.get("files", []):
            jpeg_variants: List[Tuple[str, int]] = []
            gif_variants: List[Tuple[str, int]] = []

            for variant in file_variants:
                # Variants lacking a URL or dimensions cannot be ranked.
                if not all(key in variant for key in required_keys):
                    continue

                url = variant["url"]
                height = variant["height"]
                width = variant["width"]
                mimetype = variant.get("mimetype")

                if mimetype == "image/jpeg":
                    jpeg_variants.append((url, height * width))
                elif mimetype == "image/gif":
                    gif_variants.append((url, height * width))

            # JPEGs take precedence; GIFs are only a fallback.
            ranked_pool = jpeg_variants if jpeg_variants else gif_variants
            if ranked_pool:
                largest_first = sorted(
                    ranked_pool, key=lambda pair: pair[1], reverse=True
                )
                selected_urls.append(largest_first[0][0])

    return selected_urls, item_resource_url


def _guess_extension(content_type: Optional[str], url_path: str) -> str:
    """Guess a safe extension from Content-Type or URL, defaulting to .bin."""
    if content_type:
        ext = mimetypes.guess_extension(content_type.split(";")[0].strip())
        if ext:
            return ext
    _, ext = os.path.splitext(url_path)
    if ext:
        return ext.lower()
    return ".bin"


def _safe_filename(item: Item, ext: str) -> str:
    """
    Return ``<slug><ext>`` for the item's thumbnail file.

    The slug comes from ``item.item_id``; ``item-<pk>`` is used when the
    item_id is empty or slugifies to an empty string.
    """
    fallback = f"item-{item.pk}"
    stem = slugify(item.item_id or fallback) or fallback
    return f"{stem}{ext}"


def download_and_set_item_thumbnail(
    item: Item,
    url: str,
    force: bool = False,
    connect_timeout: float = 5.0,
    read_timeout: float = 30.0,
) -> str:
    """
    Download an image from url and save it to item.thumbnail_image.

    The image is validated with Pillow. The function will not set a new
    thumbnail_image if one already exists unless ``force=True``. Filename is
    stable per item and inferred from Content-Type or URL with a safe fallback.

    Args:
        item: The Item instance to modify and save.
        url: Absolute URL for the image to download.
        force: Overwrite an existing thumbnail if True.
        connect_timeout: Requests connect timeout in seconds.
        read_timeout: Requests read timeout in seconds.

    Returns:
        The storage path of the saved image, or a message if skipped.

    Raises:
        ValueError: If the downloaded bytes are not a valid image, whether
            Pillow cannot identify the format or reports the file as broken.
        requests.RequestException: Network errors during download.
    """
    # Lock the row briefly to avoid pointless work if someone else is writing.
    with transaction.atomic():
        locked = (
            Item.objects.select_for_update(of=("self",))
            .only("id", "thumbnail_image")
            .get(pk=item.pk)
        )
        if locked.thumbnail_image and not force:
            msg = "Thumbnail already exists; skipping (use force=True to overwrite)."
            logger.warning(
                "download_and_set_item_thumbnail: %s item_pk=%s", msg, item.pk
            )
            return msg

    timeout = (connect_timeout, read_timeout)
    logger.info(
        "download_and_set_item_thumbnail: downloading url=%s item_pk=%s",
        url,
        item.pk,
    )

    # The whole body is buffered in memory so it can be validated before
    # anything is written to storage.
    with requests.get(url, stream=True, timeout=timeout) as resp:
        resp.raise_for_status()
        content_type = (resp.headers.get("Content-Type") or "").lower()

        buf = io.BytesIO()
        for chunk in resp.iter_content(chunk_size=64 * 1024):
            if not chunk:
                continue
            buf.write(chunk)

    # Validate image integrity with Pillow. Image.open raises
    # UnidentifiedImageError for unknown formats, while verify() raises other
    # exception types (OSError, SyntaxError) for recognised but corrupt
    # files; all of them mean "not a valid image" and are reported as the
    # documented ValueError.
    try:
        buf.seek(0)
        with Image.open(buf) as img:
            img.verify()
    except (UnidentifiedImageError, OSError, SyntaxError) as exc:
        raise ValueError("Downloaded file is not a valid image.") from exc

    # Decide file extension. Try header, URL, then Pillow.
    url_path = urlparse(url).path
    ext = _guess_extension(content_type, url_path)
    # If we got a blank or .bin extension we could not infer it from headers
    # or URL. Inspect bytes with Pillow, default to jpg.
    if ext in (".bin", ""):
        try:
            # verify() leaves the image object unusable, so the buffer is
            # reopened to read the detected format.
            buf.seek(0)
            with Image.open(buf) as probe:
                fmt = (probe.format or "").lower()
            ext = {
                "jpeg": ".jpg",
                "jpg": ".jpg",
                "png": ".png",
                "gif": ".gif",
                "webp": ".webp",
                "tiff": ".tif",
                "bmp": ".bmp",
            }.get(fmt, ".jpg")
        finally:
            buf.seek(0)

    filename = _safe_filename(item, ext)
    content = ContentFile(buf.getvalue())

    # Re-check under a fresh row lock: another writer may have stored a
    # thumbnail while the download was in progress.
    with transaction.atomic():
        locked = Item.objects.select_for_update(of=("self",)).get(pk=item.pk)
        if locked.thumbnail_image and not force:
            msg = (
                "Thumbnail already present after download; skipping save. "
                "Use force=True to overwrite."
            )
            logger.warning(
                "download_and_set_item_thumbnail: %s item_id=%s", msg, item.pk
            )
            return msg
        locked.thumbnail_image.save(filename, content, save=True)
        logger.info(
            "download_and_set_item_thumbnail: saved as %s item_id=%s",
            locked.thumbnail_image.name,
            locked.pk,
        )
    return locked.thumbnail_image.name


================================================
FILE: importer/tests/README.md
================================================
# Importer Tests

This directory contains tests for the importer application. It has a
combination of Django TestCases (which run against a test database that
Django creates before the test run) and plain Python `unittest` tests.

## Pre-requisites

-   Regarding Django TestCases, since these tests create a test database, the docker container with the db must be running — for example:

    ```console
    $ docker-compose up -d db
    ```

-   Use the settings module with defaults appropriate for testing:

    ```console
    $ export DJANGO_SETTINGS_MODULE=concordia.settings_test
    ```

    or

    ```console
    $ pipenv run python manage.py test --settings=concordia.settings_test
    ```

## Running the tests

-   To run all tests:

    ```console
    $ python manage.py test importer
    ```

-   To run a single unittest module:

    ```console
    $ python manage.py test importer.tests.test_importer
    ```

-   To run a single unittest in a django unittest module:

    ```console
    $ python manage.py test importer.tests.test_importer.CreateCampaignViewTest.test_create_item_campaign
    ```


================================================
FILE: importer/tests/__init__.py
================================================


================================================
FILE: importer/tests/test_admin.py
================================================
import uuid
from unittest import mock

from django.contrib import messages
from django.test import RequestFactory, TestCase
from django.utils import timezone

from concordia.models import Campaign
from concordia.tests.utils import create_asset, create_campaign
from importer.admin import (
    BatchFilter,
    ImportCampaignListFilter,
    TaskStatusModelAdmin,
    retry_download_task,
)
from importer.models import ImportItemAsset, VerifyAssetImageJob

from .utils import create_import_asset, create_verify_asset_image_job


@mock.patch("importer.admin.download_asset_task.delay", autospec=True)
@mock.patch("importer.admin.messages.add_message", autospec=True)
class ActionTests(TestCase):
    """Tests for the admin actions defined in importer.admin."""

    def test_retry_download_task(self, messages_mock, task_mock):
        """Each selected import asset is queued once and one message is shown."""
        # Ten import assets that all belong to the same import item.
        first_import_asset = create_import_asset(0)
        all_import_assets = [first_import_asset]
        for index in range(1, 10):
            all_import_assets.append(
                create_import_asset(index, import_item=first_import_asset.import_item)
            )
        expected_total = len(all_import_assets)
        expected_task_args = [(entry.pk,) for entry in all_import_assets]
        admin_stub = mock.MagicMock()
        request = RequestFactory().get("/")

        retry_download_task(admin_stub, request, ImportItemAsset.objects.all())

        positional_args = [call.args for call in task_mock.call_args_list]
        self.assertEqual(task_mock.call_count, expected_total)
        self.assertEqual(positional_args, expected_task_args)
        self.assertEqual(messages_mock.call_count, 1)
        self.assertEqual(
            messages_mock.call_args.args,
            (request, messages.INFO, f"Queued {expected_total} tasks"),
        )


class ImportCampaignListFilterTest(TestCase):
    """Tests for ImportCampaignListFilter.lookups."""

    def test_lookups(self):
        """Retired campaigns are left out of the lookup choices."""

        class TestImportCampaignListFilter(ImportCampaignListFilter):
            # ImportCampaignListFilter has no parameter_name of its own and
            # is not meant to be used directly, so the test needs a concrete
            # subclass.
            parameter_name = "campaign"

        listed_campaigns = []
        for index in range(5):
            listed_campaigns.append(create_campaign(slug=f"test-campaign-{index}"))
        listed_campaigns.append(
            create_campaign(
                slug="test-campaign-completed", status=Campaign.Status.COMPLETED
            )
        )
        retired_campaign = create_campaign(
            slug="test-campaign-retired",
            title="Retired Campaign",
            status=Campaign.Status.RETIRED,
        )

        list_filter = TestImportCampaignListFilter(
            None, {}, mock.MagicMock(), mock.MagicMock()
        )
        choices = list_filter.lookups(mock.MagicMock(), mock.MagicMock())

        self.assertEqual(len(choices), len(listed_campaigns))
        for campaign_id, campaign_title in choices:
            self.assertNotEqual(campaign_id, retired_campaign.id)
            self.assertNotIn("Retired", campaign_title)


@mock.patch("importer.admin.naturaltime")
class TaskStatusModelAdminTest(TestCase):
    """Tests for TaskStatusModelAdmin helpers."""

    def test_generate_natural_timestamp_display_property(self, naturaltime_mock):
        """The generated accessor formats set values and returns None otherwise."""
        display = TaskStatusModelAdmin.generate_natural_timestamp_display_property(
            "test_field"
        )

        # Field present with a value: naturaltime is used.
        with_value = mock.MagicMock()
        display(with_value)
        self.assertTrue(naturaltime_mock.called)

        # Field present but None: nothing to format.
        naturaltime_mock.reset_mock()
        with_none = mock.MagicMock(spec=["test_field"])
        with_none.test_field = None
        result = display(with_none)
        self.assertEqual(result, None)
        self.assertFalse(naturaltime_mock.called)

        # Field missing entirely: an empty spec makes every attribute access
        # on the mock raise AttributeError.
        naturaltime_mock.reset_mock()
        without_field = mock.MagicMock(spec=[])
        result = display(without_field)
        self.assertEqual(result, None)
        self.assertFalse(naturaltime_mock.called)


class BatchFilterTests(TestCase):
    """Tests for BatchFilter lookups and queryset filtering."""

    def setUp(self):
        """Create six batches, each with one uncompleted verify job."""
        self.request = mock.MagicMock()
        self.model_admin = mock.MagicMock()
        self.filter = BatchFilter(
            self.request, {}, VerifyAssetImageJob, self.model_admin
        )
        (
            self.batch1,
            self.batch2,
            self.batch3,
            self.batch4,
            self.batch5,
            self.batch6,
        ) = (str(uuid.uuid4()) for _ in range(6))

        first_asset = create_asset()
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")
        third_asset = create_asset(item=first_asset.item, slug="test-asset-3")

        jobs_to_create = [
            (first_asset, self.batch1),
            (second_asset, self.batch2),
            (third_asset, self.batch3),
            (third_asset, self.batch4),
            (third_asset, self.batch5),
            (third_asset, self.batch6),
        ]
        for job_asset, job_batch in jobs_to_create:
            create_verify_asset_image_job(
                asset=job_asset, batch=job_batch, completed=None
            )

    @mock.patch("importer.admin.BatchFilter.value", return_value=None)
    def test_lookups_incomplete_batches(self, mock_value):
        """With six incomplete batches, five lookups are returned."""
        self.model_admin.get_queryset.return_value = VerifyAssetImageJob.objects.all()
        choices = self.filter.lookups(self.request, self.model_admin)
        self.assertEqual(len(choices), 5)

    @mock.patch("importer.admin.BatchFilter.value", return_value=None)
    def test_lookups_includes_current_batch(self, mock_value):
        """The currently selected batch appears in the lookups."""
        mock_value.return_value = self.batch2
        self.model_admin.get_queryset.return_value = VerifyAssetImageJob.objects.all()
        choices = self.filter.lookups(self.request, self.model_admin)
        offered_batches = [choice[0] for choice in choices]
        self.assertIn(self.batch2, offered_batches)

    @mock.patch("importer.admin.BatchFilter.value", return_value=None)
    def test_lookups_includes_recent_completed_batch(self, mock_value):
        """A batch completed just now appears in the lookups."""
        just_completed = VerifyAssetImageJob.objects.filter(batch=self.batch6)
        just_completed.update(completed=timezone.now())
        self.model_admin.get_queryset.return_value = VerifyAssetImageJob.objects.all()
        choices = self.filter.lookups(self.request, self.model_admin)
        offered_batches = [choice[0] for choice in choices]
        self.assertIn(self.batch6, offered_batches)

    @mock.patch("importer.admin.BatchFilter.value", return_value=None)
    def test_lookups_fills_with_completed_batches(self, mock_value):
        """Five lookups are returned when five of the six batches are completed."""
        completed_batches = [
            self.batch1,
            self.batch2,
            self.batch3,
            self.batch4,
            self.batch5,
        ]
        VerifyAssetImageJob.objects.filter(batch__in=completed_batches).update(
            completed=timezone.now()
        )
        self.model_admin.get_queryset.return_value = VerifyAssetImageJob.objects.all()
        choices = self.filter.lookups(self.request, self.model_admin)
        self.assertEqual(len(choices), 5)

    @mock.patch("importer.admin.BatchFilter.value", return_value=None)
    def test_queryset_filters_correctly(self, mock_value):
        """Selecting a batch restricts the queryset to that batch."""
        mock_value.return_value = self.batch1
        filtered = self.filter.queryset(self.request, VerifyAssetImageJob.objects.all())
        found_batches = filtered.values_list("batch", flat=True)
        self.assertTrue(all(str(found) == self.batch1 for found in found_batches))

    @mock.patch("importer.admin.BatchFilter.value", return_value=None)
    def test_queryset_returns_all_when_no_batch_selected(self, mock_value):
        """With no batch selected the queryset is left unfiltered."""
        mock_value.return_value = None
        unfiltered = self.filter.queryset(
            self.request, VerifyAssetImageJob.objects.all()
        )
        self.assertEqual(unfiltered.count(), VerifyAssetImageJob.objects.count())


================================================
FILE: importer/tests/test_celery.py
================================================
import tempfile
from types import SimpleNamespace
from unittest import mock

from django.test import TestCase

import importer.celery as celery_mod
from importer.celery import import_all_submodules


class ImporterCeleryTests(TestCase):
    """Tests for the submodule auto-import helpers in ``importer.celery``."""

    def test_returns_early_for_non_package(self):
        """A module lacking ``__path__`` is imported but never walked."""
        plain_module = SimpleNamespace(__name__="not_a_pkg")  # no __path__
        patch_import = mock.patch.object(
            celery_mod.importlib, "import_module", return_value=plain_module
        )
        patch_walk = mock.patch.object(celery_mod.pkgutil, "walk_packages")

        with patch_import as import_mock, patch_walk as walk_mock:
            import_all_submodules("not_a_pkg")

        import_mock.assert_called_once_with("not_a_pkg")
        walk_mock.assert_not_called()

    def test_imports_all_submodules_for_package(self):
        """Each name yielded by ``walk_packages`` is passed to ``import_module``."""
        discovered = [
            SimpleNamespace(name="dummy_pkg.sub1"),
            SimpleNamespace(name="dummy_pkg.sub2"),
        ]

        with tempfile.TemporaryDirectory() as pkg_dir:
            package = SimpleNamespace(__name__="dummy_pkg", __path__=[pkg_dir])

            def fake_import(name):
                # Only the top-level name resolves to the fake package.
                if name != "dummy_pkg":
                    return SimpleNamespace(__name__=name)
                return package

            patch_import = mock.patch.object(
                celery_mod.importlib, "import_module", side_effect=fake_import
            )
            patch_walk = mock.patch.object(
                celery_mod.pkgutil, "walk_packages", return_value=discovered
            )
            with patch_import as import_mock, patch_walk as walk_mock:
                import_all_submodules("dummy_pkg")

        walk_mock.assert_called_once()
        positional, _ = walk_mock.call_args
        self.assertEqual(positional[0], package.__path__)
        self.assertEqual(positional[1], package.__name__ + ".")

        for expected in ("dummy_pkg", "dummy_pkg.sub1", "dummy_pkg.sub2"):
            self.assertIn(mock.call(expected), import_mock.mock_calls)

    def test_package_with_no_submodules(self):
        """An empty package is walked once and triggers no further imports."""
        with tempfile.TemporaryDirectory() as pkg_dir:
            package = SimpleNamespace(__name__="empty_pkg", __path__=[pkg_dir])

            def fake_import(name):
                if name == "empty_pkg":
                    return package
                return SimpleNamespace(__name__=name)

            with (
                mock.patch.object(
                    celery_mod.importlib, "import_module", side_effect=fake_import
                ) as import_mock,
                mock.patch.object(
                    celery_mod.pkgutil, "walk_packages", return_value=[]
                ) as walk_mock,
            ):
                import_all_submodules("empty_pkg")

        walk_mock.assert_called_once()
        import_mock.assert_called_once_with("empty_pkg")

    def test__load_all_task_modules_invokes_imports(self):
        """The handler imports ``concordia.tasks`` and then ``importer.tasks``."""
        expected_calls = [mock.call("concordia.tasks"), mock.call("importer.tasks")]
        with mock.patch.object(celery_mod, "import_all_submodules") as import_all_mock:
            celery_mod._load_all_task_modules(sender=celery_mod.app)

        import_all_mock.assert_has_calls(expected_calls, any_order=False)

    def test_on_after_finalize_signal_triggers_handler(self):
        """Sending ``on_after_finalize`` runs exactly the two expected imports."""
        expected_calls = [mock.call("concordia.tasks"), mock.call("importer.tasks")]
        with mock.patch.object(celery_mod, "import_all_submodules") as import_all_mock:
            celery_mod.app.on_after_finalize.send(sender=celery_mod.app)

        import_all_mock.assert_has_calls(expected_calls, any_order=False)
        self.assertEqual(import_all_mock.call_count, 2)


================================================
FILE: importer/tests/test_models.py
================================================
import uuid

from django.test import TestCase
from django.urls import reverse
from django.utils import timezone

from concordia.tests.utils import CreateTestUsers, create_asset, create_project
from importer.models import TaskStatusModel

from .utils import (
    create_download_asset_image_job,
    create_import_asset,
    create_import_item,
    create_import_job,
    create_verify_asset_image_job,
)


class ImportJobTests(TestCase, CreateTestUsers):
    """Tests for ``ImportJob`` string formatting, retrying and failure history."""

    def test_str(self):
        """``str()`` shows creator, project title and URL before and after set."""
        user = self.create_test_user()
        project = create_project()
        job = create_import_job(project=project)

        expected_blank = f"ImportJob(created_by=None, project={project.title}, url=)"
        self.assertEqual(str(job), expected_blank)

        url = "http://example.com"
        job.created_by = user
        job.url = url

        expected_filled = (
            f"ImportJob(created_by={user.username}, "
            f"project={project.title}, url={url})"
        )
        self.assertEqual(str(job), expected_filled)

    def test_retry_if_possible(self):
        """The placeholder ``retry_if_possible`` must run cleanly and be falsy."""
        # This method is just a placeholder for this model, so the only
        # things worth checking are that it doesn't error and that it
        # returns False, since any other value will cause issues
        job = create_import_job()
        outcome = job.retry_if_possible()

        self.assertFalse(outcome)

    def test_update_failure_history(self):
        """One failure is recorded with its timestamp, reason and status."""
        job = create_import_job()
        job.failure_history = []
        job.status = "Test failure status"
        job.failure_reason = TaskStatusModel.FailureReason.IMAGE
        job.failed = timezone.now()
        job.save()

        job.update_failure_history()

        history = job.failure_history
        self.assertEqual(len(history), 1)
        entry = history[0]
        self.assertNotEqual(entry["failed"], "")
        self.assertEqual(entry["failure_reason"], TaskStatusModel.FailureReason.IMAGE)
        self.assertEqual(entry["status"], "Test failure status")


class ImportItemTests(TestCase, CreateTestUsers):
    """Tests for ``ImportItem`` string formatting and its retry placeholder."""

    def test_str(self):
        """``str()`` embeds the parent job and the URL, empty or populated."""
        job = create_import_job()
        item = create_import_item(import_job=job)

        expected_blank = f"ImportItem(job={job}, url=)"
        self.assertEqual(str(item), expected_blank)

        url = "http://example.com"
        item.url = url

        expected_filled = f"ImportItem(job={job}, url={url})"
        self.assertEqual(str(item), expected_filled)

    def test_retry_if_possible(self):
        """The placeholder ``retry_if_possible`` must run cleanly and be falsy."""
        # This method is just a placeholder for this model, so the only
        # things worth checking are that it doesn't error and that it
        # returns False, since any other value will cause issues
        item = create_import_item()
        outcome = item.retry_if_possible()

        self.assertFalse(outcome)


class ImportItemAssetTests(TestCase, CreateTestUsers):
    """Tests for the string representation of ``ImportItemAsset``."""

    def test_str(self):
        """``str()`` embeds the parent import item and the URL."""
        item = create_import_item()
        asset = create_import_asset(import_item=item)

        expected_blank = f"ImportItemAsset(import_item={item}, url=)"
        self.assertEqual(str(asset), expected_blank)

        url = "http://example.com"
        asset.url = url

        expected_filled = f"ImportItemAsset(import_item={item}, url={url})"
        self.assertEqual(str(asset), expected_filled)


class VerifyAssetImageJobTests(TestCase):
    """Tests for ``VerifyAssetImageJob``: admin URLs, history and retries."""

    def setUp(self):
        """Create one verification job tied to a fresh asset and batch id."""
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()
        self.job = create_verify_asset_image_job(asset=self.asset, batch=self.batch_id)

    def _expected_batch_url(self):
        """Return the admin changelist URL filtered to this test's batch."""
        changelist = reverse("admin:importer_verifyassetimagejob_changelist")
        return changelist + f"?batch={self.batch_id}"

    def test_str_representation(self):
        """``str()`` names the job type and the asset it belongs to."""
        expected = f"VerifyAssetImageJob for {self.asset}"
        self.assertEqual(str(self.job), expected)

    def test_batch_admin_url(self):
        """The instance attribute points at the batch-filtered changelist."""
        self.assertEqual(self.job.batch_admin_url, self._expected_batch_url())

    def test_get_batch_admin_url(self):
        """The class-level helper builds the same URL from a batch id."""
        job_class = type(self.job)
        built = job_class.get_batch_admin_url(self.batch_id)
        self.assertEqual(built, self._expected_batch_url())

    def test_get_batch_admin_url_error(self):
        """An empty batch id is rejected with ``ValueError``."""
        job_class = type(self.job)
        with self.assertRaises(ValueError):
            job_class.get_batch_admin_url("")

    def test_update_failure_history(self):
        """A failed job records a single history entry with its reason."""
        self.job.status = "Failed due to image error"
        self.job.failure_reason = "Image"
        self.job.failed = timezone.now()

        self.job.update_failure_history()

        history = self.job.failure_history
        self.assertEqual(len(history), 1)
        self.assertEqual(history[0]["failure_reason"], "Image")

    def test_update_status(self):
        """Changing status stores the new value and logs the previous one."""
        self.job.update_status("Processing")

        history = self.job.status_history
        self.assertEqual(self.job.status, "Processing")
        self.assertEqual(len(history), 1)
        self.assertEqual(history[0]["status"], "")

    def test_reset_for_retry(self):
        """Resetting a failed job clears ``failed`` and bumps ``retry_count``."""
        self.job.failed = timezone.now()

        was_reset = self.job.reset_for_retry()

        self.assertTrue(was_reset)
        self.assertIsNone(self.job.failed)
        self.assertEqual(self.job.retry_count, 1)

    def test_reset_for_retry_when_not_failed(self):
        """A job that never failed is not reset and explains why in its status."""
        was_reset = self.job.reset_for_retry()

        self.assertFalse(was_reset)
        self.assertEqual(
            self.job.status,
            "Task was not marked as failed, so it will not be reset for retrying.",
        )


class DownloadAssetImageJobTests(TestCase):
    """Tests for ``DownloadAssetImageJob``: admin URLs, history and retries."""

    def setUp(self):
        """Create one download job tied to a fresh asset and batch id."""
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()
        self.job = create_download_asset_image_job(
            asset=self.asset, batch=self.batch_id
        )

    def _expected_batch_url(self):
        """Return the admin changelist URL filtered to this test's batch."""
        changelist = reverse("admin:importer_downloadassetimagejob_changelist")
        return changelist + f"?batch={self.batch_id}"

    def test_str_representation(self):
        """``str()`` names the job type and the asset it belongs to."""
        expected = f"DownloadAssetImageJob for {self.asset}"
        self.assertEqual(str(self.job), expected)

    def test_batch_admin_url(self):
        """The instance attribute points at the batch-filtered changelist."""
        self.assertEqual(self.job.batch_admin_url, self._expected_batch_url())

    def test_get_batch_admin_url(self):
        """The class-level helper builds the same URL from a batch id."""
        job_class = type(self.job)
        built = job_class.get_batch_admin_url(self.batch_id)
        self.assertEqual(built, self._expected_batch_url())

    def test_get_batch_admin_url_error(self):
        """An empty batch id is rejected with ``ValueError``."""
        job_class = type(self.job)
        with self.assertRaises(ValueError):
            job_class.get_batch_admin_url("")

    def test_update_failure_history(self):
        """A failed job records a single history entry with its reason."""
        self.job.status = "Failed due to image error"
        self.job.failure_reason = "Image"
        self.job.failed = timezone.now()

        self.job.update_failure_history()

        history = self.job.failure_history
        self.assertEqual(len(history), 1)
        self.assertEqual(history[0]["failure_reason"], "Image")

    def test_update_status(self):
        """Changing status stores the new value and logs the previous one."""
        self.job.update_status("Processing")

        history = self.job.status_history
        self.assertEqual(self.job.status, "Processing")
        self.assertEqual(len(history), 1)
        self.assertEqual(history[0]["status"], "")

    def test_reset_for_retry(self):
        """Resetting a failed job clears ``failed`` and bumps ``retry_count``."""
        self.job.failed = timezone.now()

        was_reset = self.job.reset_for_retry()

        self.assertTrue(was_reset)
        self.assertIsNone(self.job.failed)
        self.assertEqual(self.job.retry_count, 1)

    def test_reset_for_retry_when_not_failed(self):
        """A job that never failed is not reset and explains why in its status."""
        was_reset = self.job.reset_for_retry()

        self.assertFalse(was_reset)
        self.assertEqual(
            self.job.status,
            "Task was not marked as failed, so it will not be reset for retrying.",
        )


================================================
FILE: importer/tests/test_tasks_assets.py
================================================
import uuid
from unittest import mock

import requests
from django.core.cache import caches
from django.db.models import Max
from django.test import TestCase, override_settings
from django.utils import timezone
from PIL import UnidentifiedImageError

from concordia.models import Asset
from concordia.tests.utils import create_asset
from configuration.models import Configuration
from importer import exceptions, tasks
from importer.models import (
    DownloadAssetImageJob,
    ImportItemAsset,
    TaskStatusModel,
    VerifyAssetImageJob,
)

from .utils import (
    create_download_asset_image_job,
    create_import_asset,
    create_verify_asset_image_job,
)


class RedownloadImageTaskTests(TestCase):
    """Tests for ``tasks.images.redownload_image_task``."""

    @mock.patch("importer.tasks.images.download_asset")
    def test_redownload_image_task(self, mock_download):
        """Running the task for an existing asset calls ``download_asset``."""
        asset = create_asset()
        tasks.images.redownload_image_task(asset.pk)
        self.assertTrue(mock_download.called)


class AssetImportTests(TestCase):
    """Tests for asset URL selection and the asset image download/retry flow."""

    def setUp(self):
        """Clear caches and create the fixtures and mocks shared by the tests."""
        for cache in caches.all():
            cache.clear()

        self.import_asset = create_import_asset(url="http://example.com")
        self.asset = self.import_asset.asset
        self.job = create_download_asset_image_job(asset=self.asset)

        # It's difficult/impossible to cleanly mock a decorator due to the way
        # they're applied when the decorated object/function is evaluated on
        # import, so the update_task_status decorator runs for real in these
        # tests. We therefore need a mock object that can pass for a Celery
        # task object so update_task_status doesn't error during the test
        self.task_mock = mock.MagicMock()
        self.task_mock.request.id = "f81d4fae-7dec-11d0-a765-00a0c91e6bf6"

        # Chunks returned by the mocked response's iter_content()
        self.get_return_value = [b"chunk1", b"chunk2"]

        # NOTE(review): presumably the md5 of the chunks above joined
        # together; the checksum tests below expect it as the calculated hash
        self.valid_hash = "097c42989a9e5d9dcced7b35ec4b0486"
        self.invalid_hash = "bad-hash"

        self.filename = self.asset.get_asset_image_filename()

        # Stand-in for the boto3 S3 client; tests set head_object's return
        # value to control the ETag that the code under test sees
        self.head_object_mock = mock.MagicMock()
        self.s3_client_mock = mock.MagicMock()
        self.s3_client_mock.head_object = self.head_object_mock

    def tearDown(self):
        """Clear every cache again so state doesn't leak into other tests."""
        for cache in caches.all():
            cache.clear()

    def test_get_asset_urls_from_item_resources_empty(self):
        """No resources yields no asset URLs and an empty item resource URL."""
        self.assertEqual(tasks.items.get_asset_urls_from_item_resources([]), ([], ""))

    def test_get_asset_urls_from_item_resources_url_only(self):
        """A resource without files yields only the item resource URL."""
        results = tasks.items.get_asset_urls_from_item_resources(
            [{"url": "http://example.com"}]
        )
        self.assertEqual(results, ([], "http://example.com"))

    def test_get_asset_urls_from_item_resources_valid(self):
        """The larger JPEG is returned even though a bigger GIF is present."""
        results = tasks.items.get_asset_urls_from_item_resources(
            [
                {
                    "url": "http://example.com",
                    "files": [
                        [
                            {
                                "url": "http://example.com/1.jpg",
                                "height": 1,
                                "width": 1,
                                "mimetype": "image/jpeg",
                            },
                            {"url": "http://example.com/2.jpg"},
                            {
                                "url": "http://example.com/3.jpg",
                                "height": 2,
                                "width": 2,
                                "mimetype": "image/jpeg",
                            },
                            {
                                "url": "http://example.com/4.jpg",
                                "height": 100,
                                "width": 100,
                                "mimetype": "image/gif",
                            },
                        ]
                    ],
                }
            ]
        )
        self.assertEqual(results, (["http://example.com/3.jpg"], "http://example.com"))

    def test_get_asset_urls_from_item_resource_no_valid(self):
        """PDF, MOV and TIFF files produce no asset URLs at all."""
        results = tasks.items.get_asset_urls_from_item_resources(
            [
                {
                    "url": "http://example.com",
                    "files": [
                        [
                            {
                                "url": "http://example.com/1.jpg",
                                "height": 1,
                                "width": 1,
                                "mimetype": "file/pdf",
                            },
                            {"url": "http://example.com/2.jpg"},
                            {
                                "url": "http://example.com/3.jpg",
                                "height": 2,
                                "width": 2,
                                "mimetype": "video/mov",
                            },
                            {
                                "url": "http://example.com/4.jpg",
                                "height": 100,
                                "width": 100,
                                "mimetype": "image/tiff",
                            },
                        ]
                    ],
                }
            ]
        )
        self.assertEqual(results, ([], "http://example.com"))

    def test_get_asset_urls_from_item_resource_no_jpgs(self):
        """With no JPEG available, the larger GIF is returned instead."""
        results = tasks.items.get_asset_urls_from_item_resources(
            [
                {
                    "url": "http://example.com",
                    "files": [
                        [
                            {
                                "url": "http://example.com/1.jpg",
                                "height": 1,
                                "width": 1,
                                "mimetype": "file/pdf",
                            },
                            {"url": "http://example.com/2.jpg"},
                            {
                                "url": "http://example.com/3.gif",
                                "height": 2,
                                "width": 2,
                                "mimetype": "image/gif",
                            },
                            {
                                "url": "http://example.com/4.gif",
                                "height": 100,
                                "width": 100,
                                "mimetype": "image/gif",
                            },
                        ]
                    ],
                }
            ]
        )
        self.assertEqual(results, (["http://example.com/4.gif"], "http://example.com"))

    def test_download_asset_task(self):
        """The task loads the import asset by pk and hands it to download_asset."""
        with mock.patch("importer.tasks.assets.download_asset") as task_mock:
            tasks.assets.download_asset_task(self.import_asset.pk)
            self.assertTrue(task_mock.called)
            _task, called_import_asset = task_mock.call_args.args
            # assertEqual, not assertTrue: assertTrue's second argument is the
            # failure message, so it would never compare the two objects.
            self.assertEqual(called_import_asset, self.import_asset)

            # Test sending a bad pk
            task_mock.reset_mock()
            max_pk = ImportItemAsset.objects.aggregate(Max("pk"))["pk__max"]
            with self.assertRaises(ImportItemAsset.DoesNotExist):
                tasks.assets.download_asset_task(max_pk + 1)
            self.assertFalse(task_mock.called)

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_valid(self):
        """A matching ETag lets the download finish; the URL is streamed."""
        with (
            mock.patch("importer.tasks.assets.requests.get") as get_mock,
            mock.patch("importer.tasks.assets.boto3.client") as boto_mock,
            mock.patch("importer.tasks.assets.flag_enabled") as flag_mock,
        ):
            get_mock.return_value.iter_content.return_value = self.get_return_value
            boto_mock.return_value = self.s3_client_mock
            flag_mock.return_value = True
            self.head_object_mock.return_value = {"ETag": f'"{self.valid_hash}"'}

            tasks.assets.download_asset(self.task_mock, self.import_asset)

            self.assertEqual(get_mock.call_args[0], ("http://example.com",))
            self.assertTrue(get_mock.call_args[1]["stream"])

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_valid_checksum_fail(self):
        """With the flag mocked on, an ETag mismatch raises with a clear message."""
        with (
            mock.patch("importer.tasks.assets.requests.get") as get_mock,
            mock.patch("importer.tasks.assets.boto3.client") as boto_mock,
            mock.patch("importer.tasks.assets.flag_enabled") as flag_mock,
        ):
            get_mock.return_value.iter_content.return_value = self.get_return_value
            boto_mock.return_value = self.s3_client_mock
            flag_mock.return_value = True
            self.head_object_mock.return_value = {"ETag": f'"{self.invalid_hash}"'}

            with self.assertRaises(Exception) as assertion:
                tasks.assets.download_asset(self.task_mock, self.import_asset)

            self.assertEqual(
                str(assertion.exception),
                f"ETag {self.invalid_hash} for {self.filename} did not match "
                f"calculated md5 hash {self.valid_hash}",
            )

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_valid_checksum_fail_without_flag(self):
        """Without the flag mocked on, an ETag mismatch only logs a warning."""
        with (
            mock.patch("importer.tasks.assets.requests.get") as get_mock,
            mock.patch("importer.tasks.assets.boto3.client") as boto_mock,
            self.assertLogs("importer.tasks", level="WARN") as log,
        ):
            get_mock.return_value.iter_content.return_value = self.get_return_value
            boto_mock.return_value = self.s3_client_mock
            self.head_object_mock.return_value = {"ETag": f'"{self.invalid_hash}"'}

            tasks.assets.download_asset(self.task_mock, self.import_asset)
            self.assertEqual(
                log.output[0],
                f"WARNING:importer.tasks.assets:ETag ({self.invalid_hash}) for "
                f"{self.filename} did not match calculated md5 hash "
                f"({self.valid_hash}) but the IMPORT_IMAGE_CHECKSUM flag is disabled",
            )

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_invalid(self):
        """An error while fetching is logged and raised as ImageImportFailure."""
        with (
            mock.patch("importer.tasks.assets.requests.get") as get_mock,
            self.assertLogs("importer.tasks", level="ERROR") as log,
        ):
            get_mock.return_value.raise_for_status.side_effect = AttributeError
            with self.assertRaises(exceptions.ImageImportFailure):
                tasks.assets.download_asset(self.task_mock, self.import_asset)
            # Since the logging includes a stacktrace, we just check the
            # beginning of the log entry with assertIn
            self.assertIn(
                "ERROR:importer.tasks.assets:"
                "Unable to download http://example.com to "
                "test-campaign/test-project/testitem.0123456789/1.jpg",
                log.output[0],
            )

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_retry_success(self):
        """A failed image import is reset, recorded in history and re-queued."""
        import_asset = self.import_asset
        import_asset.failed = timezone.now()
        import_asset.completed = None
        import_asset.failure_reason = TaskStatusModel.FailureReason.IMAGE
        import_asset.status = "Test failed status"
        import_asset.retry_count = 0
        import_asset.failure_history = []
        import_asset.save()

        with mock.patch(
            "importer.models.tasks.assets.download_asset_task"
        ) as task_mock:
            response = import_asset.retry_if_possible()

            self.assertNotEqual(response, False)
            self.assertTrue(task_mock.apply_async.called)
            self.assertEqual(len(import_asset.failure_history), 1)
            self.assertEqual(import_asset.failed, None)
            self.assertEqual(import_asset.retry_count, 1)
            self.assertEqual(import_asset.failure_reason, "")

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_retry_maximum_exceeded(self):
        """Once retry_count reaches the configured maximum, no retry is queued."""
        # Ensure the retry limit is 1 whether or not the row already exists
        try:
            config = Configuration.objects.get(key="asset_image_import_max_retries")
            config.value = "1"
            config.data_type = Configuration.DataType.NUMBER
            config.save()
        except Configuration.DoesNotExist:
            Configuration.objects.create(
                key="asset_image_import_max_retries",
                value="1",
                data_type=Configuration.DataType.NUMBER,
            )

        import_asset = self.import_asset
        import_asset.failed = timezone.now()
        import_asset.completed = None
        import_asset.failure_reason = TaskStatusModel.FailureReason.IMAGE
        import_asset.status = "Test failed status"
        import_asset.retry_count = 1
        import_asset.failure_history = []
        import_asset.save()

        with mock.patch(
            "importer.models.tasks.assets.download_asset_task"
        ) as task_mock:
            response = import_asset.retry_if_possible()

            self.assertFalse(response)
            self.assertFalse(task_mock.apply_async.called)
            self.assertEqual(len(import_asset.failure_history), 1)
            self.assertNotEqual(import_asset.failed, None)
            self.assertEqual(
                import_asset.status,
                "Maximum number of retries reached while retrying image download "
                "for asset. The failure reason before retrying was Image and the "
                "status was Test failed status",
            )
            self.assertEqual(import_asset.retry_count, 1)
            self.assertEqual(
                import_asset.failure_reason, TaskStatusModel.FailureReason.RETRIES
            )

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_retry_cant_reset(self):
        """An asset with no ``failed`` timestamp set here is not retried."""
        import_asset = self.import_asset
        # Deliberately leave import_asset.failed untouched
        import_asset.completed = None
        import_asset.failure_reason = TaskStatusModel.FailureReason.IMAGE
        import_asset.status = "Test failed status"
        import_asset.retry_count = 0
        import_asset.failure_history = []
        import_asset.save()

        with mock.patch(
            "importer.models.tasks.assets.download_asset_task"
        ) as task_mock:
            response = import_asset.retry_if_possible()

            self.assertFalse(response)
            self.assertFalse(task_mock.apply_async.called)
            self.assertNotEqual(import_asset.status, "Test failed status")
            self.assertEqual(len(import_asset.failure_history), 0)
            self.assertEqual(import_asset.failed, None)
            self.assertEqual(import_asset.retry_count, 0)
            self.assertEqual(
                import_asset.failure_reason, TaskStatusModel.FailureReason.IMAGE
            )

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_retry_invalid_failure_reason(self):
        """A failure with an empty reason is left untouched and not retried."""
        import_asset = self.import_asset
        import_asset.failed = timezone.now()
        import_asset.completed = None
        import_asset.failure_reason = ""
        import_asset.status = "Test failed status"
        import_asset.retry_count = 0
        import_asset.failure_history = []
        import_asset.save()

        with mock.patch(
            "importer.models.tasks.assets.download_asset_task"
        ) as task_mock:
            response = import_asset.retry_if_possible()

            self.assertFalse(response)
            self.assertFalse(task_mock.apply_async.called)
            self.assertEqual(import_asset.status, "Test failed status")
            self.assertEqual(len(import_asset.failure_history), 0)
            self.assertNotEqual(import_asset.failed, None)
            self.assertEqual(import_asset.retry_count, 0)
            self.assertEqual(import_asset.failure_reason, "")

    @override_settings(
        STORAGES={
            "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
            "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        },
        AWS_STORAGE_BUCKET_NAME="test-bucket",
    )
    def test_download_asset_manual_retry_success(self):
        """Re-running the task on a failed asset clears its failure state."""
        # This mimics an admin manually retrying the task (such as through
        # an admin action), rather than the automatic retry system.
        # We want to be sure the failure information is correctly reset.
        import_asset = self.import_asset
        import_asset.failed = timezone.now()
        import_asset.completed = None
        import_asset.failure_reason = ""
        import_asset.status = "Test failed status"
        import_asset.retry_count = 0
        import_asset.failure_history = []
        import_asset.save()

        with mock.patch(
            "importer.models.tasks.assets.download_and_store_asset_image"
        ) as download_mock:
            download_mock.return_value = "image.jpg"

            tasks.assets.download_asset_task.delay(import_asset.pk)
            import_asset.refresh_from_db()
            self.assertTrue(download_mock.called)
            self.assertEqual(import_asset.status, "Completed")
            self.assertEqual(len(import_asset.failure_history), 0)
            self.assertEqual(import_asset.failed, None)
            self.assertEqual(import_asset.retry_count, 0)
            self.assertEqual(import_asset.failure_reason, "")

    @mock.patch("importer.tasks.assets.download_and_store_asset_image")
    @mock.patch("importer.tasks.assets.logger.info")
    def test_download_url_from_asset(self, mock_logger, mock_download):
        """A download job fetches the asset's download_url and stores the result."""
        self.asset.download_url = "https://example.com/image.png"
        self.asset.save()
        self.job.refresh_from_db()

        mock_download.return_value = "stored_image.png"

        tasks.assets.download_asset(self.task_mock, self.job)

        mock_download.assert_called_once_with(self.asset.download_url, mock.ANY)
        self.asset.refresh_from_db()
        self.assertEqual(self.asset.storage_image, "stored_image.png")
        mock_logger.assert_any_call(
            "Download and storage of asset image %s complete. Setting storage_image "
            "on asset %s (%s)",
            "stored_image.png",
            self.asset,
            self.asset.id,
        )

    @mock.patch("importer.tasks.assets.download_and_store_asset_image")
    @mock.patch("importer.tasks.assets.logger.info")
    def test_valid_file_extension(self, mock_logger, mock_download):
        """The target filename uses the ``png`` extension of the download URL."""
        self.asset.download_url = "https://example.com/image.png"
        self.asset.save()
        self.job.refresh_from_db()

        mock_download.return_value = "stored_image.png"
        tasks.assets.download_asset(self.task_mock, self.job)

        asset_image_filename = self.asset.get_asset_image_filename("png")
        mock_download.assert_called_once_with(
            self.asset.download_url, asset_image_filename
        )

        self.asset.refresh_from_db()
        self.assertEqual(self.asset.storage_image, "stored_image.png")
        mock_logger.assert_any_call(
            "Download and storage of asset image %s complete. Setting storage_image "
            "on asset %s (%s)",
            "stored_image.png",
            self.asset,
            self.asset.id,
        )


class BatchVerifyAssetImagesTaskCallbackTests(TestCase):
    """
    Tests for batch_verify_asset_images_task_callback.

    Each test checks which failures flag is passed along when the callback
    queues batch_verify_asset_images_task again.
    """

    def setUp(self):
        self.concurrency = 5
        self.batch_id = uuid.uuid4()

    def _run_callback(self, results, failures_detected):
        # Call the callback under test with this test case's batch settings
        tasks.images.batch_verify_asset_images_task_callback(
            results, self.batch_id, self.concurrency, failures_detected
        )

    @mock.patch("importer.tasks.images.batch_verify_asset_images_task.delay")
    def test_no_failures_detected_no_failures_in_results(self, mock_task):
        self._run_callback([True, True, True], False)
        mock_task.assert_called_once_with(self.batch_id, self.concurrency, False)

    @mock.patch("importer.tasks.images.batch_verify_asset_images_task.delay")
    def test_no_failures_detected_some_failures_in_results(self, mock_task):
        expected_log = (
            "INFO:importer.tasks.images:At least one verification "
            f"failure detected for batch {self.batch_id}"
        )
        with self.assertLogs("importer.tasks", level="INFO") as captured:
            self._run_callback([True, False, True], False)
        self.assertIn(expected_log, captured.output)
        # A failure in the results flips the flag for the next run
        mock_task.assert_called_once_with(self.batch_id, self.concurrency, True)

    @mock.patch("importer.tasks.images.batch_verify_asset_images_task.delay")
    def test_failures_already_detected(self, mock_task):
        self._run_callback([True, False, True], True)
        mock_task.assert_called_once_with(self.batch_id, self.concurrency, True)


class BatchVerifyAssetImagesTaskTests(TestCase):
    """
    Tests for batch_verify_asset_images_task, both when VerifyAssetImageJobs
    remain for the batch and when none are left.
    """

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.concurrency = 2
        first_asset = create_asset()
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")
        self.job1, self.job2 = (
            create_verify_asset_image_job(batch=self.batch_id, asset=asset)
            for asset in (first_asset, second_asset)
        )

    def _run_task(self, failures_detected):
        # Call the task under test with this test case's batch settings
        tasks.images.batch_verify_asset_images_task(
            self.batch_id, self.concurrency, failures_detected
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.batch_download_asset_images_task")
    def test_no_jobs_remaining_with_failures(self, mock_batch_download, mock_logger):
        VerifyAssetImageJob.objects.all().delete()
        self._run_task(True)
        expected_message = (
            "Failures in VerifyAssetImageJobs in batch %s detected, so starting "
            "DownloadAssetImageJob batch"
        )
        mock_logger.assert_any_call(expected_message, self.batch_id)
        mock_batch_download.assert_called_once_with(self.batch_id, self.concurrency)

    @mock.patch("importer.tasks.images.logger.info")
    def test_no_jobs_remaining_no_failures(self, mock_logger):
        VerifyAssetImageJob.objects.all().delete()
        self._run_task(False)
        mock_logger.assert_any_call(
            "No failures in VerifyAssetImageJob batch %s. Ending task.", self.batch_id
        )

    @mock.patch("importer.tasks.images.chord")
    @mock.patch("importer.tasks.images.verify_asset_image_task.s")
    def test_jobs_remaining(self, mock_task_s, mock_chord):
        self._run_task(False)
        # One task signature is expected per job created in setUp
        self.assertEqual(mock_task_s.call_count, 2)
        mock_chord.assert_called()


class VerifyAssetImageTaskTests(TestCase):
    """
    Tests for verify_asset_image_task: missing asset or job, success and
    failure results, job creation, and propagation of HTTP errors.
    """

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()

    def _create_job(self):
        # Verification job for this test case's asset and batch
        return create_verify_asset_image_job(asset=self.asset, batch=self.batch_id)

    @mock.patch("importer.tasks.images.logger.exception")
    def test_asset_not_found(self, mock_logger):
        missing_pk = 999
        with self.assertRaises(Asset.DoesNotExist):
            tasks.images.verify_asset_image_task(missing_pk)
        mock_logger.assert_called()

    @mock.patch("importer.tasks.images.logger.exception")
    def test_verify_job_not_found(self, mock_logger):
        # No job exists for this asset and batch, and create_job is disabled
        with self.assertRaises(VerifyAssetImageJob.DoesNotExist):
            tasks.images.verify_asset_image_task(
                self.asset.pk, self.batch_id, create_job=False
            )
        mock_logger.assert_called()

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_verify_asset_image_task_success(self, mock_verify):
        mock_verify.return_value = True
        job = self._create_job()

        outcome = tasks.images.verify_asset_image_task(self.asset.pk, self.batch_id)

        self.assertTrue(outcome)
        job.refresh_from_db()
        self.assertEqual(job.status, "Storage image verified")

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_verify_asset_image_task_failure(self, mock_verify):
        mock_verify.return_value = False
        job = self._create_job()

        outcome = tasks.images.verify_asset_image_task(self.asset.pk, self.batch_id)

        self.assertFalse(outcome)
        job.refresh_from_db()
        self.assertNotEqual(job.status, "Storage image verified")

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_create_verify_asset_image_job(self, mock_verify):
        mock_verify.return_value = True

        outcome = tasks.images.verify_asset_image_task(
            self.asset.pk, self.batch_id, create_job=True
        )

        self.assertTrue(outcome)
        matching_jobs = VerifyAssetImageJob.objects.filter(
            asset=self.asset, batch=self.batch_id
        )
        self.assertTrue(matching_jobs.exists())

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_http_error_retries(self, mock_verify):
        self._create_job()
        mock_verify.side_effect = requests.exceptions.HTTPError("HTTP Error Occurred")
        with self.assertRaises(requests.exceptions.HTTPError):
            tasks.images.verify_asset_image_task(self.asset.pk, self.batch_id)


class CreateDownloadAssetImageJobTests(TestCase):
    """Tests for tasks.images.create_download_asset_image_job."""

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()

    def _jobs_for_asset(self, **extra_filters):
        # DownloadAssetImageJobs for this test case's asset, optionally narrowed
        return DownloadAssetImageJob.objects.filter(asset=self.asset, **extra_filters)

    def test_create_new_job(self):
        tasks.images.create_download_asset_image_job(self.asset, self.batch_id)
        self.assertTrue(self._jobs_for_asset(batch=self.batch_id).exists())

    def test_existing_uncompleted_job_not_duplicated(self):
        # A job already exists for this asset and batch before the call
        create_download_asset_image_job(asset=self.asset, batch=self.batch_id)
        tasks.images.create_download_asset_image_job(self.asset, self.batch_id)
        self.assertEqual(self._jobs_for_asset(batch=self.batch_id).count(), 1)

    def test_create_new_job_if_previous_failed(self):
        previous_job = create_download_asset_image_job(
            asset=self.asset, batch=self.batch_id
        )
        previous_job.failed = timezone.now()
        previous_job.save()

        # The second job is requested under a different batch
        other_batch = uuid.uuid4()
        tasks.images.create_download_asset_image_job(self.asset, other_batch)

        self.assertEqual(self._jobs_for_asset().count(), 2)


class VerifyAssetImageTests(TestCase):
    """
    Tests for verify_asset_image covering an empty storage_image value, a
    file missing from storage, images that fail to open or verify, and a
    successful verification.
    """

    def setUp(self):
        self.asset = create_asset()
        self.job = create_verify_asset_image_job(asset=self.asset)
        self.mock_task = mock.MagicMock()
        self.mock_task.request.id = uuid.uuid4()

    def _verify(self):
        # Run the function under test against this test case's job
        return tasks.images.verify_asset_image(self.mock_task, self.job)

    def _corrupt_image_message(self):
        # Log message expected when opening or verifying the image raises
        # UnidentifiedImageError("Invalid image format")
        return (
            f"Storage image for {self.asset} ({self.asset.id}), "
            f"{self.asset.storage_image.name}, is corrupt. The exception "
            "raised was Type: UnidentifiedImageError, Message: Invalid image format"
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    def test_no_storage_image(self, mock_create_job, mock_logger):
        # An empty storage_image is an invalid value, so it is written with
        # update() to bypass validation; the task still has to cope with it
        Asset.objects.filter(id=self.asset.id).update(storage_image="")
        # Reload the job from the database to drop its cached asset
        self.job.refresh_from_db()

        verified = self._verify()

        self.assertFalse(verified)
        mock_create_job.assert_called_once_with(self.asset, self.job.batch)
        mock_logger.assert_any_call(
            f"No storage image set on {self.asset} ({self.asset.id})"
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=False)
    def test_storage_image_missing(self, mock_exists, mock_create_job, mock_logger):
        verified = self._verify()

        self.assertFalse(verified)
        mock_create_job.assert_called_once_with(self.asset, self.job.batch)
        mock_logger.assert_any_call(
            f"Storage image for {self.asset} ({self.asset.id}) missing from storage"
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=True)
    @mock.patch("importer.tasks.images.ASSET_STORAGE.open")
    @mock.patch(
        "importer.tasks.images.Image.open",
        side_effect=UnidentifiedImageError("Invalid image format"),
    )
    def test_storage_image_invalid(
        self, mock_image_open, mock_open, mock_exists, mock_create_job, mock_logger
    ):
        # Image.open itself raises here
        verified = self._verify()

        self.assertFalse(verified)
        mock_create_job.assert_called_once_with(self.asset, self.job.batch)
        mock_logger.assert_any_call(self._corrupt_image_message())

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=True)
    @mock.patch("importer.tasks.images.ASSET_STORAGE.open")
    @mock.patch("importer.tasks.images.Image.open")
    def test_storage_image_verify_fail(
        self, mock_image_open, mock_open, mock_exists, mock_create_job, mock_logger
    ):
        # Image.open succeeds, but verify() on the opened image raises
        corrupt_image = mock.MagicMock()
        corrupt_image.verify.side_effect = UnidentifiedImageError(
            "Invalid image format"
        )
        mock_image_open.return_value.__enter__.return_value = corrupt_image

        verified = self._verify()

        self.assertFalse(verified)
        mock_create_job.assert_called_once_with(self.asset, self.job.batch)
        mock_logger.assert_any_call(self._corrupt_image_message())

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=True)
    @mock.patch("importer.tasks.images.ASSET_STORAGE.open")
    @mock.patch("importer.tasks.images.Image.open")
    def test_storage_image_verification_success(
        self, mock_image_open, mock_open, mock_exists, mock_logger
    ):
        valid_image = mock.MagicMock()
        valid_image.verify.return_value = None
        mock_image_open.return_value.__enter__.return_value = valid_image

        verified = self._verify()

        self.assertTrue(verified)
        mock_logger.assert_any_call(
            "Storage image for %s (%s), %s, verified successfully",
            self.asset,
            self.asset.id,
            self.asset.storage_image.name,
        )


class BatchDownloadAssetImagesTaskCallbackTests(TestCase):
    """
    Tests for batch_download_asset_images_task_callback, which is expected to
    queue the next batch_download_asset_images_task run whatever the results.
    """

    def setUp(self):
        self.concurrency = 5
        self.batch_id = uuid.uuid4()

    def _assert_next_batch_queued(self, results, mock_task):
        # Run the callback with the given results and check that the next
        # batch task was queued exactly once with the same batch settings
        tasks.images.batch_download_asset_images_task_callback(
            results, self.batch_id, self.concurrency
        )
        mock_task.assert_called_once_with(self.batch_id, self.concurrency)

    @mock.patch("importer.tasks.images.batch_download_asset_images_task.delay")
    def test_callback_triggers_next_batch(self, mock_task):
        self._assert_next_batch_queued([True, False, True], mock_task)

    @mock.patch("importer.tasks.images.batch_download_asset_images_task.delay")
    def test_callback_with_no_results(self, mock_task):
        self._assert_next_batch_queued([], mock_task)

    @mock.patch("importer.tasks.images.batch_download_asset_images_task.delay")
    def test_callback_with_all_successful_results(self, mock_task):
        self._assert_next_batch_queued([True, True, True], mock_task)


class BatchDownloadAssetImagesTaskTests(TestCase):
    """
    Tests for batch_download_asset_images_task, both when
    DownloadAssetImageJobs remain for the batch and when none are left.
    """

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.concurrency = 3
        first_asset = create_asset()
        sibling_assets = [
            create_asset(item=first_asset.item, slug=slug)
            for slug in ("test-asset-2", "test-asset-3")
        ]
        self.job1, self.job2, self.job3 = (
            create_download_asset_image_job(batch=self.batch_id, asset=asset)
            for asset in (first_asset, *sibling_assets)
        )

    def _run_task(self):
        # Call the task under test with this test case's batch settings
        tasks.images.batch_download_asset_images_task(self.batch_id, self.concurrency)

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.chord")
    @mock.patch("importer.tasks.images.download_asset_image_task.s")
    def test_jobs_remaining(self, mock_task_s, mock_chord, mock_logger):
        self._run_task()
        # One task signature is expected per job created in setUp
        self.assertEqual(mock_task_s.call_count, 3)
        mock_chord.assert_called()
        mock_logger.assert_any_call(
            "Processing next %s DownloadAssetImageJobs for batch %s",
            self.concurrency,
            self.batch_id,
        )

    @mock.patch("importer.tasks.images.logger.info")
    def test_no_jobs_remaining(self, mock_logger):
        DownloadAssetImageJob.objects.all().delete()
        self._run_task()
        mock_logger.assert_any_call(
            "No DownloadAssetImageJobs found for batch %s", self.batch_id
        )


class DownloadAssetImageTaskTests(TestCase):
    """
    Tests for download_asset_image_task: missing asset or job, a successful
    download, job creation, and propagation of HTTP errors.
    """

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()

    @mock.patch("importer.tasks.images.logger.exception")
    def test_asset_not_found(self, mock_logger):
        missing_pk = 999
        with self.assertRaises(Asset.DoesNotExist):
            tasks.images.download_asset_image_task(missing_pk)
        mock_logger.assert_called()

    @mock.patch("importer.tasks.images.logger.exception")
    def test_download_job_not_found(self, mock_logger):
        # No job exists for this asset and batch, and create_job is disabled
        with self.assertRaises(DownloadAssetImageJob.DoesNotExist):
            tasks.images.download_asset_image_task(
                self.asset.pk, self.batch_id, create_job=False
            )
        mock_logger.assert_called()

    @mock.patch("importer.tasks.images.download_asset")
    def test_download_asset_image_task_success(self, mock_download):
        mock_download.return_value = "Download successful"
        create_download_asset_image_job(asset=self.asset, batch=self.batch_id)

        outcome = tasks.images.download_asset_image_task(self.asset.pk, self.batch_id)

        self.assertEqual(outcome, "Download successful")

    @mock.patch("importer.tasks.images.download_asset")
    def test_create_download_asset_image_job(self, mock_download):
        mock_download.return_value = "Download successful"

        outcome = tasks.images.download_asset_image_task(
            self.asset.pk, self.batch_id, create_job=True
        )

        self.assertEqual(outcome, "Download successful")
        matching_jobs = DownloadAssetImageJob.objects.filter(
            asset=self.asset, batch=self.batch_id
        )
        self.assertTrue(matching_jobs.exists())

    @mock.patch("importer.tasks.images.download_asset")
    def test_http_error_retries(self, mock_download):
        mock_download.side_effect = requests.exceptions.HTTPError("HTTP Error Occurred")
        with self.assertRaises(requests.exceptions.HTTPError):
            tasks.images.download_asset_image_task(
                self.asset.pk, self.batch_id, create_job=True
            )


================================================
FILE: importer/tests/test_tasks_collections.py
================================================
import sys
from unittest import mock

import requests
from django.core.cache.backends.base import BaseCache
from django.test import TestCase, override_settings

from concordia.tests.utils import CreateTestUsers
from importer import tasks
from importer.tasks.collections import (
    import_collection_task,
    normalize_collection_url,
)
from importer.tests.utils import create_import_job


class MockResponse:
    """
    Minimal stand-in for an HTTP response whose JSON body holds a single
    search result with a configurable original_format.
    """

    def __init__(self, original_format="item"):
        self.original_format = original_format

    def json(self):
        # Note that original_format is wrapped in a set, not a list
        single_result = {
            "id": 1,
            "image_url": "https://www.loc.gov/resource/mss85943.000212/",
            "original_format": {self.original_format},
            "url": "https://www.loc.gov/item/{}/".format("mss859430021"),
        }
        return {"results": [single_result], "pagination": {}}


class MockCache(BaseCache):
    """
    Cache backend for tests whose get() always reports a hit by returning a
    fresh MockResponse.
    """

    def __init__(self, host, *args, **kwargs):
        # host and any extra positional arguments are accepted but ignored;
        # the base class is initialized with an empty params dict
        super().__init__({}, **kwargs)

    def get(self, key, default=None, version=None):
        # Every lookup is a hit, regardless of key, default or version
        return MockResponse()


# Ensure the dotted path used in override_settings still resolves after the
# tests were split into separate modules. The original tests referenced
# "importer.tests.test_tasks.MockCache", so register this module under that
# name so the cache backend can be imported from it. setdefault leaves any
# module already registered under that name untouched.
sys.modules.setdefault("importer.tests.test_tasks", sys.modules[__name__])


class GetCollectionItemsTests(TestCase):
    """
    Tests for get_collection_items, covering cache misses and hits, results
    with an ignored format, and missing or malformed results.
    """

    @mock.patch.object(requests.Session, "get")
    @override_settings(
        CACHES={
            "default": {
                "BACKEND": "django.core.cache.backends.dummy.DummyCache",
            }
        }
    )
    def test_cache_miss(self, mock_get):
        # With the dummy cache nothing is ever cached, so the (mocked)
        # HTTP request supplies the response
        mock_get.return_value = MockResponse()
        mock_get.return_value.url = "https://www.loc.gov/collections/example/"
        items = tasks.collections.get_collection_items(
            "https://www.loc.gov/collections/example/"
        )
        self.assertEqual(len(items), 1)

    @override_settings(
        CACHES={
            "default": {
                "BACKEND": "importer.tests.test_tasks.MockCache",
            }
        }
    )
    def test_cache_hit(self):
        # MockCache.get always returns a MockResponse, so no request is mocked
        items = tasks.collections.get_collection_items(
            "https://www.loc.gov/collections/example/"
        )
        self.assertEqual(len(items), 1)

    @mock.patch.object(requests.Session, "get")
    @override_settings(
        CACHES={
            "default": {
                "BACKEND": "django.core.cache.backends.dummy.DummyCache",
            }
        }
    )
    def test_ignored_format(self, mock_get):
        mock_get.return_value = MockResponse(original_format="collection")
        mock_get.return_value.url = "https://www.loc.gov/collections/example/"
        with self.assertLogs("importer.tasks", level="INFO") as log:
            items = tasks.collections.get_collection_items(
                "https://www.loc.gov/collections/example/"
            )

            self.assertEqual(
                log.output[0],
                "INFO:importer.tasks.items:"
                "Skipping result 1 because it contains an "
                "unsupported format: {'collection'}",
            )
        self.assertEqual(len(items), 0)

    def test_multiple_items(self):
        with (
            mock.patch("importer.tasks.collections.cache") as cache_mock,
            mock.patch(
                "importer.tasks.collections.requests_retry_session"
            ) as requests_mock,
            mock.patch(
                "importer.tasks.collections.get_item_info_from_result"
            ) as result_mock,
        ):
            cache_mock.get.return_value = None
            requests_mock.return_value.get.return_value.json.return_value = {
                "results": [1, 2, 3]
            }
            # Each time this mock is called, the next value in the list
            # is returned
            result_mock.side_effect = [4, 5, None]

            items = tasks.collections.get_collection_items("http://example.com")

            # The None returned for the third result is left out of the items
            self.assertEqual(items, [4, 5])
            self.assertEqual(result_mock.call_count, 3)

    def test_no_results(self):
        with (
            mock.patch("importer.tasks.collections.cache") as cache_mock,
            mock.patch(
                "importer.tasks.collections.requests_retry_session"
            ) as requests_mock,
            self.assertLogs("importer.tasks", level="ERROR") as log,
        ):
            cache_mock.get.return_value = None
            requests_mock.return_value.get.return_value.json.return_value = {}
            items = tasks.collections.get_collection_items("http://example.com")
            self.assertEqual(items, [])
            self.assertEqual(
                log.output,
                [
                    "ERROR:importer.tasks.collections:"
                    'Expected URL http://example.com to include "results"'
                ],
            )

    def test_get_info_exception(self):
        with (
            mock.patch("importer.tasks.collections.cache") as cache_mock,
            mock.patch(
                "importer.tasks.collections.requests_retry_session"
            ) as requests_mock,
            # Patch the name where get_collection_items looks it up (the
            # collections module, as in test_multiple_items); patching it in
            # importer.tasks.items would leave the real function in use
            mock.patch(
                "importer.tasks.collections.get_item_info_from_result"
            ) as result_mock,
            self.assertLogs("importer.tasks", level="WARNING") as log,
        ):
            cache_mock.get.return_value = None
            requests_mock.return_value.get.return_value.json.return_value = {
                "results": [1]
            }
            result_mock.side_effect = AttributeError

            items = tasks.collections.get_collection_items("http://example.com")

            self.assertEqual(items, [])
            # Confirm the mocked function (and so the AttributeError) was
            # actually what the code under test ran into
            self.assertEqual(result_mock.call_count, 1)
            # The first log entry contains a stack trace, so we use assertIn
            # rather than assertEqual here
            self.assertIn(
                "WARNING:importer.tasks.collections:"
                "Skipping result from http://example.com which did not match "
                "expected format:",
                log.output[0],
            )
            self.assertEqual(
                log.output[1],
                "WARNING:importer.tasks.collections:"
                "No valid items found for collection url: http://example.com",
            )


class ImportCollectionTests(CreateTestUsers, TestCase):
    """
    Tests for import_collection_task, which normalizes the import job's URL,
    fetches the collection's items and enqueues an item import task for each.
    """

    def setUp(self):
        self.login_user()

    # Stacked patch decorators inject their mocks bottom-up, so the parameter
    # order is normalize_collection_url, get_collection_items, then delay.
    @mock.patch("importer.tasks.collections.create_item_import_task.delay")
    @mock.patch("importer.tasks.collections.get_collection_items")
    @mock.patch("importer.tasks.collections.normalize_collection_url")
    def test_import_collection(self, mock_normalize, mock_get, mock_delay):
        import_job = create_import_job(created_by=self.user)
        # A single (id, url) pair; delay is patched so nothing is enqueued
        mock_get.return_value = ((None, None),)

        import_collection_task(import_job.pk)

        self.assertTrue(mock_normalize.called)
        self.assertTrue(mock_get.called)
        self.assertEqual(mock_delay.call_count, 1)

    @mock.patch("importer.tasks.collections.create_item_import_task.delay")
    @mock.patch("importer.tasks.collections.get_collection_items")
    @mock.patch("importer.tasks.collections.normalize_collection_url")
    def test_import_collection_enqueues_item_tasks(
        self, mock_normalize, mock_get, mock_delay
    ):
        import_job = create_import_job(created_by=self.user)
        mock_normalize.return_value = "https://www.loc.gov/collections/example/?fo=json"
        mock_get.return_value = [
            ("mss1", "https://www.loc.gov/item/mss1/"),
            ("mss2", "https://www.loc.gov/item/mss2/"),
        ]

        # redownload=True so we can assert the third arg is propagated
        import_collection_task(import_job.pk, redownload=True)

        self.assertEqual(mock_delay.call_count, 2)
        self.assertEqual(
            mock_delay.call_args_list,
            [
                mock.call(import_job.pk, "https://www.loc.gov/item/mss1/", True),
                mock.call(import_job.pk, "https://www.loc.gov/item/mss2/", True),
            ],
        )


class CollectionURLNormalizationTests(TestCase):
    """Tests for normalize_collection_url."""

    def _assert_normalizes_to(self, raw_url, expected_url):
        # Normalize raw_url and compare the outcome with expected_url
        self.assertEqual(normalize_collection_url(raw_url), expected_url)

    def test_basic_normalization(self):
        self._assert_normalizes_to(
            "https://www.loc.gov/collections/branch-rickey-papers/",
            "https://www.loc.gov/collections/branch-rickey-papers/?fo=json",
        )

    def test_extra_querystring_parameters(self):
        self._assert_normalizes_to(
            "https://www.loc.gov/collections/branch-rickey-papers/?foo=bar",
            "https://www.loc.gov/collections/branch-rickey-papers/?fo=json&foo=bar",
        )

    def test_conflicting_querystring_parameters(self):
        # fo is forced to json; sp and at are expected to be dropped
        self._assert_normalizes_to(
            "https://www.loc.gov/collections/branch-rickey-papers/?foo=bar&fo=xml&sp=99&at=item",  # NOQA
            "https://www.loc.gov/collections/branch-rickey-papers/?fo=json&foo=bar",
        )


================================================
FILE: importer/tests/test_tasks_core.py
================================================
import concurrent.futures
from unittest import mock

from django.test import TestCase

from importer.tasks import fetch_all_urls


class FetchAllUrlsTests(TestCase):
    """Tests for fetch_all_urls."""

    def test_fetch_all_urls(self):
        item_url = "https://www.loc.gov/item/mss859430021/"
        output = "https://www.loc.gov/item/mss859430021/ - Asset Count: 0"
        # ThreadPoolExecutor.map is replaced so it yields one (output, count)
        # pair without running any work
        with mock.patch.object(
            concurrent.futures.ThreadPoolExecutor, "map"
        ) as mock_map:
            mock_map.return_value = ((output, 0),)
            finals, totals = fetch_all_urls([item_url])
        self.assertEqual(finals, [output])
        self.assertEqual(totals, 0)


================================================
FILE: importer/tests/test_tasks_decorators.py
================================================
from unittest import mock

from django.test import TestCase
from django.utils import timezone

from importer.exceptions import ImageImportFailure
from importer.models import ImportJob, TaskStatusModel
from importer.tasks.decorators import update_task_status
from importer.tests.utils import create_import_job


class TaskDecoratorTests(TestCase):
    """
    Tests for the update_task_status decorator, using ImportJob instances
    whose save (and, in some tests, retry_if_possible) methods are mocked.
    """

    def test_update_task_status(self):
        # Function to be wrapped; it marks the job so the test can tell how
        # far execution got
        def test_function(self, task_status_object, raise_exception=False):
            task_status_object.test_function_ran = True
            if raise_exception:
                raise Exception("Test Exception")
            task_status_object.test_function_finished = True

        wrapped_test_function = update_task_status(test_function)

        # We create this non-mocked completed job here to use in a later test
        # because we can't easily do this once we mock ImportJob.save
        test_job = create_import_job(completed=timezone.now())

        # We can't just mock the entire model here or easily use a custom
        # class because update_task_status depends on Django model internals,
        # particularly __class__._default_manager. __class__ cannot be
        # overridden (it points to MagicMock), Model._default_manager cannot
        # be set directly and mocking Model.objects does not cause calls on
        # Model._default_manager to properly use the mock--it continues to
        # use the actual Model.objects
        with mock.patch.multiple(
            ImportJob,
            save=mock.MagicMock(),
            __str__=mock.MagicMock(return_value="Mock Job"),
        ):
            # Scenario 1: the wrapped function runs to completion
            job = ImportJob()
            wrapped_test_function(mock.MagicMock(), job)
            self.assertTrue(hasattr(job, "test_function_ran"))
            self.assertTrue(job.test_function_ran)
            self.assertTrue(hasattr(job, "test_function_finished"))
            self.assertTrue(job.test_function_finished)
            self.assertNotEqual(job.last_started, None)
            self.assertNotEqual(job.task_id, None)
            self.assertTrue(job.completed)
            self.assertTrue(job.save.called)

            # Scenario 2: the wrapped function raises; the exception
            # propagates and is appended to the job's existing status
            ImportJob.save.reset_mock()
            job2 = ImportJob()
            job2.status = "Original Status"
            with self.assertRaisesRegex(Exception, "Test Exception"):
                wrapped_test_function(mock.MagicMock(), job2, True)
            self.assertTrue(hasattr(job2, "test_function_ran"))
            self.assertTrue(job2.test_function_ran)
            self.assertFalse(hasattr(job2, "test_function_finished"))
            self.assertNotEqual(job2.last_started, None)
            self.assertNotEqual(job2.task_id, None)
            self.assertFalse(job2.completed)
            self.assertTrue(job2.save.called)
            self.assertEqual(
                job2.status, "Original Status\n\nUnhandled exception: Test Exception"
            )

            # Scenario 3: the job shares its id with the already-completed
            # test_job, so the wrapped function must not run at all
            ImportJob.save.reset_mock()
            job3 = ImportJob()
            job3.id = test_job.id
            with self.assertLogs("importer.tasks", level="WARNING") as log:
                wrapped_test_function(mock.MagicMock(), job3)
                self.assertEqual(
                    log.output,
                    [
                        "WARNING:importer.tasks.decorators:Task Mock Job was "
                        "already completed and will not be repeated"
                    ],
                )
            self.assertFalse(hasattr(job3, "test_function_ran"))
            self.assertFalse(hasattr(job3, "test_function_finished"))
            self.assertEqual(job3.last_started, None)
            self.assertEqual(job3.task_id, None)
            self.assertFalse(job3.completed)
            self.assertFalse(job3.save.called)

    @mock.patch.multiple(
        ImportJob,
        save=mock.MagicMock(),
        __str__=mock.MagicMock(return_value="Mock Job"),
        retry_if_possible=mock.MagicMock(),
    )
    def test_update_task_status_retry_path_sets_last_started_and_task_id(self):
        # Wrapped function that always fails, to drive the retry path
        def test_function(self, task_status_object):
            raise Exception("boom")

        wrapped = update_task_status(test_function)

        job = ImportJob()
        # Simulate Celery task self with a request.id
        task_self = mock.MagicMock()
        task_self.request.id = "orig-task-id"

        # Make retry_if_possible return an object with an id, like an AsyncResult
        retry_result = mock.MagicMock()
        retry_result.id = "retry-123"
        ImportJob.retry_if_possible.return_value = retry_result

        with self.assertRaisesRegex(Exception, "boom"):
            wrapped(task_self, job)

        # After a retriable exception, the decorator should set these from retry_result
        self.assertEqual(job.task_id, "retry-123")
        self.assertIsNotNone(job.last_started)

        # Saves: one before calling f(), one after exception handling, one after retry
        self.assertGreaterEqual(ImportJob.save.call_count, 3)
        ImportJob.retry_if_possible.assert_called_once_with()

    @mock.patch.multiple(
        ImportJob,
        save=mock.MagicMock(),
        __str__=mock.MagicMock(return_value="Mock Job"),
        retry_if_possible=mock.MagicMock(return_value=False),
    )
    def test_update_task_status_sets_image_failure_reason(self):
        # retry_if_possible is mocked to return False for this test
        def test_function(self, task_status_object):
            # Raising ImageImportFailure should set failure_reason to IMAGE.
            raise ImageImportFailure("bad image")

        wrapped = update_task_status(test_function)

        job = ImportJob()
        task_self = mock.MagicMock()
        task_self.request.id = "task-123"

        with self.assertRaises(ImageImportFailure):
            wrapped(task_self, job)

        self.assertEqual(job.failure_reason, TaskStatusModel.FailureReason.IMAGE)
        self.assertIsNotNone(job.failed)
        # save() should have been called at least twice (pre & post exception path)
        self.assertGreaterEqual(ImportJob.save.call_count, 2)


================================================
FILE: importer/tests/test_tasks_images.py
================================================
import uuid
from unittest import mock

import requests
from django.test import TestCase
from django.utils import timezone
from PIL import Image

from concordia.models import Asset
from concordia.tests.utils import (
    create_asset,
)
from importer import tasks
from importer.models import (
    DownloadAssetImageJob,
    VerifyAssetImageJob,
)
from importer.tasks.images import redownload_image_task

from .utils import (
    create_download_asset_image_job,
    create_verify_asset_image_job,
)


class RedownloadImageTaskTests(TestCase):
    """Tests for ``redownload_image_task``."""

    def test_redownload_image_task(self):
        """Running the task for an existing asset calls ``download_asset``."""
        with mock.patch("importer.tasks.images.download_asset") as download_mock:
            asset_pk = create_asset().pk
            redownload_image_task(asset_pk)
            self.assertTrue(download_mock.called)


class BatchVerifyAssetImagesTaskCallbackTests(TestCase):
    """Tests for ``batch_verify_asset_images_task_callback``."""

    def setUp(self):
        self.concurrency = 5
        self.batch_id = uuid.uuid4()

    def _invoke_callback(self, results, failures_detected):
        """Run the callback for this test's batch with the given results."""
        tasks.images.batch_verify_asset_images_task_callback(
            results, self.batch_id, self.concurrency, failures_detected
        )

    @mock.patch("importer.tasks.images.batch_verify_asset_images_task.delay")
    def test_no_failures_detected_no_failures_in_results(self, delay_mock):
        """All-success results keep the failure flag False for the next batch."""
        self._invoke_callback([True, True, True], False)
        delay_mock.assert_called_once_with(self.batch_id, self.concurrency, False)

    @mock.patch("importer.tasks.images.batch_verify_asset_images_task.delay")
    def test_no_failures_detected_some_failures_in_results(self, delay_mock):
        """A first failure is logged and flips the failure flag to True."""
        expected_line = (
            "INFO:importer.tasks.images:At least one verification "
            f"failure detected for batch {self.batch_id}"
        )
        with self.assertLogs("importer.tasks", level="INFO") as captured:
            self._invoke_callback([True, False, True], False)
            self.assertIn(expected_line, captured.output)
        delay_mock.assert_called_once_with(self.batch_id, self.concurrency, True)

    @mock.patch("importer.tasks.images.batch_verify_asset_images_task.delay")
    def test_failures_already_detected(self, delay_mock):
        """An already-set failure flag is passed through as True."""
        self._invoke_callback([True, False, True], True)
        delay_mock.assert_called_once_with(self.batch_id, self.concurrency, True)


class BatchVerifyAssetImagesTaskTests(TestCase):
    """Tests for ``batch_verify_asset_images_task``."""

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.concurrency = 2
        # Two assets under the same item, each with a verify job in the batch.
        first_asset = create_asset()
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")
        self.job1 = create_verify_asset_image_job(
            asset=first_asset, batch=self.batch_id
        )
        self.job2 = create_verify_asset_image_job(
            asset=second_asset, batch=self.batch_id
        )

    def _run_batch(self, failures_detected):
        """Run the batch task for this test's batch and concurrency."""
        tasks.images.batch_verify_asset_images_task(
            self.batch_id, self.concurrency, failures_detected
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.batch_download_asset_images_task")
    def test_no_jobs_remaining_with_failures(self, download_batch_mock, info_mock):
        """With no jobs left and failures seen, the download batch is started."""
        VerifyAssetImageJob.objects.all().delete()
        self._run_batch(True)
        info_mock.assert_any_call(
            "Failures in VerifyAssetImageJobs in batch %s detected, so starting "
            "DownloadAssetImageJob batch",
            self.batch_id,
        )
        download_batch_mock.assert_called_once_with(self.batch_id, self.concurrency)

    def test_no_jobs_remaining_no_failures(self):
        """With no jobs left and no failures, the task logs that it is ending."""
        with mock.patch("importer.tasks.images.logger.info") as info_mock:
            VerifyAssetImageJob.objects.all().delete()
            self._run_batch(False)
            info_mock.assert_any_call(
                "No failures in VerifyAssetImageJob batch %s. Ending task.",
                self.batch_id,
            )

    @mock.patch("importer.tasks.images.chord")
    @mock.patch("importer.tasks.images.verify_asset_image_task.s")
    def test_jobs_remaining(self, signature_mock, chord_mock):
        """Each pending job gets a task signature and a chord is built."""
        self._run_batch(False)
        self.assertEqual(signature_mock.call_count, 2)
        chord_mock.assert_called()


class VerifyAssetImageTaskTests(TestCase):
    """Tests for ``verify_asset_image_task``."""

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()

    def test_asset_not_found(self):
        """An unknown asset pk raises ``Asset.DoesNotExist`` and logs it."""
        with mock.patch("importer.tasks.images.logger.exception") as log_mock:
            with self.assertRaises(Asset.DoesNotExist):
                tasks.images.verify_asset_image_task(999)
            log_mock.assert_called()

    def test_verify_job_not_found(self):
        """Without an existing job and ``create_job=False`` the lookup fails."""
        with mock.patch("importer.tasks.images.logger.exception") as log_mock:
            with self.assertRaises(VerifyAssetImageJob.DoesNotExist):
                tasks.images.verify_asset_image_task(
                    self.asset.pk, self.batch_id, create_job=False
                )
            log_mock.assert_called()

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_verify_asset_image_task_success(self, verify_mock):
        """A successful verification returns True and updates the job status."""
        stored_job = create_verify_asset_image_job(
            asset=self.asset, batch=self.batch_id
        )
        verify_mock.return_value = True

        outcome = tasks.images.verify_asset_image_task(self.asset.pk, self.batch_id)

        self.assertTrue(outcome)
        stored_job.refresh_from_db()
        self.assertEqual(stored_job.status, "Storage image verified")

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_verify_asset_image_task_failure(self, verify_mock):
        """A failed verification returns False and leaves the status unverified."""
        stored_job = create_verify_asset_image_job(
            asset=self.asset, batch=self.batch_id
        )
        verify_mock.return_value = False

        outcome = tasks.images.verify_asset_image_task(self.asset.pk, self.batch_id)

        self.assertFalse(outcome)
        stored_job.refresh_from_db()
        self.assertNotEqual(stored_job.status, "Storage image verified")

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_create_verify_asset_image_job(self, verify_mock):
        """``create_job=True`` creates the job for the asset and batch."""
        verify_mock.return_value = True

        outcome = tasks.images.verify_asset_image_task(
            self.asset.pk, self.batch_id, create_job=True
        )

        self.assertTrue(outcome)
        matching_jobs = VerifyAssetImageJob.objects.filter(
            asset=self.asset, batch=self.batch_id
        )
        self.assertTrue(matching_jobs.exists())

    @mock.patch("importer.tasks.images.verify_asset_image")
    def test_http_error_retries(self, verify_mock):
        """An HTTPError from the verification propagates out of the task."""
        create_verify_asset_image_job(asset=self.asset, batch=self.batch_id)
        verify_mock.side_effect = requests.exceptions.HTTPError("HTTP Error Occurred")

        with self.assertRaises(requests.exceptions.HTTPError):
            tasks.images.verify_asset_image_task(self.asset.pk, self.batch_id)


class CreateDownloadAssetImageJobTests(TestCase):
    """Tests for ``tasks.images.create_download_asset_image_job``."""

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()

    def test_create_new_job(self):
        """A job is created for the asset and batch when none exists."""
        tasks.images.create_download_asset_image_job(self.asset, self.batch_id)

        matching_jobs = DownloadAssetImageJob.objects.filter(
            asset=self.asset, batch=self.batch_id
        )
        self.assertTrue(matching_jobs.exists())

    def test_existing_uncompleted_job_not_duplicated(self):
        """An existing unfinished job for the same batch is not duplicated."""
        # The bare name is the test utility; the ``tasks.images`` attribute is
        # the function under test.
        create_download_asset_image_job(asset=self.asset, batch=self.batch_id)
        tasks.images.create_download_asset_image_job(self.asset, self.batch_id)

        matching_jobs = DownloadAssetImageJob.objects.filter(
            asset=self.asset, batch=self.batch_id
        )
        self.assertEqual(matching_jobs.count(), 1)

    def test_create_new_job_if_previous_failed(self):
        """A failed job does not block creating a job in a new batch."""
        earlier_job = create_download_asset_image_job(
            asset=self.asset, batch=self.batch_id
        )
        earlier_job.failed = timezone.now()
        earlier_job.save()

        tasks.images.create_download_asset_image_job(self.asset, uuid.uuid4())

        jobs_for_asset = DownloadAssetImageJob.objects.filter(asset=self.asset)
        self.assertEqual(jobs_for_asset.count(), 2)


class VerifyAssetImageTests(TestCase):
    """Tests for ``verify_asset_image`` called directly with a mock task."""

    def setUp(self):
        self.asset = create_asset()
        self.job = create_verify_asset_image_job(asset=self.asset)
        # Stand-in for the bound Celery task; only ``request.id`` is configured.
        self.mock_task = mock.MagicMock()
        self.mock_task.request.id = uuid.uuid4()

    def _verify(self):
        """Run the function under test against this test's job."""
        return tasks.images.verify_asset_image(self.mock_task, self.job)

    def _corrupt_image_message(self):
        """Build the log message expected when the stored image is corrupt."""
        return (
            f"Storage image for {self.asset} ({self.asset.id}), "
            f"{self.asset.storage_image.name}, is corrupt. The exception "
            "raised was Type: UnidentifiedImageError, Message: Invalid image format"
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    def test_no_storage_image(self, create_job_mock, info_mock):
        """An asset with no storage image fails and queues a download job."""
        # A queryset update bypasses validation of the empty storage_image.
        Asset.objects.filter(id=self.asset.id).update(storage_image="")
        self.job.refresh_from_db()

        outcome = self._verify()

        self.assertFalse(outcome)
        create_job_mock.assert_called_once_with(self.asset, self.job.batch)
        info_mock.assert_any_call(
            f"No storage image set on {self.asset} ({self.asset.id})"
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=False)
    def test_storage_image_missing(self, exists_mock, create_job_mock, info_mock):
        """An image absent from storage fails and queues a download job."""
        outcome = self._verify()

        self.assertFalse(outcome)
        create_job_mock.assert_called_once_with(self.asset, self.job.batch)
        info_mock.assert_any_call(
            f"Storage image for {self.asset} ({self.asset.id}) missing from storage"
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=True)
    @mock.patch("importer.tasks.images.ASSET_STORAGE.open")
    @mock.patch(
        "importer.tasks.images.Image.open",
        side_effect=Image.UnidentifiedImageError("Invalid image format"),
    )
    def test_storage_image_invalid(
        self, image_open_mock, storage_open_mock, exists_mock, create_job_mock, info_mock
    ):
        """An image that cannot be opened is reported corrupt and re-queued."""
        outcome = self._verify()

        self.assertFalse(outcome)
        create_job_mock.assert_called_once_with(self.asset, self.job.batch)
        info_mock.assert_any_call(self._corrupt_image_message())

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.create_download_asset_image_job")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=True)
    @mock.patch("importer.tasks.images.ASSET_STORAGE.open")
    @mock.patch("importer.tasks.images.Image.open")
    def test_storage_image_verify_fail(
        self, image_open_mock, storage_open_mock, exists_mock, create_job_mock, info_mock
    ):
        """An image whose ``verify()`` raises is reported corrupt and re-queued."""
        opened_image = mock.MagicMock()
        opened_image.verify.side_effect = Image.UnidentifiedImageError(
            "Invalid image format"
        )
        image_open_mock.return_value.__enter__.return_value = opened_image

        outcome = self._verify()

        self.assertFalse(outcome)
        create_job_mock.assert_called_once_with(self.asset, self.job.batch)
        info_mock.assert_any_call(self._corrupt_image_message())

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.ASSET_STORAGE.exists", return_value=True)
    @mock.patch("importer.tasks.images.ASSET_STORAGE.open")
    @mock.patch("importer.tasks.images.Image.open")
    def test_storage_image_verification_success(
        self, image_open_mock, storage_open_mock, exists_mock, info_mock
    ):
        """An image that opens and verifies cleanly returns True and is logged."""
        opened_image = mock.MagicMock()
        opened_image.verify.return_value = None
        image_open_mock.return_value.__enter__.return_value = opened_image

        outcome = self._verify()

        self.assertTrue(outcome)
        info_mock.assert_any_call(
            "Storage image for %s (%s), %s, verified successfully",
            self.asset,
            self.asset.id,
            self.asset.storage_image.name,
        )


class BatchDownloadAssetImagesTaskCallbackTests(TestCase):
    """Tests for ``batch_download_asset_images_task_callback``."""

    def setUp(self):
        self.concurrency = 5
        self.batch_id = uuid.uuid4()

    def _assert_next_batch_scheduled(self, results):
        """Run the callback with ``results`` and check the next batch is queued."""
        delay_target = "importer.tasks.images.batch_download_asset_images_task.delay"
        with mock.patch(delay_target) as delay_mock:
            tasks.images.batch_download_asset_images_task_callback(
                results, self.batch_id, self.concurrency
            )
            delay_mock.assert_called_once_with(self.batch_id, self.concurrency)

    def test_callback_triggers_next_batch(self):
        """Mixed results still schedule the next batch."""
        self._assert_next_batch_scheduled([True, False, True])

    def test_callback_with_no_results(self):
        """An empty result list still schedules the next batch."""
        self._assert_next_batch_scheduled([])

    def test_callback_with_all_successful_results(self):
        """All-success results schedule the next batch."""
        self._assert_next_batch_scheduled([True, True, True])


class BatchDownloadAssetImagesTaskTests(TestCase):
    """Tests for ``batch_download_asset_images_task``."""

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.concurrency = 3
        # Three assets under one item, each with a download job in the batch.
        first_asset = create_asset()
        second_asset = create_asset(item=first_asset.item, slug="test-asset-2")
        third_asset = create_asset(item=first_asset.item, slug="test-asset-3")
        self.job1 = create_download_asset_image_job(
            asset=first_asset, batch=self.batch_id
        )
        self.job2 = create_download_asset_image_job(
            asset=second_asset, batch=self.batch_id
        )
        self.job3 = create_download_asset_image_job(
            asset=third_asset, batch=self.batch_id
        )

    @mock.patch("importer.tasks.images.logger.info")
    @mock.patch("importer.tasks.images.chord")
    @mock.patch("importer.tasks.images.download_asset_image_task.s")
    def test_jobs_remaining(self, signature_mock, chord_mock, info_mock):
        """Each pending job gets a task signature, a chord is built, and it logs."""
        tasks.images.batch_download_asset_images_task(self.batch_id, self.concurrency)

        self.assertEqual(signature_mock.call_count, 3)
        chord_mock.assert_called()
        info_mock.assert_any_call(
            "Processing next %s DownloadAssetImageJobs for batch %s",
            self.concurrency,
            self.batch_id,
        )

    def test_no_jobs_remaining(self):
        """With no jobs in the batch the task logs that none were found."""
        with mock.patch("importer.tasks.images.logger.info") as info_mock:
            DownloadAssetImageJob.objects.all().delete()
            tasks.images.batch_download_asset_images_task(
                self.batch_id, self.concurrency
            )
            info_mock.assert_any_call(
                "No DownloadAssetImageJobs found for batch %s", self.batch_id
            )


class DownloadAssetImageTaskTests(TestCase):
    """Tests for ``download_asset_image_task``."""

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()

    def test_asset_not_found(self):
        """An unknown asset pk raises ``Asset.DoesNotExist`` and logs it."""
        with mock.patch("importer.tasks.images.logger.exception") as log_mock:
            with self.assertRaises(Asset.DoesNotExist):
                tasks.images.download_asset_image_task(999)
            log_mock.assert_called()

    def test_download_job_not_found(self):
        """Without an existing job and ``create_job=False`` the lookup fails."""
        with mock.patch("importer.tasks.images.logger.exception") as log_mock:
            with self.assertRaises(DownloadAssetImageJob.DoesNotExist):
                tasks.images.download_asset_image_task(
                    self.asset.pk, self.batch_id, create_job=False
                )
            log_mock.assert_called()

    @mock.patch("importer.tasks.images.download_asset")
    def test_download_asset_image_task_success(self, download_mock):
        """The task returns whatever ``download_asset`` returns."""
        create_download_asset_image_job(asset=self.asset, batch=self.batch_id)
        download_mock.return_value = "Download successful"

        outcome = tasks.images.download_asset_image_task(
            self.asset.pk, self.batch_id
        )

        self.assertEqual(outcome, "Download successful")

    @mock.patch("importer.tasks.images.download_asset")
    def test_create_download_asset_image_job(self, download_mock):
        """``create_job=True`` creates the job for the asset and batch."""
        download_mock.return_value = "Download successful"

        outcome = tasks.images.download_asset_image_task(
            self.asset.pk, self.batch_id, create_job=True
        )

        self.assertEqual(outcome, "Download successful")
        matching_jobs = DownloadAssetImageJob.objects.filter(
            asset=self.asset, batch=self.batch_id
        )
        self.assertTrue(matching_jobs.exists())

    @mock.patch("importer.tasks.images.download_asset")
    def test_http_error_retries(self, download_mock):
        """An HTTPError from the download propagates out of the task."""
        download_mock.side_effect = requests.exceptions.HTTPError(
            "HTTP Error Occurred"
        )

        with self.assertRaises(requests.exceptions.HTTPError):
            tasks.images.download_asset_image_task(
                self.asset.pk, self.batch_id, create_job=True
            )


================================================
FILE: importer/tests/test_tasks_items.py
================================================
import io
import shutil
import tempfile
from unittest import mock

import requests
from django.core.exceptions import ValidationError
from django.core.files.base import ContentFile
from django.core.files.storage import default_storage
from django.test import TestCase, override_settings
from PIL import Image

from concordia.models import Item
from concordia.tests.utils import (
    CreateTestUsers,
    create_asset,
    create_item,
    create_project,
)
from importer import tasks
from importer.models import ImportItem
from importer.tasks.items import (
    _guess_extension,
    download_and_set_item_thumbnail,
    get_item_id_from_item_url,
    get_item_info_from_result,
    import_items_into_project_from_url,
)
from importer.tests.utils import (
    create_import_item,
    create_import_job,
)


class ImportItemCountFromUrlTests(TestCase):
    """Tests for ``import_item_count_from_url``."""

    def mocked_requests_get(*args, **kwargs):
        # Referenced as a ``side_effect`` while the class body is evaluated, so
        # it is used as a plain function and takes no ``self``.
        class MockResponse:
            """Response stand-in whose JSON has one resource with no files."""

            def raise_for_status(self):
                pass

            def json(self):
                return {"resources": [{"files": []}]}

        return MockResponse()

    @mock.patch("requests.get", side_effect=mocked_requests_get)
    @override_settings(
        CACHES={
            "default": {
                "BACKEND": "django.core.cache.backends.dummy.DummyCache",
            }
        }
    )
    def test_import_item_count_from_url(self, get_mock):
        """An item with no files reports an asset count of zero."""
        outcome = tasks.items.import_item_count_from_url(None)
        self.assertEqual(outcome, ("None - Asset Count: 0", 0))

    def test_unhandled_exception_importing(self):
        """An unexpected error is reported in the message with a zero count."""
        with mock.patch("importer.tasks.items.requests.get") as get_mock:
            get_mock.side_effect = AttributeError("Error message")
            outcome = tasks.items.import_item_count_from_url("http://example.com")
            expected = (
                "Unhandled exception importing http://example.com Error message",
                0,
            )
            self.assertEqual(outcome, expected)


@override_settings(
    STORAGES={
        "default": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
        "assets": {"BACKEND": "django.core.files.storage.InMemoryStorage"},
    },
    AWS_STORAGE_BUCKET_NAME="test-bucket",
)
class ImportItemsIntoProjectFromUrlTests(CreateTestUsers, TestCase):
    """Tests for ``import_items_into_project_from_url`` URL dispatching."""

    def setUp(self):
        self.login_user()
        self.project = create_project()

    def test_no_match(self):
        """A URL that is not a supported type raises and queues nothing."""
        unsupported_url = "https://www.loc.gov/resource/mss859430021/"
        with mock.patch(
            "importer.tasks.items.create_item_import_task.delay"
        ) as delay_mock:
            with self.assertRaises(ValueError):
                import_items_into_project_from_url(None, None, unsupported_url)
            self.assertFalse(delay_mock.called)

    def test_item(self):
        """An item URL creates a job for the project and queues the item task."""
        item_url = "https://www.loc.gov/item/mss859430021/"
        with mock.patch(
            "importer.tasks.items.create_item_import_task.delay"
        ) as delay_mock:
            created_job = import_items_into_project_from_url(
                self.user, self.project, item_url
            )
            self.assertEqual(created_job.project, self.project)
            self.assertTrue(delay_mock.called)

    def test_other_url_type(self):
        """A collection URL queues the collection task with the job pk."""
        collection_url = "https://www.loc.gov/collections/branch-rickey-papers/"
        with mock.patch(
            "importer.tasks.collections.import_collection_task.delay"
        ) as delay_mock:
            created_job = import_items_into_project_from_url(
                self.user, self.project, collection_url
            )
            self.assertEqual(created_job.project, self.project)
            self.assertTrue(delay_mock.called)
            delay_mock.assert_called_with(created_job.pk, False)


class GetItemIdFromItemURLTests(TestCase):
    """Tests for ``get_item_id_from_item_url``."""

    def test_get_item_id_from_item_url_with_slash(self):
        """
        The item id is extracted when the URL ends with a trailing slash
        """
        item_id = get_item_id_from_item_url("https://www.loc.gov/item/mss859430021/")
        self.assertEqual(item_id, "mss859430021")

    def test_get_item_id_from_item_url_without_slash(self):
        """
        The item id is extracted when the URL has no trailing slash
        """
        item_id = get_item_id_from_item_url("https://www.loc.gov/item/mss859430021")
        self.assertEqual(item_id, "mss859430021")


class GetItemInfoFromResultTests(TestCase):
    """Tests for ``get_item_info_from_result``."""

    def test_no_image_url(self):
        """A result with a falsy ``image_url`` yields None."""
        search_result = {
            "id": 1,
            "image_url": False,
            "original_format": {"item"},
        }
        self.assertEqual(get_item_info_from_result(search_result), None)

    def test_no_match(self):
        """A result whose ``url`` is on a non-loc.gov host yields None."""
        search_result = {
            "id": 1,
            "image_url": "https://www.loc.gov/resource/mss85943.000212/",
            "original_format": {"item"},
            "url": "https://www.loc.com/item/mss859430021/",
        }
        self.assertEqual(get_item_info_from_result(search_result), None)

    def test_match(self):
        """A matching item URL yields the item id followed by the URL."""
        item_url = "https://www.loc.gov/item/mss859430021/"
        search_result = {
            "id": 1,
            "image_url": "https://www.loc.gov/resource/mss85943.000212/",
            "original_format": {"item"},
            "url": item_url,
        }
        info = get_item_info_from_result(search_result)
        self.assertEqual(info[0], "mss859430021")
        self.assertEqual(info[1], item_url)

    def test_ignored_format(self):
        """A result in an unsupported format is skipped and the skip is logged."""
        search_result = {
            "id": 42,
            "image_url": "https://www.loc.gov/resource/foo/",
            "original_format": {"collection"},
            "url": "https://www.loc.gov/item/abc123/",
        }
        with self.assertLogs("importer.tasks", level="INFO") as captured:
            info = get_item_info_from_result(search_result)
        self.assertIsNone(info)
        expected_line = (
            "INFO:importer.tasks.items:Skipping result 42 because it contains an "
            "unsupported format: {'collection'}"
        )
        self.assertEqual(captured.output[0], expected_line)


@mock.patch("importer.tasks.items.requests.get")
class CreateItemImportTaskTests(TestCase):
    """Tests for ``create_item_import_task``.

    The class-level patch replaces ``requests.get`` in ``importer.tasks.items``
    for every test method and passes the mock in as ``get_mock``.
    """

    def setUp(self):
        """Create an import job, a mock response and a minimal item payload."""
        self.job = create_import_job()
        self.item_url = "http://example.com"
        self.response_mock = mock.MagicMock()
        self.item_id = "testid1"
        self.item_title = "Test Title"
        self.image_url = []
        # JSON body the mocked response returns in most tests.
        self.item_data = {
            "item": {
                "id": self.item_id,
                "title": self.item_title,
                "image_url": self.image_url,
            }
        }

    def test_create_item_import_task_http_error(self, get_mock):
        """An HTTPError from ``raise_for_status`` propagates out of the task."""
        get_mock.return_value = self.response_mock
        self.response_mock.raise_for_status.side_effect = requests.exceptions.HTTPError

        with self.assertRaises(requests.exceptions.HTTPError):
            tasks.items.create_item_import_task(self.job.pk, self.item_url)

    def test_create_item_import_task_new_item(self, get_mock):
        """A new item is created and its import task is queued."""
        get_mock.return_value = self.response_mock
        self.response_mock.json.return_value = self.item_data

        with (
            mock.patch("importer.tasks.items.import_item_task.delay") as task_mock,
            mock.patch("importer.tasks.items.download_and_set_item_thumbnail"),
        ):
            tasks.items.create_item_import_task(self.job.pk, self.item_url)
            self.assertTrue(task_mock.called)
            self.assertEqual(Item.objects.count(), 1)
            self.assertTrue(Item.objects.filter(item_id=self.item_id).exists())

    def test_create_item_import_task_existing_item_missing_assets(self, get_mock):
        """An existing item with missing assets is reprocessed with a warning."""
        # No asset is created for this item here, while the mocked asset URL
        # list below reports one asset URL.
        item = create_item(item_id="testid1", project=self.job.project)
        get_mock.return_value = self.response_mock
        self.response_mock.json.return_value = self.item_data

        with (
            self.assertLogs("importer.tasks", level="WARNING") as log,
            mock.patch(
                "importer.tasks.items.get_asset_urls_from_item_resources"
            ) as asset_url_mock,
            mock.patch("importer.tasks.items.import_item_task.delay") as task_mock,
            mock.patch("importer.tasks.items.download_and_set_item_thumbnail"),
        ):
            asset_url_mock.return_value = [
                ["http://example.com/test.jpg"],
                self.item_url,
            ]
            tasks.items.create_item_import_task(self.job.pk, self.item_url)
            self.assertEqual(
                log.output,
                [
                    f"WARNING:importer.tasks.items:"
                    f"Reprocessing existing item {item} that is missing assets"
                ],
            )
            self.assertEqual(Item.objects.count(), 1)
            self.assertTrue(task_mock.called)

    def test_create_item_import_task_existing_item_no_missing_assets(self, get_mock):
        """An existing item with all its assets is not reprocessed."""
        item = create_item(item_id="testid1", project=self.job.project)
        # Ensure at least one asset exists for the item
        create_asset(item=item)
        get_mock.return_value = self.response_mock
        self.response_mock.json.return_value = self.item_data

        with (
            self.assertLogs("importer.tasks", level="WARNING") as log,
            mock.patch(
                "importer.tasks.items.get_asset_urls_from_item_resources"
            ) as asset_url_mock,
            mock.patch("importer.tasks.items.import_item_task.delay") as task_mock,
            mock.patch("importer.tasks.items.download_and_set_item_thumbnail"),
        ):
            asset_url_mock.return_value = [
                ["http://example.com/test.jpg"],
                self.item_url,
            ]
            tasks.items.create_item_import_task(self.job.pk, self.item_url)

            self.assertEqual(
                log.output,
                [
                    f"WARNING:importer.tasks.items:"
                    f"Not reprocessing existing item with all assets: {item}"
                ],
            )
            # The same message is expected on the ImportItem's status.
            self.assertEqual(
                ImportItem.objects.get(item=item).status,
                f"Not reprocessing existing item with all assets: {item}",
            )
            self.assertFalse(task_mock.called)

    def test_create_item_import_task_existing_item_redownload(self, get_mock):
        """``redownload=True`` queues the import even when all assets exist."""
        item = create_item(item_id="testid1", project=self.job.project)
        create_asset(item=item)
        get_mock.return_value = self.response_mock
        self.response_mock.json.return_value = {
            "item": {"id": "testid1", "title": "Test Title", "image_url": []}
        }

        with (
            mock.patch(
                "importer.tasks.items.get_asset_urls_from_item_resources"
            ) as asset_url_mock,
            mock.patch("importer.tasks.items.import_item_task.delay") as task_mock,
            mock.patch("importer.tasks.items.download_and_set_item_thumbnail"),
        ):
            asset_url_mock.return_value = [
                ["http://example.com/test.jpg"],
                self.item_url,
            ]
            tasks.items.create_item_import_task(
                self.job.pk, self.item_url, redownload=True
            )
            self.assertTrue(task_mock.called)

    def test_create_item_import_task_full_clean_exception_updates_status_and_reraises(
        self, get_mock
    ):
        """A ``full_clean`` failure is logged, recorded on the ImportItem, re-raised.

        Neither the thumbnail download nor the import task may run afterwards.
        """
        get_mock.return_value = self.response_mock
        self.response_mock.json.return_value = self.item_data

        with (
            self.assertLogs("importer.tasks", level="ERROR") as log,
            mock.patch("importer.tasks.items.Item.full_clean") as full_clean_mock,
            mock.patch("importer.tasks.items.import_item_task.delay") as task_mock,
            mock.patch(
                "importer.tasks.items.download_and_set_item_thumbnail"
            ) as thumb_mock,
        ):
            full_clean_mock.side_effect = RuntimeError("boom")
            with self.assertRaises(RuntimeError):
                tasks.items.create_item_import_task(self.job.pk, self.item_url)

            self.assertTrue(
                any("Unhandled exception when importing item" in m for m in log.output)
            )
            thumb_mock.assert_not_called()
            task_mock.assert_not_called()

        # The item and its ImportItem must exist, with the failure recorded.
        item = Item.objects.get(item_id=self.item_id)
        import_item = ImportItem.objects.get(item=item)
        self.assertIsNotNone(import_item.failed)
        self.assertIn("Unhandled exception: boom", import_item.status)

    def test_create_item_import_task_save_exception_updates_status_and_reraises(
        self, get_mock
    ):
        """A failure in the item's second ``save()`` is logged, recorded, re-raised.

        Neither the thumbnail download nor the import task may run afterwards.
        """
        get_mock.return_value = self.response_mock
        self.response_mock.json.return_value = self.item_data

        # Grab the real save before patching so we can wrap it.
        from importer.tasks.items import Item as _Item

        real_save = _Item.save
        # Mutable counter so the nested side effect can track how many times
        # save() has been invoked.
        call_count = {"n": 0}

        def save_side_effect(self, *args, **kwargs):
            # With autospec=True the patched save receives the instance as the
            # first argument, so it can be forwarded to the real save.
            call_count["n"] += 1
            # First call is from Item.objects.get_or_create(...) -> allow it to
            # persist.
            if call_count["n"] == 1:
                return real_save(self, *args, **kwargs)
            # Second call is the one under test -> raise.
            raise RuntimeError("save failed")

        with (
            self.assertLogs("importer.tasks", level="ERROR") as log,
            mock.patch("importer.tasks.items.Item.full_clean") as full_clean_mock,
            mock.patch(
                "importer.tasks.items.Item.save",
                side_effect=save_side_effect,
                autospec=True,
            ),
            mock.patch("importer.tasks.items.import_item_task.delay") as task_mock,
            mock.patch(
                "importer.tasks.items.download_and_set_item_thumbnail"
            ) as thumb_mock,
        ):
            # Ensure full_clean does not fail so we reach save().
            full_clean_mock.return_value = None

            with self.assertRaises(RuntimeError):
                tasks.items.create_item_import_task(self.job.pk, self.item_url)

            self.assertTrue(
                any("Unhandled exception when importing item" in m for m in log.output)
            )
            thumb_mock.assert_not_called()
            task_mock.assert_not_called()

        # The first save persisted the item, so it and its ImportItem can be
        # loaded to check the recorded failure.
        item = Item.objects.get(item_id=self.item_id)
        import_item = ImportItem.objects.get(item=item)
        self.assertIsNotNone(import_item.failed)
        self.assertIn("Unhandled exception: save failed", import_item.status)


class ItemImportTests(TestCase):
    """Tests for the item-level import helpers in ``importer.tasks.items``."""

    def setUp(self):
        self.item_url = "http://example.com"
        self.job = create_import_job()
        self.import_item = create_import_item(import_job=self.job, url=self.item_url)

    def test_import_item_task(self):
        """``import_item_task`` hands the matching ImportItem to ``import_item``."""
        with mock.patch("importer.tasks.items.import_item") as task_mock:
            tasks.items.import_item_task(self.import_item.pk)
            self.assertTrue(task_mock.called)
            # Two positional arguments are passed; only the second (the
            # ImportItem) is checked here.
            _task, called_import_item = task_mock.call_args.args
            # assertEqual rather than assertTrue: assertTrue(x, y) treats y as
            # the failure message and passes for any truthy x, so it never
            # actually compared the two objects.
            self.assertEqual(called_import_item, self.import_item)

    def test_import_item(self):
        """``import_item`` schedules a group and rejects a repeated import."""
        with (
            mock.patch(
                "importer.tasks.items.get_asset_urls_from_item_resources"
            ) as asset_url_mock,
            mock.patch("importer.tasks.assets.download_asset_task.s") as download_mock,
            mock.patch("importer.tasks.items.group") as group_mock,
        ):
            # It's difficult/impossible to cleanly mock a decorator due to the way
            # they're applied when the decorated object/function is evaluated on
            # import, so we unfortunately have to handle the update_task_status
            # decorator, so we need a mock object that can pass for a Celery task
            # object so update_task_status doesn't error during the test
            task_mock = mock.MagicMock()
            task_mock.request.id = "f81d4fae-7dec-11d0-a765-00a0c91e6bf6"

            asset_url_mock.return_value = [
                ["http://example.com/test.jpg"],
                self.item_url,
            ]

            tasks.items.import_item(task_mock, self.import_item)
            self.assertFalse(download_mock.called)
            self.assertTrue(group_mock.called)

            # Test that it properly errors if we try to import the same item again
            self.import_item.completed = None
            self.import_item.save()
            with self.assertRaises(ValidationError):
                tasks.items.import_item(task_mock, self.import_item)

            # With no asset URLs at all the import must still go through.
            asset_url_mock.return_value = [
                [],
                "",
            ]

            self.import_item.completed = None
            self.import_item.save()
            tasks.items.import_item(task_mock, self.import_item)
            self.assertFalse(download_mock.called)
            self.assertTrue(group_mock.called)

    def test_populate_item_from_data(self):
        """Title, description and thumbnail URL are copied onto the item."""
        item = Item(item_url="http://example.com")
        item_info = {
            "title": "Test Title",
            "description": "Test description",
            "image_url": ["image.gif", "image.jpg", "image2.jpg"],
        }

        tasks.items.populate_item_from_data(item, item_info)

        self.assertEqual(item.item_url, "http://example.com")
        self.assertEqual(item.title, "Test Title")
        self.assertEqual(item.description, "Test description")
        self.assertEqual(item.thumbnail_url, "http://example.com/image.jpg")

    def test_populate_item_from_data_handles_exception_and_returns_none(self):
        # Proxy dict that explodes only when .get("image_url") is called,
        # but still works with indexing for the earlier code path.
        class ExplodingImageInfo(dict):
            def get(self, key, default=None):
                if key == "image_url":
                    raise RuntimeError("error")
                return super().get(key, default)

        item = Item(item_url="http://example.com")
        info = ExplodingImageInfo(
            {
                "title": "T",
                "description": "D",
                "image_url": ["image.jpg"],  # used by the earlier indexing path
            }
        )

        result = tasks.items.populate_item_from_data(item, info)
        # Early indexing still sets thumbnail_url, but the try/except branch
        # should swallow the error and return None.
        self.assertIsNone(result)
        self.assertEqual(item.thumbnail_url, "http://example.com/image.jpg")


@override_settings(DEFAULT_FILE_STORAGE="django.core.files.storage.FileSystemStorage")
class DownloadItemThumbnailTests(TestCase):
    """Tests for ``download_and_set_item_thumbnail`` and ``_guess_extension``."""

    # Dotted path of the HTTP call that every download test replaces.
    REQUESTS_GET = "importer.tasks.items.requests.get"

    class FakeResponse:
        """Minimal streamable response for mocking requests.get(...)."""

        def __init__(self, content, content_type="image/png", on_iter=None):
            # A falsy content type means no Content-Type header is sent at all.
            if content_type:
                self.headers = {"Content-Type": content_type}
            else:
                self.headers = {}
            self._content = content
            self._on_iter = on_iter
            self._iter_called = False

        def __enter__(self):
            return self

        def __exit__(self, exc_type, exc, tb):
            # Never suppress exceptions raised inside the ``with`` body.
            return False

        def raise_for_status(self):
            return None

        def iter_content(self, chunk_size=64 * 1024):
            # Fire the optional hook once, just before the first chunk is
            # produced.
            hook_pending = self._on_iter and not self._iter_called
            if hook_pending:
                self._on_iter()
                self._iter_called = True
            yield self._content

    def setUp(self):
        # Each test writes into its own throw-away MEDIA_ROOT.
        self.temp_media = tempfile.mkdtemp(prefix="test-media-")
        self._override = override_settings(MEDIA_ROOT=self.temp_media)
        self._override.enable()

    def tearDown(self):
        self._override.disable()
        shutil.rmtree(self.temp_media, ignore_errors=True)

    def make_image_bytes(self, fmt="PNG", size=(2, 2), color=(1, 2, 3)):
        """Return the encoded bytes of a tiny solid-colour RGB image."""
        buffer = io.BytesIO()
        Image.new("RGB", size, color).save(buffer, format=fmt)
        return buffer.getvalue()

    def _item_with_existing_thumbnail(self):
        """Create an item that already has ``existing.jpg`` stored."""
        item = create_item()
        item.thumbnail_image.save("existing.jpg", ContentFile(b"old"), save=True)
        return item

    def _download(self, item, url, response, **options):
        """Run the download with ``requests.get`` patched to return ``response``."""
        with mock.patch(self.REQUESTS_GET, return_value=response):
            return download_and_set_item_thumbnail(item, url, **options)

    def _assert_stored_bytes(self, name, expected):
        """Assert that the stored file ``name`` holds exactly ``expected``."""
        with default_storage.open(name, "rb") as stored:
            self.assertEqual(stored.read(), expected)

    def test_skip_when_already_present_and_not_force(self):
        item = self._item_with_existing_thumbnail()
        with mock.patch(self.REQUESTS_GET) as get_mock:
            outcome = download_and_set_item_thumbnail(
                item, "https://example.com/test.jpg"
            )
        self.assertIn("skipping", outcome.lower())
        self.assertFalse(get_mock.called)
        item.refresh_from_db()
        stored_name = item.thumbnail_image.name
        self.assertTrue(stored_name.endswith("existing.jpg"))
        self.assertTrue(default_storage.exists(stored_name))

    def test_success_with_content_type_extension(self):
        item = create_item()
        png_bytes = self.make_image_bytes(fmt="PNG")
        response = self.FakeResponse(png_bytes, "image/png")
        saved = self._download(item, "https://example.com/path/name.png", response)
        item.refresh_from_db()
        self.assertEqual(saved, item.thumbnail_image.name)
        self.assertTrue(saved.endswith(".png"))
        self.assertTrue(default_storage.exists(saved))
        self._assert_stored_bytes(saved, png_bytes)

    def test_fallback_extension_via_pillow_sniff_when_guess_is_bin(self):
        item = create_item()
        png_bytes = self.make_image_bytes(fmt="PNG")
        # No extension in the URL, to force the sniff path.
        extensionless_url = "https://example.com/noext"
        with mock.patch("importer.tasks.items._guess_extension", return_value=".bin"):
            saved = self._download(
                item,
                extensionless_url,
                self.FakeResponse(png_bytes, content_type=""),
            )
        item.refresh_from_db()
        self.assertEqual(saved, item.thumbnail_image.name)
        # Pillow sniff sees PNG, so .png via the mapping in the function
        self.assertTrue(saved.endswith(".png"))
        self.assertTrue(default_storage.exists(saved))

    def test_invalid_image_raises_value_error(self):
        item = create_item()
        response = self.FakeResponse(b"not-an-image", "application/octet-stream")
        with self.assertRaises(ValueError):
            self._download(item, "https://example.com/notimg", response)
        item.refresh_from_db()
        self.assertFalse(bool(item.thumbnail_image))

    def test_requests_exception_propagates(self):
        item = create_item()
        failure = requests.RequestException("error")
        with mock.patch(self.REQUESTS_GET, side_effect=failure):
            with self.assertRaises(requests.RequestException):
                download_and_set_item_thumbnail(item, "https://example.com/error")

    def test_race_present_after_download_skips_final_save(self):
        """Simulate another writer saving the thumbnail mid-download."""
        item = create_item()

        def _concurrent_writer():
            # Another process writes a thumbnail before the second transaction.
            item.refresh_from_db()
            item.thumbnail_image.save("pre.jpg", ContentFile(b"pre"), save=True)

        response = self.FakeResponse(
            self.make_image_bytes(fmt="PNG"), "image/png", on_iter=_concurrent_writer
        )
        outcome = self._download(item, "https://example.com/new.png", response)
        self.assertIn("skipping save", outcome.lower())
        item.refresh_from_db()
        stored_name = item.thumbnail_image.name
        self.assertTrue(stored_name.endswith("pre.jpg"))
        self.assertTrue(default_storage.exists(stored_name))

    def test_force_overwrite_path_runs_and_sets_thumbnail(self):
        item = self._item_with_existing_thumbnail()
        response = self.FakeResponse(self.make_image_bytes(fmt="PNG"), "image/png")
        saved = self._download(
            item, "https://example.com/new.png", response, force=True
        )
        item.refresh_from_db()
        self.assertEqual(saved, item.thumbnail_image.name)
        self.assertTrue(saved.endswith(".png"))
        self.assertTrue(default_storage.exists(saved))

    def test_stream_with_empty_chunk_is_skipped(self):
        item = create_item()
        png_bytes = self.make_image_bytes(fmt="PNG")

        class TwoChunkResponse:
            """Streams an empty chunk first and the real data second."""

            def __init__(self, content, content_type="image/png"):
                self.headers = {"Content-Type": content_type}
                self._chunks = [b"", content]  # first empty, then real data

            def __enter__(self):
                return self

            def __exit__(self, exc_type, exc, tb):
                return False

            def raise_for_status(self):
                return None

            def iter_content(self, chunk_size=64 * 1024):
                yield from self._chunks

        saved = self._download(
            item,
            "https://example.com/streamed.png",
            TwoChunkResponse(png_bytes, "image/png"),
        )

        item.refresh_from_db()
        self.assertEqual(saved, item.thumbnail_image.name)
        self.assertTrue(saved.endswith(".png"))
        self._assert_stored_bytes(saved, png_bytes)

    def test_guess_extension_uses_url_path_extension_lowercases(self):
        guessed = _guess_extension("", "/path/TO/NAME.JPG")
        self.assertEqual(guessed, ".jpg")

    def test_guess_extension_returns_bin_when_no_ext_and_no_content_type(self):
        guessed = _guess_extension("", "/noext")
        self.assertEqual(guessed, ".bin")

    @mock.patch("importer.tasks.items.mimetypes.guess_extension", return_value=None)
    def test_header_guess_none_uses_url_extension(self, _guess):
        item = create_item()
        jpeg_bytes = self.make_image_bytes(fmt="JPEG")
        # Upper-case extension to assert lower-casing behavior
        saved = self._download(
            item,
            "https://example.com/path/name.JPEG",
            self.FakeResponse(jpeg_bytes, "image/unknown"),
        )
        item.refresh_from_db()
        self.assertTrue(saved.endswith(".jpeg"))


class GetAssetUrlsFromItemResourcesTests(TestCase):
    """Tests for ``tasks.items.get_asset_urls_from_item_resources``."""

    @staticmethod
    def _variant(url, height, width, mimetype):
        """Build a fully specified file-variant dict."""
        return {"url": url, "height": height, "width": width, "mimetype": mimetype}

    def _extract(self, variants, **resource_fields):
        """
        Wrap ``variants`` as the only file of a single resource and run the
        function under test. ``resource_fields`` become extra top-level keys
        of the resource (for example ``url``).
        """
        resource = {**resource_fields, "files": [variants]}
        return tasks.items.get_asset_urls_from_item_resources([resource])

    def test_empty_resources(self):
        assets, resource_url = tasks.items.get_asset_urls_from_item_resources([])
        self.assertEqual(assets, [])
        self.assertEqual(resource_url, "")

    def test_missing_item_resource_url_key(self):
        # The resource's 'url' is intentionally omitted to hit the KeyError path
        variants = [
            self._variant("http://example.com/ok.jpg", 2, 2, "image/jpeg"),
            {"url": "http://example.com/missing_dims.jpg"},  # skipped
        ]
        assets, resource_url = self._extract(variants)
        self.assertEqual(resource_url, "")
        self.assertEqual(assets, ["http://example.com/ok.jpg"])

    def test_files_key_missing(self):
        bare_resource = {"url": "http://example.com"}  # no 'files' key
        assets, resource_url = tasks.items.get_asset_urls_from_item_resources(
            [bare_resource]
        )
        self.assertEqual(assets, [])
        self.assertEqual(resource_url, "http://example.com")

    def test_picks_largest_jpeg_when_present(self):
        variants = [
            self._variant("http://example.com/small.jpg", 1, 1, "image/jpeg"),
            self._variant("http://example.com/large.jpg", 3, 3, "image/jpeg"),
        ]
        assets, resource_url = self._extract(variants, url="http://example.com")
        self.assertEqual(resource_url, "http://example.com")
        self.assertEqual(assets, ["http://example.com/large.jpg"])

    def test_falls_back_to_largest_gif_when_no_jpeg(self):
        variants = [
            self._variant("http://example.com/small.gif", 2, 2, "image/gif"),
            self._variant("http://example.com/large.gif", 5, 5, "image/gif"),
            # unacceptable types are ignored
            self._variant("http://example.com/file.tif", 100, 100, "image/tiff"),
        ]
        assets, resource_url = self._extract(variants, url="http://example.com")
        self.assertEqual(resource_url, "http://example.com")
        self.assertEqual(assets, ["http://example.com/large.gif"])

    def test_variants_missing_required_keys_are_ignored(self):
        variants = [
            {"url": "http://example.com/nw.jpg", "height": 2},  # no width
            {"height": 2, "width": 2, "mimetype": "image/jpeg"},  # no url
            self._variant("http://example.com/valid.jpg", 2, 3, "image/jpeg"),
        ]
        assets, resource_url = self._extract(variants, url="http://example.com")
        self.assertEqual(resource_url, "http://example.com")
        self.assertEqual(assets, ["http://example.com/valid.jpg"])

    def test_no_candidates_or_backups_skips_appending(self):
        variants = [
            # unsupported mimetype
            self._variant("http://example.com/file1.tif", 10, 10, "image/tiff"),
            # no mimetype -> not added to candidates/backups
            {"url": "http://example.com/file2", "height": 5, "width": 5},
        ]
        assets, resource_url = self._extract(variants, url="http://example.com")
        self.assertEqual(resource_url, "http://example.com")
        self.assertEqual(assets, [])


================================================
FILE: importer/tests/test_utils.py
================================================
import uuid
from unittest import mock

from django.test import TestCase

from concordia.tests.utils import create_asset
from importer.models import VerifyAssetImageJob
from importer.utils import create_verify_asset_image_job_batch
from importer.utils.excel import clean_cell_value, slurp_excel


class CreateVerifyAssetImageJobBatchTests(TestCase):
    """Tests for ``create_verify_asset_image_job_batch``."""

    # Dotted path of the Celery ``delay`` call that every test replaces.
    DELAY_TARGET = "importer.tasks.images.batch_verify_asset_images_task.delay"

    def setUp(self):
        self.batch_id = uuid.uuid4()
        self.asset = create_asset()
        # Five assets in total, all belonging to the same item.
        self.assets = [self.asset]
        for index in range(1, 5):
            self.assets.append(
                create_asset(item=self.asset.item, slug=f"test-asset-{index}")
            )
        self.asset_pks = [existing.pk for existing in self.assets]

    def _jobs_in_batch(self):
        """Number of VerifyAssetImageJob rows stored for this test's batch."""
        return VerifyAssetImageJob.objects.filter(batch=self.batch_id).count()

    def test_create_jobs_single_batch(self):
        with mock.patch(self.DELAY_TARGET) as mock_task:
            job_count, batch_url = create_verify_asset_image_job_batch(
                self.asset_pks, self.batch_id
            )

            self.assertEqual(job_count, 5)
            self.assertEqual(self._jobs_in_batch(), 5)
            mock_task.assert_called_once_with(batch=self.batch_id)
            self.assertEqual(
                batch_url, VerifyAssetImageJob.get_batch_admin_url(self.batch_id)
            )

    def test_create_jobs_multiple_batches(self):
        with mock.patch(self.DELAY_TARGET) as mock_task:
            # 145 more assets bring the total to 150.
            extra_assets = [
                create_asset(item=self.asset.item, slug=f"test-asset-{index}")
                for index in range(5, 150)
            ]
            asset_pks = self.asset_pks + [extra.pk for extra in extra_assets]
            job_count, _ = create_verify_asset_image_job_batch(
                asset_pks, self.batch_id
            )

            self.assertEqual(job_count, 150)
            self.assertEqual(self._jobs_in_batch(), 150)
            mock_task.assert_called_once_with(batch=self.batch_id)

    def test_no_assets_provided(self):
        with mock.patch(self.DELAY_TARGET) as mock_task:
            job_count, batch_url = create_verify_asset_image_job_batch(
                [], self.batch_id
            )

            self.assertEqual(job_count, 0)
            self.assertEqual(self._jobs_in_batch(), 0)
            # The task is enqueued even when there is nothing to verify.
            mock_task.assert_called_once_with(batch=self.batch_id)
            self.assertEqual(
                batch_url, VerifyAssetImageJob.get_batch_admin_url(self.batch_id)
            )


class ExcelUtilsTests(TestCase):
    """Tests for ``slurp_excel`` and ``clean_cell_value`` using stub objects."""

    class _Cell:
        """Stub cell exposing only ``data_type`` and ``value``."""

        def __init__(self, data_type, value):
            self.data_type = data_type
            self.value = value

    class _Worksheet:
        """Stub worksheet whose ``rows`` property yields a fresh iterator."""

        def __init__(self, rows):
            # rows is a list of tuples of _Cell
            self._rows = rows

        @property
        def rows(self):
            return iter(self._rows)

    class _Workbook:
        """Stub workbook exposing only ``worksheets``."""

        def __init__(self, worksheets):
            self.worksheets = worksheets

    @classmethod
    def _row(cls, *typed_values):
        """Build one worksheet row from ``(data_type, value)`` pairs."""
        return tuple(cls._Cell(data_type, value) for data_type, value in typed_values)

    @classmethod
    def _workbook_of(cls, *sheets):
        """Build a workbook with one worksheet per list of rows given."""
        return cls._Workbook([cls._Worksheet(rows) for rows in sheets])

    @mock.patch("importer.utils.excel.load_workbook")
    def test_slurp_excel_single_worksheet_single_row(self, load_mock):
        load_mock.return_value = self._workbook_of(
            [
                self._row(("s", " Name "), ("s", "Age")),
                self._row(("s", " Alice "), ("n", 30)),
            ]
        )

        parsed = slurp_excel("ignored.xlsx")

        self.assertEqual(parsed, [{"Name": "Alice", "Age": 30}])

    @mock.patch("importer.utils.excel.load_workbook")
    def test_slurp_excel_multiple_worksheets_multiple_rows(self, load_mock):
        first_sheet = [
            self._row(("s", "H1")),
            self._row(("s", "v1")),
            self._row(("s", " v2 ")),
        ]
        second_sheet = [
            self._row(("s", " H2 "), ("s", "H3")),
            self._row(("n", 1), ("s", "  x ")),
        ]
        load_mock.return_value = self._workbook_of(first_sheet, second_sheet)

        parsed = slurp_excel("ignored.xlsx")

        # Order is by worksheet, then row order within each worksheet.
        expected = [
            {"H1": "v1"},
            {"H1": "v2"},
            {"H2": 1, "H3": "x"},
        ]
        self.assertEqual(parsed, expected)

    def test_clean_cell_value_trims_strings(self):
        padded_cell = self._Cell("s", "  padded  ")
        self.assertEqual(clean_cell_value(padded_cell), "padded")

    def test_clean_cell_value_passthrough_non_strings(self):
        number_cell = self._Cell("n", 42)
        bool_cell = self._Cell("b", True)
        self.assertEqual(clean_cell_value(number_cell), 42)
        self.assertTrue(clean_cell_value(bool_cell))


================================================
FILE: importer/tests/utils.py
================================================
from django.utils.text import slugify

from concordia.tests.utils import create_asset, create_item, create_project
from importer.models import (
    DownloadAssetImageJob,
    ImportItem,
    ImportItemAsset,
    ImportJob,
    VerifyAssetImageJob,
)


def create_import_job(*, project=None, **kwargs):
    """
    Build and save an ``ImportJob`` for use in tests.

    ``project`` is a ``concordia.models.Project`` instance; when it is omitted
    one is made with ``create_project()``. Any other keyword arguments are
    passed straight to the ``ImportJob`` constructor.
    """
    owning_project = create_project() if project is None else project
    job = ImportJob(project=owning_project, **kwargs)
    job.save()
    return job


def create_import_item(item=None, project=None, import_job=None, **kwargs):
    """
    Build and save an ``ImportItem`` for use in tests.

    Args:
        item: ``concordia.models.Item`` instance; created in the job's project
            when omitted.
        project: ``concordia.models.Project`` instance; only used when a new
            import job has to be created.
        import_job: ``importer.models.ImportJob`` instance; created when
            omitted.
        **kwargs: Passed straight to the ``ImportItem`` constructor.
    """
    # The job is resolved first because a default item lives in its project.
    job = create_import_job(project=project) if import_job is None else import_job
    target_item = create_item(project=job.project) if item is None else item
    record = ImportItem(item=target_item, job=job, **kwargs)
    record.save()
    return record


def create_import_asset(
    sequence_number=1,
    asset=None,
    item=None,
    import_item=None,
    project=None,
    import_job=None,
    **kwargs,
):
    """
    Build and save an ``ImportItemAsset`` for use in tests.

    Args:
        sequence_number: Has to be unique within a particular import_item.
        asset: ``concordia.models.Asset`` instance; created when omitted, with
            a slug built from the item's title and ``sequence_number``.
        item: ``concordia.models.Item`` instance; only used when a new import
            item has to be created.
        import_item: ``importer.models.ImportItem`` instance; created when
            omitted.
        project: ``concordia.models.Project`` instance, forwarded to
            ``create_import_item``.
        import_job: ``importer.models.ImportJob`` instance, forwarded to
            ``create_import_item``.
        **kwargs: Passed straight to the ``ImportItemAsset`` constructor.
    """
    parent = import_item
    if parent is None:
        parent = create_import_item(item=item, import_job=import_job, project=project)

    linked_asset = asset
    if linked_asset is None:
        title_slug = slugify(parent.item.title)
        linked_asset = create_asset(
            item=parent.item, slug=f"{title_slug}-{sequence_number}"
        )

    record = ImportItemAsset(
        sequence_number=sequence_number,
        asset=linked_asset,
        import_item=parent,
        **kwargs,
    )
    record.save()
    return record


def create_verify_asset_image_job(asset=None, batch=None, **kwargs):
    """
    Create and return a stored ``VerifyAssetImageJob``.

    A new asset is made with ``create_asset()`` when none is supplied; extra
    keyword arguments are forwarded to ``objects.create``.
    """
    target_asset = create_asset() if asset is None else asset
    return VerifyAssetImageJob.objects.create(
        asset=target_asset, batch=batch, **kwargs
    )


def create_download_asset_image_job(asset=None, batch=None, **kwargs):
    """
    Create and return a stored ``DownloadAssetImageJob``.

    A new asset is made with ``create_asset()`` when none is supplied; extra
    keyword arguments are forwarded to ``objects.create``.
    """
    target_asset = create_asset() if asset is None else asset
    return DownloadAssetImageJob.objects.create(
        asset=target_asset, batch=batch, **kwargs
    )


================================================
FILE: importer/utils/__init__.py
================================================
from .excel import slurp_excel
from .verify_images import create_verify_asset_image_job_batch

__all__ = [
    "slurp_excel",
    "create_verify_asset_image_job_batch",
]


================================================
FILE: importer/utils/excel.py
================================================
from typing import Any

from openpyxl import load_workbook
from openpyxl.cell.cell import Cell


def slurp_excel(filename: str) -> list[dict[str, Any]]:
    """
    Parse an Excel workbook into a list of row dictionaries.

    Each worksheet is read in order. The first row of each sheet is treated
    as the header; subsequent rows become dictionaries mapping header names
    to cell values (after basic cleaning via `clean_cell_value`). Worksheets
    that contain no rows at all are skipped.

    Args:
        filename (str): Path to the XLSX file.

    Returns:
        list[dict[str, Any]]: One dict per non-header row across all sheets.

    Raises:
        ValueError: If a data row has a different number of cells than the
            header row (from `zip(..., strict=True)`).
    """
    wb = load_workbook(filename=filename)

    cells: list[dict[str, Any]] = []

    for worksheet in wb.worksheets:
        # iter() is a no-op on a generator and also lets a plain sequence of
        # rows be consumed with next().
        rows = iter(worksheet.rows)

        # A worksheet without any rows has no header to read. A bare
        # next(rows) would raise StopIteration here and abort the whole
        # parse, so skip the sheet instead.
        header_row = next(rows, None)
        if header_row is None:
            continue
        headers = [clean_cell_value(cell) for cell in header_row]

        for row in rows:
            values = [clean_cell_value(cell) for cell in row]
            cells.append(dict(zip(headers, values, strict=True)))

    return cells


def clean_cell_value(cell: Cell) -> Any:
    """
    Normalize the value held by an openpyxl cell.

    Cells whose ``data_type`` is ``'s'`` (string) have surrounding whitespace
    stripped from their value; the value of any other cell is returned
    untouched.

    Args:
        cell (Cell): openpyxl cell to normalize.

    Returns:
        Any: The stripped string for string cells, otherwise the raw value.
    """
    if cell.data_type == "s":
        return cell.value.strip()
    return cell.value


================================================
FILE: importer/utils/verify_images.py
================================================
from collections.abc import Iterable
from itertools import islice
from uuid import UUID

from importer.models import VerifyAssetImageJob
from importer.tasks.images import batch_verify_asset_images_task

# Number of asset primary keys taken per chunk, and the ``batch_size`` passed
# to ``bulk_create``, in ``create_verify_asset_image_job_batch``.
BATCH_SIZE: int = 100


def create_verify_asset_image_job_batch(
    asset_pks: Iterable[int],
    batch: UUID,
) -> tuple[int, str]:
    """
    Create verification jobs chunk by chunk, then enqueue one batch task.

    The asset primary keys are consumed `BATCH_SIZE` at a time and each chunk
    is turned into `VerifyAssetImageJob` rows with `bulk_create`. Once every
    chunk has been written, the Celery task that verifies the batch's images
    is scheduled. The task is scheduled even when no keys were supplied.

    Args:
        asset_pks (Iterable[int]): Asset primary keys to generate jobs for.
        batch (UUID): Identifier to group jobs; unrelated to chunk size.

    Returns:
        tuple[int, str]: A pair of `(job_count, batch_admin_url)`.
    """
    # One shared iterator is essential: islice over a re-iterable such as a
    # list would restart from the first element on every call and never run
    # dry, looping forever.
    pk_stream = iter(asset_pks)

    def _next_chunk() -> list[int]:
        return list(islice(pk_stream, BATCH_SIZE))

    created_total = 0
    # iter(callable, sentinel) stops as soon as a chunk comes back empty.
    for pk_chunk in iter(_next_chunk, []):
        pending_jobs = [
            VerifyAssetImageJob(asset_id=asset_pk, batch=batch)
            for asset_pk in pk_chunk
        ]
        stored_jobs = VerifyAssetImageJob.objects.bulk_create(
            pending_jobs, batch_size=BATCH_SIZE
        )
        created_total += len(stored_jobs)

    batch_verify_asset_images_task.delay(batch=batch)

    return created_total, VerifyAssetImageJob.get_batch_admin_url(batch)


================================================
FILE: load_test.sh
================================================
#!/bin/bash
# Run Locust headlessly. Every setting below can be overridden from the
# environment.
set -euo pipefail

# ":=" assigns the default only when the variable is unset or empty.
: "${LOCUST_USERS:=100}"
: "${LOCUST_SPAWN_RATE:=2}"
: "${LOCUST_RUN_TIME:=1m30s}"
: "${LOCUST_HOST:=https://crowd-dev.loc.gov}"

locust_args=(
  --headless
  -u "${LOCUST_USERS}"
  -r "${LOCUST_SPAWN_RATE}"
  --run-time "${LOCUST_RUN_TIME}"
  --host "${LOCUST_HOST}"
)

# exec replaces this shell, so Locust's exit status becomes the script's.
exec locust "${locust_args[@]}"


================================================
FILE: locustfile.py
================================================
import logging
import random
import string
import time
from html.parser import HTMLParser
from pathlib import Path
from urllib.parse import urlencode, urljoin, urlparse

from gevent import sleep
from gevent.event import Event
from locust import HttpUser, between, events, runners, task
from locust.exception import StopUser

# ---------- behaviour switches ----------
ABORT_WHEN_NO_WORK = True  # stop the run if a next-* page has no work
NO_WORK_DUMP_HTML = False  # set True to write an HTML dump for debugging

# ---------- endpoints, cookies and request shaping ----------
# NOTE(review): the code that consumes these values lies outside this excerpt;
# their meaning is inferred from the names only - confirm before relying on it.
HOMEPAGE_PATH = "/"
NEXT_ASSET_PATH = "/next-transcribable-asset/"
NEXT_REVIEWABLE_ASSET_PATH = "/next-reviewable-asset/"
AJAX_STATUS_PATH = "/account/ajax-status/"
AJAX_MSG_PATH = "/account/ajax-messages/"
LOGIN_PATH = "/account/login/"
CSRF_COOKIE_NAME = "csrftoken"
SESSION_COOKIE_NAME = "sessionid"
CSRF_SEED_PATH = HOMEPAGE_PATH
POST_FIELD_NAME = "text"
POST_MIN_CHARS = 10
POST_MAX_CHARS = 200
SAME_PAGE_REPEAT_PROB = 0.75
REDIRECT_RETRIES = 3
REDIRECT_BACKOFF = 0.25

# ---------- test accounts and login behaviour ----------
# NOTE(review): presumably these describe pre-created load-test accounts -
# verify against the fixture commands named in NO_WORK_ERROR_MESSAGE.
TEST_USER_PREFIX = "locusttest"
TEST_USER_DOMAIN = "example.test"
TEST_USER_COUNT = 10_000
TEST_USER_PASSWORD = "locustpass123"  # nosec B105
LOGIN_BAD_PASSWORD_PROB = 0.10
LOGIN_MAX_ATTEMPTS = 5

# ---------- reviewer mix ----------
# NOTE(review): usage not visible here; the names suggest probabilities in
# the range 0..1 - confirm.
REVIEWER_SHARE = 0.20
REVIEW_EDIT_PROB = 0.50

# Hint logged by _trigger_global_abort and included in the banner printed by
# _on_quitting.
NO_WORK_ERROR_MESSAGE = (
    "Did you need to refresh the load test database? "
    "Try running the 'prepare_load_test_db' command or "
    "'create_load_test_fixtures' if you need fixtures first."
)

logger = logging.getLogger(__name__)

# ---------- global abort plumbing ----------

# Set by _trigger_global_abort; _on_quitting checks it (together with the
# reason below) to decide whether to print the abort banner.
GLOBAL_ABORT_EVENT: Event = Event()
# Text describing why the run was aborted; assigned by _trigger_global_abort.
GLOBAL_ABORT_REASON: str | None = None


@events.init.add_listener
def _on_locust_init(environment, **_):
    """
    Locust ``init`` listener: disable the graceful stop timeout and, when a
    runner exists, register the handler for ``global-abort`` messages.
    """

    def _handle_global_abort(env, msg, **kwargs):
        # Pull an optional reason out of the message payload; any problem
        # while reading it simply leaves the reason blank.
        try:
            payload = getattr(msg, "data", {}) or {}
            reason = payload.get("reason") or ""
        except Exception:
            reason = ""
        _trigger_global_abort(
            env, f"Global abort requested. {reason}", dump_html=None, broadcast=True
        )

    # stop immediately; do not wait for graceful wind down
    environment.stop_timeout = 0

    # Register a message handler so both master and workers react to global abort
    runner = getattr(environment, "runner", None)
    if runner:
        try:
            runner.register_message("global-abort", _handle_global_abort)
        except Exception as exc:
            logger.debug(
                "register_message failed (non-distributed run is fine): %s", exc
            )


@events.quitting.add_listener
def _on_quitting(environment, **_):
    """
    Locust quitting hook: when the run was aborted, emit a large banner with
    the abort reason and the database-refresh hint, both to stdout and to the
    error log.
    """
    was_aborted = GLOBAL_ABORT_EVENT.is_set() or GLOBAL_ABORT_REASON
    if not was_aborted:
        return

    heavy_rule = "=" * 80
    light_rule = "-" * 80
    why = GLOBAL_ABORT_REASON or "Aborted"
    banner = "".join(
        [
            "\n",
            heavy_rule,
            "\n LOAD TEST ABORTED\n",
            light_rule,
            "\n",
            f"{why}\n\n{NO_WORK_ERROR_MESSAGE}\n",
            heavy_rule,
            "\n",
        ]
    )

    # stdout first (it may be closed at shutdown, hence the guard), then the
    # logger so the banner shows up wherever logs are collected.
    try:
        print(banner, flush=True)
    except Exception:
        pass
    logger.error(banner)


def _trigger_global_abort(
    environment, reason: str, dump_html: str | None = None, *, broadcast: bool = True
) -> None:
    """
    Abort the whole load test exactly once.

    Records ``reason``, sets the global abort event that every user checks,
    optionally writes ``dump_html`` to a timestamped file in the working
    directory, sets the process exit code to 2 when the environment exposes
    one, and finally notifies the other side of a distributed run before
    quitting the local runner.

    Args:
        environment: The Locust environment of the calling user or hook.
        reason: Text stored in GLOBAL_ABORT_REASON and sent to other nodes.
        dump_html: Page body to write to disk; nothing is written when falsy.
        broadcast: When True and the runner is a master, forward the abort
            to the workers.
    """
    global GLOBAL_ABORT_REASON

    # Only the first caller does any work; later calls are no-ops.
    if GLOBAL_ABORT_EVENT.is_set():
        return
    GLOBAL_ABORT_REASON = reason
    GLOBAL_ABORT_EVENT.set()

    logger.error("Aborting load test: %s", reason)
    logger.error(NO_WORK_ERROR_MESSAGE)

    if dump_html:
        try:
            dump_path = Path(f"no_work_{int(time.time())}.html").resolve()
            dump_path.write_text(dump_html, encoding="utf-8")
            logger.error("No-work HTML dumped to %s", dump_path)
        except Exception as exc:
            logger.error("Failed to dump no-work HTML (%s)", exc)

    # Make the process exit non-zero when the environment supports it.
    try:
        if hasattr(environment, "process_exit_code"):
            environment.process_exit_code = 2
    except Exception:
        pass

    active_runner = getattr(environment, "runner", None)
    if not active_runner:
        return

    try:
        # A worker that found the problem reports it to the master.
        if isinstance(active_runner, runners.WorkerRunner):
            active_runner.send_message("global-abort", {"reason": reason})

        # The master relays the abort to every worker when asked to.
        if broadcast and isinstance(active_runner, runners.MasterRunner):
            active_runner.send_message("global-abort", {"reason": reason})

        active_runner.quit()
    except Exception as exc:
        logger.error("Error quitting runner: %s", exc)


# ---------- helpers ----------


def _is_local(path_or_url: str, base: str) -> bool:
    if not path_or_url:
        return False
    if path_or_url.startswith("/"):
        return True
    parsed = urlparse(path_or_url)
    if not parsed.scheme:
        return True
    return urlparse(base).netloc == parsed.netloc


class _ResourceParser(HTMLParser):
    """Extract local script and stylesheet URLs from the page."""

    def __init__(self, base_url: str):
        super().__init__()
        self.base_url = base_url
        self.resources = []

    def handle_starttag(self, tag, attrs):
        attrs = dict(attrs)
        if tag == "script":
            src = attrs.get("src")
            if src and _is_local(src, self.base_url):
                self.resources.append(urljoin(self.base_url, src))
        elif tag == "link":
            rel = (attrs.get("rel") or "").lower()
            href = attrs.get("href")
            if "stylesheet" in rel and href and _is_local(href, self.base_url):
                self.resources.append(urljoin(self.base_url, href))


class _AssetPageParser(HTMLParser):
    """
    Extract form action, supersedes, reserve URL
    and review endpoints from an asset page.
    """

    def __init__(self, base_url: str):
        super().__init__()
        self.base_url = base_url
        self.in_transcription_form = False
        self.form_action = None
        self.supersedes = None
        self.reserve_url = None
        self.review_url = None
        self.submit_url = None

    def handle_starttag(self, tag, attrs):
        a = dict(attrs)
        if tag == "form":
            if a.get("id") == "transcription-editor":
                self.in_transcription_form = True
                action = a.get("action")
                if action is not None:
                    resolved = (
                        self.base_url
                        if action.strip() == ""
                        else urljoin(self.base_url, action)
                    )
                    self.form_action = resolved
                review_attr = a.get("data-review-url")
                if review_attr:
                    self.review_url = urljoin(self.base_url, review_attr)
                submit_attr = a.get("data-submit-url")
                if submit_attr:
                    self.submit_url = urljoin(self.base_url, submit_attr)
        elif tag == "input":
            if a.get("name") == "supersedes" and a.get("value"):
                self.supersedes = a["value"]
        elif tag == "script":
            if a.get("id") == "asset-reservation-data":
                reserve = a.get("data-reserve-asset-url")
                if reserve:
                    self.reserve_url = urljoin(self.base_url, reserve)

    def handle_endtag(self, tag):
        if tag == "form" and self.in_transcription_form:
            self.in_transcription_form = False


def _random_text(min_len=10, max_len=200) -> str:
    n = random.randint(min_len, max_len)
    alphabet = string.ascii_letters + string.digits + "     "
    s = "".join(random.choice(alphabet) for _ in range(n))
    return " ".join(s.split())


# ---------- users ----------


class BaseBrowsingUser(HttpUser):
    """
    Shared browse/post behavior. Subclasses provide their own on_start.

    Each simulated user works on one asset page at a time: it follows a
    next-* redirect to obtain a page, parses that page for the endpoints it
    needs, and then either saves generated text or records a review
    decision, depending on whether the instance has ``is_reviewer`` set.
    """

    abstract = True
    wait_time = between(3.0, 8.0)

    # State for the asset page currently being worked on. The path values are
    # "path?query" strings relative to the host; all are None until parsed.
    current_target_path: str | None = None
    current_form_action_path: str | None = None
    current_supersedes: str | None = None
    current_reserve_path: str | None = None
    current_review_url_path: str | None = None
    current_submit_url_path: str | None = None

    # Which next-* redirect this user follows and the request name used for it.
    next_redirect_path: str = NEXT_ASSET_PATH
    next_redirect_label: str = "next asset (redirect)"

    # Flipped on BaseBrowsingUser itself, so the fatal dump happens only once
    # no matter which subclass hits it first.
    _fatal_already_triggered = False

    # ----- small shared helpers -----

    @staticmethod
    def _path_with_query(url: str | None) -> str | None:
        """Reduce ``url`` to ``path[?query]``; return None for a falsy url."""
        if not url:
            return None
        parts = urlparse(url)
        return parts.path + (("?" + parts.query) if parts.query else "")

    def _referer_for(self, target_path: str) -> str:
        """Build the absolute Referer URL for ``target_path`` on this host."""
        base = self.environment.host.rstrip("/")
        return urljoin(base + "/", target_path.lstrip("/"))

    def _clear_asset_state(self) -> None:
        """Forget everything parsed from the previous asset page."""
        self.current_form_action_path = None
        self.current_supersedes = None
        self.current_reserve_path = None
        self.current_review_url_path = None
        self.current_submit_url_path = None

    def _advance_to_next_asset(self) -> bool:
        """
        Follow this user's next-* redirect and adopt the page it lands on.

        Returns False, leaving the current state untouched, when the redirect
        produced no usable page.
        """
        new_path = self._follow_next(self.next_redirect_path, self.next_redirect_label)
        if new_path is None:
            return False
        self.current_target_path = new_path
        self._clear_asset_state()
        return True

    # ----- request plumbing -----

    def _fatal_dump_and_quit(self, page_url: str, html: str) -> None:
        """
        Write the offending page to ``asset_parse_failure_<ts>.html`` and
        quit the runner. Only the first call across all users does anything.
        """
        if BaseBrowsingUser._fatal_already_triggered:
            return
        BaseBrowsingUser._fatal_already_triggered = True

        ts = int(time.time())
        out = Path(f"asset_parse_failure_{ts}.html").resolve()
        try:
            out.write_text(html or "", encoding="utf-8")
            logger.error(
                "FATAL: transcription form not found. Page URL=%s ; HTML dumped to %s",
                page_url,
                out,
            )
        except Exception as e:
            logger.error(
                "FATAL: failed to write HTML dump (%s). Page URL=%s", e, page_url
            )

        try:
            self.environment.runner.quit()
        except Exception as e:
            logger.error("Error calling runner.quit(): %s", e)

    def _after_request_ajax(self):
        """Issue the two AJAX calls made after a full page load."""
        # simulate normal page load
        self.client.get(AJAX_STATUS_PATH, name="AJAX status")
        self.client.get(AJAX_MSG_PATH, name="AJAX messaging")

    def _get(self, path_or_url: str, *, page: bool = True, **kwargs):
        """GET ``path_or_url``; when ``page`` is True also fire the AJAX calls."""
        r = self.client.get(path_or_url, **kwargs)
        if page:
            self._after_request_ajax()
        return r

    def _post(self, path_or_url: str, **kwargs):
        """POST to ``path_or_url`` with the given keyword arguments."""
        return self.client.post(path_or_url, **kwargs)

    def _load_homepage_and_resources(self, *, name_suffix: str = ""):
        """
        Load the homepage, then fetch each local script and stylesheet it
        references. ``name_suffix`` is appended to the per-resource request
        names.
        """
        base = self.environment.host.rstrip("/")
        r_home = self._get(HOMEPAGE_PATH, page=True)

        parser = _ResourceParser(base_url=base + "/")
        try:
            parser.feed(r_home.text or "")
        except Exception:
            # An unparsable homepage simply means no resources are fetched.
            parser.resources = []

        for res_url in parser.resources:
            label = "resource " + urlparse(res_url).path
            if name_suffix:
                label = f"{label} {name_suffix}"
            self._get(res_url, name=label, page=False)

    def _parse_asset_page_and_reserve(self, target_path: str) -> None:
        """
        Load ``target_path``, refresh the ``current_*`` endpoints from it and,
        when the page advertises a reservation endpoint, POST to it.

        A page without a transcription form counts as "no work": depending on
        ABORT_WHEN_NO_WORK the whole run is aborted or the current target is
        dropped.
        """
        r = self._get(target_path, name="target page", page=True)

        parser = _AssetPageParser(base_url=r.url)
        try:
            parser.feed(r.text or "")
        except Exception:
            self._fatal_dump_and_quit(r.url, r.text or "")
            return

        self.current_form_action_path = self._path_with_query(parser.form_action)
        self.current_supersedes = parser.supersedes
        self.current_reserve_path = self._path_with_query(parser.reserve_url)
        self.current_review_url_path = self._path_with_query(parser.review_url)
        self.current_submit_url_path = self._path_with_query(parser.submit_url)

        if not self.current_form_action_path:
            if ABORT_WHEN_NO_WORK:
                _trigger_global_abort(
                    self.environment,
                    f"No work available (no transcription form) on {r.url}",
                    (r.text or "") if NO_WORK_DUMP_HTML else None,
                    broadcast=True,
                )
            else:
                logger.info("No transcription form on %s; treating as no work", r.url)
                self.current_target_path = None
                self.current_review_url_path = None
                self.current_submit_url_path = None
            return

        if self.current_reserve_path:
            csrftoken = self.client.cookies.get(CSRF_COOKIE_NAME)
            self._post(
                self.current_reserve_path,
                headers={
                    "X-CSRFToken": csrftoken or "",
                    "Referer": self._referer_for(target_path),
                },
                name="reserve asset",
            )

    def _ensure_csrf(self, target_path: str | None) -> str | None:
        """
        Return the CSRF cookie value to use for ``target_path``.

        Parses the asset page first when nothing has been parsed yet. If no
        cookie is present afterwards, the seed page is fetched and the asset
        page parsed again. Returns None when there is no target or no cookie
        could be obtained.
        """
        if not target_path:
            return None

        if (
            self.current_form_action_path is None
            and self.current_review_url_path is None
        ):
            self._parse_asset_page_and_reserve(target_path)

        csrftoken = self.client.cookies.get(CSRF_COOKIE_NAME)

        if not csrftoken and CSRF_SEED_PATH:
            self._get(CSRF_SEED_PATH, name="csrf seed", page=True)
            self._parse_asset_page_and_reserve(target_path)
            csrftoken = self.client.cookies.get(CSRF_COOKIE_NAME)

        return csrftoken

    def _follow_next(self, redirect_path: str, label: str) -> str | None:
        """
        Follow the next-* redirect. If it lands on the homepage, treat that as no work.

        Up to REDIRECT_RETRIES attempts are made, with a linearly growing
        pause between them. Returns the final path on success, or None when
        there is no work or every attempt failed.
        """
        last_body = None
        for attempt in range(1, REDIRECT_RETRIES + 1):
            with self.client.get(
                redirect_path,
                name=label,
                allow_redirects=True,
                catch_response=True,
            ) as resp:
                try:
                    last_body = (resp.text or "")[:10000]
                except Exception:
                    last_body = None

                if 200 <= resp.status_code < 400:
                    final_path = urlparse(resp.url).path or "/"
                    if final_path == HOMEPAGE_PATH:
                        msg = f"{label} landed on homepage -> no work"
                        resp.failure(msg)
                        logger.error(msg)
                        if ABORT_WHEN_NO_WORK:
                            _trigger_global_abort(
                                self.environment,
                                f"No work available from {label} ({redirect_path})",
                                last_body if NO_WORK_DUMP_HTML else None,
                                broadcast=True,
                            )
                        return None
                    return final_path

                msg = (
                    f"redirect failed (status={resp.status_code}) "
                    f"attempt={attempt}/{REDIRECT_RETRIES}"
                )
                resp.failure(msg)
                logger.warning("%s retry: %s", label, msg)

            # Back off only when another attempt will follow.
            if attempt < REDIRECT_RETRIES:
                sleep(REDIRECT_BACKOFF * attempt)

        logger.error("%s: all %d retries failed", label, REDIRECT_RETRIES)
        return None

    def _post_then_get_same_page(
        self, target_path: str | None, csrftoken: str, name_prefix: str
    ):
        """
        POST generated text to the current form action, then reload and
        re-parse ``target_path``. Does nothing without a target or form
        action.
        """
        if not target_path:
            return
        post_path = self.current_form_action_path
        if not post_path:
            logger.warning("No form action parsed for %s; skipping POST", target_path)
            return

        data = {POST_FIELD_NAME: _random_text(POST_MIN_CHARS, POST_MAX_CHARS)}
        if self.current_supersedes:
            data["supersedes"] = self.current_supersedes

        self._post(
            post_path,
            data=data,
            headers={
                "X-CSRFToken": csrftoken,
                "Referer": self._referer_for(target_path),
            },
            name=f"{name_prefix} POST",
        )
        self._parse_asset_page_and_reserve(target_path)

    def _review_decision(self, target_path: str, decision: str) -> None:
        """
        POST ``decision`` to the review endpoint parsed from the current
        page. Does nothing when no review endpoint is known.
        """
        if not self.current_review_url_path:
            return
        csrftoken = self.client.cookies.get(CSRF_COOKIE_NAME) or ""

        form = {"csrfmiddlewaretoken": csrftoken, "decision": decision}
        name = "review accept" if decision == "accept" else "review reject"
        self._post(
            self.current_review_url_path,
            data=form,
            headers={
                "X-CSRFToken": csrftoken,
                "Referer": self._referer_for(target_path),
            },
            name=name,
        )

    @task
    def browse_and_submit(self):
        """
        One iteration of user activity: pick (or keep) an asset page, make
        sure a CSRF token is available, then act as reviewer or transcriber.
        """
        # if someone already pulled the plug, stop this user
        if GLOBAL_ABORT_EVENT.is_set():
            raise StopUser()

        if not self.current_target_path:
            if not self._advance_to_next_asset():
                return
        else:
            # Only non-reviewers may wander off to a different asset here;
            # reviewers always finish the page they hold.
            maybe_switch = getattr(self, "is_reviewer", False) is False
            if maybe_switch and random.random() >= SAME_PAGE_REPEAT_PROB:
                if not self._advance_to_next_asset():
                    return

        csrftoken = self._ensure_csrf(self.current_target_path)
        if not csrftoken:
            if self.current_target_path:
                self._get(
                    self.current_target_path, name="target page (no CSRF)", page=True
                )
            return

        if getattr(self, "is_reviewer", False):
            do_edit = random.random() < REVIEW_EDIT_PROB
            if do_edit:
                # Reject, reload the page, then save an edited transcription.
                self._review_decision(self.current_target_path, "reject")
                self._parse_asset_page_and_reserve(self.current_target_path)
                csrftoken = self._ensure_csrf(self.current_target_path) or ""
                if csrftoken:
                    self._post_then_get_same_page(
                        self.current_target_path, csrftoken, "review edit save"
                    )
            else:
                self._review_decision(self.current_target_path, "accept")

            # A reviewed page is done; the next iteration fetches a new one.
            self.current_target_path = None
            self._clear_asset_state()
            return

        # Transcriber branch
        self._post_then_get_same_page(self.current_target_path, csrftoken, "target")

        if random.random() < SAME_PAGE_REPEAT_PROB:
            csrftoken = self.client.cookies.get(CSRF_COOKIE_NAME) or self._ensure_csrf(
                self.current_target_path
            )
            if csrftoken:
                self._post_then_get_same_page(
                    self.current_target_path, csrftoken, "target (repeat)"
                )


class AnonUser(BaseBrowsingUser):
    """Simulated visitor who browses and submits without logging in."""

    def on_start(self):
        """Begin the session by loading the homepage and its local resources."""
        self._load_homepage_and_resources(name_suffix="")


class AuthUser(BaseBrowsingUser):
    """
    Simulated visitor who logs in as a randomly chosen fixture account and
    then acts either as a transcriber or as a reviewer.
    """

    chosen_username: str | None = None
    chosen_email: str | None = None
    is_reviewer: bool = False

    def _pick_fixture_user(self):
        """Choose one fixture account at random and remember its credentials."""
        number = random.randint(1, TEST_USER_COUNT)
        self.chosen_username = f"{TEST_USER_PREFIX}{number:05d}"
        self.chosen_email = f"{self.chosen_username}@{TEST_USER_DOMAIN}"

    def _login_once(self, login_url: str, referer: str) -> bool:
        """
        Submit the login form once.

        The account is identified by username or email (even odds), and with
        probability LOGIN_BAD_PASSWORD_PROB a wrong password is sent on
        purpose. Success is judged by the presence of the session cookie,
        checked right after the POST and again after loading the homepage.
        """

        def _csrf_cookie() -> str:
            return self.client.cookies.get(CSRF_COOKIE_NAME) or ""

        token = _csrf_cookie()
        if not token:
            # No CSRF cookie yet: load the login page to obtain one.
            self._get(login_url, name="login page", page=True)
            token = _csrf_cookie()

        assert self.chosen_username and self.chosen_email
        if random.random() < 0.5:
            identifier = self.chosen_username
        else:
            identifier = self.chosen_email

        use_bad_password = random.random() < LOGIN_BAD_PASSWORD_PROB
        if use_bad_password:
            password = TEST_USER_PASSWORD + "x"
        else:
            password = TEST_USER_PASSWORD

        self._post(
            login_url,
            data={
                "username": identifier,
                "password": password,
                "csrfmiddlewaretoken": token,
                "next": "/",
            },
            headers={"X-CSRFToken": token, "Referer": referer},
            name="login POST",
        )

        if self.client.cookies.get(SESSION_COOKIE_NAME):
            return True

        # Give the session cookie one more chance to appear.
        self._get("/", name="post-login home probe", page=True)
        return bool(self.client.cookies.get(SESSION_COOKIE_NAME))

    def on_start(self):
        """
        Visit the homepage, attempt to log in (retrying up to
        LOGIN_MAX_ATTEMPTS times), decide the user's role and finally load
        the homepage with its resources.
        """
        self._get(HOMEPAGE_PATH, page=True)
        self._pick_fixture_user()

        login_url = LOGIN_PATH + "?" + urlencode({"next": "/"})
        site_root = self.environment.host.rstrip("/") + "/"
        referer = urljoin(site_root, LOGIN_PATH.lstrip("/"))

        self._get(login_url, name="login page", page=True)

        for _attempt in range(LOGIN_MAX_ATTEMPTS):
            if self._login_once(login_url, referer):
                break
            self._get(login_url, name="login page (retry)", page=True)
        else:
            # Reached only when no attempt succeeded.
            logger.error(
                "AuthUser failed to authenticate after %d attempts (user=%s / %s)",
                LOGIN_MAX_ATTEMPTS,
                self.chosen_username,
                self.chosen_email,
            )

        self.is_reviewer = random.random() < REVIEWER_SHARE
        redirect_path, redirect_label = (
            (NEXT_REVIEWABLE_ASSET_PATH, "next reviewable (redirect)")
            if self.is_reviewer
            else (NEXT_ASSET_PATH, "next asset (redirect)")
        )
        self.next_redirect_path = redirect_path
        self.next_redirect_label = redirect_label

        self._load_homepage_and_resources(name_suffix="(authed)")


================================================
FILE: manage.py
================================================
#!/usr/bin/env python3
import sys

def main():
    """Hand the command line over to Django's management utility."""
    try:
        from django.core.management import execute_from_command_line
    except ImportError as exc:
        # Re-raise with a hint about the most common causes.
        raise ImportError(
            "Couldn't import Django. Are you sure it's installed and "
            "available on your PYTHONPATH environment variable? Did you "
            "forget to activate a virtual environment?"
        ) from exc
    execute_from_command_line(sys.argv)


if __name__ == "__main__":
    main()


================================================
FILE: package.json
================================================
{
    "devDependencies": {
        "@axe-core/cli": "^4.11.3",
        "@puppeteer/browsers": "^2.10.13",
        "child_process": "^1.0.2",
        "sass-embedded": "^1.99.0",
        "stylelint-value-no-unknown-custom-properties": "^6.1.1",
        "vite": "^8.0.10",
        "vite-plugin-compression2": "^2.5.2"
    },
    "dependencies": {
        "@duetds/date-picker": "^1.4.0",
        "@fortawesome/fontawesome-free": "^7.1.0",
        "@popperjs/core": "^2.11.8",
        "@sentry/browser": "^10.49.0",
        "@sentry/core": "^10.48.0",
        "@sentry/tracing": "^7.120.4",
        "bootstrap": "^5.3.8",
        "chart.js": "^4.5.1",
        "chroma-js": "^3.2.0",
        "codemirror": "^5.65.19",
        "fancy-log": "^2.0.0",
        "jquery": "^3.5.1",
        "js-cookie": "^3.0.5",
        "openseadragon": "^6.0.2",
        "openseadragon-filters": "^2.2.0",
        "prettier": "^2.8.8",
        "remarkable": "^2.0.1",
        "screenfull": "^6.0.0",
        "split.js": "^1.6.2",
        "urijs": "^1.19.11"
    },
    "name": "concordia",
    "private": true,
    "version": "1.0.0",
    "directories": {
        "doc": "docs"
    },
    "repository": {
        "type": "git",
        "url": "git+https://github.com/LibraryOfCongress/concordia.git"
    },
    "license": "CC0-1.0",
    "bugs": {
        "url": "https://github.com/LibraryOfCongress/concordia/issues"
    },
    "homepage": "https://github.com/LibraryOfCongress/concordia",
    "scripts": {
        "dev": "vite",
        "copy-vendor": "mkdir -p concordia/static/openseadragon/images && cp -R node_modules/openseadragon/build/openseadragon/images/* concordia/static/openseadragon/images/",
        "build": "npm run copy-vendor && vite build",
        "preview": "vite preview",
        "postinstall": "npm run copy-vendor"
    }
}


================================================
FILE: postgresql/create-multiple-postgresql-databases.sh
================================================
#!/bin/bash
set -e
set -u

# Create a role and a database that are both named after the first argument,
# then grant that role all privileges on the database.
# Connects with psql as $POSTGRES_USER.
function create_user_and_database() {
	local database=$1
	echo "  Creating user and database '$database'"
	# ON_ERROR_STOP makes psql return a failure status as soon as one of the
	# statements fails; with "set -e" above that aborts the script.
	psql -v ON_ERROR_STOP=1 --username "$POSTGRES_USER" <<-EOSQL
	    CREATE USER $database;
	    CREATE DATABASE $database;
	    GRANT ALL PRIVILEGES ON DATABASE $database TO $database;
EOSQL
}

# Create one role + database per comma-separated name listed in
# POSTGRES_MULTIPLE_DATABASES. The ":-" default keeps "set -u" from aborting
# the script when the variable is not set at all; in that case nothing is
# created.
if [ -n "${POSTGRES_MULTIPLE_DATABASES:-}" ]; then
	echo "Multiple database creation requested: $POSTGRES_MULTIPLE_DATABASES"
	# The command substitution is left unquoted on purpose so the
	# space-separated names are split into individual loop items.
	for db in $(echo "$POSTGRES_MULTIPLE_DATABASES" | tr ',' ' '); do
		create_user_and_database "$db"
		if [ "$db" = "sentry" ]; then
			echo "  Giving sentry superuser powers!!"
			# Connect as the same user the rest of the script uses
			# instead of assuming a role literally named "postgres".
			psql -v ON_ERROR_STOP=1 --username "$POSTGRES_USER" -c "ALTER ROLE sentry superuser;"
		fi
	done
	echo "Multiple databases created"
fi


================================================
FILE: prometheus_metrics/LICENSE
================================================
MIT License

Copyright (c) 2017 Jimdo GmbH

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.


================================================
FILE: prometheus_metrics/__init__.py
================================================


================================================
FILE: prometheus_metrics/apps.py
================================================
from django.apps import AppConfig


class PrometheusMetricsConfig(AppConfig):
    """Django application configuration for the ``prometheus_metrics`` app."""

    name = "prometheus_metrics"
    verbose_name = "Prometheus Metrics"


================================================
FILE: prometheus_metrics/middleware.py
================================================
from timeit import default_timer

from django.utils.deprecation import MiddlewareMixin
from prometheus_client import Counter, Histogram

# Request counter, labelled by response status code, HTTP method and view.
requests_total = Counter(
    "django_http_requests_total",
    "Total count of requests",
    ["status_code", "method", "view"],
)
# Request processing time histogram using the same three labels.
requests_latency = Histogram(
    "django_http_requests_latency_seconds",
    "Histogram of requests processing time",
    ["status_code", "method", "view"],
)


class PrometheusBeforeMiddleware(MiddlewareMixin):
    """
    Middleware that feeds the request counter and latency histogram.

    The start time is stamped on the request on the way in; on the way out
    the request is counted and, when a start time is present, its duration
    is observed.
    """

    def process_request(self, request):
        """Remember when processing of this request started."""
        request.prometheus_middleware_request_start = default_timer()

    def process_response(self, request, response):
        """Record the metrics for this request and pass the response on."""
        match = request.resolver_match
        if not match:
            view_label = "<unnamed view>"
        else:
            # Prefer the URL name, fall back to the view name; dashes are
            # replaced with underscores in either case.
            view_label = (match.url_name or match.view_name).replace("-", "_")

        label_values = (response.status_code, request.method, view_label)
        requests_total.labels(*label_values).inc()

        # The start stamp is missing when process_request never ran.
        if hasattr(request, "prometheus_middleware_request_start"):
            histogram = requests_latency.labels(*label_values)
            histogram.observe(
                default_timer() - request.prometheus_middleware_request_start
            )
        return response


================================================
FILE: prometheus_metrics/models.py
================================================
from prometheus_client import Counter

# Per-model operation counters; each carries a single "model" label whose
# value is the name passed to MetricsModelMixin.
model_inserts_total = Counter(
    "django_model_inserts_total", "Number of inserts on a certain model", ["model"]
)
model_updates_total = Counter(
    "django_model_updates_total", "Number of updates on a certain model", ["model"]
)
model_deletes_total = Counter(
    "django_model_deletes_total", "Number of deletes on a certain model", ["model"]
)


def MetricsModelMixin(name):
    """
    Build a mixin class that counts inserts, updates and deletes for a model.

    Intended use is as a base listed before the model base class, e.g.
    ``class Foo(MetricsModelMixin("foo"), models.Model)``, so that the
    ``super()`` calls below reach the real implementation.

    Args:
        name: Value used for the ``model`` label on all three counters.

    Returns:
        A new mixin class bound to ``name``.

    Note:
        Deletes are counted by overriding ``delete``, which is the method
        Django calls on a model instance. Deletions that do not call the
        instance's ``delete()`` are not counted. ``_do_delete`` is kept only
        so existing direct callers keep working.
    """

    class Mixin:
        def _do_insert(self, *args, **kwargs):
            """Count the insert, then delegate to the next class in the MRO."""
            model_inserts_total.labels(name).inc()
            return super()._do_insert(*args, **kwargs)

        def _do_update(self, *args, **kwargs):
            """Count the update, then delegate to the next class in the MRO."""
            model_updates_total.labels(name).inc()
            return super()._do_update(*args, **kwargs)

        def delete(self, *args, **kwargs):
            """Count the delete, then delegate to the next class in the MRO."""
            model_deletes_total.labels(name).inc()
            return super().delete(*args, **kwargs)

        def _do_delete(self, *args, **kwargs):
            """
            Backward-compatible alias with the original behavior. It goes
            straight to the parent ``delete`` so the delete is counted once.
            """
            model_deletes_total.labels(name).inc()
            return super().delete(*args, **kwargs)

    return Mixin


================================================
FILE: prometheus_metrics/views.py
================================================
import prometheus_client
from django.http import HttpResponse
from django.views import View


class MetricsView(View):
    """Serve the current Prometheus metrics."""

    def get(self, request, *args, **kwargs):
        """Return the latest metrics with the Prometheus content type."""
        return HttpResponse(
            prometheus_client.generate_latest(),
            content_type=prometheus_client.CONTENT_TYPE_LATEST,
        )


================================================
FILE: pylenium.json
================================================
{
    "driver": {
        "browser": "chrome",
        "remote_url": "",
        "wait_time": 10,
        "page_load_wait_time": 0,
        "options": [
            "headless",
            "no-sandbox",
            "disable-gpu"
        ],
        "capabilities": {},
        "experimental_options": null,
        "extension_paths": [],
        "webdriver_kwargs": {},
        "seleniumwire_enabled": false,
        "seleniumwire_options": {},
        "local_path": ""
    },
    "logging": {
        "screenshots_on": true
    },
    "viewport": {
        "maximize": true,
        "width": 1440,
        "height": 900,
        "orientation": "portrait"
    },
    "customer": {}
}


================================================
FILE: pyproject.toml
================================================
[tool.black]
target_version = ["py312"]
exclude = '''
(
  /(
    | \.git
    | node_modules
  )/
)
'''

[tool.ruff]
target-version = "py310"
select = [
    "E",
    "F",
    "W",
    "A", # flake8-builtins
    "B", # flake8-bugbear
    "C4", # flake8-comprehensions
    "ERA", # flake8-eradicate
    "G", # flake8-logging-format
    "I", # isort
]
ignore-init-module-imports = true  # Prevents removing imports from __init__.py

extend-exclude = [
        "concordia/settings_dev_*.py"
]

# Ignore line length in migrations
[tool.ruff.per-file-ignores]
"*/migrations/*" = ["E501"]

# setuptools_scm v8.0.4 broke the original setup-based configuration for deriving
# the version from git; this (empty) section is now required.
[tool.setuptools_scm]


================================================
FILE: setup.cfg
================================================
[pycodestyle]
exclude = .venv,docs/conf.py
ignore =
max-line-length = 88

[tool:pytest]
DJANGO_SETTINGS_MODULE = concordia.settings_test
addopts = -rf

[isort]
default_section = THIRDPARTY
force_grid_wrap = 0
include_trailing_comma = True
known_first_party = concordia,importer,exporter
line_length = 88
multi_line_output = 3
skip = .venv
use_parentheses = True

[flake8]
exclude = .venv,node_modules,concordia/settings_dev_*.py
max-line-length = 88
enable-extensions = G
per-file-ignores =
    */migrations/*:E501

[readme_check]
readmes =
    concordia/views/README.md


================================================
FILE: setup.py
================================================
#!/usr/bin/env python
from setuptools import find_packages, setup

# The version string is obtained by importing the package and calling its
# get_version() helper.
VERSION = __import__("concordia").get_version()
INSTALL_REQUIREMENTS = ["boto3", "Django>=4.2"]
SCRIPTS = ["manage.py"]
DESCRIPTION = "Transcription crowdsourcing"
# One trove classifier per line; split into the list setup() expects.
CLASSIFIERS = """\
Environment :: Web Environment
Framework :: Django
Programming Language :: Python
Programming Language :: Python :: 3.12
""".splitlines()

# Decode explicitly as UTF-8 so the build does not depend on the platform's
# default locale encoding.
with open("README.md", encoding="utf-8") as f:
    LONG_DESCRIPTION = f.read()


# NOTE(review): both a static `version` and `use_scm_version` are supplied;
# confirm which of the two is expected to take effect.
setup(
    name="concordia",
    version=VERSION,
    description=DESCRIPTION,
    long_description=LONG_DESCRIPTION,
    # README.md is Markdown; declare it so the description is not rendered as
    # reStructuredText (the default assumption).
    long_description_content_type="text/markdown",
    packages=find_packages(),
    include_package_data=True,
    scripts=SCRIPTS,
    install_requires=INSTALL_REQUIREMENTS,
    classifiers=CLASSIFIERS,
    use_scm_version={
        "write_to": "version.txt",
        "tag_regex": r"^(?P<prefix>v)?(?P<version>[^\+]+)(?P<suffix>.*)?$",
    },
    setup_requires=["setuptools_scm"],
)


================================================
FILE: src/about.js
================================================
import '../concordia/static/js/src/modules/concordia-visualization.js';
import '../concordia/static/js/src/visualizations/asset-status-overview.js';
import '../concordia/static/js/src/visualizations/daily-activity.js';


================================================
FILE: src/main.js
================================================
// Entry module for the `main` bundle (see the `main` input in vite.config.js).
import $ from 'jquery';
// Publish jQuery on `window` under both of its conventional global names.
// NOTE(review): ES module imports are hoisted, so every module imported in
// this file is evaluated before this assignment runs, regardless of where the
// statement appears. Any imported module that needs `window.$` during its own
// top-level evaluation would not see it yet - confirm none of them do.
window.$ = window.jQuery = $;
import 'bootstrap';
import 'bootstrap/dist/css/bootstrap.min.css';

/* Local scripts, imported for their side effects */
import '../concordia/static/js/src/about-accordions.js';
import '../concordia/static/js/src/asset-reservation.js';
import '../concordia/static/js/src/banner.js';
import '../concordia/static/js/src/contribute.js';
import '../concordia/static/js/src/filter-assets.js';
import '../concordia/static/js/src/guide.js';
import '../concordia/static/js/src/homepage-carousel.js';
import '../concordia/static/js/src/ocr.js';
import {setTutorialHeight} from '../concordia/static/js/src/modules/quick-tips.js';
import '../concordia/static/js/src/quick-tips-setup.js';
import '../concordia/static/js/src/viewer.js';
import '../concordia/static/js/src/viewer-split.js';

/* Third-party */
import OpenSeadragon from 'openseadragon';

// Make OpenSeadragon reachable as a global.
window.OpenSeadragon = OpenSeadragon;

// Expose the quick-tips helper as a global as well (presumably for scripts
// outside the bundle - verify against the templates).
if (setTutorialHeight) {
    window.setTutorialHeight = setTutorialHeight;
}


================================================
FILE: src/profile.js
================================================
import '../concordia/static/js/src/campaign-selection.js';
import '../concordia/static/js/src/recent-pages.js';
import '../concordia/static/js/src/profile-fields.js';


================================================
FILE: static/.gitignore
================================================
css
js
sourcemaps
frontend


================================================
FILE: tools/readme_symbol_check.py
================================================
#!/usr/bin/env python3
"""
README Symbol Checker

This script verifies that all top-level class and function names defined in Python
files under the directory containing a given README.md file are mentioned somewhere
in the README.

To use it, configure `setup.cfg` with a [readme_check] section like:

    [readme_check]
    readmes =
        concordia/views/README.md

This will recursively scan all `.py` files in `concordia/views/` and ensure every
class/function defined in them appears by name (case-sensitive) somewhere in the
corresponding README.md.
"""

import ast
import configparser
import sys
from pathlib import Path
from typing import List


def collect_defined_symbols(py_path: Path) -> List[str]:
    """
    Parse a Python file and return all top-level class and function names.

    Both ``def`` and ``async def`` functions are reported. Only direct children
    of the module body are considered, so methods and nested functions are
    ignored. Names are returned in source order.

    Raises ``SyntaxError`` if the file cannot be parsed.
    """
    with py_path.open(encoding="utf-8") as f:
        tree = ast.parse(f.read(), filename=str(py_path))
    return [
        node.name
        for node in tree.body
        # ``async def`` is a distinct node type and must be listed explicitly.
        if isinstance(node, (ast.FunctionDef, ast.AsyncFunctionDef, ast.ClassDef))
    ]


def read_readme_text(readme_path: Path) -> str:
    """
    Return the README's entire contents, decoded as UTF-8.
    """
    with readme_path.open(mode="r", encoding="utf-8") as handle:
        contents = handle.read()
    return contents


def check_readme(readme_path: Path) -> int:
    """
    Check that each symbol defined in the Python files under the same directory
    as the README appears in the README text. Returns exit code (0 or 1).

    The match is a plain, case-sensitive substring test against the whole
    README. One ``V001`` line is printed to stdout per undocumented symbol.
    Files are visited in sorted path order so the report is stable from run to
    run and across filesystems.
    """
    readme_text = read_readme_text(readme_path)
    search_dir = readme_path.parent
    exit_code = 0

    # rglob() yields entries in filesystem order; sort for deterministic output.
    for py_file in sorted(search_dir.rglob("*.py")):
        for name in collect_defined_symbols(py_file):
            if name not in readme_text:
                print(f"V001 Symbol '{name}' is not documented in {readme_path.name}")
                exit_code = 1

    return exit_code


def load_readmes_from_config() -> List[Path]:
    """
    Return the README paths listed in the ``readmes`` option of the
    ``[readme_check]`` section of ``setup.cfg`` in the current directory.

    The option holds one path per line; blank lines are skipped and surrounding
    whitespace is stripped. If ``setup.cfg`` is missing, or the section/option
    is absent or empty, an error is written to stderr and the process exits
    with status 2.
    """
    setup_cfg = Path("setup.cfg")
    if not setup_cfg.exists():
        sys.stderr.write("ERROR: setup.cfg not found\n")
        sys.exit(2)

    parser = configparser.ConfigParser()
    parser.read(setup_cfg)

    # A missing section and a missing/empty option are reported identically,
    # so both collapse to an empty raw value.
    raw_value = ""
    if parser.has_section("readme_check"):
        raw_value = parser.get("readme_check", "readmes", fallback="")

    stripped_lines = (line.strip() for line in raw_value.splitlines())
    readmes = [Path(entry) for entry in stripped_lines if entry]
    if readmes:
        return readmes

    sys.stderr.write("ERROR: No [readme_check] readmes configured in setup.cfg\n")
    sys.exit(2)


def main() -> None:
    """
    Check every configured README and exit with the most severe status seen:
    0 when everything is documented, 1 when a symbol is missing from a README,
    2 when a configured README file does not exist.
    """
    worst_status = 0

    for readme_path in load_readmes_from_config():
        if readme_path.exists():
            worst_status = max(worst_status, check_readme(readme_path))
            continue
        print(f"ERROR: README file not found: {readme_path}", file=sys.stderr)
        worst_status = 2

    sys.exit(worst_status)


if __name__ == "__main__":
    main()


================================================
FILE: vite.config.js
================================================
import {defineConfig} from 'vite';
import {compression} from 'vite-plugin-compression2';
import path from 'node:path';
import {fileURLToPath} from 'node:url';

// Define __dirname for ES Modules
const __dirname = path.dirname(fileURLToPath(import.meta.url));

// Vite build configuration: bundles the entry points listed under
// `rollupOptions.input` into `concordia/static/dist`, served under `/static/`.
export default defineConfig({
    base: '/static/',
    resolve: {
        alias: {
            // Lets modules import 'concordia-visualization' by bare name;
            // it resolves to the module file below.
            'concordia-visualization': path.resolve(
                __dirname,
                './concordia/static/js/src/modules/concordia-visualization.js',
            ),
        },
    },
    optimizeDeps: {
        include: ['openseadragon', 'openseadragon-filters'],
    },
    build: {
        // Name the manifest explicitly: with `manifest: true` Vite writes it
        // inside a hidden directory, and collectstatic ignores hidden files.
        manifest: 'manifest.json',
        // Using 'dist' prevents Vite from writing into the source folders
        outDir: 'concordia/static/dist', // where the compiled files go
        emptyOutDir: true,
        rollupOptions: {
            input: {
                // Bundled entry points under ./src
                main: './src/main.js',
                about: './src/about.js',
                profile: './src/profile.js',

                // Standalone scripts and modules built as their own entries
                admin_custom: './concordia/static/admin/custom-inline.js',
                admin_editor: './concordia/static/admin/editor-preview.js',
                js_base: './concordia/static/js/src/base.js',
                accessible_colors:
                    './concordia/static/js/src/modules/accessible-colors.js',
                chroma_esm: './concordia/static/js/src/modules/chroma-esm.js',
                turnstile: './concordia/static/js/src/modules/turnstile.js',
                viz_errors:
                    './concordia/static/js/src/modules/visualization-errors.js',
                password_validation:
                    './concordia/static/js/src/password-validation.js',
                viz_asset_status:
                    './concordia/static/js/src/visualizations/asset-status-by-campaign.js',
                jquery_cookie: './concordia/static/vendor/jquery.cookie.js',

                // The SCSS entry point
                base_styles: './concordia/static/scss/base.scss',
            },
            output: {
                // Content-hashed file names, so Vite handles cache-busting
                // and versioning of the emitted files.
                entryFileNames: 'js/[name]-[hash].js',
                chunkFileNames: 'js/[name]-[hash].js',
                assetFileNames: 'assets/[name]-[hash][extname]',
            },
        },
    },
    plugins: [
        // Pre-compress files (gzip and brotli) at build time so WhiteNoise
        // doesn't have to at startup
        compression({algorithm: 'gzip'}),
        compression({algorithm: 'brotliCompress'}),
    ],
});