Schedule organization snapshot refresh
All checks were successful
CI/CD Pipeline / Quality Gate (push) Successful in 22s
CI/CD Pipeline / Build and Push Images (push) Successful in 5s
CI/CD Pipeline / Internal Notify (push) Successful in 1s
CI/CD Pipeline / Deploy Dev in Dokploy (push) Successful in 1s

This commit is contained in:
2026-05-06 20:54:13 +02:00
parent 0f17ff6773
commit 507ae2063a
3 changed files with 140 additions and 0 deletions

View File

@@ -0,0 +1,59 @@
import json
from django.db import migrations
DAILY_ORGANIZATION_SNAPSHOT_TASK_NAME = "organizations:data-snapshots:daily-msk"
DAILY_ORGANIZATION_SNAPSHOT_TASK_PATH = (
"organizations.tasks.refresh_all_organization_data_snapshots"
)
DAILY_MSK_CRON = {
"minute": "30",
"hour": "4",
"day_of_week": "*",
"day_of_month": "*",
"month_of_year": "*",
"timezone": "Europe/Moscow",
}
def seed_daily_snapshot_refresh_schedule(apps, schema_editor):
CrontabSchedule = apps.get_model("django_celery_beat", "CrontabSchedule")
PeriodicTask = apps.get_model("django_celery_beat", "PeriodicTask")
crontab, _ = CrontabSchedule.objects.get_or_create(**DAILY_MSK_CRON)
field_names = {field.name for field in PeriodicTask._meta.fields}
schedule_fields = {"crontab": crontab}
for field_name in ("interval", "solar", "clocked"):
if field_name in field_names:
schedule_fields[field_name] = None
PeriodicTask.objects.update_or_create(
name=DAILY_ORGANIZATION_SNAPSHOT_TASK_NAME,
defaults={
"task": DAILY_ORGANIZATION_SNAPSHOT_TASK_PATH,
"args": json.dumps([]),
"kwargs": json.dumps({"batch_size": 100}),
"enabled": True,
"description": "Daily full refresh for API v2 organization snapshots.",
**schedule_fields,
},
)
def remove_daily_snapshot_refresh_schedule(apps, schema_editor):
PeriodicTask = apps.get_model("django_celery_beat", "PeriodicTask")
PeriodicTask.objects.filter(name=DAILY_ORGANIZATION_SNAPSHOT_TASK_NAME).delete()
class Migration(migrations.Migration):
dependencies = [
("django_celery_beat", "0018_improve_crontab_helptext"),
("organizations", "0003_allow_branch_kpp_organizations"),
]
operations = [
migrations.RunPython(
seed_daily_snapshot_refresh_schedule,
reverse_code=remove_daily_snapshot_refresh_schedule,
),
]

View File

@@ -12,6 +12,20 @@ from organizations.services import OrganizationDataSnapshotRefreshService
logger = logging.getLogger(__name__)
@shared_task
def refresh_all_organization_data_snapshots(batch_size: int = 100) -> dict:
"""Refresh all organization data snapshots for API v2."""
result = OrganizationDataSnapshotRefreshService.refresh(batch_size=batch_size)
cache.clear()
payload = {
"processed": result.processed,
"created": result.created,
"updated": result.updated,
}
logger.info("All organization data snapshots refreshed: %s", payload)
return payload
@shared_task
def refresh_organization_data_snapshots_for_parser_batch(
*,

View File

@@ -0,0 +1,67 @@
"""Tests for organization snapshot tasks and schedules."""
from importlib import import_module
from django.apps import apps as django_apps
from django.core.cache import cache
from django.test import TestCase
from django_celery_beat.models import PeriodicTask
from organizations.models import Organization
from organizations.tasks import refresh_all_organization_data_snapshots
from tests.apps.parsers.factories import IndustrialCertificateRecordFactory
class OrganizationSnapshotTasksTest(TestCase):
"""Checks Celery tasks that maintain API v2 organization snapshots."""
def test_refresh_all_task_rebuilds_snapshots_and_clears_api_cache(self):
organization = Organization.objects.create(
name='ООО "Снапшот"',
inn="7800000401",
ogrn="1027700144401",
)
IndustrialCertificateRecordFactory(
inn=organization.inn,
ogrn=organization.ogrn,
certificate_number="FULL-SNAPSHOT-CERT",
)
cache.set("api:v2:organizations:test", {"stale": True}, timeout=60)
result = refresh_all_organization_data_snapshots(batch_size=10)
self.assertEqual(result["processed"], 1)
self.assertEqual(result["created"], 1)
self.assertEqual(result["updated"], 0)
self.assertIsNone(cache.get("api:v2:organizations:test"))
snapshot = organization.data_snapshot
self.assertEqual(
snapshot.data["industrial"][0]["certificate_number"],
"FULL-SNAPSHOT-CERT",
)
class OrganizationSnapshotScheduleMigrationTest(TestCase):
"""Checks data migration that schedules full snapshot refresh."""
def test_migration_seeds_daily_snapshot_refresh_periodic_task(self):
migration = import_module(
"organizations.migrations.0004_seed_daily_snapshot_refresh_schedule"
)
migration.seed_daily_snapshot_refresh_schedule(django_apps, None)
migration.seed_daily_snapshot_refresh_schedule(django_apps, None)
task = PeriodicTask.objects.get(
name=migration.DAILY_ORGANIZATION_SNAPSHOT_TASK_NAME
)
self.assertEqual(
task.task,
"organizations.tasks.refresh_all_organization_data_snapshots",
)
self.assertTrue(task.enabled)
self.assertEqual(task.args, "[]")
self.assertEqual(task.kwargs, '{"batch_size": 100}')
self.assertEqual(task.crontab.minute, "30")
self.assertEqual(task.crontab.hour, "4")
self.assertEqual(str(task.crontab.timezone), "Europe/Moscow")