# Generated manually by the seqr team
import math

from django.db import migrations
import requests

from settings import PIPELINE_RUNNER_SERVER


def batch_project_guids(project_guids, max_batches=30, min_batch_size=5):
    """Split *project_guids* into consecutive, order-preserving batches.

    The batch size is chosen so that there are at most *max_batches*
    batches, but never smaller than *min_batch_size* items per batch.

    Args:
        project_guids: sequence of project GUID strings (may be empty).
        max_batches: upper bound on the number of batches produced.
        min_batch_size: lower bound on the size of each batch.

    Returns:
        A list of lists; empty input yields an empty list.
    """
    if not project_guids:
        return []
    total = len(project_guids)
    size = max(math.ceil(total / max_batches), min_batch_size)
    batches = []
    start = 0
    while start < total:
        batches.append(project_guids[start:start + size])
        start += size
    return batches


def queue_rebuild_gt_stats_jobs(apps, schema_editor):
    """Enqueue pipeline-runner jobs to rebuild project genotype stats.

    Collects the distinct project GUIDs present in either the GRCh37 or
    the GRCh38 SNV/indel genotype-stats tables, batches them with
    batch_project_guids, and POSTs each batch to the pipeline runner's
    ``rebuild_gt_stats_enqueue`` endpoint.

    Args:
        apps: historical app registry supplied by Django's RunPython.
        schema_editor: schema editor whose connection alias selects the DB.

    Raises:
        requests.HTTPError: if the pipeline runner returns an error status.
        requests.Timeout: if a request exceeds the 60s timeout.
    """
    ProjectGtStatsGRCh37SnvIndel = apps.get_model(
        "clickhouse_search", "ProjectGtStatsGRCh37SnvIndel"
    )
    ProjectGtStatsSnvIndel = apps.get_model(
        "clickhouse_search", "ProjectGtStatsSnvIndel"
    )
    db_alias = schema_editor.connection.alias
    # Project GUIDs are expected to be unique to a single genome build, so a
    # plain list concatenation would also work; the set union additionally
    # de-duplicates if that assumption ever breaks.
    project_guids = set(
        ProjectGtStatsGRCh37SnvIndel.objects.using(db_alias)
        .values_list("project_guid", flat=True)
        .distinct()
    ) | set(
        ProjectGtStatsSnvIndel.objects.using(db_alias)
        .values_list("project_guid", flat=True)
        .distinct()
    )
    for batch in batch_project_guids(list(project_guids)):
        response = requests.post(
            f"{PIPELINE_RUNNER_SERVER}/rebuild_gt_stats_enqueue",
            json={"project_guids": batch},
            timeout=60,
        )
        # Fail the migration loudly if the pipeline runner rejects a batch.
        response.raise_for_status()
        print(f"Triggered rebuild_gt_stats_enqueue for {batch}")


class Migration(migrations.Migration):
    # Data migration: queues ClickHouse genotype-stats rebuild jobs against
    # the pipeline runner; it makes no schema changes of its own.

    dependencies = [
        ("clickhouse_search", "0017_fix_affected_status_column_order"),
    ]

    operations = [
        # reverse_code=noop makes the migration reversible: unapplying it
        # should not (and cannot) cancel the already-enqueued rebuild jobs.
        migrations.RunPython(
            queue_rebuild_gt_stats_jobs,
            reverse_code=migrations.RunPython.noop,
        ),
    ]