fix(migrations): avoid startup outage from 061 full-table backfill

2026-03-03 11:01:22 +08:00
parent b7df7ce5d5
commit 99f1e3ff35
3 changed files with 58 additions and 7 deletions
--- a/backend/migrations/061_add_usage_log_request_type.sql
+++ b/backend/migrations/061_add_usage_log_request_type.sql
@@ -19,11 +19,47 @@ $$;
 CREATE INDEX IF NOT EXISTS idx_usage_logs_request_type_created_at
    ON usage_logs (request_type, created_at);

-- Backfill from legacy fields. openai_ws_mode has higher priority than stream.
-UPDATE usage_logs
-SET request_type = CASE
-    WHEN openai_ws_mode = TRUE THEN 3
-    WHEN stream = TRUE THEN 2
-    ELSE 1
+-- Backfill from legacy fields in bounded batches.
+-- Why bounded:
+-- 1) Full-table UPDATE on large usage_logs can block startup for a long time.
+-- 2) request_type=0 rows remain query-compatible via legacy fallback logic
+--    (stream/openai_ws_mode) in repository filters.
+-- 3) Subsequent writes will use explicit request_type and gradually dilute
+--    historical unknown rows.
+--
+-- openai_ws_mode has higher priority than stream.
+DO $$
+DECLARE
+    v_rows         INTEGER := 0;
+    v_total_rows   INTEGER := 0;
+    v_batch_size   INTEGER := 5000;
+    v_started_at   TIMESTAMPTZ := clock_timestamp();
+    v_max_duration INTERVAL := INTERVAL '8 seconds';
+BEGIN
+    LOOP
+        WITH batch AS (
+            SELECT id
+            FROM usage_logs
+            WHERE request_type = 0
+            ORDER BY id
+            LIMIT v_batch_size
+        )
+        UPDATE usage_logs ul
+        SET request_type = CASE
+            WHEN ul.openai_ws_mode = TRUE THEN 3
+            WHEN ul.stream = TRUE THEN 2
+            ELSE 1
+        END
+        FROM batch
+        WHERE ul.id = batch.id;
+
+        GET DIAGNOSTICS v_rows = ROW_COUNT;
+        EXIT WHEN v_rows = 0;
+
+        v_total_rows := v_total_rows + v_rows;
+        EXIT WHEN clock_timestamp() - v_started_at >= v_max_duration;
+    END LOOP;
+
+    RAISE NOTICE 'usage_logs.request_type startup backfill rows=%', v_total_rows;
 END
-WHERE request_type = 0;
+$$;