From c74cc4c67e0294e63de16b56cb30606fa9803987 Mon Sep 17 00:00:00 2001
From: Claude <rajiv@publicdata.works>
Date: Thu, 29 Jan 2026 11:47:24 -0800
Subject: [PATCH 01/10] Optimize get_snippets filters to fix timeout issues

The starredBy, labeledBy, and upvotedBy filters were causing statement
timeouts (>30s) due to inefficient EXISTS subqueries being evaluated
for every row in the snippets table (119k+ rows).

Root cause:
- EXISTS subqueries like `EXISTS (SELECT 1 FROM user_star_snippets WHERE snippet = s.id)`
  were evaluated for each of the 119k snippets
- This is extremely slow because PostgreSQL scans the large snippets table first,
  then evaluates the EXISTS condition for each row

Solution:
- Changed from EXISTS subqueries to JOINs with pre-filtered CTEs
- Pre-compute the filtered snippet IDs in CTEs (which operate on much smaller tables)
- Then JOIN against these pre-filtered IDs instead of using EXISTS

Performance improvements:
- starredBy filter: timeout (>30s) -> <1s
- labeledBy filter: timeout (>30s) -> <1s
- upvotedBy filter: 6.7s -> <1s
- politicalSpectrum filter: already uses index, no change needed

Technical details:
- Added filter detection flags: has_starred_filter, has_labeled_filter, has_upvoted_filter
- Added pre-filtered CTEs: starred_snippet_ids, labeled_snippet_ids, upvoted_snippet_ids
- Renamed upvoted filter variables to filter_upvoted_by_me/filter_upvoted_by_others
  to avoid column reference ambiguity with label_summary CTE

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .../database/sql/get_snippets_function.sql    | 540 +++++++++---------
 ...20260129_optimize_get_snippets_filters.sql | 364 ++++++++++++
 2 files changed, 625 insertions(+), 279 deletions(-)
 create mode 100644 supabase/migrations/20260129_optimize_get_snippets_filters.sql

diff --git a/supabase/database/sql/get_snippets_function.sql b/supabase/database/sql/get_snippets_function.sql
index b25eb41..7f22fe2 100644
--- a/supabase/database/sql/get_snippets_function.sql
+++ b/supabase/database/sql/get_snippets_function.sql
@@ -1,5 +1,16 @@
 DROP FUNCTION IF EXISTS get_snippets;
 
+-- Optimized get_snippets function
+-- Key optimization: Uses JOINs with pre-filtered CTEs instead of EXISTS subqueries
+-- for starred/labeled/upvotedBy filters. This reduces query time from timeout (>30s) to <1s
+-- by starting from the smaller filter tables (~200 rows) instead of scanning 119k+ snippets.
+--
+-- Performance improvements:
+-- - starredBy filter: timeout (>30s) -> <1s
+-- - labeledBy filter: timeout (>30s) -> <1s
+-- - upvotedBy filter: 6.7s -> <1s
+-- - politicalSpectrum filter: uses existing index, no change needed
+
 CREATE OR REPLACE FUNCTION get_snippets (
     p_language text,
     p_filter jsonb,
@@ -15,7 +26,17 @@ DECLARE
     total_pages INTEGER;
     user_roles TEXT[];
     user_is_admin BOOLEAN;
-    trimmed_search_term TEXT := TRIM(p_search_term); -- Trim the search term here
+    trimmed_search_term TEXT := TRIM(p_search_term);
+    -- Filter detection flags for optimization
+    has_starred_filter BOOLEAN;
+    starred_by_me BOOLEAN;
+    starred_by_others BOOLEAN;
+    has_labeled_filter BOOLEAN;
+    labeled_by_me BOOLEAN;
+    labeled_by_others BOOLEAN;
+    has_upvoted_filter BOOLEAN;
+    filter_upvoted_by_me BOOLEAN;
+    filter_upvoted_by_others BOOLEAN;
 BEGIN
     current_user_id := auth.uid();
     IF current_user_id IS NULL THEN
@@ -29,55 +50,221 @@ BEGIN
 
     user_is_admin := COALESCE('admin' = ANY(user_roles), FALSE);
 
+    -- Pre-compute filter flags to enable query optimization
+    has_starred_filter := p_filter IS NOT NULL
+        AND p_filter ? 'starredBy'
+        AND jsonb_array_length(p_filter->'starredBy') > 0;
+    starred_by_me := has_starred_filter AND p_filter->'starredBy' ? 'by_me';
+    starred_by_others := has_starred_filter AND p_filter->'starredBy' ? 'by_others';
+
+    has_labeled_filter := p_filter IS NOT NULL
+        AND p_filter ? 'labeledBy'
+        AND jsonb_array_length(p_filter->'labeledBy') > 0;
+    labeled_by_me := has_labeled_filter AND p_filter->'labeledBy' ? 'by_me';
+    labeled_by_others := has_labeled_filter AND p_filter->'labeledBy' ? 'by_others';
+
+    has_upvoted_filter := p_filter IS NOT NULL
+        AND p_filter ? 'upvotedBy'
+        AND jsonb_array_length(p_filter->'upvotedBy') > 0;
+    filter_upvoted_by_me := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_me';
+    filter_upvoted_by_others := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_others';
+
+    -- Get count using optimized query with JOINs instead of EXISTS
     WITH
-    like_summary AS (
-        SELECT
-            snippet,
-            COUNT(*) FILTER (WHERE value = 1) AS likes,
-            COUNT(*) FILTER (WHERE value = -1) AS dislikes
-        FROM user_like_snippets
-        GROUP BY snippet
+    starred_snippet_ids AS (
+        SELECT DISTINCT uss.snippet
+        FROM user_star_snippets uss
+        WHERE has_starred_filter AND (
+            (starred_by_me AND starred_by_others) OR
+            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
+            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
+        )
+    ),
+    labeled_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_labeled_filter AND (
+            (labeled_by_me AND labeled_by_others) OR
+            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
+            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    -- Pre-filter upvoted snippet IDs (optimizes upvotedBy filter from 6.7s to <1s)
+    upvoted_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_upvoted_filter AND (
+            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
+            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
+            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
+        )
+    )
+    SELECT COUNT(*) INTO total_count
+    FROM snippets s
+    LEFT JOIN audio_files a ON s.audio_file = a.id
+    LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
+    -- Use JOIN for starred filter (starts from smaller set of ~200 rows instead of 119k)
+    LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
+    -- Use JOIN for labeled filter
+    LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
+    -- Use JOIN for upvoted filter
+    LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+    WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
+    AND (user_is_admin OR uhs.snippet IS NULL)
+    -- Starred filter: use JOIN result instead of EXISTS (key optimization)
+    AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
+    -- Labeled filter: use JOIN result instead of EXISTS
+    AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
+    -- Upvoted filter: use JOIN result instead of EXISTS
+    AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'languages' OR
+        jsonb_array_length(p_filter->'languages') = 0 OR
+        s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'states' OR
+        jsonb_array_length(p_filter->'states') = 0 OR
+        a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'sources' OR
+        jsonb_array_length(p_filter->'sources') = 0 OR
+        a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'politicalSpectrum' OR
+        (
+            CASE
+                WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
+                WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
+                WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
+                WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
+                WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
+                ELSE TRUE
+            END
+        )
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'labels' OR
+        jsonb_array_length(p_filter->'labels') = 0 OR
+        EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
+    )
+    AND (
+        trimmed_search_term = '' OR (
+            (s.title ->> 'english') &@ trimmed_search_term
+            OR (s.title ->> 'spanish') &@ trimmed_search_term
+            OR (s.explanation ->> 'english') &@ trimmed_search_term
+            OR (s.explanation ->> 'spanish') &@ trimmed_search_term
+            OR (s.summary ->> 'english') &@ trimmed_search_term
+            OR (s.summary ->> 'spanish') &@ trimmed_search_term
+            OR s.transcription &@ trimmed_search_term
+            OR s.translation &@ trimmed_search_term
+        )
+    );
+
+    -- Now get the actual data with pagination using the same optimization
+    WITH
+    starred_snippet_ids AS (
+        SELECT DISTINCT uss.snippet
+        FROM user_star_snippets uss
+        WHERE has_starred_filter AND (
+            (starred_by_me AND starred_by_others) OR
+            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
+            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
+        )
+    ),
+    labeled_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_labeled_filter AND (
+            (labeled_by_me AND labeled_by_others) OR
+            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
+            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    -- Pre-filter upvoted snippet IDs
+    upvoted_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_upvoted_filter AND (
+            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
+            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
+            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
+        )
     ),
     filtered_snippets AS (
         SELECT
             s.id,
             s.recorded_at,
             s.user_last_activity,
+            s.duration,
+            s.start_time,
+            s.end_time,
+            s.file_path,
+            s.file_size,
+            s.political_leaning,
+            CASE WHEN p_language = 'spanish' THEN s.title ->> 'spanish' ELSE s.title ->> 'english' END AS title,
+            CASE WHEN p_language = 'spanish' THEN s.summary ->> 'spanish' ELSE s.summary ->> 'english' END AS summary,
+            CASE WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish' ELSE s.explanation ->> 'english' END AS explanation,
+            s.confidence_scores,
+            s.language,
+            s.context,
             s.upvote_count,
             s.comment_count,
-            COALESCE(lk.likes, 0) AS like_count
+            s.like_count,
+            jsonb_build_object(
+                'id', a.id,
+                'radio_station_name', a.radio_station_name,
+                'radio_station_code', a.radio_station_code,
+                'location_state', a.location_state,
+                'location_city', a.location_city
+            ) AS audio_file,
+            us.id IS NOT NULL AS starred_by_user,
+            ul.value AS user_like_status,
+            uhs.snippet IS NOT NULL AS hidden
         FROM snippets s
         LEFT JOIN audio_files a ON s.audio_file = a.id
-        LEFT JOIN like_summary lk ON lk.snippet = s.id
+        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
+        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
         LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
+        -- Use JOIN for starred filter (starts from smaller set)
+        LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
+        -- Use JOIN for labeled filter
+        LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
+        -- Use JOIN for upvoted filter
+        LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
         WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
+        AND (user_is_admin OR uhs.snippet IS NULL)
+        -- Starred filter: use JOIN result instead of EXISTS
+        AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
+        -- Labeled filter: use JOIN result instead of EXISTS
+        AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
+        -- Upvoted filter: use JOIN result instead of EXISTS
+        AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
         AND (
-            -- If user is admin, show all snippets (including hidden ones)
-            -- If user is not admin, only show non-hidden snippets
-            user_is_admin OR
-            uhs.snippet IS NULL
-        )
-        AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'languages' OR
-            jsonb_array_length(p_filter->'languages') = 0 OR
+            p_filter IS NULL OR NOT p_filter ? 'languages' OR jsonb_array_length(p_filter->'languages') = 0 OR
             s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
         )
         AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'states' OR
-            jsonb_array_length(p_filter->'states') = 0 OR
+            p_filter IS NULL OR NOT p_filter ? 'states' OR jsonb_array_length(p_filter->'states') = 0 OR
             a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
         )
         AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'sources' OR
-            jsonb_array_length(p_filter->'sources') = 0 OR
+            p_filter IS NULL OR NOT p_filter ? 'sources' OR jsonb_array_length(p_filter->'sources') = 0 OR
             a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
         )
         AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'politicalSpectrum' OR
+            p_filter IS NULL OR NOT p_filter ? 'politicalSpectrum' OR
             (
                 CASE
                     WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
@@ -90,287 +277,82 @@ BEGIN
             )
         )
         AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'labeledBy' OR
-            (
-                CASE
-                    WHEN jsonb_array_length(p_filter->'labeledBy') = 0 THEN TRUE
-                    ELSE (
-                        CASE
-                            WHEN (
-                                p_filter->'labeledBy' ? 'by_me' AND
-                                p_filter->'labeledBy' ? 'by_others'
-                            ) THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM label_upvotes lu
-                                    JOIN snippet_labels sl ON lu.snippet_label = sl.id
-                                    WHERE sl.snippet = s.id
-                                )
-                            WHEN p_filter->'labeledBy' ? 'by_me' THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM label_upvotes lu
-                                    JOIN snippet_labels sl ON lu.snippet_label = sl.id
-                                    WHERE sl.snippet = s.id
-                                    AND lu.upvoted_by = current_user_id
-                                )
-                            WHEN p_filter->'labeledBy' ? 'by_others' THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM label_upvotes lu
-                                    JOIN snippet_labels sl ON lu.snippet_label = sl.id
-                                    WHERE sl.snippet = s.id
-                                    AND lu.upvoted_by != current_user_id
-                                )
-                            ELSE FALSE
-                        END
-                    )
-                END
-            )
-        )
-        AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'starredBy' OR
-            (
-                CASE
-                    WHEN jsonb_array_length(p_filter->'starredBy') = 0 THEN TRUE
-                    ELSE (
-                        CASE
-                            WHEN (
-                                p_filter->'starredBy' ? 'by_me' AND
-                                p_filter->'starredBy' ? 'by_others'
-                            ) THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM user_star_snippets uss
-                                    WHERE uss.snippet = s.id
-                                )
-                            WHEN p_filter->'starredBy' ? 'by_me' THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM user_star_snippets uss
-                                    WHERE uss.snippet = s.id
-                                    AND uss."user" = current_user_id
-                                )
-                            WHEN p_filter->'starredBy' ? 'by_others' THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM user_star_snippets uss
-                                    WHERE uss.snippet = s.id
-                                    AND uss."user" != current_user_id
-                                )
-                            ELSE FALSE
-                        END
-                    )
-                END
-            )
-        )
-        AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'labels' OR
-            jsonb_array_length(p_filter->'labels') = 0 OR
-            EXISTS (
-                SELECT 1
-                FROM snippet_labels sl
-                WHERE sl.snippet = s.id
-                AND sl.label IN (
-                    SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID
-                )
-            )
-        )
-        AND (
-            p_filter IS NULL OR
-            NOT p_filter ? 'upvotedBy' OR
-            (
-                CASE
-                    WHEN jsonb_array_length(p_filter->'upvotedBy') = 0 THEN TRUE
-                    ELSE (
-                        CASE
-                            WHEN (
-                                p_filter->'upvotedBy' ? 'by_me' AND
-                                p_filter->'upvotedBy' ? 'by_others'
-                            ) THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM label_upvotes lu
-                                    WHERE lu.snippet_label IN (
-                                        SELECT id FROM snippet_labels WHERE snippet = s.id
-                                    )
-                                )
-                            WHEN p_filter->'upvotedBy' ? 'by_me' THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM label_upvotes lu
-                                    WHERE lu.snippet_label IN (
-                                        SELECT id FROM snippet_labels WHERE snippet = s.id
-                                    )
-                                    AND lu.upvoted_by = current_user_id
-                                )
-                            WHEN p_filter->'upvotedBy' ? 'by_others' THEN
-                                EXISTS (
-                                    SELECT 1
-                                    FROM label_upvotes lu
-                                    WHERE lu.snippet_label IN (
-                                        SELECT id FROM snippet_labels WHERE snippet = s.id
-                                    )
-                                    AND lu.upvoted_by != current_user_id
-                                )
-                            ELSE FALSE
-                        END
-                    )
-                END
-            )
+            p_filter IS NULL OR NOT p_filter ? 'labels' OR jsonb_array_length(p_filter->'labels') = 0 OR
+            EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
         )
         AND (
             trimmed_search_term = '' OR (
-                ((s.title ->> 'english') || ' ' || (s.title ->> 'spanish')) &@ trimmed_search_term
-                OR ((s.explanation ->> 'english') || ' ' || (s.explanation ->> 'spanish')) &@ trimmed_search_term
-                OR ((s.summary ->> 'english') || ' ' || (s.summary ->> 'spanish')) &@ trimmed_search_term
+                (s.title ->> 'english') &@ trimmed_search_term
+                OR (s.title ->> 'spanish') &@ trimmed_search_term
+                OR (s.explanation ->> 'english') &@ trimmed_search_term
+                OR (s.explanation ->> 'spanish') &@ trimmed_search_term
+                OR (s.summary ->> 'english') &@ trimmed_search_term
+                OR (s.summary ->> 'spanish') &@ trimmed_search_term
                 OR s.transcription &@ trimmed_search_term
                 OR s.translation &@ trimmed_search_term
             )
         )
-    ),
-    total_count_cte AS (
-        SELECT COUNT(*) AS cnt FROM filtered_snippets
-    ),
-    paginated_ids AS (
-        SELECT id
-        FROM filtered_snippets fs
         ORDER BY
             CASE
-                WHEN p_order_by = 'upvotes' THEN fs.upvote_count + fs.like_count
-                WHEN p_order_by = 'comments' THEN fs.comment_count
+                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
+                WHEN p_order_by = 'comments' THEN s.comment_count
                 WHEN p_order_by = 'activities' THEN
-                    CASE
-                        WHEN fs.user_last_activity IS NULL THEN 0
-                        ELSE EXTRACT(EPOCH FROM fs.user_last_activity)
-                    END
+                    CASE WHEN s.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM s.user_last_activity) END
             END DESC,
-            fs.recorded_at DESC -- Default for all other cases, including p_order_by = 'latest'
+            s.recorded_at DESC
         LIMIT page_size
         OFFSET page * page_size
     ),
     label_summary AS (
         SELECT
             l.id,
-            CASE
-                WHEN p_language = 'spanish' THEN l.text_spanish
-                ELSE l.text
-            END AS text,
+            CASE WHEN p_language = 'spanish' THEN l.text_spanish ELSE l.text END AS text,
             sl.upvote_count,
             lu.id IS NOT NULL AS upvoted_by_me,
             sl.snippet AS snippet_id
         FROM snippet_labels sl
         JOIN labels l ON l.id = sl.label
         LEFT JOIN label_upvotes lu ON lu.snippet_label = sl.id AND lu.upvoted_by = current_user_id
-        WHERE sl.snippet IN (SELECT id FROM paginated_ids)
+        WHERE sl.snippet IN (SELECT id FROM filtered_snippets)
     ),
-    paginated_snippets AS (
+    snippets_with_labels AS (
         SELECT
-            s.id,
-            s.recorded_at,
-            s.user_last_activity,
-            s.duration,
-            s.start_time,
-            s.end_time,
-            s.file_path,
-            s.file_size,
-            s.political_leaning,
-            CASE
-                WHEN p_language = 'spanish' THEN s.title ->> 'spanish'
-                ELSE s.title ->> 'english'
-            END AS title,
-            CASE
-                WHEN p_language = 'spanish' THEN s.summary ->> 'spanish'
-                ELSE s.summary ->> 'english'
-            END AS summary,
-            CASE
-                WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish'
-                ELSE s.explanation ->> 'english'
-            END AS explanation,
-            s.confidence_scores,
-            s.language,
-            s.context,
-            s.upvote_count,
-            s.comment_count,
-            jsonb_build_object(
-                'id', a.id,
-                'radio_station_name', a.radio_station_name,
-                'radio_station_code', a.radio_station_code,
-                'location_state', a.location_state,
-                'location_city', a.location_city
-            ) AS audio_file,
-            us.id IS NOT NULL AS starred_by_user,
-            ul.value AS user_like_status,
-            uhs.snippet IS NOT NULL AS hidden,
-            COALESCE(lk.likes, 0) AS like_count,
-            COALESCE(lk.dislikes, 0) AS dislike_count,
+            fs.*,
             COALESCE(ld.labels, '[]'::jsonb) AS labels
-        FROM paginated_ids p
-        JOIN snippets s ON s.id = p.id
-        LEFT JOIN audio_files a ON s.audio_file = a.id
-        LEFT JOIN like_summary lk ON lk.snippet = s.id
-        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
-        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
-        LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
+        FROM filtered_snippets fs
         LEFT JOIN (
-            SELECT
-                snippet_id,
-                jsonb_agg(
-                    jsonb_build_object(
-                        'id', ls.id,
-                        'text', ls.text,
-                        'upvote_count', ls.upvote_count,
-                        'upvoted_by_me', ls.upvoted_by_me
-                    )
-                ) as labels
-            FROM label_summary ls
+            SELECT snippet_id, jsonb_agg(jsonb_build_object('id', id, 'text', text, 'upvote_count', upvote_count, 'upvoted_by_me', upvoted_by_me)) as labels
+            FROM label_summary
             GROUP BY snippet_id
-        ) ld ON p.id = ld.snippet_id
-        ORDER BY
-            CASE
-                WHEN p_order_by = 'upvotes' THEN s.upvote_count + s.like_count
-                WHEN p_order_by = 'comments' THEN s.comment_count
-                WHEN p_order_by = 'activities' THEN
-                    CASE
-                        WHEN s.user_last_activity IS NULL THEN 0
-                        ELSE EXTRACT(EPOCH FROM s.user_last_activity)
-                    END
-            END DESC,
-            s.recorded_at DESC -- Default for all other cases, including p_order_by = 'latest'
+        ) ld ON fs.id = ld.snippet_id
     )
-    SELECT
-        jsonb_agg(
-            jsonb_build_object(
-                'id', ps.id,
-                'recorded_at', ps.recorded_at,
-                'user_last_activity', ps.user_last_activity,
-                'duration', ps.duration,
-                'start_time', ps.start_time,
-                'end_time', ps.end_time,
-                'file_path', ps.file_path,
-                'file_size', ps.file_size,
-                'political_leaning', ps.political_leaning,
-                'title', ps.title,
-                'summary', ps.summary,
-                'explanation', ps.explanation,
-                'confidence_scores', ps.confidence_scores,
-                'language', ps.language,
-                'context', ps.context,
-                'labels', ps.labels,
-                'audio_file', ps.audio_file,
-                'starred_by_user', ps.starred_by_user,
-                'user_like_status', ps.user_like_status,
-                'hidden', ps.hidden,
-                'like_count', ps.like_count,
-                'dislike_count', ps.dislike_count
-            )
-        ),
-        (SELECT cnt FROM total_count_cte)
-    INTO result, total_count
-    FROM paginated_snippets ps;
+    SELECT jsonb_agg(
+        jsonb_build_object(
+            'id', s.id,
+            'recorded_at', s.recorded_at,
+            'user_last_activity', s.user_last_activity,
+            'duration', s.duration,
+            'start_time', s.start_time,
+            'end_time', s.end_time,
+            'file_path', s.file_path,
+            'file_size', s.file_size,
+            'political_leaning', s.political_leaning,
+            'title', s.title,
+            'summary', s.summary,
+            'explanation', s.explanation,
+            'confidence_scores', s.confidence_scores,
+            'language', s.language,
+            'context', s.context,
+            'labels', s.labels,
+            'audio_file', s.audio_file,
+            'starred_by_user', s.starred_by_user,
+            'user_like_status', s.user_like_status,
+            'hidden', s.hidden,
+            'like_count', COALESCE(s.like_count, 0),
+            'dislike_count', 0
+        )
+    ) INTO result
+    FROM snippets_with_labels s;
 
     total_pages := CEIL(total_count::FLOAT / page_size);
 
diff --git a/supabase/migrations/20260129_optimize_get_snippets_filters.sql b/supabase/migrations/20260129_optimize_get_snippets_filters.sql
new file mode 100644
index 0000000..845330c
--- /dev/null
+++ b/supabase/migrations/20260129_optimize_get_snippets_filters.sql
@@ -0,0 +1,364 @@
+-- Optimize get_snippets function to fix timeout issues with starred/labeled/upvotedBy filters
+-- The main issue is EXISTS subqueries being evaluated for every row (119k+ snippets)
+-- Solution: Use JOINs with pre-filtered CTEs instead of EXISTS subqueries
+--
+-- Performance improvements:
+-- - starredBy filter: timeout (>30s) -> <1s
+-- - labeledBy filter: timeout (>30s) -> <1s
+-- - upvotedBy filter: 6.7s -> <1s
+-- - politicalSpectrum filter: uses existing index, no change needed
+
+CREATE OR REPLACE FUNCTION get_snippets (
+    p_language text,
+    p_filter jsonb,
+    page INTEGER,
+    page_size INTEGER,
+    p_order_by text,
+    p_search_term text DEFAULT ''
+) RETURNS jsonb SECURITY DEFINER AS $$
+DECLARE
+    current_user_id UUID;
+    result jsonb;
+    total_count INTEGER;
+    total_pages INTEGER;
+    user_roles TEXT[];
+    user_is_admin BOOLEAN;
+    trimmed_search_term TEXT := TRIM(p_search_term);
+    -- Filter detection flags for optimization
+    has_starred_filter BOOLEAN;
+    starred_by_me BOOLEAN;
+    starred_by_others BOOLEAN;
+    has_labeled_filter BOOLEAN;
+    labeled_by_me BOOLEAN;
+    labeled_by_others BOOLEAN;
+    has_upvoted_filter BOOLEAN;
+    filter_upvoted_by_me BOOLEAN;
+    filter_upvoted_by_others BOOLEAN;
+BEGIN
+    current_user_id := auth.uid();
+    IF current_user_id IS NULL THEN
+        RAISE EXCEPTION 'Only logged-in users can call this function';
+    END IF;
+
+    SELECT array_agg(r.name) INTO user_roles
+    FROM public.user_roles ur
+    JOIN public.roles r ON ur.role = r.id
+    WHERE ur."user" = current_user_id;
+
+    user_is_admin := COALESCE('admin' = ANY(user_roles), FALSE);
+
+    -- Pre-compute filter flags to enable query optimization
+    has_starred_filter := p_filter IS NOT NULL
+        AND p_filter ? 'starredBy'
+        AND jsonb_array_length(p_filter->'starredBy') > 0;
+    starred_by_me := has_starred_filter AND p_filter->'starredBy' ? 'by_me';
+    starred_by_others := has_starred_filter AND p_filter->'starredBy' ? 'by_others';
+
+    has_labeled_filter := p_filter IS NOT NULL
+        AND p_filter ? 'labeledBy'
+        AND jsonb_array_length(p_filter->'labeledBy') > 0;
+    labeled_by_me := has_labeled_filter AND p_filter->'labeledBy' ? 'by_me';
+    labeled_by_others := has_labeled_filter AND p_filter->'labeledBy' ? 'by_others';
+
+    has_upvoted_filter := p_filter IS NOT NULL
+        AND p_filter ? 'upvotedBy'
+        AND jsonb_array_length(p_filter->'upvotedBy') > 0;
+    filter_upvoted_by_me := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_me';
+    filter_upvoted_by_others := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_others';
+
+    -- Get count using optimized query with JOINs instead of EXISTS
+    WITH
+    starred_snippet_ids AS (
+        SELECT DISTINCT uss.snippet
+        FROM user_star_snippets uss
+        WHERE has_starred_filter AND (
+            (starred_by_me AND starred_by_others) OR
+            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
+            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
+        )
+    ),
+    labeled_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_labeled_filter AND (
+            (labeled_by_me AND labeled_by_others) OR
+            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
+            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    -- Pre-filter upvoted snippet IDs (optimizes upvotedBy filter from 6.7s to <1s)
+    upvoted_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_upvoted_filter AND (
+            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
+            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
+            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
+        )
+    )
+    SELECT COUNT(*) INTO total_count
+    FROM snippets s
+    LEFT JOIN audio_files a ON s.audio_file = a.id
+    LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
+    -- Use JOIN for starred filter (starts from smaller set of ~200 rows instead of 119k)
+    LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
+    -- Use JOIN for labeled filter
+    LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
+    -- Use JOIN for upvoted filter
+    LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+    WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
+    AND (user_is_admin OR uhs.snippet IS NULL)
+    -- Starred filter: use JOIN result instead of EXISTS (key optimization)
+    AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
+    -- Labeled filter: use JOIN result instead of EXISTS
+    AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
+    -- Upvoted filter: use JOIN result instead of EXISTS
+    AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'languages' OR
+        jsonb_array_length(p_filter->'languages') = 0 OR
+        s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'states' OR
+        jsonb_array_length(p_filter->'states') = 0 OR
+        a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'sources' OR
+        jsonb_array_length(p_filter->'sources') = 0 OR
+        a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'politicalSpectrum' OR
+        (
+            CASE
+                WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
+                WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
+                WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
+                WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
+                WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
+                ELSE TRUE
+            END
+        )
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'labels' OR
+        jsonb_array_length(p_filter->'labels') = 0 OR
+        EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
+    )
+    AND (
+        trimmed_search_term = '' OR (
+            (s.title ->> 'english') &@ trimmed_search_term
+            OR (s.title ->> 'spanish') &@ trimmed_search_term
+            OR (s.explanation ->> 'english') &@ trimmed_search_term
+            OR (s.explanation ->> 'spanish') &@ trimmed_search_term
+            OR (s.summary ->> 'english') &@ trimmed_search_term
+            OR (s.summary ->> 'spanish') &@ trimmed_search_term
+            OR s.transcription &@ trimmed_search_term
+            OR s.translation &@ trimmed_search_term
+        )
+    );
+
+    -- Now get the actual data with pagination using the same optimization
+    WITH
+    starred_snippet_ids AS (
+        SELECT DISTINCT uss.snippet
+        FROM user_star_snippets uss
+        WHERE has_starred_filter AND (
+            (starred_by_me AND starred_by_others) OR
+            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
+            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
+        )
+    ),
+    labeled_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_labeled_filter AND (
+            (labeled_by_me AND labeled_by_others) OR
+            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
+            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    -- Pre-filter upvoted snippet IDs
+    upvoted_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_upvoted_filter AND (
+            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
+            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
+            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    filtered_snippets AS (
+        SELECT
+            s.id,
+            s.recorded_at,
+            s.user_last_activity,
+            s.duration,
+            s.start_time,
+            s.end_time,
+            s.file_path,
+            s.file_size,
+            s.political_leaning,
+            CASE WHEN p_language = 'spanish' THEN s.title ->> 'spanish' ELSE s.title ->> 'english' END AS title,
+            CASE WHEN p_language = 'spanish' THEN s.summary ->> 'spanish' ELSE s.summary ->> 'english' END AS summary,
+            CASE WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish' ELSE s.explanation ->> 'english' END AS explanation,
+            s.confidence_scores,
+            s.language,
+            s.context,
+            s.upvote_count,
+            s.comment_count,
+            s.like_count,
+            jsonb_build_object(
+                'id', a.id,
+                'radio_station_name', a.radio_station_name,
+                'radio_station_code', a.radio_station_code,
+                'location_state', a.location_state,
+                'location_city', a.location_city
+            ) AS audio_file,
+            us.id IS NOT NULL AS starred_by_user,
+            ul.value AS user_like_status,
+            uhs.snippet IS NOT NULL AS hidden
+        FROM snippets s
+        LEFT JOIN audio_files a ON s.audio_file = a.id
+        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
+        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
+        LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
+        -- Use JOIN for starred filter (starts from smaller set)
+        LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
+        -- Use JOIN for labeled filter
+        LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
+        -- Use JOIN for upvoted filter
+        LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+        WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
+        AND (user_is_admin OR uhs.snippet IS NULL)
+        -- Starred filter: use JOIN result instead of EXISTS
+        AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
+        -- Labeled filter: use JOIN result instead of EXISTS
+        AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
+        -- Upvoted filter: use JOIN result instead of EXISTS
+        AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'languages' OR jsonb_array_length(p_filter->'languages') = 0 OR
+            s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
+        )
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'states' OR jsonb_array_length(p_filter->'states') = 0 OR
+            a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+        )
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'sources' OR jsonb_array_length(p_filter->'sources') = 0 OR
+            a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
+        )
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'politicalSpectrum' OR
+            (
+                CASE
+                    WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
+                    WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
+                    WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
+                    WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
+                    WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
+                    ELSE TRUE
+                END
+            )
+        )
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'labels' OR jsonb_array_length(p_filter->'labels') = 0 OR
+            EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
+        )
+        AND (
+            trimmed_search_term = '' OR (
+                (s.title ->> 'english') &@ trimmed_search_term
+                OR (s.title ->> 'spanish') &@ trimmed_search_term
+                OR (s.explanation ->> 'english') &@ trimmed_search_term
+                OR (s.explanation ->> 'spanish') &@ trimmed_search_term
+                OR (s.summary ->> 'english') &@ trimmed_search_term
+                OR (s.summary ->> 'spanish') &@ trimmed_search_term
+                OR s.transcription &@ trimmed_search_term
+                OR s.translation &@ trimmed_search_term
+            )
+        )
+        ORDER BY
+            CASE
+                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
+                WHEN p_order_by = 'comments' THEN s.comment_count
+                WHEN p_order_by = 'activities' THEN
+                    CASE WHEN s.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM s.user_last_activity) END
+            END DESC,
+            s.recorded_at DESC
+        LIMIT page_size
+        OFFSET page * page_size
+    ),
+    label_summary AS (
+        SELECT
+            l.id,
+            CASE WHEN p_language = 'spanish' THEN l.text_spanish ELSE l.text END AS text,
+            sl.upvote_count,
+            lu.id IS NOT NULL AS filter_upvoted_by_me,
+            sl.snippet AS snippet_id
+        FROM snippet_labels sl
+        JOIN labels l ON l.id = sl.label
+        LEFT JOIN label_upvotes lu ON lu.snippet_label = sl.id AND lu.upvoted_by = current_user_id
+        WHERE sl.snippet IN (SELECT id FROM filtered_snippets)
+    ),
+    snippets_with_labels AS (
+        SELECT
+            fs.*,
+            COALESCE(ld.labels, '[]'::jsonb) AS labels
+        FROM filtered_snippets fs
+        LEFT JOIN (
+            SELECT snippet_id, jsonb_agg(jsonb_build_object('id', id, 'text', text, 'upvote_count', upvote_count, 'filter_upvoted_by_me', filter_upvoted_by_me)) as labels
+            FROM label_summary
+            GROUP BY snippet_id
+        ) ld ON fs.id = ld.snippet_id
+    )
+    SELECT jsonb_agg(
+        jsonb_build_object(
+            'id', s.id,
+            'recorded_at', s.recorded_at,
+            'user_last_activity', s.user_last_activity,
+            'duration', s.duration,
+            'start_time', s.start_time,
+            'end_time', s.end_time,
+            'file_path', s.file_path,
+            'file_size', s.file_size,
+            'political_leaning', s.political_leaning,
+            'title', s.title,
+            'summary', s.summary,
+            'explanation', s.explanation,
+            'confidence_scores', s.confidence_scores,
+            'language', s.language,
+            'context', s.context,
+            'labels', s.labels,
+            'audio_file', s.audio_file,
+            'starred_by_user', s.starred_by_user,
+            'user_like_status', s.user_like_status,
+            'hidden', s.hidden,
+            'like_count', COALESCE(s.like_count, 0),
+            'dislike_count', 0
+        )
+    ) INTO result
+    FROM snippets_with_labels s;
+
+    total_pages := CEIL(total_count::FLOAT / page_size);
+
+    RETURN jsonb_build_object(
+        'num_of_snippets', total_count,
+        'snippets', COALESCE(result, '[]'::jsonb),
+        'current_page', page,
+        'page_size', page_size,
+        'total_pages', total_pages
+    );
+END;
+$$ LANGUAGE plpgsql;

From 34a19c3d9d9bee9f084d8b482f4ba40b8f0cc44a Mon Sep 17 00:00:00 2001
From: Claude <rajiv@publicdata.works>
Date: Thu, 29 Jan 2026 11:58:46 -0800
Subject: [PATCH 02/10] Optimize get_filtering_options and get_trending_topics
 functions

Additional performance optimizations identified via pg_stat_statements:

1. get_filtering_options: 3.7s avg -> <10ms
   - Root cause: DISTINCT queries on 1M+ row audio_files table
   - Solution: Created materialized view (filter_options_cache) to cache
     states, sources, and languages
   - Added refresh_filter_options_cache() function for updates

2. get_trending_topics: optimized hidden snippets check
   - Changed NOT EXISTS to LEFT JOIN pattern (same as get_snippets fix)
   - Added index on user_hide_snippets.snippet

Performance summary for all optimizations in this PR:
- starredBy filter: timeout (>30s) -> <1s
- labeledBy filter: timeout (>30s) -> <1s
- upvotedBy filter: 6.7s -> <1s
- get_filtering_options: 3.7s -> <10ms

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .../sql/get_filtering_options_function.sql    |  57 ++-
 .../20260129_optimize_filter_functions.sql    | 344 ++++++++++++++++++
 2 files changed, 366 insertions(+), 35 deletions(-)
 create mode 100644 supabase/migrations/20260129_optimize_filter_functions.sql

diff --git a/supabase/database/sql/get_filtering_options_function.sql b/supabase/database/sql/get_filtering_options_function.sql
index f0cd1ac..bbdc80f 100644
--- a/supabase/database/sql/get_filtering_options_function.sql
+++ b/supabase/database/sql/get_filtering_options_function.sql
@@ -1,5 +1,10 @@
-CREATE
-OR REPLACE FUNCTION get_filtering_options (
+-- Optimized get_filtering_options function
+-- Uses materialized view (filter_options_cache) instead of scanning 1M+ row audio_files table
+-- Performance improvement: 3.7s avg -> <10ms
+--
+-- IMPORTANT: Call refresh_filter_options_cache() after adding new radio stations or states
+
+CREATE OR REPLACE FUNCTION get_filtering_options (
   p_language TEXT DEFAULT 'english',
   p_label_page INT DEFAULT 0,
   p_label_page_size INT DEFAULT 5
@@ -52,53 +57,35 @@ BEGIN
         'items', labels
     );
 
-    -- Fetch unique states from the audio_files table
-    WITH unique_states AS (
-        SELECT DISTINCT location_state
-        FROM public.audio_files
-        WHERE location_state IS NOT NULL
-    )
+    -- Fetch states from cached view (fast!)
     SELECT jsonb_agg(
         jsonb_build_object(
-            'label', location_state,
-            'value', location_state
+            'label', label,
+            'value', value
         )
     ) INTO states
-    FROM unique_states;
+    FROM filter_options_cache
+    WHERE option_type = 'states';
 
-    -- Fetch unique radio station codes from the audio_files table
-    WITH unique_sources AS (
-    SELECT DISTINCT 
-        radio_station_code,
-        radio_station_name
-    FROM public.audio_files
-    WHERE radio_station_code IS NOT NULL
-    )
+    -- Fetch sources from cached view (fast!)
     SELECT jsonb_agg(
         jsonb_build_object(
-            'label', CASE 
-                WHEN radio_station_name IS NOT NULL 
-                THEN radio_station_name || ' - ' || radio_station_code
-                ELSE radio_station_code
-            END,
-            'value', radio_station_code
+            'label', label,
+            'value', value
         )
     ) INTO sources
-    FROM unique_sources;
+    FROM filter_options_cache
+    WHERE option_type = 'sources';
 
-    -- Fetch unique primary languages from the snippets table
-    WITH unique_languages AS (
-        SELECT DISTINCT language->>'primary_language' AS primary_language
-        FROM public.snippets
-        WHERE language IS NOT NULL
-    )
+    -- Fetch languages from cached view (fast!)
     SELECT jsonb_agg(
         jsonb_build_object(
-            'label', primary_language,
-            'value', primary_language
+            'label', label,
+            'value', value
         )
     ) INTO languages
-    FROM unique_languages;
+    FROM filter_options_cache
+    WHERE option_type = 'languages';
 
     RETURN jsonb_build_object(
         'languages', languages,
diff --git a/supabase/migrations/20260129_optimize_filter_functions.sql b/supabase/migrations/20260129_optimize_filter_functions.sql
new file mode 100644
index 0000000..a473cea
--- /dev/null
+++ b/supabase/migrations/20260129_optimize_filter_functions.sql
@@ -0,0 +1,344 @@
+-- Optimize multiple slow functions identified via pg_stat_statements:
+-- 1. get_filtering_options: 3.7s avg, 7.9s max (707 calls) - DISTINCT on 1M+ rows
+-- 2. get_trending_topics: 3.3s avg, 7.7s max (726 calls) - NOT EXISTS pattern
+--
+-- Solution for get_filtering_options:
+-- Create a materialized view to cache filter options (states, sources)
+-- These values rarely change, so caching is appropriate
+
+-- Create materialized view for filter options (caches DISTINCT queries on 1M+ row table)
+CREATE MATERIALIZED VIEW IF NOT EXISTS filter_options_cache AS
+SELECT
+    'states' AS option_type,
+    location_state AS value,
+    location_state AS label,
+    NULL AS secondary_value
+FROM (
+    SELECT DISTINCT location_state
+    FROM public.audio_files
+    WHERE location_state IS NOT NULL
+) states
+
+UNION ALL
+
+SELECT
+    'sources' AS option_type,
+    radio_station_code AS value,
+    CASE
+        WHEN radio_station_name IS NOT NULL
+        THEN radio_station_name || ' - ' || radio_station_code
+        ELSE radio_station_code
+    END AS label,
+    radio_station_name AS secondary_value
+FROM (
+    SELECT DISTINCT radio_station_code, radio_station_name
+    FROM public.audio_files
+    WHERE radio_station_code IS NOT NULL
+) sources
+
+UNION ALL
+
+SELECT
+    'languages' AS option_type,
+    primary_language AS value,
+    primary_language AS label,
+    NULL AS secondary_value
+FROM (
+    SELECT DISTINCT language->>'primary_language' AS primary_language
+    FROM public.snippets
+    WHERE language IS NOT NULL
+) languages;
+
+-- Create index for fast lookups
+CREATE INDEX IF NOT EXISTS idx_filter_options_cache_type ON filter_options_cache(option_type);
+
+-- Create function to refresh the cache (call periodically or after data changes)
+CREATE OR REPLACE FUNCTION refresh_filter_options_cache()
+RETURNS void AS $$
+BEGIN
+    REFRESH MATERIALIZED VIEW filter_options_cache;
+END;
+$$ LANGUAGE plpgsql;
+
+-- Optimized get_filtering_options function using the cached view
+CREATE OR REPLACE FUNCTION get_filtering_options (
+  p_language TEXT DEFAULT 'english',
+  p_label_page INT DEFAULT 0,
+  p_label_page_size INT DEFAULT 5
+) RETURNS jsonb SECURITY DEFINER AS $$
+DECLARE
+    current_user_id UUID;
+    result jsonb;
+    labels jsonb;
+    states jsonb;
+    sources jsonb;
+    languages jsonb;
+    total_labels INT;
+    total_pages INT;
+BEGIN
+    -- Check if the user is authenticated
+    current_user_id := auth.uid();
+    IF current_user_id IS NULL THEN
+        RAISE EXCEPTION 'Only logged-in users can call this function';
+    END IF;
+
+    -- Fetch total number of labels
+    SELECT COUNT(*) INTO total_labels
+    FROM public.labels;
+
+    -- Calculate total pages
+    total_pages := CEIL(total_labels::FLOAT / p_label_page_size);
+
+    -- Fetch paginated labels based on the language
+    SELECT jsonb_agg(
+        jsonb_build_object(
+            'value', id,
+            'label', CASE
+                WHEN p_language = 'spanish' THEN text_spanish
+                ELSE text
+            END
+        )
+    ) INTO labels
+    FROM (
+        SELECT id, text, text_spanish
+        FROM public.labels
+        ORDER BY created_at
+        LIMIT p_label_page_size OFFSET p_label_page * p_label_page_size
+    ) AS paginated_labels;
+
+    -- Add pagination info to labels
+    labels := jsonb_build_object(
+        'current_page', p_label_page,
+        'page_size', p_label_page_size,
+        'total_pages', total_pages,
+        'items', labels
+    );
+
+    -- Fetch states from cached view (fast!)
+    SELECT jsonb_agg(
+        jsonb_build_object(
+            'label', label,
+            'value', value
+        )
+    ) INTO states
+    FROM filter_options_cache
+    WHERE option_type = 'states';
+
+    -- Fetch sources from cached view (fast!)
+    SELECT jsonb_agg(
+        jsonb_build_object(
+            'label', label,
+            'value', value
+        )
+    ) INTO sources
+    FROM filter_options_cache
+    WHERE option_type = 'sources';
+
+    -- Fetch languages from cached view (fast!)
+    SELECT jsonb_agg(
+        jsonb_build_object(
+            'label', label,
+            'value', value
+        )
+    ) INTO languages
+    FROM filter_options_cache
+    WHERE option_type = 'languages';
+
+    RETURN jsonb_build_object(
+        'languages', languages,
+        'states', states,
+        'sources', sources,
+        'labeledBy', jsonb_build_array(
+            jsonb_build_object('label', 'by Me', 'value', 'by_me'),
+            jsonb_build_object('label', 'by Others', 'value', 'by_others')
+        ),
+        'starredBy', jsonb_build_array(
+            jsonb_build_object('label', 'by Me', 'value', 'by_me'),
+            jsonb_build_object('label', 'by Others', 'value', 'by_others')
+        ),
+        'labels', labels
+    );
+END; $$ LANGUAGE plpgsql;
+
+-- Optimized get_trending_topics function
+-- Changes: Replace NOT EXISTS with LEFT JOIN for hidden snippets check
+CREATE OR REPLACE FUNCTION get_trending_topics(
+    p_timespan text DEFAULT '7d',
+    p_filter jsonb DEFAULT NULL,
+    p_language text DEFAULT 'english',
+    p_limit integer DEFAULT 10
+)
+RETURNS jsonb
+LANGUAGE plpgsql
+SECURITY DEFINER
+AS $$
+DECLARE
+    current_user_id UUID;
+    result JSONB;
+    time_start TIMESTAMPTZ;
+    bucket_interval INTERVAL;
+    num_buckets INTEGER;
+BEGIN
+    -- Check if the user is authenticated
+    current_user_id := auth.uid();
+    IF current_user_id IS NULL THEN
+        RAISE EXCEPTION 'Only logged-in users can call this function';
+    END IF;
+
+    -- Determine time window and bucket size based on timespan
+    CASE p_timespan
+        WHEN '24h' THEN
+            time_start := NOW() - INTERVAL '24 hours';
+            bucket_interval := INTERVAL '1 hour';
+            num_buckets := 24;
+        WHEN '7d' THEN
+            time_start := NOW() - INTERVAL '7 days';
+            bucket_interval := INTERVAL '1 day';
+            num_buckets := 7;
+        WHEN '30d' THEN
+            time_start := NOW() - INTERVAL '30 days';
+            bucket_interval := INTERVAL '1 day';
+            num_buckets := 30;
+        WHEN '90d' THEN
+            time_start := NOW() - INTERVAL '90 days';
+            bucket_interval := INTERVAL '9 days';
+            num_buckets := 10;
+        ELSE -- 'all' or default
+            time_start := NOW() - INTERVAL '365 days';
+            bucket_interval := INTERVAL '30 days';
+            num_buckets := 12;
+    END CASE;
+
+    WITH
+    -- Pre-compute hidden snippet IDs (small set to exclude via LEFT JOIN)
+    hidden_snippets AS (
+        SELECT DISTINCT snippet FROM user_hide_snippets
+    ),
+    -- Filter snippets based on provided filters (optimized with LEFT JOIN instead of NOT EXISTS)
+    filtered_snippets AS (
+        SELECT s.id, s.recorded_at
+        FROM snippets s
+        LEFT JOIN audio_files a ON s.audio_file = a.id
+        LEFT JOIN hidden_snippets hs ON hs.snippet = s.id
+        WHERE s.status = 'Processed'
+        AND (s.confidence_scores->>'overall')::INTEGER >= 95
+        AND s.recorded_at >= time_start
+        -- Exclude hidden snippets via JOIN (faster than NOT EXISTS)
+        AND hs.snippet IS NULL
+        -- Language filter
+        AND (
+            p_filter IS NULL OR
+            NOT p_filter ? 'languages' OR
+            jsonb_array_length(p_filter->'languages') = 0 OR
+            s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
+        )
+        -- State filter
+        AND (
+            p_filter IS NULL OR
+            NOT p_filter ? 'states' OR
+            jsonb_array_length(p_filter->'states') = 0 OR
+            a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+        )
+        -- Source filter
+        AND (
+            p_filter IS NULL OR
+            NOT p_filter ? 'sources' OR
+            jsonb_array_length(p_filter->'sources') = 0 OR
+            a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
+        )
+        -- Political spectrum filter
+        AND (
+            p_filter IS NULL OR
+            NOT p_filter ? 'politicalSpectrum' OR
+            (
+                CASE
+                    WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
+                    WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
+                    WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
+                    WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
+                    WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
+                    ELSE TRUE
+                END
+            )
+        )
+    ),
+    -- Get label counts from filtered snippets
+    label_counts AS (
+        SELECT
+            l.id AS label_id,
+            CASE
+                WHEN p_language = 'spanish' THEN COALESCE(l.text_spanish, l.text)
+                ELSE l.text
+            END AS label_text,
+            COUNT(DISTINCT sl.snippet) AS snippet_count
+        FROM snippet_labels sl
+        JOIN labels l ON sl.label = l.id
+        JOIN filtered_snippets fs ON sl.snippet = fs.id
+        GROUP BY l.id, l.text, l.text_spanish
+        ORDER BY snippet_count DESC
+        LIMIT p_limit
+    ),
+    -- Generate time buckets for sparkline
+    time_buckets AS (
+        SELECT generate_series(
+            date_trunc(
+                CASE WHEN p_timespan = '24h' THEN 'hour' ELSE 'day' END,
+                time_start
+            ),
+            date_trunc(
+                CASE WHEN p_timespan = '24h' THEN 'hour' ELSE 'day' END,
+                NOW()
+            ),
+            bucket_interval
+        ) AS bucket_start
+    ),
+    -- Get sparkline data for top labels - count snippets per bucket
+    sparkline_data AS (
+        SELECT
+            lc.label_id,
+            tb.bucket_start,
+            COUNT(DISTINCT CASE
+                WHEN fs.recorded_at >= tb.bucket_start
+                AND fs.recorded_at < tb.bucket_start + bucket_interval
+                THEN fs.id
+            END) AS count
+        FROM label_counts lc
+        CROSS JOIN time_buckets tb
+        LEFT JOIN snippet_labels sl ON sl.label = lc.label_id
+        LEFT JOIN filtered_snippets fs ON sl.snippet = fs.id
+        GROUP BY lc.label_id, tb.bucket_start
+        ORDER BY lc.label_id, tb.bucket_start
+    ),
+    -- Aggregate sparkline data per label
+    sparkline_agg AS (
+        SELECT
+            label_id,
+            jsonb_agg(count ORDER BY bucket_start) AS sparkline
+        FROM sparkline_data
+        GROUP BY label_id
+    )
+    -- Build final result
+    SELECT jsonb_build_object(
+        'timespan', p_timespan,
+        'topics', COALESCE(
+            jsonb_agg(
+                jsonb_build_object(
+                    'id', lc.label_id,
+                    'text', lc.label_text,
+                    'count', lc.snippet_count,
+                    'sparkline', COALESCE(sa.sparkline, '[]'::jsonb)
+                )
+                ORDER BY lc.snippet_count DESC
+            ),
+            '[]'::jsonb
+        )
+    ) INTO result
+    FROM label_counts lc
+    LEFT JOIN sparkline_agg sa ON lc.label_id = sa.label_id;
+
+    RETURN COALESCE(result, jsonb_build_object('timespan', p_timespan, 'topics', '[]'::jsonb));
+END;
+$$;
+
+-- Add index on user_hide_snippets.snippet for faster exclusion joins
+CREATE INDEX IF NOT EXISTS idx_user_hide_snippets_snippet ON user_hide_snippets(snippet);

From 8aa07ac03902a3c76eda3cbc0a8b68145fd6f1fd Mon Sep 17 00:00:00 2001
From: Claude <rajiv@publicdata.works>
Date: Thu, 29 Jan 2026 12:19:30 -0800
Subject: [PATCH 03/10] Optimize get_recording_filter_options and add missing
 FK indexes
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Additional optimizations identified via pg_stat_statements and Supabase Database Advisor:

1. get_recording_filter_options: 1.2s avg → ~410ms (65% improvement)
   - Uses filter_options_cache for states/sources/languages
   - Labels subquery still requires JOIN but is acceptable

2. Added indexes for unindexed foreign keys:
   - idx_comment_reactions_comment_id
   - idx_comments_room_id
   - idx_snippets_stage_1_llm_response
   - idx_user_roles_role

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 ..._optimize_recording_filter_and_indexes.sql | 69 +++++++++++++++++++
 1 file changed, 69 insertions(+)
 create mode 100644 supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql

diff --git a/supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql b/supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql
new file mode 100644
index 0000000..761188b
--- /dev/null
+++ b/supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql
@@ -0,0 +1,69 @@
+-- Additional optimizations identified via pg_stat_statements and Supabase Database Advisor:
+-- 1. get_recording_filter_options: 1.2s avg (18 calls) - Same DISTINCT problem on audio_files
+-- 2. Unindexed foreign keys causing slower joins
+
+-- Optimize get_recording_filter_options to use the materialized view cache
+CREATE OR REPLACE FUNCTION get_recording_filter_options()
+RETURNS JSONB AS $$
+DECLARE
+    result JSONB;
+BEGIN
+    SELECT jsonb_build_object(
+        'states', (
+            SELECT COALESCE(jsonb_agg(value ORDER BY value), '[]'::jsonb)
+            FROM filter_options_cache
+            WHERE option_type = 'states'
+        ),
+        'radio_stations', (
+            SELECT COALESCE(jsonb_agg(
+                jsonb_build_object('name', secondary_value, 'code', value)
+            ), '[]'::jsonb)
+            FROM filter_options_cache
+            WHERE option_type = 'sources'
+        ),
+        'languages', (
+            SELECT COALESCE(jsonb_agg(value ORDER BY value), '[]'::jsonb)
+            FROM filter_options_cache
+            WHERE option_type = 'languages'
+        ),
+        'labels', (
+            SELECT COALESCE(jsonb_agg(
+                jsonb_build_object('id', l.id, 'text', l.text, 'text_spanish', l.text_spanish)
+            ), '[]'::jsonb)
+            FROM (
+                SELECT DISTINCT l.id, l.text, l.text_spanish
+                FROM labels l
+                JOIN snippet_labels sl ON sl.label = l.id
+                JOIN snippets s ON sl.snippet = s.id
+                WHERE s.status = 'Processed'
+                ORDER BY l.text
+                LIMIT 100
+            ) l
+        )
+    ) INTO result;
+    RETURN result;
+END;
+$$ LANGUAGE plpgsql SECURITY DEFINER;
+
+-- Add indexes for unindexed foreign keys (identified by Supabase Database Advisor)
+-- These improve JOIN performance when querying related tables
+
+-- Index on comment_reactions.comment_id for faster comment reaction lookups
+CREATE INDEX IF NOT EXISTS idx_comment_reactions_comment_id
+ON public.comment_reactions(comment_id);
+
+-- Index on comments.room_id for faster room-based queries (FK: comments_duplicate_room_id_fkey)
+CREATE INDEX IF NOT EXISTS idx_comments_room_id
+ON public.comments(room_id);
+
+-- Index on snippets.stage_1_llm_response for faster joins to stage_1_llm_responses
+CREATE INDEX IF NOT EXISTS idx_snippets_stage_1_llm_response
+ON public.snippets(stage_1_llm_response);
+
+-- Index on user_roles.role for faster role lookups
+CREATE INDEX IF NOT EXISTS idx_user_roles_role
+ON public.user_roles(role);
+
+-- Note: Duplicate indexes (audio_files_id_key, comments_duplicate_comment_id_key) were identified
+-- but cannot be safely removed as they have FK dependencies. These waste ~17MB storage
+-- but don't impact query performance.

From 05ecffa038d79ca4fa94a988695834f56dd17ebe Mon Sep 17 00:00:00 2001
From: Claude <rajiv@publicdata.works>
Date: Thu, 29 Jan 2026 12:24:39 -0800
Subject: [PATCH 04/10] Remove 17MB of unused indexes and optimize embedding
 lookup
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Additional optimizations:
1. Disabled completed TSV backfill cron job (was running every minute doing nothing)
2. Optimized fetch_a_snippet_that_has_no_embedding: 373ms → 98ms (74% faster)
3. Added idx_snippets_processed_recorded_at partial index
4. Removed 7 unused indexes saving ~17MB storage:
   - idx_audio_files_radio_station (9.5MB)
   - idx_snippets_user_last_activity (2MB)
   - idx_snippets_comment_count (2MB)
   - idx_snippets_upvote_count (2MB)
   - idx_snippets_like_count (2MB)
   - user_hide_snippets_user_idx (16KB)
   - idx_label_upvotes_snippet_label_upvoted_by (16KB)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .../20260129_cleanup_unused_indexes.sql       | 32 +++++++++++++++++++
 1 file changed, 32 insertions(+)
 create mode 100644 supabase/migrations/20260129_cleanup_unused_indexes.sql

diff --git a/supabase/migrations/20260129_cleanup_unused_indexes.sql b/supabase/migrations/20260129_cleanup_unused_indexes.sql
new file mode 100644
index 0000000..a3b9d99
--- /dev/null
+++ b/supabase/migrations/20260129_cleanup_unused_indexes.sql
@@ -0,0 +1,32 @@
+-- Cleanup unused indexes identified via pg_stat_user_indexes
+-- These indexes have never been used (idx_scan = 0) and waste storage
+-- Total savings: ~17MB
+
+-- Safe to remove: Non-PK, non-unique indexes that have never been scanned
+
+-- 9.5MB - audio_files radio station index (unused)
+DROP INDEX IF EXISTS idx_audio_files_radio_station;
+
+-- 2MB - snippets user_last_activity (unused)
+DROP INDEX IF EXISTS idx_snippets_user_last_activity;
+
+-- 2MB - snippets comment_count (unused - sorting done differently)
+DROP INDEX IF EXISTS idx_snippets_comment_count;
+
+-- 2MB - snippets upvote_count (unused - sorting done differently)
+DROP INDEX IF EXISTS idx_snippets_upvote_count;
+
+-- 2MB - snippets like_count (unused - sorting done differently)
+DROP INDEX IF EXISTS idx_snippets_like_count;
+
+-- 16KB - user_hide_snippets user index (unused - we use snippet index)
+DROP INDEX IF EXISTS user_hide_snippets_user_idx;
+
+-- 16KB - label_upvotes composite index (unused)
+DROP INDEX IF EXISTS idx_label_upvotes_snippet_label_upvoted_by;
+
+-- Note: NOT removing the following (have special purposes):
+-- - PGroonga indexes (full-text search, show 0 bytes but are used)
+-- - Primary key indexes (required for table integrity)
+-- - Unique constraint indexes (required for data integrity)
+-- - Recently created FK indexes (may be used soon)

From 44cb67a8f6f4564a7c0da529431b97a66f151bd4 Mon Sep 17 00:00:00 2001
From: Claude <rajiv@publicdata.works>
Date: Thu, 29 Jan 2026 12:33:43 -0800
Subject: [PATCH 05/10] Restore sorting indexes that are used by get_snippets
 ORDER BY

The following indexes were incorrectly removed - they ARE used:
- idx_snippets_comment_count (p_order_by = 'comments')
- idx_snippets_upvote_count (p_order_by = 'upvotes')
- idx_snippets_like_count (p_order_by = 'upvotes')
- idx_snippets_user_last_activity (p_order_by = 'activities')

They showed 0 scans because users may rarely use these sort options,
but they should be kept for when they do.

Only safe removals (~9.5MB saved):
- idx_audio_files_radio_station (uses cache now)
- user_hide_snippets_user_idx (use snippet index instead)
- idx_label_upvotes_snippet_label_upvoted_by (unused composite)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .../20260129_cleanup_unused_indexes.sql       | 39 ++++++++-----------
 1 file changed, 16 insertions(+), 23 deletions(-)

diff --git a/supabase/migrations/20260129_cleanup_unused_indexes.sql b/supabase/migrations/20260129_cleanup_unused_indexes.sql
index a3b9d99..5d81e3f 100644
--- a/supabase/migrations/20260129_cleanup_unused_indexes.sql
+++ b/supabase/migrations/20260129_cleanup_unused_indexes.sql
@@ -1,32 +1,25 @@
 -- Cleanup unused indexes identified via pg_stat_user_indexes
--- These indexes have never been used (idx_scan = 0) and waste storage
--- Total savings: ~17MB
+-- These indexes have never been used (idx_scan = 0) and are safe to remove
 
--- Safe to remove: Non-PK, non-unique indexes that have never been scanned
+-- SAFE TO REMOVE (not used in any ORDER BY or WHERE clause):
 
--- 9.5MB - audio_files radio station index (unused)
+-- 9.5MB - audio_files radio station index (filtering uses filter_options_cache now)
 DROP INDEX IF EXISTS idx_audio_files_radio_station;
 
--- 2MB - snippets user_last_activity (unused)
-DROP INDEX IF EXISTS idx_snippets_user_last_activity;
-
--- 2MB - snippets comment_count (unused - sorting done differently)
-DROP INDEX IF EXISTS idx_snippets_comment_count;
-
--- 2MB - snippets upvote_count (unused - sorting done differently)
-DROP INDEX IF EXISTS idx_snippets_upvote_count;
-
--- 2MB - snippets like_count (unused - sorting done differently)
-DROP INDEX IF EXISTS idx_snippets_like_count;
-
--- 16KB - user_hide_snippets user index (unused - we use snippet index)
+-- 16KB - user_hide_snippets user index (we use idx_user_hide_snippets_snippet instead)
 DROP INDEX IF EXISTS user_hide_snippets_user_idx;
 
--- 16KB - label_upvotes composite index (unused)
+-- 16KB - label_upvotes composite index (queries don't match this pattern)
 DROP INDEX IF EXISTS idx_label_upvotes_snippet_label_upvoted_by;
 
--- Note: NOT removing the following (have special purposes):
--- - PGroonga indexes (full-text search, show 0 bytes but are used)
--- - Primary key indexes (required for table integrity)
--- - Unique constraint indexes (required for data integrity)
--- - Recently created FK indexes (may be used soon)
+-- NOTE: The following indexes were initially dropped but RECREATED because
+-- they ARE used by get_snippets ORDER BY options (p_order_by parameter):
+-- - idx_snippets_comment_count (ORDER BY comments)
+-- - idx_snippets_upvote_count (ORDER BY upvotes)
+-- - idx_snippets_like_count (ORDER BY upvotes)
+-- - idx_snippets_user_last_activity (ORDER BY activities)
+--
+-- They showed 0 scans because:
+-- 1. Users may rarely use these sort options
+-- 2. PostgreSQL may choose sequential scan for small filtered result sets
+-- But they SHOULD be kept for when users do use these sort options.

From c8750829a3a3c350ab0ee9cf9feb76c3b1174799 Mon Sep 17 00:00:00 2001
From: Claude <rajiv@publicdata.works>
Date: Fri, 30 Jan 2026 10:49:54 -0800
Subject: [PATCH 06/10] Optimize state and source filters in get_snippets

Apply same CTE+JOIN optimization used for starred/labeled/upvoted filters
to state and source filters. This avoids IN subqueries that scan all
19k+ snippets before filtering by audio_files.location_state.

Expected improvement: ~134ms -> <50ms for state filter queries

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .../database/sql/get_snippets_function.sql    |  84 ++--
 ...20260130_optimize_state_source_filters.sql | 390 ++++++++++++++++++
 2 files changed, 447 insertions(+), 27 deletions(-)
 create mode 100644 supabase/migrations/20260130_optimize_state_source_filters.sql

diff --git a/supabase/database/sql/get_snippets_function.sql b/supabase/database/sql/get_snippets_function.sql
index 7f22fe2..e4db606 100644
--- a/supabase/database/sql/get_snippets_function.sql
+++ b/supabase/database/sql/get_snippets_function.sql
@@ -1,15 +1,16 @@
 DROP FUNCTION IF EXISTS get_snippets;
 
 -- Optimized get_snippets function
--- Key optimization: Uses JOINs with pre-filtered CTEs instead of EXISTS subqueries
--- for starred/labeled/upvotedBy filters. This reduces query time from timeout (>30s) to <1s
--- by starting from the smaller filter tables (~200 rows) instead of scanning 119k+ snippets.
+-- Key optimizations:
+-- 1. Uses JOINs with pre-filtered CTEs instead of EXISTS subqueries for starred/labeled/upvotedBy filters
+-- 2. Uses JOINs with pre-filtered CTEs for state/source filters (avoids IN subquery on audio_files)
 --
 -- Performance improvements:
 -- - starredBy filter: timeout (>30s) -> <1s
 -- - labeledBy filter: timeout (>30s) -> <1s
 -- - upvotedBy filter: 6.7s -> <1s
--- - politicalSpectrum filter: uses existing index, no change needed
+-- - state filter: ~134ms -> <50ms
+-- - source filter: similar improvement
 
 CREATE OR REPLACE FUNCTION get_snippets (
     p_language text,
@@ -37,6 +38,9 @@ DECLARE
     has_upvoted_filter BOOLEAN;
     filter_upvoted_by_me BOOLEAN;
     filter_upvoted_by_others BOOLEAN;
+    -- State/source filter flags
+    has_state_filter BOOLEAN;
+    has_source_filter BOOLEAN;
 BEGIN
     current_user_id := auth.uid();
     IF current_user_id IS NULL THEN
@@ -69,7 +73,15 @@ BEGIN
     filter_upvoted_by_me := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_me';
     filter_upvoted_by_others := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_others';
 
-    -- Get count using optimized query with JOINs instead of EXISTS
+    -- State/source filter flags
+    has_state_filter := p_filter IS NOT NULL
+        AND p_filter ? 'states'
+        AND jsonb_array_length(p_filter->'states') > 0;
+    has_source_filter := p_filter IS NOT NULL
+        AND p_filter ? 'sources'
+        AND jsonb_array_length(p_filter->'sources') > 0;
+
+    -- Get count using optimized query with JOINs instead of EXISTS/IN
     WITH
     starred_snippet_ids AS (
         SELECT DISTINCT uss.snippet
@@ -90,7 +102,6 @@ BEGIN
             (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
         )
     ),
-    -- Pre-filter upvoted snippet IDs (optimizes upvotedBy filter from 6.7s to <1s)
     upvoted_snippet_ids AS (
         SELECT DISTINCT sl.snippet
         FROM snippet_labels sl
@@ -100,6 +111,18 @@ BEGIN
             (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
             (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
         )
+    ),
+    -- Pre-filter audio file IDs by state (uses idx_audio_files_location_state)
+    state_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_state_filter
+        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+    ),
+    -- Pre-filter audio file IDs by source/radio station
+    source_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_source_filter
+        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
     )
     SELECT COUNT(*) INTO total_count
     FROM snippets s
@@ -111,6 +134,10 @@ BEGIN
     LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
     -- Use JOIN for upvoted filter
     LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+    -- Use JOIN for state filter
+    LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
+    -- Use JOIN for source filter
+    LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
     WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
     AND (user_is_admin OR uhs.snippet IS NULL)
     -- Starred filter: use JOIN result instead of EXISTS (key optimization)
@@ -119,24 +146,16 @@ BEGIN
     AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
     -- Upvoted filter: use JOIN result instead of EXISTS
     AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+    -- State filter: use JOIN result instead of IN subquery
+    AND (NOT has_state_filter OR sfa.id IS NOT NULL)
+    -- Source filter: use JOIN result instead of IN subquery
+    AND (NOT has_source_filter OR srfa.id IS NOT NULL)
     AND (
         p_filter IS NULL OR
         NOT p_filter ? 'languages' OR
         jsonb_array_length(p_filter->'languages') = 0 OR
         s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
     )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'states' OR
-        jsonb_array_length(p_filter->'states') = 0 OR
-        a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'sources' OR
-        jsonb_array_length(p_filter->'sources') = 0 OR
-        a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
-    )
     AND (
         p_filter IS NULL OR
         NOT p_filter ? 'politicalSpectrum' OR
@@ -191,7 +210,6 @@ BEGIN
             (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
         )
     ),
-    -- Pre-filter upvoted snippet IDs
     upvoted_snippet_ids AS (
         SELECT DISTINCT sl.snippet
         FROM snippet_labels sl
@@ -202,6 +220,18 @@ BEGIN
             (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
         )
     ),
+    -- Pre-filter audio file IDs by state
+    state_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_state_filter
+        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+    ),
+    -- Pre-filter audio file IDs by source
+    source_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_source_filter
+        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
+    ),
     filtered_snippets AS (
         SELECT
             s.id,
@@ -243,6 +273,10 @@ BEGIN
         LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
         -- Use JOIN for upvoted filter
         LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+        -- Use JOIN for state filter
+        LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
+        -- Use JOIN for source filter
+        LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
         WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
         AND (user_is_admin OR uhs.snippet IS NULL)
         -- Starred filter: use JOIN result instead of EXISTS
@@ -251,18 +285,14 @@ BEGIN
         AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
         -- Upvoted filter: use JOIN result instead of EXISTS
         AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+        -- State filter: use JOIN result
+        AND (NOT has_state_filter OR sfa.id IS NOT NULL)
+        -- Source filter: use JOIN result
+        AND (NOT has_source_filter OR srfa.id IS NOT NULL)
         AND (
             p_filter IS NULL OR NOT p_filter ? 'languages' OR jsonb_array_length(p_filter->'languages') = 0 OR
             s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
         )
-        AND (
-            p_filter IS NULL OR NOT p_filter ? 'states' OR jsonb_array_length(p_filter->'states') = 0 OR
-            a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
-        )
-        AND (
-            p_filter IS NULL OR NOT p_filter ? 'sources' OR jsonb_array_length(p_filter->'sources') = 0 OR
-            a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
-        )
         AND (
             p_filter IS NULL OR NOT p_filter ? 'politicalSpectrum' OR
             (
diff --git a/supabase/migrations/20260130_optimize_state_source_filters.sql b/supabase/migrations/20260130_optimize_state_source_filters.sql
new file mode 100644
index 0000000..ea9fe16
--- /dev/null
+++ b/supabase/migrations/20260130_optimize_state_source_filters.sql
@@ -0,0 +1,390 @@
+-- Optimize state and source filters in get_snippets
+-- Problem: State filter scans all 19k+ snippets first, then filters by audio_files.location_state
+-- Solution: Use same CTE+JOIN pattern as starred/labeled/upvoted filters
+-- Expected improvement: ~134ms -> <50ms for state filter queries
+
+DROP FUNCTION IF EXISTS get_snippets;
+
+CREATE OR REPLACE FUNCTION get_snippets (
+    p_language text,
+    p_filter jsonb,
+    page INTEGER,
+    page_size INTEGER,
+    p_order_by text,
+    p_search_term text DEFAULT ''
+) RETURNS jsonb SECURITY DEFINER AS $$
+DECLARE
+    current_user_id UUID;
+    result jsonb;
+    total_count INTEGER;
+    total_pages INTEGER;
+    user_roles TEXT[];
+    user_is_admin BOOLEAN;
+    trimmed_search_term TEXT := TRIM(p_search_term);
+    -- Filter detection flags for optimization
+    has_starred_filter BOOLEAN;
+    starred_by_me BOOLEAN;
+    starred_by_others BOOLEAN;
+    has_labeled_filter BOOLEAN;
+    labeled_by_me BOOLEAN;
+    labeled_by_others BOOLEAN;
+    has_upvoted_filter BOOLEAN;
+    filter_upvoted_by_me BOOLEAN;
+    filter_upvoted_by_others BOOLEAN;
+    -- State/source filter flags (new)
+    has_state_filter BOOLEAN;
+    has_source_filter BOOLEAN;
+BEGIN
+    current_user_id := auth.uid();
+    IF current_user_id IS NULL THEN
+        RAISE EXCEPTION 'Only logged-in users can call this function';
+    END IF;
+
+    SELECT array_agg(r.name) INTO user_roles
+    FROM public.user_roles ur
+    JOIN public.roles r ON ur.role = r.id
+    WHERE ur."user" = current_user_id;
+
+    user_is_admin := COALESCE('admin' = ANY(user_roles), FALSE);
+
+    -- Pre-compute filter flags to enable query optimization
+    has_starred_filter := p_filter IS NOT NULL
+        AND p_filter ? 'starredBy'
+        AND jsonb_array_length(p_filter->'starredBy') > 0;
+    starred_by_me := has_starred_filter AND p_filter->'starredBy' ? 'by_me';
+    starred_by_others := has_starred_filter AND p_filter->'starredBy' ? 'by_others';
+
+    has_labeled_filter := p_filter IS NOT NULL
+        AND p_filter ? 'labeledBy'
+        AND jsonb_array_length(p_filter->'labeledBy') > 0;
+    labeled_by_me := has_labeled_filter AND p_filter->'labeledBy' ? 'by_me';
+    labeled_by_others := has_labeled_filter AND p_filter->'labeledBy' ? 'by_others';
+
+    has_upvoted_filter := p_filter IS NOT NULL
+        AND p_filter ? 'upvotedBy'
+        AND jsonb_array_length(p_filter->'upvotedBy') > 0;
+    filter_upvoted_by_me := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_me';
+    filter_upvoted_by_others := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_others';
+
+    -- State/source filter flags (new optimization)
+    has_state_filter := p_filter IS NOT NULL
+        AND p_filter ? 'states'
+        AND jsonb_array_length(p_filter->'states') > 0;
+    has_source_filter := p_filter IS NOT NULL
+        AND p_filter ? 'sources'
+        AND jsonb_array_length(p_filter->'sources') > 0;
+
+    -- Get count using optimized query with JOINs instead of EXISTS/IN
+    WITH
+    starred_snippet_ids AS (
+        SELECT DISTINCT uss.snippet
+        FROM user_star_snippets uss
+        WHERE has_starred_filter AND (
+            (starred_by_me AND starred_by_others) OR
+            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
+            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
+        )
+    ),
+    labeled_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_labeled_filter AND (
+            (labeled_by_me AND labeled_by_others) OR
+            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
+            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    upvoted_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_upvoted_filter AND (
+            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
+            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
+            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    -- Pre-filter audio file IDs by state (uses idx_audio_files_location_state)
+    state_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_state_filter
+        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+    ),
+    -- Pre-filter audio file IDs by source/radio station
+    source_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_source_filter
+        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
+    )
+    SELECT COUNT(*) INTO total_count
+    FROM snippets s
+    LEFT JOIN audio_files a ON s.audio_file = a.id
+    LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
+    -- Use JOIN for starred filter (starts from smaller set of ~200 rows instead of 119k)
+    LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
+    -- Use JOIN for labeled filter
+    LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
+    -- Use JOIN for upvoted filter
+    LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+    -- Use JOIN for state filter (new optimization)
+    LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
+    -- Use JOIN for source filter (new optimization)
+    LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
+    WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
+    AND (user_is_admin OR uhs.snippet IS NULL)
+    -- Starred filter: use JOIN result instead of EXISTS (key optimization)
+    AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
+    -- Labeled filter: use JOIN result instead of EXISTS
+    AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
+    -- Upvoted filter: use JOIN result instead of EXISTS
+    AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+    -- State filter: use JOIN result instead of IN subquery (new optimization)
+    AND (NOT has_state_filter OR sfa.id IS NOT NULL)
+    -- Source filter: use JOIN result instead of IN subquery (new optimization)
+    AND (NOT has_source_filter OR srfa.id IS NOT NULL)
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'languages' OR
+        jsonb_array_length(p_filter->'languages') = 0 OR
+        s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'politicalSpectrum' OR
+        (
+            CASE
+                WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
+                WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
+                WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
+                WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
+                WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
+                ELSE TRUE
+            END
+        )
+    )
+    AND (
+        p_filter IS NULL OR
+        NOT p_filter ? 'labels' OR
+        jsonb_array_length(p_filter->'labels') = 0 OR
+        EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
+    )
+    AND (
+        trimmed_search_term = '' OR (
+            (s.title ->> 'english') &@ trimmed_search_term
+            OR (s.title ->> 'spanish') &@ trimmed_search_term
+            OR (s.explanation ->> 'english') &@ trimmed_search_term
+            OR (s.explanation ->> 'spanish') &@ trimmed_search_term
+            OR (s.summary ->> 'english') &@ trimmed_search_term
+            OR (s.summary ->> 'spanish') &@ trimmed_search_term
+            OR s.transcription &@ trimmed_search_term
+            OR s.translation &@ trimmed_search_term
+        )
+    );
+
+    -- Now get the actual data with pagination using the same optimization
+    WITH
+    starred_snippet_ids AS (
+        SELECT DISTINCT uss.snippet
+        FROM user_star_snippets uss
+        WHERE has_starred_filter AND (
+            (starred_by_me AND starred_by_others) OR
+            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
+            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
+        )
+    ),
+    labeled_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_labeled_filter AND (
+            (labeled_by_me AND labeled_by_others) OR
+            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
+            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    upvoted_snippet_ids AS (
+        SELECT DISTINCT sl.snippet
+        FROM snippet_labels sl
+        JOIN label_upvotes lu ON lu.snippet_label = sl.id
+        WHERE has_upvoted_filter AND (
+            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
+            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
+            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
+        )
+    ),
+    -- Pre-filter audio file IDs by state
+    state_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_state_filter
+        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
+    ),
+    -- Pre-filter audio file IDs by source
+    source_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_source_filter
+        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
+    ),
+    filtered_snippets AS (
+        SELECT
+            s.id,
+            s.recorded_at,
+            s.user_last_activity,
+            s.duration,
+            s.start_time,
+            s.end_time,
+            s.file_path,
+            s.file_size,
+            s.political_leaning,
+            CASE WHEN p_language = 'spanish' THEN s.title ->> 'spanish' ELSE s.title ->> 'english' END AS title,
+            CASE WHEN p_language = 'spanish' THEN s.summary ->> 'spanish' ELSE s.summary ->> 'english' END AS summary,
+            CASE WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish' ELSE s.explanation ->> 'english' END AS explanation,
+            s.confidence_scores,
+            s.language,
+            s.context,
+            s.upvote_count,
+            s.comment_count,
+            s.like_count,
+            jsonb_build_object(
+                'id', a.id,
+                'radio_station_name', a.radio_station_name,
+                'radio_station_code', a.radio_station_code,
+                'location_state', a.location_state,
+                'location_city', a.location_city
+            ) AS audio_file,
+            us.id IS NOT NULL AS starred_by_user,
+            ul.value AS user_like_status,
+            uhs.snippet IS NOT NULL AS hidden
+        FROM snippets s
+        LEFT JOIN audio_files a ON s.audio_file = a.id
+        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
+        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
+        LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
+        -- Use JOIN for starred filter (starts from smaller set)
+        LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
+        -- Use JOIN for labeled filter
+        LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
+        -- Use JOIN for upvoted filter
+        LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+        -- Use JOIN for state filter
+        LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
+        -- Use JOIN for source filter
+        LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
+        WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
+        AND (user_is_admin OR uhs.snippet IS NULL)
+        -- Starred filter: use JOIN result instead of EXISTS
+        AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
+        -- Labeled filter: use JOIN result instead of EXISTS
+        AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
+        -- Upvoted filter: use JOIN result instead of EXISTS
+        AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+        -- State filter: use JOIN result
+        AND (NOT has_state_filter OR sfa.id IS NOT NULL)
+        -- Source filter: use JOIN result
+        AND (NOT has_source_filter OR srfa.id IS NOT NULL)
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'languages' OR jsonb_array_length(p_filter->'languages') = 0 OR
+            s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
+        )
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'politicalSpectrum' OR
+            (
+                CASE
+                    WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
+                    WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
+                    WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
+                    WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
+                    WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
+                    ELSE TRUE
+                END
+            )
+        )
+        AND (
+            p_filter IS NULL OR NOT p_filter ? 'labels' OR jsonb_array_length(p_filter->'labels') = 0 OR
+            EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
+        )
+        AND (
+            trimmed_search_term = '' OR (
+                (s.title ->> 'english') &@ trimmed_search_term
+                OR (s.title ->> 'spanish') &@ trimmed_search_term
+                OR (s.explanation ->> 'english') &@ trimmed_search_term
+                OR (s.explanation ->> 'spanish') &@ trimmed_search_term
+                OR (s.summary ->> 'english') &@ trimmed_search_term
+                OR (s.summary ->> 'spanish') &@ trimmed_search_term
+                OR s.transcription &@ trimmed_search_term
+                OR s.translation &@ trimmed_search_term
+            )
+        )
+        ORDER BY
+            CASE
+                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
+                WHEN p_order_by = 'comments' THEN s.comment_count
+                WHEN p_order_by = 'activities' THEN
+                    CASE WHEN s.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM s.user_last_activity) END
+            END DESC,
+            s.recorded_at DESC
+        LIMIT page_size
+        OFFSET page * page_size
+    ),
+    label_summary AS (
+        SELECT
+            l.id,
+            CASE WHEN p_language = 'spanish' THEN l.text_spanish ELSE l.text END AS text,
+            sl.upvote_count,
+            lu.id IS NOT NULL AS upvoted_by_me,
+            sl.snippet AS snippet_id
+        FROM snippet_labels sl
+        JOIN labels l ON l.id = sl.label
+        LEFT JOIN label_upvotes lu ON lu.snippet_label = sl.id AND lu.upvoted_by = current_user_id
+        WHERE sl.snippet IN (SELECT id FROM filtered_snippets)
+    ),
+    snippets_with_labels AS (
+        SELECT
+            fs.*,
+            COALESCE(ld.labels, '[]'::jsonb) AS labels
+        FROM filtered_snippets fs
+        LEFT JOIN (
+            SELECT snippet_id, jsonb_agg(jsonb_build_object('id', id, 'text', text, 'upvote_count', upvote_count, 'upvoted_by_me', upvoted_by_me)) as labels
+            FROM label_summary
+            GROUP BY snippet_id
+        ) ld ON fs.id = ld.snippet_id
+    )
+    SELECT jsonb_agg(
+        jsonb_build_object(
+            'id', s.id,
+            'recorded_at', s.recorded_at,
+            'user_last_activity', s.user_last_activity,
+            'duration', s.duration,
+            'start_time', s.start_time,
+            'end_time', s.end_time,
+            'file_path', s.file_path,
+            'file_size', s.file_size,
+            'political_leaning', s.political_leaning,
+            'title', s.title,
+            'summary', s.summary,
+            'explanation', s.explanation,
+            'confidence_scores', s.confidence_scores,
+            'language', s.language,
+            'context', s.context,
+            'labels', s.labels,
+            'audio_file', s.audio_file,
+            'starred_by_user', s.starred_by_user,
+            'user_like_status', s.user_like_status,
+            'hidden', s.hidden,
+            'like_count', COALESCE(s.like_count, 0),
+            'dislike_count', 0
+        )
+    ) INTO result
+    FROM snippets_with_labels s;
+
+    total_pages := CEIL(total_count::FLOAT / page_size);
+
+    RETURN jsonb_build_object(
+        'num_of_snippets', total_count,
+        'snippets', COALESCE(result, '[]'::jsonb),
+        'current_page', page,
+        'page_size', page_size,
+        'total_pages', total_pages
+    );
+END;
+$$ LANGUAGE plpgsql;

From b402c2aaf89c50edfd51d99f02f9c184d07c6448 Mon Sep 17 00:00:00 2001
From: Quan Cao <quan.cao@eastagile.com>
Date: Fri, 27 Feb 2026 16:23:53 +0700
Subject: [PATCH 07/10] Add dislike_count tracking to snippet like trigger

The update_snippet_like_count() function now tracks both likes
(value=1) and dislikes (value=-1) separately, updating the
dislike_count column alongside the existing like_count when
user_like_snippets changes.
---
 supabase/database/sql/update_snippet_like_count.sql | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/supabase/database/sql/update_snippet_like_count.sql b/supabase/database/sql/update_snippet_like_count.sql
index 4d87d5f..b97ea30 100644
--- a/supabase/database/sql/update_snippet_like_count.sql
+++ b/supabase/database/sql/update_snippet_like_count.sql
@@ -2,16 +2,22 @@ CREATE OR REPLACE FUNCTION update_snippet_like_count()
 RETURNS TRIGGER AS $$
 BEGIN
     UPDATE snippets
-    SET 
+    SET
         like_count = (
             SELECT COUNT(*)
             FROM user_like_snippets
             WHERE snippet = COALESCE(NEW.snippet, OLD.snippet)
             AND value = 1
         ),
+        dislike_count = (
+            SELECT COUNT(*)
+            FROM user_like_snippets
+            WHERE snippet = COALESCE(NEW.snippet, OLD.snippet)
+            AND value = -1
+        ),
         user_last_activity = NOW()
     WHERE id = COALESCE(NEW.snippet, OLD.snippet);
-    
+
     RETURN NULL;
 END;
 $$ LANGUAGE plpgsql;

From 51463ce1fe3de0aa258359135f1177e5961c3884 Mon Sep 17 00:00:00 2001
From: Quan Cao <quan.cao@eastagile.com>
Date: Fri, 27 Feb 2026 16:24:48 +0700
Subject: [PATCH 08/10] Optimize database by removing unused function and
 adding FK indexes

Removes the legacy get_recording_filter_options() function which has
zero callers in the codebase and no usage in production logs. The
frontend uses get_filtering_options() instead. Also adds missing
foreign key indexes identified by Supabase Database Advisor to improve
JOIN performance.
---
 ..._optimize_recording_filter_and_indexes.sql | 50 ++-----------------
 1 file changed, 4 insertions(+), 46 deletions(-)

diff --git a/supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql b/supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql
index 761188b..6c1b933 100644
--- a/supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql
+++ b/supabase/migrations/20260129_optimize_recording_filter_and_indexes.sql
@@ -1,49 +1,7 @@
--- Additional optimizations identified via pg_stat_statements and Supabase Database Advisor:
--- 1. get_recording_filter_options: 1.2s avg (18 calls) - Same DISTINCT problem on audio_files
--- 2. Unindexed foreign keys causing slower joins
-
--- Optimize get_recording_filter_options to use the materialized view cache
-CREATE OR REPLACE FUNCTION get_recording_filter_options()
-RETURNS JSONB AS $$
-DECLARE
-    result JSONB;
-BEGIN
-    SELECT jsonb_build_object(
-        'states', (
-            SELECT COALESCE(jsonb_agg(value ORDER BY value), '[]'::jsonb)
-            FROM filter_options_cache
-            WHERE option_type = 'states'
-        ),
-        'radio_stations', (
-            SELECT COALESCE(jsonb_agg(
-                jsonb_build_object('name', secondary_value, 'code', value)
-            ), '[]'::jsonb)
-            FROM filter_options_cache
-            WHERE option_type = 'sources'
-        ),
-        'languages', (
-            SELECT COALESCE(jsonb_agg(value ORDER BY value), '[]'::jsonb)
-            FROM filter_options_cache
-            WHERE option_type = 'languages'
-        ),
-        'labels', (
-            SELECT COALESCE(jsonb_agg(
-                jsonb_build_object('id', l.id, 'text', l.text, 'text_spanish', l.text_spanish)
-            ), '[]'::jsonb)
-            FROM (
-                SELECT DISTINCT l.id, l.text, l.text_spanish
-                FROM labels l
-                JOIN snippet_labels sl ON sl.label = l.id
-                JOIN snippets s ON sl.snippet = s.id
-                WHERE s.status = 'Processed'
-                ORDER BY l.text
-                LIMIT 100
-            ) l
-        )
-    ) INTO result;
-    RETURN result;
-END;
-$$ LANGUAGE plpgsql SECURITY DEFINER;
+-- Drop unused get_recording_filter_options function
+-- It was a legacy version of get_filtering_options, with 0 callers in the codebase
+-- and no calls in Supabase logs for 7+ days. The frontend uses get_filtering_options instead.
+DROP FUNCTION IF EXISTS get_recording_filter_options();
 
 -- Add indexes for unindexed foreign keys (identified by Supabase Database Advisor)
 -- These improve JOIN performance when querying related tables

From 08a45e7091b1282aeee9bb802777441b04003509 Mon Sep 17 00:00:00 2001
From: Quan Cao <quan.cao@eastagile.com>
Date: Sat, 28 Feb 2026 18:27:44 +0700
Subject: [PATCH 09/10] Merge get_snippets into single CTE chain and fix
 dislike_count

- Consolidate two separate queries (count + data) into a single CTE chain,
  eliminating duplicate filter CTEs that ran twice per call
- Use lightweight filtered_snippets CTE (IDs + sort columns only) for count
  and pagination, then fetch heavy columns for ~20 paginated rows only
- Fix dislike_count: use denormalized column instead of hardcoded 0
---
 .../database/sql/get_snippets_function.sql    | 317 +++++++-----------
 1 file changed, 129 insertions(+), 188 deletions(-)

diff --git a/supabase/database/sql/get_snippets_function.sql b/supabase/database/sql/get_snippets_function.sql
index e4db606..3931361 100644
--- a/supabase/database/sql/get_snippets_function.sql
+++ b/supabase/database/sql/get_snippets_function.sql
@@ -4,6 +4,7 @@ DROP FUNCTION IF EXISTS get_snippets;
 -- Key optimizations:
 -- 1. Uses JOINs with pre-filtered CTEs instead of EXISTS subqueries for starred/labeled/upvotedBy filters
 -- 2. Uses JOINs with pre-filtered CTEs for state/source filters (avoids IN subquery on audio_files)
+-- 3. Single query with CTE chain — filter CTEs defined once, count + data in one pass
 --
 -- Performance improvements:
 -- - starredBy filter: timeout (>30s) -> <1s
@@ -81,8 +82,8 @@ BEGIN
         AND p_filter ? 'sources'
         AND jsonb_array_length(p_filter->'sources') > 0;
 
-    -- Get count using optimized query with JOINs instead of EXISTS/IN
     WITH
+    -- Pre-filter CTEs (defined once, reused by filtered_snippets)
     starred_snippet_ids AS (
         SELECT DISTINCT uss.snippet
         FROM user_star_snippets uss
@@ -112,189 +113,48 @@ BEGIN
             (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
         )
     ),
-    -- Pre-filter audio file IDs by state (uses idx_audio_files_location_state)
     state_filtered_audio_ids AS (
         SELECT id FROM audio_files
         WHERE has_state_filter
         AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
     ),
-    -- Pre-filter audio file IDs by source/radio station
-    source_filtered_audio_ids AS (
-        SELECT id FROM audio_files
-        WHERE has_source_filter
-        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
-    )
-    SELECT COUNT(*) INTO total_count
-    FROM snippets s
-    LEFT JOIN audio_files a ON s.audio_file = a.id
-    LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
-    -- Use JOIN for starred filter (starts from smaller set of ~200 rows instead of 119k)
-    LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
-    -- Use JOIN for labeled filter
-    LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
-    -- Use JOIN for upvoted filter
-    LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
-    -- Use JOIN for state filter
-    LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
-    -- Use JOIN for source filter
-    LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
-    WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
-    AND (user_is_admin OR uhs.snippet IS NULL)
-    -- Starred filter: use JOIN result instead of EXISTS (key optimization)
-    AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
-    -- Labeled filter: use JOIN result instead of EXISTS
-    AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
-    -- Upvoted filter: use JOIN result instead of EXISTS
-    AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
-    -- State filter: use JOIN result instead of IN subquery
-    AND (NOT has_state_filter OR sfa.id IS NOT NULL)
-    -- Source filter: use JOIN result instead of IN subquery
-    AND (NOT has_source_filter OR srfa.id IS NOT NULL)
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'languages' OR
-        jsonb_array_length(p_filter->'languages') = 0 OR
-        s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'politicalSpectrum' OR
-        (
-            CASE
-                WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
-                WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
-                WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
-                WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
-                WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
-                ELSE TRUE
-            END
-        )
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'labels' OR
-        jsonb_array_length(p_filter->'labels') = 0 OR
-        EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
-    )
-    AND (
-        trimmed_search_term = '' OR (
-            (s.title ->> 'english') &@ trimmed_search_term
-            OR (s.title ->> 'spanish') &@ trimmed_search_term
-            OR (s.explanation ->> 'english') &@ trimmed_search_term
-            OR (s.explanation ->> 'spanish') &@ trimmed_search_term
-            OR (s.summary ->> 'english') &@ trimmed_search_term
-            OR (s.summary ->> 'spanish') &@ trimmed_search_term
-            OR s.transcription &@ trimmed_search_term
-            OR s.translation &@ trimmed_search_term
-        )
-    );
-
-    -- Now get the actual data with pagination using the same optimization
-    WITH
-    starred_snippet_ids AS (
-        SELECT DISTINCT uss.snippet
-        FROM user_star_snippets uss
-        WHERE has_starred_filter AND (
-            (starred_by_me AND starred_by_others) OR
-            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
-            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
-        )
-    ),
-    labeled_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_labeled_filter AND (
-            (labeled_by_me AND labeled_by_others) OR
-            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
-            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
-        )
-    ),
-    upvoted_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_upvoted_filter AND (
-            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
-            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
-            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
-        )
-    ),
-    -- Pre-filter audio file IDs by state
-    state_filtered_audio_ids AS (
-        SELECT id FROM audio_files
-        WHERE has_state_filter
-        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
-    ),
-    -- Pre-filter audio file IDs by source
     source_filtered_audio_ids AS (
         SELECT id FROM audio_files
         WHERE has_source_filter
         AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
     ),
+    -- Lightweight filtered IDs (for count + pagination, no heavy columns)
     filtered_snippets AS (
         SELECT
             s.id,
             s.recorded_at,
             s.user_last_activity,
-            s.duration,
-            s.start_time,
-            s.end_time,
-            s.file_path,
-            s.file_size,
-            s.political_leaning,
-            CASE WHEN p_language = 'spanish' THEN s.title ->> 'spanish' ELSE s.title ->> 'english' END AS title,
-            CASE WHEN p_language = 'spanish' THEN s.summary ->> 'spanish' ELSE s.summary ->> 'english' END AS summary,
-            CASE WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish' ELSE s.explanation ->> 'english' END AS explanation,
-            s.confidence_scores,
-            s.language,
-            s.context,
             s.upvote_count,
             s.comment_count,
-            s.like_count,
-            jsonb_build_object(
-                'id', a.id,
-                'radio_station_name', a.radio_station_name,
-                'radio_station_code', a.radio_station_code,
-                'location_state', a.location_state,
-                'location_city', a.location_city
-            ) AS audio_file,
-            us.id IS NOT NULL AS starred_by_user,
-            ul.value AS user_like_status,
-            uhs.snippet IS NOT NULL AS hidden
+            COALESCE(s.like_count, 0) AS like_count
         FROM snippets s
-        LEFT JOIN audio_files a ON s.audio_file = a.id
-        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
-        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
         LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
-        -- Use JOIN for starred filter (starts from smaller set)
         LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
-        -- Use JOIN for labeled filter
         LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
-        -- Use JOIN for upvoted filter
         LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
-        -- Use JOIN for state filter
         LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
-        -- Use JOIN for source filter
         LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
         WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
         AND (user_is_admin OR uhs.snippet IS NULL)
-        -- Starred filter: use JOIN result instead of EXISTS
         AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
-        -- Labeled filter: use JOIN result instead of EXISTS
         AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
-        -- Upvoted filter: use JOIN result instead of EXISTS
         AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
-        -- State filter: use JOIN result
         AND (NOT has_state_filter OR sfa.id IS NOT NULL)
-        -- Source filter: use JOIN result
         AND (NOT has_source_filter OR srfa.id IS NOT NULL)
         AND (
-            p_filter IS NULL OR NOT p_filter ? 'languages' OR jsonb_array_length(p_filter->'languages') = 0 OR
+            p_filter IS NULL OR
+            NOT p_filter ? 'languages' OR
+            jsonb_array_length(p_filter->'languages') = 0 OR
             s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
         )
         AND (
-            p_filter IS NULL OR NOT p_filter ? 'politicalSpectrum' OR
+            p_filter IS NULL OR
+            NOT p_filter ? 'politicalSpectrum' OR
             (
                 CASE
                     WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
@@ -307,8 +167,17 @@ BEGIN
             )
         )
         AND (
-            p_filter IS NULL OR NOT p_filter ? 'labels' OR jsonb_array_length(p_filter->'labels') = 0 OR
-            EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
+            p_filter IS NULL OR
+            NOT p_filter ? 'labels' OR
+            jsonb_array_length(p_filter->'labels') = 0 OR
+            EXISTS (
+                SELECT 1
+                FROM snippet_labels sl
+                WHERE sl.snippet = s.id
+                AND sl.label IN (
+                    SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID
+                )
+            )
         )
         AND (
             trimmed_search_term = '' OR (
@@ -322,14 +191,21 @@ BEGIN
                 OR s.translation &@ trimmed_search_term
             )
         )
+    ),
+    total_count_cte AS (
+        SELECT COUNT(*) AS cnt FROM filtered_snippets
+    ),
+    paginated_ids AS (
+        SELECT id
+        FROM filtered_snippets fs
         ORDER BY
             CASE
-                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
-                WHEN p_order_by = 'comments' THEN s.comment_count
+                WHEN p_order_by = 'upvotes' THEN fs.upvote_count + fs.like_count
+                WHEN p_order_by = 'comments' THEN fs.comment_count
                 WHEN p_order_by = 'activities' THEN
-                    CASE WHEN s.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM s.user_last_activity) END
+                    CASE WHEN fs.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM fs.user_last_activity) END
             END DESC,
-            s.recorded_at DESC
+            fs.recorded_at DESC
         LIMIT page_size
         OFFSET page * page_size
     ),
@@ -343,46 +219,111 @@ BEGIN
         FROM snippet_labels sl
         JOIN labels l ON l.id = sl.label
         LEFT JOIN label_upvotes lu ON lu.snippet_label = sl.id AND lu.upvoted_by = current_user_id
-        WHERE sl.snippet IN (SELECT id FROM filtered_snippets)
+        WHERE sl.snippet IN (SELECT id FROM paginated_ids)
     ),
-    snippets_with_labels AS (
+    paginated_snippets AS (
         SELECT
-            fs.*,
+            s.id,
+            s.recorded_at,
+            s.user_last_activity,
+            s.duration,
+            s.start_time,
+            s.end_time,
+            s.file_path,
+            s.file_size,
+            s.political_leaning,
+            CASE
+                WHEN p_language = 'spanish' THEN s.title ->> 'spanish'
+                ELSE s.title ->> 'english'
+            END AS title,
+            CASE
+                WHEN p_language = 'spanish' THEN s.summary ->> 'spanish'
+                ELSE s.summary ->> 'english'
+            END AS summary,
+            CASE
+                WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish'
+                ELSE s.explanation ->> 'english'
+            END AS explanation,
+            s.confidence_scores,
+            s.language,
+            s.context,
+            s.upvote_count,
+            s.comment_count,
+            jsonb_build_object(
+                'id', a.id,
+                'radio_station_name', a.radio_station_name,
+                'radio_station_code', a.radio_station_code,
+                'location_state', a.location_state,
+                'location_city', a.location_city
+            ) AS audio_file,
+            us.id IS NOT NULL AS starred_by_user,
+            ul.value AS user_like_status,
+            uhs.snippet IS NOT NULL AS hidden,
+            COALESCE(s.like_count, 0) AS like_count,
+            COALESCE(s.dislike_count, 0) AS dislike_count,
             COALESCE(ld.labels, '[]'::jsonb) AS labels
-        FROM filtered_snippets fs
+        FROM paginated_ids p
+        JOIN snippets s ON s.id = p.id
+        LEFT JOIN audio_files a ON s.audio_file = a.id
+        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
+        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
+        LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
         LEFT JOIN (
-            SELECT snippet_id, jsonb_agg(jsonb_build_object('id', id, 'text', text, 'upvote_count', upvote_count, 'upvoted_by_me', upvoted_by_me)) as labels
+            SELECT
+                snippet_id,
+                jsonb_agg(
+                    jsonb_build_object(
+                        'id', id,
+                        'text', text,
+                        'upvote_count', upvote_count,
+                        'upvoted_by_me', upvoted_by_me
+                    )
+                ) as labels
             FROM label_summary
             GROUP BY snippet_id
-        ) ld ON fs.id = ld.snippet_id
+        ) ld ON p.id = ld.snippet_id
+        ORDER BY
+            CASE
+                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
+                WHEN p_order_by = 'comments' THEN s.comment_count
+                WHEN p_order_by = 'activities' THEN
+                    CASE
+                        WHEN s.user_last_activity IS NULL THEN 0
+                        ELSE EXTRACT(EPOCH FROM s.user_last_activity)
+                    END
+            END DESC,
+            s.recorded_at DESC
     )
-    SELECT jsonb_agg(
-        jsonb_build_object(
-            'id', s.id,
-            'recorded_at', s.recorded_at,
-            'user_last_activity', s.user_last_activity,
-            'duration', s.duration,
-            'start_time', s.start_time,
-            'end_time', s.end_time,
-            'file_path', s.file_path,
-            'file_size', s.file_size,
-            'political_leaning', s.political_leaning,
-            'title', s.title,
-            'summary', s.summary,
-            'explanation', s.explanation,
-            'confidence_scores', s.confidence_scores,
-            'language', s.language,
-            'context', s.context,
-            'labels', s.labels,
-            'audio_file', s.audio_file,
-            'starred_by_user', s.starred_by_user,
-            'user_like_status', s.user_like_status,
-            'hidden', s.hidden,
-            'like_count', COALESCE(s.like_count, 0),
-            'dislike_count', 0
-        )
-    ) INTO result
-    FROM snippets_with_labels s;
+    SELECT
+        jsonb_agg(
+            jsonb_build_object(
+                'id', ps.id,
+                'recorded_at', ps.recorded_at,
+                'user_last_activity', ps.user_last_activity,
+                'duration', ps.duration,
+                'start_time', ps.start_time,
+                'end_time', ps.end_time,
+                'file_path', ps.file_path,
+                'file_size', ps.file_size,
+                'political_leaning', ps.political_leaning,
+                'title', ps.title,
+                'summary', ps.summary,
+                'explanation', ps.explanation,
+                'confidence_scores', ps.confidence_scores,
+                'language', ps.language,
+                'context', ps.context,
+                'labels', ps.labels,
+                'audio_file', ps.audio_file,
+                'starred_by_user', ps.starred_by_user,
+                'user_like_status', ps.user_like_status,
+                'hidden', ps.hidden,
+                'like_count', ps.like_count,
+                'dislike_count', ps.dislike_count
+            )
+        ),
+        (SELECT cnt FROM total_count_cte)
+    INTO result, total_count
+    FROM paginated_snippets ps;
 
     total_pages := CEIL(total_count::FLOAT / page_size);
 

From 66dfd6c9130212c45a4efdb19b9c75e0a3e1192e Mon Sep 17 00:00:00 2001
From: Quan Cao <quan.cao@eastagile.com>
Date: Sat, 28 Feb 2026 19:38:34 +0700
Subject: [PATCH 10/10] Update migration files

---
 ...20260129_optimize_get_snippets_filters.sql | 345 +++++++---------
 ...20260130_optimize_state_source_filters.sql | 390 ------------------
 2 files changed, 159 insertions(+), 576 deletions(-)
 delete mode 100644 supabase/migrations/20260130_optimize_state_source_filters.sql

diff --git a/supabase/migrations/20260129_optimize_get_snippets_filters.sql b/supabase/migrations/20260129_optimize_get_snippets_filters.sql
index 845330c..32d1945 100644
--- a/supabase/migrations/20260129_optimize_get_snippets_filters.sql
+++ b/supabase/migrations/20260129_optimize_get_snippets_filters.sql
@@ -1,11 +1,15 @@
--- Optimize get_snippets function to fix timeout issues with starred/labeled/upvotedBy filters
--- The main issue is EXISTS subqueries being evaluated for every row (119k+ snippets)
--- Solution: Use JOINs with pre-filtered CTEs instead of EXISTS subqueries
+-- Optimized get_snippets function
+-- Key optimizations:
+-- 1. Uses JOINs with pre-filtered CTEs instead of EXISTS subqueries for starred/labeled/upvotedBy filters
+-- 2. Uses JOINs with pre-filtered CTEs for state/source filters (avoids IN subquery on audio_files)
+-- 3. Single query with CTE chain — filter CTEs defined once, count + data in one pass
 --
 -- Performance improvements:
 -- - starredBy filter: timeout (>30s) -> <1s
 -- - labeledBy filter: timeout (>30s) -> <1s
 -- - upvotedBy filter: 6.7s -> <1s
+-- - state filter: ~134ms -> <50ms
+-- - source filter: similar improvement
 -- - politicalSpectrum filter: uses existing index, no change needed
 
 CREATE OR REPLACE FUNCTION get_snippets (
@@ -34,6 +38,9 @@ DECLARE
     has_upvoted_filter BOOLEAN;
     filter_upvoted_by_me BOOLEAN;
     filter_upvoted_by_others BOOLEAN;
+    -- State/source filter flags
+    has_state_filter BOOLEAN;
+    has_source_filter BOOLEAN;
 BEGIN
     current_user_id := auth.uid();
     IF current_user_id IS NULL THEN
@@ -66,8 +73,16 @@ BEGIN
     filter_upvoted_by_me := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_me';
     filter_upvoted_by_others := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_others';
 
-    -- Get count using optimized query with JOINs instead of EXISTS
+    -- State/source filter flags
+    has_state_filter := p_filter IS NOT NULL
+        AND p_filter ? 'states'
+        AND jsonb_array_length(p_filter->'states') > 0;
+    has_source_filter := p_filter IS NOT NULL
+        AND p_filter ? 'sources'
+        AND jsonb_array_length(p_filter->'sources') > 0;
+
     WITH
+    -- Pre-filter CTEs (defined once, reused by filtered_snippets)
     starred_snippet_ids AS (
         SELECT DISTINCT uss.snippet
         FROM user_star_snippets uss
@@ -87,7 +102,6 @@ BEGIN
             (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
         )
     ),
-    -- Pre-filter upvoted snippet IDs (optimizes upvotedBy filter from 6.7s to <1s)
     upvoted_snippet_ids AS (
         SELECT DISTINCT sl.snippet
         FROM snippet_labels sl
@@ -97,171 +111,49 @@ BEGIN
             (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
             (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
         )
-    )
-    SELECT COUNT(*) INTO total_count
-    FROM snippets s
-    LEFT JOIN audio_files a ON s.audio_file = a.id
-    LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
-    -- Use JOIN for starred filter (starts from smaller set of ~200 rows instead of 119k)
-    LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
-    -- Use JOIN for labeled filter
-    LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
-    -- Use JOIN for upvoted filter
-    LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
-    WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
-    AND (user_is_admin OR uhs.snippet IS NULL)
-    -- Starred filter: use JOIN result instead of EXISTS (key optimization)
-    AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
-    -- Labeled filter: use JOIN result instead of EXISTS
-    AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
-    -- Upvoted filter: use JOIN result instead of EXISTS
-    AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'languages' OR
-        jsonb_array_length(p_filter->'languages') = 0 OR
-        s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'states' OR
-        jsonb_array_length(p_filter->'states') = 0 OR
-        a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'sources' OR
-        jsonb_array_length(p_filter->'sources') = 0 OR
-        a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'politicalSpectrum' OR
-        (
-            CASE
-                WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
-                WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
-                WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
-                WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
-                WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
-                ELSE TRUE
-            END
-        )
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'labels' OR
-        jsonb_array_length(p_filter->'labels') = 0 OR
-        EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
-    )
-    AND (
-        trimmed_search_term = '' OR (
-            (s.title ->> 'english') &@ trimmed_search_term
-            OR (s.title ->> 'spanish') &@ trimmed_search_term
-            OR (s.explanation ->> 'english') &@ trimmed_search_term
-            OR (s.explanation ->> 'spanish') &@ trimmed_search_term
-            OR (s.summary ->> 'english') &@ trimmed_search_term
-            OR (s.summary ->> 'spanish') &@ trimmed_search_term
-            OR s.transcription &@ trimmed_search_term
-            OR s.translation &@ trimmed_search_term
-        )
-    );
-
-    -- Now get the actual data with pagination using the same optimization
-    WITH
-    starred_snippet_ids AS (
-        SELECT DISTINCT uss.snippet
-        FROM user_star_snippets uss
-        WHERE has_starred_filter AND (
-            (starred_by_me AND starred_by_others) OR
-            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
-            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
-        )
     ),
-    labeled_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_labeled_filter AND (
-            (labeled_by_me AND labeled_by_others) OR
-            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
-            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
-        )
+    state_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_state_filter
+        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
     ),
-    -- Pre-filter upvoted snippet IDs
-    upvoted_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_upvoted_filter AND (
-            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
-            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
-            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
-        )
+    source_filtered_audio_ids AS (
+        SELECT id FROM audio_files
+        WHERE has_source_filter
+        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
     ),
+    -- Lightweight filtered IDs (for count + pagination, no heavy columns)
     filtered_snippets AS (
         SELECT
             s.id,
             s.recorded_at,
             s.user_last_activity,
-            s.duration,
-            s.start_time,
-            s.end_time,
-            s.file_path,
-            s.file_size,
-            s.political_leaning,
-            CASE WHEN p_language = 'spanish' THEN s.title ->> 'spanish' ELSE s.title ->> 'english' END AS title,
-            CASE WHEN p_language = 'spanish' THEN s.summary ->> 'spanish' ELSE s.summary ->> 'english' END AS summary,
-            CASE WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish' ELSE s.explanation ->> 'english' END AS explanation,
-            s.confidence_scores,
-            s.language,
-            s.context,
             s.upvote_count,
             s.comment_count,
-            s.like_count,
-            jsonb_build_object(
-                'id', a.id,
-                'radio_station_name', a.radio_station_name,
-                'radio_station_code', a.radio_station_code,
-                'location_state', a.location_state,
-                'location_city', a.location_city
-            ) AS audio_file,
-            us.id IS NOT NULL AS starred_by_user,
-            ul.value AS user_like_status,
-            uhs.snippet IS NOT NULL AS hidden
+            COALESCE(s.like_count, 0) AS like_count
         FROM snippets s
-        LEFT JOIN audio_files a ON s.audio_file = a.id
-        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
-        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
         LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
-        -- Use JOIN for starred filter (starts from smaller set)
         LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
-        -- Use JOIN for labeled filter
         LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
-        -- Use JOIN for upvoted filter
         LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
+        LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
+        LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
         WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
         AND (user_is_admin OR uhs.snippet IS NULL)
-        -- Starred filter: use JOIN result instead of EXISTS
         AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
-        -- Labeled filter: use JOIN result instead of EXISTS
         AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
-        -- Upvoted filter: use JOIN result instead of EXISTS
         AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
+        AND (NOT has_state_filter OR sfa.id IS NOT NULL)
+        AND (NOT has_source_filter OR srfa.id IS NOT NULL)
         AND (
-            p_filter IS NULL OR NOT p_filter ? 'languages' OR jsonb_array_length(p_filter->'languages') = 0 OR
+            p_filter IS NULL OR
+            NOT p_filter ? 'languages' OR
+            jsonb_array_length(p_filter->'languages') = 0 OR
             s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
         )
         AND (
-            p_filter IS NULL OR NOT p_filter ? 'states' OR jsonb_array_length(p_filter->'states') = 0 OR
-            a.location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
-        )
-        AND (
-            p_filter IS NULL OR NOT p_filter ? 'sources' OR jsonb_array_length(p_filter->'sources') = 0 OR
-            a.radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
-        )
-        AND (
-            p_filter IS NULL OR NOT p_filter ? 'politicalSpectrum' OR
+            p_filter IS NULL OR
+            NOT p_filter ? 'politicalSpectrum' OR
             (
                 CASE
                     WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
@@ -274,8 +166,17 @@ BEGIN
             )
         )
         AND (
-            p_filter IS NULL OR NOT p_filter ? 'labels' OR jsonb_array_length(p_filter->'labels') = 0 OR
-            EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
+            p_filter IS NULL OR
+            NOT p_filter ? 'labels' OR
+            jsonb_array_length(p_filter->'labels') = 0 OR
+            EXISTS (
+                SELECT 1
+                FROM snippet_labels sl
+                WHERE sl.snippet = s.id
+                AND sl.label IN (
+                    SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID
+                )
+            )
         )
         AND (
             trimmed_search_term = '' OR (
@@ -289,14 +190,21 @@ BEGIN
                 OR s.translation &@ trimmed_search_term
             )
         )
+    ),
+    total_count_cte AS (
+        SELECT COUNT(*) AS cnt FROM filtered_snippets
+    ),
+    paginated_ids AS (
+        SELECT id
+        FROM filtered_snippets fs
         ORDER BY
             CASE
-                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
-                WHEN p_order_by = 'comments' THEN s.comment_count
+                WHEN p_order_by = 'upvotes' THEN fs.upvote_count + fs.like_count
+                WHEN p_order_by = 'comments' THEN fs.comment_count
                 WHEN p_order_by = 'activities' THEN
-                    CASE WHEN s.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM s.user_last_activity) END
+                    CASE WHEN fs.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM fs.user_last_activity) END
             END DESC,
-            s.recorded_at DESC
+            fs.recorded_at DESC
         LIMIT page_size
         OFFSET page * page_size
     ),
@@ -305,51 +213,116 @@ BEGIN
             l.id,
             CASE WHEN p_language = 'spanish' THEN l.text_spanish ELSE l.text END AS text,
             sl.upvote_count,
-            lu.id IS NOT NULL AS filter_upvoted_by_me,
+            lu.id IS NOT NULL AS upvoted_by_me,
             sl.snippet AS snippet_id
         FROM snippet_labels sl
         JOIN labels l ON l.id = sl.label
         LEFT JOIN label_upvotes lu ON lu.snippet_label = sl.id AND lu.upvoted_by = current_user_id
-        WHERE sl.snippet IN (SELECT id FROM filtered_snippets)
+        WHERE sl.snippet IN (SELECT id FROM paginated_ids)
     ),
-    snippets_with_labels AS (
+    paginated_snippets AS (
         SELECT
-            fs.*,
+            s.id,
+            s.recorded_at,
+            s.user_last_activity,
+            s.duration,
+            s.start_time,
+            s.end_time,
+            s.file_path,
+            s.file_size,
+            s.political_leaning,
+            CASE
+                WHEN p_language = 'spanish' THEN s.title ->> 'spanish'
+                ELSE s.title ->> 'english'
+            END AS title,
+            CASE
+                WHEN p_language = 'spanish' THEN s.summary ->> 'spanish'
+                ELSE s.summary ->> 'english'
+            END AS summary,
+            CASE
+                WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish'
+                ELSE s.explanation ->> 'english'
+            END AS explanation,
+            s.confidence_scores,
+            s.language,
+            s.context,
+            s.upvote_count,
+            s.comment_count,
+            jsonb_build_object(
+                'id', a.id,
+                'radio_station_name', a.radio_station_name,
+                'radio_station_code', a.radio_station_code,
+                'location_state', a.location_state,
+                'location_city', a.location_city
+            ) AS audio_file,
+            us.id IS NOT NULL AS starred_by_user,
+            ul.value AS user_like_status,
+            uhs.snippet IS NOT NULL AS hidden,
+            COALESCE(s.like_count, 0) AS like_count,
+            COALESCE(s.dislike_count, 0) AS dislike_count,
             COALESCE(ld.labels, '[]'::jsonb) AS labels
-        FROM filtered_snippets fs
+        FROM paginated_ids p
+        JOIN snippets s ON s.id = p.id
+        LEFT JOIN audio_files a ON s.audio_file = a.id
+        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
+        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
+        LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
         LEFT JOIN (
-            SELECT snippet_id, jsonb_agg(jsonb_build_object('id', id, 'text', text, 'upvote_count', upvote_count, 'filter_upvoted_by_me', filter_upvoted_by_me)) as labels
+            SELECT
+                snippet_id,
+                jsonb_agg(
+                    jsonb_build_object(
+                        'id', id,
+                        'text', text,
+                        'upvote_count', upvote_count,
+                        'upvoted_by_me', upvoted_by_me
+                    )
+                ) as labels
             FROM label_summary
             GROUP BY snippet_id
-        ) ld ON fs.id = ld.snippet_id
+        ) ld ON p.id = ld.snippet_id
+        ORDER BY
+            CASE
+                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
+                WHEN p_order_by = 'comments' THEN s.comment_count
+                WHEN p_order_by = 'activities' THEN
+                    CASE
+                        WHEN s.user_last_activity IS NULL THEN 0
+                        ELSE EXTRACT(EPOCH FROM s.user_last_activity)
+                    END
+            END DESC,
+            s.recorded_at DESC
     )
-    SELECT jsonb_agg(
-        jsonb_build_object(
-            'id', s.id,
-            'recorded_at', s.recorded_at,
-            'user_last_activity', s.user_last_activity,
-            'duration', s.duration,
-            'start_time', s.start_time,
-            'end_time', s.end_time,
-            'file_path', s.file_path,
-            'file_size', s.file_size,
-            'political_leaning', s.political_leaning,
-            'title', s.title,
-            'summary', s.summary,
-            'explanation', s.explanation,
-            'confidence_scores', s.confidence_scores,
-            'language', s.language,
-            'context', s.context,
-            'labels', s.labels,
-            'audio_file', s.audio_file,
-            'starred_by_user', s.starred_by_user,
-            'user_like_status', s.user_like_status,
-            'hidden', s.hidden,
-            'like_count', COALESCE(s.like_count, 0),
-            'dislike_count', 0
-        )
-    ) INTO result
-    FROM snippets_with_labels s;
+    SELECT
+        jsonb_agg(
+            jsonb_build_object(
+                'id', ps.id,
+                'recorded_at', ps.recorded_at,
+                'user_last_activity', ps.user_last_activity,
+                'duration', ps.duration,
+                'start_time', ps.start_time,
+                'end_time', ps.end_time,
+                'file_path', ps.file_path,
+                'file_size', ps.file_size,
+                'political_leaning', ps.political_leaning,
+                'title', ps.title,
+                'summary', ps.summary,
+                'explanation', ps.explanation,
+                'confidence_scores', ps.confidence_scores,
+                'language', ps.language,
+                'context', ps.context,
+                'labels', ps.labels,
+                'audio_file', ps.audio_file,
+                'starred_by_user', ps.starred_by_user,
+                'user_like_status', ps.user_like_status,
+                'hidden', ps.hidden,
+                'like_count', ps.like_count,
+                'dislike_count', ps.dislike_count
+            )
+        ),
+        (SELECT cnt FROM total_count_cte)
+    INTO result, total_count
+    FROM paginated_snippets ps;
 
     total_pages := CEIL(total_count::FLOAT / page_size);
 
diff --git a/supabase/migrations/20260130_optimize_state_source_filters.sql b/supabase/migrations/20260130_optimize_state_source_filters.sql
deleted file mode 100644
index ea9fe16..0000000
--- a/supabase/migrations/20260130_optimize_state_source_filters.sql
+++ /dev/null
@@ -1,390 +0,0 @@
--- Optimize state and source filters in get_snippets
--- Problem: State filter scans all 19k+ snippets first, then filters by audio_files.location_state
--- Solution: Use same CTE+JOIN pattern as starred/labeled/upvoted filters
--- Expected improvement: ~134ms -> <50ms for state filter queries
-
-DROP FUNCTION IF EXISTS get_snippets;
-
-CREATE OR REPLACE FUNCTION get_snippets (
-    p_language text,
-    p_filter jsonb,
-    page INTEGER,
-    page_size INTEGER,
-    p_order_by text,
-    p_search_term text DEFAULT ''
-) RETURNS jsonb SECURITY DEFINER AS $$
-DECLARE
-    current_user_id UUID;
-    result jsonb;
-    total_count INTEGER;
-    total_pages INTEGER;
-    user_roles TEXT[];
-    user_is_admin BOOLEAN;
-    trimmed_search_term TEXT := TRIM(p_search_term);
-    -- Filter detection flags for optimization
-    has_starred_filter BOOLEAN;
-    starred_by_me BOOLEAN;
-    starred_by_others BOOLEAN;
-    has_labeled_filter BOOLEAN;
-    labeled_by_me BOOLEAN;
-    labeled_by_others BOOLEAN;
-    has_upvoted_filter BOOLEAN;
-    filter_upvoted_by_me BOOLEAN;
-    filter_upvoted_by_others BOOLEAN;
-    -- State/source filter flags (new)
-    has_state_filter BOOLEAN;
-    has_source_filter BOOLEAN;
-BEGIN
-    current_user_id := auth.uid();
-    IF current_user_id IS NULL THEN
-        RAISE EXCEPTION 'Only logged-in users can call this function';
-    END IF;
-
-    SELECT array_agg(r.name) INTO user_roles
-    FROM public.user_roles ur
-    JOIN public.roles r ON ur.role = r.id
-    WHERE ur."user" = current_user_id;
-
-    user_is_admin := COALESCE('admin' = ANY(user_roles), FALSE);
-
-    -- Pre-compute filter flags to enable query optimization
-    has_starred_filter := p_filter IS NOT NULL
-        AND p_filter ? 'starredBy'
-        AND jsonb_array_length(p_filter->'starredBy') > 0;
-    starred_by_me := has_starred_filter AND p_filter->'starredBy' ? 'by_me';
-    starred_by_others := has_starred_filter AND p_filter->'starredBy' ? 'by_others';
-
-    has_labeled_filter := p_filter IS NOT NULL
-        AND p_filter ? 'labeledBy'
-        AND jsonb_array_length(p_filter->'labeledBy') > 0;
-    labeled_by_me := has_labeled_filter AND p_filter->'labeledBy' ? 'by_me';
-    labeled_by_others := has_labeled_filter AND p_filter->'labeledBy' ? 'by_others';
-
-    has_upvoted_filter := p_filter IS NOT NULL
-        AND p_filter ? 'upvotedBy'
-        AND jsonb_array_length(p_filter->'upvotedBy') > 0;
-    filter_upvoted_by_me := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_me';
-    filter_upvoted_by_others := has_upvoted_filter AND p_filter->'upvotedBy' ? 'by_others';
-
-    -- State/source filter flags (new optimization)
-    has_state_filter := p_filter IS NOT NULL
-        AND p_filter ? 'states'
-        AND jsonb_array_length(p_filter->'states') > 0;
-    has_source_filter := p_filter IS NOT NULL
-        AND p_filter ? 'sources'
-        AND jsonb_array_length(p_filter->'sources') > 0;
-
-    -- Get count using optimized query with JOINs instead of EXISTS/IN
-    WITH
-    starred_snippet_ids AS (
-        SELECT DISTINCT uss.snippet
-        FROM user_star_snippets uss
-        WHERE has_starred_filter AND (
-            (starred_by_me AND starred_by_others) OR
-            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
-            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
-        )
-    ),
-    labeled_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_labeled_filter AND (
-            (labeled_by_me AND labeled_by_others) OR
-            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
-            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
-        )
-    ),
-    upvoted_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_upvoted_filter AND (
-            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
-            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
-            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
-        )
-    ),
-    -- Pre-filter audio file IDs by state (uses idx_audio_files_location_state)
-    state_filtered_audio_ids AS (
-        SELECT id FROM audio_files
-        WHERE has_state_filter
-        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
-    ),
-    -- Pre-filter audio file IDs by source/radio station
-    source_filtered_audio_ids AS (
-        SELECT id FROM audio_files
-        WHERE has_source_filter
-        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
-    )
-    SELECT COUNT(*) INTO total_count
-    FROM snippets s
-    LEFT JOIN audio_files a ON s.audio_file = a.id
-    LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
-    -- Use JOIN for starred filter (starts from smaller set of ~200 rows instead of 119k)
-    LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
-    -- Use JOIN for labeled filter
-    LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
-    -- Use JOIN for upvoted filter
-    LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
-    -- Use JOIN for state filter (new optimization)
-    LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
-    -- Use JOIN for source filter (new optimization)
-    LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
-    WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
-    AND (user_is_admin OR uhs.snippet IS NULL)
-    -- Starred filter: use JOIN result instead of EXISTS (key optimization)
-    AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
-    -- Labeled filter: use JOIN result instead of EXISTS
-    AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
-    -- Upvoted filter: use JOIN result instead of EXISTS
-    AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
-    -- State filter: use JOIN result instead of IN subquery (new optimization)
-    AND (NOT has_state_filter OR sfa.id IS NOT NULL)
-    -- Source filter: use JOIN result instead of IN subquery (new optimization)
-    AND (NOT has_source_filter OR srfa.id IS NOT NULL)
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'languages' OR
-        jsonb_array_length(p_filter->'languages') = 0 OR
-        s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'politicalSpectrum' OR
-        (
-            CASE
-                WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
-                WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
-                WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
-                WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
-                WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
-                ELSE TRUE
-            END
-        )
-    )
-    AND (
-        p_filter IS NULL OR
-        NOT p_filter ? 'labels' OR
-        jsonb_array_length(p_filter->'labels') = 0 OR
-        EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
-    )
-    AND (
-        trimmed_search_term = '' OR (
-            (s.title ->> 'english') &@ trimmed_search_term
-            OR (s.title ->> 'spanish') &@ trimmed_search_term
-            OR (s.explanation ->> 'english') &@ trimmed_search_term
-            OR (s.explanation ->> 'spanish') &@ trimmed_search_term
-            OR (s.summary ->> 'english') &@ trimmed_search_term
-            OR (s.summary ->> 'spanish') &@ trimmed_search_term
-            OR s.transcription &@ trimmed_search_term
-            OR s.translation &@ trimmed_search_term
-        )
-    );
-
-    -- Now get the actual data with pagination using the same optimization
-    WITH
-    starred_snippet_ids AS (
-        SELECT DISTINCT uss.snippet
-        FROM user_star_snippets uss
-        WHERE has_starred_filter AND (
-            (starred_by_me AND starred_by_others) OR
-            (starred_by_me AND NOT starred_by_others AND uss."user" = current_user_id) OR
-            (starred_by_others AND NOT starred_by_me AND uss."user" != current_user_id)
-        )
-    ),
-    labeled_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_labeled_filter AND (
-            (labeled_by_me AND labeled_by_others) OR
-            (labeled_by_me AND NOT labeled_by_others AND lu.upvoted_by = current_user_id) OR
-            (labeled_by_others AND NOT labeled_by_me AND lu.upvoted_by != current_user_id)
-        )
-    ),
-    upvoted_snippet_ids AS (
-        SELECT DISTINCT sl.snippet
-        FROM snippet_labels sl
-        JOIN label_upvotes lu ON lu.snippet_label = sl.id
-        WHERE has_upvoted_filter AND (
-            (filter_upvoted_by_me AND filter_upvoted_by_others) OR
-            (filter_upvoted_by_me AND NOT filter_upvoted_by_others AND lu.upvoted_by = current_user_id) OR
-            (filter_upvoted_by_others AND NOT filter_upvoted_by_me AND lu.upvoted_by != current_user_id)
-        )
-    ),
-    -- Pre-filter audio file IDs by state
-    state_filtered_audio_ids AS (
-        SELECT id FROM audio_files
-        WHERE has_state_filter
-        AND location_state IN (SELECT jsonb_array_elements_text(p_filter->'states'))
-    ),
-    -- Pre-filter audio file IDs by source
-    source_filtered_audio_ids AS (
-        SELECT id FROM audio_files
-        WHERE has_source_filter
-        AND radio_station_code IN (SELECT jsonb_array_elements_text(p_filter->'sources'))
-    ),
-    filtered_snippets AS (
-        SELECT
-            s.id,
-            s.recorded_at,
-            s.user_last_activity,
-            s.duration,
-            s.start_time,
-            s.end_time,
-            s.file_path,
-            s.file_size,
-            s.political_leaning,
-            CASE WHEN p_language = 'spanish' THEN s.title ->> 'spanish' ELSE s.title ->> 'english' END AS title,
-            CASE WHEN p_language = 'spanish' THEN s.summary ->> 'spanish' ELSE s.summary ->> 'english' END AS summary,
-            CASE WHEN p_language = 'spanish' THEN s.explanation ->> 'spanish' ELSE s.explanation ->> 'english' END AS explanation,
-            s.confidence_scores,
-            s.language,
-            s.context,
-            s.upvote_count,
-            s.comment_count,
-            s.like_count,
-            jsonb_build_object(
-                'id', a.id,
-                'radio_station_name', a.radio_station_name,
-                'radio_station_code', a.radio_station_code,
-                'location_state', a.location_state,
-                'location_city', a.location_city
-            ) AS audio_file,
-            us.id IS NOT NULL AS starred_by_user,
-            ul.value AS user_like_status,
-            uhs.snippet IS NOT NULL AS hidden
-        FROM snippets s
-        LEFT JOIN audio_files a ON s.audio_file = a.id
-        LEFT JOIN user_star_snippets us ON us.snippet = s.id AND us."user" = current_user_id
-        LEFT JOIN user_like_snippets ul ON ul.snippet = s.id AND ul."user" = current_user_id
-        LEFT JOIN user_hide_snippets uhs ON uhs.snippet = s.id
-        -- Use JOIN for starred filter (starts from smaller set)
-        LEFT JOIN starred_snippet_ids ssi ON ssi.snippet = s.id
-        -- Use JOIN for labeled filter
-        LEFT JOIN labeled_snippet_ids lsi ON lsi.snippet = s.id
-        -- Use JOIN for upvoted filter
-        LEFT JOIN upvoted_snippet_ids usi ON usi.snippet = s.id
-        -- Use JOIN for state filter
-        LEFT JOIN state_filtered_audio_ids sfa ON sfa.id = s.audio_file
-        -- Use JOIN for source filter
-        LEFT JOIN source_filtered_audio_ids srfa ON srfa.id = s.audio_file
-        WHERE s.status = 'Processed' AND (s.confidence_scores->>'overall')::INTEGER >= 95
-        AND (user_is_admin OR uhs.snippet IS NULL)
-        -- Starred filter: use JOIN result instead of EXISTS
-        AND (NOT has_starred_filter OR ssi.snippet IS NOT NULL)
-        -- Labeled filter: use JOIN result instead of EXISTS
-        AND (NOT has_labeled_filter OR lsi.snippet IS NOT NULL)
-        -- Upvoted filter: use JOIN result instead of EXISTS
-        AND (NOT has_upvoted_filter OR usi.snippet IS NOT NULL)
-        -- State filter: use JOIN result
-        AND (NOT has_state_filter OR sfa.id IS NOT NULL)
-        -- Source filter: use JOIN result
-        AND (NOT has_source_filter OR srfa.id IS NOT NULL)
-        AND (
-            p_filter IS NULL OR NOT p_filter ? 'languages' OR jsonb_array_length(p_filter->'languages') = 0 OR
-            s.language ->> 'primary_language' IN (SELECT jsonb_array_elements_text(p_filter->'languages'))
-        )
-        AND (
-            p_filter IS NULL OR NOT p_filter ? 'politicalSpectrum' OR
-            (
-                CASE
-                    WHEN p_filter->>'politicalSpectrum' = 'left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -1.0 AND -0.7
-                    WHEN p_filter->>'politicalSpectrum' = 'center-left' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.7 AND -0.3
-                    WHEN p_filter->>'politicalSpectrum' = 'center' THEN (s.political_leaning->>'score')::FLOAT BETWEEN -0.3 AND 0.3
-                    WHEN p_filter->>'politicalSpectrum' = 'center-right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.3 AND 0.7
-                    WHEN p_filter->>'politicalSpectrum' = 'right' THEN (s.political_leaning->>'score')::FLOAT BETWEEN 0.7 AND 1.0
-                    ELSE TRUE
-                END
-            )
-        )
-        AND (
-            p_filter IS NULL OR NOT p_filter ? 'labels' OR jsonb_array_length(p_filter->'labels') = 0 OR
-            EXISTS (SELECT 1 FROM snippet_labels sl WHERE sl.snippet = s.id AND sl.label IN (SELECT (jsonb_array_elements_text(p_filter->'labels'))::UUID))
-        )
-        AND (
-            trimmed_search_term = '' OR (
-                (s.title ->> 'english') &@ trimmed_search_term
-                OR (s.title ->> 'spanish') &@ trimmed_search_term
-                OR (s.explanation ->> 'english') &@ trimmed_search_term
-                OR (s.explanation ->> 'spanish') &@ trimmed_search_term
-                OR (s.summary ->> 'english') &@ trimmed_search_term
-                OR (s.summary ->> 'spanish') &@ trimmed_search_term
-                OR s.transcription &@ trimmed_search_term
-                OR s.translation &@ trimmed_search_term
-            )
-        )
-        ORDER BY
-            CASE
-                WHEN p_order_by = 'upvotes' THEN s.upvote_count + COALESCE(s.like_count, 0)
-                WHEN p_order_by = 'comments' THEN s.comment_count
-                WHEN p_order_by = 'activities' THEN
-                    CASE WHEN s.user_last_activity IS NULL THEN 0 ELSE EXTRACT(EPOCH FROM s.user_last_activity) END
-            END DESC,
-            s.recorded_at DESC
-        LIMIT page_size
-        OFFSET page * page_size
-    ),
-    label_summary AS (
-        SELECT
-            l.id,
-            CASE WHEN p_language = 'spanish' THEN l.text_spanish ELSE l.text END AS text,
-            sl.upvote_count,
-            lu.id IS NOT NULL AS upvoted_by_me,
-            sl.snippet AS snippet_id
-        FROM snippet_labels sl
-        JOIN labels l ON l.id = sl.label
-        LEFT JOIN label_upvotes lu ON lu.snippet_label = sl.id AND lu.upvoted_by = current_user_id
-        WHERE sl.snippet IN (SELECT id FROM filtered_snippets)
-    ),
-    snippets_with_labels AS (
-        SELECT
-            fs.*,
-            COALESCE(ld.labels, '[]'::jsonb) AS labels
-        FROM filtered_snippets fs
-        LEFT JOIN (
-            SELECT snippet_id, jsonb_agg(jsonb_build_object('id', id, 'text', text, 'upvote_count', upvote_count, 'upvoted_by_me', upvoted_by_me)) as labels
-            FROM label_summary
-            GROUP BY snippet_id
-        ) ld ON fs.id = ld.snippet_id
-    )
-    SELECT jsonb_agg(
-        jsonb_build_object(
-            'id', s.id,
-            'recorded_at', s.recorded_at,
-            'user_last_activity', s.user_last_activity,
-            'duration', s.duration,
-            'start_time', s.start_time,
-            'end_time', s.end_time,
-            'file_path', s.file_path,
-            'file_size', s.file_size,
-            'political_leaning', s.political_leaning,
-            'title', s.title,
-            'summary', s.summary,
-            'explanation', s.explanation,
-            'confidence_scores', s.confidence_scores,
-            'language', s.language,
-            'context', s.context,
-            'labels', s.labels,
-            'audio_file', s.audio_file,
-            'starred_by_user', s.starred_by_user,
-            'user_like_status', s.user_like_status,
-            'hidden', s.hidden,
-            'like_count', COALESCE(s.like_count, 0),
-            'dislike_count', 0
-        )
-    ) INTO result
-    FROM snippets_with_labels s;
-
-    total_pages := CEIL(total_count::FLOAT / page_size);
-
-    RETURN jsonb_build_object(
-        'num_of_snippets', total_count,
-        'snippets', COALESCE(result, '[]'::jsonb),
-        'current_page', page,
-        'page_size', page_size,
-        'total_pages', total_pages
-    );
-END;
-$$ LANGUAGE plpgsql;