From 21df140643c319206b5c41a4474ba9c0609b62e5 Mon Sep 17 00:00:00 2001
From: yuenmichelle1
Date: Wed, 18 Oct 2023 19:04:49 -0500
Subject: [PATCH] Update backfill scripts for classifications (#44)

* update classifications backfill script to chunk and save in file
* update to <= remove unused limit in query
* update copy into source
* split backfill to file creation then copy from files
* cast to int
* revert accidental adding commas on limit
* add keepalives to hopefully ensure connection does not get lost
* remove order by desc
* update to use the correct query
---
 scripts/save_classifications_chunk_in_files.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/scripts/save_classifications_chunk_in_files.py b/scripts/save_classifications_chunk_in_files.py
index 789351f..7758aa6 100644
--- a/scripts/save_classifications_chunk_in_files.py
+++ b/scripts/save_classifications_chunk_in_files.py
@@ -29,7 +29,7 @@
     with psycopg.connect(f"host={PANOPTES_CONN} port={PANOPTES_PORT} dbname={PANOPTES_DB} user={PANOPTES_USER} password={PANOPTES_PW} sslmode=require keepalives=1 keepalives_idle=30 keepalives_interval=10 keepalives_count=20") as panoptes_db_conn:
         with open(f"prod_classifications_{offset}.csv", "wb") as f:
-            with panoptes_db_conn.cursor(name="panoptes_cursor").copy(f"COPY ({classifications_query}) TO STDOUT WITH CSV HEADER", (FIRST_INGESTED_CLASSIFICATION_ID,)) as panoptes_copy:
+            with panoptes_db_conn.cursor(name="panoptes_cursor").copy(f"COPY ({query}) TO STDOUT WITH CSV HEADER", (FIRST_INGESTED_CLASSIFICATION_ID,)) as panoptes_copy:
                 for data in panoptes_copy:
                     f.write(data)
         offset += 1
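
Note: the one-line change above fixes the COPY statement's f-string to interpolate the `query` variable the script actually builds, rather than the stale `classifications_query` name ("update to use the correct query" in the commit list). For readers without the full script, the sketch below shows the same chunked COPY-to-CSV pattern in isolation. It is an illustration, not the repository's code: the connection values, CHUNK_SIZE, NUM_CHUNKS, and the SELECT text are assumed placeholders, and it uses a plain client-side cursor where the script passes a cursor name. The keepalives options, the parameterized copy() call (psycopg >= 3.1), and the byte-streaming loop mirror the patch.

    # Illustrative sketch only. Connection values, CHUNK_SIZE, NUM_CHUNKS,
    # and the SELECT text are assumptions; the keepalives settings and the
    # copy() streaming loop follow the patched script.
    import psycopg

    # Placeholder connection string; the real script reads these from config.
    # keepalives: probe an idle connection after 30 s of silence, every 10 s,
    # giving up after 20 missed probes, so a long export is not silently dropped.
    conninfo = (
        "host=localhost port=5432 dbname=panoptes user=panoptes "
        "password=secret sslmode=require "
        "keepalives=1 keepalives_idle=30 keepalives_interval=10 keepalives_count=20"
    )

    FIRST_INGESTED_CLASSIFICATION_ID = 1_000_000  # assumed boundary id
    CHUNK_SIZE = 500_000                          # assumed rows per CSV file
    NUM_CHUNKS = 3                                # assumed chunk count

    with psycopg.connect(conninfo) as conn:
        for offset in range(NUM_CHUNKS):
            # Only rows at or below the boundary id are exported; the %s
            # placeholder is filled by psycopg via the copy() params below.
            query = (
                "SELECT * FROM classifications WHERE id <= %s "
                f"LIMIT {CHUNK_SIZE} OFFSET {offset * CHUNK_SIZE}"
            )
            with open(f"prod_classifications_{offset}.csv", "wb") as f:
                # copy() streams CSV bytes straight from the server, so the
                # result set is never materialized in client memory.
                with conn.cursor().copy(
                    f"COPY ({query}) TO STDOUT WITH CSV HEADER",
                    (FIRST_INGESTED_CLASSIFICATION_ID,),
                ) as copy_out:
                    for data in copy_out:
                        f.write(data)

Writing one file per chunk, as the commit list describes ("split backfill to file creation then copy from files"), lets the later COPY-from-file step resume from the last completed chunk if the connection is lost mid-backfill.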