From 86cff37533ed2bfb176a6b10ae9c5b936c7d14f3 Mon Sep 17 00:00:00 2001
From: Joe Lothan
Date: Wed, 20 May 2026 09:35:06 -0400
Subject: [PATCH] download cc-index to home not tmp (which is tmpfs)

---
 pipeline/01_cc_index/query.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pipeline/01_cc_index/query.sh b/pipeline/01_cc_index/query.sh
index c485b48..931d20f 100755
--- a/pipeline/01_cc_index/query.sh
+++ b/pipeline/01_cc_index/query.sh
@@ -65,7 +65,7 @@ if [ "$LIMIT" -gt 0 ] 2>/dev/null; then
 fi
 
 S3_PATH="s3://commoncrawl/cc-index/table/cc-main/warc/crawl=${CRAWL}/subset=warc/"
-LOCAL_INDEX="/tmp/cc-index"
+LOCAL_INDEX="$HOME/cc-index"
 
 QUERY="
 INSTALL postgres;