From 29940d51eb8b6b220d53940ecbc212cea78159ae Mon Sep 17 00:00:00 2001 From: Terry Truong Date: Tue, 17 May 2022 10:41:12 +1000 Subject: Improve enwiki description extraction Adjust enwiki code to handle single dump file, and add scripts for 'convenient' page-content lookup. --- .gitignore | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) (limited to '.gitignore') diff --git a/.gitignore b/.gitignore index 908fc4f..7fa730c 100644 --- a/.gitignore +++ b/.gitignore @@ -14,7 +14,7 @@ /backend/data/imgsForReview/ /backend/data/imgsReviewed/ /backend/data/img/ -/backend/data/enwiki/*.gz +/backend/data/enwiki/*.bz2 /backend/data/enwiki/*.db /backend/data/enwiki/enwiki_content/ /backend/data/enwiki/.venv/ -- cgit v1.2.3