about summary refs log tree commit diff
path: root/backend/hist_data/enwiki/gen_img_data.py
diff options
context:
space:
mode:
Diffstat (limited to 'backend/hist_data/enwiki/gen_img_data.py')
-rwxr-xr-x backend/hist_data/enwiki/gen_img_data.py 9
1 files changed, 5 insertions, 4 deletions
diff --git a/backend/hist_data/enwiki/gen_img_data.py b/backend/hist_data/enwiki/gen_img_data.py
index 05df63d..044e5a0 100755
--- a/backend/hist_data/enwiki/gen_img_data.py
+++ b/backend/hist_data/enwiki/gen_img_data.py
@@ -16,10 +16,11 @@ import html
import urllib.parse
import sqlite3
-DUMP_FILE = 'enwiki-20220501-pages-articles-multistream.xml.bz2'
-INDEX_DB = 'dump_index.db'
-IMG_DB = 'img_data.db' # The database to create
-DB_FILE = os.path.join('..', 'data.db')
+ENWIKI_DIR = os.path.dirname(os.path.realpath(__file__))
+DUMP_FILE = os.path.join(ENWIKI_DIR, 'enwiki-20220501-pages-articles-multistream.xml.bz2')
+INDEX_DB = os.path.join(ENWIKI_DIR, 'dump_index.db')
+IMG_DB = os.path.join(ENWIKI_DIR, 'img_data.db') # The database to create
+DB_FILE = os.path.join(ENWIKI_DIR, '..', 'data.db')
ID_LINE_REGEX = re.compile(r'<id>(.*)</id>')
IMG_LINE_REGEX = re.compile(r'.*\| *image *= *([^|]*)')