about summary refs log tree commit diff
path: root/backend/data/genEnwikiDescData.py
diff options
context:
space:
mode:
author Terry Truong <terry06890@gmail.com> 2022-06-15 20:48:31 +1000
committer Terry Truong <terry06890@gmail.com> 2022-06-15 20:48:31 +1000
commit eabec97d80e5f43e4710dd4c8327d0bc8519ab8c (patch)
tree 0fd6d93f306b6dc7db2b9233ce63b65ebdc994bc /backend/data/genEnwikiDescData.py
parent 3402f3d6e906afb500b95448d7d0b136b6b5ee86 (diff)
Separate node-wiki_id association from 'descs' table
Diffstat (limited to 'backend/data/genEnwikiDescData.py')
-rwxr-xr-x backend/data/genEnwikiDescData.py 6
1 files changed, 3 insertions, 3 deletions
diff --git a/backend/data/genEnwikiDescData.py b/backend/data/genEnwikiDescData.py
index 4445c3f..debd3fd 100755
--- a/backend/data/genEnwikiDescData.py
+++ b/backend/data/genEnwikiDescData.py
@@ -40,7 +40,7 @@ print(f"Read in {len(nameToPickedTitle)} titles to use for certain names")
# Get node names without descriptions
print("Getting node names")
nodeNames = set()
-query = "SELECT nodes.name FROM nodes LEFT JOIN descs ON nodes.name = descs.name WHERE desc IS NULL"
+query = "SELECT nodes.name FROM nodes LEFT JOIN wiki_ids ON nodes.name = wiki_ids.name WHERE wiki_ids.id IS NULL"
for row in dbCur.execute(query):
nodeNames.add(row[0])
print(f"Found {len(nodeNames)} names")
@@ -90,8 +90,8 @@ for (name, pageId) in nodeToPageId.items():
#
row = enwikiCur.execute("SELECT desc FROM descs where descs.id = ?", (pageId,)).fetchone()
if row != None:
- dbCur.execute("INSERT INTO descs VALUES (?, ?, ?, ?, ?)",
- (name, row[0], 1 if name in redirectingNames else 0, pageId, 0))
+ dbCur.execute("INSERT INTO wiki_ids VALUES (?, ?, ?)", (name, pageId, 1 if name in redirectingNames else 0))
+ dbCur.execute("INSERT OR IGNORE INTO descs VALUES (?, ?, ?)", (pageId, row[0], 0))
# Close dbs
dbCon.commit()
dbCon.close()