aboutsummaryrefslogtreecommitdiff
path: root/backend/data
diff options
context:
space:
mode:
authorTerry Truong <terry06890@gmail.com>2022-05-10 19:07:02 +1000
committerTerry Truong <terry06890@gmail.com>2022-05-10 19:13:06 +1000
commit9b4fd83e8f88858a7a8d440b129397561fb1fcac (patch)
tree9a8a7ecc73b9bfda9e7221d502a0d1d87c078ad4 /backend/data
parent3d895370a608d4f51726b74e2560dcf5f4ec43a8 (diff)
Split nodes table into nodes and edgessplit-nodes-table
This noticeably slowed server responses. Responses to a client's initial node query slowed from 20-30ms to 200-300ms.
Diffstat (limited to 'backend/data')
-rw-r--r--backend/data/README.md8
-rwxr-xr-xbackend/data/genOtolData.py15
2 files changed, 14 insertions, 9 deletions
diff --git a/backend/data/README.md b/backend/data/README.md
index 9f0ea82..b3fd53b 100644
--- a/backend/data/README.md
+++ b/backend/data/README.md
@@ -3,8 +3,8 @@ File Generation Process
1 Tree Structure Data
1 Obtain data in otol/, as specified in it's README.
- 2 Run genOtolData.py, which creates data.db, and adds a 'nodes'
- table using data in otol/*.
+ 2 Run genOtolData.py, which creates data.db, and adds
+ 'nodes' and 'edges' tables using data in otol/*.
2 Name Data for Search
1 Obtain data in eol/, as specified in it's README.
2 Run genEolNameData.py, which adds 'names' and 'eol\_ids' tables to data.db,
@@ -26,7 +26,9 @@ File Generation Process
data.db tables
==============
- nodes <br>
- name TEXT PRIMARY KEY, children TEXT, parent TEXT, tips INT, p\_support INT
+ name TEXT PRIMARY KEY, tips INT
+- edges <br>
+ node TEXT, child TEXT, p\_support INT, PRIMARY KEY (node, child)
- names <br>
name TEXT, alt\_name TEXT, pref\_alt INT, PRIMARY KEY(name, alt\_name)
- eol\_ids <br>
diff --git a/backend/data/genOtolData.py b/backend/data/genOtolData.py
index 7dfac54..236c537 100755
--- a/backend/data/genOtolData.py
+++ b/backend/data/genOtolData.py
@@ -210,14 +210,17 @@ for [id, node] in nodeMap.items():
if node["parent"] == None:
node["pSupport"] = True
# Create db
-print("Creating nodes table")
+print("Creating nodes and edges tables")
dbCon = sqlite3.connect(dbFile)
dbCur = dbCon.cursor()
-dbCur.execute("CREATE TABLE nodes (name TEXT PRIMARY KEY, children TEXT, parent TEXT, tips INT, p_support INT)")
+dbCur.execute("CREATE TABLE nodes (name TEXT PRIMARY KEY, tips INT)")
+dbCur.execute("CREATE TABLE edges (node TEXT, child TEXT, p_support INT, PRIMARY KEY (node, child))")
for node in nodeMap.values():
- childNames = [nodeMap[id]["name"] for id in node["children"]]
- parentName = "" if node["parent"] == None else nodeMap[node["parent"]]["name"]
- dbCur.execute("INSERT INTO nodes VALUES (?, ?, ?, ?, ?)",
- (node["name"], json.dumps(childNames), parentName, node["tips"], 1 if node["pSupport"] else 0))
+ dbCur.execute("INSERT INTO nodes VALUES (?, ?)", (node["name"], node["tips"]))
+ childIds = node["children"]
+ for childId in childIds:
+ childNode = nodeMap[childId]
+ dbCur.execute("INSERT INTO edges VALUES (?, ?, ?)",
+ (node["name"], childNode["name"], 1 if childNode["pSupport"] else 0))
dbCon.commit()
dbCon.close()