aboutsummaryrefslogtreecommitdiff
path: root/backend/data/genEolNameData.py
diff options
context:
space:
mode:
author: Terry Truong <terry06890@gmail.com> 2022-05-19 22:01:33 +1000
committer: Terry Truong <terry06890@gmail.com> 2022-05-19 22:01:33 +1000
commit: 8ce802ef223ac082975da9d04f10e5dc78529410 (patch)
tree: 250565dbe6938586ee6fd3125ac03407068be0b4 /backend/data/genEolNameData.py
parent: 80057ee1ffe3dbceceb9ae98c4e84e56847a4899 (diff)
Unescape EOL alt-name data
Diffstat (limited to 'backend/data/genEolNameData.py')
-rwxr-xr-x backend/data/genEolNameData.py | 4
1 files changed, 2 insertions, 2 deletions
diff --git a/backend/data/genEolNameData.py b/backend/data/genEolNameData.py
index 0f9c4b5..fb91e8a 100755
--- a/backend/data/genEolNameData.py
+++ b/backend/data/genEolNameData.py
@@ -1,7 +1,7 @@
#!/usr/bin/python3
import sys, re
-import csv, sqlite3
+import html, csv, sqlite3
usageInfo = f"usage: {sys.argv[0]}\n"
usageInfo += "Reads vernacular-names CSV data (from the Encyclopedia of Life site),\n"
@@ -52,7 +52,7 @@ with open(vnamesFile, newline="") as csvfile:
# Parse line
pid = int(row[0])
name1 = re.sub(r"<[^>]+>", "", row[1].lower()) # Remove tags
- name2 = row[2].lower()
+ name2 = html.unescape(row[2]).lower()
lang = row[3]
preferred = row[6] == "preferred"
# Add to maps