diff options
Diffstat (limited to 'backend/data')
| -rw-r--r-- | backend/data/README.md | 8 | ||||
| -rwxr-xr-x | backend/data/downloadEolImgs.py (renamed from backend/data/downloadImgsForReview.py) | 2 | ||||
| -rwxr-xr-x | backend/data/genImgsForWeb.py | 2 | ||||
| -rwxr-xr-x | backend/data/reviewEolImgs.py (renamed from backend/data/reviewImgs.py) | 4 |
4 files changed, 8 insertions, 8 deletions
diff --git a/backend/data/README.md b/backend/data/README.md index 8ee6e41..ece8efb 100644 --- a/backend/data/README.md +++ b/backend/data/README.md @@ -10,12 +10,12 @@ File Generation Process 2 Run genEolNameData.py, which adds 'names' and 'eol\_ids' tables to data.db, using data in eol/vernacularNames.csv and the 'nodes' table. 3 Image Data - 1 Run downloadImgsForReview.py to download EOL images into imgsForReview/. + 1 Run downloadEolImgs.py to download EOL images into eolImgsForReview/. It uses data in eol/imagesList.db, and the 'eol\_ids' table. - 2 Run reviewImgs.py to filter images in imgsForReview/ into EOL-id-unique - images in imgsReviewed/ (uses 'names' and 'eol\_ids' to display extra info). + 2 Run reviewEolImgs.py to filter images in eolImgsForReview/ into EOL-id-unique + images in eolImgsReviewed/ (uses 'names' and 'eol\_ids' to display extra info). 3 Run genImgsForWeb.py to create cropped/resized images in img/, using - images in imgsReviewed, and also to add an 'images' table to data.db. + images in eolImgsReviewed/, and also to add an 'images' table to data.db. 4 Run genLinkedImgs.py to add a 'linked_imgs' table to data.db, which uses 'nodes', 'edges', 'eol_ids', and 'images', to associate nodes without images to child images. diff --git a/backend/data/downloadImgsForReview.py b/backend/data/downloadEolImgs.py index d1191d7..8cf2ba2 100755 --- a/backend/data/downloadImgsForReview.py +++ b/backend/data/downloadEolImgs.py @@ -21,7 +21,7 @@ if len(sys.argv) > 1: imagesListDb = "eol/imagesList.db" dbFile = "data.db" -outDir = "imgsForReview/" +outDir = "eolImgsForReview/" LICENSE_REGEX = r"cc-by((-nc)?(-sa)?(-[234]\.[05])?)|cc-publicdomain|cc-0-1\.0|public domain" POST_DL_DELAY_MIN = 2 # Minimum delay in seconds to pause after download before starting another (for each thread) POST_DL_DELAY_MAX = 3 diff --git a/backend/data/genImgsForWeb.py b/backend/data/genImgsForWeb.py index 9db260f..d1eef1b 100755 --- a/backend/data/genImgsForWeb.py +++ b/backend/data/genImgsForWeb.py @@ -16,7 +16,7 @@ if len(sys.argv) > 1: print(usageInfo, file=sys.stderr) sys.exit(1) -imgDir = "imgsReviewed/" +imgDir = "eolImgsReviewed/" outDir = "img/" imagesListDb = "eol/imagesList.db" dbFile = "data.db" diff --git a/backend/data/reviewImgs.py b/backend/data/reviewEolImgs.py index 63e7dd5..08b8478 100755 --- a/backend/data/reviewImgs.py +++ b/backend/data/reviewEolImgs.py @@ -16,8 +16,8 @@ if len(sys.argv) > 1: print(usageInfo, file=sys.stderr) sys.exit(1) -imgDir = "imgsForReview/" -outDir = "imgsReviewed/" +imgDir = "eolImgsForReview/" +outDir = "eolImgsReviewed/" dbFile = "data.db" IMG_DISPLAY_SZ = 400 MAX_IMGS_PER_ID = 3 |
