1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
|
import unittest
import tempfile
import os
from tests.common import createTestFile, createTestDbTable, readTestDbTable
from tol_data.gen_name_data import genData
class TestGenData(unittest.TestCase):
def test_gen(self):
with tempfile.TemporaryDirectory() as tempDir:
# Create temp eol names file
eolNamesFile = os.path.join(tempDir, 'vernacular_names.csv')
createTestFile(eolNamesFile, (
'page_id,,vernacular_string,language_code,,,is_preferred_by_eol\n'
'10,,cat,eng,,,preferred\n'
'10,,kitty,eng,,,\n'
'20,,apple,eng,,,preferred\n'
'20,,pomme,fr,,,preferred\n'
'20,,apples,eng,,,\n'
'30,,those things with wings,eng,,,\n'
))
# Create temp enwiki db
enwikiDb = os.path.join(tempDir, 'desc_data.db')
createTestDbTable(
enwikiDb,
'CREATE TABLE pages (id INT PRIMARY KEY, title TEXT UNIQUE)',
'INSERT INTO pages VALUES (?, ?)',
[
(1, 'abc'),
(2, 'def'),
(3, 'ghi'),
]
)
createTestDbTable(
enwikiDb,
'CREATE TABLE redirects (id INT PRIMARY KEY, target TEXT)',
'INSERT INTO redirects VALUES (?, ?)',
[
(3, 'abc'),
(4, 'def'),
]
)
# Create temp picked-names file
pickedNamesFile = os.path.join(tempDir, 'picked_names.txt')
createTestFile(pickedNamesFile, (
'three|xxx|1\n'
'one|kitty|\n'
'two|two|\n'
))
# Create temp db
dbFile = os.path.join(tempDir, 'data.db')
createTestDbTable(
dbFile,
'CREATE TABLE nodes (name TEXT PRIMARY KEY, id TEXT UNIQUE, tips INT)',
'INSERT INTO nodes VALUES (?, ?, ?)',
[
('one', 'ott1', 1),
('two', 'ott2', 1),
('three', 'ott3', 1),
]
)
createTestDbTable(
dbFile,
'CREATE TABLE eol_ids (name TEXT PRIMARY KEY, id INT)',
'INSERT INTO eol_ids VALUES (?, ?)',
[
('one', 10),
('two', 20),
('three', 30),
]
)
createTestDbTable(
dbFile,
'CREATE TABLE wiki_ids (name TEXT PRIMARY KEY, id INT)',
'INSERT INTO wiki_ids VALUES (?, ?)',
[
('one', 1),
('two', 3),
('three', 2),
]
)
# Run
genData(eolNamesFile, enwikiDb, pickedNamesFile, dbFile)
# Check
self.assertEqual(
readTestDbTable(dbFile, 'SELECT name, alt_name, pref_alt, src FROM names'),
{
('one', 'cat', 1, 'eol'),
('one', 'ghi', 0, 'enwiki'),
('two', 'apple', 0, 'eol'),
('two', 'apples', 0, 'eol'),
('three', 'xxx', 1, 'picked'),
}
)
|