1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
|
import unittest
from unittest.mock import Mock, patch
import tempfile
import os
from tests.common import readTestFile, createTestDbTable
from hist_data.enwiki.download_imgs import downloadImgs
class TestDownloadInfo(unittest.TestCase):
@patch('requests.get', autospec=True)
def test_download(self, requestsGetMock):
requestsGetMock.side_effect = lambda url, **kwargs: Mock(content=('img:' + url).encode())
with tempfile.TemporaryDirectory() as tempDir:
# Create temp image-data db
imgDb = os.path.join(tempDir, 'img_data.db')
createTestDbTable(
imgDb,
'CREATE TABLE page_imgs (page_id INT PRIMARY KEY, img_name TEXT)',
'INSERT into page_imgs VALUES (?, ?)',
{
(1, 'one'),
(2, 'two'),
(3, 'three'),
(4, 'four'),
(5, 'five'),
(6, 'six'),
(7, 'seven'),
}
)
createTestDbTable(
imgDb,
'CREATE TABLE imgs (id INT PRIMARY KEY, name TEXT UNIQUE, ' \
'license TEXT, artist TEXT, credit TEXT, restrictions TEXT, url TEXT)',
'INSERT INTO imgs VALUES (?, ?, ?, ?, ?, ?, ?)',
{
(11, 'one','cc-by','alice','anna','','https://upload.wikimedia.org/1.jpg'),
(12, 'two','???','bob','barbara','','https://upload.wikimedia.org/2.png'),
(13, 'three','cc-by-sa','clare','File:?','','https://upload.wikimedia.org/3.gif'),
(14, 'four','cc-by-sa 4.0','dave','dan','all','https://upload.wikimedia.org/4.jpeg'),
(15, 'five','cc0','eve','eric',None,'https://upload.wikimedia.org/5.png'),
(16, 'six','cc-by','','fred','','https://upload.wikimedia.org/6.png'),
}
)
# Create temp output directory
with tempfile.TemporaryDirectory() as outDir:
# Run
downloadImgs(imgDb, outDir, 0)
# Check
expectedImgs = {
'11.jpg': 'img:https://upload.wikimedia.org/1.jpg',
'15.png': 'img:https://upload.wikimedia.org/5.png',
}
self.assertEqual(set(os.listdir(outDir)), set(expectedImgs.keys()))
for imgName, content in expectedImgs.items():
self.assertEqual(readTestFile(os.path.join(outDir, imgName)), content)
|