aboutsummaryrefslogtreecommitdiff
path: root/backend/tests/enwiki/test_download_imgs.py
blob: 949d88506839a77a9603d822dfd3ab42f956fab8 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
import unittest
from unittest.mock import Mock, patch
import tempfile
import os

from tests.common import readTestFile, createTestDbTable
from hist_data.enwiki.download_imgs import downloadImgs

class TestDownloadInfo(unittest.TestCase):
	@patch('requests.get', autospec=True)
	def test_download(self, requestsGetMock):
		requestsGetMock.side_effect = lambda url, **kwargs: Mock(content=('img:' + url).encode())
		with tempfile.TemporaryDirectory() as tempDir:
			# Create temp image-data db
			imgDb = os.path.join(tempDir, 'img_data.db')
			createTestDbTable(
				imgDb,
				'CREATE TABLE page_imgs (page_id INT PRIMARY KEY, img_name TEXT)',
				'INSERT into page_imgs VALUES (?, ?)',
				{
					(1, 'one'),
					(2, 'two'),
					(3, 'three'),
					(4, 'four'),
					(5, 'five'),
					(6, 'six'),
					(7, 'seven'),
				}
			)
			createTestDbTable(
				imgDb,
				'CREATE TABLE imgs (id INT  PRIMARY KEY, name TEXT UNIQUE, ' \
					'license TEXT, artist TEXT, credit TEXT, restrictions TEXT, url TEXT)',
				'INSERT INTO imgs VALUES (?, ?, ?, ?, ?, ?, ?)',
				{
					(11, 'one','cc-by','alice','anna','','https://upload.wikimedia.org/1.jpg'),
					(12, 'two','???','bob','barbara','','https://upload.wikimedia.org/2.png'),
					(13, 'three','cc-by-sa','clare','File:?','','https://upload.wikimedia.org/3.gif'),
					(14, 'four','cc-by-sa 4.0','dave','dan','all','https://upload.wikimedia.org/4.jpeg'),
					(15, 'five','cc0','eve','eric',None,'https://upload.wikimedia.org/5.png'),
					(16, 'six','cc-by','','fred','','https://upload.wikimedia.org/6.png'),
				}
			)

			# Create temp output directory
			with tempfile.TemporaryDirectory() as outDir:
				# Run
				downloadImgs(imgDb, outDir, 0)
				# Check
				expectedImgs = {
					'11.jpg': 'img:https://upload.wikimedia.org/1.jpg',
					'15.png': 'img:https://upload.wikimedia.org/5.png',
				}
				self.assertEqual(set(os.listdir(outDir)), set(expectedImgs.keys()))
				for imgName, content in expectedImgs.items():
					self.assertEqual(readTestFile(os.path.join(outDir, imgName)), content)