This repository was archived by the owner on Nov 29, 2019. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 3
Expand file tree
/
Copy pathtests.py
More file actions
153 lines (137 loc) · 5.82 KB
/
tests.py
File metadata and controls
153 lines (137 loc) · 5.82 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
# -*- coding: utf-8 -*-
# Copyright (c) 2018 by Ecreall and Bluenove under licence AGPL terms
# available on http://www.gnu.org/licenses/agpl.html
# licence: AGPL
# author: Amen Souissi
import unittest
from micawber import *
from micawber.test_utils import test_pr
from url_metadata.utils import get_favicon_url, get_url_domain, get_url_metadata, parse_url_metadata
# Bare HTML page without any <meta>, <title> or <link> tags; the
# *_empty_doc tests below feed it to the helpers under test.
empty_document = '<html><head></head><body></body></html>'
def get_document(title, site_name, description, url, image, favicon):
    """Return an HTML page whose head carries Open Graph, Twitter and favicon tags.

    The six arguments are inserted verbatim (no escaping) into the
    ``content``/``href`` attributes of the generated tags. The ``<title>``
    element is a fixed string and does not depend on ``title``; ``title``
    only feeds the ``og:title`` and ``twitter:title`` tags.

    Args:
        title: Value for ``og:title`` and ``twitter:title``.
        site_name: Value for ``og:site_name`` and ``twitter:site``.
        description: Value for ``og:description`` and ``twitter:description``.
        url: Value for ``og:url`` and ``twitter:url``.
        image: Value for ``og:image``.
        favicon: ``href`` of the ``shortcut icon`` link.

    Returns:
        The complete document as a single ``str`` with no line breaks.

    Raises:
        TypeError: If any argument is not a ``str``.
    """
    # Fragments are listed in output order and glued together in one pass.
    fragments = [
        '<html><head>',
        '<meta http-equiv="Content-Type" content="text/html; charset=utf-8">',
        '<title>Site title Foo bar</title>',
        '<meta property="og:site_name" content="', site_name, '">',
        '<meta property="og:type" content="website">',
        '<meta property="og:locale" content="fr_FR">',
        '<meta property="og:title" content="', title, '">',
        '<meta property="og:description" content="', description, '">',
        '<meta property="og:url" content="', url, '">',
        '<meta property="og:image:type" content="image/png">',
        '<meta property="og:image:width" content="1880">',
        '<meta property="og:image:height" content="984">',
        '<meta property="og:image" content="', image, '">',
        '<meta name="twitter:card" content="summary">',
        '<meta name="twitter:site" content="', site_name, '">',
        '<meta name="twitter:url" content="', url, '">',
        '<meta name="twitter:title" content="', title, '">',
        '<meta name="twitter:description" content="', description, '">',
        '<link rel="shortcut icon" href="', favicon, '">',
        '</head><body></body></html>',
    ]
    return ''.join(fragments)
class TestURLMetadata(unittest.TestCase):
    """Checks for the ``url_metadata.utils`` helpers using in-memory HTML pages.

    Pages are produced by ``get_document`` (fully tagged) or taken from
    ``empty_document`` (no tags). The ``get_url_metadata`` tests pass
    micawber's ``test_pr`` as the ``providers`` argument.
    """

    # Text fields shared by every fully tagged fixture page.
    _TITLE = 'FooBar title'
    _SITE_NAME = 'FooBar'
    _DESCRIPTION = 'FooBar description'

    def _render(self, url, image, favicon):
        # Build the tagged fixture page; only the three URLs vary per test.
        return get_document(
            self._TITLE, self._SITE_NAME, self._DESCRIPTION,
            url, image, favicon)

    def _page_metadata(self, url, image, favicon, **extra):
        # Metadata the tests expect for a page built by _render(); `extra`
        # adds further expected entries on top of the six page-derived ones.
        fields = {
            'url': url,
            'title': self._TITLE,
            'description': self._DESCRIPTION,
            'provider_name': self._SITE_NAME,
            'thumbnail_url': image,
            'favicon_url': favicon,
        }
        fields.update(extra)
        return fields

    def test_get_favicon_url(self):
        # The href of the page's "shortcut icon" link is expected back.
        page_url = 'http://link-test1'
        icon_url = 'http://link-test1/favicon.ico'
        html = self._render(page_url, 'http://link-test1/foobar.png', icon_url)
        self.assertEqual(get_favicon_url(html, page_url), icon_url)

    def test_get_favicon_url_empty_doc(self):
        # A page without any icon link is expected to give None.
        self.assertIsNone(get_favicon_url(empty_document, 'http://link-test1'))

    def test_get_url_domain(self):
        # A bare host and a URL with path + query map to the same root URL.
        self.assertEqual(
            get_url_domain('http://link-test1.com'),
            'http://link-test1.com/')
        deep_url = 'http://link-test1.com/foo/bar?re=1'
        self.assertEqual(get_url_domain(deep_url), 'http://link-test1.com/')
        # With True as second argument only the 'link-test1' label is expected
        # (NOTE(review): the flag's name is not visible here -- confirm in utils).
        self.assertEqual(get_url_domain(deep_url, True), 'link-test1')

    def test_parse_url_metadata(self):
        # Every expected field comes straight from the page's tags.
        page_url = 'http://link-test1'
        icon_url = 'http://link-test1/favicon.ico'
        picture_url = 'http://link-test1/foobar.png'
        payload = self._render(page_url, picture_url, icon_url).encode()
        result = parse_url_metadata(page_url, payload)
        self.assertEqual(
            result, self._page_metadata(page_url, picture_url, icon_url))

    def test_parse_url_metadata_empty_doc(self):
        # Without tags all page-derived fields are expected to be None, while
        # provider_name is expected to be 'link-test1' (presumably taken from
        # the URL -- verify against parse_url_metadata).
        page_url = 'http://link-test1'
        result = parse_url_metadata(page_url, empty_document.encode())
        wanted = {
            'url': 'http://link-test1',
            'title': None,
            'description': None,
            'provider_name': 'link-test1',
            'thumbnail_url': None,
            'favicon_url': None,
        }
        self.assertEqual(result, wanted)

    def test_get_url_metadata(self):
        # For this URL the result is expected to carry 'type' and 'html'
        # entries in addition to the page-derived fields.
        page_url = 'http://video-test1'
        icon_url = 'http://video-test1/favicon.ico'
        picture_url = 'http://video-test1/foobar.png'
        payload = self._render(page_url, picture_url, icon_url).encode()
        result = get_url_metadata(page_url, payload, providers=test_pr)
        wanted = self._page_metadata(
            page_url, picture_url, icon_url,
            type='video', html='<test1>video</test1>')
        self.assertEqual(result, wanted)

    def test_get_url_metadata_empty_doc(self):
        # Even with an untagged page the 'type' and 'html' entries are
        # expected; the page-derived fields are expected to be None.
        page_url = 'http://video-test1'
        result = get_url_metadata(
            page_url, empty_document.encode(), providers=test_pr)
        wanted = {
            'url': 'http://video-test1',
            'title': None,
            'description': None,
            'provider_name': 'video-test1',
            'thumbnail_url': None,
            'favicon_url': None,
            'type': 'video',
            'html': '<test1>video</test1>',
        }
        self.assertEqual(result, wanted)

    def test_get_url_metadata_no_oembed(self):
        # For this URL only the page-derived fields are expected: no 'type'
        # or 'html' entry (presumably no provider in test_pr matches it).
        page_url = 'http://site-bar'
        icon_url = 'http://site-bar/favicon.ico'
        picture_url = 'http://site-bar/foobar.png'
        payload = self._render(page_url, picture_url, icon_url).encode()
        result = get_url_metadata(page_url, payload, providers=test_pr)
        self.assertEqual(
            result, self._page_metadata(page_url, picture_url, icon_url))