From e09bf7a4d4d037b7b88ee21f89514d6a3e15a380 Mon Sep 17 00:00:00 2001
From: Marian Steinbach
Date: Fri, 4 May 2018 00:38:44 +0200
Subject: [PATCH] Add basic test for check_content

---
 test.py | 35 +++++++++++++++++++++++++++++++++++
 1 file changed, 35 insertions(+)

diff --git a/test.py b/test.py
index 2f465fb..e165a45 100644
--- a/test.py
+++ b/test.py
@@ -1,4 +1,6 @@
 import unittest
+import requests
+import responses
 import spider
 
 class TestSpider(unittest.TestCase):
@@ -24,6 +26,39 @@ class TestSpider(unittest.TestCase):
         result = spider.reduce_urls(testdata)
         self.assertEqual(result, expected_result)
 
+    @responses.activate
+    def test_check_content1(self):
+        """
+        Very basic test of our content analysis function
+        """
+        url = 'http://my.url'
+        responses.add(responses.GET, url, status=200,
+            content_type='text/html',
+            body='''
+
+
+
+
+            The title
+
+
+            ''')
+        r = requests.get(url)
+        result = spider.check_content(r)
+
+        del result['html'] # don't want to have the messy HTML part in comparison
+
+        expected_result = {
+            'icon': None,
+            'title': 'The title',
+            'generator': None,
+            'feeds': [],
+            'encoding': 'ISO-8859-1',
+            'canonical_link': None,
+            'opengraph': None
+        }
+        self.assertDictEqual(result, expected_result)
+
 
 if __name__ == '__main__':
     unittest.main()