-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathpipeline_test.py
72 lines (58 loc) · 3.36 KB
/
pipeline_test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
import unittest
import sentiment_analysis.sentiment_dictionary as sd
import article_selection.article_selection as arts
import sentiment_analysis.bert as bert
import os
class TestSentimentDictionary(unittest.TestCase):
    """Tests for `sentiment_analysis.sentiment_dictionary` (imported as `sd`)."""

    def test_wrong_input(self):
        """`sd.analyse_sentiment` must raise TypeError for every invalid argument pair."""
        sentence = "Flüchtlinge haben leider ein schlechtes Image."
        # Each entry is (first argument, second argument) for one rejected call.
        invalid_calls = (
            (sentence, []),                  # empty list as second argument
            (sentence, [2, 3, 4, "hallo"]),  # list mixing ints and a string
            (3, ["c"]),                      # int as first argument
            ([sentence], ["c"]),             # list as first argument
            (True, ["c"]),                   # bool as first argument
        )
        for first_arg, second_arg in invalid_calls:
            with self.assertRaises(TypeError):
                sd.analyse_sentiment(first_arg, second_arg)

    def test_running(self):
        """Call `sd.test()`; the test passes as long as nothing is raised."""
        sd.test()
class TestSentimentBert(unittest.TestCase):
    """Run-only check for `sentiment_analysis.bert` (imported as `bert`)."""

    def test_running(self):
        """Call `bert.test()`; the test passes as long as nothing is raised."""
        bert.test()
class TestArticleSelection(unittest.TestCase):
    """Tests for `article_selection.article_selection` (imported as `arts`)."""

    @staticmethod
    def _valid_article():
        """Return a fresh article dict carrying all four keys used by these tests."""
        return {
            'date': '01.01.2020',
            'title': "title",
            'text': "texttext",
            'url': "http//a.de",
        }

    @staticmethod
    def _remove_if_present(path):
        """Delete `path`; a file that does not exist is not an error."""
        try:
            os.remove(path)
        except FileNotFoundError:
            # Nothing was written, so there is nothing to clean up.
            pass

    def test_wrong_input_is_topic_relevant(self):
        """`arts.is_topic_relevant` must raise TypeError for wrongly typed arguments."""
        # first argument is not a dictionary
        for not_a_dict in ("test", 3, False):
            with self.subTest(article=not_a_dict):
                self.assertRaises(TypeError, arts.is_topic_relevant, not_a_dict)

        valid_article = self._valid_article()
        # second argument is not a list of strings (the empty list is rejected too)
        for bad_keywords in (3, True, [], [2, 3, 5]):
            with self.subTest(keywords=bad_keywords):
                self.assertRaises(
                    TypeError, arts.is_topic_relevant, valid_article, bad_keywords
                )

    def test_right_output_is_topic_relevant(self):
        """`arts.is_topic_relevant` must return the expected boolean for well-typed input."""
        # use article with wrong key
        self.assertEqual(arts.is_topic_relevant({"test": 3}), False)

        valid_article = self._valid_article()
        # no keyword of default list in valid_article -> False
        self.assertEqual(arts.is_topic_relevant(valid_article), False)

        valid_list = ["text"]
        # use other keyword list with keyword text -> True
        self.assertEqual(arts.is_topic_relevant(valid_article, valid_list), True)

        # use nearly valid articles, each with exactly one key missing -> False
        complete = self._valid_article()
        for missing_key in complete:
            incomplete = {
                key: value for key, value in complete.items() if key != missing_key
            }
            with self.subTest(missing_key=missing_key):
                self.assertEqual(
                    arts.is_topic_relevant(incomplete, valid_list), False
                )

    def test_wrong_input_write_relevant_content_to_file(self):
        """`arts.write_relevant_content_to_file` must run without raising on these inputs."""
        # Test: should run without error
        # file list with articles in wrong format
        file_list = ["data/spiegel.json", "data/test.json"]
        relevant_articles_base = "base"
        search_keywords = ["test"]
        # Registered before the call so the file is removed even when the call
        # raises; os.remove avoids depending on a shell that provides `rm`.
        self.addCleanup(self._remove_if_present, "base_evaluation.json")
        arts.write_relevant_content_to_file(
            file_list, relevant_articles_base, search_keywords
        )
# Run every test case in this module when the file is executed as a script.
if __name__ == "__main__":
    unittest.main()