Start writing some analyzaton code

This commit is contained in:
Arne Schlüter 2015-01-17 11:45:52 +01:00
commit 06814ecae8

25
analyze.py Normal file
View file

@ -0,0 +1,25 @@
def get_district(article_headline):
"""
Returns a geo-coded version of a district an article is about, based on its
headline.
"""
pass
def get_categories(article_body):
"""
Gives a list of categories an article falls into, which is empty if none of
the following are matched:
- sexism
- antisemitism
- homophobia
- racism
"""
bad_words = {
'antisemit': 'antisemitism',
'homophob': 'homophobia',
'sexis': 'sexism',
'rassis': 'racism'
}
found_categories = [bad_words[key] for key in bad_words
if key in article_body.lower()]
return found_categories or ['other']