mirror of
https://github.com/heyarne/berliner-winter.git
synced 2026-05-06 19:23:39 +02:00
25 lines
701 B
Python
25 lines
701 B
Python
def get_district(article_headline):
|
|
"""
|
|
Returns a geo-coded version of a district an article is about, based on its
|
|
headline.
|
|
"""
|
|
pass
|
|
|
|
def get_categories(article_body):
|
|
"""
|
|
Gives a list of categories an article falls into, which is empty if none of
|
|
the following are matched:
|
|
- sexism
|
|
- antisemitism
|
|
- homophobia
|
|
- racism
|
|
"""
|
|
bad_words = {
|
|
'antisemit': 'antisemitism',
|
|
'homophob': 'homophobia',
|
|
'sexis': 'sexism',
|
|
'rassis': 'racism'
|
|
}
|
|
found_categories = [bad_words[key] for key in bad_words
|
|
if key in article_body.lower()]
|
|
return found_categories or ['other']
|