Filtering base function

So that global and account filtering are treated the same
main
Bob Mottram 2020-12-19 13:21:06 +00:00
parent 7c6d7d158e
commit de1bfa8ed4
1 changed files with 26 additions and 24 deletions

View File

@ -89,6 +89,29 @@ def isTwitterPost(content: str) -> bool:
return False
def isFilteredBase(filename: str, content: str) -> bool:
"""Uses the given file containing filtered words to check
the given content
"""
with open(filename, 'r') as fp:
for line in fp:
filterStr = line.replace('\n', '').replace('\r', '')
if not filterStr:
continue
if len(filterStr) < 2:
continue
if '+' not in filterStr:
if filterStr in content:
return True
else:
filterWords = filterStr.replace('"', '').split('+')
for word in filterWords:
if word not in content:
return False
return True
return False
def isFiltered(baseDir: str, nickname: str, domain: str, content: str) -> bool:
"""Should the given content be filtered out?
This is a simple type of filter which just matches words, not a regex
@ -96,15 +119,7 @@ def isFiltered(baseDir: str, nickname: str, domain: str, content: str) -> bool:
words must be present although not necessarily adjacent
"""
globalFiltersFilename = baseDir + '/accounts/filters.txt'
if os.path.isfile(globalFiltersFilename):
wordsFile = open(globalFiltersFilename, 'r')
if wordsFile:
wordsList = wordsFile.read().split('\n')
for word in wordsList:
if not word:
continue
if len(word) > 1:
if word in content:
if isFilteredBase(globalFiltersFilename, content):
return True
if not nickname or not domain:
@ -119,17 +134,4 @@ def isFiltered(baseDir: str, nickname: str, domain: str, content: str) -> bool:
accountFiltersFilename = baseDir + '/accounts/' + \
nickname + '@' + domain + '/filters.txt'
if os.path.isfile(accountFiltersFilename):
with open(accountFiltersFilename, 'r') as fp:
for line in fp:
filterStr = line.replace('\n', '').replace('\r', '')
if '+' not in filterStr:
if filterStr in content:
return True
else:
filterWords = filterStr.replace('"', '').split('+')
for word in filterWords:
if word not in content:
return False
return True
return False
return isFilteredBase(accountFiltersFilename, content)