diff --git a/newswire.py b/newswire.py index 606bf1dd..295579de 100644 --- a/newswire.py +++ b/newswire.py @@ -227,10 +227,14 @@ def xml2StrToHashtagCategories(baseDir: str, domain: str, xmlStr: str, categoryStr = categoryStr.split('')[0].strip() if not categoryStr: continue + if 'CDATA' in categoryStr: + continue hashtagListStr = rssItem.split('')[1] hashtagListStr = hashtagListStr.split('')[0].strip() if not hashtagListStr: continue + if 'CDATA' in hashtagListStr: + continue hashtagList = hashtagListStr.split(' ') if not isBlockedHashtag(baseDir, categoryStr): for hashtag in hashtagList: