import decorator_utils
import string_utils
-
logger = logging.getLogger(__name__)
'girl gone wild',
'girl on top',
'girl on',
+ 'give head',
+ 'giving head',
+ 'gave head',
'goatcx',
'goatse',
'goddamn',
def tokenize(self, text: str):
    """Yield word fragments of *text* for downstream matching.

    The text is first split into tokens by ``nltk.word_tokenize``; each
    token is then split again on runs of non-word characters, and every
    resulting piece is yielded in order.

    Args:
        text: The raw string to break into fragments.

    Yields:
        Each piece produced by ``re.split(r'\W+', token)``.  Note that
        ``re.split`` emits empty strings when a token starts or ends with
        a non-word character (e.g. a lone punctuation token), and those
        empty strings are yielded unchanged.
    """
    for token in nltk.word_tokenize(text):
        # Raw string: '\W' in a normal literal is an invalid escape
        # sequence and triggers a warning on modern Python versions.
        yield from re.split(r'\W+', token)
def contains_bad_word(self, text: str) -> bool:
break
return out
- words = self.tokenize(text)
+ words = [x for x in self.tokenize(text)]
words.append('')
words.append('')
words.append('')