Skip to content

Commit

Permalink
lower case
Browse files: browse the repository at this point in the history
  • Loading branch information
observerss committed Jan 5, 2012
1 parent 0be8132 commit a60a2a8
Showing 1 changed file with 6 additions and 3 deletions.
9 changes: 6 additions & 3 deletions filter.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -23,10 +23,10 @@ def __init__(self):

def parse(self,path):
for keyword in open(path):
self.keywords.add(keyword.strip().decode('utf-8'))
self.keywords.add(keyword.strip().decode('utf-8').lower())

def filter(self,message,repl="*"):
message = unicode(message)
message = unicode(message).lower()
for kw in self.keywords:
message = message.replace(kw,repl)
return message
Expand All @@ -51,6 +51,7 @@ def __init__(self):
def add(self,keyword):
if not isinstance(keyword,unicode):
keyword = keyword.decode('utf-8')
keyword = keyword.lower()
if keyword not in self.kwsets:
self.keywords.append(keyword)
self.kwsets.add(keyword)
Expand All @@ -70,6 +71,7 @@ def parse(self,path):
def filter(self,message,repl="*"):
if not isinstance(message,unicode):
message = message.decode('utf-8')
message = message.lower()
for word in message.split():
if self.pat_en.search(word):
for index in self.bsdict[word]:
Expand Down Expand Up @@ -97,6 +99,7 @@ def __init__(self):
def add(self,keyword):
if not isinstance(keyword,unicode):
keyword = keyword.decode('utf-8')
keyword = keyword.lower()
chars = keyword.strip()
if not chars:
return
Expand Down Expand Up @@ -125,7 +128,7 @@ def parse(self,path):
def filter(self,message,repl="*"):
if not isinstance(message,unicode):
message = message.decode('utf-8')

message = message.lower()
ret = []
start = 0
while start < len(message):
Expand Down

0 comments on commit a60a2a8

Please sign in to comment.