Fixed Non-ASCII character error in the English OCR cleanup backend

This commit is contained in:
Roberto Rosario
2011-04-13 03:26:55 -04:00
parent 6b5a17af39
commit f87beff00e

View File

@@ -13,7 +13,7 @@ def check_word(word):
if len(word) > 20:
return None
-#(A) If a strings ratio of alphanumeric characters to total
+#(A) If a string's ratio of alphanumeric characters to total
#characters is less than 50%, the string is garbage
if len(ALL_ALPHANUM.findall(word)) < len(word) / 2:
return None