Skip to content

Commit

Permalink
Added a try/except to catch Unicode errors.
Browse files: browse the repository at this point in the history.
  • Loading branch information
elgatito committed Jan 13, 2022
1 parent 701f323 commit 7415707
Showing 1 changed file with 14 additions and 11 deletions.
25 changes: 14 additions & 11 deletions burst/normalize.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -184,20 +184,23 @@ def normalize_string(string, charset=None, replacing=False):
string = unicode(string, errors='ignore')
pass

string = remove_control_chars(string)
string = fix_bad_unicode(string)
string = unquote(string)
string = string.replace(u'<![CDATA[', u'').replace(u']]', u'')
try:
string = remove_control_chars(string)
string = fix_bad_unicode(string)
string = unquote(string)
string = string.replace(u'<![CDATA[', u'').replace(u']]', u'')

if PY3:
string = html.unescape(string)
else:
string = HTMLParser().unescape(string)
if PY3:
string = html.unescape(string)
else:
string = HTMLParser().unescape(string)

if replacing:
string = string.replace(u"'", '')
if replacing:
string = string.replace(u"'", '')

string = string.lower()
string = string.lower()
except:
pass

return string

Expand Down

0 comments on commit 7415707

Please sign in to comment.