This commit is contained in:
Kovid Goyal 2008-06-14 08:03:25 -07:00
parent 48930e7847
commit ee9316a76c

View File

@@ -46,7 +46,10 @@ def xml_to_unicode(raw, verbose=False):
if match is not None:
encoding = match.group(1)
if encoding is None:
try:
chardet = detect(raw)
except:
chardet = {'encoding':'utf-8', 'confidence':0}
encoding = chardet['encoding']
if chardet['confidence'] < 1 and verbose:
print 'WARNING: Encoding detection confidence %d%%'%(chardet['confidence']*100)