make sure part is an encoded string (BeautifulSoup sometimes does not encode input)

This commit is contained in:
Helmut Merz 2013-08-13 13:04:27 +02:00
parent 51cc5a6d36
commit 707d7abf6d

View file

@ -115,4 +115,6 @@ def extractFirstPart(value):
else: else:
text = stripAll(value) text = stripAll(value)
part = sentencePattern.split(text)[0] part = sentencePattern.split(text)[0]
if isinstance(part, unicode):
part = part.encode('UTF-8')
return ('<p>%s</p>' % part).decode('utf8') return ('<p>%s</p>' % part).decode('utf8')