We do not have to decode the string again, since the data we get back from html5lib is already UTF-8 encoded.

Fixes issue 1552.
diff --git a/app/soc/logic/cleaning.py b/app/soc/logic/cleaning.py
index 61c1f1a..14eba95 100644
--- a/app/soc/logic/cleaning.py
+++ b/app/soc/logic/cleaning.py
@@ -424,12 +424,7 @@
   except (HTMLParseError, ParseError), msg:
     raise forms.ValidationError(msg)
 
-  try:
-    content = cleaned_content.decode("utf-8")
-  except Exception, e:
-    raise forms.ValidationError(str(e))
-
-  return content
+  return cleaned_content
 
 
 def clean_html_content(field_name):