<?xml version="1.0" encoding="UTF-8"?>
<commit>
  <added type="array"/>
  <modified type="array">
    <modified>
      <diff>@@ -102,12 +102,14 @@ def sanitize_html(html='&lt;p&gt;No comment&lt;/p&gt;', encoding=None,
 
     if isinstance(html, unicode) and not encoding:
         logging.debug(&quot;Sanitizing unicode input.&quot;)
-        soup = BeautifulSoup(html)
+        soup = BeautifulSoup(html,  
+                            convertEntities=BeautifulSoup.XHTML_ENTITIES)
     else:
         if not encoding:
             encoding = 'latin-1'
         logging.debug(&quot;Sanitizing string input, assuming %s&quot;, encoding)
-        soup = BeautifulSoup(html.decode(encoding, 'ignore'))
+        soup = BeautifulSoup(html.decode(encoding, 'ignore'),
+                             convertEntities=BeautifulSoup.XHTML_ENTITIES)
     for comment in soup.findAll(
                     text = lambda text: isinstance(text, Comment)):
         comment.extract()</diff>
      <filename>utils/sanitizer.py</filename>
    </modified>
  </modified>
  <removed type="array"/>
  <parents type="array">
    <parent>
      <id>4bfe1ddd1aaeb8d6abb0a02463cbe8a4af4c2fac</id>
    </parent>
  </parents>
  <author>
    <name>Bill Katz</name>
    <email>billkatz@gmail.com</email>
  </author>
  <url>http://github.com/DocSavage/bloog/commit/b5f9622ce02428cd6dac80a8239d6f26460ec16c</url>
  <id>b5f9622ce02428cd6dac80a8239d6f26460ec16c</id>
  <committed-date>2008-08-23T20:29:57-07:00</committed-date>
  <authored-date>2008-08-23T12:57:54-07:00</authored-date>
  <message>Convert HTML entities on receiving data.  This should prevent errors in Atom feed as well.</message>
  <tree>df5b8a6804a1563adf2327d570f307eb8fedd28a</tree>
  <committer>
    <name>Bill Katz</name>
    <email>billkatz@gmail.com</email>
  </committer>
</commit>
