Added:
trunk/feedparser/tests/illformed/rss/item_description_code_br.xml
trunk/feedparser/tests/wellformed/rss/item_description_code_br.xml
Modified:
trunk/feedparser/feedparser.py
Log:
http://blog.mozilla.com/rob-sayre/2009/02/18/engineer-for-serendipity/
Modified: trunk/feedparser/feedparser.py
==============================================================================
--- trunk/feedparser/feedparser.py (original)
+++ trunk/feedparser/feedparser.py Fri Feb 20 15:19:53 2009
@@ -1654,7 +1654,7 @@
def feed(self, data):
data = re.compile(r'<!((?!DOCTYPE|--|\[))', re.IGNORECASE).sub(r'&lt;!\1', data)
#data = re.sub(r'<(\S+?)\s*?/>', self._shorttag_replace, data) # bug [ 1399464 ] Bad regexp for _shorttag_replace
- data = re.sub(r'<([^<\s]+?)\s*/>', self._shorttag_replace, data)
+ data = re.sub(r'<([^<>\s]+?)\s*/>', self._shorttag_replace, data)
data = data.replace('&#39;', "'")
data = data.replace('&#34;', '"')
if self.encoding and type(data) == type(u''):
Added: trunk/feedparser/tests/illformed/rss/item_description_code_br.xml
==============================================================================
--- (empty file)
+++ trunk/feedparser/tests/illformed/rss/item_description_code_br.xml Fri Feb 20 15:19:53 2009
@@ -0,0 +1,12 @@
+<!--
+Description: item description contains <code> with <br />
+Expect: bozo and entries[0]['description'] == u'<code><br /></code>'
+-->
+<rss version="2.0">
+<channel>
+<item>
+<link>http://www.example.com/</link>
+<description><![CDATA[<code><br /></code>]]></description>
+</item>
+</channel>
+</rss
Added: trunk/feedparser/tests/wellformed/rss/item_description_code_br.xml
==============================================================================
--- (empty file)
+++ trunk/feedparser/tests/wellformed/rss/item_description_code_br.xml Fri Feb 20 15:19:53 2009
@@ -0,0 +1,12 @@
+<!--
+Description: item description contains <code> with <br />
+Expect: not bozo and entries[0]['description'] == u'<code><br /></code>'
+-->
+<rss version="2.0">
+<channel>
+<item>
+<link>http://www.example.com/</link>
+<description><![CDATA[<code><br /></code>]]></description>
+</item>
+</channel>
+</rss>