changeset:   83586:9cb90c1a1a46
branch:      3.3
parent:      83583:4f45f9cde9b4
user:        Ezio Melotti
date:        Wed May 01 16:18:25 2013 +0300
files:       Lib/html/parser.py Lib/test/test_htmlparser.py Misc/NEWS
description:
#17802: Fix an UnboundLocalError in html.parser. Initial tests by Thomas Barlow.


diff -r 4f45f9cde9b4 -r 9cb90c1a1a46 Lib/html/parser.py
--- a/Lib/html/parser.py	Wed May 01 15:12:20 2013 +0200
+++ b/Lib/html/parser.py	Wed May 01 16:18:25 2013 +0300
@@ -249,6 +249,7 @@
                         if self.strict:
                             self.error("EOF in middle of entity or char ref")
                         else:
+                            k = match.end()
                             if k <= i:
                                 k = n
                             i = self.updatepos(i, i + 1)
diff -r 4f45f9cde9b4 -r 9cb90c1a1a46 Lib/test/test_htmlparser.py
--- a/Lib/test/test_htmlparser.py	Wed May 01 15:12:20 2013 +0200
+++ b/Lib/test/test_htmlparser.py	Wed May 01 16:18:25 2013 +0300
@@ -535,6 +535,20 @@
         ]
         self._run_check(html, expected)
 
+    def test_EOF_in_charref(self):
+        # see #17802
+        # This test checks that the UnboundLocalError reported in the issue
+        # is not raised, however I'm not sure the returned values are correct.
+        # Maybe HTMLParser should use self.unescape for these
+        data = [
+            ('a&', [('data', 'a&')]),
+            ('a&b', [('data', 'ab')]),
+            ('a&b ', [('data', 'a'), ('entityref', 'b'), ('data', ' ')]),
+            ('a&b;', [('data', 'a'), ('entityref', 'b')]),
+        ]
+        for html, expected in data:
+            self._run_check(html, expected)
+
     def test_unescape_function(self):
         p = self.get_collector()
         self.assertEqual(p.unescape('&#bad;'),'&#bad;')
diff -r 4f45f9cde9b4 -r 9cb90c1a1a46 Misc/NEWS
--- a/Misc/NEWS	Wed May 01 15:12:20 2013 +0200
+++ b/Misc/NEWS	Wed May 01 16:18:25 2013 +0300
@@ -44,6 +44,9 @@
 Library
 -------
 
+- Issue #17802: Fix an UnboundLocalError in html.parser. Initial tests by
+  Thomas Barlow.
+
 - Issue #17192: Restore the patch for Issue #11729 which was ommitted in
   3.3.1 when updating the bundled version of libffi used by ctypes. Update
   many libffi files that were missed in 3.3.1's update to libffi-3.0.13.

AltStyle によって変換されたページ (->オリジナル) /