mirror of
https://github.com/python/cpython.git
synced 2025-08-23 18:24:46 +00:00
#13273: fix a bug that prevented HTMLParser to properly detect some tags when strict=False.
This commit is contained in:
parent
0b85cd0680
commit
f50ffa94ab
3 changed files with 38 additions and 3 deletions
|
@ -373,6 +373,39 @@ class HTMLParserTolerantTestCase(TestCaseBase):
|
|||
[('action', 'bogus|&#()value')])],
|
||||
collector = self.collector)
|
||||
|
||||
def test_issue13273(self):
|
||||
html = ('<div style="" ><b>The <a href="some_url">rain</a> '
|
||||
'<br /> in <span>Spain</span></b></div>')
|
||||
expected = [
|
||||
('starttag', 'div', [('style', '')]),
|
||||
('starttag', 'b', []),
|
||||
('data', 'The '),
|
||||
('starttag', 'a', [('href', 'some_url')]),
|
||||
('data', 'rain'),
|
||||
('endtag', 'a'),
|
||||
('data', ' '),
|
||||
('startendtag', 'br', []),
|
||||
('data', ' in '),
|
||||
('starttag', 'span', []),
|
||||
('data', 'Spain'),
|
||||
('endtag', 'span'),
|
||||
('endtag', 'b'),
|
||||
('endtag', 'div')
|
||||
]
|
||||
self._run_check(html, expected, collector=self.collector)
|
||||
|
||||
def test_issue13273_2(self):
|
||||
html = '<div style="", foo = "bar" ><b>The <a href="some_url">rain</a>'
|
||||
expected = [
|
||||
('starttag', 'div', [('style', ''), ('foo', 'bar')]),
|
||||
('starttag', 'b', []),
|
||||
('data', 'The '),
|
||||
('starttag', 'a', [('href', 'some_url')]),
|
||||
('data', 'rain'),
|
||||
('endtag', 'a'),
|
||||
]
|
||||
self._run_check(html, expected, collector=self.collector)
|
||||
|
||||
def test_unescape_function(self):
|
||||
p = html.parser.HTMLParser()
|
||||
self.assertEqual(p.unescape('&#bad;'),'&#bad;')
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue