gh-77057: Fix handling of invalid markup declarations in HTMLParser (GH-9295)

Co-authored-by: Serhiy Storchaka <storchaka@gmail.com>
This commit is contained in:
Ezio Melotti 2025-05-10 16:31:43 +02:00 committed by GitHub
parent e7741dd773
commit 76c0b01bc4
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
3 changed files with 68 additions and 19 deletions

View file

@ -278,7 +278,7 @@ def parse_html_declaration(self, i):
if rawdata[i:i+4] == '<!--':
# this case is actually already handled in goahead()
return self.parse_comment(i)
elif rawdata[i:i+3] == '<![':
elif rawdata[i:i+9] == '<![CDATA[':
return self.parse_marked_section(i)
elif rawdata[i:i+9].lower() == '<!doctype':
# find the closing >
@ -295,7 +295,7 @@ def parse_html_declaration(self, i):
def parse_bogus_comment(self, i, report=1):
rawdata = self.rawdata
assert rawdata[i:i+2] in ('<!', '</'), ('unexpected call to '
'parse_comment()')
'parse_bogus_comment()')
pos = rawdata.find('>', i+2)
if pos == -1:
return -1