From 1cab4cd3d653d3d3f4485b0b52ea6e352a508dd1 Mon Sep 17 00:00:00 2001 From: Packit Service Date: Jan 05 2021 22:32:05 +0000 Subject: Apply patch CVE-2020-27783.patch patch_name: CVE-2020-27783.patch present_in_specfile: true location_in_specfile: 1 --- diff --git a/src/lxml/html/clean.py b/src/lxml/html/clean.py index adc3f45..6f3f7de 100644 --- a/src/lxml/html/clean.py +++ b/src/lxml/html/clean.py @@ -61,12 +61,15 @@ __all__ = ['clean_html', 'clean', 'Cleaner', 'autolink', 'autolink_html', # This is an IE-specific construct you can have in a stylesheet to # run some Javascript: -_css_javascript_re = re.compile( - r'expression\s*\(.*?\)', re.S|re.I) +_replace_css_javascript = re.compile( + r'expression\s*\(.*?\)', re.S|re.I).sub # Do I have to worry about @\nimport? -_css_import_re = re.compile( - r'@\s*import', re.I) +_replace_css_import = re.compile( + r'@\s*import', re.I).sub + +_looks_like_tag_content = re.compile( + r'' + return True return False def clean_html(self, html): diff --git a/src/lxml/html/tests/test_clean.py b/src/lxml/html/tests/test_clean.py index 3bcaaf5..451eec2 100644 --- a/src/lxml/html/tests/test_clean.py +++ b/src/lxml/html/tests/test_clean.py @@ -69,6 +69,26 @@ class CleanerTest(unittest.TestCase): s = lxml.html.fromstring('child') self.assertEqual('child', clean_html(s).text_content()) + def test_sneaky_noscript_in_style(self): + # This gets parsed as through into the output. + html = '', + lxml.html.tostring(clean_html(s))) + + def test_sneaky_js_in_math_style(self): + # This gets parsed as -> + # thus passing any tag/script/whatever content through into the output. + html = '' + s = lxml.html.fragment_fromstring(html) + + self.assertEqual( + b'', + lxml.html.tostring(clean_html(s))) + def test_suite(): suite = unittest.TestSuite() diff --git a/src/lxml/html/tests/test_clean.txt b/src/lxml/html/tests/test_clean.txt index c78ab4f..c901871 100644 --- a/src/lxml/html/tests/test_clean.txt +++ b/src/lxml/html/tests/test_clean.txt @@ -104,7 +104,11 @@ >>> print(Cleaner(page_structure=False, safe_attrs_only=False).clean_html(doc)) - + a link @@ -168,7 +172,11 @@ - + a link