Skip to content

Commit c5a8007

Browse files
committed
Add a better test for encoding prescan length
1 parent 9dc49f6 commit c5a8007

File tree

1 file changed

+9
-0
lines changed

1 file changed

+9
-0
lines changed

html5lib/tests/test_encoding.py

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -12,6 +12,15 @@
1212
from html5lib import HTMLParser, inputstream
1313

1414

15+
def test_basic_prescan_length():
    """Check that a ``<meta charset>`` ending a 1024-byte document is honoured.

    A short UTF-8 document is built with a comment placed before the meta
    declaration; the comment is then stretched with filler bytes until the
    whole document is exactly 1024 bytes long, leaving the declaration as
    the final bytes of the input. With chardet disabled, the stream is
    expected to report ``utf-8`` as its encoding.
    """
    markup = "<title>Caf\u00E9</title><!--a--><meta charset='utf-8'>"
    raw = markup.encode('utf-8')

    # The comment already holds one "a", so one extra filler byte is needed
    # on top of the shortfall to land on exactly 1024 bytes.
    filler_len = 1024 - len(raw) + 1
    stretched_comment = b"-" + (b"a" * filler_len) + b"-"
    padded = raw.replace(b"-a-", stretched_comment)
    assert len(padded) == 1024  # Sanity

    # NOTE(review): 1024 is presumably the prescan limit — confirm against
    # the inputstream implementation.
    stream = inputstream.HTMLBinaryInputStream(padded, chardet=False)
    assert 'utf-8' == stream.charEncoding[0].name
22+
23+
1524
def runParserEncodingTest(data, encoding):
1625
p = HTMLParser()
1726
assert p.documentEncoding is None

0 commit comments

Comments
 (0)