Skip to content
This repository was archived by the owner on Nov 8, 2023. It is now read-only.

Commit c6af101

Browse files
committed
html: Test tokenizer against html5lib test suite
1 parent 27752f7 commit c6af101

30 files changed

+33254
-0
lines changed

result/html-tokenizer/NOTICE

+27
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
The test cases in this directory are derived from the html5lib test
2+
suite available from https://github.com/html5lib/html5lib-tests under
3+
the following license:
4+
5+
---
6+
7+
Copyright (c) 2006-2013 James Graham, Geoffrey Sneddon, and
8+
other contributors
9+
10+
Permission is hereby granted, free of charge, to any person obtaining
11+
a copy of this software and associated documentation files (the
12+
"Software"), to deal in the Software without restriction, including
13+
without limitation the rights to use, copy, modify, merge, publish,
14+
distribute, sublicense, and/or sell copies of the Software, and to
15+
permit persons to whom the Software is furnished to do so, subject to
16+
the following conditions:
17+
18+
The above copyright notice and this permission notice shall be
19+
included in all copies or substantial portions of the Software.
20+
21+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
22+
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
23+
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
24+
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
25+
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
26+
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
27+
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,96 @@
1+
0
2+
Character
3+
<head>&body;
4+
1
5+
Character
6+
</plaintext>&body;
7+
2
8+
Character
9+
foo
10+
EndTag
11+
xmp
12+
3
13+
Character
14+
foo
15+
EndTag
16+
xmp
17+
4
18+
Character
19+
foo
20+
EndTag
21+
xmp
22+
5
23+
Character
24+
foo
25+
EndTag
26+
xmp
27+
6
28+
Character
29+
foo
30+
7
31+
Character
32+
foo
33+
8
34+
Character
35+
foo</xmp
36+
9
37+
Character
38+
foo</xmp
39+
10
40+
Character
41+
foo
42+
11
43+
Character
44+
foo
45+
12
46+
Character
47+
foo</xmp<
48+
13
49+
Character
50+
foo</xmp<
51+
14
52+
Character
53+
</foo>bar
54+
EndTag
55+
xmp
56+
15
57+
Character
58+
</foo>bar
59+
EndTag
60+
xmp
61+
16
62+
Character
63+
</xmp</xmp
64+
EndTag
65+
xmp
66+
17
67+
Character
68+
</xmp</xmp
69+
EndTag
70+
xmp
71+
18
72+
Character
73+
</foo>bar</xmpaar>
74+
19
75+
Character
76+
</foo>bar</xmpaar>
77+
20
78+
Character
79+
foo
80+
EndTag
81+
xmp
82+
EndTag
83+
baz
84+
21
85+
Character
86+
foo
87+
EndTag
88+
xmp
89+
EndTag
90+
baz
91+
22
92+
Character
93+
&foo;
94+
23
95+
Character
96+
<

result/html-tokenizer/domjs.test

+190
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,190 @@
1+
0
2+
Comment
3+
?
4+
5+
1
6+
Comment
7+
?
8+
9+
2
10+
Comment
11+
?
12+
13+
14+
3
15+
Character
16+
17+
4
18+
Character
19+
20+
5
21+
Character
22+
23+
6
24+
Character
25+
26+
7
27+
Character
28+
<!--test�--><!--test-�--><!--test--�-->
29+
8
30+
Character
31+
<!--<script>�--><!--<script>-�--><!--<script>--�-->
32+
9
33+
Character
34+
<!--test
35+
10
36+
Character
37+
<!--test-
38+
11
39+
Character
40+
<!--test--
41+
12
42+
Character
43+
<!--<script>-
44+
13
45+
Character
46+
<!--<script>--
47+
14
48+
Character
49+
<!--<script>
50+
15
51+
Character
52+
<!-- - -->
53+
16
54+
Character
55+
<!-- -< -->
56+
17
57+
Character
58+
<!--test--->
59+
18
60+
Character
61+
<!--
62+
EndTag
63+
script
64+
Character
65+
-->
66+
EndTag
67+
script
68+
19
69+
Character
70+
<!-- <script></script> -->
71+
EndTag
72+
script
73+
20
74+
Character
75+
<!-- <script><script></script>
76+
EndTag
77+
script
78+
Character
79+
-->
80+
EndTag
81+
script
82+
21
83+
Character
84+
<!-- <script>-->
85+
EndTag
86+
script
87+
Character
88+
-->
89+
EndTag
90+
script
91+
22
92+
Character
93+
<!--<scrip>
94+
EndTag
95+
script
96+
Character
97+
-->
98+
23
99+
Character
100+
<!--<script
101+
EndTag
102+
script
103+
Character
104+
-->
105+
24
106+
Character
107+
<!--<script></scrip>-->
108+
25
109+
Character
110+
<!--<script></script-->
111+
26
112+
Character
113+
foobar
114+
27
115+
Character
116+
foobar
117+
28
118+
Character
119+
foobar
120+
29
121+
Character
122+
foobar
123+
30
124+
Character
125+
≂̸
126+
31
127+
Character
128+
&NotEqualTild;
129+
32
130+
EndTag
131+
xmp
132+
33
133+
EndTag
134+
xmp
135+
34
136+
EndTag
137+
xmp
138+
35
139+
Character
140+
</ XMP>
141+
36
142+
Character
143+
</ XMP>
144+
37
145+
Character
146+
</ XMP>
147+
38
148+
Character
149+
</xm>
150+
39
151+
Character
152+
</xm>
153+
40
154+
Character
155+
</xm>
156+
41
157+
Character
158+
</xm
159+
42
160+
Character
161+
</xm
162+
43
163+
Character
164+
</xm
165+
44
166+
Character
167+
</xm/
168+
45
169+
Character
170+
</xm/
171+
46
172+
Character
173+
</xm/
174+
47
175+
StartTag
176+
p id=≂̸
177+
48
178+
Comment
179+
--!�
180+
49
181+
DOCTYPE
182+
html
183+
<none>
184+
<none>
185+
50
186+
Comment
187+
[CDATA[foo]]
188+
51
189+
Character
190+
<b>hello world</b>

0 commit comments

Comments
 (0)