2020-08-09 04:13:34 +02:00
|
|
|
module html
|
|
|
|
|
2020-12-09 20:08:15 +01:00
|
|
|
import strings
|
2020-08-09 04:13:34 +02:00
|
|
|
|
|
|
|
fn test_split_parse() {
|
|
|
|
mut parser := Parser{}
|
2020-12-09 20:08:15 +01:00
|
|
|
parser.init()
|
2020-08-09 04:13:34 +02:00
|
|
|
parser.split_parse('<!doctype htm')
|
|
|
|
parser.split_parse('l public')
|
|
|
|
parser.split_parse('><html><he')
|
|
|
|
parser.split_parse('ad><t')
|
|
|
|
parser.split_parse('itle> Hum... ')
|
|
|
|
parser.split_parse('A Tit')
|
|
|
|
parser.split_parse('\nle</ti\ntle>')
|
|
|
|
parser.split_parse('</\nhead><body>\t\t\t<h3>')
|
|
|
|
parser.split_parse('Nice Test!</h3>')
|
|
|
|
parser.split_parse('</bo\n\n\ndy></html>')
|
|
|
|
parser.finalize()
|
2020-12-09 20:08:15 +01:00
|
|
|
assert parser.tags.len == 11
|
|
|
|
assert parser.tags[3].content == ' Hum... A Tit\nle'
|
2020-08-09 04:13:34 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
fn test_giant_string() {
|
2020-12-09 20:08:15 +01:00
|
|
|
mut temp_html := strings.new_builder(200)
|
|
|
|
mut parser := Parser{}
|
2021-02-22 12:18:11 +01:00
|
|
|
temp_html.write_string('<!doctype html><html><head><title>Giant String</title></head><body>')
|
2020-08-09 04:13:34 +02:00
|
|
|
for counter := 0; counter < 2000; counter++ {
|
2021-02-22 12:18:11 +01:00
|
|
|
temp_html.write_string("<div id='name_$counter' class='several-$counter'>Look at $counter</div>")
|
2020-08-09 04:13:34 +02:00
|
|
|
}
|
2021-02-22 12:18:11 +01:00
|
|
|
temp_html.write_string('</body></html>')
|
2020-12-09 20:08:15 +01:00
|
|
|
parser.parse_html(temp_html.str())
|
|
|
|
assert parser.tags.len == 4009
|
2020-08-09 04:13:34 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
fn test_script_tag() {
|
|
|
|
mut parser := Parser{}
|
2020-12-09 20:08:15 +01:00
|
|
|
script_content := "\nvar googletag = googletag || {};\ngoogletag.cmd = googletag.cmd || [];if(3 > 5) {console.log(\'Birl\');}\n"
|
|
|
|
temp_html := '<html><body><script>$script_content</script></body></html>'
|
|
|
|
parser.parse_html(temp_html)
|
|
|
|
assert parser.tags[2].content.len == script_content.replace('\n', '').len
|
2020-08-09 04:13:34 +02:00
|
|
|
}
|