diff options
author | Martin Fischer <martin@push-f.com> | 2023-08-12 11:06:02 +0200 |
---|---|---|
committer | Martin Fischer <martin@push-f.com> | 2023-08-19 06:41:55 +0200 |
commit | 9f1019afa7a8e9102d67356d85bd632044eb2d0c (patch) | |
tree | 4c6664aad5a11a942d6684a62e507de28193f5bb /integration_tests/tests | |
parent | c3d60e88efa32329614178dfc9455ef33ea0a88d (diff) |
break!: merge Tokenizer::new_with_emitter into Tokenizer::new
The Tokenizer does not perform any state switching, since
proper state switching requires a feedback loop between
tokenization and DOM tree building. Using the Tokenizer
directly is therefore a bit of a pitfall, since you might
not expect it to tokenize e.g. `<script><b>` as:
StartTag(StartTag { name: "script", .. })
StartTag(StartTag { name: "b", .. })
Since we don't want to make walking into pitfalls
particularly easy, this commit changes the Tokenizer::new
method so that you have to specify the Emitter.
Since this makes new_with_emitter redundant, it is removed.
Diffstat (limited to 'integration_tests/tests')
-rw-r--r-- | integration_tests/tests/test_html5lib.rs | 9 |
1 file changed, 6 insertions, 3 deletions
diff --git a/integration_tests/tests/test_html5lib.rs b/integration_tests/tests/test_html5lib.rs
index 23adec0..f5a69c3 100644
--- a/integration_tests/tests/test_html5lib.rs
+++ b/integration_tests/tests/test_html5lib.rs
@@ -3,7 +3,7 @@ use std::{fs::File, io::BufReader, path::Path};
 use html5lib_tests::{
     parse_tests, Error as TestError, InitialState, Output, Test, Token as TestToken,
 };
-use html5tokenizer::{InternalState, Reader, Token, Tokenizer};
+use html5tokenizer::{DefaultEmitter, InternalState, Reader, Token, Tokenizer};
 use pretty_assertions::assert_eq;
 
 /// Path to a local checkout of [html5lib-tests], relative to the
@@ -69,7 +69,7 @@ fn run_test(fname: &str, test_i: usize, test: Test) {
             test_i,
             &test,
             state,
-            Tokenizer::new(&test.input),
+            Tokenizer::new(&test.input, DefaultEmitter::default()),
             "string",
         );
 
@@ -78,7 +78,10 @@ fn run_test(fname: &str, test_i: usize, test: Test) {
             test_i,
             &test,
             state,
-            Tokenizer::new(BufReader::new(test.input.as_bytes())),
+            Tokenizer::new(
+                BufReader::new(test.input.as_bytes()),
+                DefaultEmitter::default(),
+            ),
             "bufread",
         );
     }