diff --git a/test-gen/src/main.rs b/test-gen/src/main.rs index 65b77d7d..92a1e89f 100644 --- a/test-gen/src/main.rs +++ b/test-gen/src/main.rs @@ -284,6 +284,15 @@ fn main() { .expect(&format!("label `{}` is unsupported", label)); process_index(enc, &codepoints); + if enc == ISO_8859_8 { + // ISO_8859_8_I does not have its own index in encoding/indexes.json, + // but it has the same mapping as ISO_8859_8. + // + // Wikipedia (https://en.wikipedia.org/wiki/ISO-8859-8-I): + // The WHATWG Encoding Standard used by HTML5 treats ISO-8859-8 and ISO-8859-8-I + // as distinct encodings with the same mapping due to influence on the layout direction + process_index(ISO_8859_8_I, &codepoints); + } } // https://encoding.spec.whatwg.org/#x-user-defined-decoder make_xml(X_USER_DEFINED, '\u{F780}'..='\u{F7FF}'); diff --git a/tests/documents/encoding/ISO-8859-8-I.xml b/tests/documents/encoding/ISO-8859-8-I.xml index af5aadbb..9ee16eef 100644 --- a/tests/documents/encoding/ISO-8859-8-I.xml +++ b/tests/documents/encoding/ISO-8859-8-I.xml @@ -1,16 +1,17 @@ - - + + - - -  -  !"#$%'()*+,-./0123456789:;=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~ - - <[[CDATA[[ -  !"#$%'()*+,-./0123456789:;=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~]]> + + + + !"#$%'()*+,-./0123456789:;=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~ + + ?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~]]> \ No newline at end of file