From cd177d94ec3c65f338110490807c40e2fec498dc Mon Sep 17 00:00:00 2001 From: Andrew Gallant Date: Thu, 12 Mar 2020 21:40:48 -0400 Subject: [PATCH] syntax: update to Unicode 13 --- regex-syntax/src/unicode.rs | 1 + regex-syntax/src/unicode_tables/age.rs | 183 ++-- .../src/unicode_tables/case_folding_simple.rs | 38 +- .../src/unicode_tables/general_category.rs | 575 ++++++----- .../unicode_tables/grapheme_cluster_break.rs | 38 +- .../src/unicode_tables/perl_decimal.rs | 10 +- regex-syntax/src/unicode_tables/perl_space.rs | 4 +- regex-syntax/src/unicode_tables/perl_word.rs | 100 +- .../src/unicode_tables/property_bool.rs | 960 +++++++++++------- .../src/unicode_tables/property_names.rs | 13 +- .../src/unicode_tables/property_values.rs | 22 +- regex-syntax/src/unicode_tables/script.rs | 179 ++-- .../src/unicode_tables/script_extension.rs | 187 ++-- .../src/unicode_tables/sentence_break.rs | 129 ++- regex-syntax/src/unicode_tables/word_break.rs | 99 +- 15 files changed, 1577 insertions(+), 961 deletions(-) diff --git a/regex-syntax/src/unicode.rs b/regex-syntax/src/unicode.rs index 506529d117..7e414396f5 100644 --- a/regex-syntax/src/unicode.rs +++ b/regex-syntax/src/unicode.rs @@ -595,6 +595,7 @@ fn ages(canonical_age: &str) -> Result> { ("V11_0", age::V11_0), ("V12_0", age::V12_0), ("V12_1", age::V12_1), + ("V13_0", age::V13_0), ]; assert_eq!(AGES.len(), age::BY_NAME.len(), "ages are out of sync"); diff --git a/regex-syntax/src/unicode_tables/age.rs b/regex-syntax/src/unicode_tables/age.rs index 30e6ee174a..1452a521c5 100644 --- a/regex-syntax/src/unicode_tables/age.rs +++ b/regex-syntax/src/unicode_tables/age.rs @@ -1,14 +1,15 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate age /tmp/ucd/12.1.0/ --chars +// ucd-generate age ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("V10_0", V10_0), ("V11_0", V11_0), ("V12_0", V12_0), ("V12_1", V12_1), + ("V13_0", V13_0), ("V1_1", V1_1), ("V2_0", V2_0), ("V2_1", V2_1), @@ -135,69 +136,131 @@ pub const V11_0: &'static [(char, char)] = &[ ]; pub const V12_0: &'static [(char, char)] = &[ - ('\u{c77}', '\u{c77}'), - ('\u{e86}', '\u{e86}'), - ('\u{e89}', '\u{e89}'), - ('\u{e8c}', '\u{e8c}'), - ('\u{e8e}', '\u{e93}'), - ('\u{e98}', '\u{e98}'), - ('\u{ea0}', '\u{ea0}'), - ('\u{ea8}', '\u{ea9}'), - ('\u{eac}', '\u{eac}'), + ('౷', '౷'), + ('ຆ', 'ຆ'), + ('ຉ', 'ຉ'), + ('ຌ', 'ຌ'), + ('ຎ', 'ຓ'), + ('ຘ', 'ຘ'), + ('ຠ', 'ຠ'), + ('ຨ', 'ຩ'), + ('ຬ', 'ຬ'), ('\u{eba}', '\u{eba}'), - ('\u{1cfa}', '\u{1cfa}'), - ('\u{2bc9}', '\u{2bc9}'), - ('\u{2bff}', '\u{2bff}'), - ('\u{2e4f}', '\u{2e4f}'), - ('\u{a7ba}', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('\u{ab66}', '\u{ab67}'), - ('\u{10fe0}', '\u{10ff6}'), - ('\u{1145f}', '\u{1145f}'), - ('\u{116b8}', '\u{116b8}'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d7}'), - ('\u{119da}', '\u{119e4}'), - ('\u{11a84}', '\u{11a85}'), - ('\u{11fc0}', '\u{11ff1}'), - ('\u{11fff}', '\u{11fff}'), + ('ᳺ', 'ᳺ'), + ('⯉', '⯉'), + ('⯿', '⯿'), + ('⹏', '⹏'), + ('Ꞻ', 'ꞿ'), + ('Ꟃ', 'Ᶎ'), + ('ꭦ', 'ꭧ'), + ('𐿠', '𐿶'), + ('𑑟', '𑑟'), + ('𑚸', '𑚸'), + ('𑦠', '𑦧'), + ('𑦪', '\u{119d7}'), + ('\u{119da}', '𑧤'), + ('𑪄', '𑪅'), + ('𑿀', '𑿱'), + ('𑿿', '𑿿'), ('\u{13430}', '\u{13438}'), - ('\u{16f45}', '\u{16f4a}'), + ('𖽅', '𖽊'), ('\u{16f4f}', '\u{16f4f}'), - ('\u{16f7f}', '\u{16f87}'), - ('\u{16fe2}', '\u{16fe3}'), - ('\u{187f2}', '\u{187f7}'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e130}', '\u{1e13d}'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e14e}', '\u{1e14f}'), - ('\u{1e2c0}', '\u{1e2f9}'), - ('\u{1e2ff}', '\u{1e2ff}'), - ('\u{1e94b}', '\u{1e94b}'), - ('\u{1ed01}', '\u{1ed3d}'), - ('\u{1f16c}', '\u{1f16c}'), - ('\u{1f6d5}', '\u{1f6d5}'), - ('\u{1f6fa}', '\u{1f6fa}'), - ('\u{1f7e0}', '\u{1f7eb}'), - ('\u{1f90d}', '\u{1f90f}'), - ('\u{1f93f}', '\u{1f93f}'), - ('\u{1f971}', '\u{1f971}'), - ('\u{1f97b}', '\u{1f97b}'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9af}'), - ('\u{1f9ba}', '\u{1f9bf}'), - ('\u{1f9c3}', '\u{1f9ca}'), - ('\u{1f9cd}', '\u{1f9cf}'), - ('\u{1fa00}', '\u{1fa53}'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), + ('𖽿', '𖾇'), + ('𖿢', '𖿣'), + ('𘟲', '𘟷'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), + ('𞄀', '𞄬'), + ('\u{1e130}', '𞄽'), + ('𞅀', '𞅉'), + ('𞅎', '𞅏'), + ('𞋀', '𞋹'), + ('𞋿', '𞋿'), + ('𞥋', '𞥋'), + ('𞴁', '𞴽'), + ('🅬', '🅬'), + ('🛕', '🛕'), + ('🛺', '🛺'), + ('🟠', '🟫'), + ('🤍', '🤏'), + ('🤿', '🤿'), + ('🥱', '🥱'), + ('🥻', '🥻'), + ('🦥', '🦪'), + ('🦮', '🦯'), + ('🦺', '🦿'), + ('🧃', '🧊'), + ('🧍', '🧏'), + ('🨀', '🩓'), + ('🩰', '🩳'), + ('🩸', '🩺'), + ('🪀', '🪂'), + ('🪐', '🪕'), ]; -pub const V12_1: &'static [(char, char)] = &[('\u{32ff}', '\u{32ff}')]; +pub const V12_1: &'static [(char, char)] = &[('㋿', '㋿')]; + +pub const V13_0: &'static [(char, char)] = &[ + ('\u{8be}', '\u{8c7}'), + ('\u{b55}', '\u{b55}'), + ('\u{d04}', '\u{d04}'), + ('\u{d81}', '\u{d81}'), + ('\u{1abf}', '\u{1ac0}'), + ('\u{2b97}', '\u{2b97}'), + ('\u{2e50}', '\u{2e52}'), + ('\u{31bb}', '\u{31bf}'), + ('\u{4db6}', '\u{4dbf}'), + ('\u{9ff0}', '\u{9ffc}'), + ('\u{a7c7}', '\u{a7ca}'), + ('\u{a7f5}', '\u{a7f6}'), + ('\u{a82c}', '\u{a82c}'), + ('\u{ab68}', '\u{ab6b}'), + ('\u{1019c}', '\u{1019c}'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eab}', '\u{10ead}'), + ('\u{10eb0}', '\u{10eb1}'), + ('\u{10fb0}', '\u{10fcb}'), + ('\u{11147}', '\u{11147}'), + ('\u{111ce}', '\u{111cf}'), + ('\u{1145a}', '\u{1145a}'), + ('\u{11460}', '\u{11461}'), + ('\u{11900}', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{11946}'), + ('\u{11950}', '\u{11959}'), + ('\u{11fb0}', '\u{11fb0}'), + ('\u{16fe4}', '\u{16fe4}'), + ('\u{16ff0}', '\u{16ff1}'), + ('\u{18af3}', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), + ('\u{1f10d}', '\u{1f10f}'), + ('\u{1f16d}', '\u{1f16f}'), + ('\u{1f1ad}', '\u{1f1ad}'), + ('\u{1f6d6}', '\u{1f6d7}'), + ('\u{1f6fb}', '\u{1f6fc}'), + ('\u{1f8b0}', '\u{1f8b1}'), + ('\u{1f90c}', '\u{1f90c}'), + ('\u{1f972}', '\u{1f972}'), + ('\u{1f977}', '\u{1f978}'), + ('\u{1f9a3}', '\u{1f9a4}'), + ('\u{1f9ab}', '\u{1f9ad}'), + ('\u{1f9cb}', '\u{1f9cb}'), + ('\u{1fa74}', '\u{1fa74}'), + ('\u{1fa83}', '\u{1fa86}'), + ('\u{1fa96}', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), + ('\u{1fb00}', '\u{1fb92}'), + ('\u{1fb94}', '\u{1fbca}'), + ('\u{1fbf0}', '\u{1fbf9}'), + ('\u{2a6d7}', '\u{2a6dd}'), + ('\u{30000}', '\u{3134a}'), +]; pub const V1_1: &'static [(char, char)] = &[ ('\u{0}', 'ǵ'), diff --git a/regex-syntax/src/unicode_tables/case_folding_simple.rs b/regex-syntax/src/unicode_tables/case_folding_simple.rs index 39f4176585..6b4cad3a3f 100644 --- a/regex-syntax/src/unicode_tables/case_folding_simple.rs +++ b/regex-syntax/src/unicode_tables/case_folding_simple.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate case-folding-simple /tmp/ucd/12.1.0/ --chars --all-pairs +// ucd-generate case-folding-simple ucd-13.0.0 --chars --all-pairs // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('A', &['a']), @@ -459,7 +459,7 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('ɵ', &['Ɵ']), ('ɽ', &['Ɽ']), ('ʀ', &['Ʀ']), - ('ʂ', &['\u{a7c5}']), + ('ʂ', &['Ʂ']), ('ʃ', &['Ʃ']), ('ʇ', &['Ʇ']), ('ʈ', &['Ʈ']), @@ -1199,7 +1199,7 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('Ჿ', &['ჿ']), ('ᵹ', &['Ᵹ']), ('ᵽ', &['Ᵽ']), - ('ᶎ', &['\u{a7c6}']), + ('ᶎ', &['Ᶎ']), ('Ḁ', &['ḁ']), ('ḁ', &['Ḁ']), ('Ḃ', &['ḃ']), @@ -2167,7 +2167,7 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('ꞑ', &['Ꞑ']), ('Ꞓ', &['ꞓ']), ('ꞓ', &['Ꞓ']), - ('ꞔ', &['\u{a7c4}']), + ('ꞔ', &['Ꞔ']), ('Ꞗ', &['ꞗ']), ('ꞗ', &['Ꞗ']), ('Ꞙ', &['ꞙ']), @@ -2203,17 +2203,23 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('ꞷ', &['Ꞷ']), ('Ꞹ', &['ꞹ']), ('ꞹ', &['Ꞹ']), - ('\u{a7ba}', &['\u{a7bb}']), - ('\u{a7bb}', &['\u{a7ba}']), - ('\u{a7bc}', &['\u{a7bd}']), - ('\u{a7bd}', &['\u{a7bc}']), - ('\u{a7be}', &['\u{a7bf}']), - ('\u{a7bf}', &['\u{a7be}']), - ('\u{a7c2}', &['\u{a7c3}']), - ('\u{a7c3}', &['\u{a7c2}']), - ('\u{a7c4}', &['ꞔ']), - ('\u{a7c5}', &['ʂ']), - ('\u{a7c6}', &['ᶎ']), + ('Ꞻ', &['ꞻ']), + ('ꞻ', &['Ꞻ']), + ('Ꞽ', &['ꞽ']), + ('ꞽ', &['Ꞽ']), + ('Ꞿ', &['ꞿ']), + ('ꞿ', &['Ꞿ']), + ('Ꟃ', &['ꟃ']), + ('ꟃ', &['Ꟃ']), + ('Ꞔ', &['ꞔ']), + ('Ʂ', &['ʂ']), + ('Ᶎ', &['ᶎ']), + ('\u{a7c7}', &['\u{a7c8}']), + ('\u{a7c8}', &['\u{a7c7}']), + ('\u{a7c9}', &['\u{a7ca}']), + ('\u{a7ca}', &['\u{a7c9}']), + ('\u{a7f5}', &['\u{a7f6}']), + ('\u{a7f6}', &['\u{a7f5}']), ('ꭓ', &['Ꭓ']), ('ꭰ', &['Ꭰ']), ('ꭱ', &['Ꭱ']), diff --git a/regex-syntax/src/unicode_tables/general_category.rs b/regex-syntax/src/unicode_tables/general_category.rs index 7662c46aff..f2f9cef06a 100644 --- a/regex-syntax/src/unicode_tables/general_category.rs +++ b/regex-syntax/src/unicode_tables/general_category.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate general-category /tmp/ucd/12.1.0/ --chars --exclude surrogate +// ucd-generate general-category ucd-13.0.0 --chars --exclude surrogate // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Cased_Letter", CASED_LETTER), @@ -128,11 +128,12 @@ pub const CASED_LETTER: &'static [(char, char)] = &[ ('Ꜣ', 'ꝯ'), ('ꝱ', 'ꞇ'), ('Ꞌ', 'ꞎ'), - ('Ꞑ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), + ('Ꞑ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', '\u{a7f6}'), ('ꟺ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭠ', '\u{ab67}'), + ('ꭠ', '\u{ab68}'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -284,8 +285,8 @@ pub const CURRENCY_SYMBOL: &'static [(char, char)] = &[ ('$', '$'), ('¢', '£'), ('¥', '₩'), - ('\u{11fdd}', '\u{11fe0}'), - ('\u{1e2ff}', '\u{1e2ff}'), + ('𑿝', '𑿠'), + ('𞋿', '𞋿'), ('𞲰', '𞲰'), ]; @@ -307,6 +308,7 @@ pub const DASH_PUNCTUATION: &'static [(char, char)] = &[ ('﹘', '﹘'), ('﹣', '﹣'), ('-', '-'), + ('\u{10ead}', '\u{10ead}'), ]; pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ @@ -360,15 +362,17 @@ pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), + ('\u{11950}', '\u{11959}'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e2f0}', '\u{1e2f9}'), + ('𞅀', '𞅉'), + ('𞋰', '𞋹'), ('𞥐', '𞥙'), + ('\u{1fbf0}', '\u{1fbf9}'), ]; pub const ENCLOSING_MARK: &'static [(char, char)] = &[ @@ -480,7 +484,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -556,7 +560,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ೞ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('അ', 'ഌ'), + ('\u{d04}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -574,8 +578,8 @@ pub const LETTER: &'static [(char, char)] = &[ ('เ', 'ๆ'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ະ'), ('າ', 'ຳ'), @@ -660,7 +664,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', 'ᳶ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ᴀ', 'ᶿ'), ('Ḁ', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -727,10 +731,10 @@ pub const LETTER: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -741,9 +745,9 @@ pub const LETTER: &'static [(char, char)] = &[ ('ꚠ', 'ꛥ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠁ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -780,7 +784,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab69}'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -864,15 +868,19 @@ pub const LETTER: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀃', '𑀷'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), + ('\u{11147}', '\u{11147}'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -898,7 +906,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -907,15 +915,21 @@ pub const LETTER: &'static [(char, char)] = &[ ('𑘀', '𑘯'), ('𑙄', '𑙄'), ('𑚀', '𑚪'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑜀', '𑜚'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d0}'), - ('\u{119e1}', '\u{119e1}'), - ('\u{119e3}', '\u{119e3}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{1192f}'), + ('\u{1193f}', '\u{1193f}'), + ('\u{11941}', '\u{11941}'), + ('𑦠', '𑦧'), + ('𑦪', '𑧐'), + ('𑧡', '𑧡'), + ('𑧣', '𑧣'), ('𑨀', '𑨀'), ('𑨋', '𑨲'), ('𑨺', '𑨺'), @@ -936,6 +950,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒒀', '𒕃'), ('𓀀', '𓐮'), @@ -948,16 +963,17 @@ pub const LETTER: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), + ('𖼀', '𖽊'), ('𖽐', '𖽐'), ('𖾓', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '𖿣'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -993,13 +1009,13 @@ pub const LETTER: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2eb}'), + ('𞄀', '𞄬'), + ('𞄷', '𞄽'), + ('𞅎', '𞅎'), + ('𞋀', '𞋫'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), - ('\u{1e94b}', '\u{1e94b}'), + ('𞥋', '𞥋'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), ('𞸡', '𞸢'), @@ -1033,12 +1049,13 @@ pub const LETTER: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const LETTER_NUMBER: &'static [(char, char)] = &[ @@ -1657,13 +1674,16 @@ pub const LOWERCASE_LETTER: &'static [(char, char)] = &[ ('ꞵ', 'ꞵ'), ('ꞷ', 'ꞷ'), ('ꞹ', 'ꞹ'), - ('\u{a7bb}', '\u{a7bb}'), - ('\u{a7bd}', '\u{a7bd}'), - ('\u{a7bf}', '\u{a7bf}'), - ('\u{a7c3}', '\u{a7c3}'), + ('ꞻ', 'ꞻ'), + ('ꞽ', 'ꞽ'), + ('ꞿ', 'ꞿ'), + ('ꟃ', 'ꟃ'), + ('\u{a7c8}', '\u{a7c8}'), + ('\u{a7ca}', '\u{a7ca}'), + ('\u{a7f6}', '\u{a7f6}'), ('ꟺ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭠ', '\u{ab67}'), + ('ꭠ', '\u{ab68}'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -1763,7 +1783,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{b3e}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('\u{b62}', '\u{b63}'), ('\u{b82}', '\u{b82}'), ('\u{bbe}', 'ூ'), @@ -1790,7 +1810,7 @@ pub const MARK: &'static [(char, char)] = &[ ('ൊ', '\u{d4d}'), ('\u{d57}', '\u{d57}'), ('\u{d62}', '\u{d63}'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('\u{dca}', '\u{dca}'), ('\u{dcf}', '\u{dd4}'), ('\u{dd6}', '\u{dd6}'), @@ -1837,7 +1857,7 @@ pub const MARK: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('\u{1a60}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1b00}', 'ᬄ'), ('\u{1b34}', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -1866,6 +1886,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{a806}', '\u{a806}'), ('\u{a80b}', '\u{a80b}'), ('ꠣ', 'ꠧ'), + ('\u{a82c}', '\u{a82c}'), ('ꢀ', 'ꢁ'), ('ꢴ', '\u{a8c5}'), ('\u{a8e0}', '\u{a8f1}'), @@ -1901,6 +1922,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{10a3f}', '\u{10a3f}'), ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11046}'), @@ -1913,6 +1935,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{11180}', '𑆂'), ('𑆳', '𑇀'), ('\u{111c9}', '\u{111cc}'), + ('\u{111ce}', '\u{111cf}'), ('𑈬', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), ('\u{112df}', '\u{112ea}'), @@ -1935,9 +1958,14 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b7}'), ('\u{1171d}', '\u{1172b}'), ('𑠬', '\u{1183a}'), - ('\u{119d1}', '\u{119d7}'), + ('\u{11930}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{1193e}'), + ('\u{11940}', '\u{11940}'), + ('\u{11942}', '\u{11943}'), + ('𑧑', '\u{119d7}'), ('\u{119da}', '\u{119e0}'), - ('\u{119e4}', '\u{119e4}'), + ('𑧤', '𑧤'), ('\u{11a01}', '\u{11a0a}'), ('\u{11a33}', '𑨹'), ('\u{11a3b}', '\u{11a3e}'), @@ -1960,8 +1988,10 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), - ('𖽑', '\u{16f87}'), + ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), + ('\u{16fe4}', '\u{16fe4}'), + ('\u{16ff0}', '\u{16ff1}'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), @@ -2107,14 +2137,15 @@ pub const MODIFIER_LETTER: &'static [(char, char)] = &[ ('ꫝ', 'ꫝ'), ('ꫳ', 'ꫴ'), ('ꭜ', 'ꭟ'), + ('\u{ab69}', '\u{ab69}'), ('ー', 'ー'), ('\u{ff9e}', '\u{ff9f}'), ('𖭀', '𖭃'), ('𖾓', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e94b}', '\u{1e94b}'), + ('𖿣', '𖿣'), + ('𞄷', '𞄽'), + ('𞥋', '𞥋'), ]; pub const MODIFIER_SYMBOL: &'static [(char, char)] = &[ @@ -2142,6 +2173,7 @@ pub const MODIFIER_SYMBOL: &'static [(char, char)] = &[ ('꜠', '꜡'), ('꞉', '꞊'), ('꭛', '꭛'), + ('\u{ab6a}', '\u{ab6b}'), ('﮲', '﯁'), ('^', '^'), ('`', '`'), @@ -2208,7 +2240,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{b3f}', '\u{b3f}'), ('\u{b41}', '\u{b44}'), ('\u{b4d}', '\u{b4d}'), - ('\u{b56}', '\u{b56}'), + ('\u{b55}', '\u{b56}'), ('\u{b62}', '\u{b63}'), ('\u{b82}', '\u{b82}'), ('\u{bc0}', '\u{bc0}'), @@ -2231,6 +2263,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{d41}', '\u{d44}'), ('\u{d4d}', '\u{d4d}'), ('\u{d62}', '\u{d63}'), + ('\u{d81}', '\u{d81}'), ('\u{dca}', '\u{dca}'), ('\u{dd2}', '\u{dd4}'), ('\u{dd6}', '\u{dd6}'), @@ -2288,6 +2321,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), ('\u{1ab0}', '\u{1abd}'), + ('\u{1abf}', '\u{1ac0}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b34}'), ('\u{1b36}', '\u{1b3a}'), @@ -2328,6 +2362,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{a806}', '\u{a806}'), ('\u{a80b}', '\u{a80b}'), ('\u{a825}', '\u{a826}'), + ('\u{a82c}', '\u{a82c}'), ('\u{a8c4}', '\u{a8c5}'), ('\u{a8e0}', '\u{a8f1}'), ('\u{a8ff}', '\u{a8ff}'), @@ -2336,7 +2371,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{a980}', '\u{a982}'), ('\u{a9b3}', '\u{a9b3}'), ('\u{a9b6}', '\u{a9b9}'), - ('\u{a9bc}', 'ꦽ'), + ('\u{a9bc}', '\u{a9bd}'), ('\u{a9e5}', '\u{a9e5}'), ('\u{aa29}', '\u{aa2e}'), ('\u{aa31}', '\u{aa32}'), @@ -2367,6 +2402,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{10a3f}', '\u{10a3f}'), ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), @@ -2380,6 +2416,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{11180}', '\u{11181}'), ('\u{111b6}', '\u{111be}'), ('\u{111c9}', '\u{111cc}'), + ('\u{111cf}', '\u{111cf}'), ('\u{1122f}', '\u{11231}'), ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), @@ -2415,6 +2452,9 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{11727}', '\u{1172b}'), ('\u{1182f}', '\u{11837}'), ('\u{11839}', '\u{1183a}'), + ('\u{1193b}', '\u{1193c}'), + ('\u{1193e}', '\u{1193e}'), + ('\u{11943}', '\u{11943}'), ('\u{119d4}', '\u{119d7}'), ('\u{119da}', '\u{119db}'), ('\u{119e0}', '\u{119e0}'), @@ -2446,6 +2486,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), ('\u{16f8f}', '\u{16f92}'), + ('\u{16fe4}', '\u{16fe4}'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1d167}', '\u{1d169}'), ('\u{1d17b}', '\u{1d182}'), @@ -2567,6 +2608,7 @@ pub const NUMBER: &'static [(char, char)] = &[ ('𐹠', '𐹾'), ('𐼝', '𐼦'), ('𐽑', '𐽔'), + ('\u{10fc5}', '\u{10fcb}'), ('𑁒', '𑁯'), ('𑃰', '𑃹'), ('𑄶', '𑄿'), @@ -2579,10 +2621,11 @@ pub const NUMBER: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜻'), ('𑣠', '𑣲'), + ('\u{11950}', '\u{11959}'), ('𑱐', '𑱬'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), - ('\u{11fc0}', '\u{11fd4}'), + ('𑿀', '𑿔'), ('𒐀', '𒑮'), ('𖩠', '𖩩'), ('𖭐', '𖭙'), @@ -2591,16 +2634,17 @@ pub const NUMBER: &'static [(char, char)] = &[ ('𝋠', '𝋳'), ('𝍠', '𝍸'), ('𝟎', '𝟿'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e2f0}', '\u{1e2f9}'), + ('𞅀', '𞅉'), + ('𞋰', '𞋹'), ('𞣇', '𞣏'), ('𞥐', '𞥙'), ('𞱱', '𞲫'), ('𞲭', '𞲯'), ('𞲱', '𞲴'), - ('\u{1ed01}', '\u{1ed2d}'), - ('\u{1ed2f}', '\u{1ed3d}'), + ('𞴁', '𞴭'), + ('𞴯', '𞴽'), ('🄀', '🄌'), + ('\u{1fbf0}', '\u{1fbf9}'), ]; pub const OPEN_PUNCTUATION: &'static [(char, char)] = &[ @@ -2709,7 +2753,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{85f}', '\u{85f}'), ('\u{86b}', '\u{89f}'), ('\u{8b5}', '\u{8b5}'), - ('\u{8be}', '\u{8d2}'), + ('\u{8c8}', '\u{8d2}'), ('\u{8e2}', '\u{8e2}'), ('\u{984}', '\u{984}'), ('\u{98d}', '\u{98e}'), @@ -2764,7 +2808,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{b3a}', '\u{b3b}'), ('\u{b45}', '\u{b46}'), ('\u{b49}', '\u{b4a}'), - ('\u{b4e}', '\u{b55}'), + ('\u{b4e}', '\u{b54}'), ('\u{b58}', '\u{b5b}'), ('\u{b5e}', '\u{b5e}'), ('\u{b64}', '\u{b65}'), @@ -2809,14 +2853,13 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{ce4}', '\u{ce5}'), ('\u{cf0}', '\u{cf0}'), ('\u{cf3}', '\u{cff}'), - ('\u{d04}', '\u{d04}'), ('\u{d0d}', '\u{d0d}'), ('\u{d11}', '\u{d11}'), ('\u{d45}', '\u{d45}'), ('\u{d49}', '\u{d49}'), ('\u{d50}', '\u{d53}'), ('\u{d64}', '\u{d65}'), - ('\u{d80}', '\u{d81}'), + ('\u{d80}', '\u{d80}'), ('\u{d84}', '\u{d84}'), ('\u{d97}', '\u{d99}'), ('\u{db2}', '\u{db2}'), @@ -2903,7 +2946,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1a8a}', '\u{1a8f}'), ('\u{1a9a}', '\u{1a9f}'), ('\u{1aae}', '\u{1aaf}'), - ('\u{1abf}', '\u{1aff}'), + ('\u{1ac1}', '\u{1aff}'), ('\u{1b4c}', '\u{1b4f}'), ('\u{1b7d}', '\u{1b7f}'), ('\u{1bf4}', '\u{1bfb}'), @@ -2942,7 +2985,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{2427}', '\u{243f}'), ('\u{244b}', '\u{245f}'), ('\u{2b74}', '\u{2b75}'), - ('\u{2b96}', '\u{2b97}'), + ('\u{2b96}', '\u{2b96}'), ('\u{2c2f}', '\u{2c2f}'), ('\u{2c5f}', '\u{2c5f}'), ('\u{2cf4}', '\u{2cf8}'), @@ -2960,7 +3003,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{2dcf}', '\u{2dcf}'), ('\u{2dd7}', '\u{2dd7}'), ('\u{2ddf}', '\u{2ddf}'), - ('\u{2e50}', '\u{2e7f}'), + ('\u{2e53}', '\u{2e7f}'), ('\u{2e9a}', '\u{2e9a}'), ('\u{2ef4}', '\u{2eff}'), ('\u{2fd6}', '\u{2fef}'), @@ -2970,18 +3013,16 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{3100}', '\u{3104}'), ('\u{3130}', '\u{3130}'), ('\u{318f}', '\u{318f}'), - ('\u{31bb}', '\u{31bf}'), ('\u{31e4}', '\u{31ef}'), ('\u{321f}', '\u{321f}'), - ('\u{4db6}', '\u{4dbf}'), - ('\u{9ff0}', '\u{9fff}'), + ('\u{9ffd}', '\u{9fff}'), ('\u{a48d}', '\u{a48f}'), ('\u{a4c7}', '\u{a4cf}'), ('\u{a62c}', '\u{a63f}'), ('\u{a6f8}', '\u{a6ff}'), ('\u{a7c0}', '\u{a7c1}'), - ('\u{a7c7}', '\u{a7f6}'), - ('\u{a82c}', '\u{a82f}'), + ('\u{a7cb}', '\u{a7f4}'), + ('\u{a82d}', '\u{a82f}'), ('\u{a83a}', '\u{a83f}'), ('\u{a878}', '\u{a87f}'), ('\u{a8c6}', '\u{a8cd}'), @@ -3001,7 +3042,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{ab17}', '\u{ab1f}'), ('\u{ab27}', '\u{ab27}'), ('\u{ab2f}', '\u{ab2f}'), - ('\u{ab68}', '\u{ab6f}'), + ('\u{ab6c}', '\u{ab6f}'), ('\u{abee}', '\u{abef}'), ('\u{abfa}', '\u{abff}'), ('\u{d7a4}', '\u{d7af}'), @@ -3045,7 +3086,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{10103}', '\u{10106}'), ('\u{10134}', '\u{10136}'), ('\u{1018f}', '\u{1018f}'), - ('\u{1019c}', '\u{1019f}'), + ('\u{1019d}', '\u{1019f}'), ('\u{101a1}', '\u{101cf}'), ('\u{101fe}', '\u{1027f}'), ('\u{1029d}', '\u{1029f}'), @@ -3104,9 +3145,13 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{10cf3}', '\u{10cf9}'), ('\u{10d28}', '\u{10d2f}'), ('\u{10d3a}', '\u{10e5f}'), - ('\u{10e7f}', '\u{10eff}'), + ('\u{10e7f}', '\u{10e7f}'), + ('\u{10eaa}', '\u{10eaa}'), + ('\u{10eae}', '\u{10eaf}'), + ('\u{10eb2}', '\u{10eff}'), ('\u{10f28}', '\u{10f2f}'), - ('\u{10f5a}', '\u{10fdf}'), + ('\u{10f5a}', '\u{10faf}'), + ('\u{10fcc}', '\u{10fdf}'), ('\u{10ff7}', '\u{10fff}'), ('\u{1104e}', '\u{11051}'), ('\u{11070}', '\u{1107e}'), @@ -3115,9 +3160,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{110e9}', '\u{110ef}'), ('\u{110fa}', '\u{110ff}'), ('\u{11135}', '\u{11135}'), - ('\u{11147}', '\u{1114f}'), + ('\u{11148}', '\u{1114f}'), ('\u{11177}', '\u{1117f}'), - ('\u{111ce}', '\u{111cf}'), ('\u{111e0}', '\u{111e0}'), ('\u{111f5}', '\u{111ff}'), ('\u{11212}', '\u{11212}'), @@ -3144,9 +3188,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{11364}', '\u{11365}'), ('\u{1136d}', '\u{1136f}'), ('\u{11375}', '\u{113ff}'), - ('\u{1145a}', '\u{1145a}'), ('\u{1145c}', '\u{1145c}'), - ('\u{11460}', '\u{1147f}'), + ('\u{11462}', '\u{1147f}'), ('\u{114c8}', '\u{114cf}'), ('\u{114da}', '\u{1157f}'), ('\u{115b6}', '\u{115b7}'), @@ -3161,7 +3204,14 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{11740}', '\u{117ff}'), ('\u{1183c}', '\u{1189f}'), ('\u{118f3}', '\u{118fe}'), - ('\u{11900}', '\u{1199f}'), + ('\u{11907}', '\u{11908}'), + ('\u{1190a}', '\u{1190b}'), + ('\u{11914}', '\u{11914}'), + ('\u{11917}', '\u{11917}'), + ('\u{11936}', '\u{11936}'), + ('\u{11939}', '\u{1193a}'), + ('\u{11947}', '\u{1194f}'), + ('\u{1195a}', '\u{1199f}'), ('\u{119a8}', '\u{119a9}'), ('\u{119d8}', '\u{119d9}'), ('\u{119e5}', '\u{119ff}'), @@ -3188,7 +3238,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{11d92}', '\u{11d92}'), ('\u{11d99}', '\u{11d9f}'), ('\u{11daa}', '\u{11edf}'), - ('\u{11ef9}', '\u{11fbf}'), + ('\u{11ef9}', '\u{11faf}'), + ('\u{11fb1}', '\u{11fbf}'), ('\u{11ff2}', '\u{11ffe}'), ('\u{1239a}', '\u{123ff}'), ('\u{1246f}', '\u{1246f}'), @@ -3211,9 +3262,11 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{16f4b}', '\u{16f4e}'), ('\u{16f88}', '\u{16f8e}'), ('\u{16fa0}', '\u{16fdf}'), - ('\u{16fe4}', '\u{16fff}'), + ('\u{16fe5}', '\u{16fef}'), + ('\u{16ff2}', '\u{16fff}'), ('\u{187f8}', '\u{187ff}'), - ('\u{18af3}', '\u{1afff}'), + ('\u{18cd6}', '\u{18cff}'), + ('\u{18d09}', '\u{1afff}'), ('\u{1b11f}', '\u{1b14f}'), ('\u{1b153}', '\u{1b163}'), ('\u{1b168}', '\u{1b16f}'), @@ -3312,17 +3365,15 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1f0c0}', '\u{1f0c0}'), ('\u{1f0d0}', '\u{1f0d0}'), ('\u{1f0f6}', '\u{1f0ff}'), - ('\u{1f10d}', '\u{1f10f}'), - ('\u{1f16d}', '\u{1f16f}'), - ('\u{1f1ad}', '\u{1f1e5}'), + ('\u{1f1ae}', '\u{1f1e5}'), ('\u{1f203}', '\u{1f20f}'), ('\u{1f23c}', '\u{1f23f}'), ('\u{1f249}', '\u{1f24f}'), ('\u{1f252}', '\u{1f25f}'), ('\u{1f266}', '\u{1f2ff}'), - ('\u{1f6d6}', '\u{1f6df}'), + ('\u{1f6d8}', '\u{1f6df}'), ('\u{1f6ed}', '\u{1f6ef}'), - ('\u{1f6fb}', '\u{1f6ff}'), + ('\u{1f6fd}', '\u{1f6ff}'), ('\u{1f774}', '\u{1f77f}'), ('\u{1f7d9}', '\u{1f7df}'), ('\u{1f7ec}', '\u{1f7ff}'), @@ -3330,25 +3381,29 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1f848}', '\u{1f84f}'), ('\u{1f85a}', '\u{1f85f}'), ('\u{1f888}', '\u{1f88f}'), - ('\u{1f8ae}', '\u{1f8ff}'), - ('\u{1f90c}', '\u{1f90c}'), - ('\u{1f972}', '\u{1f972}'), - ('\u{1f977}', '\u{1f979}'), - ('\u{1f9a3}', '\u{1f9a4}'), - ('\u{1f9ab}', '\u{1f9ad}'), - ('\u{1f9cb}', '\u{1f9cc}'), + ('\u{1f8ae}', '\u{1f8af}'), + ('\u{1f8b2}', '\u{1f8ff}'), + ('\u{1f979}', '\u{1f979}'), + ('\u{1f9cc}', '\u{1f9cc}'), ('\u{1fa54}', '\u{1fa5f}'), ('\u{1fa6e}', '\u{1fa6f}'), - ('\u{1fa74}', '\u{1fa77}'), + ('\u{1fa75}', '\u{1fa77}'), ('\u{1fa7b}', '\u{1fa7f}'), - ('\u{1fa83}', '\u{1fa8f}'), - ('\u{1fa96}', '\u{1ffff}'), - ('\u{2a6d7}', '\u{2a6ff}'), + ('\u{1fa87}', '\u{1fa8f}'), + ('\u{1faa9}', '\u{1faaf}'), + ('\u{1fab7}', '\u{1fabf}'), + ('\u{1fac3}', '\u{1facf}'), + ('\u{1fad7}', '\u{1faff}'), + ('\u{1fb93}', '\u{1fb93}'), + ('\u{1fbcb}', '\u{1fbef}'), + ('\u{1fbfa}', '\u{1ffff}'), + ('\u{2a6de}', '\u{2a6ff}'), ('\u{2b735}', '\u{2b73f}'), ('\u{2b81e}', '\u{2b81f}'), ('\u{2cea2}', '\u{2ceaf}'), ('\u{2ebe1}', '\u{2f7ff}'), - ('\u{2fa1e}', '\u{e00ff}'), + ('\u{2fa1e}', '\u{2ffff}'), + ('\u{3134b}', '\u{e00ff}'), ('\u{e01f0}', '\u{10ffff}'), ]; @@ -3377,7 +3432,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -3453,7 +3508,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ೞ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('അ', 'ഌ'), + ('\u{d04}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -3471,8 +3526,8 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('เ', 'ๅ'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ະ'), ('າ', 'ຳ'), @@ -3546,7 +3601,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', 'ᳶ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ℵ', 'ℸ'), ('ⴰ', 'ⵧ'), ('ⶀ', 'ⶖ'), @@ -3566,10 +3621,10 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ヿ', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꀔ'), ('ꀖ', 'ꒌ'), ('ꓐ', 'ꓷ'), @@ -3693,15 +3748,19 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𐮀', '𐮑'), ('𐰀', '𐱈'), ('𐴀', '𐴣'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀃', '𑀷'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), + ('\u{11147}', '\u{11147}'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -3727,7 +3786,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -3736,14 +3795,20 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𑘀', '𑘯'), ('𑙄', '𑙄'), ('𑚀', '𑚪'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑜀', '𑜚'), ('𑠀', '𑠫'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d0}'), - ('\u{119e1}', '\u{119e1}'), - ('\u{119e3}', '\u{119e3}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{1192f}'), + ('\u{1193f}', '\u{1193f}'), + ('\u{11941}', '\u{11941}'), + ('𑦠', '𑦧'), + ('𑦪', '𑧐'), + ('𑧡', '𑧡'), + ('𑧣', '𑧣'), ('𑨀', '𑨀'), ('𑨋', '𑨲'), ('𑨺', '𑨺'), @@ -3764,6 +3829,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒒀', '𒕃'), ('𓀀', '𓐮'), @@ -3774,21 +3840,22 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𖬀', '𖬯'), ('𖭣', '𖭷'), ('𖭽', '𖮏'), - ('𖼀', '\u{16f4a}'), + ('𖼀', '𖽊'), ('𖽐', '𖽐'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), ('𛲀', '𛲈'), ('𛲐', '𛲙'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2eb}'), + ('𞄀', '𞄬'), + ('𞅎', '𞅎'), + ('𞋀', '𞋫'), ('𞠀', '𞣄'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), @@ -3823,12 +3890,13 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const OTHER_NUMBER: &'static [(char, char)] = &[ @@ -3885,12 +3953,13 @@ pub const OTHER_NUMBER: &'static [(char, char)] = &[ ('𐹠', '𐹾'), ('𐼝', '𐼦'), ('𐽑', '𐽔'), + ('\u{10fc5}', '\u{10fcb}'), ('𑁒', '𑁥'), ('𑇡', '𑇴'), ('𑜺', '𑜻'), ('𑣪', '𑣲'), ('𑱚', '𑱬'), - ('\u{11fc0}', '\u{11fd4}'), + ('𑿀', '𑿔'), ('𖭛', '𖭡'), ('𖺀', '𖺖'), ('𝋠', '𝋳'), @@ -3899,8 +3968,8 @@ pub const OTHER_NUMBER: &'static [(char, char)] = &[ ('𞱱', '𞲫'), ('𞲭', '𞲯'), ('𞲱', '𞲴'), - ('\u{1ed01}', '\u{1ed2d}'), - ('\u{1ed2f}', '\u{1ed3d}'), + ('𞴁', '𞴭'), + ('𞴯', '𞴽'), ('🄀', '🄌'), ]; @@ -3940,7 +4009,7 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('৽', '৽'), ('੶', '੶'), ('૰', '૰'), - ('\u{c77}', '\u{c77}'), + ('౷', '౷'), ('಄', '಄'), ('෴', '෴'), ('๏', '๏'), @@ -3992,7 +4061,8 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('⸰', '⸹'), ('⸼', '⸿'), ('⹁', '⹁'), - ('⹃', '\u{2e4f}'), + ('⹃', '⹏'), + ('\u{2e52}', '\u{2e52}'), ('、', '〃'), ('〽', '〽'), ('・', '・'), @@ -4058,7 +4128,7 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('𑈸', '𑈽'), ('𑊩', '𑊩'), ('𑑋', '𑑏'), - ('𑑛', '𑑛'), + ('\u{1145a}', '𑑛'), ('𑑝', '𑑝'), ('𑓆', '𑓆'), ('𑗁', '𑗗'), @@ -4066,21 +4136,22 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('𑙠', '𑙬'), ('𑜼', '𑜾'), ('𑠻', '𑠻'), - ('\u{119e2}', '\u{119e2}'), + ('\u{11944}', '\u{11946}'), + ('𑧢', '𑧢'), ('𑨿', '𑩆'), ('𑪚', '𑪜'), ('𑪞', '𑪢'), ('𑱁', '𑱅'), ('𑱰', '𑱱'), ('𑻷', '𑻸'), - ('\u{11fff}', '\u{11fff}'), + ('𑿿', '𑿿'), ('𒑰', '𒑴'), ('𖩮', '𖩯'), ('𖫵', '𖫵'), ('𖬷', '𖬻'), ('𖭄', '𖭄'), ('𖺗', '𖺚'), - ('\u{16fe2}', '\u{16fe2}'), + ('𖿢', '𖿢'), ('𛲟', '𛲟'), ('𝪇', '𝪋'), ('𞥞', '𞥟'), @@ -4167,8 +4238,9 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('⭅', '⭆'), ('⭍', '⭳'), ('⭶', '⮕'), - ('⮘', '\u{2bff}'), + ('\u{2b97}', '⯿'), ('⳥', '⳪'), + ('\u{2e50}', '\u{2e51}'), ('⺀', '⺙'), ('⺛', '⻳'), ('⼀', '⿕'), @@ -4201,14 +4273,14 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('𐄷', '𐄿'), ('𐅹', '𐆉'), ('𐆌', '𐆎'), - ('𐆐', '𐆛'), + ('𐆐', '\u{1019c}'), ('𐆠', '𐆠'), ('𐇐', '𐇼'), ('𐡷', '𐡸'), ('𐫈', '𐫈'), ('𑜿', '𑜿'), - ('\u{11fd5}', '\u{11fdc}'), - ('\u{11fe1}', '\u{11ff1}'), + ('𑿕', '𑿜'), + ('𑿡', '𑿱'), ('𖬼', '𖬿'), ('𖭅', '𖭅'), ('𛲜', '𛲜'), @@ -4227,46 +4299,47 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('𝩭', '𝩴'), ('𝩶', '𝪃'), ('𝪅', '𝪆'), - ('\u{1e14f}', '\u{1e14f}'), + ('𞅏', '𞅏'), ('𞲬', '𞲬'), - ('\u{1ed2e}', '\u{1ed2e}'), + ('𞴮', '𞴮'), ('🀀', '🀫'), ('🀰', '🂓'), ('🂠', '🂮'), ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄐', '\u{1f16c}'), - ('🅰', '🆬'), + ('\u{1f10d}', '\u{1f1ad}'), ('🇦', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), ('🌀', '🏺'), - ('🐀', '\u{1f6d5}'), + ('🐀', '\u{1f6d7}'), ('🛠', '🛬'), - ('🛰', '\u{1f6fa}'), + ('🛰', '\u{1f6fc}'), ('🜀', '🝳'), ('🞀', '🟘'), - ('\u{1f7e0}', '\u{1f7eb}'), + ('🟠', '🟫'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('🤀', '🤋'), - ('\u{1f90d}', '\u{1f971}'), - ('🥳', '🥶'), - ('🥺', '🦢'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9ca}'), - ('\u{1f9cd}', '\u{1fa53}'), + ('\u{1f8b0}', '\u{1f8b1}'), + ('🤀', '\u{1f978}'), + ('🥺', '\u{1f9cb}'), + ('🧍', '🩓'), ('🩠', '🩭'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), + ('🩰', '\u{1fa74}'), + ('🩸', '🩺'), + ('🪀', '\u{1fa86}'), + ('🪐', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), + ('\u{1fb00}', '\u{1fb92}'), + ('\u{1fb94}', '\u{1fbca}'), ]; pub const PARAGRAPH_SEPARATOR: &'static [(char, char)] = @@ -4318,7 +4391,7 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('৽', '৽'), ('੶', '੶'), ('૰', '૰'), - ('\u{c77}', '\u{c77}'), + ('౷', '౷'), ('಄', '಄'), ('෴', '෴'), ('๏', '๏'), @@ -4368,7 +4441,8 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('⳾', '⳿'), ('⵰', '⵰'), ('⸀', '⸮'), - ('⸰', '\u{2e4f}'), + ('⸰', '⹏'), + ('\u{2e52}', '\u{2e52}'), ('、', '〃'), ('〈', '】'), ('〔', '〟'), @@ -4422,6 +4496,7 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('𐫰', '𐫶'), ('𐬹', '𐬿'), ('𐮙', '𐮜'), + ('\u{10ead}', '\u{10ead}'), ('𐽕', '𐽙'), ('𑁇', '𑁍'), ('𑂻', '𑂼'), @@ -4435,7 +4510,7 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('𑈸', '𑈽'), ('𑊩', '𑊩'), ('𑑋', '𑑏'), - ('𑑛', '𑑛'), + ('\u{1145a}', '𑑛'), ('𑑝', '𑑝'), ('𑓆', '𑓆'), ('𑗁', '𑗗'), @@ -4443,21 +4518,22 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('𑙠', '𑙬'), ('𑜼', '𑜾'), ('𑠻', '𑠻'), - ('\u{119e2}', '\u{119e2}'), + ('\u{11944}', '\u{11946}'), + ('𑧢', '𑧢'), ('𑨿', '𑩆'), ('𑪚', '𑪜'), ('𑪞', '𑪢'), ('𑱁', '𑱅'), ('𑱰', '𑱱'), ('𑻷', '𑻸'), - ('\u{11fff}', '\u{11fff}'), + ('𑿿', '𑿿'), ('𒑰', '𒑴'), ('𖩮', '𖩯'), ('𖫵', '𖫵'), ('𖬷', '𖬻'), ('𖭄', '𖭄'), ('𖺗', '𖺚'), - ('\u{16fe2}', '\u{16fe2}'), + ('𖿢', '𖿢'), ('𛲟', '𛲟'), ('𝪇', '𝪋'), ('𞥞', '𞥟'), @@ -4556,7 +4632,7 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('ᩣ', 'ᩤ'), ('ᩭ', 'ᩲ'), ('ᬄ', 'ᬄ'), - ('ᬵ', 'ᬵ'), + ('\u{1b35}', '\u{1b35}'), ('ᬻ', 'ᬻ'), ('ᬽ', 'ᭁ'), ('ᭃ', '᭄'), @@ -4604,6 +4680,7 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('𑆂', '𑆂'), ('𑆳', '𑆵'), ('𑆿', '𑇀'), + ('\u{111ce}', '\u{111ce}'), ('𑈬', '𑈮'), ('𑈲', '𑈳'), ('𑈵', '𑈵'), @@ -4635,9 +4712,14 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('𑜦', '𑜦'), ('𑠬', '𑠮'), ('𑠸', '𑠸'), - ('\u{119d1}', '\u{119d3}'), - ('\u{119dc}', '\u{119df}'), - ('\u{119e4}', '\u{119e4}'), + ('\u{11930}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193d}', '\u{1193d}'), + ('\u{11940}', '\u{11940}'), + ('\u{11942}', '\u{11942}'), + ('𑧑', '𑧓'), + ('𑧜', '𑧟'), + ('𑧤', '𑧤'), ('𑨹', '𑨹'), ('𑩗', '𑩘'), ('𑪗', '𑪗'), @@ -4650,7 +4732,8 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('𑶓', '𑶔'), ('𑶖', '𑶖'), ('𑻵', '𑻶'), - ('𖽑', '\u{16f87}'), + ('𖽑', '𖾇'), + ('\u{16ff0}', '\u{16ff1}'), ('\u{1d165}', '𝅦'), ('𝅭', '\u{1d172}'), ]; @@ -4756,8 +4839,9 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('⧜', '⧻'), ('⧾', '⭳'), ('⭶', '⮕'), - ('⮘', '\u{2bff}'), + ('\u{2b97}', '⯿'), ('⳥', '⳪'), + ('\u{2e50}', '\u{2e51}'), ('⺀', '⺙'), ('⺛', '⻳'), ('⼀', '⿕'), @@ -4786,6 +4870,7 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('꠶', '꠹'), ('꩷', '꩹'), ('꭛', '꭛'), + ('\u{ab6a}', '\u{ab6b}'), ('﬩', '﬩'), ('﮲', '﯁'), ('﷼', '﷽'), @@ -4805,13 +4890,13 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('𐄷', '𐄿'), ('𐅹', '𐆉'), ('𐆌', '𐆎'), - ('𐆐', '𐆛'), + ('𐆐', '\u{1019c}'), ('𐆠', '𐆠'), ('𐇐', '𐇼'), ('𐡷', '𐡸'), ('𐫈', '𐫈'), ('𑜿', '𑜿'), - ('\u{11fd5}', '\u{11ff1}'), + ('𑿕', '𑿱'), ('𖬼', '𖬿'), ('𖭅', '𖭅'), ('𛲜', '𛲜'), @@ -4840,11 +4925,11 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('𝩭', '𝩴'), ('𝩶', '𝪃'), ('𝪅', '𝪆'), - ('\u{1e14f}', '\u{1e14f}'), - ('\u{1e2ff}', '\u{1e2ff}'), + ('𞅏', '𞅏'), + ('𞋿', '𞋿'), ('𞲬', '𞲬'), ('𞲰', '𞲰'), - ('\u{1ed2e}', '\u{1ed2e}'), + ('𞴮', '𞴮'), ('𞻰', '𞻱'), ('🀀', '🀫'), ('🀰', '🂓'), @@ -4852,36 +4937,37 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄐', '\u{1f16c}'), - ('🅰', '🆬'), + ('\u{1f10d}', '\u{1f1ad}'), ('🇦', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), - ('🌀', '\u{1f6d5}'), + ('🌀', '\u{1f6d7}'), ('🛠', '🛬'), - ('🛰', '\u{1f6fa}'), + ('🛰', '\u{1f6fc}'), ('🜀', '🝳'), ('🞀', '🟘'), - ('\u{1f7e0}', '\u{1f7eb}'), + ('🟠', '🟫'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('🤀', '🤋'), - ('\u{1f90d}', '\u{1f971}'), - ('🥳', '🥶'), - ('🥺', '🦢'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9ca}'), - ('\u{1f9cd}', '\u{1fa53}'), + ('\u{1f8b0}', '\u{1f8b1}'), + ('🤀', '\u{1f978}'), + ('🥺', '\u{1f9cb}'), + ('🧍', '🩓'), ('🩠', '🩭'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), + ('🩰', '\u{1fa74}'), + ('🩸', '🩺'), + ('🪀', '\u{1fa86}'), + ('🪐', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), + ('\u{1fb00}', '\u{1fb92}'), + ('\u{1fb94}', '\u{1fbca}'), ]; pub const TITLECASE_LETTER: &'static [(char, char)] = &[ @@ -4921,7 +5007,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{85f}', '\u{85f}'), ('\u{86b}', '\u{89f}'), ('\u{8b5}', '\u{8b5}'), - ('\u{8be}', '\u{8d2}'), + ('\u{8c8}', '\u{8d2}'), ('\u{984}', '\u{984}'), ('\u{98d}', '\u{98e}'), ('\u{991}', '\u{992}'), @@ -4975,7 +5061,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{b3a}', '\u{b3b}'), ('\u{b45}', '\u{b46}'), ('\u{b49}', '\u{b4a}'), - ('\u{b4e}', '\u{b55}'), + ('\u{b4e}', '\u{b54}'), ('\u{b58}', '\u{b5b}'), ('\u{b5e}', '\u{b5e}'), ('\u{b64}', '\u{b65}'), @@ -5020,14 +5106,13 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{ce4}', '\u{ce5}'), ('\u{cf0}', '\u{cf0}'), ('\u{cf3}', '\u{cff}'), - ('\u{d04}', '\u{d04}'), ('\u{d0d}', '\u{d0d}'), ('\u{d11}', '\u{d11}'), ('\u{d45}', '\u{d45}'), ('\u{d49}', '\u{d49}'), ('\u{d50}', '\u{d53}'), ('\u{d64}', '\u{d65}'), - ('\u{d80}', '\u{d81}'), + ('\u{d80}', '\u{d80}'), ('\u{d84}', '\u{d84}'), ('\u{d97}', '\u{d99}'), ('\u{db2}', '\u{db2}'), @@ -5114,7 +5199,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1a8a}', '\u{1a8f}'), ('\u{1a9a}', '\u{1a9f}'), ('\u{1aae}', '\u{1aaf}'), - ('\u{1abf}', '\u{1aff}'), + ('\u{1ac1}', '\u{1aff}'), ('\u{1b4c}', '\u{1b4f}'), ('\u{1b7d}', '\u{1b7f}'), ('\u{1bf4}', '\u{1bfb}'), @@ -5151,7 +5236,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{2427}', '\u{243f}'), ('\u{244b}', '\u{245f}'), ('\u{2b74}', '\u{2b75}'), - ('\u{2b96}', '\u{2b97}'), + ('\u{2b96}', '\u{2b96}'), ('\u{2c2f}', '\u{2c2f}'), ('\u{2c5f}', '\u{2c5f}'), ('\u{2cf4}', '\u{2cf8}'), @@ -5169,7 +5254,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{2dcf}', '\u{2dcf}'), ('\u{2dd7}', '\u{2dd7}'), ('\u{2ddf}', '\u{2ddf}'), - ('\u{2e50}', '\u{2e7f}'), + ('\u{2e53}', '\u{2e7f}'), ('\u{2e9a}', '\u{2e9a}'), ('\u{2ef4}', '\u{2eff}'), ('\u{2fd6}', '\u{2fef}'), @@ -5179,18 +5264,16 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{3100}', '\u{3104}'), ('\u{3130}', '\u{3130}'), ('\u{318f}', '\u{318f}'), - ('\u{31bb}', '\u{31bf}'), ('\u{31e4}', '\u{31ef}'), ('\u{321f}', '\u{321f}'), - ('\u{4db6}', '\u{4dbf}'), - ('\u{9ff0}', '\u{9fff}'), + ('\u{9ffd}', '\u{9fff}'), ('\u{a48d}', '\u{a48f}'), ('\u{a4c7}', '\u{a4cf}'), ('\u{a62c}', '\u{a63f}'), ('\u{a6f8}', '\u{a6ff}'), ('\u{a7c0}', '\u{a7c1}'), - ('\u{a7c7}', '\u{a7f6}'), - ('\u{a82c}', '\u{a82f}'), + ('\u{a7cb}', '\u{a7f4}'), + ('\u{a82d}', '\u{a82f}'), ('\u{a83a}', '\u{a83f}'), ('\u{a878}', '\u{a87f}'), ('\u{a8c6}', '\u{a8cd}'), @@ -5210,7 +5293,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{ab17}', '\u{ab1f}'), ('\u{ab27}', '\u{ab27}'), ('\u{ab2f}', '\u{ab2f}'), - ('\u{ab68}', '\u{ab6f}'), + ('\u{ab6c}', '\u{ab6f}'), ('\u{abee}', '\u{abef}'), ('\u{abfa}', '\u{abff}'), ('\u{d7a4}', '\u{d7af}'), @@ -5255,7 +5338,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{10103}', '\u{10106}'), ('\u{10134}', '\u{10136}'), ('\u{1018f}', '\u{1018f}'), - ('\u{1019c}', '\u{1019f}'), + ('\u{1019d}', '\u{1019f}'), ('\u{101a1}', '\u{101cf}'), ('\u{101fe}', '\u{1027f}'), ('\u{1029d}', '\u{1029f}'), @@ -5314,9 +5397,13 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{10cf3}', '\u{10cf9}'), ('\u{10d28}', '\u{10d2f}'), ('\u{10d3a}', '\u{10e5f}'), - ('\u{10e7f}', '\u{10eff}'), + ('\u{10e7f}', '\u{10e7f}'), + ('\u{10eaa}', '\u{10eaa}'), + ('\u{10eae}', '\u{10eaf}'), + ('\u{10eb2}', '\u{10eff}'), ('\u{10f28}', '\u{10f2f}'), - ('\u{10f5a}', '\u{10fdf}'), + ('\u{10f5a}', '\u{10faf}'), + ('\u{10fcc}', '\u{10fdf}'), ('\u{10ff7}', '\u{10fff}'), ('\u{1104e}', '\u{11051}'), ('\u{11070}', '\u{1107e}'), @@ -5325,9 +5412,8 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{110e9}', '\u{110ef}'), ('\u{110fa}', '\u{110ff}'), ('\u{11135}', '\u{11135}'), - ('\u{11147}', '\u{1114f}'), + ('\u{11148}', '\u{1114f}'), ('\u{11177}', '\u{1117f}'), - ('\u{111ce}', '\u{111cf}'), ('\u{111e0}', '\u{111e0}'), ('\u{111f5}', '\u{111ff}'), ('\u{11212}', '\u{11212}'), @@ -5354,9 +5440,8 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{11364}', '\u{11365}'), ('\u{1136d}', '\u{1136f}'), ('\u{11375}', '\u{113ff}'), - ('\u{1145a}', '\u{1145a}'), ('\u{1145c}', '\u{1145c}'), - ('\u{11460}', '\u{1147f}'), + ('\u{11462}', '\u{1147f}'), ('\u{114c8}', '\u{114cf}'), ('\u{114da}', '\u{1157f}'), ('\u{115b6}', '\u{115b7}'), @@ -5371,7 +5456,14 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{11740}', '\u{117ff}'), ('\u{1183c}', '\u{1189f}'), ('\u{118f3}', '\u{118fe}'), - ('\u{11900}', '\u{1199f}'), + ('\u{11907}', '\u{11908}'), + ('\u{1190a}', '\u{1190b}'), + ('\u{11914}', '\u{11914}'), + ('\u{11917}', '\u{11917}'), + ('\u{11936}', '\u{11936}'), + ('\u{11939}', '\u{1193a}'), + ('\u{11947}', '\u{1194f}'), + ('\u{1195a}', '\u{1199f}'), ('\u{119a8}', '\u{119a9}'), ('\u{119d8}', '\u{119d9}'), ('\u{119e5}', '\u{119ff}'), @@ -5398,7 +5490,8 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{11d92}', '\u{11d92}'), ('\u{11d99}', '\u{11d9f}'), ('\u{11daa}', '\u{11edf}'), - ('\u{11ef9}', '\u{11fbf}'), + ('\u{11ef9}', '\u{11faf}'), + ('\u{11fb1}', '\u{11fbf}'), ('\u{11ff2}', '\u{11ffe}'), ('\u{1239a}', '\u{123ff}'), ('\u{1246f}', '\u{1246f}'), @@ -5422,9 +5515,11 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{16f4b}', '\u{16f4e}'), ('\u{16f88}', '\u{16f8e}'), ('\u{16fa0}', '\u{16fdf}'), - ('\u{16fe4}', '\u{16fff}'), + ('\u{16fe5}', '\u{16fef}'), + ('\u{16ff2}', '\u{16fff}'), ('\u{187f8}', '\u{187ff}'), - ('\u{18af3}', '\u{1afff}'), + ('\u{18cd6}', '\u{18cff}'), + ('\u{18d09}', '\u{1afff}'), ('\u{1b11f}', '\u{1b14f}'), ('\u{1b153}', '\u{1b163}'), ('\u{1b168}', '\u{1b16f}'), @@ -5522,17 +5617,15 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1f0c0}', '\u{1f0c0}'), ('\u{1f0d0}', '\u{1f0d0}'), ('\u{1f0f6}', '\u{1f0ff}'), - ('\u{1f10d}', '\u{1f10f}'), - ('\u{1f16d}', '\u{1f16f}'), - ('\u{1f1ad}', '\u{1f1e5}'), + ('\u{1f1ae}', '\u{1f1e5}'), ('\u{1f203}', '\u{1f20f}'), ('\u{1f23c}', '\u{1f23f}'), ('\u{1f249}', '\u{1f24f}'), ('\u{1f252}', '\u{1f25f}'), ('\u{1f266}', '\u{1f2ff}'), - ('\u{1f6d6}', '\u{1f6df}'), + ('\u{1f6d8}', '\u{1f6df}'), ('\u{1f6ed}', '\u{1f6ef}'), - ('\u{1f6fb}', '\u{1f6ff}'), + ('\u{1f6fd}', '\u{1f6ff}'), ('\u{1f774}', '\u{1f77f}'), ('\u{1f7d9}', '\u{1f7df}'), ('\u{1f7ec}', '\u{1f7ff}'), @@ -5540,25 +5633,29 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1f848}', '\u{1f84f}'), ('\u{1f85a}', '\u{1f85f}'), ('\u{1f888}', '\u{1f88f}'), - ('\u{1f8ae}', '\u{1f8ff}'), - ('\u{1f90c}', '\u{1f90c}'), - ('\u{1f972}', '\u{1f972}'), - ('\u{1f977}', '\u{1f979}'), - ('\u{1f9a3}', '\u{1f9a4}'), - ('\u{1f9ab}', '\u{1f9ad}'), - ('\u{1f9cb}', '\u{1f9cc}'), + ('\u{1f8ae}', '\u{1f8af}'), + ('\u{1f8b2}', '\u{1f8ff}'), + ('\u{1f979}', '\u{1f979}'), + ('\u{1f9cc}', '\u{1f9cc}'), ('\u{1fa54}', '\u{1fa5f}'), ('\u{1fa6e}', '\u{1fa6f}'), - ('\u{1fa74}', '\u{1fa77}'), + ('\u{1fa75}', '\u{1fa77}'), ('\u{1fa7b}', '\u{1fa7f}'), - ('\u{1fa83}', '\u{1fa8f}'), - ('\u{1fa96}', '\u{1ffff}'), - ('\u{2a6d7}', '\u{2a6ff}'), + ('\u{1fa87}', '\u{1fa8f}'), + ('\u{1faa9}', '\u{1faaf}'), + ('\u{1fab7}', '\u{1fabf}'), + ('\u{1fac3}', '\u{1facf}'), + ('\u{1fad7}', '\u{1faff}'), + ('\u{1fb93}', '\u{1fb93}'), + ('\u{1fbcb}', '\u{1fbef}'), + ('\u{1fbfa}', '\u{1ffff}'), + ('\u{2a6de}', '\u{2a6ff}'), ('\u{2b735}', '\u{2b73f}'), ('\u{2b81e}', '\u{2b81f}'), ('\u{2cea2}', '\u{2ceaf}'), ('\u{2ebe1}', '\u{2f7ff}'), - ('\u{2fa1e}', '\u{e0000}'), + ('\u{2fa1e}', '\u{2ffff}'), + ('\u{3134b}', '\u{e0000}'), ('\u{e0002}', '\u{e001f}'), ('\u{e0080}', '\u{e00ff}'), ('\u{e01f0}', '\u{effff}'), @@ -6160,11 +6257,13 @@ pub const UPPERCASE_LETTER: &'static [(char, char)] = &[ ('Ʞ', 'Ꞵ'), ('Ꞷ', 'Ꞷ'), ('Ꞹ', 'Ꞹ'), - ('\u{a7ba}', '\u{a7ba}'), - ('\u{a7bc}', '\u{a7bc}'), - ('\u{a7be}', '\u{a7be}'), - ('\u{a7c2}', '\u{a7c2}'), - ('\u{a7c4}', '\u{a7c6}'), + ('Ꞻ', 'Ꞻ'), + ('Ꞽ', 'Ꞽ'), + ('Ꞿ', 'Ꞿ'), + ('Ꟃ', 'Ꟃ'), + ('Ꞔ', '\u{a7c7}'), + ('\u{a7c9}', '\u{a7c9}'), + ('\u{a7f5}', '\u{a7f5}'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), diff --git a/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs b/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs index 2855eadc58..1d0b285111 100644 --- a/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs +++ b/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate grapheme-cluster-break /tmp/ucd/12.1.0/ --chars +// ucd-generate grapheme-cluster-break ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("CR", CR), @@ -105,7 +105,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{b3e}', '\u{b3f}'), ('\u{b41}', '\u{b44}'), ('\u{b4d}', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('\u{b62}', '\u{b63}'), ('\u{b82}', '\u{b82}'), ('\u{bbe}', '\u{bbe}'), @@ -134,6 +134,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{d4d}', '\u{d4d}'), ('\u{d57}', '\u{d57}'), ('\u{d62}', '\u{d63}'), + ('\u{d81}', '\u{d81}'), ('\u{dca}', '\u{dca}'), ('\u{dcf}', '\u{dcf}'), ('\u{dd2}', '\u{dd4}'), @@ -192,7 +193,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1a65}', '\u{1a6c}'), ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b3a}'), ('\u{1b3c}', '\u{1b3c}'), @@ -231,6 +232,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{a806}', '\u{a806}'), ('\u{a80b}', '\u{a80b}'), ('\u{a825}', '\u{a826}'), + ('\u{a82c}', '\u{a82c}'), ('\u{a8c4}', '\u{a8c5}'), ('\u{a8e0}', '\u{a8f1}'), ('\u{a8ff}', '\u{a8ff}'), @@ -239,7 +241,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{a980}', '\u{a982}'), ('\u{a9b3}', '\u{a9b3}'), ('\u{a9b6}', '\u{a9b9}'), - ('\u{a9bc}', 'ꦽ'), + ('\u{a9bc}', '\u{a9bd}'), ('\u{a9e5}', '\u{a9e5}'), ('\u{aa29}', '\u{aa2e}'), ('\u{aa31}', '\u{aa32}'), @@ -271,6 +273,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10a3f}', '\u{10a3f}'), ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), @@ -284,6 +287,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11180}', '\u{11181}'), ('\u{111b6}', '\u{111be}'), ('\u{111c9}', '\u{111cc}'), + ('\u{111cf}', '\u{111cf}'), ('\u{1122f}', '\u{11231}'), ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), @@ -324,6 +328,10 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11727}', '\u{1172b}'), ('\u{1182f}', '\u{11837}'), ('\u{11839}', '\u{1183a}'), + ('\u{11930}', '\u{11930}'), + ('\u{1193b}', '\u{1193c}'), + ('\u{1193e}', '\u{1193e}'), + ('\u{11943}', '\u{11943}'), ('\u{119d4}', '\u{119d7}'), ('\u{119da}', '\u{119db}'), ('\u{119e0}', '\u{119e0}'), @@ -355,6 +363,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), ('\u{16f8f}', '\u{16f92}'), + ('\u{16fe4}', '\u{16fe4}'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1d165}', '\u{1d165}'), ('\u{1d167}', '\u{1d169}'), @@ -1200,8 +1209,10 @@ pub const PREPEND: &'static [(char, char)] = &[ ('\u{110bd}', '\u{110bd}'), ('\u{110cd}', '\u{110cd}'), ('𑇂', '𑇃'), + ('\u{1193f}', '\u{1193f}'), + ('\u{11941}', '\u{11941}'), ('𑨺', '𑨺'), - ('\u{11a84}', '𑪉'), + ('𑪄', '𑪉'), ('𑵆', '𑵆'), ]; @@ -1311,6 +1322,7 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('𑆂', '𑆂'), ('𑆳', '𑆵'), ('𑆿', '𑇀'), + ('\u{111ce}', '\u{111ce}'), ('𑈬', '𑈮'), ('𑈲', '𑈳'), ('𑈵', '𑈵'), @@ -1342,9 +1354,14 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('𑜦', '𑜦'), ('𑠬', '𑠮'), ('𑠸', '𑠸'), - ('\u{119d1}', '\u{119d3}'), - ('\u{119dc}', '\u{119df}'), - ('\u{119e4}', '\u{119e4}'), + ('\u{11931}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193d}', '\u{1193d}'), + ('\u{11940}', '\u{11940}'), + ('\u{11942}', '\u{11942}'), + ('𑧑', '𑧓'), + ('𑧜', '𑧟'), + ('𑧤', '𑧤'), ('𑨹', '𑨹'), ('𑩗', '𑩘'), ('𑪗', '𑪗'), @@ -1357,7 +1374,8 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('𑶓', '𑶔'), ('𑶖', '𑶖'), ('𑻵', '𑻶'), - ('𖽑', '\u{16f87}'), + ('𖽑', '𖾇'), + ('\u{16ff0}', '\u{16ff1}'), ('𝅦', '𝅦'), ('𝅭', '𝅭'), ]; diff --git a/regex-syntax/src/unicode_tables/perl_decimal.rs b/regex-syntax/src/unicode_tables/perl_decimal.rs index 8f6a046f65..541f3246bf 100644 --- a/regex-syntax/src/unicode_tables/perl_decimal.rs +++ b/regex-syntax/src/unicode_tables/perl_decimal.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate general-category /tmp/ucd/12.1.0/ --chars --include decimalnumber +// ucd-generate general-category ucd-13.0.0 --chars --include decimalnumber // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[("Decimal_Number", DECIMAL_NUMBER)]; @@ -58,13 +58,15 @@ pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), + ('\u{11950}', '\u{11959}'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e2f0}', '\u{1e2f9}'), + ('𞅀', '𞅉'), + ('𞋰', '𞋹'), ('𞥐', '𞥙'), + ('\u{1fbf0}', '\u{1fbf9}'), ]; diff --git a/regex-syntax/src/unicode_tables/perl_space.rs b/regex-syntax/src/unicode_tables/perl_space.rs index 515724521c..8f048f8de3 100644 --- a/regex-syntax/src/unicode_tables/perl_space.rs +++ b/regex-syntax/src/unicode_tables/perl_space.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-bool /tmp/ucd/12.1.0/ --chars --include whitespace +// ucd-generate property-bool ucd-13.0.0 --chars --include whitespace // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[("White_Space", WHITE_SPACE)]; diff --git a/regex-syntax/src/unicode_tables/perl_word.rs b/regex-syntax/src/unicode_tables/perl_word.rs index f4f5706242..68e9451899 100644 --- a/regex-syntax/src/unicode_tables/perl_word.rs +++ b/regex-syntax/src/unicode_tables/perl_word.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate perl-word /tmp/ucd/12.1.0/ --chars +// ucd-generate perl-word ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const PERL_WORD: &'static [(char, char)] = &[ ('0', '9'), @@ -56,7 +56,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ࡀ', '\u{85b}'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('\u{8d3}', '\u{8e1}'), ('\u{8e3}', '\u{963}'), ('०', '९'), @@ -116,7 +116,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{b3c}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('ଡ଼', 'ଢ଼'), ('ୟ', '\u{b63}'), ('୦', '୯'), @@ -162,8 +162,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), - ('\u{d00}', 'ഃ'), - ('അ', 'ഌ'), + ('\u{d00}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', '\u{d44}'), ('െ', 'ൈ'), @@ -172,7 +171,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ൟ', '\u{d63}'), ('൦', '൯'), ('ൺ', 'ൿ'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('අ', 'ඖ'), ('ක', 'න'), ('ඳ', 'ර'), @@ -189,8 +188,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('๐', '๙'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ຽ'), ('ເ', 'ໄ'), @@ -271,7 +270,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{1a7f}', '᪉'), ('᪐', '᪙'), ('ᪧ', 'ᪧ'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1b00}', 'ᭋ'), ('᭐', '᭙'), ('\u{1b6b}', '\u{1b73}'), @@ -283,7 +282,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('Ა', 'Ჺ'), ('Ჽ', 'Ჿ'), ('\u{1cd0}', '\u{1cd2}'), - ('\u{1cd4}', '\u{1cfa}'), + ('\u{1cd4}', 'ᳺ'), ('ᴀ', '\u{1df9}'), ('\u{1dfb}', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -357,10 +356,10 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -370,9 +369,10 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ꙿ', '\u{a6f1}'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠧ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠧ'), + ('\u{a82c}', '\u{a82c}'), ('ꡀ', 'ꡳ'), ('ꢀ', '\u{a8c5}'), ('꣐', '꣙'), @@ -398,7 +398,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab69}'), ('ꭰ', 'ꯪ'), ('꯬', '\u{abed}'), ('꯰', '꯹'), @@ -497,10 +497,14 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), ('𐴰', '𐴹'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eab}', '\u{10eac}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '\u{10f50}'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀀', '\u{11046}'), ('𑁦', '𑁯'), ('\u{1107f}', '\u{110ba}'), @@ -508,12 +512,12 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𑃰', '𑃹'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑄿'), - ('𑅄', '𑅆'), + ('𑅄', '\u{11147}'), ('𑅐', '\u{11173}'), ('𑅶', '𑅶'), ('\u{11180}', '𑇄'), ('\u{111c9}', '\u{111cc}'), - ('𑇐', '𑇚'), + ('\u{111ce}', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), ('𑈓', '\u{11237}'), @@ -542,7 +546,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{11370}', '\u{11374}'), ('𑐀', '𑑊'), ('𑑐', '𑑙'), - ('\u{1145e}', '\u{1145f}'), + ('\u{1145e}', '\u{11461}'), ('𑒀', '𑓅'), ('𑓇', '𑓇'), ('𑓐', '𑓙'), @@ -552,18 +556,25 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𑘀', '\u{11640}'), ('𑙄', '𑙄'), ('𑙐', '𑙙'), - ('𑚀', '\u{116b8}'), + ('𑚀', '𑚸'), ('𑛀', '𑛉'), ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜹'), ('𑠀', '\u{1183a}'), ('𑢠', '𑣩'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d7}'), - ('\u{119da}', '\u{119e1}'), - ('\u{119e3}', '\u{119e4}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{11943}'), + ('\u{11950}', '\u{11959}'), + ('𑦠', '𑦧'), + ('𑦪', '\u{119d7}'), + ('\u{119da}', '𑧡'), + ('𑧣', '𑧤'), ('𑨀', '\u{11a3e}'), ('\u{11a47}', '\u{11a47}'), ('𑩐', '\u{11a99}'), @@ -590,6 +601,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𑶓', '𑶘'), ('𑶠', '𑶩'), ('𑻠', '𑻶'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -606,16 +618,18 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), - ('\u{16f4f}', '\u{16f87}'), + ('𖼀', '𖽊'), + ('\u{16f4f}', '𖾇'), ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '\u{16fe4}'), + ('\u{16ff0}', '\u{16ff1}'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -670,14 +684,14 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e130}', '\u{1e13d}'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2f9}'), + ('𞄀', '𞄬'), + ('\u{1e130}', '𞄽'), + ('𞅀', '𞅉'), + ('𞅎', '𞅎'), + ('𞋀', '𞋹'), ('𞠀', '𞣄'), ('\u{1e8d0}', '\u{1e8d6}'), - ('𞤀', '\u{1e94b}'), + ('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), @@ -715,11 +729,13 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('🄰', '🅉'), ('🅐', '🅩'), ('🅰', '🆉'), - ('𠀀', '𪛖'), + ('\u{1fbf0}', '\u{1fbf9}'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ('\u{e0100}', '\u{e01ef}'), ]; diff --git a/regex-syntax/src/unicode_tables/property_bool.rs b/regex-syntax/src/unicode_tables/property_bool.rs index efe6eb369d..a0ef0cf698 100644 --- a/regex-syntax/src/unicode_tables/property_bool.rs +++ b/regex-syntax/src/unicode_tables/property_bool.rs @@ -1,13 +1,14 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-bool /tmp/ucd/12.1.0/ --chars +// ucd-generate property-bool ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ASCII_Hex_Digit", ASCII_HEX_DIGIT), ("Alphabetic", ALPHABETIC), ("Bidi_Control", BIDI_CONTROL), + ("Bidi_Mirrored", BIDI_MIRRORED), ("Case_Ignorable", CASE_IGNORABLE), ("Cased", CASED), ("Changes_When_Casefolded", CHANGES_WHEN_CASEFOLDED), @@ -123,7 +124,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('\u{8d4}', '\u{8df}'), ('\u{8e3}', '\u{8e9}'), ('\u{8f0}', 'ऻ'), @@ -227,8 +228,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ೞ', 'ೞ'), ('ೠ', '\u{ce3}'), ('ೱ', 'ೲ'), - ('\u{d00}', 'ഃ'), - ('അ', 'ഌ'), + ('\u{d00}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', '\u{d44}'), @@ -238,7 +238,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ൔ', '\u{d57}'), ('ൟ', '\u{d63}'), ('ൺ', 'ൿ'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('අ', 'ඖ'), ('ක', 'න'), ('ඳ', 'ර'), @@ -253,8 +253,8 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{e4d}', '\u{e4d}'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', '\u{eb9}'), ('\u{ebb}', 'ຽ'), @@ -326,8 +326,9 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ᨠ', '\u{1a5e}'), ('ᩡ', '\u{1a74}'), ('ᪧ', 'ᪧ'), + ('\u{1abf}', '\u{1ac0}'), ('\u{1b00}', 'ᬳ'), - ('ᬵ', 'ᭃ'), + ('\u{1b35}', 'ᭃ'), ('ᭅ', 'ᭋ'), ('\u{1b80}', '\u{1ba9}'), ('\u{1bac}', 'ᮯ'), @@ -342,7 +343,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', 'ᳶ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ᴀ', 'ᶿ'), ('\u{1de7}', '\u{1df4}'), ('Ḁ', 'ἕ'), @@ -413,10 +414,10 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -427,9 +428,9 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ꙿ', 'ꛯ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠅ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠅ'), ('ꠇ', 'ꠧ'), ('ꡀ', 'ꡳ'), ('ꢀ', 'ꣃ'), @@ -460,7 +461,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab69}'), ('ꭰ', 'ꯪ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -545,19 +546,24 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eab}', '\u{10eac}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀀', '\u{11045}'), ('𑂂', '𑂸'), ('𑃐', '𑃨'), ('\u{11100}', '\u{11132}'), - ('𑅄', '𑅆'), + ('𑅄', '\u{11147}'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('\u{11180}', '𑆿'), ('𑇁', '𑇄'), + ('\u{111ce}', '\u{111cf}'), ('𑇚', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), @@ -586,7 +592,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𑐀', '𑑁'), ('\u{11443}', '𑑅'), ('𑑇', '𑑊'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑓁'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -597,17 +603,24 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{11640}', '\u{11640}'), ('𑙄', '𑙄'), ('𑚀', '\u{116b5}'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172a}'), ('𑠀', '𑠸'), ('𑢠', '𑣟'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d7}'), - ('\u{119da}', '\u{119df}'), - ('\u{119e1}', '\u{119e1}'), - ('\u{119e3}', '\u{119e4}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{1193c}'), + ('\u{1193f}', '\u{11942}'), + ('𑦠', '𑦧'), + ('𑦪', '\u{119d7}'), + ('\u{119da}', '𑧟'), + ('𑧡', '𑧡'), + ('𑧣', '𑧤'), ('𑨀', '𑨲'), ('\u{11a35}', '\u{11a3e}'), ('𑩐', '𑪗'), @@ -635,6 +648,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𑶓', '𑶖'), ('𑶘', '𑶘'), ('𑻠', '𑻶'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -648,16 +662,18 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), - ('\u{16f4f}', '\u{16f87}'), + ('𖼀', '𖽊'), + ('\u{16f4f}', '𖾇'), ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '𖿣'), + ('\u{16ff0}', '\u{16ff1}'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -699,14 +715,14 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2eb}'), + ('𞄀', '𞄬'), + ('𞄷', '𞄽'), + ('𞅎', '𞅎'), + ('𞋀', '𞋫'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), ('\u{1e947}', '\u{1e947}'), - ('\u{1e94b}', '\u{1e94b}'), + ('𞥋', '𞥋'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), ('𞸡', '𞸢'), @@ -743,12 +759,13 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('🄰', '🅉'), ('🅐', '🅩'), ('🅰', '🆉'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const BIDI_CONTROL: &'static [(char, char)] = &[ @@ -758,6 +775,122 @@ pub const BIDI_CONTROL: &'static [(char, char)] = &[ ('\u{2066}', '\u{2069}'), ]; +pub const BIDI_MIRRORED: &'static [(char, char)] = &[ + ('(', ')'), + ('<', '<'), + ('>', '>'), + ('[', '['), + (']', ']'), + ('{', '{'), + ('}', '}'), + ('«', '«'), + ('»', '»'), + ('༺', '༽'), + ('᚛', '᚜'), + ('‹', '›'), + ('⁅', '⁆'), + ('⁽', '⁾'), + ('₍', '₎'), + ('⅀', '⅀'), + ('∁', '∄'), + ('∈', '∍'), + ('∑', '∑'), + ('∕', '∖'), + ('√', '∝'), + ('∟', '∢'), + ('∤', '∤'), + ('∦', '∦'), + ('∫', '∳'), + ('∹', '∹'), + ('∻', '≌'), + ('≒', '≕'), + ('≟', '≠'), + ('≢', '≢'), + ('≤', '≫'), + ('≮', '⊌'), + ('⊏', '⊒'), + ('⊘', '⊘'), + ('⊢', '⊣'), + ('⊦', '⊸'), + ('⊾', '⊿'), + ('⋉', '⋍'), + ('⋐', '⋑'), + ('⋖', '⋭'), + ('⋰', '⋿'), + ('⌈', '⌋'), + ('⌠', '⌡'), + ('〈', '〉'), + ('❨', '❵'), + ('⟀', '⟀'), + ('⟃', '⟆'), + ('⟈', '⟉'), + ('⟋', '⟍'), + ('⟓', '⟖'), + ('⟜', '⟞'), + ('⟢', '⟯'), + ('⦃', '⦘'), + ('⦛', '⦠'), + ('⦢', '⦯'), + ('⦸', '⦸'), + ('⧀', '⧅'), + ('⧉', '⧉'), + ('⧎', '⧒'), + ('⧔', '⧕'), + ('⧘', '⧜'), + ('⧡', '⧡'), + ('⧣', '⧥'), + ('⧨', '⧩'), + ('⧴', '⧹'), + ('⧼', '⧽'), + ('⨊', '⨜'), + ('⨞', '⨡'), + ('⨤', '⨤'), + ('⨦', '⨦'), + ('⨩', '⨩'), + ('⨫', '⨮'), + ('⨴', '⨵'), + ('⨼', '⨾'), + ('⩗', '⩘'), + ('⩤', '⩥'), + ('⩪', '⩭'), + ('⩯', '⩰'), + ('⩳', '⩴'), + ('⩹', '⪣'), + ('⪦', '⪭'), + ('⪯', '⫖'), + ('⫝̸', '⫝̸'), + ('⫞', '⫞'), + ('⫢', '⫦'), + ('⫬', '⫮'), + ('⫳', '⫳'), + ('⫷', '⫻'), + ('⫽', '⫽'), + ('⯾', '⯾'), + ('⸂', '⸅'), + ('⸉', '⸊'), + ('⸌', '⸍'), + ('⸜', '⸝'), + ('⸠', '⸩'), + ('〈', '】'), + ('〔', '〛'), + ('﹙', '﹞'), + ('﹤', '﹥'), + ('(', ')'), + ('<', '<'), + ('>', '>'), + ('[', '['), + (']', ']'), + ('{', '{'), + ('}', '}'), + ('⦅', '⦆'), + ('「', '」'), + ('𝛛', '𝛛'), + ('𝜕', '𝜕'), + ('𝝏', '𝝏'), + ('𝞉', '𝞉'), + ('𝟃', '𝟃'), +]; + pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\'', '\''), ('.', '.'), @@ -776,6 +909,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('·', '·'), ('\u{483}', '\u{489}'), ('ՙ', 'ՙ'), + ('՟', '՟'), ('\u{591}', '\u{5bd}'), ('\u{5bf}', '\u{5bf}'), ('\u{5c1}', '\u{5c2}'), @@ -834,7 +968,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{b3f}', '\u{b3f}'), ('\u{b41}', '\u{b44}'), ('\u{b4d}', '\u{b4d}'), - ('\u{b56}', '\u{b56}'), + ('\u{b55}', '\u{b56}'), ('\u{b62}', '\u{b63}'), ('\u{b82}', '\u{b82}'), ('\u{bc0}', '\u{bc0}'), @@ -857,6 +991,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{d41}', '\u{d44}'), ('\u{d4d}', '\u{d4d}'), ('\u{d62}', '\u{d63}'), + ('\u{d81}', '\u{d81}'), ('\u{dca}', '\u{dca}'), ('\u{dd2}', '\u{dd4}'), ('\u{dd6}', '\u{dd6}'), @@ -918,7 +1053,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), ('ᪧ', 'ᪧ'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b34}'), ('\u{1b36}', '\u{1b3a}'), @@ -991,6 +1126,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{a806}', '\u{a806}'), ('\u{a80b}', '\u{a80b}'), ('\u{a825}', '\u{a826}'), + ('\u{a82c}', '\u{a82c}'), ('\u{a8c4}', '\u{a8c5}'), ('\u{a8e0}', '\u{a8f1}'), ('\u{a8ff}', '\u{a8ff}'), @@ -999,7 +1135,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{a980}', '\u{a982}'), ('\u{a9b3}', '\u{a9b3}'), ('\u{a9b6}', '\u{a9b9}'), - ('\u{a9bc}', 'ꦽ'), + ('\u{a9bc}', '\u{a9bd}'), ('ꧏ', 'ꧏ'), ('\u{a9e5}', 'ꧦ'), ('\u{aa29}', '\u{aa2e}'), @@ -1019,6 +1155,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('ꫳ', 'ꫴ'), ('\u{aaf6}', '\u{aaf6}'), ('꭛', 'ꭟ'), + ('\u{ab69}', '\u{ab6b}'), ('\u{abe5}', '\u{abe5}'), ('\u{abe8}', '\u{abe8}'), ('\u{abed}', '\u{abed}'), @@ -1049,6 +1186,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{10a3f}', '\u{10a3f}'), ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), @@ -1064,6 +1202,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{11180}', '\u{11181}'), ('\u{111b6}', '\u{111be}'), ('\u{111c9}', '\u{111cc}'), + ('\u{111cf}', '\u{111cf}'), ('\u{1122f}', '\u{11231}'), ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), @@ -1099,6 +1238,9 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{11727}', '\u{1172b}'), ('\u{1182f}', '\u{11837}'), ('\u{11839}', '\u{1183a}'), + ('\u{1193b}', '\u{1193c}'), + ('\u{1193e}', '\u{1193e}'), + ('\u{11943}', '\u{11943}'), ('\u{119d4}', '\u{119d7}'), ('\u{119da}', '\u{119db}'), ('\u{119e0}', '\u{119e0}'), @@ -1133,7 +1275,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{16f4f}', '\u{16f4f}'), ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), + ('𖿣', '\u{16fe4}'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1bca0}', '\u{1bca3}'), ('\u{1d167}', '\u{1d169}'), @@ -1152,10 +1294,10 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), - ('\u{1e130}', '\u{1e13d}'), + ('\u{1e130}', '𞄽'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), - ('\u{1e944}', '\u{1e94b}'), + ('\u{1e944}', '𞥋'), ('🏻', '🏿'), ('\u{e0001}', '\u{e0001}'), ('\u{e0020}', '\u{e007f}'), @@ -1252,11 +1394,12 @@ pub const CASED: &'static [(char, char)] = &[ ('Ꚁ', 'ꚝ'), ('Ꜣ', 'ꞇ'), ('Ꞌ', 'ꞎ'), - ('Ꞑ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), + ('Ꞑ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', '\u{a7f6}'), ('ꟸ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab68}'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -1903,11 +2046,13 @@ pub const CHANGES_WHEN_CASEFOLDED: &'static [(char, char)] = &[ ('Ʞ', 'Ꞵ'), ('Ꞷ', 'Ꞷ'), ('Ꞹ', 'Ꞹ'), - ('\u{a7ba}', '\u{a7ba}'), - ('\u{a7bc}', '\u{a7bc}'), - ('\u{a7be}', '\u{a7be}'), - ('\u{a7c2}', '\u{a7c2}'), - ('\u{a7c4}', '\u{a7c6}'), + ('Ꞻ', 'Ꞻ'), + ('Ꞽ', 'Ꞽ'), + ('Ꞿ', 'Ꞿ'), + ('Ꟃ', 'Ꟃ'), + ('Ꞔ', '\u{a7c7}'), + ('\u{a7c9}', '\u{a7c9}'), + ('\u{a7f5}', '\u{a7f5}'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -2028,8 +2173,9 @@ pub const CHANGES_WHEN_CASEMAPPED: &'static [(char, char)] = &[ ('Ꞌ', 'Ɥ'), ('Ꞑ', 'ꞔ'), ('Ꞗ', 'Ɪ'), - ('Ʞ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), + ('Ʞ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', '\u{a7f6}'), ('ꭓ', 'ꭓ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), @@ -2634,11 +2780,13 @@ pub const CHANGES_WHEN_LOWERCASED: &'static [(char, char)] = &[ ('Ʞ', 'Ꞵ'), ('Ꞷ', 'Ꞷ'), ('Ꞹ', 'Ꞹ'), - ('\u{a7ba}', '\u{a7ba}'), - ('\u{a7bc}', '\u{a7bc}'), - ('\u{a7be}', '\u{a7be}'), - ('\u{a7c2}', '\u{a7c2}'), - ('\u{a7c4}', '\u{a7c6}'), + ('Ꞻ', 'Ꞻ'), + ('Ꞽ', 'Ꞽ'), + ('Ꞿ', 'Ꞿ'), + ('Ꟃ', 'Ꟃ'), + ('Ꞔ', '\u{a7c7}'), + ('\u{a7c9}', '\u{a7c9}'), + ('\u{a7f5}', '\u{a7f5}'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), @@ -3249,10 +3397,13 @@ pub const CHANGES_WHEN_TITLECASED: &'static [(char, char)] = &[ ('ꞵ', 'ꞵ'), ('ꞷ', 'ꞷ'), ('ꞹ', 'ꞹ'), - ('\u{a7bb}', '\u{a7bb}'), - ('\u{a7bd}', '\u{a7bd}'), - ('\u{a7bf}', '\u{a7bf}'), - ('\u{a7c3}', '\u{a7c3}'), + ('ꞻ', 'ꞻ'), + ('ꞽ', 'ꞽ'), + ('ꞿ', 'ꞿ'), + ('ꟃ', 'ꟃ'), + ('\u{a7c8}', '\u{a7c8}'), + ('\u{a7ca}', '\u{a7ca}'), + ('\u{a7f6}', '\u{a7f6}'), ('ꭓ', 'ꭓ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), @@ -3868,10 +4019,13 @@ pub const CHANGES_WHEN_UPPERCASED: &'static [(char, char)] = &[ ('ꞵ', 'ꞵ'), ('ꞷ', 'ꞷ'), ('ꞹ', 'ꞹ'), - ('\u{a7bb}', '\u{a7bb}'), - ('\u{a7bd}', '\u{a7bd}'), - ('\u{a7bf}', '\u{a7bf}'), - ('\u{a7c3}', '\u{a7c3}'), + ('ꞻ', 'ꞻ'), + ('ꞽ', 'ꞽ'), + ('ꞿ', 'ꞿ'), + ('ꟃ', 'ꟃ'), + ('\u{a7c8}', '\u{a7c8}'), + ('\u{a7ca}', '\u{a7ca}'), + ('\u{a7f6}', '\u{a7f6}'), ('ꭓ', 'ꭓ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), @@ -3907,6 +4061,7 @@ pub const DASH: &'static [(char, char)] = &[ ('﹘', '﹘'), ('﹣', '﹣'), ('-', '-'), + ('\u{10ead}', '\u{10ead}'), ]; pub const DEFAULT_IGNORABLE_CODE_POINT: &'static [(char, char)] = &[ @@ -3983,6 +4138,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{afd}', '\u{aff}'), ('\u{b3c}', '\u{b3c}'), ('\u{b4d}', '\u{b4d}'), + ('\u{b55}', '\u{b55}'), ('\u{bcd}', '\u{bcd}'), ('\u{c4d}', '\u{c4d}'), ('\u{cbc}', '\u{cbc}'), @@ -4060,6 +4216,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{aabf}', 'ꫂ'), ('\u{aaf6}', '\u{aaf6}'), ('꭛', 'ꭟ'), + ('\u{ab69}', '\u{ab6b}'), ('꯬', '\u{abed}'), ('\u{fb1e}', '\u{fb1e}'), ('\u{fe20}', '\u{fe2f}'), @@ -4091,6 +4248,8 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('𑚶', '\u{116b7}'), ('\u{1172b}', '\u{1172b}'), ('\u{11839}', '\u{1183a}'), + ('\u{1193d}', '\u{1193e}'), + ('\u{11943}', '\u{11943}'), ('\u{119e0}', '\u{119e0}'), ('\u{11a34}', '\u{11a34}'), ('\u{11a47}', '\u{11a47}'), @@ -4102,6 +4261,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f8f}', '𖾟'), + ('\u{16ff0}', '\u{16ff1}'), ('\u{1d167}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -4161,6 +4321,7 @@ pub const EMOJI: &'static [(char, char)] = &[ ('⚙', '⚙'), ('⚛', '⚜'), ('⚠', '⚡'), + ('⚧', '⚧'), ('⚪', '⚫'), ('⚰', '⚱'), ('⚽', '⚾'), @@ -4247,25 +4408,25 @@ pub const EMOJI: &'static [(char, char)] = &[ ('🗺', '🙏'), ('🚀', '🛅'), ('🛋', '🛒'), - ('\u{1f6d5}', '\u{1f6d5}'), + ('🛕', '\u{1f6d7}'), ('🛠', '🛥'), ('🛩', '🛩'), ('🛫', '🛬'), ('🛰', '🛰'), - ('🛳', '\u{1f6fa}'), - ('\u{1f7e0}', '\u{1f7eb}'), - ('\u{1f90d}', '🤺'), + ('🛳', '\u{1f6fc}'), + ('🟠', '🟫'), + ('\u{1f90c}', '🤺'), ('🤼', '🥅'), - ('🥇', '\u{1f971}'), - ('🥳', '🥶'), - ('🥺', '🦢'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9ca}'), - ('\u{1f9cd}', '🧿'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), + ('🥇', '\u{1f978}'), + ('🥺', '\u{1f9cb}'), + ('🧍', '🧿'), + ('🩰', '\u{1fa74}'), + ('🩸', '🩺'), + ('🪀', '\u{1fa86}'), + ('🪐', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), ]; pub const EMOJI_COMPONENT: &'static [(char, char)] = &[ @@ -4310,15 +4471,17 @@ pub const EMOJI_MODIFIER_BASE: &'static [(char, char)] = &[ ('🚴', '🚶'), ('🛀', '🛀'), ('🛌', '🛌'), - ('\u{1f90f}', '\u{1f90f}'), + ('\u{1f90c}', '\u{1f90c}'), + ('🤏', '🤏'), ('🤘', '🤟'), ('🤦', '🤦'), ('🤰', '🤹'), ('🤼', '🤾'), + ('\u{1f977}', '\u{1f977}'), ('🦵', '🦶'), ('🦸', '🦹'), - ('\u{1f9bb}', '\u{1f9bb}'), - ('\u{1f9cd}', '\u{1f9cf}'), + ('🦻', '🦻'), + ('🧍', '🧏'), ('🧑', '🧝'), ]; @@ -4388,22 +4551,22 @@ pub const EMOJI_PRESENTATION: &'static [(char, char)] = &[ ('🚀', '🛅'), ('🛌', '🛌'), ('🛐', '🛒'), - ('\u{1f6d5}', '\u{1f6d5}'), + ('🛕', '\u{1f6d7}'), ('🛫', '🛬'), - ('🛴', '\u{1f6fa}'), - ('\u{1f7e0}', '\u{1f7eb}'), - ('\u{1f90d}', '🤺'), + ('🛴', '\u{1f6fc}'), + ('🟠', '🟫'), + ('\u{1f90c}', '🤺'), ('🤼', '🥅'), - ('🥇', '\u{1f971}'), - ('🥳', '🥶'), - ('🥺', '🦢'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9ca}'), - ('\u{1f9cd}', '🧿'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), + ('🥇', '\u{1f978}'), + ('🥺', '\u{1f9cb}'), + ('🧍', '🧿'), + ('🩰', '\u{1fa74}'), + ('🩸', '🩺'), + ('🪀', '\u{1fa86}'), + ('🪐', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), ]; pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ @@ -4460,7 +4623,7 @@ pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ ('🀀', '\u{1f0ff}'), ('\u{1f10d}', '\u{1f10f}'), ('🄯', '🄯'), - ('\u{1f16c}', '🅱'), + ('🅬', '🅱'), ('🅾', '🅿'), ('🆎', '🆎'), ('🆑', '🆚'), @@ -4483,7 +4646,8 @@ pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ ('\u{1f8ae}', '\u{1f8ff}'), ('\u{1f90c}', '🤺'), ('🤼', '🥅'), - ('🥇', '\u{1fffd}'), + ('🥇', '\u{1faff}'), + ('\u{1fc00}', '\u{1fffd}'), ]; pub const EXTENDER: &'static [(char, char)] = &[ @@ -4491,6 +4655,7 @@ pub const EXTENDER: &'static [(char, char)] = &[ ('ː', 'ˑ'), ('ـ', 'ـ'), ('ߺ', 'ߺ'), + ('\u{b55}', '\u{b55}'), ('ๆ', 'ๆ'), ('ໆ', 'ໆ'), ('᠊', '᠊'), @@ -4515,8 +4680,8 @@ pub const EXTENDER: &'static [(char, char)] = &[ ('\u{11a98}', '\u{11a98}'), ('𖭂', '𖭃'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('\u{1e13c}', '\u{1e13d}'), + ('𖿣', '𖿣'), + ('𞄼', '𞄽'), ('\u{1e944}', '\u{1e946}'), ]; @@ -4564,7 +4729,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('࡞', '࡞'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('ः', 'ह'), ('ऻ', 'ऻ'), ('ऽ', 'ी'), @@ -4655,7 +4820,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ౘ', 'ౚ'), ('ౠ', 'ౡ'), ('౦', '౯'), - ('\u{c77}', 'ಀ'), + ('౷', 'ಀ'), ('ಂ', 'ಌ'), ('ಎ', 'ಐ'), ('ಒ', 'ನ'), @@ -4670,8 +4835,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ೠ', 'ೡ'), ('೦', '೯'), ('ೱ', 'ೲ'), - ('ം', 'ഃ'), - ('അ', 'ഌ'), + ('ം', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -4698,8 +4862,8 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๏', '๛'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ະ'), ('າ', 'ຳ'), @@ -4823,7 +4987,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', '᳷'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ᴀ', 'ᶿ'), ('Ḁ', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -4853,7 +5017,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('⑀', '⑊'), ('①', '⭳'), ('⭶', '⮕'), - ('⮘', 'Ⱞ'), + ('\u{2b97}', 'Ⱞ'), ('ⰰ', 'ⱞ'), ('Ⱡ', 'ⳮ'), ('Ⳳ', 'ⳳ'), @@ -4871,7 +5035,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ⷈ', 'ⷎ'), ('ⷐ', 'ⷖ'), ('ⷘ', 'ⷞ'), - ('⸀', '\u{2e4f}'), + ('⸀', '\u{2e52}'), ('⺀', '⺙'), ('⺛', '⻳'), ('⼀', '⿕'), @@ -4882,11 +5046,9 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('゛', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('㆐', 'ㆺ'), - ('㇀', '㇣'), + ('㆐', '㇣'), ('ㇰ', '㈞'), - ('㈠', '䶵'), - ('䷀', '鿯'), + ('㈠', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('꒐', '꓆'), ('ꓐ', 'ꘫ'), @@ -4895,9 +5057,9 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('꙾', 'ꚝ'), ('ꚠ', 'ꛯ'), ('꛲', '꛷'), - ('꜀', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠁ'), + ('꜀', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠤ'), @@ -4939,7 +5101,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), - ('ꬰ', '\u{ab67}'), + ('ꬰ', '\u{ab6b}'), ('ꭰ', 'ꯤ'), ('ꯦ', 'ꯧ'), ('ꯩ', '꯬'), @@ -4987,7 +5149,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𐄀', '𐄂'), ('𐄇', '𐄳'), ('𐄷', '𐆎'), - ('𐆐', '𐆛'), + ('𐆐', '\u{1019c}'), ('𐆠', '𐆠'), ('𐇐', '𐇼'), ('𐊀', '𐊜'), @@ -5045,10 +5207,14 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𐳺', '𐴣'), ('𐴰', '𐴹'), ('𐹠', '𐹾'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10ead}', '\u{10ead}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼧'), ('𐼰', '𐽅'), ('𐽑', '𐽙'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fcb}'), + ('𐿠', '𐿶'), ('𑀀', '𑀀'), ('𑀂', '𑀷'), ('𑁇', '𑁍'), @@ -5061,12 +5227,12 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑃰', '𑃹'), ('𑄃', '𑄦'), ('𑄬', '𑄬'), - ('𑄶', '𑅆'), + ('𑄶', '\u{11147}'), ('𑅐', '𑅲'), ('𑅴', '𑅶'), ('𑆂', '𑆵'), ('𑆿', '𑇈'), - ('𑇍', '𑇍'), + ('𑇍', '\u{111ce}'), ('𑇐', '𑇟'), ('𑇡', '𑇴'), ('𑈀', '𑈑'), @@ -5099,10 +5265,9 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑐀', '𑐷'), ('𑑀', '𑑁'), ('𑑅', '𑑅'), - ('𑑇', '𑑙'), - ('𑑛', '𑑛'), + ('𑑇', '𑑛'), ('𑑝', '𑑝'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑒯'), ('𑒱', '𑒲'), ('𑒹', '𑒹'), @@ -5126,7 +5291,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑚬', '𑚬'), ('𑚮', '𑚯'), ('𑚶', '𑚶'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑛀', '𑛉'), ('𑜀', '𑜚'), ('𑜠', '𑜡'), @@ -5136,11 +5301,21 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑠸', '𑠸'), ('𑠻', '𑠻'), ('𑢠', '𑣲'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d3}'), - ('\u{119dc}', '\u{119df}'), - ('\u{119e1}', '\u{119e4}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{1192f}'), + ('\u{11931}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193d}', '\u{1193d}'), + ('\u{1193f}', '\u{11942}'), + ('\u{11944}', '\u{11946}'), + ('\u{11950}', '\u{11959}'), + ('𑦠', '𑦧'), + ('𑦪', '𑧓'), + ('𑧜', '𑧟'), + ('𑧡', '𑧤'), ('𑨀', '𑨀'), ('𑨋', '𑨲'), ('𑨹', '𑨺'), @@ -5174,8 +5349,9 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑶠', '𑶩'), ('𑻠', '𑻲'), ('𑻵', '𑻸'), - ('\u{11fc0}', '\u{11ff1}'), - ('\u{11fff}', '𒎙'), + ('\u{11fb0}', '\u{11fb0}'), + ('𑿀', '𑿱'), + ('𑿿', '𒎙'), ('𒐀', '𒑮'), ('𒑰', '𒑴'), ('𒒀', '𒕃'), @@ -5194,15 +5370,17 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖺚'), - ('𖼀', '\u{16f4a}'), - ('𖽐', '\u{16f87}'), + ('𖼀', '𖽊'), + ('𖽐', '𖾇'), ('𖾓', '𖾟'), - ('𖿠', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿠', '𖿣'), + ('\u{16ff0}', '\u{16ff1}'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -5248,21 +5426,21 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𝩭', '𝩴'), ('𝩶', '𝪃'), ('𝪅', '𝪋'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e14e}', '\u{1e14f}'), - ('\u{1e2c0}', '\u{1e2eb}'), - ('\u{1e2f0}', '\u{1e2f9}'), - ('\u{1e2ff}', '\u{1e2ff}'), + ('𞄀', '𞄬'), + ('𞄷', '𞄽'), + ('𞅀', '𞅉'), + ('𞅎', '𞅏'), + ('𞋀', '𞋫'), + ('𞋰', '𞋹'), + ('𞋿', '𞋿'), ('𞠀', '𞣄'), ('𞣇', '𞣏'), ('𞤀', '𞥃'), - ('\u{1e94b}', '\u{1e94b}'), + ('𞥋', '𞥋'), ('𞥐', '𞥙'), ('𞥞', '𞥟'), ('𞱱', '𞲴'), - ('\u{1ed01}', '\u{1ed3d}'), + ('𞴁', '𞴽'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), ('𞸡', '𞸢'), @@ -5303,43 +5481,45 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄀', '🄌'), - ('🄐', '\u{1f16c}'), - ('🅰', '🆬'), + ('🄀', '\u{1f1ad}'), ('🇦', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), - ('🌀', '\u{1f6d5}'), + ('🌀', '\u{1f6d7}'), ('🛠', '🛬'), - ('🛰', '\u{1f6fa}'), + ('🛰', '\u{1f6fc}'), ('🜀', '🝳'), ('🞀', '🟘'), - ('\u{1f7e0}', '\u{1f7eb}'), + ('🟠', '🟫'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('🤀', '🤋'), - ('\u{1f90d}', '\u{1f971}'), - ('🥳', '🥶'), - ('🥺', '🦢'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9ca}'), - ('\u{1f9cd}', '\u{1fa53}'), + ('\u{1f8b0}', '\u{1f8b1}'), + ('🤀', '\u{1f978}'), + ('🥺', '\u{1f9cb}'), + ('🧍', '🩓'), ('🩠', '🩭'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), - ('𠀀', '𪛖'), + ('🩰', '\u{1fa74}'), + ('🩸', '🩺'), + ('🪀', '\u{1fa86}'), + ('🪐', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), + ('\u{1fb00}', '\u{1fb92}'), + ('\u{1fb94}', '\u{1fbca}'), + ('\u{1fbf0}', '\u{1fbf9}'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ @@ -5403,7 +5583,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{b3e}', '\u{b3f}'), ('\u{b41}', '\u{b44}'), ('\u{b4d}', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('\u{b62}', '\u{b63}'), ('\u{b82}', '\u{b82}'), ('\u{bbe}', '\u{bbe}'), @@ -5432,6 +5612,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{d4d}', '\u{d4d}'), ('\u{d57}', '\u{d57}'), ('\u{d62}', '\u{d63}'), + ('\u{d81}', '\u{d81}'), ('\u{dca}', '\u{dca}'), ('\u{dcf}', '\u{dcf}'), ('\u{dd2}', '\u{dd4}'), @@ -5490,7 +5671,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{1a65}', '\u{1a6c}'), ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b3a}'), ('\u{1b3c}', '\u{1b3c}'), @@ -5529,6 +5710,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{a806}', '\u{a806}'), ('\u{a80b}', '\u{a80b}'), ('\u{a825}', '\u{a826}'), + ('\u{a82c}', '\u{a82c}'), ('\u{a8c4}', '\u{a8c5}'), ('\u{a8e0}', '\u{a8f1}'), ('\u{a8ff}', '\u{a8ff}'), @@ -5537,7 +5719,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{a980}', '\u{a982}'), ('\u{a9b3}', '\u{a9b3}'), ('\u{a9b6}', '\u{a9b9}'), - ('\u{a9bc}', 'ꦽ'), + ('\u{a9bc}', '\u{a9bd}'), ('\u{a9e5}', '\u{a9e5}'), ('\u{aa29}', '\u{aa2e}'), ('\u{aa31}', '\u{aa32}'), @@ -5569,6 +5751,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{10a3f}', '\u{10a3f}'), ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), @@ -5582,6 +5765,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{11180}', '\u{11181}'), ('\u{111b6}', '\u{111be}'), ('\u{111c9}', '\u{111cc}'), + ('\u{111cf}', '\u{111cf}'), ('\u{1122f}', '\u{11231}'), ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), @@ -5622,6 +5806,10 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{11727}', '\u{1172b}'), ('\u{1182f}', '\u{11837}'), ('\u{11839}', '\u{1183a}'), + ('\u{11930}', '\u{11930}'), + ('\u{1193b}', '\u{1193c}'), + ('\u{1193e}', '\u{1193e}'), + ('\u{11943}', '\u{11943}'), ('\u{119d4}', '\u{119d7}'), ('\u{119da}', '\u{119db}'), ('\u{119e0}', '\u{119e0}'), @@ -5653,6 +5841,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), ('\u{16f8f}', '\u{16f92}'), + ('\u{16fe4}', '\u{16fe4}'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1d165}', '\u{1d165}'), ('\u{1d167}', '\u{1d169}'), @@ -5705,6 +5894,7 @@ pub const GRAPHEME_LINK: &'static [(char, char)] = &[ ('᯲', '᯳'), ('\u{2d7f}', '\u{2d7f}'), ('\u{a806}', '\u{a806}'), + ('\u{a82c}', '\u{a82c}'), ('\u{a8c4}', '\u{a8c4}'), ('꥓', '꥓'), ('꧀', '꧀'), @@ -5726,6 +5916,7 @@ pub const GRAPHEME_LINK: &'static [(char, char)] = &[ ('𑚶', '𑚶'), ('\u{1172b}', '\u{1172b}'), ('\u{11839}', '\u{11839}'), + ('\u{1193d}', '\u{1193e}'), ('\u{119e0}', '\u{119e0}'), ('\u{11a34}', '\u{11a34}'), ('\u{11a47}', '\u{11a47}'), @@ -5815,7 +6006,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ࡀ', '\u{85b}'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('\u{8d3}', '\u{8e1}'), ('\u{8e3}', '\u{963}'), ('०', '९'), @@ -5875,7 +6066,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{b3c}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('ଡ଼', 'ଢ଼'), ('ୟ', '\u{b63}'), ('୦', '୯'), @@ -5921,8 +6112,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), - ('\u{d00}', 'ഃ'), - ('അ', 'ഌ'), + ('\u{d00}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', '\u{d44}'), ('െ', 'ൈ'), @@ -5931,7 +6121,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ൟ', '\u{d63}'), ('൦', '൯'), ('ൺ', 'ൿ'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('අ', 'ඖ'), ('ක', 'න'), ('ඳ', 'ර'), @@ -5948,8 +6138,8 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('๐', '๙'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ຽ'), ('ເ', 'ໄ'), @@ -6032,6 +6222,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('᪐', '᪙'), ('ᪧ', 'ᪧ'), ('\u{1ab0}', '\u{1abd}'), + ('\u{1abf}', '\u{1ac0}'), ('\u{1b00}', 'ᭋ'), ('᭐', '᭙'), ('\u{1b6b}', '\u{1b73}'), @@ -6043,7 +6234,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('Ა', 'Ჺ'), ('Ჽ', 'Ჿ'), ('\u{1cd0}', '\u{1cd2}'), - ('\u{1cd4}', '\u{1cfa}'), + ('\u{1cd4}', 'ᳺ'), ('ᴀ', '\u{1df9}'), ('\u{1dfb}', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -6114,10 +6305,10 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -6127,9 +6318,10 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ꙿ', '\u{a6f1}'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠧ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠧ'), + ('\u{a82c}', '\u{a82c}'), ('ꡀ', 'ꡳ'), ('ꢀ', '\u{a8c5}'), ('꣐', '꣙'), @@ -6155,7 +6347,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab69}'), ('ꭰ', 'ꯪ'), ('꯬', '\u{abed}'), ('꯰', '꯹'), @@ -6254,10 +6446,14 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), ('𐴰', '𐴹'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eab}', '\u{10eac}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '\u{10f50}'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀀', '\u{11046}'), ('𑁦', '𑁯'), ('\u{1107f}', '\u{110ba}'), @@ -6265,12 +6461,12 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𑃰', '𑃹'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑄿'), - ('𑅄', '𑅆'), + ('𑅄', '\u{11147}'), ('𑅐', '\u{11173}'), ('𑅶', '𑅶'), ('\u{11180}', '𑇄'), ('\u{111c9}', '\u{111cc}'), - ('𑇐', '𑇚'), + ('\u{111ce}', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), ('𑈓', '\u{11237}'), @@ -6299,7 +6495,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{11370}', '\u{11374}'), ('𑐀', '𑑊'), ('𑑐', '𑑙'), - ('\u{1145e}', '\u{1145f}'), + ('\u{1145e}', '\u{11461}'), ('𑒀', '𑓅'), ('𑓇', '𑓇'), ('𑓐', '𑓙'), @@ -6309,18 +6505,25 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𑘀', '\u{11640}'), ('𑙄', '𑙄'), ('𑙐', '𑙙'), - ('𑚀', '\u{116b8}'), + ('𑚀', '𑚸'), ('𑛀', '𑛉'), ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜹'), ('𑠀', '\u{1183a}'), ('𑢠', '𑣩'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d7}'), - ('\u{119da}', '\u{119e1}'), - ('\u{119e3}', '\u{119e4}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{11943}'), + ('\u{11950}', '\u{11959}'), + ('𑦠', '𑦧'), + ('𑦪', '\u{119d7}'), + ('\u{119da}', '𑧡'), + ('𑧣', '𑧤'), ('𑨀', '\u{11a3e}'), ('\u{11a47}', '\u{11a47}'), ('𑩐', '\u{11a99}'), @@ -6347,6 +6550,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𑶓', '𑶘'), ('𑶠', '𑶩'), ('𑻠', '𑻶'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -6363,16 +6567,18 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), - ('\u{16f4f}', '\u{16f87}'), + ('𖼀', '𖽊'), + ('\u{16f4f}', '𖾇'), ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '\u{16fe4}'), + ('\u{16ff0}', '\u{16ff1}'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -6427,14 +6633,14 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e130}', '\u{1e13d}'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2f9}'), + ('𞄀', '𞄬'), + ('\u{1e130}', '𞄽'), + ('𞅀', '𞅉'), + ('𞅎', '𞅎'), + ('𞋀', '𞋹'), ('𞠀', '𞣄'), ('\u{1e8d0}', '\u{1e8d6}'), - ('𞤀', '\u{1e94b}'), + ('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), @@ -6469,12 +6675,14 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '𪛖'), + ('\u{1fbf0}', '\u{1fbf9}'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ('\u{e0100}', '\u{e01ef}'), ]; @@ -6529,7 +6737,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -6605,7 +6813,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ೞ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('അ', 'ഌ'), + ('\u{d04}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -6623,8 +6831,8 @@ pub const ID_START: &'static [(char, char)] = &[ ('เ', 'ๆ'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ະ'), ('າ', 'ຳ'), @@ -6708,7 +6916,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', 'ᳶ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ᴀ', 'ᶿ'), ('Ḁ', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -6774,10 +6982,10 @@ pub const ID_START: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -6788,9 +6996,9 @@ pub const ID_START: &'static [(char, char)] = &[ ('ꚠ', 'ꛯ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠁ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -6827,7 +7035,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab69}'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -6912,15 +7120,19 @@ pub const ID_START: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀃', '𑀷'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), + ('\u{11147}', '\u{11147}'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -6946,7 +7158,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -6955,15 +7167,21 @@ pub const ID_START: &'static [(char, char)] = &[ ('𑘀', '𑘯'), ('𑙄', '𑙄'), ('𑚀', '𑚪'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑜀', '𑜚'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d0}'), - ('\u{119e1}', '\u{119e1}'), - ('\u{119e3}', '\u{119e3}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{1192f}'), + ('\u{1193f}', '\u{1193f}'), + ('\u{11941}', '\u{11941}'), + ('𑦠', '𑦧'), + ('𑦪', '𑧐'), + ('𑧡', '𑧡'), + ('𑧣', '𑧣'), ('𑨀', '𑨀'), ('𑨋', '𑨲'), ('𑨺', '𑨺'), @@ -6984,6 +7202,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -6997,16 +7216,17 @@ pub const ID_START: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), + ('𖼀', '𖽊'), ('𖽐', '𖽐'), ('𖾓', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '𖿣'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -7042,13 +7262,13 @@ pub const ID_START: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2eb}'), + ('𞄀', '𞄬'), + ('𞄷', '𞄽'), + ('𞅎', '𞅎'), + ('𞋀', '𞋫'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), - ('\u{1e94b}', '\u{1e94b}'), + ('𞥋', '𞥋'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), ('𞸡', '𞸢'), @@ -7082,31 +7302,35 @@ pub const ID_START: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const IDEOGRAPHIC: &'static [(char, char)] = &[ ('〆', '〇'), ('〡', '〩'), ('〸', '〺'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('豈', '舘'), ('並', '龎'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('\u{16fe4}', '\u{16fe4}'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛅰', '𛋻'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const JOIN_CONTROL: &'static [(char, char)] = &[('\u{200c}', '\u{200d}')]; @@ -7726,13 +7950,16 @@ pub const LOWERCASE: &'static [(char, char)] = &[ ('ꞵ', 'ꞵ'), ('ꞷ', 'ꞷ'), ('ꞹ', 'ꞹ'), - ('\u{a7bb}', '\u{a7bb}'), - ('\u{a7bd}', '\u{a7bd}'), - ('\u{a7bf}', '\u{a7bf}'), - ('\u{a7c3}', '\u{a7c3}'), + ('ꞻ', 'ꞻ'), + ('ꞽ', 'ꞽ'), + ('ꞿ', 'ꞿ'), + ('ꟃ', 'ꟃ'), + ('\u{a7c8}', '\u{a7c8}'), + ('\u{a7ca}', '\u{a7ca}'), + ('\u{a7f6}', '\u{a7f6}'), ('ꟸ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab68}'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -8013,7 +8240,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('ൊ', 'ൌ'), ('\u{d57}', '\u{d57}'), ('\u{d62}', '\u{d63}'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('\u{dcf}', '\u{dd4}'), ('\u{dd6}', '\u{dd6}'), ('ෘ', '\u{ddf}'), @@ -8051,8 +8278,9 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{1a17}', '\u{1a1b}'), ('ᩕ', '\u{1a5e}'), ('ᩡ', '\u{1a74}'), + ('\u{1abf}', '\u{1ac0}'), ('\u{1b00}', 'ᬄ'), - ('ᬵ', 'ᭃ'), + ('\u{1b35}', 'ᭃ'), ('\u{1b80}', 'ᮂ'), ('ᮡ', '\u{1ba9}'), ('\u{1bac}', '\u{1bad}'), @@ -8092,6 +8320,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{10a05}', '\u{10a06}'), ('\u{10a0c}', '\u{10a0f}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11045}'), ('𑂂', '𑂂'), @@ -8101,6 +8330,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('𑅅', '𑅆'), ('\u{11180}', '𑆂'), ('𑆳', '𑆿'), + ('\u{111ce}', '\u{111cf}'), ('𑈬', '\u{11234}'), ('\u{11237}', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), @@ -8122,9 +8352,14 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b5}'), ('\u{1171d}', '\u{1172a}'), ('𑠬', '𑠸'), - ('\u{119d1}', '\u{119d7}'), - ('\u{119da}', '\u{119df}'), - ('\u{119e4}', '\u{119e4}'), + ('\u{11930}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{1193c}'), + ('\u{11940}', '\u{11940}'), + ('\u{11942}', '\u{11942}'), + ('𑧑', '\u{119d7}'), + ('\u{119da}', '𑧟'), + ('𑧤', '𑧤'), ('\u{11a01}', '\u{11a0a}'), ('\u{11a35}', '𑨹'), ('\u{11a3b}', '\u{11a3e}'), @@ -8145,8 +8380,9 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('𑶓', '𑶖'), ('\u{11ef3}', '𑻶'), ('\u{16f4f}', '\u{16f4f}'), - ('𖽑', '\u{16f87}'), + ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), + ('\u{16ff0}', '\u{16ff1}'), ('\u{1bc9e}', '\u{1bc9e}'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), @@ -8186,7 +8422,7 @@ pub const OTHER_GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{d57}', '\u{d57}'), ('\u{dcf}', '\u{dcf}'), ('\u{ddf}', '\u{ddf}'), - ('ᬵ', 'ᬵ'), + ('\u{1b35}', '\u{1b35}'), ('\u{200c}', '\u{200c}'), ('\u{302e}', '\u{302f}'), ('\u{ff9e}', '\u{ff9f}'), @@ -8195,6 +8431,7 @@ pub const OTHER_GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{114b0}', '\u{114b0}'), ('\u{114bd}', '\u{114bd}'), ('\u{115af}', '\u{115af}'), + ('\u{11930}', '\u{11930}'), ('\u{1d165}', '\u{1d165}'), ('\u{1d16e}', '\u{1d172}'), ('\u{e0020}', '\u{e007f}'), @@ -8391,7 +8628,7 @@ pub const PATTERN_SYNTAX: &'static [(char, char)] = &[ ('⁕', '⁞'), ('←', '\u{245f}'), ('─', '❵'), - ('➔', '\u{2bff}'), + ('➔', '⯿'), ('⸀', '\u{2e7f}'), ('、', '〃'), ('〈', '〠'), @@ -8502,6 +8739,8 @@ pub const SENTENCE_TERMINAL: &'static [(char, char)] = &[ ('𑗉', '𑗗'), ('𑙁', '𑙂'), ('𑜼', '𑜾'), + ('\u{11944}', '\u{11944}'), + ('\u{11946}', '\u{11946}'), ('𑩂', '𑩃'), ('𑪛', '𑪜'), ('𑱁', '𑱂'), @@ -8593,7 +8832,7 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('⸼', '⸼'), ('⹁', '⹁'), ('⹌', '⹌'), - ('⹎', '\u{2e4f}'), + ('⹎', '⹏'), ('、', '。'), ('꓾', '꓿'), ('꘍', '꘏'), @@ -8633,11 +8872,13 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('𑈸', '𑈼'), ('𑊩', '𑊩'), ('𑑋', '𑑍'), - ('𑑛', '𑑛'), + ('\u{1145a}', '𑑛'), ('𑗂', '𑗅'), ('𑗉', '𑗗'), ('𑙁', '𑙂'), ('𑜼', '𑜾'), + ('\u{11944}', '\u{11944}'), + ('\u{11946}', '\u{11946}'), ('𑩂', '𑩃'), ('𑪛', '𑪜'), ('𑪡', '𑪢'), @@ -8655,8 +8896,8 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ]; pub const UNIFIED_IDEOGRAPH: &'static [(char, char)] = &[ - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('﨎', '﨏'), ('﨑', '﨑'), ('﨓', '﨔'), @@ -8664,11 +8905,12 @@ pub const UNIFIED_IDEOGRAPH: &'static [(char, char)] = &[ ('﨡', '﨡'), ('﨣', '﨤'), ('﨧', '﨩'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), + ('\u{30000}', '\u{3134a}'), ]; pub const UPPERCASE: &'static [(char, char)] = &[ @@ -9267,11 +9509,13 @@ pub const UPPERCASE: &'static [(char, char)] = &[ ('Ʞ', 'Ꞵ'), ('Ꞷ', 'Ꞷ'), ('Ꞹ', 'Ꞹ'), - ('\u{a7ba}', '\u{a7ba}'), - ('\u{a7bc}', '\u{a7bc}'), - ('\u{a7be}', '\u{a7be}'), - ('\u{a7c2}', '\u{a7c2}'), - ('\u{a7c4}', '\u{a7c6}'), + ('Ꞻ', 'Ꞻ'), + ('Ꞽ', 'Ꞽ'), + ('Ꞿ', 'Ꞿ'), + ('Ꟃ', 'Ꟃ'), + ('Ꞔ', '\u{a7c7}'), + ('\u{a7c9}', '\u{a7c9}'), + ('\u{a7f5}', '\u{a7f5}'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), @@ -9387,7 +9631,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ࡀ', '\u{85b}'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('\u{8d3}', '\u{8e1}'), ('\u{8e3}', '\u{963}'), ('०', '९'), @@ -9447,7 +9691,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{b3c}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('ଡ଼', 'ଢ଼'), ('ୟ', '\u{b63}'), ('୦', '୯'), @@ -9493,8 +9737,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), - ('\u{d00}', 'ഃ'), - ('അ', 'ഌ'), + ('\u{d00}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', '\u{d44}'), ('െ', 'ൈ'), @@ -9503,7 +9746,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ൟ', '\u{d63}'), ('൦', '൯'), ('ൺ', 'ൿ'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('අ', 'ඖ'), ('ක', 'න'), ('ඳ', 'ර'), @@ -9520,8 +9763,8 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('๐', '๙'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ຽ'), ('ເ', 'ໄ'), @@ -9604,6 +9847,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('᪐', '᪙'), ('ᪧ', 'ᪧ'), ('\u{1ab0}', '\u{1abd}'), + ('\u{1abf}', '\u{1ac0}'), ('\u{1b00}', 'ᭋ'), ('᭐', '᭙'), ('\u{1b6b}', '\u{1b73}'), @@ -9615,7 +9859,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('Ა', 'Ჺ'), ('Ჽ', 'Ჿ'), ('\u{1cd0}', '\u{1cd2}'), - ('\u{1cd4}', '\u{1cfa}'), + ('\u{1cd4}', 'ᳺ'), ('ᴀ', '\u{1df9}'), ('\u{1dfb}', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -9687,10 +9931,10 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -9700,9 +9944,10 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ꙿ', '\u{a6f1}'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠧ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠧ'), + ('\u{a82c}', '\u{a82c}'), ('ꡀ', 'ꡳ'), ('ꢀ', '\u{a8c5}'), ('꣐', '꣙'), @@ -9728,7 +9973,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab69}'), ('ꭰ', 'ꯪ'), ('꯬', '\u{abed}'), ('꯰', '꯹'), @@ -9833,10 +10078,14 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), ('𐴰', '𐴹'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eab}', '\u{10eac}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '\u{10f50}'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀀', '\u{11046}'), ('𑁦', '𑁯'), ('\u{1107f}', '\u{110ba}'), @@ -9844,12 +10093,12 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𑃰', '𑃹'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑄿'), - ('𑅄', '𑅆'), + ('𑅄', '\u{11147}'), ('𑅐', '\u{11173}'), ('𑅶', '𑅶'), ('\u{11180}', '𑇄'), ('\u{111c9}', '\u{111cc}'), - ('𑇐', '𑇚'), + ('\u{111ce}', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), ('𑈓', '\u{11237}'), @@ -9878,7 +10127,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{11370}', '\u{11374}'), ('𑐀', '𑑊'), ('𑑐', '𑑙'), - ('\u{1145e}', '\u{1145f}'), + ('\u{1145e}', '\u{11461}'), ('𑒀', '𑓅'), ('𑓇', '𑓇'), ('𑓐', '𑓙'), @@ -9888,18 +10137,25 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𑘀', '\u{11640}'), ('𑙄', '𑙄'), ('𑙐', '𑙙'), - ('𑚀', '\u{116b8}'), + ('𑚀', '𑚸'), ('𑛀', '𑛉'), ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜹'), ('𑠀', '\u{1183a}'), ('𑢠', '𑣩'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d7}'), - ('\u{119da}', '\u{119e1}'), - ('\u{119e3}', '\u{119e4}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{11943}'), + ('\u{11950}', '\u{11959}'), + ('𑦠', '𑦧'), + ('𑦪', '\u{119d7}'), + ('\u{119da}', '𑧡'), + ('𑧣', '𑧤'), ('𑨀', '\u{11a3e}'), ('\u{11a47}', '\u{11a47}'), ('𑩐', '\u{11a99}'), @@ -9926,6 +10182,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𑶓', '𑶘'), ('𑶠', '𑶩'), ('𑻠', '𑻶'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -9942,16 +10199,18 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), - ('\u{16f4f}', '\u{16f87}'), + ('𖼀', '𖽊'), + ('\u{16f4f}', '𖾇'), ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '\u{16fe4}'), + ('\u{16ff0}', '\u{16ff1}'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -10006,14 +10265,14 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e130}', '\u{1e13d}'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2f9}'), + ('𞄀', '𞄬'), + ('\u{1e130}', '𞄽'), + ('𞅀', '𞅉'), + ('𞅎', '𞅎'), + ('𞋀', '𞋹'), ('𞠀', '𞣄'), ('\u{1e8d0}', '\u{1e8d6}'), - ('𞤀', '\u{1e94b}'), + ('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), @@ -10048,12 +10307,14 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '𪛖'), + ('\u{1fbf0}', '\u{1fbf9}'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ('\u{e0100}', '\u{e01ef}'), ]; @@ -10108,7 +10369,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -10184,7 +10445,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ೞ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('അ', 'ഌ'), + ('\u{d04}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -10202,8 +10463,8 @@ pub const XID_START: &'static [(char, char)] = &[ ('เ', 'ๆ'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ະ'), ('າ', 'າ'), @@ -10287,7 +10548,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', 'ᳶ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ᴀ', 'ᶿ'), ('Ḁ', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -10353,10 +10614,10 @@ pub const XID_START: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -10367,9 +10628,9 @@ pub const XID_START: &'static [(char, char)] = &[ ('ꚠ', 'ꛯ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠁ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -10406,7 +10667,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab69}'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -10498,15 +10759,19 @@ pub const XID_START: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀃', '𑀷'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), + ('\u{11147}', '\u{11147}'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -10532,7 +10797,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -10541,15 +10806,21 @@ pub const XID_START: &'static [(char, char)] = &[ ('𑘀', '𑘯'), ('𑙄', '𑙄'), ('𑚀', '𑚪'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑜀', '𑜚'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d0}'), - ('\u{119e1}', '\u{119e1}'), - ('\u{119e3}', '\u{119e3}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{1192f}'), + ('\u{1193f}', '\u{1193f}'), + ('\u{11941}', '\u{11941}'), + ('𑦠', '𑦧'), + ('𑦪', '𑧐'), + ('𑧡', '𑧡'), + ('𑧣', '𑧣'), ('𑨀', '𑨀'), ('𑨋', '𑨲'), ('𑨺', '𑨺'), @@ -10570,6 +10841,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -10583,16 +10855,17 @@ pub const XID_START: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), + ('𖼀', '𖽊'), ('𖽐', '𖽐'), ('𖾓', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '𖿣'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), @@ -10628,13 +10901,13 @@ pub const XID_START: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2eb}'), + ('𞄀', '𞄬'), + ('𞄷', '𞄽'), + ('𞅎', '𞅎'), + ('𞋀', '𞋫'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), - ('\u{1e94b}', '\u{1e94b}'), + ('𞥋', '𞥋'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), ('𞸡', '𞸢'), @@ -10668,10 +10941,11 @@ pub const XID_START: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; diff --git a/regex-syntax/src/unicode_tables/property_names.rs b/regex-syntax/src/unicode_tables/property_names.rs index 1064b61cd4..19ca856d00 100644 --- a/regex-syntax/src/unicode_tables/property_names.rs +++ b/regex-syntax/src/unicode_tables/property_names.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-names /tmp/ucd/12.1.0/ +// ucd-generate property-names ucd-13.0.0 // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const PROPERTY_NAMES: &'static [(&'static str, &'static str)] = &[ ("age", "Age"), @@ -47,7 +47,9 @@ pub const PROPERTY_NAMES: &'static [(&'static str, &'static str)] = &[ ("cjkirgkpsource", "kIRG_KPSource"), ("cjkirgksource", "kIRG_KSource"), ("cjkirgmsource", "kIRG_MSource"), + ("cjkirgssource", "kIRG_SSource"), ("cjkirgtsource", "kIRG_TSource"), + ("cjkirguksource", "kIRG_UKSource"), ("cjkirgusource", "kIRG_USource"), ("cjkirgvsource", "kIRG_VSource"), ("cjkothernumeric", "kOtherNumeric"), @@ -74,11 +76,15 @@ pub const PROPERTY_NAMES: &'static [(&'static str, &'static str)] = &[ ("dt", "Decomposition_Type"), ("ea", "East_Asian_Width"), ("eastasianwidth", "East_Asian_Width"), + ("ebase", "Emoji_Modifier_Base"), + ("ecomp", "Emoji_Component"), + ("emod", "Emoji_Modifier"), ("emoji", "Emoji"), ("emojicomponent", "Emoji_Component"), ("emojimodifier", "Emoji_Modifier"), ("emojimodifierbase", "Emoji_Modifier_Base"), ("emojipresentation", "Emoji_Presentation"), + ("epres", "Emoji_Presentation"), ("equideo", "Equivalent_Unified_Ideograph"), ("equivalentunifiedideograph", "Equivalent_Unified_Ideograph"), ("expandsonnfc", "Expands_On_NFC"), @@ -88,6 +94,7 @@ pub const PROPERTY_NAMES: &'static [(&'static str, &'static str)] = &[ ("ext", "Extender"), ("extendedpictographic", "Extended_Pictographic"), ("extender", "Extender"), + ("extpict", "Extended_Pictographic"), ("fcnfkc", "FC_NFKC_Closure"), ("fcnfkcclosure", "FC_NFKC_Closure"), ("fullcompositionexclusion", "Full_Composition_Exclusion"), @@ -138,7 +145,9 @@ pub const PROPERTY_NAMES: &'static [(&'static str, &'static str)] = &[ ("kirgkpsource", "kIRG_KPSource"), ("kirgksource", "kIRG_KSource"), ("kirgmsource", "kIRG_MSource"), + ("kirgssource", "kIRG_SSource"), ("kirgtsource", "kIRG_TSource"), + ("kirguksource", "kIRG_UKSource"), ("kirgusource", "kIRG_USource"), ("kirgvsource", "kIRG_VSource"), ("kothernumeric", "kOtherNumeric"), diff --git a/regex-syntax/src/unicode_tables/property_values.rs b/regex-syntax/src/unicode_tables/property_values.rs index 0f960b0d44..bff7d34563 100644 --- a/regex-syntax/src/unicode_tables/property_values.rs +++ b/regex-syntax/src/unicode_tables/property_values.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-values /tmp/ucd/12.1.0/ --include gc,script,scx,age,gcb,wb,sb +// ucd-generate property-values ucd-13.0.0 --include gc,script,scx,age,gcb,wb,sb // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const PROPERTY_VALUES: &'static [( &'static str, @@ -16,6 +16,7 @@ pub const PROPERTY_VALUES: &'static [( ("11.0", "V11_0"), ("12.0", "V12_0"), ("12.1", "V12_1"), + ("13.0", "V13_0"), ("2.0", "V2_0"), ("2.1", "V2_1"), ("3.0", "V3_0"), @@ -40,6 +41,7 @@ pub const PROPERTY_VALUES: &'static [( ("v110", "V11_0"), ("v120", "V12_0"), ("v121", "V12_1"), + ("v130", "V13_0"), ("v20", "V2_0"), ("v21", "V2_1"), ("v30", "V3_0"), @@ -224,6 +226,8 @@ pub const PROPERTY_VALUES: &'static [( ("cham", "Cham"), ("cher", "Cherokee"), ("cherokee", "Cherokee"), + ("chorasmian", "Chorasmian"), + ("chrs", "Chorasmian"), ("common", "Common"), ("copt", "Coptic"), ("coptic", "Coptic"), @@ -235,6 +239,8 @@ pub const PROPERTY_VALUES: &'static [( ("deseret", "Deseret"), ("deva", "Devanagari"), ("devanagari", "Devanagari"), + ("diak", "Dives_Akuru"), + ("divesakuru", "Dives_Akuru"), ("dogr", "Dogra"), ("dogra", "Dogra"), ("dsrt", "Deseret"), @@ -299,11 +305,13 @@ pub const PROPERTY_VALUES: &'static [( ("kayahli", "Kayah_Li"), ("khar", "Kharoshthi"), ("kharoshthi", "Kharoshthi"), + ("khitansmallscript", "Khitan_Small_Script"), ("khmer", "Khmer"), ("khmr", "Khmer"), ("khoj", "Khojki"), ("khojki", "Khojki"), ("khudawadi", "Khudawadi"), + ("kits", "Khitan_Small_Script"), ("knda", "Kannada"), ("kthi", "Kaithi"), ("lana", "Tai_Tham"), @@ -477,6 +485,8 @@ pub const PROPERTY_VALUES: &'static [( ("wcho", "Wancho"), ("xpeo", "Old_Persian"), ("xsux", "Cuneiform"), + ("yezi", "Yezidi"), + ("yezidi", "Yezidi"), ("yi", "Yi"), ("yiii", "Yi"), ("zanabazarsquare", "Zanabazar_Square"), @@ -533,6 +543,8 @@ pub const PROPERTY_VALUES: &'static [( ("cham", "Cham"), ("cher", "Cherokee"), ("cherokee", "Cherokee"), + ("chorasmian", "Chorasmian"), + ("chrs", "Chorasmian"), ("common", "Common"), ("copt", "Coptic"), ("coptic", "Coptic"), @@ -544,6 +556,8 @@ pub const PROPERTY_VALUES: &'static [( ("deseret", "Deseret"), ("deva", "Devanagari"), ("devanagari", "Devanagari"), + ("diak", "Dives_Akuru"), + ("divesakuru", "Dives_Akuru"), ("dogr", "Dogra"), ("dogra", "Dogra"), ("dsrt", "Deseret"), @@ -608,11 +622,13 @@ pub const PROPERTY_VALUES: &'static [( ("kayahli", "Kayah_Li"), ("khar", "Kharoshthi"), ("kharoshthi", "Kharoshthi"), + ("khitansmallscript", "Khitan_Small_Script"), ("khmer", "Khmer"), ("khmr", "Khmer"), ("khoj", "Khojki"), ("khojki", "Khojki"), ("khudawadi", "Khudawadi"), + ("kits", "Khitan_Small_Script"), ("knda", "Kannada"), ("kthi", "Kaithi"), ("lana", "Tai_Tham"), @@ -786,6 +802,8 @@ pub const PROPERTY_VALUES: &'static [( ("wcho", "Wancho"), ("xpeo", "Old_Persian"), ("xsux", "Cuneiform"), + ("yezi", "Yezidi"), + ("yezidi", "Yezidi"), ("yi", "Yi"), ("yiii", "Yi"), ("zanabazarsquare", "Zanabazar_Square"), diff --git a/regex-syntax/src/unicode_tables/script.rs b/regex-syntax/src/unicode_tables/script.rs index 19dbc38e56..a48203e4ff 100644 --- a/regex-syntax/src/unicode_tables/script.rs +++ b/regex-syntax/src/unicode_tables/script.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate script /tmp/ucd/12.1.0/ --chars +// ucd-generate script ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Adlam", ADLAM), @@ -28,6 +28,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Chakma", CHAKMA), ("Cham", CHAM), ("Cherokee", CHEROKEE), + ("Chorasmian", CHORASMIAN), ("Common", COMMON), ("Coptic", COPTIC), ("Cuneiform", CUNEIFORM), @@ -35,6 +36,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Cyrillic", CYRILLIC), ("Deseret", DESERET), ("Devanagari", DEVANAGARI), + ("Dives_Akuru", DIVES_AKURU), ("Dogra", DOGRA), ("Duployan", DUPLOYAN), ("Egyptian_Hieroglyphs", EGYPTIAN_HIEROGLYPHS), @@ -66,6 +68,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Katakana", KATAKANA), ("Kayah_Li", KAYAH_LI), ("Kharoshthi", KHAROSHTHI), + ("Khitan_Small_Script", KHITAN_SMALL_SCRIPT), ("Khmer", KHMER), ("Khojki", KHOJKI), ("Khudawadi", KHUDAWADI), @@ -155,12 +158,13 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Vai", VAI), ("Wancho", WANCHO), ("Warang_Citi", WARANG_CITI), + ("Yezidi", YEZIDI), ("Yi", YI), ("Zanabazar_Square", ZANABAZAR_SQUARE), ]; pub const ADLAM: &'static [(char, char)] = - &[('𞤀', '\u{1e94b}'), ('𞥐', '𞥙'), ('𞥞', '𞥟')]; + &[('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞥞', '𞥟')]; pub const AHOM: &'static [(char, char)] = &[('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜿')]; @@ -180,7 +184,7 @@ pub const ARABIC: &'static [(char, char)] = &[ ('۞', 'ۿ'), ('ݐ', 'ݿ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('\u{8d3}', '\u{8e1}'), ('\u{8e3}', '\u{8ff}'), ('ﭐ', '﯁'), @@ -228,7 +232,7 @@ pub const ARABIC: &'static [(char, char)] = &[ ]; pub const ARMENIAN: &'static [(char, char)] = - &[('Ա', 'Ֆ'), ('ՙ', 'ֈ'), ('֊', '֊'), ('֍', '֏'), ('ﬓ', 'ﬗ')]; + &[('Ա', 'Ֆ'), ('ՙ', '֊'), ('֍', '֏'), ('ﬓ', 'ﬗ')]; pub const AVESTAN: &'static [(char, char)] = &[('𐬀', '𐬵'), ('𐬹', '𐬿')]; @@ -262,7 +266,7 @@ pub const BHAIKSUKI: &'static [(char, char)] = &[('𑰀', '𑰈'), ('𑰊', '\u{11c36}'), ('\u{11c38}', '𑱅'), ('𑱐', '𑱬')]; pub const BOPOMOFO: &'static [(char, char)] = - &[('˪', '˫'), ('ㄅ', 'ㄯ'), ('ㆠ', 'ㆺ')]; + &[('˪', '˫'), ('ㄅ', 'ㄯ'), ('ㆠ', '\u{31bf}')]; pub const BRAHMI: &'static [(char, char)] = &[('𑀀', '𑁍'), ('𑁒', '𑁯'), ('\u{1107f}', '\u{1107f}')]; @@ -282,7 +286,7 @@ pub const CAUCASIAN_ALBANIAN: &'static [(char, char)] = &[('𐔰', '𐕣'), ('𐕯', '𐕯')]; pub const CHAKMA: &'static [(char, char)] = - &[('\u{11100}', '\u{11134}'), ('𑄶', '𑅆')]; + &[('\u{11100}', '\u{11134}'), ('𑄶', '\u{11147}')]; pub const CHAM: &'static [(char, char)] = &[('ꨀ', '\u{aa36}'), ('ꩀ', 'ꩍ'), ('꩐', '꩙'), ('꩜', '꩟')]; @@ -290,6 +294,8 @@ pub const CHAM: &'static [(char, char)] = pub const CHEROKEE: &'static [(char, char)] = &[('Ꭰ', 'Ᏽ'), ('ᏸ', 'ᏽ'), ('ꭰ', 'ꮿ')]; +pub const CHORASMIAN: &'static [(char, char)] = &[('\u{10fb0}', '\u{10fcb}')]; + pub const COMMON: &'static [(char, char)] = &[ ('\u{0}', '@'), ('[', '`'), @@ -305,7 +311,6 @@ pub const COMMON: &'static [(char, char)] = &[ (';', ';'), ('΅', '΅'), ('·', '·'), - ('։', '։'), ('\u{605}', '\u{605}'), ('،', '،'), ('؛', '؛'), @@ -326,7 +331,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', '᳷'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('\u{2000}', '\u{200b}'), ('\u{200e}', '\u{2064}'), ('\u{2066}', '⁰'), @@ -344,8 +349,8 @@ pub const COMMON: &'static [(char, char)] = &[ ('①', '⟿'), ('⤀', '⭳'), ('⭶', '⮕'), - ('⮘', '\u{2bff}'), - ('⸀', '\u{2e4f}'), + ('\u{2b97}', '⯿'), + ('⸀', '\u{2e52}'), ('⿰', '⿻'), ('\u{3000}', '〄'), ('〆', '〆'), @@ -359,7 +364,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('㇀', '㇣'), ('㈠', '㉟'), ('㉿', '㋏'), - ('\u{32ff}', '\u{32ff}'), + ('㋿', '㋿'), ('㍘', '㏿'), ('䷀', '䷿'), ('꜀', '꜡'), @@ -368,6 +373,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('꤮', '꤮'), ('ꧏ', 'ꧏ'), ('꭛', '꭛'), + ('\u{ab6a}', '\u{ab6b}'), ('﴾', '﴿'), ('︐', '︙'), ('︰', '﹒'), @@ -385,10 +391,10 @@ pub const COMMON: &'static [(char, char)] = &[ ('𐄀', '𐄂'), ('𐄇', '𐄳'), ('𐄷', '𐄿'), - ('𐆐', '𐆛'), + ('𐆐', '\u{1019c}'), ('𐇐', '𐇼'), ('𐋡', '𐋻'), - ('\u{16fe2}', '\u{16fe3}'), + ('𖿢', '𖿣'), ('\u{1bca0}', '\u{1bca3}'), ('𝀀', '𝃵'), ('𝄀', '𝄦'), @@ -422,45 +428,46 @@ pub const COMMON: &'static [(char, char)] = &[ ('𝚨', '𝟋'), ('𝟎', '𝟿'), ('𞱱', '𞲴'), - ('\u{1ed01}', '\u{1ed3d}'), + ('𞴁', '𞴽'), ('🀀', '🀫'), ('🀰', '🂓'), ('🂠', '🂮'), ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄀', '🄌'), - ('🄐', '\u{1f16c}'), - ('🅰', '🆬'), + ('🄀', '\u{1f1ad}'), ('🇦', '🇿'), ('🈁', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), - ('🌀', '\u{1f6d5}'), + ('🌀', '\u{1f6d7}'), ('🛠', '🛬'), - ('🛰', '\u{1f6fa}'), + ('🛰', '\u{1f6fc}'), ('🜀', '🝳'), ('🞀', '🟘'), - ('\u{1f7e0}', '\u{1f7eb}'), + ('🟠', '🟫'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('🤀', '🤋'), - ('\u{1f90d}', '\u{1f971}'), - ('🥳', '🥶'), - ('🥺', '🦢'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9ca}'), - ('\u{1f9cd}', '\u{1fa53}'), + ('\u{1f8b0}', '\u{1f8b1}'), + ('🤀', '\u{1f978}'), + ('🥺', '\u{1f9cb}'), + ('🧍', '🩓'), ('🩠', '🩭'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), + ('🩰', '\u{1fa74}'), + ('🩸', '🩺'), + ('🪀', '\u{1fa86}'), + ('🪐', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), + ('\u{1fb00}', '\u{1fb92}'), + ('\u{1fb94}', '\u{1fbca}'), + ('\u{1fbf0}', '\u{1fbf9}'), ('\u{e0001}', '\u{e0001}'), ('\u{e0020}', '\u{e007f}'), ]; @@ -494,6 +501,17 @@ pub const DEVANAGARI: &'static [(char, char)] = &[ ('\u{a8e0}', '\u{a8ff}'), ]; +pub const DIVES_AKURU: &'static [(char, char)] = &[ + ('\u{11900}', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{11946}'), + ('\u{11950}', '\u{11959}'), +]; + pub const DOGRA: &'static [(char, char)] = &[('𑠀', '𑠻')]; pub const DUPLOYAN: &'static [(char, char)] = @@ -504,7 +522,7 @@ pub const EGYPTIAN_HIEROGLYPHS: &'static [(char, char)] = pub const ELBASAN: &'static [(char, char)] = &[('𐔀', '𐔧')]; -pub const ELYMAIC: &'static [(char, char)] = &[('\u{10fe0}', '\u{10ff6}')]; +pub const ELYMAIC: &'static [(char, char)] = &[('𐿠', '𐿶')]; pub const ETHIOPIC: &'static [(char, char)] = &[ ('ሀ', 'ቈ'), @@ -676,16 +694,18 @@ pub const HAN: &'static [(char, char)] = &[ ('〇', '〇'), ('〡', '〩'), ('〸', '〻'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('豈', '舘'), ('並', '龎'), - ('𠀀', '𪛖'), + ('\u{16ff0}', '\u{16ff1}'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const HANGUL: &'static [(char, char)] = &[ @@ -725,13 +745,8 @@ pub const HEBREW: &'static [(char, char)] = &[ ('צּ', 'ﭏ'), ]; -pub const HIRAGANA: &'static [(char, char)] = &[ - ('ぁ', 'ゖ'), - ('ゝ', 'ゟ'), - ('𛀁', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('🈀', '🈀'), -]; +pub const HIRAGANA: &'static [(char, char)] = + &[('ぁ', 'ゖ'), ('ゝ', 'ゟ'), ('𛀁', '𛄞'), ('𛅐', '𛅒'), ('🈀', '🈀')]; pub const IMPERIAL_ARAMAIC: &'static [(char, char)] = &[('𐡀', '𐡕'), ('𐡗', '𐡟')]; @@ -742,7 +757,7 @@ pub const INHERITED: &'static [(char, char)] = &[ ('\u{64b}', '\u{655}'), ('\u{670}', '\u{670}'), ('\u{951}', '\u{954}'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1cd0}', '\u{1cd2}'), ('\u{1cd4}', '\u{1ce0}'), ('\u{1ce2}', '\u{1ce8}'), @@ -804,7 +819,7 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('ヲ', 'ッ'), ('ア', 'ン'), ('𛀀', '𛀀'), - ('\u{1b164}', '\u{1b167}'), + ('𛅤', '𛅧'), ]; pub const KAYAH_LI: &'static [(char, char)] = &[('꤀', '\u{a92d}'), ('꤯', '꤯')]; @@ -820,6 +835,9 @@ pub const KHAROSHTHI: &'static [(char, char)] = &[ ('𐩐', '𐩘'), ]; +pub const KHITAN_SMALL_SCRIPT: &'static [(char, char)] = + &[('\u{16fe4}', '\u{16fe4}'), ('\u{18b00}', '\u{18cd5}')]; + pub const KHMER: &'static [(char, char)] = &[('ក', '\u{17dd}'), ('០', '៩'), ('៰', '៹'), ('᧠', '᧿')]; @@ -831,8 +849,8 @@ pub const KHUDAWADI: &'static [(char, char)] = pub const LAO: &'static [(char, char)] = &[ ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ຽ'), ('ເ', 'ໄ'), @@ -866,12 +884,12 @@ pub const LATIN: &'static [(char, char)] = &[ ('Ⅰ', 'ↈ'), ('Ⱡ', 'Ɀ'), ('Ꜣ', 'ꞇ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꟿ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꟿ'), ('ꬰ', 'ꭚ'), ('ꭜ', 'ꭤ'), - ('\u{ab66}', '\u{ab67}'), + ('ꭦ', '\u{ab69}'), ('ff', 'st'), ('A', 'Z'), ('a', 'z'), @@ -901,7 +919,8 @@ pub const LINEAR_B: &'static [(char, char)] = &[ ('𐂀', '𐃺'), ]; -pub const LISU: &'static [(char, char)] = &[('ꓐ', '꓿')]; +pub const LISU: &'static [(char, char)] = + &[('ꓐ', '꓿'), ('\u{11fb0}', '\u{11fb0}')]; pub const LYCIAN: &'static [(char, char)] = &[('𐊀', '𐊜')]; @@ -912,8 +931,7 @@ pub const MAHAJANI: &'static [(char, char)] = &[('𑅐', '𑅶')]; pub const MAKASAR: &'static [(char, char)] = &[('𑻠', '𑻸')]; pub const MALAYALAM: &'static [(char, char)] = &[ - ('\u{d00}', 'ഃ'), - ('അ', 'ഌ'), + ('\u{d00}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', '\u{d44}'), ('െ', 'ൈ'), @@ -954,7 +972,7 @@ pub const MEROITIC_CURSIVE: &'static [(char, char)] = pub const MEROITIC_HIEROGLYPHS: &'static [(char, char)] = &[('𐦀', '𐦟')]; pub const MIAO: &'static [(char, char)] = - &[('𖼀', '\u{16f4a}'), ('\u{16f4f}', '\u{16f87}'), ('\u{16f8f}', '𖾟')]; + &[('𖼀', '𖽊'), ('\u{16f4f}', '𖾇'), ('\u{16f8f}', '𖾟')]; pub const MODI: &'static [(char, char)] = &[('𑘀', '𑙄'), ('𑙐', '𑙙')]; @@ -978,28 +996,20 @@ pub const MYANMAR: &'static [(char, char)] = pub const NABATAEAN: &'static [(char, char)] = &[('𐢀', '𐢞'), ('𐢧', '𐢯')]; -pub const NANDINAGARI: &'static [(char, char)] = &[ - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d7}'), - ('\u{119da}', '\u{119e4}'), -]; +pub const NANDINAGARI: &'static [(char, char)] = + &[('𑦠', '𑦧'), ('𑦪', '\u{119d7}'), ('\u{119da}', '𑧤')]; pub const NEW_TAI_LUE: &'static [(char, char)] = &[('ᦀ', 'ᦫ'), ('ᦰ', 'ᧉ'), ('᧐', '᧚'), ('᧞', '᧟')]; -pub const NEWA: &'static [(char, char)] = - &[('𑐀', '𑑙'), ('𑑛', '𑑛'), ('𑑝', '\u{1145f}')]; +pub const NEWA: &'static [(char, char)] = &[('𑐀', '𑑛'), ('𑑝', '\u{11461}')]; pub const NKO: &'static [(char, char)] = &[('߀', 'ߺ'), ('\u{7fd}', '߿')]; pub const NUSHU: &'static [(char, char)] = &[('𖿡', '𖿡'), ('𛅰', '𛋻')]; -pub const NYIAKENG_PUACHUE_HMONG: &'static [(char, char)] = &[ - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e130}', '\u{1e13d}'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e14e}', '\u{1e14f}'), -]; +pub const NYIAKENG_PUACHUE_HMONG: &'static [(char, char)] = + &[('𞄀', '𞄬'), ('\u{1e130}', '𞄽'), ('𞅀', '𞅉'), ('𞅎', '𞅏')]; pub const OGHAM: &'static [(char, char)] = &[('\u{1680}', '᚜')]; @@ -1033,7 +1043,7 @@ pub const ORIYA: &'static [(char, char)] = &[ ('\u{b3c}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('ଡ଼', 'ଢ଼'), ('ୟ', '\u{b63}'), ('୦', '୷'), @@ -1066,7 +1076,7 @@ pub const SAMARITAN: &'static [(char, char)] = &[('ࠀ', '\u{82d}'), ('࠰', ' pub const SAURASHTRA: &'static [(char, char)] = &[('ꢀ', '\u{a8c5}'), ('꣎', '꣙')]; -pub const SHARADA: &'static [(char, char)] = &[('\u{11180}', '𑇍'), ('𑇐', '𑇟')]; +pub const SHARADA: &'static [(char, char)] = &[('\u{11180}', '𑇟')]; pub const SHAVIAN: &'static [(char, char)] = &[('𐑐', '𐑿')]; @@ -1077,7 +1087,7 @@ pub const SIGNWRITING: &'static [(char, char)] = &[('𝠀', '𝪋'), ('\u{1da9b}', '\u{1da9f}'), ('\u{1daa1}', '\u{1daaf}')]; pub const SINHALA: &'static [(char, char)] = &[ - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('අ', 'ඖ'), ('ක', 'න'), ('ඳ', 'ර'), @@ -1101,7 +1111,7 @@ pub const SOYOMBO: &'static [(char, char)] = &[('𑩐', '𑪢')]; pub const SUNDANESE: &'static [(char, char)] = &[('\u{1b80}', 'ᮿ'), ('᳀', '᳇')]; -pub const SYLOTI_NAGRI: &'static [(char, char)] = &[('ꠀ', '꠫')]; +pub const SYLOTI_NAGRI: &'static [(char, char)] = &[('ꠀ', '\u{a82c}')]; pub const SYRIAC: &'static [(char, char)] = &[('܀', '܍'), ('\u{70f}', '\u{74a}'), ('ݍ', 'ݏ'), ('ࡠ', 'ࡪ')]; @@ -1123,7 +1133,7 @@ pub const TAI_THAM: &'static [(char, char)] = &[ pub const TAI_VIET: &'static [(char, char)] = &[('ꪀ', 'ꫂ'), ('ꫛ', '꫟')]; -pub const TAKRI: &'static [(char, char)] = &[('𑚀', '\u{116b8}'), ('𑛀', '𑛉')]; +pub const TAKRI: &'static [(char, char)] = &[('𑚀', '𑚸'), ('𑛀', '𑛉')]; pub const TAMIL: &'static [(char, char)] = &[ ('\u{b82}', 'ஃ'), @@ -1142,12 +1152,16 @@ pub const TAMIL: &'static [(char, char)] = &[ ('ௐ', 'ௐ'), ('\u{bd7}', '\u{bd7}'), ('௦', '௺'), - ('\u{11fc0}', '\u{11ff1}'), - ('\u{11fff}', '\u{11fff}'), + ('𑿀', '𑿱'), + ('𑿿', '𑿿'), ]; -pub const TANGUT: &'static [(char, char)] = - &[('𖿠', '𖿠'), ('𗀀', '\u{187f7}'), ('𘠀', '𘫲')]; +pub const TANGUT: &'static [(char, char)] = &[ + ('𖿠', '𖿠'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18aff}'), + ('\u{18d00}', '\u{18d08}'), +]; pub const TELUGU: &'static [(char, char)] = &[ ('\u{c00}', 'ఌ'), @@ -1161,7 +1175,7 @@ pub const TELUGU: &'static [(char, char)] = &[ ('ౘ', 'ౚ'), ('ౠ', '\u{c63}'), ('౦', '౯'), - ('\u{c77}', '౿'), + ('౷', '౿'), ]; pub const THAANA: &'static [(char, char)] = &[('ހ', 'ޱ')]; @@ -1187,11 +1201,16 @@ pub const UGARITIC: &'static [(char, char)] = &[('𐎀', '𐎝'), ('𐎟', '𐎟 pub const VAI: &'static [(char, char)] = &[('ꔀ', 'ꘫ')]; -pub const WANCHO: &'static [(char, char)] = - &[('\u{1e2c0}', '\u{1e2f9}'), ('\u{1e2ff}', '\u{1e2ff}')]; +pub const WANCHO: &'static [(char, char)] = &[('𞋀', '𞋹'), ('𞋿', '𞋿')]; pub const WARANG_CITI: &'static [(char, char)] = &[('𑢠', '𑣲'), ('𑣿', '𑣿')]; +pub const YEZIDI: &'static [(char, char)] = &[ + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eab}', '\u{10ead}'), + ('\u{10eb0}', '\u{10eb1}'), +]; + pub const YI: &'static [(char, char)] = &[('ꀀ', 'ꒌ'), ('꒐', '꓆')]; pub const ZANABAZAR_SQUARE: &'static [(char, char)] = &[('𑨀', '\u{11a47}')]; diff --git a/regex-syntax/src/unicode_tables/script_extension.rs b/regex-syntax/src/unicode_tables/script_extension.rs index aa3894e575..1b6b4ff0a5 100644 --- a/regex-syntax/src/unicode_tables/script_extension.rs +++ b/regex-syntax/src/unicode_tables/script_extension.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate script-extension /tmp/ucd/12.1.0/ --chars +// ucd-generate script-extension ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Adlam", ADLAM), @@ -28,6 +28,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Chakma", CHAKMA), ("Cham", CHAM), ("Cherokee", CHEROKEE), + ("Chorasmian", CHORASMIAN), ("Common", COMMON), ("Coptic", COPTIC), ("Cuneiform", CUNEIFORM), @@ -35,6 +36,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Cyrillic", CYRILLIC), ("Deseret", DESERET), ("Devanagari", DEVANAGARI), + ("Dives_Akuru", DIVES_AKURU), ("Dogra", DOGRA), ("Duployan", DUPLOYAN), ("Egyptian_Hieroglyphs", EGYPTIAN_HIEROGLYPHS), @@ -66,6 +68,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Katakana", KATAKANA), ("Kayah_Li", KAYAH_LI), ("Kharoshthi", KHAROSHTHI), + ("Khitan_Small_Script", KHITAN_SMALL_SCRIPT), ("Khmer", KHMER), ("Khojki", KHOJKI), ("Khudawadi", KHUDAWADI), @@ -155,12 +158,13 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Vai", VAI), ("Wancho", WANCHO), ("Warang_Citi", WARANG_CITI), + ("Yezidi", YEZIDI), ("Yi", YI), ("Zanabazar_Square", ZANABAZAR_SQUARE), ]; pub const ADLAM: &'static [(char, char)] = - &[('ـ', 'ـ'), ('𞤀', '\u{1e94b}'), ('𞥐', '𞥙'), ('𞥞', '𞥟')]; + &[('ـ', 'ـ'), ('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞥞', '𞥟')]; pub const AHOM: &'static [(char, char)] = &[('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜿')]; @@ -174,7 +178,7 @@ pub const ARABIC: &'static [(char, char)] = &[ ('۞', 'ۿ'), ('ݐ', 'ݿ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('\u{8d3}', '\u{8e1}'), ('\u{8e3}', '\u{8ff}'), ('ﭐ', '﯁'), @@ -278,7 +282,7 @@ pub const BOPOMOFO: &'static [(char, char)] = &[ ('〷', '〷'), ('・', '・'), ('ㄅ', 'ㄯ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('﹅', '﹆'), ('。', '・'), ]; @@ -302,7 +306,7 @@ pub const CAUCASIAN_ALBANIAN: &'static [(char, char)] = &[('𐔰', '𐕣'), ('𐕯', '𐕯')]; pub const CHAKMA: &'static [(char, char)] = - &[('০', '৯'), ('၀', '၉'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑅆')]; + &[('০', '৯'), ('၀', '၉'), ('\u{11100}', '\u{11134}'), ('𑄶', '\u{11147}')]; pub const CHAM: &'static [(char, char)] = &[('ꨀ', '\u{aa36}'), ('ꩀ', 'ꩍ'), ('꩐', '꩙'), ('꩜', '꩟')]; @@ -310,6 +314,8 @@ pub const CHAM: &'static [(char, char)] = pub const CHEROKEE: &'static [(char, char)] = &[('Ꭰ', 'Ᏽ'), ('ᏸ', 'ᏽ'), ('ꭰ', 'ꮿ')]; +pub const CHORASMIAN: &'static [(char, char)] = &[('\u{10fb0}', '\u{10fcb}')]; + pub const COMMON: &'static [(char, char)] = &[ ('\u{0}', '@'), ('[', '`'), @@ -349,9 +355,9 @@ pub const COMMON: &'static [(char, char)] = &[ ('①', '⟿'), ('⤀', '⭳'), ('⭶', '⮕'), - ('⮘', '\u{2bff}'), + ('\u{2b97}', '⯿'), ('⸀', '⹂'), - ('⹄', '\u{2e4f}'), + ('⹄', '\u{2e52}'), ('⿰', '⿻'), ('\u{3000}', '\u{3000}'), ('〄', '〄'), @@ -366,9 +372,10 @@ pub const COMMON: &'static [(char, char)] = &[ ('㎀', '㏟'), ('㏿', '㏿'), ('䷀', '䷿'), - ('꜀', '꜡'), + ('꜈', '꜡'), ('ꞈ', '꞊'), ('꭛', '꭛'), + ('\u{ab6a}', '\u{ab6b}'), ('﴾', '﴿'), ('︐', '︙'), ('︰', '﹄'), @@ -382,9 +389,9 @@ pub const COMMON: &'static [(char, char)] = &[ ('¢', '₩'), ('│', '○'), ('\u{fff9}', '�'), - ('𐆐', '𐆛'), + ('𐆐', '\u{1019c}'), ('𐇐', '𐇼'), - ('\u{16fe2}', '\u{16fe3}'), + ('𖿢', '𖿣'), ('𝀀', '𝃵'), ('𝄀', '𝄦'), ('𝄩', '𝅦'), @@ -417,44 +424,45 @@ pub const COMMON: &'static [(char, char)] = &[ ('𝚨', '𝟋'), ('𝟎', '𝟿'), ('𞱱', '𞲴'), - ('\u{1ed01}', '\u{1ed3d}'), + ('𞴁', '𞴽'), ('🀀', '🀫'), ('🀰', '🂓'), ('🂠', '🂮'), ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄀', '🄌'), - ('🄐', '\u{1f16c}'), - ('🅰', '🆬'), + ('🄀', '\u{1f1ad}'), ('🇦', '🇿'), ('🈁', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉠', '🉥'), - ('🌀', '\u{1f6d5}'), + ('🌀', '\u{1f6d7}'), ('🛠', '🛬'), - ('🛰', '\u{1f6fa}'), + ('🛰', '\u{1f6fc}'), ('🜀', '🝳'), ('🞀', '🟘'), - ('\u{1f7e0}', '\u{1f7eb}'), + ('🟠', '🟫'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('🤀', '🤋'), - ('\u{1f90d}', '\u{1f971}'), - ('🥳', '🥶'), - ('🥺', '🦢'), - ('\u{1f9a5}', '\u{1f9aa}'), - ('\u{1f9ae}', '\u{1f9ca}'), - ('\u{1f9cd}', '\u{1fa53}'), + ('\u{1f8b0}', '\u{1f8b1}'), + ('🤀', '\u{1f978}'), + ('🥺', '\u{1f9cb}'), + ('🧍', '🩓'), ('🩠', '🩭'), - ('\u{1fa70}', '\u{1fa73}'), - ('\u{1fa78}', '\u{1fa7a}'), - ('\u{1fa80}', '\u{1fa82}'), - ('\u{1fa90}', '\u{1fa95}'), + ('🩰', '\u{1fa74}'), + ('🩸', '🩺'), + ('🪀', '\u{1fa86}'), + ('🪐', '\u{1faa8}'), + ('\u{1fab0}', '\u{1fab6}'), + ('\u{1fac0}', '\u{1fac2}'), + ('\u{1fad0}', '\u{1fad6}'), + ('\u{1fb00}', '\u{1fb92}'), + ('\u{1fb94}', '\u{1fbca}'), + ('\u{1fbf0}', '\u{1fbf9}'), ('\u{e0001}', '\u{e0001}'), ('\u{e0020}', '\u{e007f}'), ]; @@ -482,6 +490,7 @@ pub const CYRILLIC: &'static [(char, char)] = &[ ('ᲀ', 'ᲈ'), ('ᴫ', 'ᴫ'), ('ᵸ', 'ᵸ'), + ('\u{1df8}', '\u{1df8}'), ('\u{2de0}', '\u{2dff}'), ('⹃', '⹃'), ('Ꙁ', '\u{a69f}'), @@ -500,6 +509,17 @@ pub const DEVANAGARI: &'static [(char, char)] = &[ ('\u{a8e0}', '\u{a8ff}'), ]; +pub const DIVES_AKURU: &'static [(char, char)] = &[ + ('\u{11900}', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{11946}'), + ('\u{11950}', '\u{11959}'), +]; + pub const DOGRA: &'static [(char, char)] = &[('।', '९'), ('꠰', '꠹'), ('𑠀', '𑠻')]; @@ -511,7 +531,7 @@ pub const EGYPTIAN_HIEROGLYPHS: &'static [(char, char)] = pub const ELBASAN: &'static [(char, char)] = &[('𐔀', '𐔧')]; -pub const ELYMAIC: &'static [(char, char)] = &[('\u{10fe0}', '\u{10ff6}')]; +pub const ELYMAIC: &'static [(char, char)] = &[('𐿠', '𐿶')]; pub const ETHIOPIC: &'static [(char, char)] = &[ ('ሀ', 'ቈ'), @@ -549,7 +569,6 @@ pub const ETHIOPIC: &'static [(char, char)] = &[ ]; pub const GEORGIAN: &'static [(char, char)] = &[ - ('։', '։'), ('Ⴀ', 'Ⴥ'), ('Ⴧ', 'Ⴧ'), ('Ⴭ', 'Ⴭ'), @@ -601,8 +620,8 @@ pub const GRANTHA: &'static [(char, char)] = &[ ('𑍝', '𑍣'), ('\u{11366}', '\u{1136c}'), ('\u{11370}', '\u{11374}'), - ('\u{11fd0}', '\u{11fd1}'), - ('\u{11fd3}', '\u{11fd3}'), + ('𑿐', '𑿑'), + ('𑿓', '𑿓'), ]; pub const GREEK: &'static [(char, char)] = &[ @@ -714,24 +733,27 @@ pub const HAN: &'static [(char, char)] = &[ ('㈠', '㉇'), ('㊀', '㊰'), ('㋀', '㋋'), - ('\u{32ff}', '\u{32ff}'), + ('㋿', '㋿'), ('㍘', '㍰'), ('㍻', '㍿'), ('㏠', '㏾'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), + ('꜀', '꜇'), ('豈', '舘'), ('並', '龎'), ('﹅', '﹆'), ('。', '・'), + ('\u{16ff0}', '\u{16ff1}'), ('𝍠', '𝍱'), ('🉐', '🉑'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const HANGUL: &'static [(char, char)] = &[ @@ -800,7 +822,7 @@ pub const HIRAGANA: &'static [(char, char)] = &[ ('ー', 'ー'), ('\u{ff9e}', '\u{ff9f}'), ('𛀁', '𛄞'), - ('\u{1b150}', '\u{1b152}'), + ('𛅐', '𛅒'), ('🈀', '🈀'), ]; @@ -812,8 +834,9 @@ pub const INHERITED: &'static [(char, char)] = &[ ('\u{343}', '\u{344}'), ('\u{346}', '\u{362}'), ('\u{953}', '\u{954}'), - ('\u{1ab0}', '\u{1abe}'), - ('\u{1dc2}', '\u{1df9}'), + ('\u{1ab0}', '\u{1ac0}'), + ('\u{1dc2}', '\u{1df7}'), + ('\u{1df9}', '\u{1df9}'), ('\u{1dfb}', '\u{1dff}'), ('\u{200c}', '\u{200d}'), ('\u{20d0}', '\u{20ef}'), @@ -878,7 +901,7 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('﹅', '﹆'), ('。', '\u{ff9f}'), ('𛀀', '𛀀'), - ('\u{1b164}', '\u{1b167}'), + ('𛅤', '𛅧'), ]; pub const KAYAH_LI: &'static [(char, char)] = &[('꤀', '꤯')]; @@ -894,6 +917,9 @@ pub const KHAROSHTHI: &'static [(char, char)] = &[ ('𐩐', '𐩘'), ]; +pub const KHITAN_SMALL_SCRIPT: &'static [(char, char)] = + &[('\u{16fe4}', '\u{16fe4}'), ('\u{18b00}', '\u{18cd5}')]; + pub const KHMER: &'static [(char, char)] = &[('ក', '\u{17dd}'), ('០', '៩'), ('៰', '៹'), ('᧠', '᧿')]; @@ -906,8 +932,8 @@ pub const KHUDAWADI: &'static [(char, char)] = pub const LAO: &'static [(char, char)] = &[ ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ຽ'), ('ເ', 'ໄ'), @@ -946,14 +972,15 @@ pub const LATIN: &'static [(char, char)] = &[ ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), ('Ⱡ', 'Ɀ'), + ('꜀', '꜇'), ('Ꜣ', 'ꞇ'), - ('Ꞌ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꟿ'), + ('Ꞌ', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꟿ'), ('꤮', '꤮'), ('ꬰ', 'ꭚ'), ('ꭜ', 'ꭤ'), - ('\u{ab66}', '\u{ab67}'), + ('ꭦ', '\u{ab69}'), ('ff', 'st'), ('A', 'Z'), ('a', 'z'), @@ -987,7 +1014,8 @@ pub const LINEAR_B: &'static [(char, char)] = &[ ('𐄷', '𐄿'), ]; -pub const LISU: &'static [(char, char)] = &[('ꓐ', '꓿')]; +pub const LISU: &'static [(char, char)] = + &[('ꓐ', '꓿'), ('\u{11fb0}', '\u{11fb0}')]; pub const LYCIAN: &'static [(char, char)] = &[('𐊀', '𐊜')]; @@ -1001,8 +1029,7 @@ pub const MAKASAR: &'static [(char, char)] = &[('𑻠', '𑻸')]; pub const MALAYALAM: &'static [(char, char)] = &[ ('\u{951}', '\u{952}'), ('।', '॥'), - ('\u{d00}', 'ഃ'), - ('അ', 'ഌ'), + ('\u{d00}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', '\u{d44}'), ('െ', 'ൈ'), @@ -1047,7 +1074,7 @@ pub const MEROITIC_CURSIVE: &'static [(char, char)] = pub const MEROITIC_HIEROGLYPHS: &'static [(char, char)] = &[('𐦀', '𐦟')]; pub const MIAO: &'static [(char, char)] = - &[('𖼀', '\u{16f4a}'), ('\u{16f4f}', '\u{16f87}'), ('\u{16f8f}', '𖾟')]; + &[('𖼀', '𖽊'), ('\u{16f4f}', '𖾇'), ('\u{16f8f}', '𖾟')]; pub const MODI: &'static [(char, char)] = &[('꠰', '꠹'), ('𑘀', '𑙄'), ('𑙐', '𑙙')]; @@ -1076,29 +1103,24 @@ pub const NANDINAGARI: &'static [(char, char)] = &[ ('೦', '೯'), ('ᳩ', 'ᳩ'), ('ᳲ', 'ᳲ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('꠰', '꠵'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d7}'), - ('\u{119da}', '\u{119e4}'), + ('𑦠', '𑦧'), + ('𑦪', '\u{119d7}'), + ('\u{119da}', '𑧤'), ]; pub const NEW_TAI_LUE: &'static [(char, char)] = &[('ᦀ', 'ᦫ'), ('ᦰ', 'ᧉ'), ('᧐', '᧚'), ('᧞', '᧟')]; -pub const NEWA: &'static [(char, char)] = - &[('𑐀', '𑑙'), ('𑑛', '𑑛'), ('𑑝', '\u{1145f}')]; +pub const NEWA: &'static [(char, char)] = &[('𑐀', '𑑛'), ('𑑝', '\u{11461}')]; pub const NKO: &'static [(char, char)] = &[('߀', 'ߺ'), ('\u{7fd}', '߿')]; pub const NUSHU: &'static [(char, char)] = &[('𖿡', '𖿡'), ('𛅰', '𛋻')]; -pub const NYIAKENG_PUACHUE_HMONG: &'static [(char, char)] = &[ - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e130}', '\u{1e13d}'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e14e}', '\u{1e14f}'), -]; +pub const NYIAKENG_PUACHUE_HMONG: &'static [(char, char)] = + &[('𞄀', '𞄬'), ('\u{1e130}', '𞄽'), ('𞅀', '𞅉'), ('𞅎', '𞅏')]; pub const OGHAM: &'static [(char, char)] = &[('\u{1680}', '᚜')]; @@ -1135,7 +1157,7 @@ pub const ORIYA: &'static [(char, char)] = &[ ('\u{b3c}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('ଡ଼', 'ଢ଼'), ('ୟ', '\u{b63}'), ('୦', '୷'), @@ -1177,8 +1199,7 @@ pub const SHARADA: &'static [(char, char)] = &[ ('\u{1cd9}', '\u{1cd9}'), ('\u{1cdc}', '\u{1cdd}'), ('\u{1ce0}', '\u{1ce0}'), - ('\u{11180}', '𑇍'), - ('𑇐', '𑇟'), + ('\u{11180}', '𑇟'), ]; pub const SHAVIAN: &'static [(char, char)] = &[('𐑐', '𐑿')]; @@ -1191,7 +1212,7 @@ pub const SIGNWRITING: &'static [(char, char)] = pub const SINHALA: &'static [(char, char)] = &[ ('।', '॥'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('අ', 'ඖ'), ('ක', 'න'), ('ඳ', 'ර'), @@ -1216,7 +1237,7 @@ pub const SUNDANESE: &'static [(char, char)] = &[('\u{1b80}', 'ᮿ'), ('᳀', '᳇')]; pub const SYLOTI_NAGRI: &'static [(char, char)] = - &[('।', '॥'), ('০', '৯'), ('ꠀ', '꠫')]; + &[('।', '॥'), ('০', '৯'), ('ꠀ', '\u{a82c}')]; pub const SYRIAC: &'static [(char, char)] = &[ ('،', '،'), @@ -1229,6 +1250,7 @@ pub const SYRIAC: &'static [(char, char)] = &[ ('\u{70f}', '\u{74a}'), ('ݍ', 'ݏ'), ('ࡠ', 'ࡪ'), + ('\u{1df8}', '\u{1df8}'), ]; pub const TAGALOG: &'static [(char, char)] = @@ -1251,7 +1273,7 @@ pub const TAI_THAM: &'static [(char, char)] = &[ pub const TAI_VIET: &'static [(char, char)] = &[('ꪀ', 'ꫂ'), ('ꫛ', '꫟')]; pub const TAKRI: &'static [(char, char)] = - &[('।', '॥'), ('꠰', '꠹'), ('𑚀', '\u{116b8}'), ('𑛀', '𑛉')]; + &[('।', '॥'), ('꠰', '꠹'), ('𑚀', '𑚸'), ('𑛀', '𑛉')]; pub const TAMIL: &'static [(char, char)] = &[ ('\u{951}', '\u{952}'), @@ -1277,12 +1299,16 @@ pub const TAMIL: &'static [(char, char)] = &[ ('\u{11301}', '\u{11301}'), ('𑌃', '𑌃'), ('\u{1133b}', '\u{1133c}'), - ('\u{11fc0}', '\u{11ff1}'), - ('\u{11fff}', '\u{11fff}'), + ('𑿀', '𑿱'), + ('𑿿', '𑿿'), ]; -pub const TANGUT: &'static [(char, char)] = - &[('𖿠', '𖿠'), ('𗀀', '\u{187f7}'), ('𘠀', '𘫲')]; +pub const TANGUT: &'static [(char, char)] = &[ + ('𖿠', '𖿠'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18aff}'), + ('\u{18d00}', '\u{18d08}'), +]; pub const TELUGU: &'static [(char, char)] = &[ ('\u{951}', '\u{952}'), @@ -1298,7 +1324,7 @@ pub const TELUGU: &'static [(char, char)] = &[ ('ౘ', 'ౚ'), ('ౠ', '\u{c63}'), ('౦', '౯'), - ('\u{c77}', '౿'), + ('౷', '౿'), ('\u{1cda}', '\u{1cda}'), ('ᳲ', 'ᳲ'), ]; @@ -1341,11 +1367,20 @@ pub const UGARITIC: &'static [(char, char)] = &[('𐎀', '𐎝'), ('𐎟', '𐎟 pub const VAI: &'static [(char, char)] = &[('ꔀ', 'ꘫ')]; -pub const WANCHO: &'static [(char, char)] = - &[('\u{1e2c0}', '\u{1e2f9}'), ('\u{1e2ff}', '\u{1e2ff}')]; +pub const WANCHO: &'static [(char, char)] = &[('𞋀', '𞋹'), ('𞋿', '𞋿')]; pub const WARANG_CITI: &'static [(char, char)] = &[('𑢠', '𑣲'), ('𑣿', '𑣿')]; +pub const YEZIDI: &'static [(char, char)] = &[ + ('،', '،'), + ('؛', '؛'), + ('؟', '؟'), + ('٠', '٩'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eab}', '\u{10ead}'), + ('\u{10eb0}', '\u{10eb1}'), +]; + pub const YI: &'static [(char, char)] = &[ ('、', '。'), ('〈', '】'), diff --git a/regex-syntax/src/unicode_tables/sentence_break.rs b/regex-syntax/src/unicode_tables/sentence_break.rs index 2ee7ae5b63..e4840f4855 100644 --- a/regex-syntax/src/unicode_tables/sentence_break.rs +++ b/regex-syntax/src/unicode_tables/sentence_break.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate sentence-break /tmp/ucd/12.1.0/ --chars +// ucd-generate sentence-break ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ATerm", ATERM), @@ -132,7 +132,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{b3e}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('\u{b62}', '\u{b63}'), ('\u{b82}', '\u{b82}'), ('\u{bbe}', 'ூ'), @@ -159,7 +159,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ൊ', '\u{d4d}'), ('\u{d57}', '\u{d57}'), ('\u{d62}', '\u{d63}'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('\u{dca}', '\u{dca}'), ('\u{dcf}', '\u{dd4}'), ('\u{dd6}', '\u{dd6}'), @@ -206,7 +206,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('\u{1a60}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1b00}', 'ᬄ'), ('\u{1b34}', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -236,6 +236,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{a806}', '\u{a806}'), ('\u{a80b}', '\u{a80b}'), ('ꠣ', 'ꠧ'), + ('\u{a82c}', '\u{a82c}'), ('ꢀ', 'ꢁ'), ('ꢴ', '\u{a8c5}'), ('\u{a8e0}', '\u{a8f1}'), @@ -272,6 +273,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10a3f}', '\u{10a3f}'), ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11046}'), @@ -284,6 +286,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11180}', '𑆂'), ('𑆳', '𑇀'), ('\u{111c9}', '\u{111cc}'), + ('\u{111ce}', '\u{111cf}'), ('𑈬', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), ('\u{112df}', '\u{112ea}'), @@ -306,9 +309,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b7}'), ('\u{1171d}', '\u{1172b}'), ('𑠬', '\u{1183a}'), - ('\u{119d1}', '\u{119d7}'), + ('\u{11930}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{1193e}'), + ('\u{11940}', '\u{11940}'), + ('\u{11942}', '\u{11943}'), + ('𑧑', '\u{119d7}'), ('\u{119da}', '\u{119e0}'), - ('\u{119e4}', '\u{119e4}'), + ('𑧤', '𑧤'), ('\u{11a01}', '\u{11a0a}'), ('\u{11a33}', '𑨹'), ('\u{11a3b}', '\u{11a3e}'), @@ -331,8 +339,10 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), - ('𖽑', '\u{16f87}'), + ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), + ('\u{16fe4}', '\u{16fe4}'), + ('\u{16ff0}', '\u{16ff1}'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), @@ -986,13 +996,16 @@ pub const LOWER: &'static [(char, char)] = &[ ('ꞵ', 'ꞵ'), ('ꞷ', 'ꞷ'), ('ꞹ', 'ꞹ'), - ('\u{a7bb}', '\u{a7bb}'), - ('\u{a7bd}', '\u{a7bd}'), - ('\u{a7bf}', '\u{a7bf}'), - ('\u{a7c3}', '\u{a7c3}'), + ('ꞻ', 'ꞻ'), + ('ꞽ', 'ꞽ'), + ('ꞿ', 'ꞿ'), + ('ꟃ', 'ꟃ'), + ('\u{a7c8}', '\u{a7c8}'), + ('\u{a7ca}', '\u{a7ca}'), + ('\u{a7f6}', '\u{a7f6}'), ('ꟸ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab67}'), + ('ꭜ', '\u{ab68}'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -1085,15 +1098,17 @@ pub const NUMERIC: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), + ('\u{11950}', '\u{11959}'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e2f0}', '\u{1e2f9}'), + ('𞅀', '𞅉'), + ('𞋰', '𞋹'), ('𞥐', '𞥙'), + ('\u{1fbf0}', '\u{1fbf9}'), ]; pub const OLETTER: &'static [(char, char)] = &[ @@ -1130,7 +1145,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -1206,7 +1221,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ೞ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('അ', 'ഌ'), + ('\u{d04}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -1224,8 +1239,8 @@ pub const OLETTER: &'static [(char, char)] = &[ ('เ', 'ๆ'), ('ກ', 'ຂ'), ('ຄ', 'ຄ'), - ('\u{e86}', 'ຊ'), - ('\u{e8c}', 'ຣ'), + ('ຆ', 'ຊ'), + ('ຌ', 'ຣ'), ('ລ', 'ລ'), ('ວ', 'ະ'), ('າ', 'ຳ'), @@ -1304,7 +1319,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', 'ᳶ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ℵ', 'ℸ'), ('ↀ', 'ↂ'), ('ↅ', 'ↈ'), @@ -1330,10 +1345,10 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ㇰ', 'ㇿ'), - ('㐀', '䶵'), - ('一', '鿯'), + ('㐀', '\u{4dbf}'), + ('一', '\u{9ffc}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -1382,6 +1397,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), + ('\u{ab69}', '\u{ab69}'), ('ꯀ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -1459,15 +1475,19 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𐮀', '𐮑'), ('𐰀', '𐱈'), ('𐴀', '𐴣'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀃', '𑀷'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), + ('\u{11147}', '\u{11147}'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -1493,7 +1513,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -1502,14 +1522,20 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑘀', '𑘯'), ('𑙄', '𑙄'), ('𑚀', '𑚪'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑜀', '𑜚'), ('𑠀', '𑠫'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d0}'), - ('\u{119e1}', '\u{119e1}'), - ('\u{119e3}', '\u{119e3}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{1192f}'), + ('\u{1193f}', '\u{1193f}'), + ('\u{11941}', '\u{11941}'), + ('𑦠', '𑦧'), + ('𑦪', '𑧐'), + ('𑧡', '𑧡'), + ('𑧣', '𑧣'), ('𑨀', '𑨀'), ('𑨋', '𑨲'), ('𑨺', '𑨺'), @@ -1530,6 +1556,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -1542,27 +1569,28 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𖭀', '𖭃'), ('𖭣', '𖭷'), ('𖭽', '𖮏'), - ('𖼀', '\u{16f4a}'), + ('𖼀', '𖽊'), ('𖽐', '𖽐'), ('𖾓', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), - ('𗀀', '\u{187f7}'), - ('𘠀', '𘫲'), + ('𖿣', '𖿣'), + ('𗀀', '𘟷'), + ('𘠀', '\u{18cd5}'), + ('\u{18d00}', '\u{18d08}'), ('𛀀', '𛄞'), - ('\u{1b150}', '\u{1b152}'), - ('\u{1b164}', '\u{1b167}'), + ('𛅐', '𛅒'), + ('𛅤', '𛅧'), ('𛅰', '𛋻'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), ('𛲀', '𛲈'), ('𛲐', '𛲙'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2eb}'), + ('𞄀', '𞄬'), + ('𞄷', '𞄽'), + ('𞅎', '𞅎'), + ('𞋀', '𞋫'), ('𞠀', '𞣄'), - ('\u{1e94b}', '\u{1e94b}'), + ('𞥋', '𞥋'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), ('𞸡', '𞸢'), @@ -1596,12 +1624,13 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '𪛖'), + ('𠀀', '\u{2a6dd}'), ('𪜀', '𫜴'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), + ('\u{30000}', '\u{3134a}'), ]; pub const SCONTINUE: &'static [(char, char)] = &[ @@ -1687,6 +1716,8 @@ pub const STERM: &'static [(char, char)] = &[ ('𑗉', '𑗗'), ('𑙁', '𑙂'), ('𑜼', '𑜾'), + ('\u{11944}', '\u{11944}'), + ('\u{11946}', '\u{11946}'), ('𑩂', '𑩃'), ('𑪛', '𑪜'), ('𑱁', '𑱂'), @@ -2312,11 +2343,13 @@ pub const UPPER: &'static [(char, char)] = &[ ('Ʞ', 'Ꞵ'), ('Ꞷ', 'Ꞷ'), ('Ꞹ', 'Ꞹ'), - ('\u{a7ba}', '\u{a7ba}'), - ('\u{a7bc}', '\u{a7bc}'), - ('\u{a7be}', '\u{a7be}'), - ('\u{a7c2}', '\u{a7c2}'), - ('\u{a7c4}', '\u{a7c6}'), + ('Ꞻ', 'Ꞻ'), + ('Ꞽ', 'Ꞽ'), + ('Ꞿ', 'Ꞿ'), + ('Ꟃ', 'Ꟃ'), + ('Ꞔ', '\u{a7c7}'), + ('\u{a7c9}', '\u{a7c9}'), + ('\u{a7f5}', '\u{a7f5}'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), diff --git a/regex-syntax/src/unicode_tables/word_break.rs b/regex-syntax/src/unicode_tables/word_break.rs index 24f6fefd2c..5c013420fd 100644 --- a/regex-syntax/src/unicode_tables/word_break.rs +++ b/regex-syntax/src/unicode_tables/word_break.rs @@ -1,8 +1,8 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate word-break /tmp/ucd/12.1.0/ --chars +// ucd-generate word-break ucd-13.0.0 --chars // -// ucd-generate is available on crates.io. +// ucd-generate 0.2.7 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ALetter", ALETTER), @@ -34,8 +34,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('À', 'Ö'), ('Ø', 'ö'), ('ø', '˗'), - ('˞', 'ˤ'), - ('ˬ', '˿'), + ('˞', '˿'), ('Ͱ', 'ʹ'), ('Ͷ', 'ͷ'), ('ͺ', 'ͽ'), @@ -48,10 +47,10 @@ pub const ALETTER: &'static [(char, char)] = &[ ('Ϸ', 'ҁ'), ('Ҋ', 'ԯ'), ('Ա', 'Ֆ'), - ('ՙ', 'ՙ'), - ('՛', '՜'), + ('ՙ', '՜'), ('՞', '՞'), ('ՠ', 'ֈ'), + ('֊', '֊'), ('׳', '׳'), ('ؠ', 'ي'), ('ٮ', 'ٯ'), @@ -75,7 +74,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), ('ࢠ', 'ࢴ'), - ('ࢶ', 'ࢽ'), + ('ࢶ', '\u{8c7}'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -151,7 +150,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ೞ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('അ', 'ഌ'), + ('\u{d04}', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -223,7 +222,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ᳩ', 'ᳬ'), ('ᳮ', 'ᳳ'), ('ᳵ', 'ᳶ'), - ('\u{1cfa}', '\u{1cfa}'), + ('ᳺ', 'ᳺ'), ('ᴀ', 'ᶿ'), ('Ḁ', 'ἕ'), ('Ἐ', 'Ἕ'), @@ -286,7 +285,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('〻', '〼'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', 'ㆺ'), + ('ㆠ', '\u{31bf}'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -295,9 +294,9 @@ pub const ALETTER: &'static [(char, char)] = &[ ('Ꙁ', 'ꙮ'), ('ꙿ', 'ꚝ'), ('ꚠ', 'ꛯ'), - ('ꜗ', '\u{a7bf}'), - ('\u{a7c2}', '\u{a7c6}'), - ('ꟷ', 'ꠁ'), + ('꜈', 'ꞿ'), + ('Ꟃ', '\u{a7ca}'), + ('\u{a7f5}', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -321,7 +320,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), - ('ꬰ', '\u{ab67}'), + ('ꬰ', '\u{ab69}'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -397,15 +396,19 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), + ('\u{10e80}', '\u{10ea9}'), + ('\u{10eb0}', '\u{10eb1}'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fe0}', '\u{10ff6}'), + ('\u{10fb0}', '\u{10fc4}'), + ('𐿠', '𐿶'), ('𑀃', '𑀷'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), + ('\u{11147}', '\u{11147}'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -431,7 +434,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('\u{1145f}', '\u{1145f}'), + ('𑑟', '\u{11461}'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -440,14 +443,20 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𑘀', '𑘯'), ('𑙄', '𑙄'), ('𑚀', '𑚪'), - ('\u{116b8}', '\u{116b8}'), + ('𑚸', '𑚸'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '𑣿'), - ('\u{119a0}', '\u{119a7}'), - ('\u{119aa}', '\u{119d0}'), - ('\u{119e1}', '\u{119e1}'), - ('\u{119e3}', '\u{119e3}'), + ('𑣿', '\u{11906}'), + ('\u{11909}', '\u{11909}'), + ('\u{1190c}', '\u{11913}'), + ('\u{11915}', '\u{11916}'), + ('\u{11918}', '\u{1192f}'), + ('\u{1193f}', '\u{1193f}'), + ('\u{11941}', '\u{11941}'), + ('𑦠', '𑦧'), + ('𑦪', '𑧐'), + ('𑧡', '𑧡'), + ('𑧣', '𑧣'), ('𑨀', '𑨀'), ('𑨋', '𑨲'), ('𑨺', '𑨺'), @@ -468,6 +477,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), + ('\u{11fb0}', '\u{11fb0}'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), @@ -481,11 +491,11 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𖭣', '𖭷'), ('𖭽', '𖮏'), ('𖹀', '𖹿'), - ('𖼀', '\u{16f4a}'), + ('𖼀', '𖽊'), ('𖽐', '𖽐'), ('𖾓', '𖾟'), ('𖿠', '𖿡'), - ('\u{16fe3}', '\u{16fe3}'), + ('𖿣', '𖿣'), ('𛰀', '𛱪'), ('𛱰', '𛱼'), ('𛲀', '𛲈'), @@ -520,13 +530,13 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), - ('\u{1e100}', '\u{1e12c}'), - ('\u{1e137}', '\u{1e13d}'), - ('\u{1e14e}', '\u{1e14e}'), - ('\u{1e2c0}', '\u{1e2eb}'), + ('𞄀', '𞄬'), + ('𞄷', '𞄽'), + ('𞅎', '𞅎'), + ('𞋀', '𞋫'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), - ('\u{1e94b}', '\u{1e94b}'), + ('𞥋', '𞥋'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), ('𞸡', '𞸢'), @@ -628,7 +638,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{b3e}', '\u{b44}'), ('େ', 'ୈ'), ('ୋ', '\u{b4d}'), - ('\u{b56}', '\u{b57}'), + ('\u{b55}', '\u{b57}'), ('\u{b62}', '\u{b63}'), ('\u{b82}', '\u{b82}'), ('\u{bbe}', 'ூ'), @@ -655,7 +665,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ൊ', '\u{d4d}'), ('\u{d57}', '\u{d57}'), ('\u{d62}', '\u{d63}'), - ('ං', 'ඃ'), + ('\u{d81}', 'ඃ'), ('\u{dca}', '\u{dca}'), ('\u{dcf}', '\u{dd4}'), ('\u{dd6}', '\u{dd6}'), @@ -702,7 +712,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('\u{1a60}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1abe}'), + ('\u{1ab0}', '\u{1ac0}'), ('\u{1b00}', 'ᬄ'), ('\u{1b34}', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -732,6 +742,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{a806}', '\u{a806}'), ('\u{a80b}', '\u{a80b}'), ('ꠣ', 'ꠧ'), + ('\u{a82c}', '\u{a82c}'), ('ꢀ', 'ꢁ'), ('ꢴ', '\u{a8c5}'), ('\u{a8e0}', '\u{a8f1}'), @@ -768,6 +779,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10a3f}', '\u{10a3f}'), ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), + ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11046}'), @@ -780,6 +792,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11180}', '𑆂'), ('𑆳', '𑇀'), ('\u{111c9}', '\u{111cc}'), + ('\u{111ce}', '\u{111cf}'), ('𑈬', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), ('\u{112df}', '\u{112ea}'), @@ -802,9 +815,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b7}'), ('\u{1171d}', '\u{1172b}'), ('𑠬', '\u{1183a}'), - ('\u{119d1}', '\u{119d7}'), + ('\u{11930}', '\u{11935}'), + ('\u{11937}', '\u{11938}'), + ('\u{1193b}', '\u{1193e}'), + ('\u{11940}', '\u{11940}'), + ('\u{11942}', '\u{11943}'), + ('𑧑', '\u{119d7}'), ('\u{119da}', '\u{119e0}'), - ('\u{119e4}', '\u{119e4}'), + ('𑧤', '𑧤'), ('\u{11a01}', '\u{11a0a}'), ('\u{11a33}', '𑨹'), ('\u{11a3b}', '\u{11a3e}'), @@ -827,8 +845,10 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), - ('𖽑', '\u{16f87}'), + ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), + ('\u{16fe4}', '\u{16fe4}'), + ('\u{16ff0}', '\u{16ff1}'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), @@ -911,7 +931,7 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('㌀', '㍗'), ('ヲ', 'ン'), ('𛀀', '𛀀'), - ('\u{1b164}', '\u{1b167}'), + ('𛅤', '𛅧'), ]; pub const LF: &'static [(char, char)] = &[('\n', '\n')]; @@ -920,6 +940,7 @@ pub const MIDLETTER: &'static [(char, char)] = &[ (':', ':'), ('·', '·'), ('·', '·'), + ('՟', '՟'), ('״', '״'), ('‧', '‧'), ('︓', '︓'), @@ -1008,15 +1029,17 @@ pub const NUMERIC: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), + ('\u{11950}', '\u{11959}'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), - ('\u{1e140}', '\u{1e149}'), - ('\u{1e2f0}', '\u{1e2f9}'), + ('𞅀', '𞅉'), + ('𞋰', '𞋹'), ('𞥐', '𞥙'), + ('\u{1fbf0}', '\u{1fbf9}'), ]; pub const REGIONAL_INDICATOR: &'static [(char, char)] = &[('🇦', '🇿')];