diff --git a/regex-syntax/src/unicode.rs b/regex-syntax/src/unicode.rs index 70d5954b7..8194d7f55 100644 --- a/regex-syntax/src/unicode.rs +++ b/regex-syntax/src/unicode.rs @@ -605,6 +605,7 @@ fn ages(canonical_age: &str) -> Result> { ("V12_1", age::V12_1), ("V13_0", age::V13_0), ("V14_0", age::V14_0), + ("V15_0", age::V15_0), ]; assert_eq!(AGES.len(), age::BY_NAME.len(), "ages are out of sync"); diff --git a/regex-syntax/src/unicode_tables/age.rs b/regex-syntax/src/unicode_tables/age.rs index ffdfef316..71f4861e0 100644 --- a/regex-syntax/src/unicode_tables/age.rs +++ b/regex-syntax/src/unicode_tables/age.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate age /tmp/ucd --chars +// ucd-generate age ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("V10_0", V10_0), @@ -13,6 +13,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("V12_1", V12_1), ("V13_0", V13_0), ("V14_0", V14_0), + ("V15_0", V15_0), ("V1_1", V1_1), ("V2_0", V2_0), ("V2_1", V2_1), @@ -346,6 +347,41 @@ pub const V14_0: &'static [(char, char)] = &[ ('๐ซœต', '๐ซœธ'), ]; +pub const V15_0: &'static [(char, char)] = &[ + ('เณณ', 'เณณ'), + ('\u{ece}', '\u{ece}'), + ('\u{10efd}', '\u{10eff}'), + ('๐‘ˆฟ', '\u{11241}'), + ('๐‘ฌ€', '๐‘ฌ‰'), + ('\u{11f00}', '๐‘ผ'), + ('๐‘ผ’', '\u{11f3a}'), + ('๐‘ผพ', '๐‘ฝ™'), + ('๐“ฏ', '๐“ฏ'), + ('\u{13439}', '\u{13455}'), + ('๐›„ฒ', '๐›„ฒ'), + ('๐›…•', '๐›…•'), + ('๐‹€', '๐‹“'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), + ('๐ž“', '๐ž“น'), + ('๐Ÿ›œ', '๐Ÿ›œ'), + ('๐Ÿด', '๐Ÿถ'), + ('๐Ÿป', '๐Ÿฟ'), + ('๐ŸŸ™', '๐ŸŸ™'), + ('๐Ÿฉต', '๐Ÿฉท'), + ('๐Ÿช‡', '๐Ÿชˆ'), + ('๐Ÿชญ', '๐Ÿชฏ'), + ('๐Ÿชป', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿชฟ'), + ('๐ŸซŽ', '๐Ÿซ'), + ('๐Ÿซš', '๐Ÿซ›'), + ('๐Ÿซจ', '๐Ÿซจ'), + ('๐Ÿซท', '๐Ÿซธ'), + ('๐ซœน', '๐ซœน'), + ('๐ฑ', '๐ฒŽฏ'), +]; + pub const V1_1: &'static [(char, char)] = &[ ('\0', 'วต'), ('วบ', 'ศ—'), diff --git a/regex-syntax/src/unicode_tables/case_folding_simple.rs b/regex-syntax/src/unicode_tables/case_folding_simple.rs index 766d21b48..23f9364ce 100644 --- a/regex-syntax/src/unicode_tables/case_folding_simple.rs +++ b/regex-syntax/src/unicode_tables/case_folding_simple.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate case-folding-simple /tmp/ucd --chars --all-pairs +// ucd-generate case-folding-simple ucd-15.0.0 --chars --all-pairs // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('A', &['a']), diff --git a/regex-syntax/src/unicode_tables/general_category.rs b/regex-syntax/src/unicode_tables/general_category.rs index 8aa6b0078..8fc928912 100644 --- a/regex-syntax/src/unicode_tables/general_category.rs +++ b/regex-syntax/src/unicode_tables/general_category.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate general-category /tmp/ucd --chars --exclude surrogate +// ucd-generate general-category ucd-15.0.0 --chars --exclude surrogate // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Cased_Letter", CASED_LETTER), @@ -188,6 +188,7 @@ pub const CASED_LETTER: &'static [(char, char)] = &[ ('๐Ÿ„', '๐Ÿ‹'), ('๐ผ€', '๐ผ‰'), ('๐ผ‹', '๐ผž'), + ('๐ผฅ', '๐ผช'), ('๐žค€', '๐žฅƒ'), ]; @@ -383,12 +384,14 @@ pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ ('๐‘ฑ', '๐‘ฑ™'), ('๐‘ต', '๐‘ต™'), ('๐‘ถ ', '๐‘ถฉ'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐–ฉ ', '๐–ฉฉ'), ('๐–ซ€', '๐–ซ‰'), ('๐–ญ', '๐–ญ™'), ('๐ŸŽ', '๐Ÿฟ'), ('๐ž…€', '๐ž…‰'), ('๐ž‹ฐ', '๐ž‹น'), + ('๐ž“ฐ', '๐ž“น'), ('๐žฅ', '๐žฅ™'), ('๐Ÿฏฐ', '๐Ÿฏน'), ]; @@ -431,7 +434,7 @@ pub const FORMAT: &'static [(char, char)] = &[ ('\u{fff9}', '\u{fffb}'), ('\u{110bd}', '\u{110bd}'), ('\u{110cd}', '\u{110cd}'), - ('\u{13430}', '\u{13438}'), + ('\u{13430}', '\u{1343f}'), ('\u{1bca0}', '\u{1bca3}'), ('\u{1d173}', '\u{1d17a}'), ('\u{e0001}', '\u{e0001}'), @@ -922,6 +925,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '๐‘ˆซ'), + ('๐‘ˆฟ', '๐‘‰€'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -984,11 +988,15 @@ pub const LETTER: &'static [(char, char)] = &[ ('๐‘ตช', '๐‘ถ‰'), ('๐‘ถ˜', '๐‘ถ˜'), ('๐‘ป ', '๐‘ปฒ'), + ('๐‘ผ‚', '๐‘ผ‚'), + ('๐‘ผ„', '๐‘ผ'), + ('๐‘ผ’', '๐‘ผณ'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -1011,7 +1019,9 @@ pub const LETTER: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -1049,11 +1059,14 @@ pub const LETTER: &'static [(char, char)] = &[ ('๐žช', '๐Ÿ‚'), ('๐Ÿ„', '๐Ÿ‹'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐ž„€', '๐ž„ฌ'), ('๐ž„ท', '๐ž„ฝ'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '๐žŠญ'), ('๐ž‹€', '๐ž‹ซ'), + ('๐ž“', '๐ž“ซ'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -1095,12 +1108,13 @@ pub const LETTER: &'static [(char, char)] = &[ ('๐žบฅ', '๐žบฉ'), ('๐žบซ', '๐žบป'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const LETTER_NUMBER: &'static [(char, char)] = &[ @@ -1778,6 +1792,7 @@ pub const LOWERCASE_LETTER: &'static [(char, char)] = &[ ('๐Ÿ‹', '๐Ÿ‹'), ('๐ผ€', '๐ผ‰'), ('๐ผ‹', '๐ผž'), + ('๐ผฅ', '๐ผช'), ('๐žคข', '๐žฅƒ'), ]; @@ -1862,6 +1877,7 @@ pub const MARK: &'static [(char, char)] = &[ ('เณŠ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), ('\u{ce2}', '\u{ce3}'), + ('เณณ', 'เณณ'), ('\u{d00}', 'เดƒ'), ('\u{d3b}', '\u{d3c}'), ('\u{d3e}', '\u{d44}'), @@ -1880,7 +1896,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{e47}', '\u{e4e}'), ('\u{eb1}', '\u{eb1}'), ('\u{eb4}', '\u{ebc}'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('\u{f18}', '\u{f19}'), ('\u{f35}', '\u{f35}'), ('\u{f37}', '\u{f37}'), @@ -1982,6 +1998,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('๐‘€€', '๐‘€‚'), @@ -2001,6 +2018,7 @@ pub const MARK: &'static [(char, char)] = &[ ('๐‘‡Ž', '\u{111cf}'), ('๐‘ˆฌ', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112ea}'), ('\u{11300}', '๐‘Œƒ'), ('\u{1133b}', '\u{1133c}'), @@ -2048,6 +2066,12 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{11d90}', '\u{11d91}'), ('๐‘ถ“', '\u{11d97}'), ('\u{11ef3}', '๐‘ปถ'), + ('\u{11f00}', '\u{11f01}'), + ('๐‘ผƒ', '๐‘ผƒ'), + ('๐‘ผด', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f42}'), + ('\u{13440}', '\u{13440}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), @@ -2075,9 +2099,11 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e130}', '\u{1e136}'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), + ('\u{1e4ec}', '\u{1e4ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), ('\u{e0100}', '\u{e01ef}'), @@ -2218,7 +2244,9 @@ pub const MODIFIER_LETTER: &'static [(char, char)] = &[ ('๐šฟฐ', '๐šฟณ'), ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), + ('๐ž€ฐ', '๐žญ'), ('๐ž„ท', '๐ž„ฝ'), + ('๐ž“ซ', '๐ž“ซ'), ('๐žฅ‹', '๐žฅ‹'), ]; @@ -2349,7 +2377,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{e47}', '\u{e4e}'), ('\u{eb1}', '\u{eb1}'), ('\u{eb4}', '\u{ebc}'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('\u{f18}', '\u{f19}'), ('\u{f35}', '\u{f35}'), ('\u{f37}', '\u{f37}'), @@ -2480,6 +2508,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), @@ -2502,6 +2531,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112df}'), ('\u{112e3}', '\u{112ea}'), ('\u{11300}', '\u{11301}'), @@ -2563,6 +2593,12 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{11d95}', '\u{11d95}'), ('\u{11d97}', '\u{11d97}'), ('\u{11ef3}', '\u{11ef4}'), + ('\u{11f00}', '\u{11f01}'), + ('\u{11f36}', '\u{11f3a}'), + ('\u{11f40}', '\u{11f40}'), + ('\u{11f42}', '\u{11f42}'), + ('\u{13440}', '\u{13440}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), @@ -2587,9 +2623,11 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e130}', '\u{1e136}'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), + ('\u{1e4ec}', '\u{1e4ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), ('\u{e0100}', '\u{e01ef}'), @@ -2709,6 +2747,7 @@ pub const NUMBER: &'static [(char, char)] = &[ ('๐‘ฑ', '๐‘ฑฌ'), ('๐‘ต', '๐‘ต™'), ('๐‘ถ ', '๐‘ถฉ'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐‘ฟ€', '๐‘ฟ”'), ('๐’€', '๐’‘ฎ'), ('๐–ฉ ', '๐–ฉฉ'), @@ -2716,11 +2755,13 @@ pub const NUMBER: &'static [(char, char)] = &[ ('๐–ญ', '๐–ญ™'), ('๐–ญ›', '๐–ญก'), ('๐–บ€', '๐–บ–'), + ('๐‹€', '๐‹“'), ('๐‹ ', '๐‹ณ'), ('๐ ', '๐ธ'), ('๐ŸŽ', '๐Ÿฟ'), ('๐ž…€', '๐ž…‰'), ('๐ž‹ฐ', '๐ž‹น'), + ('๐ž“ฐ', '๐ž“น'), ('๐žฃ‡', '๐žฃ'), ('๐žฅ', '๐žฅ™'), ('๐žฑฑ', '๐žฒซ'), @@ -2941,7 +2982,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{cdf}', '\u{cdf}'), ('\u{ce4}', '\u{ce5}'), ('\u{cf0}', '\u{cf0}'), - ('\u{cf3}', '\u{cff}'), + ('\u{cf4}', '\u{cff}'), ('\u{d0d}', '\u{d0d}'), ('\u{d11}', '\u{d11}'), ('\u{d45}', '\u{d45}'), @@ -2971,7 +3012,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{ebe}', '\u{ebf}'), ('\u{ec5}', '\u{ec5}'), ('\u{ec7}', '\u{ec7}'), - ('\u{ece}', '\u{ecf}'), + ('\u{ecf}', '\u{ecf}'), ('\u{eda}', '\u{edb}'), ('\u{ee0}', '\u{eff}'), ('\u{f48}', '\u{f48}'), @@ -3243,7 +3284,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{10e7f}', '\u{10e7f}'), ('\u{10eaa}', '\u{10eaa}'), ('\u{10eae}', '\u{10eaf}'), - ('\u{10eb2}', '\u{10eff}'), + ('\u{10eb2}', '\u{10efc}'), ('\u{10f28}', '\u{10f2f}'), ('\u{10f5a}', '\u{10f6f}'), ('\u{10f8a}', '\u{10faf}'), @@ -3261,7 +3302,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{111e0}', '\u{111e0}'), ('\u{111f5}', '\u{111ff}'), ('\u{11212}', '\u{11212}'), - ('\u{1123f}', '\u{1127f}'), + ('\u{11242}', '\u{1127f}'), ('\u{11287}', '\u{11287}'), ('\u{11289}', '\u{11289}'), ('\u{1128e}', '\u{1128e}'), @@ -3313,7 +3354,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{119e5}', '\u{119ff}'), ('\u{11a48}', '\u{11a4f}'), ('\u{11aa3}', '\u{11aaf}'), - ('\u{11af9}', '\u{11bff}'), + ('\u{11af9}', '\u{11aff}'), + ('\u{11b0a}', '\u{11bff}'), ('\u{11c09}', '\u{11c09}'), ('\u{11c37}', '\u{11c37}'), ('\u{11c46}', '\u{11c4f}'), @@ -3334,7 +3376,10 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{11d92}', '\u{11d92}'), ('\u{11d99}', '\u{11d9f}'), ('\u{11daa}', '\u{11edf}'), - ('\u{11ef9}', '\u{11faf}'), + ('\u{11ef9}', '\u{11eff}'), + ('\u{11f11}', '\u{11f11}'), + ('\u{11f3b}', '\u{11f3d}'), + ('\u{11f5a}', '\u{11faf}'), ('\u{11fb1}', '\u{11fbf}'), ('\u{11ff2}', '\u{11ffe}'), ('\u{1239a}', '\u{123ff}'), @@ -3342,7 +3387,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{12475}', '\u{1247f}'), ('\u{12544}', '\u{12f8f}'), ('\u{12ff3}', '\u{12fff}'), - ('\u{1342f}', '\u{143ff}'), + ('\u{13430}', '\u{1343f}'), + ('\u{13456}', '\u{143ff}'), ('\u{14647}', '\u{167ff}'), ('\u{16a39}', '\u{16a3f}'), ('\u{16a5f}', '\u{16a5f}'), @@ -3368,8 +3414,10 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1aff4}', '\u{1aff4}'), ('\u{1affc}', '\u{1affc}'), ('\u{1afff}', '\u{1afff}'), - ('\u{1b123}', '\u{1b14f}'), - ('\u{1b153}', '\u{1b163}'), + ('\u{1b123}', '\u{1b131}'), + ('\u{1b133}', '\u{1b14f}'), + ('\u{1b153}', '\u{1b154}'), + ('\u{1b156}', '\u{1b163}'), ('\u{1b168}', '\u{1b16f}'), ('\u{1b2fc}', '\u{1bbff}'), ('\u{1bc6b}', '\u{1bc6f}'), @@ -3384,7 +3432,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1d127}', '\u{1d128}'), ('\u{1d173}', '\u{1d17a}'), ('\u{1d1eb}', '\u{1d1ff}'), - ('\u{1d246}', '\u{1d2df}'), + ('\u{1d246}', '\u{1d2bf}'), + ('\u{1d2d4}', '\u{1d2df}'), ('\u{1d2f4}', '\u{1d2ff}'), ('\u{1d357}', '\u{1d35f}'), ('\u{1d379}', '\u{1d3ff}'), @@ -3411,19 +3460,23 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1da8c}', '\u{1da9a}'), ('\u{1daa0}', '\u{1daa0}'), ('\u{1dab0}', '\u{1deff}'), - ('\u{1df1f}', '\u{1dfff}'), + ('\u{1df1f}', '\u{1df24}'), + ('\u{1df2b}', '\u{1dfff}'), ('\u{1e007}', '\u{1e007}'), ('\u{1e019}', '\u{1e01a}'), ('\u{1e022}', '\u{1e022}'), ('\u{1e025}', '\u{1e025}'), - ('\u{1e02b}', '\u{1e0ff}'), + ('\u{1e02b}', '\u{1e02f}'), + ('\u{1e06e}', '\u{1e08e}'), + ('\u{1e090}', '\u{1e0ff}'), ('\u{1e12d}', '\u{1e12f}'), ('\u{1e13e}', '\u{1e13f}'), ('\u{1e14a}', '\u{1e14d}'), ('\u{1e150}', '\u{1e28f}'), ('\u{1e2af}', '\u{1e2bf}'), ('\u{1e2fa}', '\u{1e2fe}'), - ('\u{1e300}', '\u{1e7df}'), + ('\u{1e300}', '\u{1e4cf}'), + ('\u{1e4fa}', '\u{1e7df}'), ('\u{1e7e7}', '\u{1e7e7}'), ('\u{1e7ec}', '\u{1e7ec}'), ('\u{1e7ef}', '\u{1e7ef}'), @@ -3481,11 +3534,11 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1f249}', '\u{1f24f}'), ('\u{1f252}', '\u{1f25f}'), ('\u{1f266}', '\u{1f2ff}'), - ('\u{1f6d8}', '\u{1f6dc}'), + ('\u{1f6d8}', '\u{1f6db}'), ('\u{1f6ed}', '\u{1f6ef}'), ('\u{1f6fd}', '\u{1f6ff}'), - ('\u{1f774}', '\u{1f77f}'), - ('\u{1f7d9}', '\u{1f7df}'), + ('\u{1f777}', '\u{1f77a}'), + ('\u{1f7da}', '\u{1f7df}'), ('\u{1f7ec}', '\u{1f7ef}'), ('\u{1f7f1}', '\u{1f7ff}'), ('\u{1f80c}', '\u{1f80f}'), @@ -3496,25 +3549,24 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1f8b2}', '\u{1f8ff}'), ('\u{1fa54}', '\u{1fa5f}'), ('\u{1fa6e}', '\u{1fa6f}'), - ('\u{1fa75}', '\u{1fa77}'), ('\u{1fa7d}', '\u{1fa7f}'), - ('\u{1fa87}', '\u{1fa8f}'), - ('\u{1faad}', '\u{1faaf}'), - ('\u{1fabb}', '\u{1fabf}'), - ('\u{1fac6}', '\u{1facf}'), - ('\u{1fada}', '\u{1fadf}'), - ('\u{1fae8}', '\u{1faef}'), - ('\u{1faf7}', '\u{1faff}'), + ('\u{1fa89}', '\u{1fa8f}'), + ('\u{1fabe}', '\u{1fabe}'), + ('\u{1fac6}', '\u{1facd}'), + ('\u{1fadc}', '\u{1fadf}'), + ('\u{1fae9}', '\u{1faef}'), + ('\u{1faf9}', '\u{1faff}'), ('\u{1fb93}', '\u{1fb93}'), ('\u{1fbcb}', '\u{1fbef}'), ('\u{1fbfa}', '\u{1ffff}'), ('\u{2a6e0}', '\u{2a6ff}'), - ('\u{2b739}', '\u{2b73f}'), + ('\u{2b73a}', '\u{2b73f}'), ('\u{2b81e}', '\u{2b81f}'), ('\u{2cea2}', '\u{2ceaf}'), ('\u{2ebe1}', '\u{2f7ff}'), ('\u{2fa1e}', '\u{2ffff}'), - ('\u{3134b}', '\u{e00ff}'), + ('\u{3134b}', '\u{3134f}'), + ('\u{323b0}', '\u{e00ff}'), ('\u{e01f0}', '\u{10ffff}'), ]; @@ -3883,6 +3935,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '๐‘ˆซ'), + ('๐‘ˆฟ', '๐‘‰€'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -3944,11 +3997,15 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('๐‘ตช', '๐‘ถ‰'), ('๐‘ถ˜', '๐‘ถ˜'), ('๐‘ป ', '๐‘ปฒ'), + ('๐‘ผ‚', '๐‘ผ‚'), + ('๐‘ผ„', '๐‘ผ'), + ('๐‘ผ’', '๐‘ผณ'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -3963,7 +4020,9 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('๐˜ €', '๐˜ณ•'), ('๐˜ด€', '๐˜ดˆ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -3975,6 +4034,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '๐žŠญ'), ('๐ž‹€', '๐ž‹ซ'), + ('๐ž“', '๐ž“ช'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -4014,12 +4074,13 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('๐žบฅ', '๐žบฉ'), ('๐žบซ', '๐žบป'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const OTHER_NUMBER: &'static [(char, char)] = &[ @@ -4085,6 +4146,7 @@ pub const OTHER_NUMBER: &'static [(char, char)] = &[ ('๐‘ฟ€', '๐‘ฟ”'), ('๐–ญ›', '๐–ญก'), ('๐–บ€', '๐–บ–'), + ('๐‹€', '๐‹“'), ('๐‹ ', '๐‹ณ'), ('๐ ', '๐ธ'), ('๐žฃ‡', '๐žฃ'), @@ -4267,9 +4329,11 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('๐‘จฟ', '๐‘ฉ†'), ('๐‘ชš', '๐‘ชœ'), ('๐‘ชž', '๐‘ชข'), + ('๐‘ฌ€', '๐‘ฌ‰'), ('๐‘ฑ', '๐‘ฑ…'), ('๐‘ฑฐ', '๐‘ฑฑ'), ('๐‘ปท', '๐‘ปธ'), + ('๐‘ฝƒ', '๐‘ฝ'), ('๐‘ฟฟ', '๐‘ฟฟ'), ('๐’‘ฐ', '๐’‘ด'), ('๐’ฟฑ', '๐’ฟฒ'), @@ -4446,10 +4510,10 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('๐Ÿ‰ ', '๐Ÿ‰ฅ'), ('๐ŸŒ€', '๐Ÿบ'), ('๐Ÿ€', '๐Ÿ›—'), - ('๐Ÿ›', '๐Ÿ›ฌ'), + ('๐Ÿ›œ', '๐Ÿ›ฌ'), ('๐Ÿ›ฐ', '๐Ÿ›ผ'), - ('๐Ÿœ€', '๐Ÿณ'), - ('๐Ÿž€', '๐ŸŸ˜'), + ('๐Ÿœ€', '๐Ÿถ'), + ('๐Ÿป', '๐ŸŸ™'), ('๐ŸŸ ', '๐ŸŸซ'), ('๐ŸŸฐ', '๐ŸŸฐ'), ('๐Ÿ €', '๐Ÿ ‹'), @@ -4460,15 +4524,13 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('๐Ÿขฐ', '๐Ÿขฑ'), ('๐Ÿค€', '๐Ÿฉ“'), ('๐Ÿฉ ', '๐Ÿฉญ'), - ('๐Ÿฉฐ', '๐Ÿฉด'), - ('๐Ÿฉธ', '๐Ÿฉผ'), - ('๐Ÿช€', '๐Ÿช†'), - ('๐Ÿช', '๐Ÿชฌ'), - ('๐Ÿชฐ', '๐Ÿชบ'), - ('๐Ÿซ€', '๐Ÿซ…'), - ('๐Ÿซ', '๐Ÿซ™'), - ('๐Ÿซ ', '๐Ÿซง'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿฉฐ', '๐Ÿฉผ'), + ('๐Ÿช€', '๐Ÿชˆ'), + ('๐Ÿช', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿซ…'), + ('๐ŸซŽ', '๐Ÿซ›'), + ('๐Ÿซ ', '๐Ÿซจ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ('๐Ÿฌ€', '๐Ÿฎ’'), ('๐Ÿฎ”', '๐ŸฏŠ'), ]; @@ -4657,9 +4719,11 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('๐‘จฟ', '๐‘ฉ†'), ('๐‘ชš', '๐‘ชœ'), ('๐‘ชž', '๐‘ชข'), + ('๐‘ฌ€', '๐‘ฌ‰'), ('๐‘ฑ', '๐‘ฑ…'), ('๐‘ฑฐ', '๐‘ฑฑ'), ('๐‘ปท', '๐‘ปธ'), + ('๐‘ฝƒ', '๐‘ฝ'), ('๐‘ฟฟ', '๐‘ฟฟ'), ('๐’‘ฐ', '๐’‘ด'), ('๐’ฟฑ', '๐’ฟฒ'), @@ -4731,6 +4795,7 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('เณ‡', 'เณˆ'), ('เณŠ', 'เณ‹'), ('\u{cd5}', '\u{cd6}'), + ('เณณ', 'เณณ'), ('เด‚', 'เดƒ'), ('\u{d3e}', 'เต€'), ('เต†', 'เตˆ'), @@ -4869,6 +4934,10 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('๐‘ถ“', '๐‘ถ”'), ('๐‘ถ–', '๐‘ถ–'), ('๐‘ปต', '๐‘ปถ'), + ('๐‘ผƒ', '๐‘ผƒ'), + ('๐‘ผด', '๐‘ผต'), + ('๐‘ผพ', '๐‘ผฟ'), + ('๐‘ฝ', '๐‘ฝ'), ('๐–ฝ‘', '๐–พ‡'), ('๐–ฟฐ', '๐–ฟฑ'), ('\u{1d165}', '๐…ฆ'), @@ -5085,10 +5154,10 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('๐Ÿ‰', '๐Ÿ‰‘'), ('๐Ÿ‰ ', '๐Ÿ‰ฅ'), ('๐ŸŒ€', '๐Ÿ›—'), - ('๐Ÿ›', '๐Ÿ›ฌ'), + ('๐Ÿ›œ', '๐Ÿ›ฌ'), ('๐Ÿ›ฐ', '๐Ÿ›ผ'), - ('๐Ÿœ€', '๐Ÿณ'), - ('๐Ÿž€', '๐ŸŸ˜'), + ('๐Ÿœ€', '๐Ÿถ'), + ('๐Ÿป', '๐ŸŸ™'), ('๐ŸŸ ', '๐ŸŸซ'), ('๐ŸŸฐ', '๐ŸŸฐ'), ('๐Ÿ €', '๐Ÿ ‹'), @@ -5099,15 +5168,13 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('๐Ÿขฐ', '๐Ÿขฑ'), ('๐Ÿค€', '๐Ÿฉ“'), ('๐Ÿฉ ', '๐Ÿฉญ'), - ('๐Ÿฉฐ', '๐Ÿฉด'), - ('๐Ÿฉธ', '๐Ÿฉผ'), - ('๐Ÿช€', '๐Ÿช†'), - ('๐Ÿช', '๐Ÿชฌ'), - ('๐Ÿชฐ', '๐Ÿชบ'), - ('๐Ÿซ€', '๐Ÿซ…'), - ('๐Ÿซ', '๐Ÿซ™'), - ('๐Ÿซ ', '๐Ÿซง'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿฉฐ', '๐Ÿฉผ'), + ('๐Ÿช€', '๐Ÿชˆ'), + ('๐Ÿช', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿซ…'), + ('๐ŸซŽ', '๐Ÿซ›'), + ('๐Ÿซ ', '๐Ÿซจ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ('๐Ÿฌ€', '๐Ÿฎ’'), ('๐Ÿฎ”', '๐ŸฏŠ'), ]; @@ -5247,7 +5314,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{cdf}', '\u{cdf}'), ('\u{ce4}', '\u{ce5}'), ('\u{cf0}', '\u{cf0}'), - ('\u{cf3}', '\u{cff}'), + ('\u{cf4}', '\u{cff}'), ('\u{d0d}', '\u{d0d}'), ('\u{d11}', '\u{d11}'), ('\u{d45}', '\u{d45}'), @@ -5277,7 +5344,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{ebe}', '\u{ebf}'), ('\u{ec5}', '\u{ec5}'), ('\u{ec7}', '\u{ec7}'), - ('\u{ece}', '\u{ecf}'), + ('\u{ecf}', '\u{ecf}'), ('\u{eda}', '\u{edb}'), ('\u{ee0}', '\u{eff}'), ('\u{f48}', '\u{f48}'), @@ -5547,7 +5614,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{10e7f}', '\u{10e7f}'), ('\u{10eaa}', '\u{10eaa}'), ('\u{10eae}', '\u{10eaf}'), - ('\u{10eb2}', '\u{10eff}'), + ('\u{10eb2}', '\u{10efc}'), ('\u{10f28}', '\u{10f2f}'), ('\u{10f5a}', '\u{10f6f}'), ('\u{10f8a}', '\u{10faf}'), @@ -5565,7 +5632,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{111e0}', '\u{111e0}'), ('\u{111f5}', '\u{111ff}'), ('\u{11212}', '\u{11212}'), - ('\u{1123f}', '\u{1127f}'), + ('\u{11242}', '\u{1127f}'), ('\u{11287}', '\u{11287}'), ('\u{11289}', '\u{11289}'), ('\u{1128e}', '\u{1128e}'), @@ -5617,7 +5684,8 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{119e5}', '\u{119ff}'), ('\u{11a48}', '\u{11a4f}'), ('\u{11aa3}', '\u{11aaf}'), - ('\u{11af9}', '\u{11bff}'), + ('\u{11af9}', '\u{11aff}'), + ('\u{11b0a}', '\u{11bff}'), ('\u{11c09}', '\u{11c09}'), ('\u{11c37}', '\u{11c37}'), ('\u{11c46}', '\u{11c4f}'), @@ -5638,7 +5706,10 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{11d92}', '\u{11d92}'), ('\u{11d99}', '\u{11d9f}'), ('\u{11daa}', '\u{11edf}'), - ('\u{11ef9}', '\u{11faf}'), + ('\u{11ef9}', '\u{11eff}'), + ('\u{11f11}', '\u{11f11}'), + ('\u{11f3b}', '\u{11f3d}'), + ('\u{11f5a}', '\u{11faf}'), ('\u{11fb1}', '\u{11fbf}'), ('\u{11ff2}', '\u{11ffe}'), ('\u{1239a}', '\u{123ff}'), @@ -5646,8 +5717,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{12475}', '\u{1247f}'), ('\u{12544}', '\u{12f8f}'), ('\u{12ff3}', '\u{12fff}'), - ('\u{1342f}', '\u{1342f}'), - ('\u{13439}', '\u{143ff}'), + ('\u{13456}', '\u{143ff}'), ('\u{14647}', '\u{167ff}'), ('\u{16a39}', '\u{16a3f}'), ('\u{16a5f}', '\u{16a5f}'), @@ -5673,8 +5743,10 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1aff4}', '\u{1aff4}'), ('\u{1affc}', '\u{1affc}'), ('\u{1afff}', '\u{1afff}'), - ('\u{1b123}', '\u{1b14f}'), - ('\u{1b153}', '\u{1b163}'), + ('\u{1b123}', '\u{1b131}'), + ('\u{1b133}', '\u{1b14f}'), + ('\u{1b153}', '\u{1b154}'), + ('\u{1b156}', '\u{1b163}'), ('\u{1b168}', '\u{1b16f}'), ('\u{1b2fc}', '\u{1bbff}'), ('\u{1bc6b}', '\u{1bc6f}'), @@ -5688,7 +5760,8 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1d0f6}', '\u{1d0ff}'), ('\u{1d127}', '\u{1d128}'), ('\u{1d1eb}', '\u{1d1ff}'), - ('\u{1d246}', '\u{1d2df}'), + ('\u{1d246}', '\u{1d2bf}'), + ('\u{1d2d4}', '\u{1d2df}'), ('\u{1d2f4}', '\u{1d2ff}'), ('\u{1d357}', '\u{1d35f}'), ('\u{1d379}', '\u{1d3ff}'), @@ -5715,19 +5788,23 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1da8c}', '\u{1da9a}'), ('\u{1daa0}', '\u{1daa0}'), ('\u{1dab0}', '\u{1deff}'), - ('\u{1df1f}', '\u{1dfff}'), + ('\u{1df1f}', '\u{1df24}'), + ('\u{1df2b}', '\u{1dfff}'), ('\u{1e007}', '\u{1e007}'), ('\u{1e019}', '\u{1e01a}'), ('\u{1e022}', '\u{1e022}'), ('\u{1e025}', '\u{1e025}'), - ('\u{1e02b}', '\u{1e0ff}'), + ('\u{1e02b}', '\u{1e02f}'), + ('\u{1e06e}', '\u{1e08e}'), + ('\u{1e090}', '\u{1e0ff}'), ('\u{1e12d}', '\u{1e12f}'), ('\u{1e13e}', '\u{1e13f}'), ('\u{1e14a}', '\u{1e14d}'), ('\u{1e150}', '\u{1e28f}'), ('\u{1e2af}', '\u{1e2bf}'), ('\u{1e2fa}', '\u{1e2fe}'), - ('\u{1e300}', '\u{1e7df}'), + ('\u{1e300}', '\u{1e4cf}'), + ('\u{1e4fa}', '\u{1e7df}'), ('\u{1e7e7}', '\u{1e7e7}'), ('\u{1e7ec}', '\u{1e7ec}'), ('\u{1e7ef}', '\u{1e7ef}'), @@ -5785,11 +5862,11 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1f249}', '\u{1f24f}'), ('\u{1f252}', '\u{1f25f}'), ('\u{1f266}', '\u{1f2ff}'), - ('\u{1f6d8}', '\u{1f6dc}'), + ('\u{1f6d8}', '\u{1f6db}'), ('\u{1f6ed}', '\u{1f6ef}'), ('\u{1f6fd}', '\u{1f6ff}'), - ('\u{1f774}', '\u{1f77f}'), - ('\u{1f7d9}', '\u{1f7df}'), + ('\u{1f777}', '\u{1f77a}'), + ('\u{1f7da}', '\u{1f7df}'), ('\u{1f7ec}', '\u{1f7ef}'), ('\u{1f7f1}', '\u{1f7ff}'), ('\u{1f80c}', '\u{1f80f}'), @@ -5800,25 +5877,24 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1f8b2}', '\u{1f8ff}'), ('\u{1fa54}', '\u{1fa5f}'), ('\u{1fa6e}', '\u{1fa6f}'), - ('\u{1fa75}', '\u{1fa77}'), ('\u{1fa7d}', '\u{1fa7f}'), - ('\u{1fa87}', '\u{1fa8f}'), - ('\u{1faad}', '\u{1faaf}'), - ('\u{1fabb}', '\u{1fabf}'), - ('\u{1fac6}', '\u{1facf}'), - ('\u{1fada}', '\u{1fadf}'), - ('\u{1fae8}', '\u{1faef}'), - ('\u{1faf7}', '\u{1faff}'), + ('\u{1fa89}', '\u{1fa8f}'), + ('\u{1fabe}', '\u{1fabe}'), + ('\u{1fac6}', '\u{1facd}'), + ('\u{1fadc}', '\u{1fadf}'), + ('\u{1fae9}', '\u{1faef}'), + ('\u{1faf9}', '\u{1faff}'), ('\u{1fb93}', '\u{1fb93}'), ('\u{1fbcb}', '\u{1fbef}'), ('\u{1fbfa}', '\u{1ffff}'), ('\u{2a6e0}', '\u{2a6ff}'), - ('\u{2b739}', '\u{2b73f}'), + ('\u{2b73a}', '\u{2b73f}'), ('\u{2b81e}', '\u{2b81f}'), ('\u{2cea2}', '\u{2ceaf}'), ('\u{2ebe1}', '\u{2f7ff}'), ('\u{2fa1e}', '\u{2ffff}'), - ('\u{3134b}', '\u{e0000}'), + ('\u{3134b}', '\u{3134f}'), + ('\u{323b0}', '\u{e0000}'), ('\u{e0002}', '\u{e001f}'), ('\u{e0080}', '\u{e00ff}'), ('\u{e01f0}', '\u{effff}'), diff --git a/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs b/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs index 38cfc73af..294dfbdcc 100644 --- a/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs +++ b/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate grapheme-cluster-break /tmp/ucd --chars +// ucd-generate grapheme-cluster-break ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("CR", CR), @@ -38,7 +38,7 @@ pub const CONTROL: &'static [(char, char)] = &[ ('\u{2060}', '\u{206f}'), ('\u{feff}', '\u{feff}'), ('\u{fff0}', '\u{fffb}'), - ('\u{13430}', '\u{13438}'), + ('\u{13430}', '\u{1343f}'), ('\u{1bca0}', '\u{1bca3}'), ('\u{1d173}', '\u{1d17a}'), ('\u{e0000}', '\u{e001f}'), @@ -149,7 +149,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{e47}', '\u{e4e}'), ('\u{eb1}', '\u{eb1}'), ('\u{eb4}', '\u{ebc}'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('\u{f18}', '\u{f19}'), ('\u{f35}', '\u{f35}'), ('\u{f37}', '\u{f37}'), @@ -278,6 +278,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), @@ -300,6 +301,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112df}'), ('\u{112e3}', '\u{112ea}'), ('\u{11300}', '\u{11301}'), @@ -367,6 +369,12 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11d95}', '\u{11d95}'), ('\u{11d97}', '\u{11d97}'), ('\u{11ef3}', '\u{11ef4}'), + ('\u{11f00}', '\u{11f01}'), + ('\u{11f36}', '\u{11f3a}'), + ('\u{11f40}', '\u{11f40}'), + ('\u{11f42}', '\u{11f42}'), + ('\u{13440}', '\u{13440}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), @@ -393,9 +401,11 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e130}', '\u{1e136}'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), + ('\u{1e4ec}', '\u{1e4ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), ('๐Ÿป', '๐Ÿฟ'), @@ -1226,6 +1236,7 @@ pub const PREPEND: &'static [(char, char)] = &[ ('๐‘จบ', '๐‘จบ'), ('๐‘ช„', '๐‘ช‰'), ('๐‘ต†', '๐‘ต†'), + ('๐‘ผ‚', '๐‘ผ‚'), ]; pub const REGIONAL_INDICATOR: &'static [(char, char)] = &[('๐Ÿ‡ฆ', '๐Ÿ‡ฟ')]; @@ -1262,6 +1273,7 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('เณƒ', 'เณ„'), ('เณ‡', 'เณˆ'), ('เณŠ', 'เณ‹'), + ('เณณ', 'เณณ'), ('เด‚', 'เดƒ'), ('เดฟ', 'เต€'), ('เต†', 'เตˆ'), @@ -1387,6 +1399,10 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('๐‘ถ“', '๐‘ถ”'), ('๐‘ถ–', '๐‘ถ–'), ('๐‘ปต', '๐‘ปถ'), + ('๐‘ผƒ', '๐‘ผƒ'), + ('๐‘ผด', '๐‘ผต'), + ('๐‘ผพ', '๐‘ผฟ'), + ('๐‘ฝ', '๐‘ฝ'), ('๐–ฝ‘', '๐–พ‡'), ('๐–ฟฐ', '๐–ฟฑ'), ('๐…ฆ', '๐…ฆ'), diff --git a/regex-syntax/src/unicode_tables/perl_decimal.rs b/regex-syntax/src/unicode_tables/perl_decimal.rs index 9a14e4395..4f4c08a12 100644 --- a/regex-syntax/src/unicode_tables/perl_decimal.rs +++ b/regex-syntax/src/unicode_tables/perl_decimal.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate general-category /tmp/ucd --chars --include decimalnumber +// ucd-generate general-category ucd-15.0.0 --chars --include decimalnumber // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[("Decimal_Number", DECIMAL_NUMBER)]; @@ -64,12 +64,14 @@ pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ ('๐‘ฑ', '๐‘ฑ™'), ('๐‘ต', '๐‘ต™'), ('๐‘ถ ', '๐‘ถฉ'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐–ฉ ', '๐–ฉฉ'), ('๐–ซ€', '๐–ซ‰'), ('๐–ญ', '๐–ญ™'), ('๐ŸŽ', '๐Ÿฟ'), ('๐ž…€', '๐ž…‰'), ('๐ž‹ฐ', '๐ž‹น'), + ('๐ž“ฐ', '๐ž“น'), ('๐žฅ', '๐žฅ™'), ('๐Ÿฏฐ', '๐Ÿฏน'), ]; diff --git a/regex-syntax/src/unicode_tables/perl_space.rs b/regex-syntax/src/unicode_tables/perl_space.rs index bb69ce1ba..174169579 100644 --- a/regex-syntax/src/unicode_tables/perl_space.rs +++ b/regex-syntax/src/unicode_tables/perl_space.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-bool /tmp/ucd --chars --include whitespace +// ucd-generate property-bool ucd-15.0.0 --chars --include whitespace // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[("White_Space", WHITE_SPACE)]; diff --git a/regex-syntax/src/unicode_tables/perl_word.rs b/regex-syntax/src/unicode_tables/perl_word.rs index 2c8171b2b..c1b66bd9a 100644 --- a/regex-syntax/src/unicode_tables/perl_word.rs +++ b/regex-syntax/src/unicode_tables/perl_word.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate perl-word /tmp/ucd --chars +// ucd-generate perl-word ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const PERL_WORD: &'static [(char, char)] = &[ ('0', '9'), @@ -164,7 +164,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('เณ', 'เณž'), ('เณ ', '\u{ce3}'), ('เณฆ', 'เณฏ'), - ('เณฑ', 'เณฒ'), + ('เณฑ', 'เณณ'), ('\u{d00}', 'เดŒ'), ('เดŽ', 'เด'), ('เด’', '\u{d44}'), @@ -197,7 +197,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('เบง', 'เบฝ'), ('เป€', 'เป„'), ('เป†', 'เป†'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('เป', 'เป™'), ('เปœ', 'เปŸ'), ('เผ€', 'เผ€'), @@ -511,7 +511,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('๐บ€', '๐บฉ'), ('\u{10eab}', '\u{10eac}'), ('๐บฐ', '๐บฑ'), - ('๐ผ€', '๐ผœ'), + ('\u{10efd}', '๐ผœ'), ('๐ผง', '๐ผง'), ('๐ผฐ', '\u{10f50}'), ('๐ฝฐ', '\u{10f85}'), @@ -534,7 +534,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{11237}'), - ('\u{1123e}', '\u{1123e}'), + ('\u{1123e}', '\u{11241}'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -615,12 +615,17 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('๐‘ถ“', '๐‘ถ˜'), ('๐‘ถ ', '๐‘ถฉ'), ('๐‘ป ', '๐‘ปถ'), + ('\u{11f00}', '๐‘ผ'), + ('๐‘ผ’', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f42}'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('\u{13440}', '\u{13455}'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -648,7 +653,9 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -702,17 +709,21 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{1da9b}', '\u{1da9f}'), ('\u{1daa1}', '\u{1daaf}'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), ('๐ž„€', '๐ž„ฌ'), ('\u{1e130}', '๐ž„ฝ'), ('๐ž…€', '๐ž…‰'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '\u{1e2ae}'), ('๐ž‹€', '๐ž‹น'), + ('๐ž“', '๐ž“น'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -759,11 +770,12 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('๐Ÿ…ฐ', '๐Ÿ†‰'), ('๐Ÿฏฐ', '๐Ÿฏน'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ('\u{e0100}', '\u{e01ef}'), ]; diff --git a/regex-syntax/src/unicode_tables/property_bool.rs b/regex-syntax/src/unicode_tables/property_bool.rs index 8fb211030..a3e84b519 100644 --- a/regex-syntax/src/unicode_tables/property_bool.rs +++ b/regex-syntax/src/unicode_tables/property_bool.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-bool /tmp/ucd --chars +// ucd-generate property-bool ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ASCII_Hex_Digit", ASCII_HEX_DIGIT), @@ -207,8 +207,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('เฏŠ', 'เฏŒ'), ('เฏ', 'เฏ'), ('\u{bd7}', '\u{bd7}'), - ('\u{c00}', 'เฐƒ'), - ('เฐ…', 'เฐŒ'), + ('\u{c00}', 'เฐŒ'), ('เฐŽ', 'เฐ'), ('เฐ’', 'เฐจ'), ('เฐช', 'เฐน'), @@ -231,7 +230,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{cd5}', '\u{cd6}'), ('เณ', 'เณž'), ('เณ ', '\u{ce3}'), - ('เณฑ', 'เณฒ'), + ('เณฑ', 'เณณ'), ('\u{d00}', 'เดŒ'), ('เดŽ', 'เด'), ('เด’', 'เดบ'), @@ -269,7 +268,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('เผ€', 'เผ€'), ('เฝ€', 'เฝ‡'), ('เฝ‰', 'เฝฌ'), - ('\u{f71}', '\u{f81}'), + ('\u{f71}', '\u{f83}'), ('เพˆ', '\u{f97}'), ('\u{f99}', '\u{fbc}'), ('แ€€', '\u{1036}'), @@ -571,7 +570,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('๐ฟ ', '๐ฟถ'), ('๐‘€€', '\u{11045}'), ('๐‘ฑ', '๐‘ต'), - ('๐‘‚‚', '๐‘‚ธ'), + ('\u{11080}', '๐‘‚ธ'), ('\u{110c2}', '\u{110c2}'), ('๐‘ƒ', '๐‘ƒจ'), ('\u{11100}', '\u{11132}'), @@ -586,7 +585,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{11234}'), ('\u{11237}', '\u{11237}'), - ('\u{1123e}', '\u{1123e}'), + ('\u{1123e}', '\u{11241}'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -666,12 +665,16 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('๐‘ถ“', '๐‘ถ–'), ('๐‘ถ˜', '๐‘ถ˜'), ('๐‘ป ', '๐‘ปถ'), + ('\u{11f00}', '๐‘ผ'), + ('๐‘ผ’', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f40}'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -695,7 +698,9 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -734,16 +739,20 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('๐žช', '๐Ÿ‚'), ('๐Ÿ„', '๐Ÿ‹'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), ('๐ž„€', '๐ž„ฌ'), ('๐ž„ท', '๐ž„ฝ'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '๐žŠญ'), ('๐ž‹€', '๐ž‹ซ'), + ('๐ž“', '๐ž“ซ'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -789,12 +798,13 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('๐Ÿ…', '๐Ÿ…ฉ'), ('๐Ÿ…ฐ', '๐Ÿ†‰'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const BIDI_CONTROL: &'static [(char, char)] = &[ @@ -1035,7 +1045,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{eb1}', '\u{eb1}'), ('\u{eb4}', '\u{ebc}'), ('เป†', 'เป†'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('\u{f18}', '\u{f19}'), ('\u{f35}', '\u{f35}'), ('\u{f37}', '\u{f37}'), @@ -1224,6 +1234,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), @@ -1248,6 +1259,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112df}'), ('\u{112e3}', '\u{112ea}'), ('\u{11300}', '\u{11301}'), @@ -1309,7 +1321,12 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{11d95}', '\u{11d95}'), ('\u{11d97}', '\u{11d97}'), ('\u{11ef3}', '\u{11ef4}'), - ('\u{13430}', '\u{13438}'), + ('\u{11f00}', '\u{11f01}'), + ('\u{11f36}', '\u{11f3a}'), + ('\u{11f40}', '\u{11f40}'), + ('\u{11f42}', '\u{11f42}'), + ('\u{13430}', '\u{13440}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('๐–ญ€', '๐–ญƒ'), @@ -1340,9 +1357,12 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e130}', '๐ž„ฝ'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), + ('๐ž“ซ', '\u{1e4ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '๐žฅ‹'), ('๐Ÿป', '๐Ÿฟ'), @@ -1383,7 +1403,7 @@ pub const CASED: &'static [(char, char)] = &[ ('แƒ‡', 'แƒ‡'), ('แƒ', 'แƒ'), ('แƒ', 'แƒบ'), - ('แƒฝ', 'แƒฟ'), + ('แƒผ', 'แƒฟ'), ('แŽ ', 'แต'), ('แธ', 'แฝ'), ('แฒ€', 'แฒˆ'), @@ -1443,10 +1463,10 @@ pub const CASED: &'static [(char, char)] = &[ ('๊Ÿ', '๊Ÿ‘'), ('๊Ÿ“', '๊Ÿ“'), ('๊Ÿ•', '๊Ÿ™'), - ('๊Ÿต', '๊Ÿถ'), + ('๊Ÿฒ', '๊Ÿถ'), ('๊Ÿธ', '๊Ÿบ'), ('๊ฌฐ', '๊ญš'), - ('๊ญœ', '๊ญจ'), + ('๊ญœ', '๊ญฉ'), ('๊ญฐ', '๊ฎฟ'), ('๏ฌ€', '๏ฌ†'), ('๏ฌ“', '๏ฌ—'), @@ -1503,6 +1523,8 @@ pub const CASED: &'static [(char, char)] = &[ ('๐Ÿ„', '๐Ÿ‹'), ('๐ผ€', '๐ผ‰'), ('๐ผ‹', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐žค€', '๐žฅƒ'), ('๐Ÿ„ฐ', '๐Ÿ…‰'), ('๐Ÿ…', '๐Ÿ…ฉ'), @@ -4336,6 +4358,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('๐žฒ', '๐žบ'), ('\u{10ae5}', '\u{10ae6}'), ('๐ดข', '\u{10d27}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('\u{11046}', '\u{11046}'), @@ -4369,6 +4392,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{11d42}', '\u{11d42}'), ('\u{11d44}', '\u{11d45}'), ('\u{11d97}', '\u{11d97}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f8f}', '๐–พŸ'), @@ -4383,6 +4407,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{1d17b}', '\u{1d182}'), ('\u{1d185}', '\u{1d18b}'), ('\u{1d1aa}', '\u{1d1ad}'), + ('๐ž€ฐ', '๐žญ'), ('\u{1e130}', '\u{1e136}'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), @@ -4526,7 +4551,7 @@ pub const EMOJI: &'static [(char, char)] = &[ ('๐Ÿš€', '๐Ÿ›…'), ('๐Ÿ›‹', '๐Ÿ›’'), ('๐Ÿ›•', '๐Ÿ›—'), - ('๐Ÿ›', '๐Ÿ›ฅ'), + ('๐Ÿ›œ', '๐Ÿ›ฅ'), ('๐Ÿ›ฉ', '๐Ÿ›ฉ'), ('๐Ÿ›ซ', '๐Ÿ›ฌ'), ('๐Ÿ›ฐ', '๐Ÿ›ฐ'), @@ -4536,15 +4561,13 @@ pub const EMOJI: &'static [(char, char)] = &[ ('๐ŸคŒ', '๐Ÿคบ'), ('๐Ÿคผ', '๐Ÿฅ…'), ('๐Ÿฅ‡', '๐Ÿงฟ'), - ('๐Ÿฉฐ', '๐Ÿฉด'), - ('๐Ÿฉธ', '๐Ÿฉผ'), - ('๐Ÿช€', '๐Ÿช†'), - ('๐Ÿช', '๐Ÿชฌ'), - ('๐Ÿชฐ', '๐Ÿชบ'), - ('๐Ÿซ€', '๐Ÿซ…'), - ('๐Ÿซ', '๐Ÿซ™'), - ('๐Ÿซ ', '๐Ÿซง'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿฉฐ', '๐Ÿฉผ'), + ('๐Ÿช€', '๐Ÿชˆ'), + ('๐Ÿช', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿซ…'), + ('๐ŸซŽ', '๐Ÿซ›'), + ('๐Ÿซ ', '๐Ÿซจ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ]; pub const EMOJI_COMPONENT: &'static [(char, char)] = &[ @@ -4602,7 +4625,7 @@ pub const EMOJI_MODIFIER_BASE: &'static [(char, char)] = &[ ('๐Ÿง', '๐Ÿง'), ('๐Ÿง‘', '๐Ÿง'), ('๐Ÿซƒ', '๐Ÿซ…'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ]; pub const EMOJI_PRESENTATION: &'static [(char, char)] = &[ @@ -4672,7 +4695,7 @@ pub const EMOJI_PRESENTATION: &'static [(char, char)] = &[ ('๐Ÿ›Œ', '๐Ÿ›Œ'), ('๐Ÿ›', '๐Ÿ›’'), ('๐Ÿ›•', '๐Ÿ›—'), - ('๐Ÿ›', '๐Ÿ›Ÿ'), + ('๐Ÿ›œ', '๐Ÿ›Ÿ'), ('๐Ÿ›ซ', '๐Ÿ›ฌ'), ('๐Ÿ›ด', '๐Ÿ›ผ'), ('๐ŸŸ ', '๐ŸŸซ'), @@ -4680,15 +4703,13 @@ pub const EMOJI_PRESENTATION: &'static [(char, char)] = &[ ('๐ŸคŒ', '๐Ÿคบ'), ('๐Ÿคผ', '๐Ÿฅ…'), ('๐Ÿฅ‡', '๐Ÿงฟ'), - ('๐Ÿฉฐ', '๐Ÿฉด'), - ('๐Ÿฉธ', '๐Ÿฉผ'), - ('๐Ÿช€', '๐Ÿช†'), - ('๐Ÿช', '๐Ÿชฌ'), - ('๐Ÿชฐ', '๐Ÿชบ'), - ('๐Ÿซ€', '๐Ÿซ…'), - ('๐Ÿซ', '๐Ÿซ™'), - ('๐Ÿซ ', '๐Ÿซง'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿฉฐ', '๐Ÿฉผ'), + ('๐Ÿช€', '๐Ÿชˆ'), + ('๐Ÿช', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿซ…'), + ('๐ŸซŽ', '๐Ÿซ›'), + ('๐Ÿซ ', '๐Ÿซจ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ]; pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ @@ -4759,7 +4780,7 @@ pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ ('๐Ÿ€', '๐Ÿ”ฝ'), ('๐Ÿ•†', '๐Ÿ™'), ('๐Ÿš€', '\u{1f6ff}'), - ('\u{1f774}', '\u{1f77f}'), + ('๐Ÿด', '๐Ÿฟ'), ('๐ŸŸ•', '\u{1f7ff}'), ('\u{1f80c}', '\u{1f80f}'), ('\u{1f848}', '\u{1f84f}'), @@ -4958,7 +4979,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('เณ', 'เณž'), ('เณ ', 'เณก'), ('เณฆ', 'เณฏ'), - ('เณฑ', 'เณฒ'), + ('เณฑ', 'เณณ'), ('เด‚', 'เดŒ'), ('เดŽ', 'เด'), ('เด’', 'เดบ'), @@ -5377,6 +5398,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐‘ˆฒ', '๐‘ˆณ'), ('๐‘ˆต', '๐‘ˆต'), ('๐‘ˆธ', '๐‘ˆฝ'), + ('๐‘ˆฟ', '๐‘‰€'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -5463,6 +5485,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐‘ช—', '๐‘ช—'), ('๐‘ชš', '๐‘ชข'), ('๐‘ชฐ', '๐‘ซธ'), + ('๐‘ฌ€', '๐‘ฌ‰'), ('๐‘ฐ€', '๐‘ฐˆ'), ('๐‘ฐŠ', '๐‘ฐฏ'), ('๐‘ฐพ', '๐‘ฐพ'), @@ -5486,6 +5509,11 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐‘ถ ', '๐‘ถฉ'), ('๐‘ป ', '๐‘ปฒ'), ('๐‘ปต', '๐‘ปธ'), + ('๐‘ผ‚', '๐‘ผ'), + ('๐‘ผ’', '๐‘ผต'), + ('๐‘ผพ', '๐‘ผฟ'), + ('๐‘ฝ', '๐‘ฝ'), + ('๐‘ฝƒ', '๐‘ฝ™'), ('๐‘พฐ', '๐‘พฐ'), ('๐‘ฟ€', '๐‘ฟฑ'), ('๐‘ฟฟ', '๐’Ž™'), @@ -5493,7 +5521,8 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐’‘ฐ', '๐’‘ด'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฒ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -5521,7 +5550,9 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -5541,6 +5572,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐†ฎ', '๐‡ช'), ('๐ˆ€', '๐‰'), ('๐‰…', '๐‰…'), + ('๐‹€', '๐‹“'), ('๐‹ ', '๐‹ณ'), ('๐Œ€', '๐–'), ('๐ ', '๐ธ'), @@ -5570,6 +5602,8 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐ฉถ', '๐ชƒ'), ('๐ช…', '๐ช‹'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐ž„€', '๐ž„ฌ'), ('๐ž„ท', '๐ž„ฝ'), ('๐ž…€', '๐ž…‰'), @@ -5578,6 +5612,8 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐ž‹€', '๐ž‹ซ'), ('๐ž‹ฐ', '๐ž‹น'), ('๐ž‹ฟ', '๐ž‹ฟ'), + ('๐ž“', '๐ž“ซ'), + ('๐ž“ฐ', '๐ž“น'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -5637,10 +5673,10 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐Ÿ‰', '๐Ÿ‰‘'), ('๐Ÿ‰ ', '๐Ÿ‰ฅ'), ('๐ŸŒ€', '๐Ÿ›—'), - ('๐Ÿ›', '๐Ÿ›ฌ'), + ('๐Ÿ›œ', '๐Ÿ›ฌ'), ('๐Ÿ›ฐ', '๐Ÿ›ผ'), - ('๐Ÿœ€', '๐Ÿณ'), - ('๐Ÿž€', '๐ŸŸ˜'), + ('๐Ÿœ€', '๐Ÿถ'), + ('๐Ÿป', '๐ŸŸ™'), ('๐ŸŸ ', '๐ŸŸซ'), ('๐ŸŸฐ', '๐ŸŸฐ'), ('๐Ÿ €', '๐Ÿ ‹'), @@ -5651,25 +5687,24 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('๐Ÿขฐ', '๐Ÿขฑ'), ('๐Ÿค€', '๐Ÿฉ“'), ('๐Ÿฉ ', '๐Ÿฉญ'), - ('๐Ÿฉฐ', '๐Ÿฉด'), - ('๐Ÿฉธ', '๐Ÿฉผ'), - ('๐Ÿช€', '๐Ÿช†'), - ('๐Ÿช', '๐Ÿชฌ'), - ('๐Ÿชฐ', '๐Ÿชบ'), - ('๐Ÿซ€', '๐Ÿซ…'), - ('๐Ÿซ', '๐Ÿซ™'), - ('๐Ÿซ ', '๐Ÿซง'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿฉฐ', '๐Ÿฉผ'), + ('๐Ÿช€', '๐Ÿชˆ'), + ('๐Ÿช', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿซ…'), + ('๐ŸซŽ', '๐Ÿซ›'), + ('๐Ÿซ ', '๐Ÿซจ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ('๐Ÿฌ€', '๐Ÿฎ’'), ('๐Ÿฎ”', '๐ŸฏŠ'), ('๐Ÿฏฐ', '๐Ÿฏน'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ @@ -5775,7 +5810,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{e47}', '\u{e4e}'), ('\u{eb1}', '\u{eb1}'), ('\u{eb4}', '\u{ebc}'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('\u{f18}', '\u{f19}'), ('\u{f35}', '\u{f35}'), ('\u{f37}', '\u{f37}'), @@ -5904,6 +5939,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), @@ -5926,6 +5962,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{11234}', '\u{11234}'), ('\u{11236}', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112df}'), ('\u{112e3}', '\u{112ea}'), ('\u{11300}', '\u{11301}'), @@ -5993,6 +6030,12 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{11d95}', '\u{11d95}'), ('\u{11d97}', '\u{11d97}'), ('\u{11ef3}', '\u{11ef4}'), + ('\u{11f00}', '\u{11f01}'), + ('\u{11f36}', '\u{11f3a}'), + ('\u{11f40}', '\u{11f40}'), + ('\u{11f42}', '\u{11f42}'), + ('\u{13440}', '\u{13440}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), @@ -6019,9 +6062,11 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e130}', '\u{1e136}'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), + ('\u{1e4ec}', '\u{1e4ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), ('\u{e0020}', '\u{e007f}'), @@ -6084,6 +6129,7 @@ pub const GRAPHEME_LINK: &'static [(char, char)] = &[ ('\u{11c3f}', '\u{11c3f}'), ('\u{11d44}', '\u{11d45}'), ('\u{11d97}', '\u{11d97}'), + ('๐‘ฝ', '\u{11f42}'), ]; pub const HEX_DIGIT: &'static [(char, char)] = &[ @@ -6272,7 +6318,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('เณ', 'เณž'), ('เณ ', '\u{ce3}'), ('เณฆ', 'เณฏ'), - ('เณฑ', 'เณฒ'), + ('เณฑ', 'เณณ'), ('\u{d00}', 'เดŒ'), ('เดŽ', 'เด'), ('เด’', '\u{d44}'), @@ -6305,7 +6351,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('เบง', 'เบฝ'), ('เป€', 'เป„'), ('เป†', 'เป†'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('เป', 'เป™'), ('เปœ', 'เปŸ'), ('เผ€', 'เผ€'), @@ -6618,7 +6664,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('๐บ€', '๐บฉ'), ('\u{10eab}', '\u{10eac}'), ('๐บฐ', '๐บฑ'), - ('๐ผ€', '๐ผœ'), + ('\u{10efd}', '๐ผœ'), ('๐ผง', '๐ผง'), ('๐ผฐ', '\u{10f50}'), ('๐ฝฐ', '\u{10f85}'), @@ -6641,7 +6687,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{11237}'), - ('\u{1123e}', '\u{1123e}'), + ('\u{1123e}', '\u{11241}'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -6722,12 +6768,17 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('๐‘ถ“', '๐‘ถ˜'), ('๐‘ถ ', '๐‘ถฉ'), ('๐‘ป ', '๐‘ปถ'), + ('\u{11f00}', '๐‘ผ'), + ('๐‘ผ’', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f42}'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('\u{13440}', '\u{13455}'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -6755,7 +6806,9 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -6809,17 +6862,21 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{1da9b}', '\u{1da9f}'), ('\u{1daa1}', '\u{1daaf}'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), ('๐ž„€', '๐ž„ฌ'), ('\u{1e130}', '๐ž„ฝ'), ('๐ž…€', '๐ž…‰'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '\u{1e2ae}'), ('๐ž‹€', '๐ž‹น'), + ('๐ž“', '๐ž“น'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -6863,12 +6920,13 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('๐žบซ', '๐žบป'), ('๐Ÿฏฐ', '๐Ÿฏน'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ('\u{e0100}', '\u{e01ef}'), ]; @@ -7341,6 +7399,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '๐‘ˆซ'), + ('๐‘ˆฟ', '๐‘‰€'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -7403,12 +7462,16 @@ pub const ID_START: &'static [(char, char)] = &[ ('๐‘ตช', '๐‘ถ‰'), ('๐‘ถ˜', '๐‘ถ˜'), ('๐‘ป ', '๐‘ปฒ'), + ('๐‘ผ‚', '๐‘ผ‚'), + ('๐‘ผ„', '๐‘ผ'), + ('๐‘ผ’', '๐‘ผณ'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -7431,7 +7494,9 @@ pub const ID_START: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -7469,11 +7534,14 @@ pub const ID_START: &'static [(char, char)] = &[ ('๐žช', '๐Ÿ‚'), ('๐Ÿ„', '๐Ÿ‹'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐ž„€', '๐ž„ฌ'), ('๐ž„ท', '๐ž„ฝ'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '๐žŠญ'), ('๐ž‹€', '๐ž‹ซ'), + ('๐ž“', '๐ž“ซ'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -7515,12 +7583,13 @@ pub const ID_START: &'static [(char, char)] = &[ ('๐žบฅ', '๐žบฉ'), ('๐žบซ', '๐žบป'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const IDEOGRAPHIC: &'static [(char, char)] = &[ @@ -7537,12 +7606,13 @@ pub const IDEOGRAPHIC: &'static [(char, char)] = &[ ('๐˜ด€', '๐˜ดˆ'), ('๐›…ฐ', '๐›‹ป'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const JOIN_CONTROL: &'static [(char, char)] = &[('\u{200c}', '\u{200d}')]; @@ -7834,7 +7904,7 @@ pub const LOWERCASE: &'static [(char, char)] = &[ ('ิฏ', 'ิฏ'), ('ี ', 'ึˆ'), ('แƒ', 'แƒบ'), - ('แƒฝ', 'แƒฟ'), + ('แƒผ', 'แƒฟ'), ('แธ', 'แฝ'), ('แฒ€', 'แฒˆ'), ('แด€', 'แถฟ'), @@ -8174,10 +8244,11 @@ pub const LOWERCASE: &'static [(char, char)] = &[ ('๊Ÿ•', '๊Ÿ•'), ('๊Ÿ—', '๊Ÿ—'), ('๊Ÿ™', '๊Ÿ™'), + ('๊Ÿฒ', '๊Ÿด'), ('๊Ÿถ', '๊Ÿถ'), ('๊Ÿธ', '๊Ÿบ'), ('๊ฌฐ', '๊ญš'), - ('๊ญœ', '๊ญจ'), + ('๊ญœ', '๊ญฉ'), ('๊ญฐ', '๊ฎฟ'), ('๏ฌ€', '๏ฌ†'), ('๏ฌ“', '๏ฌ—'), @@ -8225,6 +8296,8 @@ pub const LOWERCASE: &'static [(char, char)] = &[ ('๐Ÿ‹', '๐Ÿ‹'), ('๐ผ€', '๐ผ‰'), ('๐ผ‹', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐žคข', '๐žฅƒ'), ]; @@ -8450,7 +8523,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('เฏ†', 'เฏˆ'), ('เฏŠ', 'เฏŒ'), ('\u{bd7}', '\u{bd7}'), - ('\u{c00}', 'เฐƒ'), + ('\u{c00}', '\u{c04}'), ('\u{c3e}', 'เฑ„'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4c}'), @@ -8462,6 +8535,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('เณŠ', '\u{ccc}'), ('\u{cd5}', '\u{cd6}'), ('\u{ce2}', '\u{ce3}'), + ('เณณ', 'เณณ'), ('\u{d00}', 'เดƒ'), ('\u{d3e}', '\u{d44}'), ('เต†', 'เตˆ'), @@ -8480,7 +8554,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{eb4}', '\u{eb9}'), ('\u{ebb}', '\u{ebc}'), ('\u{ecd}', '\u{ecd}'), - ('\u{f71}', '\u{f81}'), + ('\u{f71}', '\u{f83}'), ('\u{f8d}', '\u{f97}'), ('\u{f99}', '\u{fbc}'), ('แ€ซ', '\u{1036}'), @@ -8553,7 +8627,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('๐‘€€', '๐‘€‚'), ('\u{11038}', '\u{11045}'), ('\u{11073}', '\u{11074}'), - ('๐‘‚‚', '๐‘‚‚'), + ('\u{11080}', '๐‘‚‚'), ('๐‘‚ฐ', '๐‘‚ธ'), ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), @@ -8565,6 +8639,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('๐‘ˆฌ', '\u{11234}'), ('\u{11237}', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112e8}'), ('\u{11300}', '๐‘Œƒ'), ('\u{1133e}', '๐‘„'), @@ -8610,6 +8685,10 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{11d90}', '\u{11d91}'), ('๐‘ถ“', '๐‘ถ–'), ('\u{11ef3}', '๐‘ปถ'), + ('\u{11f00}', '\u{11f01}'), + ('๐‘ผƒ', '๐‘ผƒ'), + ('๐‘ผด', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f40}'), ('\u{16f4f}', '\u{16f4f}'), ('๐–ฝ‘', '๐–พ‡'), ('\u{16f8f}', '\u{16f92}'), @@ -8620,6 +8699,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e947}', '\u{1e947}'), ('๐Ÿ„ฐ', '๐Ÿ…‰'), ('๐Ÿ…', '๐Ÿ…ฉ'), @@ -8682,6 +8762,7 @@ pub const OTHER_LOWERCASE: &'static [(char, char)] = &[ ('ห ', 'หค'), ('\u{345}', '\u{345}'), ('อบ', 'อบ'), + ('แƒผ', 'แƒผ'), ('แดฌ', 'แตช'), ('แตธ', 'แตธ'), ('แถ›', 'แถฟ'), @@ -8693,12 +8774,15 @@ pub const OTHER_LOWERCASE: &'static [(char, char)] = &[ ('โฑผ', 'โฑฝ'), ('๊šœ', '๊š'), ('๊ฐ', '๊ฐ'), + ('๊Ÿฒ', '๊Ÿด'), ('๊Ÿธ', '๊Ÿน'), ('๊ญœ', '๊ญŸ'), + ('๊ญฉ', '๊ญฉ'), ('๐ž€', '๐ž€'), ('๐žƒ', '๐ž…'), ('๐ž‡', '๐žฐ'), ('๐žฒ', '๐žบ'), + ('๐ž€ฐ', '๐žญ'), ]; pub const OTHER_MATH: &'static [(char, char)] = &[ @@ -8984,6 +9068,7 @@ pub const SENTENCE_TERMINAL: &'static [(char, char)] = &[ ('๐‘ช›', '๐‘ชœ'), ('๐‘ฑ', '๐‘ฑ‚'), ('๐‘ปท', '๐‘ปธ'), + ('๐‘ฝƒ', '๐‘ฝ„'), ('๐–ฉฎ', '๐–ฉฏ'), ('๐–ซต', '๐–ซต'), ('๐–ฌท', '๐–ฌธ'), @@ -9026,6 +9111,8 @@ pub const SOFT_DOTTED: &'static [(char, char)] = &[ ('๐™ž', '๐™Ÿ'), ('๐š’', '๐š“'), ('๐ผš', '๐ผš'), + ('๐žŒ', '๐ž'), + ('๐žจ', '๐žจ'), ]; pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ @@ -9128,6 +9215,7 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('๐‘ฑ', '๐‘ฑƒ'), ('๐‘ฑฑ', '๐‘ฑฑ'), ('๐‘ปท', '๐‘ปธ'), + ('๐‘ฝƒ', '๐‘ฝ„'), ('๐’‘ฐ', '๐’‘ด'), ('๐–ฉฎ', '๐–ฉฏ'), ('๐–ซต', '๐–ซต'), @@ -9149,11 +9237,12 @@ pub const UNIFIED_IDEOGRAPH: &'static [(char, char)] = &[ ('๏จฃ', '๏จค'), ('๏จง', '๏จฉ'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const UPPERCASE: &'static [(char, char)] = &[ @@ -9989,7 +10078,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('เณ', 'เณž'), ('เณ ', '\u{ce3}'), ('เณฆ', 'เณฏ'), - ('เณฑ', 'เณฒ'), + ('เณฑ', 'เณณ'), ('\u{d00}', 'เดŒ'), ('เดŽ', 'เด'), ('เด’', '\u{d44}'), @@ -10022,7 +10111,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('เบง', 'เบฝ'), ('เป€', 'เป„'), ('เป†', 'เป†'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('เป', 'เป™'), ('เปœ', 'เปŸ'), ('เผ€', 'เผ€'), @@ -10342,7 +10431,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('๐บ€', '๐บฉ'), ('\u{10eab}', '\u{10eac}'), ('๐บฐ', '๐บฑ'), - ('๐ผ€', '๐ผœ'), + ('\u{10efd}', '๐ผœ'), ('๐ผง', '๐ผง'), ('๐ผฐ', '\u{10f50}'), ('๐ฝฐ', '\u{10f85}'), @@ -10365,7 +10454,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{11237}'), - ('\u{1123e}', '\u{1123e}'), + ('\u{1123e}', '\u{11241}'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -10446,12 +10535,17 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('๐‘ถ“', '๐‘ถ˜'), ('๐‘ถ ', '๐‘ถฉ'), ('๐‘ป ', '๐‘ปถ'), + ('\u{11f00}', '๐‘ผ'), + ('๐‘ผ’', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f42}'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('\u{13440}', '\u{13455}'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -10479,7 +10573,9 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -10533,17 +10629,21 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{1da9b}', '\u{1da9f}'), ('\u{1daa1}', '\u{1daaf}'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), ('๐ž„€', '๐ž„ฌ'), ('\u{1e130}', '๐ž„ฝ'), ('๐ž…€', '๐ž…‰'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '\u{1e2ae}'), ('๐ž‹€', '๐ž‹น'), + ('๐ž“', '๐ž“น'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -10587,12 +10687,13 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('๐žบซ', '๐žบป'), ('๐Ÿฏฐ', '๐Ÿฏน'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ('\u{e0100}', '\u{e01ef}'), ]; @@ -11072,6 +11173,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '๐‘ˆซ'), + ('๐‘ˆฟ', '๐‘‰€'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -11134,12 +11236,16 @@ pub const XID_START: &'static [(char, char)] = &[ ('๐‘ตช', '๐‘ถ‰'), ('๐‘ถ˜', '๐‘ถ˜'), ('๐‘ป ', '๐‘ปฒ'), + ('๐‘ผ‚', '๐‘ผ‚'), + ('๐‘ผ„', '๐‘ผ'), + ('๐‘ผ’', '๐‘ผณ'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -11162,7 +11268,9 @@ pub const XID_START: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -11200,11 +11308,14 @@ pub const XID_START: &'static [(char, char)] = &[ ('๐žช', '๐Ÿ‚'), ('๐Ÿ„', '๐Ÿ‹'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐ž„€', '๐ž„ฌ'), ('๐ž„ท', '๐ž„ฝ'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '๐žŠญ'), ('๐ž‹€', '๐ž‹ซ'), + ('๐ž“', '๐ž“ซ'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -11246,10 +11357,11 @@ pub const XID_START: &'static [(char, char)] = &[ ('๐žบฅ', '๐žบฉ'), ('๐žบซ', '๐žบป'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; diff --git a/regex-syntax/src/unicode_tables/property_names.rs b/regex-syntax/src/unicode_tables/property_names.rs index 3fce1bf03..599a123ae 100644 --- a/regex-syntax/src/unicode_tables/property_names.rs +++ b/regex-syntax/src/unicode_tables/property_names.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-names /tmp/ucd +// ucd-generate property-names ucd-15.0.0 // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const PROPERTY_NAMES: &'static [(&'static str, &'static str)] = &[ ("age", "Age"), diff --git a/regex-syntax/src/unicode_tables/property_values.rs b/regex-syntax/src/unicode_tables/property_values.rs index 08a91477b..cb2d32fb7 100644 --- a/regex-syntax/src/unicode_tables/property_values.rs +++ b/regex-syntax/src/unicode_tables/property_values.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-values /tmp/ucd --include gc,script,scx,age,gcb,wb,sb +// ucd-generate property-values ucd-15.0.0 --include gc,script,scx,age,gcb,wb,sb // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const PROPERTY_VALUES: &'static [( &'static str, @@ -20,6 +20,7 @@ pub const PROPERTY_VALUES: &'static [( ("12.1", "V12_1"), ("13.0", "V13_0"), ("14.0", "V14_0"), + ("15.0", "V15_0"), ("2.0", "V2_0"), ("2.1", "V2_1"), ("3.0", "V3_0"), @@ -46,6 +47,7 @@ pub const PROPERTY_VALUES: &'static [( ("v121", "V12_1"), ("v130", "V13_0"), ("v140", "V14_0"), + ("v150", "V15_0"), ("v20", "V2_0"), ("v21", "V2_1"), ("v30", "V3_0"), @@ -308,6 +310,7 @@ pub const PROPERTY_VALUES: &'static [( ("kannada", "Kannada"), ("katakana", "Katakana"), ("katakanaorhiragana", "Katakana_Or_Hiragana"), + ("kawi", "Kawi"), ("kayahli", "Kayah_Li"), ("khar", "Kharoshthi"), ("kharoshthi", "Kharoshthi"), @@ -372,6 +375,8 @@ pub const PROPERTY_VALUES: &'static [( ("myanmar", "Myanmar"), ("mymr", "Myanmar"), ("nabataean", "Nabataean"), + ("nagm", "Nag_Mundari"), + ("nagmundari", "Nag_Mundari"), ("nand", "Nandinagari"), ("nandinagari", "Nandinagari"), ("narb", "Old_North_Arabian"), @@ -634,6 +639,7 @@ pub const PROPERTY_VALUES: &'static [( ("kannada", "Kannada"), ("katakana", "Katakana"), ("katakanaorhiragana", "Katakana_Or_Hiragana"), + ("kawi", "Kawi"), ("kayahli", "Kayah_Li"), ("khar", "Kharoshthi"), ("kharoshthi", "Kharoshthi"), @@ -698,6 +704,8 @@ pub const PROPERTY_VALUES: &'static [( ("myanmar", "Myanmar"), ("mymr", "Myanmar"), ("nabataean", "Nabataean"), + ("nagm", "Nag_Mundari"), + ("nagmundari", "Nag_Mundari"), ("nand", "Nandinagari"), ("nandinagari", "Nandinagari"), ("narb", "Old_North_Arabian"), diff --git a/regex-syntax/src/unicode_tables/script.rs b/regex-syntax/src/unicode_tables/script.rs index 3327b76ae..cc5c400dd 100644 --- a/regex-syntax/src/unicode_tables/script.rs +++ b/regex-syntax/src/unicode_tables/script.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate script /tmp/ucd --chars +// ucd-generate script ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Adlam", ADLAM), @@ -69,6 +69,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Kaithi", KAITHI), ("Kannada", KANNADA), ("Katakana", KATAKANA), + ("Kawi", KAWI), ("Kayah_Li", KAYAH_LI), ("Kharoshthi", KHAROSHTHI), ("Khitan_Small_Script", KHITAN_SMALL_SCRIPT), @@ -103,6 +104,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Multani", MULTANI), ("Myanmar", MYANMAR), ("Nabataean", NABATAEAN), + ("Nag_Mundari", NAG_MUNDARI), ("Nandinagari", NANDINAGARI), ("New_Tai_Lue", NEW_TAI_LUE), ("Newa", NEWA), @@ -202,6 +204,7 @@ pub const ARABIC: &'static [(char, char)] = &[ ('๏นฐ', '๏นด'), ('๏นถ', '๏ปผ'), ('๐น ', '๐นพ'), + ('\u{10efd}', '\u{10eff}'), ('๐žธ€', '๐žธƒ'), ('๐žธ…', '๐žธŸ'), ('๐žธก', '๐žธข'), @@ -410,6 +413,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('๐†ƒ', '๐†„'), ('๐†Œ', '๐†ฉ'), ('๐†ฎ', '๐‡ช'), + ('๐‹€', '๐‹“'), ('๐‹ ', '๐‹ณ'), ('๐Œ€', '๐–'), ('๐ ', '๐ธ'), @@ -450,10 +454,10 @@ pub const COMMON: &'static [(char, char)] = &[ ('๐Ÿ‰', '๐Ÿ‰‘'), ('๐Ÿ‰ ', '๐Ÿ‰ฅ'), ('๐ŸŒ€', '๐Ÿ›—'), - ('๐Ÿ›', '๐Ÿ›ฌ'), + ('๐Ÿ›œ', '๐Ÿ›ฌ'), ('๐Ÿ›ฐ', '๐Ÿ›ผ'), - ('๐Ÿœ€', '๐Ÿณ'), - ('๐Ÿž€', '๐ŸŸ˜'), + ('๐Ÿœ€', '๐Ÿถ'), + ('๐Ÿป', '๐ŸŸ™'), ('๐ŸŸ ', '๐ŸŸซ'), ('๐ŸŸฐ', '๐ŸŸฐ'), ('๐Ÿ €', '๐Ÿ ‹'), @@ -464,15 +468,13 @@ pub const COMMON: &'static [(char, char)] = &[ ('๐Ÿขฐ', '๐Ÿขฑ'), ('๐Ÿค€', '๐Ÿฉ“'), ('๐Ÿฉ ', '๐Ÿฉญ'), - ('๐Ÿฉฐ', '๐Ÿฉด'), - ('๐Ÿฉธ', '๐Ÿฉผ'), - ('๐Ÿช€', '๐Ÿช†'), - ('๐Ÿช', '๐Ÿชฌ'), - ('๐Ÿชฐ', '๐Ÿชบ'), - ('๐Ÿซ€', '๐Ÿซ…'), - ('๐Ÿซ', '๐Ÿซ™'), - ('๐Ÿซ ', '๐Ÿซง'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿฉฐ', '๐Ÿฉผ'), + ('๐Ÿช€', '๐Ÿชˆ'), + ('๐Ÿช', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿซ…'), + ('๐ŸซŽ', '๐Ÿซ›'), + ('๐Ÿซ ', '๐Ÿซจ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ('๐Ÿฌ€', '๐Ÿฎ’'), ('๐Ÿฎ”', '๐ŸฏŠ'), ('๐Ÿฏฐ', '๐Ÿฏน'), @@ -500,6 +502,8 @@ pub const CYRILLIC: &'static [(char, char)] = &[ ('\u{2de0}', '\u{2dff}'), ('๊™€', '\u{a69f}'), ('\u{fe2e}', '\u{fe2f}'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), ]; pub const DESERET: &'static [(char, char)] = &[('๐€', '๐‘')]; @@ -509,6 +513,7 @@ pub const DEVANAGARI: &'static [(char, char)] = &[ ('\u{955}', '\u{963}'), ('เฅฆ', 'เฅฟ'), ('\u{a8e0}', '\u{a8ff}'), + ('๐‘ฌ€', '๐‘ฌ‰'), ]; pub const DIVES_AKURU: &'static [(char, char)] = &[ @@ -528,7 +533,7 @@ pub const DUPLOYAN: &'static [(char, char)] = &[('๐›ฐ€', '๐›ฑช'), ('๐›ฑฐ', '๐›ฑผ'), ('๐›ฒ€', '๐›ฒˆ'), ('๐›ฒ', '๐›ฒ™'), ('๐›ฒœ', '๐›ฒŸ')]; pub const EGYPTIAN_HIEROGLYPHS: &'static [(char, char)] = - &[('๐“€€', '๐“ฎ'), ('\u{13430}', '\u{13438}')]; + &[('๐“€€', '\u{13455}')]; pub const ELBASAN: &'static [(char, char)] = &[('๐”€', '๐”ง')]; @@ -714,12 +719,13 @@ pub const HAN: &'static [(char, char)] = &[ ('๐–ฟข', '๐–ฟฃ'), ('๐–ฟฐ', '๐–ฟฑ'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const HANGUL: &'static [(char, char)] = &[ @@ -759,8 +765,14 @@ pub const HEBREW: &'static [(char, char)] = &[ ('๏ญ†', '๏ญ'), ]; -pub const HIRAGANA: &'static [(char, char)] = - &[('ใ', 'ใ‚–'), ('ใ‚', 'ใ‚Ÿ'), ('๐›€', '๐›„Ÿ'), ('๐›…', '๐›…’'), ('๐Ÿˆ€', '๐Ÿˆ€')]; +pub const HIRAGANA: &'static [(char, char)] = &[ + ('ใ', 'ใ‚–'), + ('ใ‚', 'ใ‚Ÿ'), + ('๐›€', '๐›„Ÿ'), + ('๐›„ฒ', '๐›„ฒ'), + ('๐›…', '๐›…’'), + ('๐Ÿˆ€', '๐Ÿˆ€'), +]; pub const IMPERIAL_ARAMAIC: &'static [(char, char)] = &[('๐ก€', '๐ก•'), ('๐ก—', '๐กŸ')]; @@ -822,7 +834,7 @@ pub const KANNADA: &'static [(char, char)] = &[ ('เณ', 'เณž'), ('เณ ', '\u{ce3}'), ('เณฆ', 'เณฏ'), - ('เณฑ', 'เณฒ'), + ('เณฑ', 'เณณ'), ]; pub const KATAKANA: &'static [(char, char)] = &[ @@ -838,9 +850,13 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›€€'), ('๐›„ ', '๐›„ข'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ]; +pub const KAWI: &'static [(char, char)] = + &[('\u{11f00}', '๐‘ผ'), ('๐‘ผ’', '\u{11f3a}'), ('๐‘ผพ', '๐‘ฝ™')]; + pub const KAYAH_LI: &'static [(char, char)] = &[('๊ค€', '\u{a92d}'), ('๊คฏ', '๊คฏ')]; pub const KHAROSHTHI: &'static [(char, char)] = &[ @@ -860,7 +876,7 @@ pub const KHITAN_SMALL_SCRIPT: &'static [(char, char)] = pub const KHMER: &'static [(char, char)] = &[('แž€', '\u{17dd}'), ('แŸ ', 'แŸฉ'), ('แŸฐ', 'แŸน'), ('แง ', 'แงฟ')]; -pub const KHOJKI: &'static [(char, char)] = &[('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{1123e}')]; +pub const KHOJKI: &'static [(char, char)] = &[('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{11241}')]; pub const KHUDAWADI: &'static [(char, char)] = &[('๐‘Šฐ', '\u{112ea}'), ('๐‘‹ฐ', '๐‘‹น')]; @@ -874,7 +890,7 @@ pub const LAO: &'static [(char, char)] = &[ ('เบง', 'เบฝ'), ('เป€', 'เป„'), ('เป†', 'เป†'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('เป', 'เป™'), ('เปœ', 'เปŸ'), ]; @@ -918,6 +934,7 @@ pub const LATIN: &'static [(char, char)] = &[ ('๐ž‡', '๐žฐ'), ('๐žฒ', '๐žบ'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), ]; pub const LEPCHA: &'static [(char, char)] = @@ -1013,6 +1030,8 @@ pub const MYANMAR: &'static [(char, char)] = pub const NABATAEAN: &'static [(char, char)] = &[('๐ข€', '๐ขž'), ('๐ขง', '๐ขฏ')]; +pub const NAG_MUNDARI: &'static [(char, char)] = &[('๐ž“', '๐ž“น')]; + pub const NANDINAGARI: &'static [(char, char)] = &[('๐‘ฆ ', '๐‘ฆง'), ('๐‘ฆช', '\u{119d7}'), ('\u{119da}', '๐‘งค')]; diff --git a/regex-syntax/src/unicode_tables/script_extension.rs b/regex-syntax/src/unicode_tables/script_extension.rs index c970e0104..42625e21b 100644 --- a/regex-syntax/src/unicode_tables/script_extension.rs +++ b/regex-syntax/src/unicode_tables/script_extension.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate script-extension /tmp/ucd --chars +// ucd-generate script-extension ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Adlam", ADLAM), @@ -69,6 +69,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Kaithi", KAITHI), ("Kannada", KANNADA), ("Katakana", KATAKANA), + ("Kawi", KAWI), ("Kayah_Li", KAYAH_LI), ("Kharoshthi", KHAROSHTHI), ("Khitan_Small_Script", KHITAN_SMALL_SCRIPT), @@ -103,6 +104,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Multani", MULTANI), ("Myanmar", MYANMAR), ("Nabataean", NABATAEAN), + ("Nag_Mundari", NAG_MUNDARI), ("Nandinagari", NANDINAGARI), ("New_Tai_Lue", NEW_TAI_LUE), ("Newa", NEWA), @@ -196,6 +198,7 @@ pub const ARABIC: &'static [(char, char)] = &[ ('๏นถ', '๏ปผ'), ('\u{102e0}', '๐‹ป'), ('๐น ', '๐นพ'), + ('\u{10efd}', '\u{10eff}'), ('๐žธ€', '๐žธƒ'), ('๐žธ…', '๐žธŸ'), ('๐žธก', '๐žธข'), @@ -404,6 +407,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('๐†ƒ', '๐†„'), ('๐†Œ', '๐†ฉ'), ('๐†ฎ', '๐‡ช'), + ('๐‹€', '๐‹“'), ('๐‹ ', '๐‹ณ'), ('๐Œ€', '๐–'), ('๐ฒ', '๐ธ'), @@ -443,10 +447,10 @@ pub const COMMON: &'static [(char, char)] = &[ ('๐Ÿ‰€', '๐Ÿ‰ˆ'), ('๐Ÿ‰ ', '๐Ÿ‰ฅ'), ('๐ŸŒ€', '๐Ÿ›—'), - ('๐Ÿ›', '๐Ÿ›ฌ'), + ('๐Ÿ›œ', '๐Ÿ›ฌ'), ('๐Ÿ›ฐ', '๐Ÿ›ผ'), - ('๐Ÿœ€', '๐Ÿณ'), - ('๐Ÿž€', '๐ŸŸ˜'), + ('๐Ÿœ€', '๐Ÿถ'), + ('๐Ÿป', '๐ŸŸ™'), ('๐ŸŸ ', '๐ŸŸซ'), ('๐ŸŸฐ', '๐ŸŸฐ'), ('๐Ÿ €', '๐Ÿ ‹'), @@ -457,15 +461,13 @@ pub const COMMON: &'static [(char, char)] = &[ ('๐Ÿขฐ', '๐Ÿขฑ'), ('๐Ÿค€', '๐Ÿฉ“'), ('๐Ÿฉ ', '๐Ÿฉญ'), - ('๐Ÿฉฐ', '๐Ÿฉด'), - ('๐Ÿฉธ', '๐Ÿฉผ'), - ('๐Ÿช€', '๐Ÿช†'), - ('๐Ÿช', '๐Ÿชฌ'), - ('๐Ÿชฐ', '๐Ÿชบ'), - ('๐Ÿซ€', '๐Ÿซ…'), - ('๐Ÿซ', '๐Ÿซ™'), - ('๐Ÿซ ', '๐Ÿซง'), - ('๐Ÿซฐ', '๐Ÿซถ'), + ('๐Ÿฉฐ', '๐Ÿฉผ'), + ('๐Ÿช€', '๐Ÿชˆ'), + ('๐Ÿช', '๐Ÿชฝ'), + ('๐Ÿชฟ', '๐Ÿซ…'), + ('๐ŸซŽ', '๐Ÿซ›'), + ('๐Ÿซ ', '๐Ÿซจ'), + ('๐Ÿซฐ', '๐Ÿซธ'), ('๐Ÿฌ€', '๐Ÿฎ’'), ('๐Ÿฎ”', '๐ŸฏŠ'), ('๐Ÿฏฐ', '๐Ÿฏน'), @@ -503,6 +505,8 @@ pub const CYRILLIC: &'static [(char, char)] = &[ ('โนƒ', 'โนƒ'), ('๊™€', '\u{a69f}'), ('\u{fe2e}', '\u{fe2f}'), + ('๐ž€ฐ', '๐žญ'), + ('\u{1e08f}', '\u{1e08f}'), ]; pub const DESERET: &'static [(char, char)] = &[('๐€', '๐‘')]; @@ -515,6 +519,7 @@ pub const DEVANAGARI: &'static [(char, char)] = &[ ('\u{20f0}', '\u{20f0}'), ('๊ ฐ', '๊ น'), ('\u{a8e0}', '\u{a8ff}'), + ('๐‘ฌ€', '๐‘ฌ‰'), ]; pub const DIVES_AKURU: &'static [(char, char)] = &[ @@ -535,7 +540,7 @@ pub const DUPLOYAN: &'static [(char, char)] = &[('๐›ฐ€', '๐›ฑช'), ('๐›ฑฐ', '๐›ฑผ'), ('๐›ฒ€', '๐›ฒˆ'), ('๐›ฒ', '๐›ฒ™'), ('๐›ฒœ', '\u{1bca3}')]; pub const EGYPTIAN_HIEROGLYPHS: &'static [(char, char)] = - &[('๐“€€', '๐“ฎ'), ('\u{13430}', '\u{13438}')]; + &[('๐“€€', '\u{13455}')]; pub const ELBASAN: &'static [(char, char)] = &[('๐”€', '๐”ง')]; @@ -760,12 +765,13 @@ pub const HAN: &'static [(char, char)] = &[ ('๐ ', '๐ฑ'), ('๐Ÿ‰', '๐Ÿ‰‘'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const HANGUL: &'static [(char, char)] = &[ @@ -834,6 +840,7 @@ pub const HIRAGANA: &'static [(char, char)] = &[ ('๏ฝฐ', '๏ฝฐ'), ('\u{ff9e}', '\u{ff9f}'), ('๐›€', '๐›„Ÿ'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), ('๐Ÿˆ€', '๐Ÿˆ€'), ]; @@ -895,7 +902,7 @@ pub const KANNADA: &'static [(char, char)] = &[ ('เณ', 'เณž'), ('เณ ', '\u{ce3}'), ('เณฆ', 'เณฏ'), - ('เณฑ', 'เณฒ'), + ('เณฑ', 'เณณ'), ('\u{1cd0}', '\u{1cd0}'), ('\u{1cd2}', '\u{1cd2}'), ('\u{1cda}', '\u{1cda}'), @@ -923,9 +930,13 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›€€'), ('๐›„ ', '๐›„ข'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ]; +pub const KAWI: &'static [(char, char)] = + &[('\u{11f00}', '๐‘ผ'), ('๐‘ผ’', '\u{11f3a}'), ('๐‘ผพ', '๐‘ฝ™')]; + pub const KAYAH_LI: &'static [(char, char)] = &[('๊ค€', '๊คฏ')]; pub const KHAROSHTHI: &'static [(char, char)] = &[ @@ -946,7 +957,7 @@ pub const KHMER: &'static [(char, char)] = &[('แž€', '\u{17dd}'), ('แŸ ', 'แŸฉ'), ('แŸฐ', 'แŸน'), ('แง ', 'แงฟ')]; pub const KHOJKI: &'static [(char, char)] = - &[('เซฆ', 'เซฏ'), ('๊ ฐ', '๊ น'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{1123e}')]; + &[('เซฆ', 'เซฏ'), ('๊ ฐ', '๊ น'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '\u{11241}')]; pub const KHUDAWADI: &'static [(char, char)] = &[('เฅค', 'เฅฅ'), ('๊ ฐ', '๊ น'), ('๐‘Šฐ', '\u{112ea}'), ('๐‘‹ฐ', '๐‘‹น')]; @@ -960,7 +971,7 @@ pub const LAO: &'static [(char, char)] = &[ ('เบง', 'เบฝ'), ('เป€', 'เป„'), ('เป†', 'เป†'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('เป', 'เป™'), ('เปœ', 'เปŸ'), ]; @@ -1012,6 +1023,7 @@ pub const LATIN: &'static [(char, char)] = &[ ('๐ž‡', '๐žฐ'), ('๐žฒ', '๐žบ'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), ]; pub const LEPCHA: &'static [(char, char)] = @@ -1124,6 +1136,8 @@ pub const MYANMAR: &'static [(char, char)] = pub const NABATAEAN: &'static [(char, char)] = &[('๐ข€', '๐ขž'), ('๐ขง', '๐ขฏ')]; +pub const NAG_MUNDARI: &'static [(char, char)] = &[('๐ž“', '๐ž“น')]; + pub const NANDINAGARI: &'static [(char, char)] = &[ ('เฅค', 'เฅฅ'), ('เณฆ', 'เณฏ'), diff --git a/regex-syntax/src/unicode_tables/sentence_break.rs b/regex-syntax/src/unicode_tables/sentence_break.rs index db8ad282b..24348736f 100644 --- a/regex-syntax/src/unicode_tables/sentence_break.rs +++ b/regex-syntax/src/unicode_tables/sentence_break.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate sentence-break /tmp/ucd --chars +// ucd-generate sentence-break ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ATerm", ATERM), @@ -157,6 +157,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('เณŠ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), ('\u{ce2}', '\u{ce3}'), + ('เณณ', 'เณณ'), ('\u{d00}', 'เดƒ'), ('\u{d3b}', '\u{d3c}'), ('\u{d3e}', '\u{d44}'), @@ -175,7 +176,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{e47}', '\u{e4e}'), ('\u{eb1}', '\u{eb1}'), ('\u{eb4}', '\u{ebc}'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('\u{f18}', '\u{f19}'), ('\u{f35}', '\u{f35}'), ('\u{f37}', '\u{f37}'), @@ -279,6 +280,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('๐‘€€', '๐‘€‚'), @@ -298,6 +300,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('๐‘‡Ž', '\u{111cf}'), ('๐‘ˆฌ', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112ea}'), ('\u{11300}', '๐‘Œƒ'), ('\u{1133b}', '\u{1133c}'), @@ -345,6 +348,12 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11d90}', '\u{11d91}'), ('๐‘ถ“', '\u{11d97}'), ('\u{11ef3}', '๐‘ปถ'), + ('\u{11f00}', '\u{11f01}'), + ('๐‘ผƒ', '๐‘ผƒ'), + ('๐‘ผด', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f42}'), + ('\u{13440}', '\u{13440}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), @@ -372,9 +381,11 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e130}', '\u{1e136}'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), + ('\u{1e4ec}', '\u{1e4ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), ('\u{e0020}', '\u{e007f}'), @@ -399,7 +410,7 @@ pub const FORMAT: &'static [(char, char)] = &[ ('\u{fff9}', '\u{fffb}'), ('\u{110bd}', '\u{110bd}'), ('\u{110cd}', '\u{110cd}'), - ('\u{13430}', '\u{13438}'), + ('\u{13430}', '\u{1343f}'), ('\u{1bca0}', '\u{1bca3}'), ('\u{1d173}', '\u{1d17a}'), ('\u{e0001}', '\u{e0001}'), @@ -682,6 +693,7 @@ pub const LOWER: &'static [(char, char)] = &[ ('ิญ', 'ิญ'), ('ิฏ', 'ิฏ'), ('ี ', 'ึˆ'), + ('แƒผ', 'แƒผ'), ('แธ', 'แฝ'), ('แฒ€', 'แฒˆ'), ('แด€', 'แถฟ'), @@ -1021,10 +1033,11 @@ pub const LOWER: &'static [(char, char)] = &[ ('๊Ÿ•', '๊Ÿ•'), ('๊Ÿ—', '๊Ÿ—'), ('๊Ÿ™', '๊Ÿ™'), + ('๊Ÿฒ', '๊Ÿด'), ('๊Ÿถ', '๊Ÿถ'), ('๊Ÿธ', '๊Ÿบ'), ('๊ฌฐ', '๊ญš'), - ('๊ญœ', '๊ญจ'), + ('๊ญœ', '๊ญฉ'), ('๊ญฐ', '๊ฎฟ'), ('๏ฌ€', '๏ฌ†'), ('๏ฌ“', '๏ฌ—'), @@ -1072,6 +1085,8 @@ pub const LOWER: &'static [(char, char)] = &[ ('๐Ÿ‹', '๐Ÿ‹'), ('๐ผ€', '๐ผ‰'), ('๐ผ‹', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐žคข', '๐žฅƒ'), ]; @@ -1131,12 +1146,14 @@ pub const NUMERIC: &'static [(char, char)] = &[ ('๐‘ฑ', '๐‘ฑ™'), ('๐‘ต', '๐‘ต™'), ('๐‘ถ ', '๐‘ถฉ'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐–ฉ ', '๐–ฉฉ'), ('๐–ซ€', '๐–ซ‰'), ('๐–ญ', '๐–ญ™'), ('๐ŸŽ', '๐Ÿฟ'), ('๐ž…€', '๐ž…‰'), ('๐ž‹ฐ', '๐ž‹น'), + ('๐ž“ฐ', '๐ž“น'), ('๐žฅ', '๐žฅ™'), ('๐Ÿฏฐ', '๐Ÿฏน'), ]; @@ -1294,7 +1311,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('แต', 'แ‚'), ('แ‚Ž', 'แ‚Ž'), ('แƒ', 'แƒบ'), - ('แƒผ', 'แ‰ˆ'), + ('แƒฝ', 'แ‰ˆ'), ('แ‰Š', 'แ‰'), ('แ‰', 'แ‰–'), ('แ‰˜', 'แ‰˜'), @@ -1390,7 +1407,6 @@ pub const OLETTER: &'static [(char, char)] = &[ ('๊œ—', '๊œŸ'), ('๊žˆ', '๊žˆ'), ('๊ž', '๊ž'), - ('๊Ÿฒ', '๊Ÿด'), ('๊Ÿท', '๊Ÿท'), ('๊Ÿป', '๊ '), ('๊ ƒ', '๊ …'), @@ -1428,7 +1444,6 @@ pub const OLETTER: &'static [(char, char)] = &[ ('๊ฌ‘', '๊ฌ–'), ('๊ฌ ', '๊ฌฆ'), ('๊ฌจ', '๊ฌฎ'), - ('๊ญฉ', '๊ญฉ'), ('๊ฏ€', '๊ฏข'), ('๊ฐ€', 'ํžฃ'), ('ํžฐ', 'ํŸ†'), @@ -1531,6 +1546,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '๐‘ˆซ'), + ('๐‘ˆฟ', '๐‘‰€'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -1592,12 +1608,16 @@ pub const OLETTER: &'static [(char, char)] = &[ ('๐‘ตช', '๐‘ถ‰'), ('๐‘ถ˜', '๐‘ถ˜'), ('๐‘ป ', '๐‘ปฒ'), + ('๐‘ผ‚', '๐‘ผ‚'), + ('๐‘ผ„', '๐‘ผ'), + ('๐‘ผ’', '๐‘ผณ'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -1619,7 +1639,9 @@ pub const OLETTER: &'static [(char, char)] = &[ ('๐šฟต', '๐šฟป'), ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›„ข'), + ('๐›„ฒ', '๐›„ฒ'), ('๐›…', '๐›…’'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ('๐›…ฐ', '๐›‹ป'), ('๐›ฐ€', '๐›ฑช'), @@ -1632,6 +1654,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '๐žŠญ'), ('๐ž‹€', '๐ž‹ซ'), + ('๐ž“', '๐ž“ซ'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -1672,12 +1695,13 @@ pub const OLETTER: &'static [(char, char)] = &[ ('๐žบฅ', '๐žบฉ'), ('๐žบซ', '๐žบป'), ('๐ €€', '๐ช›Ÿ'), - ('๐ชœ€', '๐ซœธ'), + ('๐ชœ€', '๐ซœน'), ('๐ซ€', '๐ซ '), ('๐ซ  ', '๐ฌบก'), ('๐ฌบฐ', '๐ฎฏ '), ('๐ฏ €', '๐ฏจ'), ('๐ฐ€€', '๐ฑŠ'), + ('๐ฑ', '๐ฒŽฏ'), ]; pub const SCONTINUE: &'static [(char, char)] = &[ @@ -1772,6 +1796,7 @@ pub const STERM: &'static [(char, char)] = &[ ('๐‘ช›', '๐‘ชœ'), ('๐‘ฑ', '๐‘ฑ‚'), ('๐‘ปท', '๐‘ปธ'), + ('๐‘ฝƒ', '๐‘ฝ„'), ('๐–ฉฎ', '๐–ฉฏ'), ('๐–ซต', '๐–ซต'), ('๐–ฌท', '๐–ฌธ'), diff --git a/regex-syntax/src/unicode_tables/word_break.rs b/regex-syntax/src/unicode_tables/word_break.rs index 19b2a1c64..c0714956f 100644 --- a/regex-syntax/src/unicode_tables/word_break.rs +++ b/regex-syntax/src/unicode_tables/word_break.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate word-break /tmp/ucd --chars +// ucd-generate word-break ucd-15.0.0 --chars // -// Unicode version: 14.0.0. +// Unicode version: 15.0.0. // -// ucd-generate 0.2.11 is available on crates.io. +// ucd-generate 0.2.14 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ALetter", ALETTER), @@ -434,6 +434,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('๐‘‡œ', '๐‘‡œ'), ('๐‘ˆ€', '๐‘ˆ‘'), ('๐‘ˆ“', '๐‘ˆซ'), + ('๐‘ˆฟ', '๐‘‰€'), ('๐‘Š€', '๐‘Š†'), ('๐‘Šˆ', '๐‘Šˆ'), ('๐‘ŠŠ', '๐‘Š'), @@ -494,12 +495,16 @@ pub const ALETTER: &'static [(char, char)] = &[ ('๐‘ตช', '๐‘ถ‰'), ('๐‘ถ˜', '๐‘ถ˜'), ('๐‘ป ', '๐‘ปฒ'), + ('๐‘ผ‚', '๐‘ผ‚'), + ('๐‘ผ„', '๐‘ผ'), + ('๐‘ผ’', '๐‘ผณ'), ('๐‘พฐ', '๐‘พฐ'), ('๐’€€', '๐’Ž™'), ('๐’€', '๐’‘ฎ'), ('๐’’€', '๐’•ƒ'), ('๐’พ', '๐’ฟฐ'), - ('๐“€€', '๐“ฎ'), + ('๐“€€', '๐“ฏ'), + ('๐“‘', '๐“‘†'), ('๐”€', '๐”™†'), ('๐– €', '๐–จธ'), ('๐–ฉ€', '๐–ฉž'), @@ -550,11 +555,14 @@ pub const ALETTER: &'static [(char, char)] = &[ ('๐žช', '๐Ÿ‚'), ('๐Ÿ„', '๐Ÿ‹'), ('๐ผ€', '๐ผž'), + ('๐ผฅ', '๐ผช'), + ('๐ž€ฐ', '๐žญ'), ('๐ž„€', '๐ž„ฌ'), ('๐ž„ท', '๐ž„ฝ'), ('๐ž…Ž', '๐ž…Ž'), ('๐žŠ', '๐žŠญ'), ('๐ž‹€', '๐ž‹ซ'), + ('๐ž“', '๐ž“ซ'), ('๐žŸ ', '๐žŸฆ'), ('๐žŸจ', '๐žŸซ'), ('๐žŸญ', '๐žŸฎ'), @@ -685,6 +693,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('เณŠ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), ('\u{ce2}', '\u{ce3}'), + ('เณณ', 'เณณ'), ('\u{d00}', 'เดƒ'), ('\u{d3b}', '\u{d3c}'), ('\u{d3e}', '\u{d44}'), @@ -703,7 +712,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{e47}', '\u{e4e}'), ('\u{eb1}', '\u{eb1}'), ('\u{eb4}', '\u{ebc}'), - ('\u{ec8}', '\u{ecd}'), + ('\u{ec8}', '\u{ece}'), ('\u{f18}', '\u{f19}'), ('\u{f35}', '\u{f35}'), ('\u{f37}', '\u{f37}'), @@ -807,6 +816,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10ae5}', '\u{10ae6}'), ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), + ('\u{10efd}', '\u{10eff}'), ('\u{10f46}', '\u{10f50}'), ('\u{10f82}', '\u{10f85}'), ('๐‘€€', '๐‘€‚'), @@ -826,6 +836,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('๐‘‡Ž', '\u{111cf}'), ('๐‘ˆฌ', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), + ('\u{11241}', '\u{11241}'), ('\u{112df}', '\u{112ea}'), ('\u{11300}', '๐‘Œƒ'), ('\u{1133b}', '\u{1133c}'), @@ -873,6 +884,12 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11d90}', '\u{11d91}'), ('๐‘ถ“', '\u{11d97}'), ('\u{11ef3}', '๐‘ปถ'), + ('\u{11f00}', '\u{11f01}'), + ('๐‘ผƒ', '๐‘ผƒ'), + ('๐‘ผด', '\u{11f3a}'), + ('๐‘ผพ', '\u{11f42}'), + ('\u{13440}', '\u{13440}'), + ('\u{13447}', '\u{13455}'), ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f4f}', '\u{16f4f}'), @@ -900,9 +917,11 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1e01b}', '\u{1e021}'), ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), + ('\u{1e08f}', '\u{1e08f}'), ('\u{1e130}', '\u{1e136}'), ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), + ('\u{1e4ec}', '\u{1e4ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), ('๐Ÿป', '๐Ÿฟ'), @@ -937,7 +956,7 @@ pub const FORMAT: &'static [(char, char)] = &[ ('\u{fff9}', '\u{fffb}'), ('\u{110bd}', '\u{110bd}'), ('\u{110cd}', '\u{110cd}'), - ('\u{13430}', '\u{13438}'), + ('\u{13430}', '\u{1343f}'), ('\u{1bca0}', '\u{1bca3}'), ('\u{1d173}', '\u{1d17a}'), ('\u{e0001}', '\u{e0001}'), @@ -970,6 +989,7 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('๐šฟฝ', '๐šฟพ'), ('๐›€€', '๐›€€'), ('๐›„ ', '๐›„ข'), + ('๐›…•', '๐›…•'), ('๐›…ค', '๐›…ง'), ]; @@ -1072,12 +1092,14 @@ pub const NUMERIC: &'static [(char, char)] = &[ ('๐‘ฑ', '๐‘ฑ™'), ('๐‘ต', '๐‘ต™'), ('๐‘ถ ', '๐‘ถฉ'), + ('๐‘ฝ', '๐‘ฝ™'), ('๐–ฉ ', '๐–ฉฉ'), ('๐–ซ€', '๐–ซ‰'), ('๐–ญ', '๐–ญ™'), ('๐ŸŽ', '๐Ÿฟ'), ('๐ž…€', '๐ž…‰'), ('๐ž‹ฐ', '๐ž‹น'), + ('๐ž“ฐ', '๐ž“น'), ('๐žฅ', '๐žฅ™'), ('๐Ÿฏฐ', '๐Ÿฏน'), ];