diff options
Diffstat (limited to 'vendor/regex-syntax/src/unicode_tables/sentence_break.rs')
-rw-r--r-- | vendor/regex-syntax/src/unicode_tables/sentence_break.rs | 182 |
1 files changed, 119 insertions, 63 deletions
diff --git a/vendor/regex-syntax/src/unicode_tables/sentence_break.rs b/vendor/regex-syntax/src/unicode_tables/sentence_break.rs index 67d830f74..db8ad282b 100644 --- a/vendor/regex-syntax/src/unicode_tables/sentence_break.rs +++ b/vendor/regex-syntax/src/unicode_tables/sentence_break.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate sentence-break ucd-13.0.0 --chars +// ucd-generate sentence-break /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ATerm", ATERM), @@ -29,7 +29,7 @@ pub const ATERM: &'static [(char, char)] = pub const CR: &'static [(char, char)] = &[('\r', '\r')]; pub const CLOSE: &'static [(char, char)] = &[ - ('\"', '\"'), + ('"', '"'), ('\'', ')'), ('[', '['), (']', ']'), @@ -57,6 +57,7 @@ pub const CLOSE: &'static [(char, char)] = &[ ('⸜', '⸝'), ('⸠', '⸩'), ('⹂', '⹂'), + ('⹕', '⹜'), ('〈', '】'), ('〔', '〛'), ('〝', '〟'), @@ -100,7 +101,8 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{825}', '\u{827}'), ('\u{829}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{8e1}'), + ('\u{898}', '\u{89f}'), + ('\u{8ca}', '\u{8e1}'), ('\u{8e3}', 'ः'), ('\u{93a}', '\u{93c}'), ('ा', 'ॏ'), @@ -142,6 +144,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ொ', '\u{bcd}'), ('\u{bd7}', '\u{bd7}'), ('\u{c00}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -193,13 +196,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ႏ', 'ႏ'), ('ႚ', '\u{109d}'), ('\u{135d}', '\u{135f}'), - ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1712}', '᜕'), + ('\u{1732}', '᜴'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), ('\u{1920}', 'ᤫ'), @@ -208,7 +212,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('\u{1a60}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1b00}', 'ᬄ'), ('\u{1b34}', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -221,8 +225,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('᳷', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{200c}', '\u{200d}'), ('\u{20d0}', '\u{20f0}'), ('\u{2cef}', '\u{2cf1}'), @@ -277,10 +280,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '𑂂'), ('𑂰', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{11134}'), ('𑅅', '𑅆'), @@ -288,7 +295,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11180}', '𑆂'), ('𑆳', '𑇀'), ('\u{111c9}', '\u{111cc}'), - ('\u{111ce}', '\u{111cf}'), + ('𑇎', '\u{111cf}'), ('𑈬', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), ('\u{112df}', '\u{112ea}'), @@ -311,11 +318,11 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b7}'), ('\u{1171d}', '\u{1172b}'), ('𑠬', '\u{1183a}'), - ('\u{11930}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('\u{11930}', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{1193e}'), - ('\u{11940}', '\u{11940}'), - ('\u{11942}', '\u{11943}'), + ('𑥀', '𑥀'), + ('𑥂', '\u{11943}'), ('𑧑', '\u{119d7}'), ('\u{119da}', '\u{119e0}'), ('𑧤', '𑧤'), @@ -344,8 +351,10 @@ pub const EXTEND: &'static [(char, char)] = &[ ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), ('\u{16fe4}', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -364,6 +373,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), @@ -377,6 +387,7 @@ pub const FORMAT: &'static [(char, char)] = &[ ('\u{61c}', '\u{61c}'), ('\u{6dd}', '\u{6dd}'), ('\u{70f}', '\u{70f}'), + ('\u{890}', '\u{891}'), ('\u{8e2}', '\u{8e2}'), ('\u{180e}', '\u{180e}'), ('\u{200b}', '\u{200b}'), @@ -833,7 +844,7 @@ pub const LOWER: &'static [(char, char)] = &[ ('ⅰ', 'ⅿ'), ('ↄ', 'ↄ'), ('ⓐ', 'ⓩ'), - ('ⰰ', 'ⱞ'), + ('ⰰ', 'ⱟ'), ('ⱡ', 'ⱡ'), ('ⱥ', 'ⱦ'), ('ⱨ', 'ⱨ'), @@ -1001,19 +1012,33 @@ pub const LOWER: &'static [(char, char)] = &[ ('ꞻ', 'ꞻ'), ('ꞽ', 'ꞽ'), ('ꞿ', 'ꞿ'), + ('ꟁ', 'ꟁ'), ('ꟃ', 'ꟃ'), - ('\u{a7c8}', '\u{a7c8}'), - ('\u{a7ca}', '\u{a7ca}'), - ('\u{a7f6}', '\u{a7f6}'), + ('ꟈ', 'ꟈ'), + ('ꟊ', 'ꟊ'), + ('ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟕ'), + ('ꟗ', 'ꟗ'), + ('ꟙ', 'ꟙ'), + ('ꟶ', 'ꟶ'), ('ꟸ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab68}'), + ('ꭜ', 'ꭨ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), ('a', 'z'), ('𐐨', '𐑏'), ('𐓘', '𐓻'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), + ('𐞀', '𐞀'), + ('𐞃', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐳀', '𐳲'), ('𑣀', '𑣟'), ('𖹠', '𖹿'), @@ -1045,6 +1070,8 @@ pub const LOWER: &'static [(char, char)] = &[ ('𝞪', '𝟂'), ('𝟄', '𝟉'), ('𝟋', '𝟋'), + ('𝼀', '𝼉'), + ('𝼋', '𝼞'), ('𞤢', '𞥃'), ]; @@ -1100,17 +1127,18 @@ pub const NUMERIC: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), + ('𖫀', '𖫉'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), ('𞅀', '𞅉'), ('𞋰', '𞋹'), ('𞥐', '𞥙'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🯰', '🯹'), ]; pub const OLETTER: &'static [(char, char)] = &[ @@ -1146,8 +1174,9 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ࠨ', 'ࠨ'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -1212,6 +1241,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ప', 'హ'), ('ఽ', 'ఽ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('ಀ', 'ಀ'), ('ಅ', 'ಌ'), @@ -1220,10 +1250,10 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ಪ', 'ಳ'), ('ವ', 'ಹ'), ('ಽ', 'ಽ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('\u{d04}', 'ഌ'), + ('ഄ', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -1286,9 +1316,8 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), + ('ᜀ', 'ᜑ'), + ('ᜟ', 'ᜱ'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -1309,7 +1338,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ᨠ', 'ᩔ'), ('ᪧ', 'ᪧ'), ('ᬅ', 'ᬳ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('ᮃ', 'ᮠ'), ('ᮮ', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -1347,11 +1376,10 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘟ'), @@ -1362,6 +1390,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ꜗ', 'ꜟ'), ('ꞈ', 'ꞈ'), ('ꞏ', 'ꞏ'), + ('ꟲ', 'ꟴ'), ('ꟷ', 'ꟷ'), ('ꟻ', 'ꠁ'), ('ꠃ', 'ꠅ'), @@ -1399,7 +1428,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), - ('\u{ab69}', '\u{ab69}'), + ('ꭩ', 'ꭩ'), ('ꯀ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -1449,6 +1478,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞁', '𐞂'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -1477,19 +1507,22 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𐮀', '𐮑'), ('𐰀', '𐱈'), ('𐴀', '𐴣'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀃', '𑀷'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), - ('\u{11147}', '\u{11147}'), + ('𑅇', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -1515,7 +1548,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -1526,14 +1559,15 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑚀', '𑚪'), ('𑚸', '𑚸'), ('𑜀', '𑜚'), + ('𑝀', '𑝆'), ('𑠀', '𑠫'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑦠', '𑦧'), ('𑦪', '𑧐'), ('𑧡', '𑧡'), @@ -1544,7 +1578,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑩐', '𑩐'), ('𑩜', '𑪉'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰮'), ('𑱀', '𑱀'), @@ -1558,14 +1592,16 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭀', '𖭃'), @@ -1577,9 +1613,12 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𖿠', '𖿡'), ('𖿣', '𖿣'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -1587,10 +1626,16 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𛱰', '𛱼'), ('𛲀', '𛲈'), ('𛲐', '𛲙'), + ('𝼊', '𝼊'), ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞥋', '𞥋'), ('𞸀', '𞸃'), @@ -1626,13 +1671,13 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const SCONTINUE: &'static [(char, char)] = &[ @@ -1661,7 +1706,7 @@ pub const STERM: &'static [(char, char)] = &[ ('!', '!'), ('?', '?'), ('։', '։'), - ('؞', '؟'), + ('؝', '؟'), ('۔', '۔'), ('܀', '܂'), ('߹', '߹'), @@ -1680,12 +1725,14 @@ pub const STERM: &'static [(char, char)] = &[ ('᪨', '᪫'), ('᭚', '᭛'), ('᭞', '᭟'), + ('᭽', '᭾'), ('᰻', '᰼'), ('᱾', '᱿'), ('‼', '‽'), ('⁇', '⁉'), ('⸮', '⸮'), ('⸼', '⸼'), + ('⹓', '⹔'), ('。', '。'), ('꓿', '꓿'), ('꘎', '꘏'), @@ -1704,6 +1751,7 @@ pub const STERM: &'static [(char, char)] = &[ ('。', '。'), ('𐩖', '𐩗'), ('𐽕', '𐽙'), + ('𐾆', '𐾉'), ('𑁇', '𑁈'), ('𑂾', '𑃁'), ('𑅁', '𑅃'), @@ -1718,8 +1766,8 @@ pub const STERM: &'static [(char, char)] = &[ ('𑗉', '𑗗'), ('𑙁', '𑙂'), ('𑜼', '𑜾'), - ('\u{11944}', '\u{11944}'), - ('\u{11946}', '\u{11946}'), + ('𑥄', '𑥄'), + ('𑥆', '𑥆'), ('𑩂', '𑩃'), ('𑪛', '𑪜'), ('𑱁', '𑱂'), @@ -2183,7 +2231,7 @@ pub const UPPER: &'static [(char, char)] = &[ ('Ⅰ', 'Ⅿ'), ('Ↄ', 'Ↄ'), ('Ⓐ', 'Ⓩ'), - ('Ⰰ', 'Ⱞ'), + ('Ⰰ', 'Ⱟ'), ('Ⱡ', 'Ⱡ'), ('Ɫ', 'Ɽ'), ('Ⱨ', 'Ⱨ'), @@ -2348,13 +2396,21 @@ pub const UPPER: &'static [(char, char)] = &[ ('Ꞻ', 'Ꞻ'), ('Ꞽ', 'Ꞽ'), ('Ꞿ', 'Ꞿ'), + ('Ꟁ', 'Ꟁ'), ('Ꟃ', 'Ꟃ'), - ('Ꞔ', '\u{a7c7}'), - ('\u{a7c9}', '\u{a7c9}'), - ('\u{a7f5}', '\u{a7f5}'), + ('Ꞔ', 'Ꟈ'), + ('Ꟊ', 'Ꟊ'), + ('Ꟑ', 'Ꟑ'), + ('Ꟗ', 'Ꟗ'), + ('Ꟙ', 'Ꟙ'), + ('Ꟶ', 'Ꟶ'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), ('𐲀', '𐲲'), ('𑢠', '𑢿'), ('𖹀', '𖹟'), |