summaryrefslogtreecommitdiffstats
path: root/vendor/regex-syntax/src/unicode_tables/property_values.rs
blob: cb2d32fb707d24db0d0149d6d5eb8b0133726394 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
// DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY:
//
//   ucd-generate property-values ucd-15.0.0 --include gc,script,scx,age,gcb,wb,sb
//
// Unicode version: 15.0.0.
//
// ucd-generate 0.2.14 is available on crates.io.

pub const PROPERTY_VALUES: &'static [(
    &'static str,
    &'static [(&'static str, &'static str)],
)] = &[
    (
        "Age",
        &[
            ("1.1", "V1_1"),
            ("10.0", "V10_0"),
            ("11.0", "V11_0"),
            ("12.0", "V12_0"),
            ("12.1", "V12_1"),
            ("13.0", "V13_0"),
            ("14.0", "V14_0"),
            ("15.0", "V15_0"),
            ("2.0", "V2_0"),
            ("2.1", "V2_1"),
            ("3.0", "V3_0"),
            ("3.1", "V3_1"),
            ("3.2", "V3_2"),
            ("4.0", "V4_0"),
            ("4.1", "V4_1"),
            ("5.0", "V5_0"),
            ("5.1", "V5_1"),
            ("5.2", "V5_2"),
            ("6.0", "V6_0"),
            ("6.1", "V6_1"),
            ("6.2", "V6_2"),
            ("6.3", "V6_3"),
            ("7.0", "V7_0"),
            ("8.0", "V8_0"),
            ("9.0", "V9_0"),
            ("na", "Unassigned"),
            ("unassigned", "Unassigned"),
            ("v100", "V10_0"),
            ("v11", "V1_1"),
            ("v110", "V11_0"),
            ("v120", "V12_0"),
            ("v121", "V12_1"),
            ("v130", "V13_0"),
            ("v140", "V14_0"),
            ("v150", "V15_0"),
            ("v20", "V2_0"),
            ("v21", "V2_1"),
            ("v30", "V3_0"),
            ("v31", "V3_1"),
            ("v32", "V3_2"),
            ("v40", "V4_0"),
            ("v41", "V4_1"),
            ("v50", "V5_0"),
            ("v51", "V5_1"),
            ("v52", "V5_2"),
            ("v60", "V6_0"),
            ("v61", "V6_1"),
            ("v62", "V6_2"),
            ("v63", "V6_3"),
            ("v70", "V7_0"),
            ("v80", "V8_0"),
            ("v90", "V9_0"),
        ],
    ),
    (
        "General_Category",
        &[
            ("c", "Other"),
            ("casedletter", "Cased_Letter"),
            ("cc", "Control"),
            ("cf", "Format"),
            ("closepunctuation", "Close_Punctuation"),
            ("cn", "Unassigned"),
            ("cntrl", "Control"),
            ("co", "Private_Use"),
            ("combiningmark", "Mark"),
            ("connectorpunctuation", "Connector_Punctuation"),
            ("control", "Control"),
            ("cs", "Surrogate"),
            ("currencysymbol", "Currency_Symbol"),
            ("dashpunctuation", "Dash_Punctuation"),
            ("decimalnumber", "Decimal_Number"),
            ("digit", "Decimal_Number"),
            ("enclosingmark", "Enclosing_Mark"),
            ("finalpunctuation", "Final_Punctuation"),
            ("format", "Format"),
            ("initialpunctuation", "Initial_Punctuation"),
            ("l", "Letter"),
            ("lc", "Cased_Letter"),
            ("letter", "Letter"),
            ("letternumber", "Letter_Number"),
            ("lineseparator", "Line_Separator"),
            ("ll", "Lowercase_Letter"),
            ("lm", "Modifier_Letter"),
            ("lo", "Other_Letter"),
            ("lowercaseletter", "Lowercase_Letter"),
            ("lt", "Titlecase_Letter"),
            ("lu", "Uppercase_Letter"),
            ("m", "Mark"),
            ("mark", "Mark"),
            ("mathsymbol", "Math_Symbol"),
            ("mc", "Spacing_Mark"),
            ("me", "Enclosing_Mark"),
            ("mn", "Nonspacing_Mark"),
            ("modifierletter", "Modifier_Letter"),
            ("modifiersymbol", "Modifier_Symbol"),
            ("n", "Number"),
            ("nd", "Decimal_Number"),
            ("nl", "Letter_Number"),
            ("no", "Other_Number"),
            ("nonspacingmark", "Nonspacing_Mark"),
            ("number", "Number"),
            ("openpunctuation", "Open_Punctuation"),
            ("other", "Other"),
            ("otherletter", "Other_Letter"),
            ("othernumber", "Other_Number"),
            ("otherpunctuation", "Other_Punctuation"),
            ("othersymbol", "Other_Symbol"),
            ("p", "Punctuation"),
            ("paragraphseparator", "Paragraph_Separator"),
            ("pc", "Connector_Punctuation"),
            ("pd", "Dash_Punctuation"),
            ("pe", "Close_Punctuation"),
            ("pf", "Final_Punctuation"),
            ("pi", "Initial_Punctuation"),
            ("po", "Other_Punctuation"),
            ("privateuse", "Private_Use"),
            ("ps", "Open_Punctuation"),
            ("punct", "Punctuation"),
            ("punctuation", "Punctuation"),
            ("s", "Symbol"),
            ("sc", "Currency_Symbol"),
            ("separator", "Separator"),
            ("sk", "Modifier_Symbol"),
            ("sm", "Math_Symbol"),
            ("so", "Other_Symbol"),
            ("spaceseparator", "Space_Separator"),
            ("spacingmark", "Spacing_Mark"),
            ("surrogate", "Surrogate"),
            ("symbol", "Symbol"),
            ("titlecaseletter", "Titlecase_Letter"),
            ("unassigned", "Unassigned"),
            ("uppercaseletter", "Uppercase_Letter"),
            ("z", "Separator"),
            ("zl", "Line_Separator"),
            ("zp", "Paragraph_Separator"),
            ("zs", "Space_Separator"),
        ],
    ),
    (
        "Grapheme_Cluster_Break",
        &[
            ("cn", "Control"),
            ("control", "Control"),
            ("cr", "CR"),
            ("eb", "E_Base"),
            ("ebase", "E_Base"),
            ("ebasegaz", "E_Base_GAZ"),
            ("ebg", "E_Base_GAZ"),
            ("em", "E_Modifier"),
            ("emodifier", "E_Modifier"),
            ("ex", "Extend"),
            ("extend", "Extend"),
            ("gaz", "Glue_After_Zwj"),
            ("glueafterzwj", "Glue_After_Zwj"),
            ("l", "L"),
            ("lf", "LF"),
            ("lv", "LV"),
            ("lvt", "LVT"),
            ("other", "Other"),
            ("pp", "Prepend"),
            ("prepend", "Prepend"),
            ("regionalindicator", "Regional_Indicator"),
            ("ri", "Regional_Indicator"),
            ("sm", "SpacingMark"),
            ("spacingmark", "SpacingMark"),
            ("t", "T"),
            ("v", "V"),
            ("xx", "Other"),
            ("zwj", "ZWJ"),
        ],
    ),
    (
        "Script",
        &[
            ("adlam", "Adlam"),
            ("adlm", "Adlam"),
            ("aghb", "Caucasian_Albanian"),
            ("ahom", "Ahom"),
            ("anatolianhieroglyphs", "Anatolian_Hieroglyphs"),
            ("arab", "Arabic"),
            ("arabic", "Arabic"),
            ("armenian", "Armenian"),
            ("armi", "Imperial_Aramaic"),
            ("armn", "Armenian"),
            ("avestan", "Avestan"),
            ("avst", "Avestan"),
            ("bali", "Balinese"),
            ("balinese", "Balinese"),
            ("bamu", "Bamum"),
            ("bamum", "Bamum"),
            ("bass", "Bassa_Vah"),
            ("bassavah", "Bassa_Vah"),
            ("batak", "Batak"),
            ("batk", "Batak"),
            ("beng", "Bengali"),
            ("bengali", "Bengali"),
            ("bhaiksuki", "Bhaiksuki"),
            ("bhks", "Bhaiksuki"),
            ("bopo", "Bopomofo"),
            ("bopomofo", "Bopomofo"),
            ("brah", "Brahmi"),
            ("brahmi", "Brahmi"),
            ("brai", "Braille"),
            ("braille", "Braille"),
            ("bugi", "Buginese"),
            ("buginese", "Buginese"),
            ("buhd", "Buhid"),
            ("buhid", "Buhid"),
            ("cakm", "Chakma"),
            ("canadianaboriginal", "Canadian_Aboriginal"),
            ("cans", "Canadian_Aboriginal"),
            ("cari", "Carian"),
            ("carian", "Carian"),
            ("caucasianalbanian", "Caucasian_Albanian"),
            ("chakma", "Chakma"),
            ("cham", "Cham"),
            ("cher", "Cherokee"),
            ("cherokee", "Cherokee"),
            ("chorasmian", "Chorasmian"),
            ("chrs", "Chorasmian"),
            ("common", "Common"),
            ("copt", "Coptic"),
            ("coptic", "Coptic"),
            ("cpmn", "Cypro_Minoan"),
            ("cprt", "Cypriot"),
            ("cuneiform", "Cuneiform"),
            ("cypriot", "Cypriot"),
            ("cyprominoan", "Cypro_Minoan"),
            ("cyrillic", "Cyrillic"),
            ("cyrl", "Cyrillic"),
            ("deseret", "Deseret"),
            ("deva", "Devanagari"),
            ("devanagari", "Devanagari"),
            ("diak", "Dives_Akuru"),
            ("divesakuru", "Dives_Akuru"),
            ("dogr", "Dogra"),
            ("dogra", "Dogra"),
            ("dsrt", "Deseret"),
            ("dupl", "Duployan"),
            ("duployan", "Duployan"),
            ("egyp", "Egyptian_Hieroglyphs"),
            ("egyptianhieroglyphs", "Egyptian_Hieroglyphs"),
            ("elba", "Elbasan"),
            ("elbasan", "Elbasan"),
            ("elym", "Elymaic"),
            ("elymaic", "Elymaic"),
            ("ethi", "Ethiopic"),
            ("ethiopic", "Ethiopic"),
            ("geor", "Georgian"),
            ("georgian", "Georgian"),
            ("glag", "Glagolitic"),
            ("glagolitic", "Glagolitic"),
            ("gong", "Gunjala_Gondi"),
            ("gonm", "Masaram_Gondi"),
            ("goth", "Gothic"),
            ("gothic", "Gothic"),
            ("gran", "Grantha"),
            ("grantha", "Grantha"),
            ("greek", "Greek"),
            ("grek", "Greek"),
            ("gujarati", "Gujarati"),
            ("gujr", "Gujarati"),
            ("gunjalagondi", "Gunjala_Gondi"),
            ("gurmukhi", "Gurmukhi"),
            ("guru", "Gurmukhi"),
            ("han", "Han"),
            ("hang", "Hangul"),
            ("hangul", "Hangul"),
            ("hani", "Han"),
            ("hanifirohingya", "Hanifi_Rohingya"),
            ("hano", "Hanunoo"),
            ("hanunoo", "Hanunoo"),
            ("hatr", "Hatran"),
            ("hatran", "Hatran"),
            ("hebr", "Hebrew"),
            ("hebrew", "Hebrew"),
            ("hira", "Hiragana"),
            ("hiragana", "Hiragana"),
            ("hluw", "Anatolian_Hieroglyphs"),
            ("hmng", "Pahawh_Hmong"),
            ("hmnp", "Nyiakeng_Puachue_Hmong"),
            ("hrkt", "Katakana_Or_Hiragana"),
            ("hung", "Old_Hungarian"),
            ("imperialaramaic", "Imperial_Aramaic"),
            ("inherited", "Inherited"),
            ("inscriptionalpahlavi", "Inscriptional_Pahlavi"),
            ("inscriptionalparthian", "Inscriptional_Parthian"),
            ("ital", "Old_Italic"),
            ("java", "Javanese"),
            ("javanese", "Javanese"),
            ("kaithi", "Kaithi"),
            ("kali", "Kayah_Li"),
            ("kana", "Katakana"),
            ("kannada", "Kannada"),
            ("katakana", "Katakana"),
            ("katakanaorhiragana", "Katakana_Or_Hiragana"),
            ("kawi", "Kawi"),
            ("kayahli", "Kayah_Li"),
            ("khar", "Kharoshthi"),
            ("kharoshthi", "Kharoshthi"),
            ("khitansmallscript", "Khitan_Small_Script"),
            ("khmer", "Khmer"),
            ("khmr", "Khmer"),
            ("khoj", "Khojki"),
            ("khojki", "Khojki"),
            ("khudawadi", "Khudawadi"),
            ("kits", "Khitan_Small_Script"),
            ("knda", "Kannada"),
            ("kthi", "Kaithi"),
            ("lana", "Tai_Tham"),
            ("lao", "Lao"),
            ("laoo", "Lao"),
            ("latin", "Latin"),
            ("latn", "Latin"),
            ("lepc", "Lepcha"),
            ("lepcha", "Lepcha"),
            ("limb", "Limbu"),
            ("limbu", "Limbu"),
            ("lina", "Linear_A"),
            ("linb", "Linear_B"),
            ("lineara", "Linear_A"),
            ("linearb", "Linear_B"),
            ("lisu", "Lisu"),
            ("lyci", "Lycian"),
            ("lycian", "Lycian"),
            ("lydi", "Lydian"),
            ("lydian", "Lydian"),
            ("mahajani", "Mahajani"),
            ("mahj", "Mahajani"),
            ("maka", "Makasar"),
            ("makasar", "Makasar"),
            ("malayalam", "Malayalam"),
            ("mand", "Mandaic"),
            ("mandaic", "Mandaic"),
            ("mani", "Manichaean"),
            ("manichaean", "Manichaean"),
            ("marc", "Marchen"),
            ("marchen", "Marchen"),
            ("masaramgondi", "Masaram_Gondi"),
            ("medefaidrin", "Medefaidrin"),
            ("medf", "Medefaidrin"),
            ("meeteimayek", "Meetei_Mayek"),
            ("mend", "Mende_Kikakui"),
            ("mendekikakui", "Mende_Kikakui"),
            ("merc", "Meroitic_Cursive"),
            ("mero", "Meroitic_Hieroglyphs"),
            ("meroiticcursive", "Meroitic_Cursive"),
            ("meroitichieroglyphs", "Meroitic_Hieroglyphs"),
            ("miao", "Miao"),
            ("mlym", "Malayalam"),
            ("modi", "Modi"),
            ("mong", "Mongolian"),
            ("mongolian", "Mongolian"),
            ("mro", "Mro"),
            ("mroo", "Mro"),
            ("mtei", "Meetei_Mayek"),
            ("mult", "Multani"),
            ("multani", "Multani"),
            ("myanmar", "Myanmar"),
            ("mymr", "Myanmar"),
            ("nabataean", "Nabataean"),
            ("nagm", "Nag_Mundari"),
            ("nagmundari", "Nag_Mundari"),
            ("nand", "Nandinagari"),
            ("nandinagari", "Nandinagari"),
            ("narb", "Old_North_Arabian"),
            ("nbat", "Nabataean"),
            ("newa", "Newa"),
            ("newtailue", "New_Tai_Lue"),
            ("nko", "Nko"),
            ("nkoo", "Nko"),
            ("nshu", "Nushu"),
            ("nushu", "Nushu"),
            ("nyiakengpuachuehmong", "Nyiakeng_Puachue_Hmong"),
            ("ogam", "Ogham"),
            ("ogham", "Ogham"),
            ("olchiki", "Ol_Chiki"),
            ("olck", "Ol_Chiki"),
            ("oldhungarian", "Old_Hungarian"),
            ("olditalic", "Old_Italic"),
            ("oldnortharabian", "Old_North_Arabian"),
            ("oldpermic", "Old_Permic"),
            ("oldpersian", "Old_Persian"),
            ("oldsogdian", "Old_Sogdian"),
            ("oldsoutharabian", "Old_South_Arabian"),
            ("oldturkic", "Old_Turkic"),
            ("olduyghur", "Old_Uyghur"),
            ("oriya", "Oriya"),
            ("orkh", "Old_Turkic"),
            ("orya", "Oriya"),
            ("osage", "Osage"),
            ("osge", "Osage"),
            ("osma", "Osmanya"),
            ("osmanya", "Osmanya"),
            ("ougr", "Old_Uyghur"),
            ("pahawhhmong", "Pahawh_Hmong"),
            ("palm", "Palmyrene"),
            ("palmyrene", "Palmyrene"),
            ("pauc", "Pau_Cin_Hau"),
            ("paucinhau", "Pau_Cin_Hau"),
            ("perm", "Old_Permic"),
            ("phag", "Phags_Pa"),
            ("phagspa", "Phags_Pa"),
            ("phli", "Inscriptional_Pahlavi"),
            ("phlp", "Psalter_Pahlavi"),
            ("phnx", "Phoenician"),
            ("phoenician", "Phoenician"),
            ("plrd", "Miao"),
            ("prti", "Inscriptional_Parthian"),
            ("psalterpahlavi", "Psalter_Pahlavi"),
            ("qaac", "Coptic"),
            ("qaai", "Inherited"),
            ("rejang", "Rejang"),
            ("rjng", "Rejang"),
            ("rohg", "Hanifi_Rohingya"),
            ("runic", "Runic"),
            ("runr", "Runic"),
            ("samaritan", "Samaritan"),
            ("samr", "Samaritan"),
            ("sarb", "Old_South_Arabian"),
            ("saur", "Saurashtra"),
            ("saurashtra", "Saurashtra"),
            ("sgnw", "SignWriting"),
            ("sharada", "Sharada"),
            ("shavian", "Shavian"),
            ("shaw", "Shavian"),
            ("shrd", "Sharada"),
            ("sidd", "Siddham"),
            ("siddham", "Siddham"),
            ("signwriting", "SignWriting"),
            ("sind", "Khudawadi"),
            ("sinh", "Sinhala"),
            ("sinhala", "Sinhala"),
            ("sogd", "Sogdian"),
            ("sogdian", "Sogdian"),
            ("sogo", "Old_Sogdian"),
            ("sora", "Sora_Sompeng"),
            ("sorasompeng", "Sora_Sompeng"),
            ("soyo", "Soyombo"),
            ("soyombo", "Soyombo"),
            ("sund", "Sundanese"),
            ("sundanese", "Sundanese"),
            ("sylo", "Syloti_Nagri"),
            ("sylotinagri", "Syloti_Nagri"),
            ("syrc", "Syriac"),
            ("syriac", "Syriac"),
            ("tagalog", "Tagalog"),
            ("tagb", "Tagbanwa"),
            ("tagbanwa", "Tagbanwa"),
            ("taile", "Tai_Le"),
            ("taitham", "Tai_Tham"),
            ("taiviet", "Tai_Viet"),
            ("takr", "Takri"),
            ("takri", "Takri"),
            ("tale", "Tai_Le"),
            ("talu", "New_Tai_Lue"),
            ("tamil", "Tamil"),
            ("taml", "Tamil"),
            ("tang", "Tangut"),
            ("tangsa", "Tangsa"),
            ("tangut", "Tangut"),
            ("tavt", "Tai_Viet"),
            ("telu", "Telugu"),
            ("telugu", "Telugu"),
            ("tfng", "Tifinagh"),
            ("tglg", "Tagalog"),
            ("thaa", "Thaana"),
            ("thaana", "Thaana"),
            ("thai", "Thai"),
            ("tibetan", "Tibetan"),
            ("tibt", "Tibetan"),
            ("tifinagh", "Tifinagh"),
            ("tirh", "Tirhuta"),
            ("tirhuta", "Tirhuta"),
            ("tnsa", "Tangsa"),
            ("toto", "Toto"),
            ("ugar", "Ugaritic"),
            ("ugaritic", "Ugaritic"),
            ("unknown", "Unknown"),
            ("vai", "Vai"),
            ("vaii", "Vai"),
            ("vith", "Vithkuqi"),
            ("vithkuqi", "Vithkuqi"),
            ("wancho", "Wancho"),
            ("wara", "Warang_Citi"),
            ("warangciti", "Warang_Citi"),
            ("wcho", "Wancho"),
            ("xpeo", "Old_Persian"),
            ("xsux", "Cuneiform"),
            ("yezi", "Yezidi"),
            ("yezidi", "Yezidi"),
            ("yi", "Yi"),
            ("yiii", "Yi"),
            ("zanabazarsquare", "Zanabazar_Square"),
            ("zanb", "Zanabazar_Square"),
            ("zinh", "Inherited"),
            ("zyyy", "Common"),
            ("zzzz", "Unknown"),
        ],
    ),
    (
        "Script_Extensions",
        &[
            ("adlam", "Adlam"),
            ("adlm", "Adlam"),
            ("aghb", "Caucasian_Albanian"),
            ("ahom", "Ahom"),
            ("anatolianhieroglyphs", "Anatolian_Hieroglyphs"),
            ("arab", "Arabic"),
            ("arabic", "Arabic"),
            ("armenian", "Armenian"),
            ("armi", "Imperial_Aramaic"),
            ("armn", "Armenian"),
            ("avestan", "Avestan"),
            ("avst", "Avestan"),
            ("bali", "Balinese"),
            ("balinese", "Balinese"),
            ("bamu", "Bamum"),
            ("bamum", "Bamum"),
            ("bass", "Bassa_Vah"),
            ("bassavah", "Bassa_Vah"),
            ("batak", "Batak"),
            ("batk", "Batak"),
            ("beng", "Bengali"),
            ("bengali", "Bengali"),
            ("bhaiksuki", "Bhaiksuki"),
            ("bhks", "Bhaiksuki"),
            ("bopo", "Bopomofo"),
            ("bopomofo", "Bopomofo"),
            ("brah", "Brahmi"),
            ("brahmi", "Brahmi"),
            ("brai", "Braille"),
            ("braille", "Braille"),
            ("bugi", "Buginese"),
            ("buginese", "Buginese"),
            ("buhd", "Buhid"),
            ("buhid", "Buhid"),
            ("cakm", "Chakma"),
            ("canadianaboriginal", "Canadian_Aboriginal"),
            ("cans", "Canadian_Aboriginal"),
            ("cari", "Carian"),
            ("carian", "Carian"),
            ("caucasianalbanian", "Caucasian_Albanian"),
            ("chakma", "Chakma"),
            ("cham", "Cham"),
            ("cher", "Cherokee"),
            ("cherokee", "Cherokee"),
            ("chorasmian", "Chorasmian"),
            ("chrs", "Chorasmian"),
            ("common", "Common"),
            ("copt", "Coptic"),
            ("coptic", "Coptic"),
            ("cpmn", "Cypro_Minoan"),
            ("cprt", "Cypriot"),
            ("cuneiform", "Cuneiform"),
            ("cypriot", "Cypriot"),
            ("cyprominoan", "Cypro_Minoan"),
            ("cyrillic", "Cyrillic"),
            ("cyrl", "Cyrillic"),
            ("deseret", "Deseret"),
            ("deva", "Devanagari"),
            ("devanagari", "Devanagari"),
            ("diak", "Dives_Akuru"),
            ("divesakuru", "Dives_Akuru"),
            ("dogr", "Dogra"),
            ("dogra", "Dogra"),
            ("dsrt", "Deseret"),
            ("dupl", "Duployan"),
            ("duployan", "Duployan"),
            ("egyp", "Egyptian_Hieroglyphs"),
            ("egyptianhieroglyphs", "Egyptian_Hieroglyphs"),
            ("elba", "Elbasan"),
            ("elbasan", "Elbasan"),
            ("elym", "Elymaic"),
            ("elymaic", "Elymaic"),
            ("ethi", "Ethiopic"),
            ("ethiopic", "Ethiopic"),
            ("geor", "Georgian"),
            ("georgian", "Georgian"),
            ("glag", "Glagolitic"),
            ("glagolitic", "Glagolitic"),
            ("gong", "Gunjala_Gondi"),
            ("gonm", "Masaram_Gondi"),
            ("goth", "Gothic"),
            ("gothic", "Gothic"),
            ("gran", "Grantha"),
            ("grantha", "Grantha"),
            ("greek", "Greek"),
            ("grek", "Greek"),
            ("gujarati", "Gujarati"),
            ("gujr", "Gujarati"),
            ("gunjalagondi", "Gunjala_Gondi"),
            ("gurmukhi", "Gurmukhi"),
            ("guru", "Gurmukhi"),
            ("han", "Han"),
            ("hang", "Hangul"),
            ("hangul", "Hangul"),
            ("hani", "Han"),
            ("hanifirohingya", "Hanifi_Rohingya"),
            ("hano", "Hanunoo"),
            ("hanunoo", "Hanunoo"),
            ("hatr", "Hatran"),
            ("hatran", "Hatran"),
            ("hebr", "Hebrew"),
            ("hebrew", "Hebrew"),
            ("hira", "Hiragana"),
            ("hiragana", "Hiragana"),
            ("hluw", "Anatolian_Hieroglyphs"),
            ("hmng", "Pahawh_Hmong"),
            ("hmnp", "Nyiakeng_Puachue_Hmong"),
            ("hrkt", "Katakana_Or_Hiragana"),
            ("hung", "Old_Hungarian"),
            ("imperialaramaic", "Imperial_Aramaic"),
            ("inherited", "Inherited"),
            ("inscriptionalpahlavi", "Inscriptional_Pahlavi"),
            ("inscriptionalparthian", "Inscriptional_Parthian"),
            ("ital", "Old_Italic"),
            ("java", "Javanese"),
            ("javanese", "Javanese"),
            ("kaithi", "Kaithi"),
            ("kali", "Kayah_Li"),
            ("kana", "Katakana"),
            ("kannada", "Kannada"),
            ("katakana", "Katakana"),
            ("katakanaorhiragana", "Katakana_Or_Hiragana"),
            ("kawi", "Kawi"),
            ("kayahli", "Kayah_Li"),
            ("khar", "Kharoshthi"),
            ("kharoshthi", "Kharoshthi"),
            ("khitansmallscript", "Khitan_Small_Script"),
            ("khmer", "Khmer"),
            ("khmr", "Khmer"),
            ("khoj", "Khojki"),
            ("khojki", "Khojki"),
            ("khudawadi", "Khudawadi"),
            ("kits", "Khitan_Small_Script"),
            ("knda", "Kannada"),
            ("kthi", "Kaithi"),
            ("lana", "Tai_Tham"),
            ("lao", "Lao"),
            ("laoo", "Lao"),
            ("latin", "Latin"),
            ("latn", "Latin"),
            ("lepc", "Lepcha"),
            ("lepcha", "Lepcha"),
            ("limb", "Limbu"),
            ("limbu", "Limbu"),
            ("lina", "Linear_A"),
            ("linb", "Linear_B"),
            ("lineara", "Linear_A"),
            ("linearb", "Linear_B"),
            ("lisu", "Lisu"),
            ("lyci", "Lycian"),
            ("lycian", "Lycian"),
            ("lydi", "Lydian"),
            ("lydian", "Lydian"),
            ("mahajani", "Mahajani"),
            ("mahj", "Mahajani"),
            ("maka", "Makasar"),
            ("makasar", "Makasar"),
            ("malayalam", "Malayalam"),
            ("mand", "Mandaic"),
            ("mandaic", "Mandaic"),
            ("mani", "Manichaean"),
            ("manichaean", "Manichaean"),
            ("marc", "Marchen"),
            ("marchen", "Marchen"),
            ("masaramgondi", "Masaram_Gondi"),
            ("medefaidrin", "Medefaidrin"),
            ("medf", "Medefaidrin"),
            ("meeteimayek", "Meetei_Mayek"),
            ("mend", "Mende_Kikakui"),
            ("mendekikakui", "Mende_Kikakui"),
            ("merc", "Meroitic_Cursive"),
            ("mero", "Meroitic_Hieroglyphs"),
            ("meroiticcursive", "Meroitic_Cursive"),
            ("meroitichieroglyphs", "Meroitic_Hieroglyphs"),
            ("miao", "Miao"),
            ("mlym", "Malayalam"),
            ("modi", "Modi"),
            ("mong", "Mongolian"),
            ("mongolian", "Mongolian"),
            ("mro", "Mro"),
            ("mroo", "Mro"),
            ("mtei", "Meetei_Mayek"),
            ("mult", "Multani"),
            ("multani", "Multani"),
            ("myanmar", "Myanmar"),
            ("mymr", "Myanmar"),
            ("nabataean", "Nabataean"),
            ("nagm", "Nag_Mundari"),
            ("nagmundari", "Nag_Mundari"),
            ("nand", "Nandinagari"),
            ("nandinagari", "Nandinagari"),
            ("narb", "Old_North_Arabian"),
            ("nbat", "Nabataean"),
            ("newa", "Newa"),
            ("newtailue", "New_Tai_Lue"),
            ("nko", "Nko"),
            ("nkoo", "Nko"),
            ("nshu", "Nushu"),
            ("nushu", "Nushu"),
            ("nyiakengpuachuehmong", "Nyiakeng_Puachue_Hmong"),
            ("ogam", "Ogham"),
            ("ogham", "Ogham"),
            ("olchiki", "Ol_Chiki"),
            ("olck", "Ol_Chiki"),
            ("oldhungarian", "Old_Hungarian"),
            ("olditalic", "Old_Italic"),
            ("oldnortharabian", "Old_North_Arabian"),
            ("oldpermic", "Old_Permic"),
            ("oldpersian", "Old_Persian"),
            ("oldsogdian", "Old_Sogdian"),
            ("oldsoutharabian", "Old_South_Arabian"),
            ("oldturkic", "Old_Turkic"),
            ("olduyghur", "Old_Uyghur"),
            ("oriya", "Oriya"),
            ("orkh", "Old_Turkic"),
            ("orya", "Oriya"),
            ("osage", "Osage"),
            ("osge", "Osage"),
            ("osma", "Osmanya"),
            ("osmanya", "Osmanya"),
            ("ougr", "Old_Uyghur"),
            ("pahawhhmong", "Pahawh_Hmong"),
            ("palm", "Palmyrene"),
            ("palmyrene", "Palmyrene"),
            ("pauc", "Pau_Cin_Hau"),
            ("paucinhau", "Pau_Cin_Hau"),
            ("perm", "Old_Permic"),
            ("phag", "Phags_Pa"),
            ("phagspa", "Phags_Pa"),
            ("phli", "Inscriptional_Pahlavi"),
            ("phlp", "Psalter_Pahlavi"),
            ("phnx", "Phoenician"),
            ("phoenician", "Phoenician"),
            ("plrd", "Miao"),
            ("prti", "Inscriptional_Parthian"),
            ("psalterpahlavi", "Psalter_Pahlavi"),
            ("qaac", "Coptic"),
            ("qaai", "Inherited"),
            ("rejang", "Rejang"),
            ("rjng", "Rejang"),
            ("rohg", "Hanifi_Rohingya"),
            ("runic", "Runic"),
            ("runr", "Runic"),
            ("samaritan", "Samaritan"),
            ("samr", "Samaritan"),
            ("sarb", "Old_South_Arabian"),
            ("saur", "Saurashtra"),
            ("saurashtra", "Saurashtra"),
            ("sgnw", "SignWriting"),
            ("sharada", "Sharada"),
            ("shavian", "Shavian"),
            ("shaw", "Shavian"),
            ("shrd", "Sharada"),
            ("sidd", "Siddham"),
            ("siddham", "Siddham"),
            ("signwriting", "SignWriting"),
            ("sind", "Khudawadi"),
            ("sinh", "Sinhala"),
            ("sinhala", "Sinhala"),
            ("sogd", "Sogdian"),
            ("sogdian", "Sogdian"),
            ("sogo", "Old_Sogdian"),
            ("sora", "Sora_Sompeng"),
            ("sorasompeng", "Sora_Sompeng"),
            ("soyo", "Soyombo"),
            ("soyombo", "Soyombo"),
            ("sund", "Sundanese"),
            ("sundanese", "Sundanese"),
            ("sylo", "Syloti_Nagri"),
            ("sylotinagri", "Syloti_Nagri"),
            ("syrc", "Syriac"),
            ("syriac", "Syriac"),
            ("tagalog", "Tagalog"),
            ("tagb", "Tagbanwa"),
            ("tagbanwa", "Tagbanwa"),
            ("taile", "Tai_Le"),
            ("taitham", "Tai_Tham"),
            ("taiviet", "Tai_Viet"),
            ("takr", "Takri"),
            ("takri", "Takri"),
            ("tale", "Tai_Le"),
            ("talu", "New_Tai_Lue"),
            ("tamil", "Tamil"),
            ("taml", "Tamil"),
            ("tang", "Tangut"),
            ("tangsa", "Tangsa"),
            ("tangut", "Tangut"),
            ("tavt", "Tai_Viet"),
            ("telu", "Telugu"),
            ("telugu", "Telugu"),
            ("tfng", "Tifinagh"),
            ("tglg", "Tagalog"),
            ("thaa", "Thaana"),
            ("thaana", "Thaana"),
            ("thai", "Thai"),
            ("tibetan", "Tibetan"),
            ("tibt", "Tibetan"),
            ("tifinagh", "Tifinagh"),
            ("tirh", "Tirhuta"),
            ("tirhuta", "Tirhuta"),
            ("tnsa", "Tangsa"),
            ("toto", "Toto"),
            ("ugar", "Ugaritic"),
            ("ugaritic", "Ugaritic"),
            ("unknown", "Unknown"),
            ("vai", "Vai"),
            ("vaii", "Vai"),
            ("vith", "Vithkuqi"),
            ("vithkuqi", "Vithkuqi"),
            ("wancho", "Wancho"),
            ("wara", "Warang_Citi"),
            ("warangciti", "Warang_Citi"),
            ("wcho", "Wancho"),
            ("xpeo", "Old_Persian"),
            ("xsux", "Cuneiform"),
            ("yezi", "Yezidi"),
            ("yezidi", "Yezidi"),
            ("yi", "Yi"),
            ("yiii", "Yi"),
            ("zanabazarsquare", "Zanabazar_Square"),
            ("zanb", "Zanabazar_Square"),
            ("zinh", "Inherited"),
            ("zyyy", "Common"),
            ("zzzz", "Unknown"),
        ],
    ),
    (
        "Sentence_Break",
        &[
            ("at", "ATerm"),
            ("aterm", "ATerm"),
            ("cl", "Close"),
            ("close", "Close"),
            ("cr", "CR"),
            ("ex", "Extend"),
            ("extend", "Extend"),
            ("fo", "Format"),
            ("format", "Format"),
            ("le", "OLetter"),
            ("lf", "LF"),
            ("lo", "Lower"),
            ("lower", "Lower"),
            ("nu", "Numeric"),
            ("numeric", "Numeric"),
            ("oletter", "OLetter"),
            ("other", "Other"),
            ("sc", "SContinue"),
            ("scontinue", "SContinue"),
            ("se", "Sep"),
            ("sep", "Sep"),
            ("sp", "Sp"),
            ("st", "STerm"),
            ("sterm", "STerm"),
            ("up", "Upper"),
            ("upper", "Upper"),
            ("xx", "Other"),
        ],
    ),
    (
        "Word_Break",
        &[
            ("aletter", "ALetter"),
            ("cr", "CR"),
            ("doublequote", "Double_Quote"),
            ("dq", "Double_Quote"),
            ("eb", "E_Base"),
            ("ebase", "E_Base"),
            ("ebasegaz", "E_Base_GAZ"),
            ("ebg", "E_Base_GAZ"),
            ("em", "E_Modifier"),
            ("emodifier", "E_Modifier"),
            ("ex", "ExtendNumLet"),
            ("extend", "Extend"),
            ("extendnumlet", "ExtendNumLet"),
            ("fo", "Format"),
            ("format", "Format"),
            ("gaz", "Glue_After_Zwj"),
            ("glueafterzwj", "Glue_After_Zwj"),
            ("hebrewletter", "Hebrew_Letter"),
            ("hl", "Hebrew_Letter"),
            ("ka", "Katakana"),
            ("katakana", "Katakana"),
            ("le", "ALetter"),
            ("lf", "LF"),
            ("mb", "MidNumLet"),
            ("midletter", "MidLetter"),
            ("midnum", "MidNum"),
            ("midnumlet", "MidNumLet"),
            ("ml", "MidLetter"),
            ("mn", "MidNum"),
            ("newline", "Newline"),
            ("nl", "Newline"),
            ("nu", "Numeric"),
            ("numeric", "Numeric"),
            ("other", "Other"),
            ("regionalindicator", "Regional_Indicator"),
            ("ri", "Regional_Indicator"),
            ("singlequote", "Single_Quote"),
            ("sq", "Single_Quote"),
            ("wsegspace", "WSegSpace"),
            ("xx", "Other"),
            ("zwj", "ZWJ"),
        ],
    ),
];