diff options
Diffstat (limited to 'vendor/regex-automata-0.1.10/data/tests/unicode.toml')
-rw-r--r-- | vendor/regex-automata-0.1.10/data/tests/unicode.toml | 489 |
1 files changed, 489 insertions, 0 deletions
# Regex test fixture: vendor/regex-automata-0.1.10/data/tests/unicode.toml
#
# Each [[tests]] entry gives a `pattern`, an `input` haystack and the expected
# `matches` as [start, end] pairs. The offsets are consistent with end-exclusive
# UTF-8 byte positions (for example, the 3-byte snowman spans 0..3).

# Literal characters outside ASCII, with and without case folding.
[[tests]]
name = "unicode-literal1"
pattern = '☃'
input = "☃"
matches = [[0, 3]]

[[tests]]
name = "unicode-literal2"
pattern = '☃+'
input = "☃"
matches = [[0, 3]]

[[tests]]
name = "unicode-literal3"
options = ["case-insensitive"]
pattern = '☃+'
input = "☃"
matches = [[0, 3]]

# Uppercase delta in the pattern, lowercase delta in the input.
[[tests]]
name = "unicode-literal4"
options = ["case-insensitive"]
pattern = 'Δ'
input = "δ"
matches = [[0, 2]]


# Bracketed classes and short-form \p / \P property classes.
[[tests]]
name = "unicode-class1"
pattern = '[☃Ⅰ]+'
input = "☃"
matches = [[0, 3]]

[[tests]]
name = "unicode-class2"
pattern = '\pN'
input = "Ⅰ"
matches = [[0, 3]]

[[tests]]
name = "unicode-class3"
pattern = '\pN+'
input = "Ⅰ1Ⅱ2"
matches = [[0, 8]]

[[tests]]
name = "unicode-class4"
pattern = '\PN+'
input = "abⅠ"
matches = [[0, 2]]

[[tests]]
name = "unicode-class5"
pattern = '[\PN]+'
input = "abⅠ"
matches = [[0, 2]]

# Double negation: [^\PN] selects the trailing numeral only.
[[tests]]
name = "unicode-class6"
pattern = '[^\PN]+'
input = "abⅠ"
matches = [[2, 5]]

[[tests]]
name = "unicode-class7"
pattern = '\p{Lu}+'
input = "ΛΘΓΔα"
matches = [[0, 8]]

# With case folding enabled, the match extends over the final lowercase alpha.
[[tests]]
name = "unicode-class8"
options = ["case-insensitive"]
pattern = '\p{Lu}+'
input = "ΛΘΓΔα"
matches = [[0, 10]]

[[tests]]
name = "unicode-class9"
pattern = '\pL+'
input = "ΛΘΓΔα"
matches = [[0, 10]]

[[tests]]
name = "unicode-class10"
pattern = '\p{Ll}+'
input = "ΛΘΓΔα"
matches = [[8, 10]]


# Perl-style classes (\w, \W, \d) applied to non-ASCII input.
[[tests]]
name = "unicode-perl1"
pattern = '\w+'
input = "dδd"
matches = [[0, 4]]

[[tests]]
name = "unicode-perl2"
pattern = '\w+'
input = "⥡"
matches = []

[[tests]]
name = "unicode-perl3"
pattern = '\W+'
input = "⥡"
matches = [[0, 3]]

[[tests]]
name = "unicode-perl4"
pattern = '\d+'
input = "1२३9"
matches = [[0, 8]]
# Perl-style classes (\d, \D, \s, \S) applied to non-ASCII input.
# `matches` holds [start, end] pairs consistent with end-exclusive UTF-8 byte
# offsets into `input`.
[[tests]]
name = "unicode-perl5"
pattern = '\d+'
input = "Ⅱ"
matches = []

[[tests]]
name = "unicode-perl6"
pattern = '\D+'
input = "Ⅱ"
matches = [[0, 3]]

# U+1680 OGHAM SPACE MARK. Written as an escape so that whitespace
# normalization cannot collapse it into a 1-byte ASCII space, which would
# contradict the expected 3-byte span.
[[tests]]
name = "unicode-perl7"
pattern = '\s+'
input = "\u1680"
matches = [[0, 3]]

[[tests]]
name = "unicode-perl8"
pattern = '\s+'
input = "☃"
matches = []

[[tests]]
name = "unicode-perl9"
pattern = '\S+'
input = "☃"
matches = [[0, 3]]


# Property classes addressed by long name (mostly General_Category values),
# one sample code point each.

# U+FF21 FULLWIDTH LATIN CAPITAL LETTER A. Escaped so that width folding to
# ASCII "A" (1 byte) cannot invalidate the expected 3-byte span.
[[tests]]
name = "unicode-class-gencat1"
pattern = '\p{Cased_Letter}'
input = "\uFF21"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat2"
pattern = '\p{Close_Punctuation}'
input = "❯"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat3"
pattern = '\p{Connector_Punctuation}'
input = "⁀"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat4"
pattern = '\p{Control}'
input = "\u009F"
matches = [[0, 2]]

# U+FFE1 FULLWIDTH POUND SIGN. Escaped so that width folding to U+00A3
# (2 bytes) cannot invalidate the expected 3-byte span.
[[tests]]
name = "unicode-class-gencat5"
pattern = '\p{Currency_Symbol}'
input = "\uFFE1"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat6"
pattern = '\p{Dash_Punctuation}'
input = "〰"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat7"
pattern = '\p{Decimal_Number}'
input = "𑓙"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat8"
pattern = '\p{Enclosing_Mark}'
input = "\uA672"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat9"
pattern = '\p{Final_Punctuation}'
input = "⸡"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat10"
pattern = '\p{Format}'
input = "\U000E007F"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat11"
pattern = '\p{Initial_Punctuation}'
input = "⸜"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat12"
pattern = '\p{Letter}'
input = "Έ"
matches = [[0, 2]]

[[tests]]
name = "unicode-class-gencat13"
pattern = '\p{Letter_Number}'
input = "ↂ"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat14"
pattern = '\p{Line_Separator}'
input = "\u2028"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat15"
pattern = '\p{Lowercase_Letter}'
input = "ϛ"
matches = [[0, 2]]

[[tests]]
name = "unicode-class-gencat16"
pattern = '\p{Mark}'
input = "\U000E01EF"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat17"
pattern = '\p{Math}'
input = "⋿"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat18"
pattern = '\p{Modifier_Letter}'
input = "𖭃"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat19"
pattern = '\p{Modifier_Symbol}'
input = "🏿"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat20"
pattern = '\p{Nonspacing_Mark}'
input = "\U0001E94A"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat21"
pattern = '\p{Number}'
input = "⓿"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat22"
pattern = '\p{Open_Punctuation}'
input = "⦅"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat23"
pattern = '\p{Other}'
input = "\u0BC9"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat24"
pattern = '\p{Other_Letter}'
input = "ꓷ"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat25"
pattern = '\p{Other_Number}'
input = "㉏"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat26"
pattern = '\p{Other_Punctuation}'
input = "𞥞"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat27"
pattern = '\p{Other_Symbol}'
input = "⅌"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat28"
pattern = '\p{Paragraph_Separator}'
input = "\u2029"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat29"
pattern = '\p{Private_Use}'
input = "\U0010FFFD"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat30"
pattern = '\p{Punctuation}'
input = "𑁍"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat31"
pattern = '\p{Separator}'
input = "\u3000"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat32"
pattern = '\p{Space_Separator}'
input = "\u205F"
matches = [[0, 3]]
# Remaining long-name property classes, one sample code point each.
# `matches` holds [start, end] pairs consistent with end-exclusive UTF-8 byte
# offsets into `input`.
[[tests]]
name = "unicode-class-gencat33"
pattern = '\p{Spacing_Mark}'
input = "\U00016F7E"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat34"
pattern = '\p{Symbol}'
input = "⯈"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat35"
pattern = '\p{Titlecase_Letter}'
input = "ῼ"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gencat36"
pattern = '\p{Unassigned}'
input = "\U0010FFFF"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gencat37"
pattern = '\p{Uppercase_Letter}'
input = "Ꝋ"
matches = [[0, 3]]


# Emoji properties; the property name is spelled in differing letter case.
[[tests]]
name = "unicode-class-emoji1"
pattern = '\p{Emoji}'
input = "\u23E9"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-emoji2"
pattern = '\p{emoji}'
input = "\U0001F21A"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-emoji3"
pattern = '\p{extendedpictographic}'
input = "\U0001FA6E"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-emoji4"
pattern = '\p{extendedpictographic}'
input = "\U0001FFFD"
matches = [[0, 4]]


# Grapheme_Cluster_Break values, via the long name, the `gcb` alias and a
# bare value name.
[[tests]]
name = "unicode-class-gcb1"
pattern = '\p{grapheme_cluster_break=prepend}'
input = "\U00011D46"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gcb2"
pattern = '\p{gcb=regional_indicator}'
input = "\U0001F1E6"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gcb3"
pattern = '\p{gcb=ri}'
input = "\U0001F1E7"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gcb4"
pattern = '\p{regionalindicator}'
input = "\U0001F1FF"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-gcb5"
pattern = '\p{gcb=lvt}'
input = "\uC989"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-gcb6"
pattern = '\p{gcb=zwj}'
input = "\u200D"
matches = [[0, 3]]


# Word_Break values, via the long name and the `wb` alias.
[[tests]]
name = "unicode-class-word-break1"
pattern = '\p{word_break=Hebrew_Letter}'
input = "\uFB46"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-word-break2"
pattern = '\p{wb=hebrewletter}'
input = "\uFB46"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-word-break3"
pattern = '\p{wb=ExtendNumLet}'
input = "\uFF3F"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-word-break4"
pattern = '\p{wb=WSegSpace}'
input = "\u3000"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-word-break5"
pattern = '\p{wb=numeric}'
input = "\U0001E950"
matches = [[0, 4]]


# Sentence_Break values, via the long name and the `sb` alias.
[[tests]]
name = "unicode-class-sentence-break1"
pattern = '\p{sentence_break=Lower}'
input = "\u0469"
matches = [[0, 2]]

[[tests]]
name = "unicode-class-sentence-break2"
pattern = '\p{sb=lower}'
input = "\u0469"
matches = [[0, 2]]

[[tests]]
name = "unicode-class-sentence-break3"
pattern = '\p{sb=Close}'
input = "\uFF60"
matches = [[0, 3]]

[[tests]]
name = "unicode-class-sentence-break4"
pattern = '\p{sb=Close}'
input = "\U0001F677"
matches = [[0, 4]]

[[tests]]
name = "unicode-class-sentence-break5"
pattern = '\p{sb=SContinue}'
input = "\uFF64"
matches = [[0, 3]]