1[[tests]]
2name = "unicode-literal1"
3pattern = '☃'
4input = "☃"
5matches = [[0, 3]]
6
7[[tests]]
8name = "unicode-literal2"
9pattern = '☃+'
10input = "☃"
11matches = [[0, 3]]
12
13[[tests]]
14name = "unicode-literal3"
15options = ["case-insensitive"]
16pattern = '☃+'
17input = "☃"
18matches = [[0, 3]]
19
20[[tests]]
21name = "unicode-literal4"
22options = ["case-insensitive"]
23pattern = 'Δ'
24input = "δ"
25matches = [[0, 2]]
26
27
28[[tests]]
29name = "unicode-class1"
30pattern = '[☃Ⅰ]+'
31input = "☃"
32matches = [[0, 3]]
33
34[[tests]]
35name = "unicode-class2"
36pattern = '\pN'
37input = "Ⅰ"
38matches = [[0, 3]]
39
40[[tests]]
41name = "unicode-class3"
42pattern = '\pN+'
43input = "Ⅰ1Ⅱ2"
44matches = [[0, 8]]
45
46[[tests]]
47name = "unicode-class4"
48pattern = '\PN+'
49input = "abⅠ"
50matches = [[0, 2]]
51
52[[tests]]
53name = "unicode-class5"
54pattern = '[\PN]+'
55input = "abⅠ"
56matches = [[0, 2]]
57
58[[tests]]
59name = "unicode-class6"
60pattern = '[^\PN]+'
61input = "abⅠ"
62matches = [[2, 5]]
63
64[[tests]]
65name = "unicode-class7"
66pattern = '\p{Lu}+'
67input = "ΛΘΓΔα"
68matches = [[0, 8]]
69
70[[tests]]
71name = "unicode-class8"
72options = ["case-insensitive"]
73pattern = '\p{Lu}+'
74input = "ΛΘΓΔα"
75matches = [[0, 10]]
76
77[[tests]]
78name = "unicode-class9"
79pattern = '\pL+'
80input = "ΛΘΓΔα"
81matches = [[0, 10]]
82
83[[tests]]
84name = "unicode-class10"
85pattern = '\p{Ll}+'
86input = "ΛΘΓΔα"
87matches = [[8, 10]]
88
89
90[[tests]]
91name = "unicode-perl1"
92pattern = '\w+'
93input = "dδd"
94matches = [[0, 4]]
95
96[[tests]]
97name = "unicode-perl2"
98pattern = '\w+'
99input = "⥡"
100matches = []
101
102[[tests]]
103name = "unicode-perl3"
104pattern = '\W+'
105input = "⥡"
106matches = [[0, 3]]
107
108[[tests]]
109name = "unicode-perl4"
110pattern = '\d+'
111input = "1२३9"
112matches = [[0, 8]]
113
114[[tests]]
115name = "unicode-perl5"
116pattern = '\d+'
117input = "Ⅱ"
118matches = []
119
120[[tests]]
121name = "unicode-perl6"
122pattern = '\D+'
123input = "Ⅱ"
124matches = [[0, 3]]
125
126[[tests]]
127name = "unicode-perl7"
128pattern = '\s+'
129input = " "
130matches = [[0, 3]]
131
132[[tests]]
133name = "unicode-perl8"
134pattern = '\s+'
135input = "☃"
136matches = []
137
138[[tests]]
139name = "unicode-perl9"
140pattern = '\S+'
141input = "☃"
142matches = [[0, 3]]
143
144
145[[tests]]
146name = "unicode-class-gencat1"
147pattern = '\p{Cased_Letter}'
148input = "A"
149matches = [[0, 3]]
150
151[[tests]]
152name = "unicode-class-gencat2"
153pattern = '\p{Close_Punctuation}'
154input = "❯"
155matches = [[0, 3]]
156
157[[tests]]
158name = "unicode-class-gencat3"
159pattern = '\p{Connector_Punctuation}'
160input = "⁀"
161matches = [[0, 3]]
162
163[[tests]]
164name = "unicode-class-gencat4"
165pattern = '\p{Control}'
166input = "\u009F"
167matches = [[0, 2]]
168
169[[tests]]
170name = "unicode-class-gencat5"
171pattern = '\p{Currency_Symbol}'
172input = "£"
173matches = [[0, 3]]
174
175[[tests]]
176name = "unicode-class-gencat6"
177pattern = '\p{Dash_Punctuation}'
178input = "〰"
179matches = [[0, 3]]
180
181[[tests]]
182name = "unicode-class-gencat7"
183pattern = '\p{Decimal_Number}'
184input = "��"
185matches = [[0, 4]]
186
187[[tests]]
188name = "unicode-class-gencat8"
189pattern = '\p{Enclosing_Mark}'
190input = "\uA672"
191matches = [[0, 3]]
192
193[[tests]]
194name = "unicode-class-gencat9"
195pattern = '\p{Final_Punctuation}'
196input = "⸡"
197matches = [[0, 3]]
198
199[[tests]]
200name = "unicode-class-gencat10"
201pattern = '\p{Format}'
202input = "\U000E007F"
203matches = [[0, 4]]
204
205[[tests]]
206name = "unicode-class-gencat11"
207pattern = '\p{Initial_Punctuation}'
208input = "⸜"
209matches = [[0, 3]]
210
211[[tests]]
212name = "unicode-class-gencat12"
213pattern = '\p{Letter}'
214input = "Έ"
215matches = [[0, 2]]
216
217[[tests]]
218name = "unicode-class-gencat13"
219pattern = '\p{Letter_Number}'
220input = "ↂ"
221matches = [[0, 3]]
222
223[[tests]]
224name = "unicode-class-gencat14"
225pattern = '\p{Line_Separator}'
226input = "\u2028"
227matches = [[0, 3]]
228
229[[tests]]
230name = "unicode-class-gencat15"
231pattern = '\p{Lowercase_Letter}'
232input = "ϛ"
233matches = [[0, 2]]
234
235[[tests]]
236name = "unicode-class-gencat16"
237pattern = '\p{Mark}'
238input = "\U000E01EF"
239matches = [[0, 4]]
240
241[[tests]]
242name = "unicode-class-gencat17"
243pattern = '\p{Math}'
244input = "⋿"
245matches = [[0, 3]]
246
247[[tests]]
248name = "unicode-class-gencat18"
249pattern = '\p{Modifier_Letter}'
250input = "��"
251matches = [[0, 4]]
252
253[[tests]]
254name = "unicode-class-gencat19"
255pattern = '\p{Modifier_Symbol}'
256input = "��"
257matches = [[0, 4]]
258
259[[tests]]
260name = "unicode-class-gencat20"
261pattern = '\p{Nonspacing_Mark}'
262input = "\U0001E94A"
263matches = [[0, 4]]
264
265[[tests]]
266name = "unicode-class-gencat21"
267pattern = '\p{Number}'
268input = "⓿"
269matches = [[0, 3]]
270
271[[tests]]
272name = "unicode-class-gencat22"
273pattern = '\p{Open_Punctuation}'
274input = "⦅"
275matches = [[0, 3]]
276
277[[tests]]
278name = "unicode-class-gencat23"
279pattern = '\p{Other}'
280input = "\u0BC9"
281matches = [[0, 3]]
282
283[[tests]]
284name = "unicode-class-gencat24"
285pattern = '\p{Other_Letter}'
286input = "ꓷ"
287matches = [[0, 3]]
288
289[[tests]]
290name = "unicode-class-gencat25"
291pattern = '\p{Other_Number}'
292input = "㉏"
293matches = [[0, 3]]
294
295[[tests]]
296name = "unicode-class-gencat26"
297pattern = '\p{Other_Punctuation}'
298input = "��"
299matches = [[0, 4]]
300
301[[tests]]
302name = "unicode-class-gencat27"
303pattern = '\p{Other_Symbol}'
304input = "⅌"
305matches = [[0, 3]]
306
307[[tests]]
308name = "unicode-class-gencat28"
309pattern = '\p{Paragraph_Separator}'
310input = "\u2029"
311matches = [[0, 3]]
312
313[[tests]]
314name = "unicode-class-gencat29"
315pattern = '\p{Private_Use}'
316input = "\U0010FFFD"
317matches = [[0, 4]]
318
319[[tests]]
320name = "unicode-class-gencat30"
321pattern = '\p{Punctuation}'
322input = "��"
323matches = [[0, 4]]
324
325[[tests]]
326name = "unicode-class-gencat31"
327pattern = '\p{Separator}'
328input = "\u3000"
329matches = [[0, 3]]
330
331[[tests]]
332name = "unicode-class-gencat32"
333pattern = '\p{Space_Separator}'
334input = "\u205F"
335matches = [[0, 3]]
336
337[[tests]]
338name = "unicode-class-gencat33"
339pattern = '\p{Spacing_Mark}'
340input = "\U00016F7E"
341matches = [[0, 4]]
342
343[[tests]]
344name = "unicode-class-gencat34"
345pattern = '\p{Symbol}'
346input = "⯈"
347matches = [[0, 3]]
348
349[[tests]]
350name = "unicode-class-gencat35"
351pattern = '\p{Titlecase_Letter}'
352input = "ῼ"
353matches = [[0, 3]]
354
355[[tests]]
356name = "unicode-class-gencat36"
357pattern = '\p{Unassigned}'
358input = "\U0010FFFF"
359matches = [[0, 4]]
360
361[[tests]]
362name = "unicode-class-gencat37"
363pattern = '\p{Uppercase_Letter}'
364input = "Ꝋ"
365matches = [[0, 3]]
366
367
368[[tests]]
369name = "unicode-class-emoji1"
370pattern = '\p{Emoji}'
371input = "\u23E9"
372matches = [[0, 3]]
373
374[[tests]]
375name = "unicode-class-emoji2"
376pattern = '\p{emoji}'
377input = "\U0001F21A"
378matches = [[0, 4]]
379
380[[tests]]
381name = "unicode-class-emoji3"
382pattern = '\p{extendedpictographic}'
383input = "\U0001FA6E"
384matches = [[0, 4]]
385
386[[tests]]
387name = "unicode-class-emoji4"
388pattern = '\p{extendedpictographic}'
389input = "\U0001FFFD"
390matches = [[0, 4]]
391
392
393[[tests]]
394name = "unicode-class-gcb1"
395pattern = '\p{grapheme_cluster_break=prepend}'
396input = "\U00011D46"
397matches = [[0, 4]]
398
399[[tests]]
400name = "unicode-class-gcb2"
401pattern = '\p{gcb=regional_indicator}'
402input = "\U0001F1E6"
403matches = [[0, 4]]
404
405[[tests]]
406name = "unicode-class-gcb3"
407pattern = '\p{gcb=ri}'
408input = "\U0001F1E7"
409matches = [[0, 4]]
410
411[[tests]]
412name = "unicode-class-gcb4"
413pattern = '\p{regionalindicator}'
414input = "\U0001F1FF"
415matches = [[0, 4]]
416
417[[tests]]
418name = "unicode-class-gcb5"
419pattern = '\p{gcb=lvt}'
420input = "\uC989"
421matches = [[0, 3]]
422
423[[tests]]
424name = "unicode-class-gcb6"
425pattern = '\p{gcb=zwj}'
426input = "\u200D"
427matches = [[0, 3]]
428
429
430[[tests]]
431name = "unicode-class-word-break1"
432pattern = '\p{word_break=Hebrew_Letter}'
433input = "\uFB46"
434matches = [[0, 3]]
435
436[[tests]]
437name = "unicode-class-word-break2"
438pattern = '\p{wb=hebrewletter}'
439input = "\uFB46"
440matches = [[0, 3]]
441
442[[tests]]
443name = "unicode-class-word-break3"
444pattern = '\p{wb=ExtendNumLet}'
445input = "\uFF3F"
446matches = [[0, 3]]
447
448[[tests]]
449name = "unicode-class-word-break4"
450pattern = '\p{wb=WSegSpace}'
451input = "\u3000"
452matches = [[0, 3]]
453
454[[tests]]
455name = "unicode-class-word-break5"
456pattern = '\p{wb=numeric}'
457input = "\U0001E950"
458matches = [[0, 4]]
459
460
461[[tests]]
462name = "unicode-class-sentence-break1"
463pattern = '\p{sentence_break=Lower}'
464input = "\u0469"
465matches = [[0, 2]]
466
467[[tests]]
468name = "unicode-class-sentence-break2"
469pattern = '\p{sb=lower}'
470input = "\u0469"
471matches = [[0, 2]]
472
473[[tests]]
474name = "unicode-class-sentence-break3"
475pattern = '\p{sb=Close}'
476input = "\uFF60"
477matches = [[0, 3]]
478
479[[tests]]
480name = "unicode-class-sentence-break4"
481pattern = '\p{sb=Close}'
482input = "\U0001F677"
483matches = [[0, 4]]
484
485[[tests]]
486name = "unicode-class-sentence-break5"
487pattern = '\p{sb=SContinue}'
488input = "\uFF64"
489matches = [[0, 3]]
490