Lines Matching +full:0 +full:a
5 /* PCRE is a library of functions to support regular expressions whose syntax
29 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
48 #define PCRE2_CODE_UNIT_WIDTH 0
53 \xe6\x92\xad = 0x64ad = 25773 (kanji)
55 \xc2\xa1 = 0xa1 = (Inverted Exclamation Mark)
56 \xf3\xa9\xb7\x80 = 0xe9dc0 = 957888
57 \xed\xa0\x80 = 55296 = 0xd800 (Invalid UTF character)
58 \xed\xb0\x80 = 56320 = 0xdc00 (Invalid UTF character)
60 \xc2\x85 = 0x85 = 133 (Next Line = NEL)
61 \xe2\x80\xa8 = 0x2028 = 8232 (Line Separator)
63 \xc3\xa9 = 0xe9 = 233 (e')
64 \xc3\x89 = 0xc9 = 201 (E')
65 \xc3\xa1 = 0xe1 = 225 (a')
66 \xc3\x81 = 0xc1 = 193 (A')
67 \x53 = 0x53 = S
68 \x73 = 0x73 = s
69 \xc5\xbf = 0x17f = 383 (long S)
70 \xc8\xba = 0x23a = 570
71 \xe2\xb1\xa5 = 0x2c65 = 11365
72 \xe1\xbd\xb8 = 0x1f78 = 8056
73 \xe1\xbf\xb8 = 0x1ff8 = 8184
74 \xf0\x90\x90\x80 = 0x10400 = 66560
75 \xf0\x90\x90\xa8 = 0x10428 = 66600
76 \xc7\x84 = 0x1c4 = 452
77 \xc7\x85 = 0x1c5 = 453
78 \xc7\x86 = 0x1c6 = 454
81 ucp_Coptic - \x{2c80}-\x{2ce3} -> caseless: XOR 0x1
85 \xcc\x8d = 0x30d = 781
87 \xc2\x80 = 0x80 = 128 (lowest 2 byte character)
88 \xdf\xbf = 0x7ff = 2047 (highest 2 byte character)
89 \xe0\xa0\x80 = 0x800 = 2048 (lowest 3 byte character)
90 \xef\xbf\xbf = 0xffff = 65535 (highest 3 byte character)
91 \xf0\x90\x80\x80 = 0x10000 = 65536 (lowest 4 byte character)
92 \xf4\x8f\xbf\xbf = 0x10ffff = 1114111 (highest allowed utf character)
102 int jit = 0; in main()
136 #define A PCRE2_NEWLINE_ANYCRLF macro
138 #define GET_NEWLINE(x) ((x) & 0xffff)
141 #define OFFSET_MASK 0x00ffff
142 #define F_NO8 0x010000
143 #define F_NO16 0x020000
144 #define F_NO32 0x020000
145 #define F_NOMATCH 0x040000
146 #define F_DIFF 0x080000
147 #define F_FORCECONV 0x100000
148 #define F_PROPERTY 0x200000
161 { MU, A, 0, 0, "AbC", "AbAbC" },
162 { MU, A, 0, 0, "ACCEPT", "AACACCACCEACCEPACCEPTACCEPTT" },
163 { CMU, A, 0, 0, "aA#\xc3\xa9\xc3\x81", "aA#Aa#\xc3\x89\xc3\xa1" },
164 { M, A, 0, 0, "[^a]", "aAbB" },
165 { CM, A, 0, 0, "[^m]", "mMnN" },
166 { M, A, 0, 0, "a[^b][^#]", "abacd" },
167 { CM, A, 0, 0, "A[^B][^E]", "abacd" },
168 { CMU, A, 0, 0, "[^x][^#]", "XxBll" },
169 { MU, A, 0, 0, "[^a]", "aaa\xc3\xa1#Ab" },
170 { CMU, A, 0, 0, "[^A]", "aA\xe6\x92\xad" },
171 { MU, A, 0, 0, "\\W(\\W)?\\w", "\r\n+bc" },
172 { MU, A, 0, 0, "\\W(\\W)?\\w", "\n\r+bc" },
173 { MU, A, 0, 0, "\\W(\\W)?\\w", "\r\r+bc" },
174 { MU, A, 0, 0, "\\W(\\W)?\\w", "\n\n+bc" },
175 { MU, A, 0, 0, "[axd]", "sAXd" },
176 { CMU, A, 0, 0, "[axd]", "sAXd" },
177 { CMU, A, 0, 0 | F_NOMATCH, "[^axd]", "DxA" },
178 { MU, A, 0, 0, "[a-dA-C]", "\xe6\x92\xad\xc3\xa9.B" },
179 { MU, A, 0, 0, "[^a-dA-C]", "\xe6\x92\xad\xc3\xa9" },
180 { CMU, A, 0, 0, "[^\xc3\xa9]", "\xc3\xa9\xc3\x89." },
181 { MU, A, 0, 0, "[^\xc3\xa9]", "\xc3\xa9\xc3\x89." },
182 { MU, A, 0, 0, "[^a]", "\xc2\x80[]" },
183 { CMU, A, 0, 0, "\xf0\x90\x90\xa7", "\xf0\x90\x91\x8f" },
184 { CM, A, 0, 0, "1a2b3c4", "1a2B3c51A2B3C4" },
185 { PCRE2_CASELESS, 0, 0, 0, "\xff#a", "\xff#\xff\xfe##\xff#A" },
186 { PCRE2_CASELESS, 0, 0, 0, "\xfe", "\xff\xfc#\xfe\xfe" },
187 { PCRE2_CASELESS, 0, 0, 0, "a1", "Aa1" },
189 { M, A, 0, 0, "\\Ca", "cda" },
190 { CM, A, 0, 0, "\\Ca", "CDA" },
191 { M, A, 0, 0 | F_NOMATCH, "\\Cx", "cda" },
192 { CM, A, 0, 0 | F_NOMATCH, "\\Cx", "CDA" },
194 { CMUP, A, 0, 0, "\xf0\x90\x90\x80\xf0\x90\x90\xa8", "\xf0\x90\x90\xa8\xf0\x90\x90\x80" },
195 { CMUP, A, 0, 0, "\xf0\x90\x90\x80{2}", "\xf0\x90\x90\x80#\xf0\x90\x90\xa8\xf0\x90\x90\x80" },
196 { CMUP, A, 0, 0, "\xf0\x90\x90\xa8{2}", "\xf0\x90\x90\x80#\xf0\x90\x90\xa8\xf0\x90\x90\x80" },
197 { CMUP, A, 0, 0, "\xe1\xbd\xb8\xe1\xbf\xb8", "\xe1\xbf\xb8\xe1\xbd\xb8" },
198 { M, A, 0, 0, "[3-57-9]", "5" },
199 …{ PCRE2_AUTO_CALLOUT, A, 0, 0, "123456789012345678901234567890123456789012345678901234567890123456…
203 { MU, A, 0, 0, "\\b[^A]", "A_B#" },
204 { M, A, 0, 0 | F_NOMATCH, "\\b\\W", "\n*" },
205 { MU, A, 0, 0, "\\B[^,]\\b[^s]\\b", "#X" },
206 { MP, A, 0, 0, "\\B", "_\xa1" },
207 { MP, A, 0, 0 | F_PROPERTY, "\\b_\\b[,A]\\B", "_," },
208 { MUP, A, 0, 0, "\\b", "\xe6\x92\xad!" },
209 { MUP, A, 0, 0, "\\B", "_\xc2\xa1\xc3\xa1\xc2\x85" },
210 { MUP, A, 0, 0, "\\b[^A]\\B[^c]\\b[^_]\\B", "_\xc3\xa1\xe2\x80\xa8" },
211 { MUP, A, 0, 0, "\\b\\w+\\B", "\xc3\x89\xc2\xa1\xe6\x92\xad\xc3\x81\xc3\xa1" },
212 { MU, A, 0, 0 | F_NOMATCH, "\\b.", "\xcd\xbe" },
213 { CMUP, A, 0, 0, "\\By", "\xf0\x90\x90\xa8y" },
214 { M, A, 0, 0 | F_NOMATCH, "\\R^", "\n" },
215 { M, A, 0, 1 | F_NOMATCH, "^", "\n" },
216 { 0, 0, 0, 0, "^ab", "ab" },
217 { 0, 0, 0, 0 | F_NOMATCH, "^ab", "aab" },
218 { M, PCRE2_NEWLINE_CRLF, 0, 0, "^a", "\r\raa\n\naa\r\naa" },
219 { MU, A, 0, 0, "^-", "\xe2\x80\xa8--\xc2\x85-\r\n-" },
220 { M, PCRE2_NEWLINE_ANY, 0, 0, "^-", "a--b--\x85--" },
221 { MU, PCRE2_NEWLINE_ANY, 0, 0, "^-", "a--\xe2\x80\xa8--" },
222 { MU, PCRE2_NEWLINE_ANY, 0, 0, "^-", "a--\xc2\x85--" },
223 { 0, 0, 0, 0, "ab$", "ab" },
224 { 0, 0, 0, 0 | F_NOMATCH, "ab$", "abab\n\n" },
225 { PCRE2_DOLLAR_ENDONLY, 0, 0, 0 | F_NOMATCH, "ab$", "abab\r\n" },
226 { M, PCRE2_NEWLINE_CRLF, 0, 0, "a$", "\r\raa\n\naa\r\naa" },
227 { M, PCRE2_NEWLINE_ANY, 0, 0, "a$", "aaa" },
228 { MU, PCRE2_NEWLINE_ANYCRLF, 0, 0, "#$", "#\xc2\x85###\r#" },
229 { MU, PCRE2_NEWLINE_ANY, 0, 0, "#$", "#\xe2\x80\xa9" },
230 { 0, PCRE2_NEWLINE_ANY, PCRE2_NOTBOL, 0 | F_NOMATCH, "^a", "aa\naa" },
231 { M, PCRE2_NEWLINE_ANY, PCRE2_NOTBOL, 0, "^a", "aa\naa" },
232 { 0, PCRE2_NEWLINE_ANY, PCRE2_NOTEOL, 0 | F_NOMATCH, "a$", "aa\naa" },
233 { 0, PCRE2_NEWLINE_ANY, PCRE2_NOTEOL, 0 | F_NOMATCH, "a$", "aa\r\n" },
234 { U | PCRE2_DOLLAR_ENDONLY, PCRE2_NEWLINE_ANY, 0, 0 | F_PROPERTY, "\\p{Any}{2,}$", "aa\r\n" },
235 { M, PCRE2_NEWLINE_ANY, PCRE2_NOTEOL, 0, "a$", "aa\naa" },
236 { 0, PCRE2_NEWLINE_CR, 0, 0, ".\\Z", "aaa" },
237 { U, PCRE2_NEWLINE_CR, 0, 0, "a\\Z", "aaa\r" },
238 { 0, PCRE2_NEWLINE_CR, 0, 0, ".\\Z", "aaa\n" },
239 { 0, PCRE2_NEWLINE_CRLF, 0, 0, ".\\Z", "aaa\r" },
240 { U, PCRE2_NEWLINE_CRLF, 0, 0, ".\\Z", "aaa\n" },
241 { 0, PCRE2_NEWLINE_CRLF, 0, 0, ".\\Z", "aaa\r\n" },
242 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa" },
243 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa\r" },
244 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa\n" },
245 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa\r\n" },
246 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa\xe2\x80\xa8" },
247 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa" },
248 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa\r" },
249 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa\n" },
250 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".\\Z", "aaa\r\n" },
251 { U, PCRE2_NEWLINE_ANY, 0, 0, ".\\Z", "aaa\xc2\x85" },
252 { U, PCRE2_NEWLINE_ANY, 0, 0, ".\\Z", "aaa\xe2\x80\xa8" },
253 { M, A, 0, 0, "\\Aa", "aaa" },
254 { M, A, 0, 1 | F_NOMATCH, "\\Aa", "aaa" },
255 { M, A, 0, 1, "\\Ga", "aaa" },
256 { M, A, 0, 1 | F_NOMATCH, "\\Ga", "aba" },
257 { M, A, 0, 0, "a\\z", "aaa" },
258 { M, A, 0, 0 | F_NOMATCH, "a\\z", "aab" },
261 { MU, A, 0, 0, "(ab|bb|cd)", "bacde" },
262 { MU, A, 0, 0, "(?:ab|a)(bc|c)", "ababc" },
263 { MU, A, 0, 0, "((ab|(cc))|(bb)|(?:cd|efg))", "abac" },
264 { CMU, A, 0, 0, "((aB|(Cc))|(bB)|(?:cd|EFg))", "AcCe" },
265 { MU, A, 0, 0, "((ab|(cc))|(bb)|(?:cd|ebg))", "acebebg" },
266 { MU, A, 0, 0, "(?:(a)|(?:b))(cc|(?:d|e))(a|b)k", "accabdbbccbk" },
267 { MU, A, 0, 0, "\xc7\x82|\xc6\x82", "\xf1\x83\x82\x82\xc7\x82\xc7\x83" },
268 { MU, A, 0, 0, "=\xc7\x82|#\xc6\x82", "\xf1\x83\x82\x82=\xc7\x82\xc7\x83" },
269 { MU, A, 0, 0, "\xc7\x82\xc7\x83|\xc6\x82\xc6\x82", "\xf1\x83\x82\x82\xc7\x82\xc7\x83" },
270 …{ MU, A, 0, 0, "\xc6\x82\xc6\x82|\xc7\x83\xc7\x83|\xc8\x84\xc8\x84", "\xf1\x83\x82\x82\xc8\x84\xc8…
271 { U, A, 0, 0, "\xe1\x81\x80|\xe2\x82\x80|\xe4\x84\x80", "\xdf\xbf\xc2\x80\xe4\x84\x80" },
272 { U, A, 0, 0, "(?:\xe1\x81\x80|\xe2\x82\x80|\xe4\x84\x80)#", "\xdf\xbf\xc2\x80#\xe4\x84\x80#" },
273 { CM, A, 0, 0, "ab|cd", "CD" },
274 { CM, A, 0, 0, "a1277|a1377|bX487", "bx487" },
275 { CM, A, 0, 0, "a1277|a1377|bx487", "bX487" },
278 { MU, A, 0, 0, "(?:a)?a", "laab" },
279 { CMU, A, 0, 0, "(A)?A", "llaab" },
280 { MU, A, 0, 0, "(a)?\?a", "aab" }, /* ?? is the prefix of trigraphs in GCC. */
281 { MU, A, 0, 0, "(a)?a", "manm" },
282 { CMU, A, 0, 0, "(a|b)?\?d((?:e)?)", "ABABdx" },
283 { MU, A, 0, 0, "(a|b)?\?d((?:e)?)", "abcde" },
284 { MU, A, 0, 0, "((?:ab)?\?g|b(?:g(nn|d)?\?)?)?\?(?:n)?m", "abgnbgnnbgdnmm" },
287 { MU, A, 0, 0, "(aa)+aa", "aaaaaaa" },
288 { MU, A, 0, 0, "(aa)+?aa", "aaaaaaa" },
289 { MU, A, 0, 0, "(?:aba|ab|a)+l", "ababamababal" },
290 { MU, A, 0, 0, "(?:aba|ab|a)+?l", "ababamababal" },
291 { MU, A, 0, 0, "(a(?:bc|cb|b|c)+?|ss)+e", "accssabccbcacbccbbXaccssabccbcacbccbbe" },
292 { MU, A, 0, 0, "(a(?:bc|cb|b|c)+|ss)+?e", "accssabccbcacbccbbXaccssabccbcacbccbbe" },
293 { MU, A, 0, 0, "(?:(b(c)+?)+)?\?(?:(bc)+|(cb)+)+(?:m)+", "bccbcccbcbccbcbPbccbcccbcbccbcbmmn" },
294 { MU, A, 0, 0, "(aa|bb){8,1000}", "abaabbaabbaabbaab_aabbaabbaabbaabbaabbaabb_" },
297 { CMU, A, 0, 0, "(?:AA)*AB", "aaaaaaamaaaaaaab" },
298 { MU, A, 0, 0, "(?:aa)*?ab", "aaaaaaamaaaaaaab" },
299 { MU, A, 0, 0, "(aa|ab)*ab", "aaabaaab" },
300 { CMU, A, 0, 0, "(aa|Ab)*?aB", "aaabaaab" },
301 { MU, A, 0, 0, "(a|b)*(?:a)*(?:b)*m", "abbbaaababanabbbaaababamm" },
302 { MU, A, 0, 0, "(a|b)*?(?:a)*?(?:b)*?m", "abbbaaababanabbbaaababamm" },
303 { M, A, 0, 0, "a(a(\\1*)a|(b)b+){0}a", "aa" },
304 { M, A, 0, 0, "((?:a|)*){0}a", "a" },
307 { MU, A, 0, 0, "((bm)+)?\?(?:a)*(bm)+n|((am)+?)?(?:a)+(am)*n", "bmbmabmamaaamambmaman" },
308 { MU, A, 0, 0, "(((ab)?cd)*ef)+g", "abcdcdefcdefefmabcdcdefcdefefgg" },
309 { MU, A, 0, 0, "(((ab)?\?cd)*?ef)+?g", "abcdcdefcdefefmabcdcdefcdefefgg" },
310 { MU, A, 0, 0, "(?:(ab)?c|(?:ab)+?d)*g", "ababcdccababddg" },
311 { MU, A, 0, 0, "(?:(?:ab)?\?c|(ab)+d)*?g", "ababcdccababddg" },
314 { MU, A, 0, 0, "(a+aab)+aaaab", "aaaabcaaaabaabcaabcaaabaaaab" },
315 { MU, A, 0, 0, "(a*a*aab)+x", "aaaaabaabaaabmaabx" },
316 { MU, A, 0, 0, "(a*?(b|ab)a*?)+x", "aaaabcxbbaabaacbaaabaabax" },
317 { MU, A, 0, 0, "(a+(ab|ad)a+)+x", "aaabaaaadaabaaabaaaadaaax" },
318 { MU, A, 0, 0, "(a?(a)a?)+(aaa)", "abaaabaaaaaaaa" },
319 { MU, A, 0, 0, "(a?\?(a)a?\?)+(b)", "aaaacaaacaacacbaaab" },
320 { MU, A, 0, 0, "(a{0,4}(b))+d", "aaaaaabaabcaaaaabaaaaabd" },
321 { MU, A, 0, 0, "(a{0,4}?[^b])+d+(a{0,4}[^b])d+", "aaaaadaaaacaadddaaddd" },
322 { MU, A, 0, 0, "(ba{2})+c", "baabaaabacbaabaac" },
323 { MU, A, 0, 0, "(a*+bc++)+", "aaabbcaaabcccab" },
324 { MU, A, 0, 0, "(a?+[^b])+", "babaacacb" },
325 { MU, A, 0, 0, "(a{0,3}+b)(a{0,3}+b)(a{0,3}+)[^c]", "abaabaaacbaabaaaac" },
326 { CMU, A, 0, 0, "([a-c]+[d-f]+?)+?g", "aBdacdehAbDaFgA" },
327 { CMU, A, 0, 0, "[c-f]+k", "DemmFke" },
328 { MU, A, 0, 0, "([DGH]{0,4}M)+", "GGDGHDGMMHMDHHGHM" },
329 { MU, A, 0, 0, "([a-c]{4,}s)+", "abasabbasbbaabsbba" },
330 { CMU, A, 0, 0, "[ace]{3,7}", "AcbDAcEEcEd" },
331 { CMU, A, 0, 0, "[ace]{3,7}?", "AcbDAcEEcEd" },
332 { CMU, A, 0, 0, "[ace]{3,}", "AcbDAcEEcEd" },
333 { CMU, A, 0, 0, "[ace]{3,}?", "AcbDAcEEcEd" },
334 { MU, A, 0, 0, "[ckl]{2,}?g", "cdkkmlglglkcg" },
335 { CMU, A, 0, 0, "[ace]{5}?", "AcCebDAcEEcEd" },
336 { MU, A, 0, 0, "([AbC]{3,5}?d)+", "BACaAbbAEAACCbdCCbdCCAAbb" },
337 { MU, A, 0, 0, "([^ab]{0,}s){2}", "abaabcdsABamsDDs" },
338 { MU, A, 0, 0, "\\b\\w+\\B", "x,a_cd" },
339 { MUP, A, 0, 0, "\\b[^\xc2\xa1]+\\B", "\xc3\x89\xc2\xa1\xe6\x92\xad\xc3\x81\xc3\xa1" },
340 { CMU, A, 0, 0, "[^b]+(a*)([^c]?d{3})", "aaaaddd" },
341 { CMUP, A, 0, 0, "\xe1\xbd\xb8{2}", "\xe1\xbf\xb8#\xe1\xbf\xb8\xe1\xbd\xb8" },
342 …{ CMU, A, 0, 0, "[^\xf0\x90\x90\x80]{2,4}@", "\xf0\x90\x90\xa8\xf0\x90\x90\x80###\xf0\x90\x90\x80@…
343 { CMU, A, 0, 0, "[^\xe1\xbd\xb8][^\xc3\xa9]", "\xe1\xbd\xb8\xe1\xbf\xb8\xc3\xa9\xc3\x89#" },
344 { MU, A, 0, 0, "[^\xe1\xbd\xb8][^\xc3\xa9]", "\xe1\xbd\xb8\xe1\xbf\xb8\xc3\xa9\xc3\x89#" },
345 { MU, A, 0, 0, "[^\xe1\xbd\xb8]{3,}?", "##\xe1\xbd\xb8#\xe1\xbd\xb8#\xc3\x89#\xe1\xbd\xb8" },
346 { MU, A, 0, 0, "\\d+123", "987654321,01234" },
347 { MU, A, 0, 0, "abcd*|\\w+xy", "aaaaa,abxyz" },
348 { MU, A, 0, 0, "(?:abc|((?:amc|\\b\\w*xy)))", "aaaaa,abxyz" },
349 { MU, A, 0, 0, "a(?R)|([a-z]++)#", ".abcd.abcd#."},
350 { MU, A, 0, 0, "a(?R)|([a-z]++)#", ".abcd.mbcd#."},
351 { MU, A, 0, 0, ".[ab]*.", "xx" },
352 { MU, A, 0, 0, ".[ab]*a", "xxa" },
353 { MU, A, 0, 0, ".[ab]?.", "xx" },
354 { MU, A, 0, 0, "_[ab]+_*a", "_aa" },
355 { MU, A, 0, 0, "#(A+)#\\d+", "#A#A#0" },
356 { MU, A, 0, 0, "(?P<size>\\d+)m|M", "4M" },
357 { M, PCRE2_NEWLINE_CRLF, 0, 0, "\\n?.+#", "\n,\n,#" },
360 { MU, A, 0, 0, "(?:(ab){2}){5}M", "abababababababababababM" },
361 { MU, A, 0, 0, "(?:ab|abab){1,5}M", "abababababababababababM" },
362 { MU, A, 0, 0, "(?>ab|abab){1,5}M", "abababababababababababM" },
363 { MU, A, 0, 0, "(?:ab|abab){1,5}?M", "abababababababababababM" },
364 { MU, A, 0, 0, "(?>ab|abab){1,5}?M", "abababababababababababM" },
365 { MU, A, 0, 0, "(?:(ab){1,4}?){1,3}?M", "abababababababababababababM" },
366 { MU, A, 0, 0, "(?:(ab){1,4}){1,3}abababababababababababM", "ababababababababababababM" },
367 …{ MU, A, 0, 0 | F_NOMATCH, "(?:(ab){1,4}){1,3}abababababababababababM", "abababababababababababM" …
368 { MU, A, 0, 0, "(ab){4,6}?M", "abababababababM" },
371 { MU, A, 0, 0, "(?:\\s)+(?:\\S)+", "ab \t\xc3\xa9\xe6\x92\xad " },
372 { MU, A, 0, 0, "(\\w)*(k)(\\W)?\?", "abcdef abck11" },
373 { MU, A, 0, 0, "\\((\\d)+\\)\\D", "a() (83 (8)2 (9)ab" },
374 { MU, A, 0, 0, "\\w(\\s|(?:\\d)*,)+\\w\\wb", "a 5, 4,, bb 5, 4,, aab" },
375 { MU, A, 0, 0, "(\\v+)(\\V+)", "\x0e\xc2\x85\xe2\x80\xa8\x0b\x09\xe2\x80\xa9" },
376 …{ MU, A, 0, 0, "(\\h+)(\\H+)", "\xe2\x80\xa8\xe2\x80\x80\x20\xe2\x80\x8a\xe2\x81\x9f\xe3\x80\x80\x…
377 { MU, A, 0, 0, "x[bcef]+", "xaxdxecbfg" },
378 { MU, A, 0, 0, "x[bcdghij]+", "xaxexfxdgbjk" },
379 { MU, A, 0, 0, "x[^befg]+", "xbxexacdhg" },
380 { MU, A, 0, 0, "x[^bcdl]+", "xlxbxaekmd" },
381 { MU, A, 0, 0, "x[^bcdghi]+", "xbxdxgxaefji" },
382 { MU, A, 0, 0, "x[B-Fb-f]+", "xaxAxgxbfBFG" },
383 { CMU, A, 0, 0, "\\x{e9}+", "#\xf0\x90\x90\xa8\xc3\xa8\xc3\xa9\xc3\x89\xc3\x88" },
384 { CMU, A, 0, 0, "[^\\x{e9}]+", "\xc3\xa9#\xf0\x90\x90\xa8\xc3\xa8\xc3\x88\xc3\x89" },
385 { MU, A, 0, 0, "[\\x02\\x7e]+", "\xc3\x81\xe1\xbf\xb8\xf0\x90\x90\xa8\x01\x02\x7e\x7f" },
386 { MU, A, 0, 0, "[^\\x02\\x7e]+", "\x02\xc3\x81\xe1\xbf\xb8\xf0\x90\x90\xa8\x01\x7f\x7e" },
387 …{ MU, A, 0, 0, "[\\x{81}-\\x{7fe}]+", "#\xe1\xbf\xb8\xf0\x90\x90\xa8\xc2\x80\xc2\x81\xdf\xbe\xdf\x…
388 …{ MU, A, 0, 0, "[^\\x{81}-\\x{7fe}]+", "\xc2\x81#\xe1\xbf\xb8\xf0\x90\x90\xa8\xc2\x80\xdf\xbf\xdf\…
389 …{ MU, A, 0, 0, "[\\x{801}-\\x{fffe}]+", "#\xc3\xa9\xf0\x90\x90\x80\xe0\xa0\x80\xe0\xa0\x81\xef\xbf…
390 …{ MU, A, 0, 0, "[^\\x{801}-\\x{fffe}]+", "\xe0\xa0\x81#\xc3\xa9\xf0\x90\x90\x80\xe0\xa0\x80\xef\xb…
391 …{ MU, A, 0, 0, "[\\x{10001}-\\x{10fffe}]+", "#\xc3\xa9\xe2\xb1\xa5\xf0\x90\x80\x80\xf0\x90\x80\x81…
392 …{ MU, A, 0, 0, "[^\\x{10001}-\\x{10fffe}]+", "\xf0\x90\x80\x81#\xc3\xa9\xe2\xb1\xa5\xf0\x90\x80\x8…
393 { CMU, A, 0, 0 | F_NOMATCH, "^[\\x{0100}-\\x{017f}]", " " },
396 { MUP, A, 0, 0, "[1-5\xc3\xa9\\w]", "\xc3\xa1_" },
397 { MUP, A, 0, 0 | F_PROPERTY, "[\xc3\x81\\p{Ll}]", "A_\xc3\x89\xc3\xa1" },
398 { MUP, A, 0, 0, "[\\Wd-h_x-z]+", "a\xc2\xa1#_yhzdxi" },
399 { MUP, A, 0, 0 | F_NOMATCH | F_PROPERTY, "[\\P{Any}]", "abc" },
400 { MUP, A, 0, 0 | F_NOMATCH | F_PROPERTY, "[^\\p{Any}]", "abc" },
401 { MUP, A, 0, 0 | F_NOMATCH | F_PROPERTY, "[\\P{Any}\xc3\xa1-\xc3\xa8]", "abc" },
402 { MUP, A, 0, 0 | F_NOMATCH | F_PROPERTY, "[^\\p{Any}\xc3\xa1-\xc3\xa8]", "abc" },
403 { MUP, A, 0, 0 | F_NOMATCH | F_PROPERTY, "[\xc3\xa1-\xc3\xa8\\P{Any}]", "abc" },
404 { MUP, A, 0, 0 | F_NOMATCH | F_PROPERTY, "[^\xc3\xa1-\xc3\xa8\\p{Any}]", "abc" },
405 { MUP, A, 0, 0 | F_PROPERTY, "[\xc3\xa1-\xc3\xa8\\p{Any}]", "abc" },
406 { MUP, A, 0, 0 | F_PROPERTY, "[^\xc3\xa1-\xc3\xa8\\P{Any}]", "abc" },
407 { MUP, A, 0, 0, "[b-\xc3\xa9\\s]", "a\xc\xe6\x92\xad" },
408 { CMUP, A, 0, 0, "[\xc2\x85-\xc2\x89\xc3\x89]", "\xc2\x84\xc3\xa9" },
409 { MUP, A, 0, 0, "[^b-d^&\\s]{3,}", "db^ !a\xe2\x80\xa8_ae" },
410 …{ MUP, A, 0, 0 | F_PROPERTY, "[^\\S\\P{Any}][\\sN]{1,3}[\\P{N}]{4}", "\xe2\x80\xaa\xa N\x9\xc3\xa9…
411 { MU, A, 0, 0 | F_PROPERTY, "[^\\P{L}\x9!D-F\xa]{2,3}", "\x9,.DF\xa.CG\xc3\x81" },
412 …{ CMUP, A, 0, 0, "[\xc3\xa1-\xc3\xa9_\xe2\x80\xa0-\xe2\x80\xaf]{1,5}[^\xe2\x80\xa0-\xe2\x80\xaf]",…
413 …{ MUP, A, 0, 0 | F_PROPERTY, "[\xc3\xa2-\xc3\xa6\xc3\x81-\xc3\x84\xe2\x80\xa8-\xe2\x80\xa9\xe6\x92…
414 …{ MUP, A, 0, 0 | F_PROPERTY, "[\\P{L&}]{2}[^\xc2\x85-\xc2\x89\\p{Ll}\\p{Lu}]{2}", "\xc3\xa9\xe6\x9…
415 { PCRE2_UCP, 0, 0, 0 | F_PROPERTY, "[a-b\\s]{2,5}[^a]", "AB baaa" },
416 { MUP, 0, 0, 0 | F_NOMATCH, "[^\\p{Hangul}\\p{Z}]", " " },
417 { MUP, 0, 0, 0, "[\\p{Lu}\\P{Latin}]+", "c\xEA\xA4\xAE,A,b" },
418 { MUP, 0, 0, 0, "[\\x{a92e}\\p{Lu}\\P{Latin}]+", "c\xEA\xA4\xAE,A,b" },
419 { CMUP, 0, 0, 0, "[^S]\\B", "\xe2\x80\x8a" },
422 { MU, A, 0, 0, "(?:|ab||bc|a)+d", "abcxabcabd" },
423 { MU, A, 0, 0, "(|ab||bc|a)+d", "abcxabcabd" },
424 { MU, A, 0, 0, "(?:|ab||bc|a)*d", "abcxabcabd" },
425 { MU, A, 0, 0, "(|ab||bc|a)*d", "abcxabcabd" },
426 { MU, A, 0, 0, "(?:|ab||bc|a)+?d", "abcxabcabd" },
427 { MU, A, 0, 0, "(|ab||bc|a)+?d", "abcxabcabd" },
428 { MU, A, 0, 0, "(?:|ab||bc|a)*?d", "abcxabcabd" },
429 { MU, A, 0, 0, "(|ab||bc|a)*?d", "abcxabcabd" },
430 { MU, A, 0, 0, "(((a)*?|(?:ba)+)+?|(?:|c|ca)*)*m", "abaacaccabacabalabaacaccabacabamm" },
431 { MU, A, 0, 0, "(?:((?:a)*|(ba)+?)+|(|c|ca)*?)*?m", "abaacaccabacabalabaacaccabacabamm" },
434 { MU, A, 0, 3, "(\\d|(?:\\w)*\\w)+", "0ac01Hb" },
435 { MU, A, 0, 4 | F_NOMATCH, "(\\w\\W\\w)+", "ab#d" },
436 { MU, A, 0, 2 | F_NOMATCH, "(\\w\\W\\w)+", "ab#d" },
437 { MU, A, 0, 1, "(\\w\\W\\w)+", "ab#d" },
440 { M, PCRE2_NEWLINE_CRLF, 0, 0, "\\W{0,2}[^#]{3}", "\r\n#....." },
441 { M, PCRE2_NEWLINE_CR, 0, 0, "\\W{0,2}[^#]{3}", "\r\n#....." },
442 { M, PCRE2_NEWLINE_CRLF, 0, 0, "\\W{1,3}[^#]", "\r\n##...." },
443 { MU, A, PCRE2_NO_UTF_CHECK, 1, "^.a", "\n\x80\nxa" },
444 { MU, A, 0, 1, "^", "\r\n" },
445 { M, PCRE2_NEWLINE_CRLF, 0, 1 | F_NOMATCH, "^", "\r\n" },
446 { M, PCRE2_NEWLINE_CRLF, 0, 1, "^", "\r\na" },
449 { 0, PCRE2_NEWLINE_CRLF, 0, 0, ".", "\r" },
450 { U, PCRE2_NEWLINE_CRLF, 0, 0, ".(.).", "a\xc3\xa1\r\n\n\r\r" },
451 { 0, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".(.)", "a\rb\nc\r\n\xc2\x85\xe2\x80\xa8" },
452 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0, ".(.)", "a\rb\nc\r\n\xc2\x85\xe2\x80\xa8" },
453 { U, PCRE2_NEWLINE_ANY, 0, 0, "(.).", "a\rb\nc\r\n\xc2\x85\xe2\x80\xa9$de" },
454 { U, PCRE2_NEWLINE_ANYCRLF, 0, 0 | F_NOMATCH, ".(.).", "\xe2\x80\xa8\nb\r" },
455 { 0, PCRE2_NEWLINE_ANY, 0, 0, "(.)(.)", "#\x85#\r#\n#\r\n#\x84" },
456 { U, PCRE2_NEWLINE_ANY, 0, 0, "(.+)#", "#\rMn\xc2\x85#\n###" },
457 { 0, BSR(PCRE2_BSR_ANYCRLF), 0, 0, "\\R", "\r" },
458 { 0, BSR(PCRE2_BSR_ANYCRLF), 0, 0, "\\R", "\x85#\r\n#" },
459 { U, BSR(PCRE2_BSR_UNICODE), 0, 0, "\\R", "ab\xe2\x80\xa8#c" },
460 { U, BSR(PCRE2_BSR_UNICODE), 0, 0, "\\R", "ab\r\nc" },
461 …{ U, PCRE2_NEWLINE_CRLF | BSR(PCRE2_BSR_UNICODE), 0, 0, "(\\R.)+", "\xc2\x85\r\n#\xe2\x80\xa8\n\r\…
462 { MU, A, 0, 0 | F_NOMATCH, "\\R+", "ab" },
463 { MU, A, 0, 0, "\\R+", "ab\r\n\r" },
464 { MU, A, 0, 0, "\\R*", "ab\r\n\r" },
465 { MU, A, 0, 0, "\\R*", "\r\n\r" },
466 { MU, A, 0, 0, "\\R{2,4}", "\r\nab\r\r" },
467 { MU, A, 0, 0, "\\R{2,4}", "\r\nab\n\n\n\r\r\r" },
468 { MU, A, 0, 0, "\\R{2,}", "\r\nab\n\n\n\r\r\r" },
469 { MU, A, 0, 0, "\\R{0,3}", "\r\n\r\n\r\n\r\n\r\n" },
470 { MU, A, 0, 0 | F_NOMATCH, "\\R+\\R\\R", "\r\n\r\n" },
471 { MU, A, 0, 0, "\\R+\\R\\R", "\r\r\r" },
472 { MU, A, 0, 0, "\\R*\\R\\R", "\n\r" },
473 { MU, A, 0, 0 | F_NOMATCH, "\\R{2,4}\\R\\R", "\r\r\r" },
474 { MU, A, 0, 0, "\\R{2,4}\\R\\R", "\r\r\r\r" },
477 { MU, A, 0, 0 | F_NOMATCH, "(?>ab)ab", "bab" },
478 { MU, A, 0, 0 | F_NOMATCH, "(?>(ab))ab", "bab" },
479 { MU, A, 0, 0, "(?>ab)+abc(?>de)*def(?>gh)?ghe(?>ij)+?k(?>lm)*?n(?>op)?\?op",
481 { MU, A, 0, 0, "(?>a(b)+a|(ab)?\?(b))an", "abban" },
482 { MU, A, 0, 0, "(?>ab+a|(?:ab)?\?b)an", "abban" },
483 { MU, A, 0, 0, "((?>ab|ad|)*?)(?>|c)*abad", "abababcababad" },
484 { MU, A, 0, 0, "(?>(aa|b|)*+(?>(##)|###)*d|(aa)(?>(baa)?)m)", "aabaa#####da" },
485 { MU, A, 0, 0, "((?>a|)+?)b", "aaacaaab" },
486 { MU, A, 0, 0, "(?>x|)*$", "aaa" },
487 { MU, A, 0, 0, "(?>(x)|)*$", "aaa" },
488 { MU, A, 0, 0, "(?>x|())*$", "aaa" },
489 { MU, A, 0, 0, "((?>[cxy]a|[a-d])*?)b", "aaa+ aaab" },
490 { MU, A, 0, 0, "((?>[cxy](a)|[a-d])*?)b", "aaa+ aaab" },
491 { MU, A, 0, 0, "(?>((?>(a+))))bab|(?>((?>(a+))))bb", "aaaabaaabaabab" },
492 { MU, A, 0, 0, "(?>(?>a+))bab|(?>(?>a+))bb", "aaaabaaabaabab" },
493 { MU, A, 0, 0, "(?>(a)c|(?>(c)|(a))a)b*?bab", "aaaabaaabaabab" },
494 { MU, A, 0, 0, "(?>ac|(?>c|a)a)b*?bab", "aaaabaaabaabab" },
495 { MU, A, 0, 0, "(?>(b)b|(a))*b(?>(c)|d)?x", "ababcaaabdbx" },
496 { MU, A, 0, 0, "(?>bb|a)*b(?>c|d)?x", "ababcaaabdbx" },
497 { MU, A, 0, 0, "(?>(bb)|a)*b(?>c|(d))?x", "ababcaaabdbx" },
498 { MU, A, 0, 0, "(?>(a))*?(?>(a))+?(?>(a))??x", "aaaaaacccaaaaabax" },
499 { MU, A, 0, 0, "(?>a)*?(?>a)+?(?>a)??x", "aaaaaacccaaaaabax" },
500 { MU, A, 0, 0, "(?>(a)|)*?(?>(a)|)+?(?>(a)|)??x", "aaaaaacccaaaaabax" },
501 { MU, A, 0, 0, "(?>a|)*?(?>a|)+?(?>a|)??x", "aaaaaacccaaaaabax" },
502 { MU, A, 0, 0, "(?>a(?>(a{0,2}))*?b|aac)+b", "aaaaaaacaaaabaaaaacaaaabaacaaabb" },
503 …{ CM, A, 0, 0, "(?>((?>a{32}|b+|(a*))?(?>c+|d*)?\?)+e)+?f", "aaccebbdde bbdaaaccebbdee bbdaaaccebb…
504 …{ MU, A, 0, 0, "(?>(?:(?>aa|a||x)+?b|(?>aa|a||(x))+?c)?(?>[ad]{0,2})*?d)+d", "aaacdbaabdcabdbaaacd…
505 …{ MU, A, 0, 0, "(?>(?:(?>aa|a||(x))+?b|(?>aa|a||x)+?c)?(?>[ad]{0,2})*?d)+d", "aaacdbaabdcabdbaaacd…
506 { MU, A, 0, 0 | F_PROPERTY, "\\X", "\xcc\x8d\xcc\x8d" },
507 { MU, A, 0, 0 | F_PROPERTY, "\\X", "\xcc\x8d\xcc\x8d#\xcc\x8d\xcc\x8d" },
508 { MU, A, 0, 0 | F_PROPERTY, "\\X+..", "\xcc\x8d#\xcc\x8d#\xcc\x8d\xcc\x8d" },
509 { MU, A, 0, 0 | F_PROPERTY, "\\X{2,4}", "abcdef" },
510 { MU, A, 0, 0 | F_PROPERTY, "\\X{2,4}?", "abcdef" },
511 { MU, A, 0, 0 | F_NOMATCH | F_PROPERTY, "\\X{2,4}..", "#\xcc\x8d##" },
512 { MU, A, 0, 0 | F_PROPERTY, "\\X{2,4}..", "#\xcc\x8d#\xcc\x8d##" },
513 { MU, A, 0, 0, "(c(ab)?+ab)+", "cabcababcab" },
514 { MU, A, 0, 0, "(?>(a+)b)+aabab", "aaaabaaabaabab" },
517 { MU, A, 0, 0, "(?:a|b)++m", "mababbaaxababbaam" },
518 { MU, A, 0, 0, "(?:a|b)*+m", "mababbaaxababbaam" },
519 { MU, A, 0, 0, "(?:a|b)*+m", "ababbaaxababbaam" },
520 { MU, A, 0, 0, "(a|b)++m", "mababbaaxababbaam" },
521 { MU, A, 0, 0, "(a|b)*+m", "mababbaaxababbaam" },
522 { MU, A, 0, 0, "(a|b)*+m", "ababbaaxababbaam" },
523 { MU, A, 0, 0, "(a|b(*ACCEPT))++m", "maaxab" },
524 { MU, A, 0, 0, "(?:b*)++m", "bxbbxbbbxm" },
525 { MU, A, 0, 0, "(?:b*)++m", "bxbbxbbbxbbm" },
526 { MU, A, 0, 0, "(?:b*)*+m", "bxbbxbbbxm" },
527 { MU, A, 0, 0, "(?:b*)*+m", "bxbbxbbbxbbm" },
528 { MU, A, 0, 0, "(b*)++m", "bxbbxbbbxm" },
529 { MU, A, 0, 0, "(b*)++m", "bxbbxbbbxbbm" },
530 { MU, A, 0, 0, "(b*)*+m", "bxbbxbbbxm" },
531 { MU, A, 0, 0, "(b*)*+m", "bxbbxbbbxbbm" },
532 { MU, A, 0, 0, "(?:a|(b))++m", "mababbaaxababbaam" },
533 { MU, A, 0, 0, "(?:(a)|b)*+m", "mababbaaxababbaam" },
534 { MU, A, 0, 0, "(?:(a)|(b))*+m", "ababbaaxababbaam" },
535 { MU, A, 0, 0, "(a|(b))++m", "mababbaaxababbaam" },
536 { MU, A, 0, 0, "((a)|b)*+m", "mababbaaxababbaam" },
537 { MU, A, 0, 0, "((a)|(b))*+m", "ababbaaxababbaam" },
538 { MU, A, 0, 0, "(a|(b)(*ACCEPT))++m", "maaxab" },
539 { MU, A, 0, 0, "(?:(b*))++m", "bxbbxbbbxm" },
540 { MU, A, 0, 0, "(?:(b*))++m", "bxbbxbbbxbbm" },
541 { MU, A, 0, 0, "(?:(b*))*+m", "bxbbxbbbxm" },
542 { MU, A, 0, 0, "(?:(b*))*+m", "bxbbxbbbxbbm" },
543 { MU, A, 0, 0, "((b*))++m", "bxbbxbbbxm" },
544 { MU, A, 0, 0, "((b*))++m", "bxbbxbbbxbbm" },
545 { MU, A, 0, 0, "((b*))*+m", "bxbbxbbbxm" },
546 { MU, A, 0, 0, "((b*))*+m", "bxbbxbbbxbbm" },
547 { MU, A, 0, 0 | F_NOMATCH, "(?>(b{2,4}))(?:(?:(aa|c))++m|(?:(aa|c))+n)", "bbaacaaccaaaacxbbbmbn" },
548 { MU, A, 0, 0, "((?:b)++a)+(cd)*+m", "bbababbacdcdnbbababbacdcdm" },
549 { MU, A, 0, 0, "((?:(b))++a)+((c)d)*+m", "bbababbacdcdnbbababbacdcdm" },
550 …{ MU, A, 0, 0, "(?:(?:(?:ab)*+k)++(?:n(?:cd)++)*+)*+m", "ababkkXababkkabkncXababkkabkncdcdncdXabab…
551 …{ MU, A, 0, 0, "(?:((ab)*+(k))++(n(?:c(d))++)*+)*+m", "ababkkXababkkabkncXababkkabkncdcdncdXababkk…
554 { MU, A, 0, 0, "(aa|bb)(\\1*)(ll|)(\\3*)bbbbbbc", "aaaaaabbbbbbbbc" },
555 { CMU, A, 0, 0, "(aa|bb)(\\1+)(ll|)(\\3+)bbbbbbc", "bBbbBbCbBbbbBbbcbbBbbbBBbbC" },
556 { CM, A, 0, 0, "(a{2,4})\\1", "AaAaaAaA" },
557 { MU, A, 0, 0, "(aa|bb)(\\1?)aa(\\1?)(ll|)(\\4+)bbc", "aaaaaaaabbaabbbbaabbbbc" },
558 { MU, A, 0, 0, "(aa|bb)(\\1{0,5})(ll|)(\\3{0,5})cc", "bbxxbbbbxxaaaaaaaaaaaaaaaacc" },
559 { MU, A, 0, 0, "(aa|bb)(\\1{3,5})(ll|)(\\3{3,5})cc", "bbbbbbbbbbbbaaaaaaccbbbbbbbbbbbbbbcc" },
560 { MU, A, 0, 0, "(aa|bb)(\\1{3,})(ll|)(\\3{3,})cc", "bbbbbbbbbbbbaaaaaaccbbbbbbbbbbbbbbcc" },
561 { MU, A, 0, 0, "(\\w+)b(\\1+)c", "GabGaGaDbGaDGaDc" },
562 { MU, A, 0, 0, "(?:(aa)|b)\\1?b", "bb" },
563 { CMU, A, 0, 0, "(aa|bb)(\\1*?)aa(\\1+?)", "bBBbaaAAaaAAaa" },
564 { MU, A, 0, 0, "(aa|bb)(\\1*?)(dd|)cc(\\3+?)", "aaaaaccdd" },
565 { CMU, A, 0, 0, "(?:(aa|bb)(\\1?\?)cc){2}(\\1?\?)", "aAaABBbbAAaAcCaAcCaA" },
566 { MU, A, 0, 0, "(?:(aa|bb)(\\1{3,5}?)){2}(dd|)(\\3{3,5}?)", "aaaaaabbbbbbbbbbaaaaaaaaaaaaaa" },
567 { CM, A, 0, 0, "(?:(aa|bb)(\\1{3,}?)){2}(dd|)(\\3{3,}?)", "aaaaaabbbbbbbbbbaaaaaaaaaaaaaa" },
568 …{ MU, A, 0, 0, "(?:(aa|bb)(\\1{0,3}?)){2}(dd|)(\\3{0,3}?)b(\\1{0,3}?)(\\1{0,3})", "aaaaaaaaaaaaaaa…
569 { MU, A, 0, 0, "(a(?:\\1|)a){3}b", "aaaaaaaaaaab" },
570 …{ M, A, 0, 0, "(a?)b(\\1\\1*\\1+\\1?\\1*?\\1+?\\1??\\1*+\\1++\\1?+\\1{4}\\1{3,5}\\1{4,}\\1{0,5}\\1…
571 { MUP, A, 0, 0 | F_PROPERTY, "(\\P{N})\\1{2,}", ".www." },
572 { MUP, A, 0, 0 | F_PROPERTY, "(\\P{N})\\1{0,2}", "wwwww." },
573 { MUP, A, 0, 0 | F_PROPERTY, "(\\P{N})\\1{1,2}ww", "wwww" },
574 { MUP, A, 0, 0 | F_PROPERTY, "(\\P{N})\\1{1,2}ww", "wwwww" },
575 { PCRE2_UCP, 0, 0, 0 | F_PROPERTY, "(\\P{N})\\1{2,}", ".www." },
576 { CMUP, A, 0, 0, "(\xf0\x90\x90\x80)\\1", "\xf0\x90\x90\xa8\xf0\x90\x90\xa8" },
577 { MU | PCRE2_DUPNAMES, A, 0, 0 | F_NOMATCH, "\\k<A>{1,3}(?<A>aa)(?<A>bb)", "aabb" },
578 …{ MU | PCRE2_DUPNAMES | PCRE2_MATCH_UNSET_BACKREF, A, 0, 0, "\\k<A>{1,3}(?<A>aa)(?<A>bb)", "aabb" …
579 { MU | PCRE2_DUPNAMES | PCRE2_MATCH_UNSET_BACKREF, A, 0, 0, "\\k<A>*(?<A>aa)(?<A>bb)", "aabb" },
580 { MU | PCRE2_DUPNAMES, A, 0, 0, "(?<A>aa)(?<A>bb)\\k<A>{0,3}aaaaaa", "aabbaaaaaa" },
581 { MU | PCRE2_DUPNAMES, A, 0, 0, "(?<A>aa)(?<A>bb)\\k<A>{2,5}bb", "aabbaaaabb" },
582 { MU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>aa)|(?<A>bb))\\k<A>{0,3}m", "aaaaaaaabbbbaabbbbm" },
583 { MU | PCRE2_DUPNAMES, A, 0, 0 | F_NOMATCH, "\\k<A>{1,3}?(?<A>aa)(?<A>bb)", "aabb" },
584 …{ MU | PCRE2_DUPNAMES | PCRE2_MATCH_UNSET_BACKREF, A, 0, 0, "\\k<A>{1,3}?(?<A>aa)(?<A>bb)", "aabb"…
585 { MU | PCRE2_DUPNAMES, A, 0, 0, "\\k<A>*?(?<A>aa)(?<A>bb)", "aabb" },
586 …{ MU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>aa)|(?<A>bb))\\k<A>{0,3}?m", "aaaaaabbbbbbaabbbbbbbbbbm" …
587 { MU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>aa)|(?<A>bb))\\k<A>*?m", "aaaaaabbbbbbaabbbbbbbbbbm" },
588 { MU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>aa)|(?<A>bb))\\k<A>{2,3}?", "aaaabbbbaaaabbbbbbbbbb" },
589 { CMU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>AA)|(?<A>BB))\\k<A>{0,3}M", "aaaaaaaabbbbaabbbbm" },
590 { CMU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>AA)|(?<A>BB))\\k<A>{1,3}M", "aaaaaaaabbbbaabbbbm" },
591 …{ CMU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>AA)|(?<A>BB))\\k<A>{0,3}?M", "aaaaaabbbbbbaabbbbbbbbbbm"…
592 { CMU | PCRE2_DUPNAMES, A, 0, 0, "(?:(?<A>AA)|(?<A>BB))\\k<A>{2,3}?", "aaaabbbbaaaabbbbbbbbbb" },
595 { MU, A, 0, 0, "(?=xx|yy|zz)\\w{4}", "abczzdefg" },
596 { MU, A, 0, 0, "(?=((\\w+)b){3}|ab)", "dbbbb ab" },
597 { MU, A, 0, 0, "(?!ab|bc|cd)[a-z]{2}", "Xabcdef" },
598 { MU, A, 0, 0, "(?<=aaa|aa|a)a", "aaa" },
599 { MU, A, 0, 2, "(?<=aaa|aa|a)a", "aaa" },
600 { M, A, 0, 0, "(?<=aaa|aa|a)a", "aaa" },
601 { M, A, 0, 2, "(?<=aaa|aa|a)a", "aaa" },
602 { MU, A, 0, 0, "(\\d{2})(?!\\w+c|(((\\w?)m){2}n)+|\\1)", "x5656" },
603 …{ MU, A, 0, 0, "((?=((\\d{2,6}\\w){2,}))\\w{5,20}K){2,}", "567v09708K12l00M00 567v09708K12l00M00K4…
604 { MU, A, 0, 0, "(?=(?:(?=\\S+a)\\w*(b)){3})\\w+\\d", "bba bbab nbbkba nbbkba0kl" },
605 { MU, A, 0, 0, "(?>a(?>(b+))a(?=(..)))*?k", "acabbcabbaabacabaabbakk" },
606 { MU, A, 0, 0, "((?(?=(a))a)+k)", "bbak" },
607 { MU, A, 0, 0, "((?(?=a)a)+k)", "bbak" },
608 { MU, A, 0, 0 | F_NOMATCH, "(?=(?>(a))m)amk", "a k" },
609 { MU, A, 0, 0 | F_NOMATCH, "(?!(?>(a))m)amk", "a k" },
610 { MU, A, 0, 0 | F_NOMATCH, "(?>(?=(a))am)amk", "a k" },
611 …{ MU, A, 0, 0, "(?=(?>a|(?=(?>(b+))a|c)[a-c]+)*?m)[a-cm]+k", "aaam bbam baaambaam abbabba baaambaa…
612 { MU, A, 0, 0, "(?> ?\?\\b(?(?=\\w{1,4}(a))m)\\w{0,8}bc){2,}?", "bca ssbc mabd ssbc mabc" },
613 { MU, A, 0, 0, "(?:(?=ab)?[^n][^n])+m", "ababcdabcdcdabnababcdabcdcdabm" },
614 { MU, A, 0, 0, "(?:(?=a(b))?[^n][^n])+m", "ababcdabcdcdabnababcdabcdcdabm" },
615 { MU, A, 0, 0, "(?:(?=.(.))??\\1.)+m", "aabbbcbacccanaabbbcbacccam" },
616 { MU, A, 0, 0, "(?:(?=.)??[a-c])+m", "abacdcbacacdcaccam" },
617 { MU, A, 0, 0, "((?!a)?(?!([^a]))?)+$", "acbab" },
618 { MU, A, 0, 0, "((?!a)?\?(?!([^a]))?\?)+$", "acbab" },
619 { MU, A, 0, 0, "a(?=(?C)\\B(?C`x`))b", "ab" },
620 { MU, A, 0, 0, "a(?!(?C)\\B(?C`x`))bb|ab", "abb" },
621 { MU, A, 0, 0, "a(?=\\b|(?C)\\B(?C`x`))b", "ab" },
622 { MU, A, 0, 0, "a(?!\\b|(?C)\\B(?C`x`))bb|ab", "abb" },
623 { MU, A, 0, 0, "c(?(?=(?C)\\B(?C`x`))ab|a)", "cab" },
624 { MU, A, 0, 0, "c(?(?!(?C)\\B(?C`x`))ab|a)", "cab" },
625 { MU, A, 0, 0, "c(?(?=\\b|(?C)\\B(?C`x`))ab|a)", "cab" },
626 { MU, A, 0, 0, "c(?(?!\\b|(?C)\\B(?C`x`))ab|a)", "cab" },
627 { MU, A, 0, 0, "a(?=)b", "ab" },
628 { MU, A, 0, 0 | F_NOMATCH, "a(?!)b", "ab" },
631 { MU, A, PCRE2_NOTEMPTY, 0 | F_NOMATCH, "a*", "bcx" },
632 { MU, A, PCRE2_NOTEMPTY, 0, "a*", "bcaad" },
633 { MU, A, PCRE2_NOTEMPTY, 0, "a*?", "bcaad" },
634 { MU, A, PCRE2_NOTEMPTY_ATSTART, 0, "a*", "bcaad" },
635 { MU, A, 0, 0, "a(*ACCEPT)b", "ab" },
636 { MU, A, PCRE2_NOTEMPTY, 0 | F_NOMATCH, "a*(*ACCEPT)b", "bcx" },
637 { MU, A, PCRE2_NOTEMPTY, 0, "a*(*ACCEPT)b", "bcaad" },
638 { MU, A, PCRE2_NOTEMPTY, 0, "a*?(*ACCEPT)b", "bcaad" },
639 { MU, A, PCRE2_NOTEMPTY, 0 | F_NOMATCH, "(?:z|a*(*ACCEPT)b)", "bcx" },
640 { MU, A, PCRE2_NOTEMPTY, 0, "(?:z|a*(*ACCEPT)b)", "bcaad" },
641 { MU, A, PCRE2_NOTEMPTY, 0, "(?:z|a*?(*ACCEPT)b)", "bcaad" },
642 { MU, A, PCRE2_NOTEMPTY_ATSTART, 0, "a*(*ACCEPT)b", "bcx" },
643 { MU, A, PCRE2_NOTEMPTY_ATSTART, 0 | F_NOMATCH, "a*(*ACCEPT)b", "" },
644 { MU, A, 0, 0, "((a(*ACCEPT)b))", "ab" },
645 { MU, A, 0, 0, "(a(*FAIL)a|a)", "aaa" },
646 { MU, A, 0, 0, "(?=ab(*ACCEPT)b)a", "ab" },
647 { MU, A, 0, 0, "(?=(?:x|ab(*ACCEPT)b))", "ab" },
648 { MU, A, 0, 0, "(?=(a(b(*ACCEPT)b)))a", "ab" },
649 { MU, A, PCRE2_NOTEMPTY, 0, "(?=a*(*ACCEPT))c", "c" },
650 { MU, A, PCRE2_NOTEMPTY, 0 | F_NOMATCH, "(?=A)", "AB" },
653 { MU, A, 0, 0, "(?(?=(a))a|b)+k", "ababbalbbadabak" },
654 { MU, A, 0, 0, "(?(?!(b))a|b)+k", "ababbalbbadabak" },
655 { MU, A, 0, 0, "(?(?=a)a|b)+k", "ababbalbbadabak" },
656 { MU, A, 0, 0, "(?(?!b)a|b)+k", "ababbalbbadabak" },
657 { MU, A, 0, 0, "(?(?=(a))a*|b*)+k", "ababbalbbadabak" },
658 { MU, A, 0, 0, "(?(?!(b))a*|b*)+k", "ababbalbbadabak" },
659 …{ MU, A, 0, 0, "(?(?!(b))(?:aaaaaa|a)|(?:bbbbbb|b))+aaaak", "aaaaaaaaaaaaaa bbbbbbbbbbbbbbb aaaaaa…
660 …{ MU, A, 0, 0, "(?(?!b)(?:aaaaaa|a)|(?:bbbbbb|b))+aaaak", "aaaaaaaaaaaaaa bbbbbbbbbbbbbbb aaaaaaak…
661 …{ MU, A, 0, 0 | F_DIFF, "(?(?!(b))(?:aaaaaa|a)|(?:bbbbbb|b))+bbbbk", "aaaaaaaaaaaaaa bbbbbbbbbbbbb…
662 …{ MU, A, 0, 0, "(?(?!b)(?:aaaaaa|a)|(?:bbbbbb|b))+bbbbk", "aaaaaaaaaaaaaa bbbbbbbbbbbbbbb bbbbbbbk…
663 { MU, A, 0, 0, "(?(?=a)a*|b*)+k", "ababbalbbadabak" },
664 { MU, A, 0, 0, "(?(?!b)a*|b*)+k", "ababbalbbadabak" },
665 { MU, A, 0, 0, "(?(?=a)ab)", "a" },
666 { MU, A, 0, 0, "(?(?<!b)c)", "b" },
667 { MU, A, 0, 0, "(?(DEFINE)a(b))", "a" },
668 { MU, A, 0, 0, "a(?(DEFINE)(?:b|(?:c?)+)*)", "a" },
669 { MU, A, 0, 0, "(?(?=.[a-c])[k-l]|[A-D])", "kdB" },
670 { MU, A, 0, 0, "(?(?!.{0,4}[cd])(aa|bb)|(cc|dd))+", "aabbccddaa" },
671 { MU, A, 0, 0, "(?(?=[^#@]*@)(aaab|aa|aba)|(aba|aab)){3,}", "aaabaaaba#aaabaaaba#aaabaaaba@" },
672 { MU, A, 0, 0, "((?=\\w{5})\\w(?(?=\\w*k)\\d|[a-f_])*\\w\\s)+", "mol m10kk m088k _f_a_ mbkkl" },
673 { MU, A, 0, 0, "(c)?\?(?(1)a|b)", "cdcaa" },
674 { MU, A, 0, 0, "(c)?\?(?(1)a|b)", "cbb" },
675 { MU, A, 0, 0 | F_DIFF, "(?(?=(a))(aaaa|a?))+aak", "aaaaab aaaaak" },
676 { MU, A, 0, 0, "(?(?=a)(aaaa|a?))+aak", "aaaaab aaaaak" },
677 { MU, A, 0, 0, "(?(?!(b))(aaaa|a?))+aak", "aaaaab aaaaak" },
678 { MU, A, 0, 0, "(?(?!b)(aaaa|a?))+aak", "aaaaab aaaaak" },
679 { MU, A, 0, 0 | F_DIFF, "(?(?=(a))a*)+aak", "aaaaab aaaaak" },
680 { MU, A, 0, 0, "(?(?=a)a*)+aak", "aaaaab aaaaak" },
681 { MU, A, 0, 0, "(?(?!(b))a*)+aak", "aaaaab aaaaak" },
682 { MU, A, 0, 0, "(?(?!b)a*)+aak", "aaaaab aaaaak" },
683 …{ MU, A, 0, 0, "(?(?=(?=(?!(x))a)aa)aaa|(?(?=(?!y)bb)bbb))*k", "abaabbaaabbbaaabbb abaabbaaabbbaaa…
684 { MU, A, 0, 0, "(?P<Name>a)?(?P<Name2>b)?(?(Name)c|d)*l", "bc ddd abccabccl" },
685 { MU, A, 0, 0, "(?P<Name>a)?(?P<Name2>b)?(?(Name)c|d)+?dd", "bcabcacdb bdddd" },
686 { MU, A, 0, 0, "(?P<Name>a)?(?P<Name2>b)?(?(Name)c|d)+l", "ababccddabdbccd abcccl" },
687 { MU, A, 0, 0, "((?:a|aa)(?(1)aaa))x", "aax" },
688 { MU, A, 0, 0, "(?(?!)a|b)", "ab" },
689 { MU, A, 0, 0, "(?(?!)a)", "ab" },
690 { MU, A, 0, 0 | F_NOMATCH, "(?(?!)a|b)", "ac" },
693 { MU, A, 0, 0, "(?:\\Ka)*aaaab", "aaaaaaaa aaaaaaabb" },
694 { MU, A, 0, 0, "(?>\\Ka\\Ka)*aaaab", "aaaaaaaa aaaaaaaaaabb" },
695 { MU, A, 0, 0, "a+\\K(?<=\\Gaa)a", "aaaaaa" },
696 { MU, A, PCRE2_NOTEMPTY, 0 | F_NOMATCH, "a\\K(*ACCEPT)b", "aa" },
697 { MU, A, PCRE2_NOTEMPTY_ATSTART, 0, "a\\K(*ACCEPT)b", "aa" },
700 { MU | PCRE2_FIRSTLINE, A, 0, 0 | F_PROPERTY, "\\p{Any}a", "bb\naaa" },
701 { MU | PCRE2_FIRSTLINE, A, 0, 0 | F_NOMATCH | F_PROPERTY, "\\p{Any}a", "bb\r\naaa" },
702 { MU | PCRE2_FIRSTLINE, A, 0, 0, "(?<=a)", "a" },
703 { MU | PCRE2_FIRSTLINE, A, 0, 0 | F_NOMATCH, "[^a][^b]", "ab" },
704 { MU | PCRE2_FIRSTLINE, A, 0, 0 | F_NOMATCH, "a", "\na" },
705 { MU | PCRE2_FIRSTLINE, A, 0, 0 | F_NOMATCH, "[abc]", "\na" },
706 { MU | PCRE2_FIRSTLINE, A, 0, 0 | F_NOMATCH, "^a", "\na" },
707 { MU | PCRE2_FIRSTLINE, A, 0, 0 | F_NOMATCH, "^(?<=\n)", "\na" },
708 { MU | PCRE2_FIRSTLINE, A, 0, 0, "\xf0\x90\x90\x80", "\xf0\x90\x90\x80" },
709 { MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_ANY, 0, 0 | F_NOMATCH, "#", "\xc2\x85#" },
710 { M | PCRE2_FIRSTLINE, PCRE2_NEWLINE_ANY, 0, 0 | F_NOMATCH, "#", "\x85#" },
711 { MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_ANY, 0, 0 | F_NOMATCH, "^#", "\xe2\x80\xa8#" },
712 { MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_CRLF, 0, 0 | F_PROPERTY, "\\p{Any}", "\r\na" },
713 { MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_CRLF, 0, 0, ".", "\r" },
714 { MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_CRLF, 0, 0, "a", "\ra" },
715 { MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_CRLF, 0, 0 | F_NOMATCH, "ba", "bbb\r\nba" },
716 …{ MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_CRLF, 0, 0 | F_NOMATCH | F_PROPERTY, "\\p{Any}{4}|a", "\r\na…
717 { MU | PCRE2_FIRSTLINE, PCRE2_NEWLINE_CRLF, 0, 1, ".", "\r\n" },
718 { PCRE2_FIRSTLINE | PCRE2_DOTALL, PCRE2_NEWLINE_LF, 0, 0 | F_NOMATCH, "ab.", "ab" },
719 { MU | PCRE2_FIRSTLINE, A, 0, 1 | F_NOMATCH, "^[a-d0-9]", "\nxx\nd" },
720 { PCRE2_FIRSTLINE | PCRE2_DOTALL, PCRE2_NEWLINE_ANY, 0, 0, "....a", "012\n0a" },
721 { MU | PCRE2_FIRSTLINE, A, 0, 0, "[aC]", "a" },
724 { MU, A, 0, 0, "(a)(?1)", "aa" },
725 { MU, A, 0, 0, "((a))(?1)", "aa" },
726 { MU, A, 0, 0, "(b|a)(?1)", "aa" },
727 { MU, A, 0, 0, "(b|(a))(?1)", "aa" },
728 { MU, A, 0, 0 | F_NOMATCH, "((a)(b)(?:a*))(?1)", "aba" },
729 { MU, A, 0, 0, "((a)(b)(?:a*))(?1)", "abab" },
730 { MU, A, 0, 0, "((a+)c(?2))b(?1)", "aacaabaca" },
731 { MU, A, 0, 0, "((?2)b|(a)){2}(?1)", "aabab" },
732 { MU, A, 0, 0, "(?1)(a)*+(?2)(b(?1))", "aababa" },
733 { MU, A, 0, 0, "(?1)(((a(*ACCEPT)))b)", "axaa" },
734 { MU, A, 0, 0, "(?1)(?(DEFINE) (((ac(*ACCEPT)))b) )", "akaac" },
735 { MU, A, 0, 0, "(a+)b(?1)b\\1", "abaaabaaaaa" },
736 { MU, A, 0, 0, "(?(DEFINE)(aa|a))(?1)ab", "aab" },
737 { MU, A, 0, 0, "(?(DEFINE)(a\\Kb))(?1)+ababc", "abababxabababc" },
738 { MU, A, 0, 0, "(a\\Kb)(?1)+ababc", "abababxababababc" },
739 { MU, A, 0, 0 | F_NOMATCH, "(a\\Kb)(?1)+ababc", "abababxababababxc" },
740 { MU, A, 0, 0, "b|<(?R)*>", "<<b>" },
741 { MU, A, 0, 0, "(a\\K){0}(?:(?1)b|ac)", "ac" },
742 { MU, A, 0, 0, "(?(DEFINE)(a(?2)|b)(b(?1)|(a)))(?:(?1)|(?2))m", "ababababnababababaam" },
743 { MU, A, 0, 0, "(a)((?(R)a|b))(?2)", "aabbabaa" },
744 { MU, A, 0, 0, "(a)((?(R2)a|b))(?2)", "aabbabaa" },
745 { MU, A, 0, 0, "(a)((?(R1)a|b))(?2)", "ababba" },
746 { MU, A, 0, 0, "(?(R0)aa|bb(?R))", "abba aabb bbaa" },
747 { MU, A, 0, 0, "((?(R)(?:aaaa|a)|(?:(aaaa)|(a)))+)(?1)$", "aaaaaaaaaa aaaa" },
748 { MU, A, 0, 0, "(?P<Name>a(?(R&Name)a|b))(?1)", "aab abb abaa" },
749 { MU, A, 0, 0, "((?(R)a|(?1)){3})", "XaaaaaaaaaX" },
750 { MU, A, 0, 0, "((?:(?(R)a|(?1))){3})", "XaaaaaaaaaX" },
751 { MU, A, 0, 0, "((?(R)a|(?1)){1,3})aaaaaa", "aaaaaaaaXaaaaaaaaa" },
752 { MU, A, 0, 0, "((?(R)a|(?1)){1,3}?)M", "aaaM" },
753 { MU, A, 0, 0, "((.)(?:.|\\2(?1))){0}#(?1)#", "#aabbccdde# #aabbccddee#" },
754 { MU, A, 0, 0, "((.)(?:\\2|\\2{4}b)){0}#(?:(?1))+#", "#aaaab# #aaaaab#" },
755 { MU, A, 0, 0 | F_NOMATCH, "(?1)$((.|\\2xx){1,2})", "abc" },
758 { CM, A, 0, 0 | F_FORCECONV, "\xc3\xa1", "\xc3\x81\xc3\xa1" },
759 { CM, A, 0, 0 | F_FORCECONV, "\xe1\xbd\xb8", "\xe1\xbf\xb8\xe1\xbd\xb8" },
760 { CM, A, 0, 0 | F_FORCECONV, "[\xc3\xa1]", "\xc3\x81\xc3\xa1" },
761 { CM, A, 0, 0 | F_FORCECONV, "[\xe1\xbd\xb8]", "\xe1\xbf\xb8\xe1\xbd\xb8" },
762 { CM, A, 0, 0 | F_FORCECONV, "[a-\xed\xb0\x80]", "A" },
763 { CM, A, 0, 0 | F_NO8 | F_FORCECONV, "[a-\\x{dc00}]", "B" },
764 { CM, A, 0, 0 | F_NO8 | F_NOMATCH | F_FORCECONV, "[b-\\x{dc00}]", "a" },
765 …{ CM, A, 0, 0 | F_NO8 | F_FORCECONV, "\xed\xa0\x80\\x{d800}\xed\xb0\x80\\x{dc00}", "\xed\xa0\x80\x…
766 …{ CM, A, 0, 0 | F_NO8 | F_FORCECONV, "[\xed\xa0\x80\\x{d800}]{1,2}?[\xed\xb0\x80\\x{dc00}]{1,2}?#"…
767 …{ CM, A, 0, 0 | F_FORCECONV, "[\xed\xa0\x80\xed\xb0\x80#]{0,3}(?<=\xed\xb0\x80.)", "\xed\xa0\x80#\…
768 { CM, A, 0, 0 | F_FORCECONV, "[\xed\xa0\x80-\xed\xb3\xbf]", "\xed\x9f\xbf\xed\xa0\x83" },
769 { CM, A, 0, 0 | F_FORCECONV, "[\xed\xa0\x80-\xed\xb3\xbf]", "\xed\xb4\x80\xed\xb3\xb0" },
770 { CM, A, 0, 0 | F_NO8 | F_FORCECONV, "[\\x{d800}-\\x{dcff}]", "\xed\x9f\xbf\xed\xa0\x83" },
771 { CM, A, 0, 0 | F_NO8 | F_FORCECONV, "[\\x{d800}-\\x{dcff}]", "\xed\xb4\x80\xed\xb3\xb0" },
772 …{ CM, A, 0, 0 | F_FORCECONV, "[\xed\xa0\x80-\xef\xbf\xbf]+[\x1-\xed\xb0\x80]+#", "\xed\xa0\x85\xc3…
773 …{ CM, A, 0, 0 | F_FORCECONV, "[\xed\xa0\x80][\xed\xb0\x80]{2,}", "\xed\xa0\x80\xed\xb0\x80\xed\xa0…
774 …{ M, A, 0, 0 | F_FORCECONV, "[^\xed\xb0\x80]{3,}?", "##\xed\xb0\x80#\xed\xb0\x80#\xc3\x89#\xed\xb0…
775 …{ M, A, 0, 0 | F_NO8 | F_FORCECONV, "[^\\x{dc00}]{3,}?", "##\xed\xb0\x80#\xed\xb0\x80#\xc3\x89#\xe…
776 { CM, A, 0, 0 | F_FORCECONV, ".\\B.", "\xed\xa0\x80\xed\xb0\x80" },
777 …{ CM, A, 0, 0 | F_FORCECONV, "\\D+(?:\\d+|.)\\S+(?:\\s+|.)\\W+(?:\\w+|.)\xed\xa0\x80\xed\xa0\x80",…
778 { CM, A, 0, 0 | F_FORCECONV, "\\d*\\s*\\w*\xed\xa0\x80\xed\xa0\x80", "\xed\xa0\x80\xed\xa0\x80" },
779 …{ CM, A, 0, 0 | F_FORCECONV | F_NOMATCH, "\\d*?\\D*?\\s*?\\S*?\\w*?\\W*?##", "\xed\xa0\x80\xed\xa0…
780 …{ CM | PCRE2_EXTENDED, A, 0, 0 | F_FORCECONV, "\xed\xa0\x80 \xed\xb0\x80 !", "\xed\xa0\x80\xed\xb0…
781 { CM, A, 0, 0 | F_FORCECONV, "\xed\xa0\x80+#[^#]+\xed\xa0\x80", "\xed\xa0\x80#a\xed\xa0\x80" },
782 …{ CM, A, 0, 0 | F_FORCECONV, "(\xed\xa0\x80+)#\\1", "\xed\xa0\x80\xed\xa0\x80#\xed\xa0\x80\xed\xa0…
783 { M, PCRE2_NEWLINE_ANY, 0, 0 | F_NO8 | F_FORCECONV, "^-", "a--\xe2\x80\xa8--" },
784 { 0, BSR(PCRE2_BSR_UNICODE), 0, 0 | F_NO8 | F_FORCECONV, "\\R", "ab\xe2\x80\xa8" },
785 { 0, 0, 0, 0 | F_NO8 | F_FORCECONV, "\\v", "ab\xe2\x80\xa9" },
786 { 0, 0, 0, 0 | F_NO8 | F_FORCECONV, "\\h", "ab\xe1\xa0\x8e" },
787 …{ 0, 0, 0, 0 | F_NO8 | F_FORCECONV, "\\v+?\\V+?#", "\xe2\x80\xa9\xe2\x80\xa9\xef\xbf\xbf\xef\xbf\x…
788 …{ 0, 0, 0, 0 | F_NO8 | F_FORCECONV, "\\h+?\\H+?#", "\xe1\xa0\x8e\xe1\xa0\x8e\xef\xbf\xbf\xef\xbf\x…
791 { MU, A, PCRE2_PARTIAL_SOFT, 0, "ab", "a" },
792 { MU, A, PCRE2_PARTIAL_SOFT, 0, "ab|a", "a" },
793 { MU, A, PCRE2_PARTIAL_HARD, 0, "ab|a", "a" },
794 { MU, A, PCRE2_PARTIAL_SOFT, 0, "\\b#", "a" },
795 { MU, A, PCRE2_PARTIAL_SOFT, 0, "(?<=a)b", "a" },
796 { MU, A, PCRE2_PARTIAL_SOFT, 0, "abc|(?<=xxa)bc", "xxab" },
797 { MU, A, PCRE2_PARTIAL_SOFT, 0, "a\\B", "a" },
798 { MU, A, PCRE2_PARTIAL_HARD, 0, "a\\b", "a" },
801 { MU, A, 0, 0, "a(*MARK:aa)a", "ababaa" },
802 { MU, A, 0, 0 | F_NOMATCH, "a(*:aa)a", "abab" },
803 { MU, A, 0, 0, "a(*:aa)(b(*:bb)b|bc)", "abc" },
804 { MU, A, 0, 0 | F_NOMATCH, "a(*:1)x|b(*:2)y", "abc" },
805 { MU, A, 0, 0, "(?>a(*:aa))b|ac", "ac" },
806 { MU, A, 0, 0, "(?(DEFINE)(a(*:aa)))(?1)", "a" },
807 { MU, A, 0, 0 | F_NOMATCH, "(?(DEFINE)((a)(*:aa)))(?1)b", "aa" },
808 { MU, A, 0, 0, "(?(DEFINE)(a(*:aa)))a(?1)b|aac", "aac" },
809 { MU, A, 0, 0, "(a(*:aa)){0}(?:b(?1)b|c)+c", "babbab cc" },
810 { MU, A, 0, 0, "(a(*:aa)){0}(?:b(?1)b)+", "babba" },
811 { MU, A, 0, 0 | F_NOMATCH, "(a(*:aa)){0}(?:b(?1)b)+", "ba" },
812 { MU, A, 0, 0, "(a\\K(*:aa)){0}(?:b(?1)b|c)+c", "babbab cc" },
813 { MU, A, 0, 0, "(a\\K(*:aa)){0}(?:b(?1)b)+", "babba" },
814 { MU, A, 0, 0 | F_NOMATCH, "(a\\K(*:aa)){0}(?:b(?1)b)+", "ba" },
815 { MU, A, 0, 0 | F_NOMATCH, "(*:mark)m", "a" },
818 { MU, A, 0, 0 | F_NOMATCH, "a(*COMMIT)b", "ac" },
819 { MU, A, 0, 0, "aa(*COMMIT)b", "xaxaab" },
820 { MU, A, 0, 0 | F_NOMATCH, "a(*COMMIT)(*:msg)b|ac", "ac" },
821 { MU, A, 0, 0 | F_NOMATCH, "(a(*COMMIT)b)++", "abac" },
822 { MU, A, 0, 0 | F_NOMATCH, "((a)(*COMMIT)b)++", "abac" },
823 { MU, A, 0, 0 | F_NOMATCH, "(?=a(*COMMIT)b)ab|ad", "ad" },
826 { MU, A, 0, 0, "aa\\K(*PRUNE)b", "aaab" },
827 { MU, A, 0, 0, "aa(*PRUNE:bb)b|a", "aa" },
828 { MU, A, 0, 0, "(a)(a)(*PRUNE)b|(a)", "aa" },
829 { MU, A, 0, 0, "(a)(a)(a)(a)(a)(a)(a)(a)(*PRUNE)b|(a)", "aaaaaaaa" },
830 { MU, A, PCRE2_PARTIAL_SOFT, 0, "a(*PRUNE)a|", "a" },
831 { MU, A, PCRE2_PARTIAL_SOFT, 0, "a(*PRUNE)a|m", "a" },
832 { MU, A, 0, 0 | F_NOMATCH, "(?=a(*PRUNE)b)ab|ad", "ad" },
833 { MU, A, 0, 0, "a(*COMMIT)(*PRUNE)d|bc", "abc" },
834 { MU, A, 0, 0, "(?=a(*COMMIT)b)a(*PRUNE)c|bc", "abc" },
835 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?=a(*COMMIT)b)a(*PRUNE)c|bc", "abc" },
836 { MU, A, 0, 0, "(?=(a)(*COMMIT)b)a(*PRUNE)c|bc", "abc" },
837 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?=(a)(*COMMIT)b)a(*PRUNE)c|bc", "abc" },
838 { MU, A, 0, 0, "(a(*COMMIT)b){0}a(?1)(*PRUNE)c|bc", "abc" },
839 { MU, A, 0, 0 | F_NOMATCH, "(a(*COMMIT)b){0}a(*COMMIT)(?1)(*PRUNE)c|bc", "abc" },
840 { MU, A, 0, 0, "(a(*COMMIT)b)++(*PRUNE)d|c", "ababc" },
841 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(a(*COMMIT)b)++(*PRUNE)d|c", "ababc" },
842 { MU, A, 0, 0, "((a)(*COMMIT)b)++(*PRUNE)d|c", "ababc" },
843 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)((a)(*COMMIT)b)++(*PRUNE)d|c", "ababc" },
844 { MU, A, 0, 0, "(?>a(*COMMIT)b)*abab(*PRUNE)d|ba", "ababab" },
845 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?>a(*COMMIT)b)*abab(*PRUNE)d|ba", "ababab" },
846 { MU, A, 0, 0, "(?>a(*COMMIT)b)+abab(*PRUNE)d|ba", "ababab" },
847 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?>a(*COMMIT)b)+abab(*PRUNE)d|ba", "ababab" },
848 { MU, A, 0, 0, "(?>a(*COMMIT)b)?ab(*PRUNE)d|ba", "aba" },
849 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?>a(*COMMIT)b)?ab(*PRUNE)d|ba", "aba" },
850 { MU, A, 0, 0, "(?>a(*COMMIT)b)*?n(*PRUNE)d|ba", "abababn" },
851 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?>a(*COMMIT)b)*?n(*PRUNE)d|ba", "abababn" },
852 { MU, A, 0, 0, "(?>a(*COMMIT)b)+?n(*PRUNE)d|ba", "abababn" },
853 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?>a(*COMMIT)b)+?n(*PRUNE)d|ba", "abababn" },
854 { MU, A, 0, 0, "(?>a(*COMMIT)b)??n(*PRUNE)d|bn", "abn" },
855 { MU, A, 0, 0 | F_NOMATCH, "(*COMMIT)(?>a(*COMMIT)b)??n(*PRUNE)d|bn", "abn" },
858 { MU, A, 0, 0 | F_NOMATCH, "(?=a(*SKIP)b)ab|ad", "ad" },
859 { MU, A, 0, 0, "(\\w+(*SKIP)#)", "abcd,xyz#," },
860 { MU, A, 0, 0, "\\w+(*SKIP)#|mm", "abcd,xyz#," },
861 { MU, A, 0, 0 | F_NOMATCH, "b+(?<=(*SKIP)#c)|b+", "#bbb" },
864 { MU, A, 0, 0, "((?:a(*THEN)|aab)(*THEN)c|a+)+m", "aabcaabcaabcaabcnacm" },
865 { MU, A, 0, 0 | F_NOMATCH, "((?:a(*THEN)|aab)(*THEN)c|a+)+m", "aabcm" },
866 { MU, A, 0, 0, "((?:a(*THEN)|aab)c|a+)+m", "aabcaabcnmaabcaabcm" },
867 { MU, A, 0, 0, "((?:a|aab)(*THEN)c|a+)+m", "aam" },
868 { MU, A, 0, 0, "((?:a(*COMMIT)|aab)(*THEN)c|a+)+m", "aam" },
869 { MU, A, 0, 0, "(?(?=a(*THEN)b)ab|ad)", "ad" },
870 { MU, A, 0, 0, "(?(?!a(*THEN)b)ad|add)", "add" },
871 { MU, A, 0, 0 | F_NOMATCH, "(?(?=a)a(*THEN)b|ad)", "ad" },
872 { MU, A, 0, 0, "(?!(?(?=a)ab|b(*THEN)d))bn|bnn", "bnn" },
873 { MU, A, 0, 0, "(?=(*THEN: ))* ", " " },
874 { MU, A, 0, 0, "a(*THEN)(?R) |", "a" },
877 { MU, A, 0, 0, "(a(*ACCEPT)b){0}a(?1)b", "aacaabb" },
878 { MU, A, 0, 0, "((a)\\2(*ACCEPT)b){0}a(?1)b", "aaacaaabb" },
879 { MU, A, 0, 0, "((ab|a(*ACCEPT)x)+|ababababax){0}_(?1)_", "_ababababax_ _ababababa_" },
880 { MU, A, 0, 0, "((.)(?:A(*ACCEPT)|(?1)\\2)){0}_(?1)_", "_bcdaAdcb_bcdaAdcb_" },
881 { MU, A, 0, 0, "((*MARK:m)(?:a|a(*COMMIT)b|aa)){0}_(?1)_", "_ab_" },
882 { MU, A, 0, 0, "((*MARK:m)(?:a|a(*COMMIT)b|aa)){0}_(?1)_|(_aa_)", "_aa_" },
883 …{ MU, A, 0, 0, "(a(*COMMIT)(?:b|bb)|c(*ACCEPT)d|dd){0}_(?1)+_", "_ax_ _cd_ _abbb_ _abcd_ _abbcdd_"…
884 …{ MU, A, 0, 0, "((.)(?:.|(*COMMIT)\\2{3}(*ACCEPT).*|.*)){0}_(?1){0,4}_", "_aaaabbbbccccddd_ _aaaab…
888 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)*#", "!abcdefghijklmno!abcdefghijklmno!abcdef#" },
889 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)+#", "!abcdefghijklmno!abcdefghijklmno!abcdef#" },
890 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)*?#", "!abcdefghijklmno!abcdefghijklmno!abcdef#" },
891 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)+?#", "!abcdefghijklmno!abcdefghijklmno!abcdef#" },
892 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)*+#", "!abcdefghijklmno!abcdefghijklmno!abcdef#" },
893 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)++#", "!abcdefghijklmno!abcdefghijklmno!abcdef#" },
894 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)?#", "!ab!abc!ab!ab#" },
895 { MU, A, 0, 0, "!(*sr:\\w\\w|\\w\\w\\w)??#", "!ab!abc!ab!ab#" },
899 { MU, A, 0, 0, "((((?:(?:(?:\\w)+)?)*|(?>\\w)+?)+|(?>\\w)?\?)*)?\\s", "aaaaa+ " },
900 { MU, A, 0, 0, "(?:((?:(?:(?:\\w*?)+)??|(?>\\w)?|\\w*+)*)+)+?\\s", "aa+ " },
901 { MU, A, 0, 0, "((a?)+)+b", "aaaaaaaaaaaa b" },
904 …{ M, A, 0, 0 | F_NOMATCH, "a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?a?aaaaaaaaaaaaaaaaaaaaaaa…
905 { M, A, 0, 0 | F_NOMATCH, "(?:a+)+b", "aaaaaaaaaaaaaaaaaaaaaaaa b" },
906 { M, A, 0, 0 | F_NOMATCH, "(?:a+?)+?b", "aaaaaaaaaaaaaaaaaaaaaaaa b" },
907 { M, A, 0, 0 | F_NOMATCH, "(?:a*)*b", "aaaaaaaaaaaaaaaaaaaaaaaa b" },
908 { M, A, 0, 0 | F_NOMATCH, "(?:a*?)*?b", "aaaaaaaaaaaaaaaaaaaaaaaa b" },
910 { 0, 0, 0, 0, NULL, NULL }
1011 if (max_length == 0) in convert_utf8_to_utf16()
1012 return 0; in convert_utf8_to_utf16()
1015 c = 0; in convert_utf8_to_utf16()
1019 if (*iptr < 0xc0) in convert_utf8_to_utf16()
1021 else if (!(*iptr & 0x20)) { in convert_utf8_to_utf16()
1022 c = ((iptr[0] & 0x1f) << 6) | (iptr[1] & 0x3f); in convert_utf8_to_utf16()
1024 } else if (!(*iptr & 0x10)) { in convert_utf8_to_utf16()
1025 c = ((iptr[0] & 0x0f) << 12) | ((iptr[1] & 0x3f) << 6) | (iptr[2] & 0x3f); in convert_utf8_to_utf16()
1027 } else if (!(*iptr & 0x08)) { in convert_utf8_to_utf16()
1028 …c = ((iptr[0] & 0x07) << 18) | ((iptr[1] & 0x3f) << 12) | ((iptr[2] & 0x3f) << 6) | (iptr[3] & 0x3… in convert_utf8_to_utf16()
1036 *optr = '\0'; in convert_utf8_to_utf16()
1039 c -= 0x10000; in convert_utf8_to_utf16()
1040 *optr++ = 0xd800 | ((c >> 10) & 0x3ff); in convert_utf8_to_utf16()
1041 *optr++ = 0xdc00 | (c & 0x3ff); in convert_utf8_to_utf16()
1049 *optr = '\0'; in convert_utf8_to_utf16()
1058 if (max_length == 0) in copy_char8_to_char16()
1059 return 0; in copy_char8_to_char16()
1065 *optr = '\0'; in copy_char8_to_char16()
1083 if (max_length == 0) in convert_utf8_to_utf32()
1084 return 0; in convert_utf8_to_utf32()
1087 c = 0; in convert_utf8_to_utf32()
1091 if (*iptr < 0xc0) in convert_utf8_to_utf32()
1093 else if (!(*iptr & 0x20)) { in convert_utf8_to_utf32()
1094 c = ((iptr[0] & 0x1f) << 6) | (iptr[1] & 0x3f); in convert_utf8_to_utf32()
1096 } else if (!(*iptr & 0x10)) { in convert_utf8_to_utf32()
1097 c = ((iptr[0] & 0x0f) << 12) | ((iptr[1] & 0x3f) << 6) | (iptr[2] & 0x3f); in convert_utf8_to_utf32()
1099 } else if (!(*iptr & 0x08)) { in convert_utf8_to_utf32()
1100 …c = ((iptr[0] & 0x07) << 18) | ((iptr[1] & 0x3f) << 12) | ((iptr[2] & 0x3f) << 6) | (iptr[3] & 0x3… in convert_utf8_to_utf32()
1109 *optr = 0; in convert_utf8_to_utf32()
1118 if (max_length == 0) in copy_char8_to_char32()
1119 return 0; in copy_char8_to_char32()
1125 *optr = '\0'; in copy_char8_to_char32()
1140 return 0; in check_ascii()
1155 int total = 0; in regression_tests()
1156 int successful = 0; in regression_tests()
1157 int successful_row = 0; in regression_tests()
1158 int counter = 0; in regression_tests()
1160 int utf = 0; in regression_tests()
1161 int disabled_options = 0; in regression_tests()
1221 for (i = 0; cpu_info[i]; i++) in regression_tests()
1248 is_ascii = 0; in regression_tests()
1258 error = 0; in regression_tests()
1337 if ((counter & 0x3) != 0) { in regression_tests()
1350 return_value8[0] = -1000; in regression_tests()
1365 for (i = 0; i < OVECTOR_SIZE * 2; ++i) in regression_tests()
1367 for (i = 0; i < OVECTOR_SIZE * 2; ++i) in regression_tests()
1377 } else if ((counter & 0x1) != 0) { in regression_tests()
1379 return_value8[0] = pcre2_match_8(re8, (PCRE2_SPTR8)current->input, strlen(current->input), in regression_tests()
1383 return_value8[0] = pcre2_jit_match_8(re8, (PCRE2_SPTR8)current->input, strlen(current->input), in regression_tests()
1390 return_value16[0] = -1000; in regression_tests()
1405 for (i = 0; i < OVECTOR_SIZE * 2; ++i) in regression_tests()
1407 for (i = 0; i < OVECTOR_SIZE * 2; ++i) in regression_tests()
1422 } else if ((counter & 0x1) != 0) { in regression_tests()
1424 return_value16[0] = pcre2_match_16(re16, regtest_buf16, length16, in regression_tests()
1428 return_value16[0] = pcre2_jit_match_16(re16, regtest_buf16, length16, in regression_tests()
1435 return_value32[0] = -1000; in regression_tests()
1450 for (i = 0; i < OVECTOR_SIZE * 2; ++i) in regression_tests()
1452 for (i = 0; i < OVECTOR_SIZE * 2; ++i) in regression_tests()
1467 } else if ((counter & 0x1) != 0) { in regression_tests()
1469 return_value32[0] = pcre2_match_32(re32, regtest_buf32, length32, in regression_tests()
1473 return_value32[0] = pcre2_jit_match_32(re32, regtest_buf32, length32, in regression_tests()
1480 return_value8[0], return_value16[0], return_value32[0], in regression_tests()
1481 (int)ovector8_1[0], (int)ovector8_1[1], in regression_tests()
1482 (int)ovector16_1[0], (int)ovector16_1[1], in regression_tests()
1483 (int)ovector32_1[0], (int)ovector32_1[1], in regression_tests()
1496 if ((return_value = return_value8[0]) != return_value8[1]) { in regression_tests()
1498 return_value8[0], return_value8[1], total, current->pattern, current->input); in regression_tests()
1499 is_successful = 0; in regression_tests()
1503 if ((return_value = return_value16[0]) != return_value16[1]) { in regression_tests()
1505 return_value16[0], return_value16[1], total, current->pattern, current->input); in regression_tests()
1506 is_successful = 0; in regression_tests()
1510 if ((return_value = return_value32[0]) != return_value32[1]) { in regression_tests()
1512 return_value32[0], return_value32[1], total, current->pattern, current->input); in regression_tests()
1513 is_successful = 0; in regression_tests()
1517 if (return_value8[0] != return_value16[0]) { in regression_tests()
1519 return_value8[0], return_value16[0], in regression_tests()
1521 is_successful = 0; in regression_tests()
1525 if (return_value8[0] != return_value32[0]) { in regression_tests()
1527 return_value8[0], return_value32[0], in regression_tests()
1529 is_successful = 0; in regression_tests()
1533 if (return_value16[0] != return_value32[0]) { in regression_tests()
1535 return_value16[0], return_value32[0], in regression_tests()
1537 is_successful = 0; in regression_tests()
1540 if (return_value >= 0 || return_value == PCRE2_ERROR_PARTIAL) { in regression_tests()
1547 return_value8[0] = return_value; in regression_tests()
1550 return_value16[0] = return_value; in regression_tests()
1553 return_value32[0] = return_value; in regression_tests()
1558 for (i = 0; i < return_value; ++i) { in regression_tests()
1566 for (i = 0; i < return_value; ++i) { in regression_tests()
1575 for (i = 0; i < return_value; ++i) { in regression_tests()
1581 is_successful = 0; in regression_tests()
1589 is_successful = 0; in regression_tests()
1597 is_successful = 0; in regression_tests()
1606 if (return_value8[0] != return_value8[1]) { in regression_tests()
1608 return_value8[0], return_value8[1], total, current->pattern, current->input); in regression_tests()
1609 is_successful = 0; in regression_tests()
1610 } else if (return_value8[0] >= 0 || return_value8[0] == PCRE2_ERROR_PARTIAL) { in regression_tests()
1611 if (return_value8[0] == PCRE2_ERROR_PARTIAL) in regression_tests()
1612 return_value8[0] = 2; in regression_tests()
1614 return_value8[0] *= 2; in regression_tests()
1616 for (i = 0; i < return_value8[0]; ++i) in regression_tests()
1620 is_successful = 0; in regression_tests()
1626 if (return_value16[0] != return_value16[1]) { in regression_tests()
1628 return_value16[0], return_value16[1], total, current->pattern, current->input); in regression_tests()
1629 is_successful = 0; in regression_tests()
1630 } else if (return_value16[0] >= 0 || return_value16[0] == PCRE2_ERROR_PARTIAL) { in regression_tests()
1631 if (return_value16[0] == PCRE2_ERROR_PARTIAL) in regression_tests()
1632 return_value16[0] = 2; in regression_tests()
1634 return_value16[0] *= 2; in regression_tests()
1636 for (i = 0; i < return_value16[0]; ++i) in regression_tests()
1640 is_successful = 0; in regression_tests()
1646 if (return_value32[0] != return_value32[1]) { in regression_tests()
1648 return_value32[0], return_value32[1], total, current->pattern, current->input); in regression_tests()
1649 is_successful = 0; in regression_tests()
1650 } else if (return_value32[0] >= 0 || return_value32[0] == PCRE2_ERROR_PARTIAL) { in regression_tests()
1651 if (return_value32[0] == PCRE2_ERROR_PARTIAL) in regression_tests()
1652 return_value32[0] = 2; in regression_tests()
1654 return_value32[0] *= 2; in regression_tests()
1656 for (i = 0; i < return_value32[0]; ++i) in regression_tests()
1660 is_successful = 0; in regression_tests()
1670 if (return_value8[0] < 0 && !(current->start_offset & F_NOMATCH)) { in regression_tests()
1673 is_successful = 0; in regression_tests()
1676 if (return_value8[0] >= 0 && (current->start_offset & F_NOMATCH)) { in regression_tests()
1679 is_successful = 0; in regression_tests()
1685 if (return_value16[0] < 0 && !(current->start_offset & F_NOMATCH)) { in regression_tests()
1688 is_successful = 0; in regression_tests()
1691 if (return_value16[0] >= 0 && (current->start_offset & F_NOMATCH)) { in regression_tests()
1694 is_successful = 0; in regression_tests()
1700 if (return_value32[0] < 0 && !(current->start_offset & F_NOMATCH)) { in regression_tests()
1703 is_successful = 0; in regression_tests()
1706 if (return_value32[0] >= 0 && (current->start_offset & F_NOMATCH)) { in regression_tests()
1709 is_successful = 0; in regression_tests()
1720 is_successful = 0; in regression_tests()
1727 is_successful = 0; in regression_tests()
1734 is_successful = 0; in regression_tests()
1763 successful_row = 0; in regression_tests()
1767 successful_row = 0; in regression_tests()
1784 return 0; in regression_tests()
1796 if (match_start < 0) { in check_invalid_utf_result()
1801 return 0; in check_invalid_utf_result()
1804 if (result <= 0) { in check_invalid_utf_result()
1805 printf("Pattern[%d] %s result (%d) is not greater than 0.\n", pattern_index, type, result); in check_invalid_utf_result()
1809 if (ovector[0] != (PCRE2_SIZE)match_start) { in check_invalid_utf_result()
1810 printf("Pattern[%d] %s ovector[0] is unexpected (%d instead of %d)\n", in check_invalid_utf_result()
1811 pattern_index, type, (int)ovector[0], match_start); in check_invalid_utf_result()
1821 return 0; in check_invalid_utf_result()
1847 { UDA, CI, 0, 0, 0, 0, 4, { ".", NULL }, "\xf4\x8f\xbf\xbf" },
1848 { UDA, CI, 0, 0, 0, 0, 4, { ".", NULL }, "\xf0\x90\x80\x80" },
1849 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xf4\x90\x80\x80" },
1850 { UDA, CI, 0, 0, 1, -1, -1, { ".", NULL }, "\xf4\x8f\xbf\xbf" },
1851 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xf0\x90\x80\x7f" },
1852 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xf0\x90\x80\xc0" },
1853 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xf0\x8f\xbf\xbf" },
1854 { UDA, CI, 0, 0, 0, 0, 3, { ".", NULL }, "\xef\xbf\xbf#" },
1855 { UDA, CI, 0, 0, 0, 0, 3, { ".", NULL }, "\xef\xbf\xbf" },
1856 { UDA, CI, 0, 0, 0, 0, 3, { ".", NULL }, "\xe0\xa0\x80#" },
1857 { UDA, CI, 0, 0, 0, 0, 3, { ".", NULL }, "\xe0\xa0\x80" },
1858 { UDA, CI, 0, 0, 2, -1, -1, { ".", NULL }, "\xef\xbf\xbf#" },
1859 { UDA, CI, 0, 0, 1, -1, -1, { ".", NULL }, "\xef\xbf\xbf" },
1860 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xef\xbf\x7f#" },
1861 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xef\xbf\xc0" },
1862 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xe0\x9f\xbf#" },
1863 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xe0\x9f\xbf" },
1864 { UDA, CI, 0, 0, 0, 0, 3, { ".", NULL }, "\xed\x9f\xbf#" },
1865 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xed\xa0\x80#" },
1866 { UDA, CI, 0, 0, 0, 0, 3, { ".", NULL }, "\xee\x80\x80#" },
1867 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xed\xbf\xbf#" },
1868 { UDA, CI, 0, 0, 0, 0, 2, { ".", NULL }, "\xdf\xbf##" },
1869 { UDA, CI, 0, 0, 0, 0, 2, { ".", NULL }, "\xdf\xbf#" },
1870 { UDA, CI, 0, 0, 0, 0, 2, { ".", NULL }, "\xdf\xbf" },
1871 { UDA, CI, 0, 0, 0, 0, 2, { ".", NULL }, "\xc2\x80##" },
1872 { UDA, CI, 0, 0, 0, 0, 2, { ".", NULL }, "\xc2\x80#" },
1873 { UDA, CI, 0, 0, 0, 0, 2, { ".", NULL }, "\xc2\x80" },
1874 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xe0\x80##" },
1875 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xdf\xc0##" },
1876 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xe0\x80" },
1877 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xdf\xc0" },
1878 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xc1\xbf##" },
1879 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xc1\xbf" },
1880 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\x80###" },
1881 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\x80" },
1882 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xf8###" },
1883 { UDA, CI, 0, 0, 0, -1, -1, { ".", NULL }, "\xf8" },
1884 { UDA, CI, 0, 0, 0, 0, 1, { ".", NULL }, "\x7f" },
1886 { UDA, CPI, 4, 0, 0, 4, 4, { "\\B", NULL }, "\xf4\x8f\xbf\xbf#" },
1887 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "\xf4\xa0\x80\x80\xf4\xa0\x80\x80" },
1889 { UDA, CPI, 4, 0, 0, 4, 4, { "\\B", NULL }, "#\xef\xbf\xbf#" },
1890 { UDA, CPI, 4, 0, 0, 4, 4, { "\\B", NULL }, "#\xe0\xa0\x80#" },
1891 { UDA, CPI, 4, 0, 0, 4, 4, { "\\B", NULL }, "\xf0\x90\x80\x80#" },
1892 { UDA, CPI, 4, 0, 0, 4, 4, { "\\B", NULL }, "\xf3\xbf\xbf\xbf#" },
1893 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "\xf0\x8f\xbf\xbf\xf0\x8f\xbf\xbf" },
1894 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "\xf5\x80\x80\x80\xf5\x80\x80\x80" },
1895 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "\xf4\x90\x80\x80\xf4\x90\x80\x80" },
1896 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "\xf4\x8f\xbf\xff\xf4\x8f\xbf\xff" },
1897 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "\xf4\x8f\xff\xbf\xf4\x8f\xff\xbf" },
1898 { UDA, CPI, 4, 0, 1, -1, -1, { "\\B", "\\b" }, "\xef\x80\x80\x80\xef\x80\x80" },
1899 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "\x80\x80\x80\x80\x80\x80\x80\x80" },
1900 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "#\xe0\x9f\xbf\xe0\x9f\xbf#" },
1902 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "#\xf0\x80\x80\xf0\x80\x80#" },
1903 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "#\xed\xa0\x80\xed\xa0\x80#" },
1904 { UDA, CPI, 4, 0, 0, 4, 4, { "\\B", NULL }, "##\xdf\xbf#" },
1905 { UDA, CPI, 4, 2, 0, 2, 2, { "\\B", NULL }, "##\xdf\xbf#" },
1906 { UDA, CPI, 4, 0, 0, 4, 4, { "\\B", NULL }, "##\xc2\x80#" },
1907 { UDA, CPI, 4, 2, 0, 2, 2, { "\\B", NULL }, "##\xc2\x80#" },
1908 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "##\xc1\xbf\xc1\xbf##" },
1909 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "##\xdf\xc0\xdf\xc0##" },
1910 { UDA, CPI, 4, 0, 0, -1, -1, { "\\B", "\\b" }, "##\xe0\x80\xe0\x80##" },
1912 { UDA, CPI, 3, 0, 0, 3, 3, { "\\B", NULL }, "\xef\xbf\xbf#" },
1913 { UDA, CPI, 3, 0, 0, 3, 3, { "\\B", NULL }, "\xe0\xa0\x80#" },
1914 { UDA, CPI, 3, 0, 0, -1, -1, { "\\B", "\\b" }, "\xe0\x9f\xbf\xe0\x9f\xbf" },
1916 { UDA, CPI, 3, 0, 1, -1, -1, { "\\B", "\\b" }, "\xdf\x80\x80\xdf\x80" },
1917 { UDA, CPI, 3, 0, 0, -1, -1, { "\\B", "\\b" }, "\xef\xbf\xff\xef\xbf\xff" },
1918 { UDA, CPI, 3, 0, 0, -1, -1, { "\\B", "\\b" }, "\xef\xff\xbf\xef\xff\xbf" },
1919 { UDA, CPI, 3, 0, 0, -1, -1, { "\\B", "\\b" }, "\xed\xbf\xbf\xed\xbf\xbf" },
1921 { UDA, CPI, 2, 0, 0, 2, 2, { "\\B", NULL }, "\xdf\xbf#" },
1922 { UDA, CPI, 2, 0, 0, 2, 2, { "\\B", NULL }, "\xc2\x80#" },
1924 { UDA, CPI, 2, 0, 0, -1, -1, { "\\B", "\\b" }, "\xc1\xbf\xc1\xbf" },
1925 { UDA, CPI, 2, 0, 0, -1, -1, { "\\B", "\\b" }, "\xe0\x80\xe0\x80" },
1926 { UDA, CPI, 2, 0, 0, -1, -1, { "\\B", "\\b" }, "\xdf\xff\xdf\xff" },
1927 { UDA, CPI, 2, 0, 0, -1, -1, { "\\B", "\\b" }, "\xff\xbf\xff\xbf" },
1929 { UDA, CPI, 1, 0, 0, 1, 1, { "\\B", NULL }, "\x7f#" },
1930 { UDA, CPI, 1, 0, 0, 1, 1, { "\\B", NULL }, "\x01#" },
1931 { UDA, CPI, 1, 0, 0, -1, -1, { "\\B", "\\b" }, "\x80\x80" },
1932 { UDA, CPI, 1, 0, 0, -1, -1, { "\\B", "\\b" }, "\xb0\xb0" },
1934 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, 0, 2, { "(.)\\1", NULL }, "aA" },
1935 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, -1, -1, { "(.)\\1", NULL }, "a\xff" },
1936 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, 0, 4, { "(.)\\1", NULL }, "\xc3\xa1\xc3\x81" },
1937 { UDA | PCRE2_CASELESS, CPI, 0, 0, 1, -1, -1, { "(.)\\1", NULL }, "\xc3\xa1\xc3\x81" },
1938 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, -1, -1, { "(.)\\1", NULL }, "\xc2\x80\x80" },
1939 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, 0, 6, { "(.)\\1", NULL }, "\xe1\xbd\xb8\xe1\xbf\xb8" },
1940 { UDA | PCRE2_CASELESS, CPI, 0, 0, 1, -1, -1, { "(.)\\1", NULL }, "\xe1\xbd\xb8\xe1\xbf\xb8" },
1941 …{ UDA | PCRE2_CASELESS, CPI, 0, 0, 0, 0, 8, { "(.)\\1", NULL }, "\xf0\x90\x90\x80\xf0\x90\x90\xa8"…
1942 …{ UDA | PCRE2_CASELESS, CPI, 0, 0, 1, -1, -1, { "(.)\\1", NULL }, "\xf0\x90\x90\x80\xf0\x90\x90\xa…
1944 { UDA, CPI, 0, 0, 0, 0, 1, { "\\X", NULL }, "A" },
1945 { UDA, CPI, 0, 0, 0, -1, -1, { "\\X", NULL }, "\xff" },
1946 { UDA, CPI, 0, 0, 0, 0, 2, { "\\X", NULL }, "\xc3\xa1" },
1947 { UDA, CPI, 0, 0, 1, -1, -1, { "\\X", NULL }, "\xc3\xa1" },
1948 { UDA, CPI, 0, 0, 0, -1, -1, { "\\X", NULL }, "\xc3\x7f" },
1949 { UDA, CPI, 0, 0, 0, 0, 3, { "\\X", NULL }, "\xe1\xbd\xb8" },
1950 { UDA, CPI, 0, 0, 1, -1, -1, { "\\X", NULL }, "\xe1\xbd\xb8" },
1951 { UDA, CPI, 0, 0, 0, 0, 4, { "\\X", NULL }, "\xf0\x90\x90\x80" },
1952 { UDA, CPI, 0, 0, 1, -1, -1, { "\\X", NULL }, "\xf0\x90\x90\x80" },
1954 { UDA, CPI, 0, 0, 0, -1, -1, { "[^#]", NULL }, "#" },
1955 { UDA, CPI, 0, 0, 0, 0, 4, { "[^#]", NULL }, "\xf4\x8f\xbf\xbf" },
1956 { UDA, CPI, 0, 0, 0, -1, -1, { "[^#]", NULL }, "\xf4\x90\x80\x80" },
1957 { UDA, CPI, 0, 0, 0, -1, -1, { "[^#]", NULL }, "\xc1\x80" },
1959 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 2, 3, { "^\\W", NULL }, " \x0a#"},
1960 …{ PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 14, 15, { "^\\W", NULL }, " \xc0\x8a#\xe0\x80\x8a#\xf0…
1961 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 3, 4, { "^\\W", NULL }, " \xf8\x0a#"},
1962 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 3, 4, { "^\\W", NULL }, " \xc3\x0a#"},
1963 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 3, 4, { "^\\W", NULL }, " \xf1\x0a#"},
1964 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 4, 5, { "^\\W", NULL }, " \xf2\xbf\x0a#"},
1965 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 5, 6, { "^\\W", NULL }, " \xf2\xbf\xbf\x0a#"},
1966 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 3, 4, { "^\\W", NULL }, " \xef\x0a#"},
1967 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 4, 5, { "^\\W", NULL }, " \xef\xbf\x0a#"},
1968 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 5, 6, { "^\\W", NULL }, " \x85#\xc2\x85#"},
1969 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 7, 8, { "^\\W", NULL }, " \xe2\x80\xf8\xe2\x80\xa8#"},
1971 { PCRE2_UTF | PCRE2_FIRSTLINE, CI, 0, 0, 0, -1, -1, { "#", NULL }, "\xe2\x80\xf8\xe2\x80\xa8#"},
1972 { PCRE2_UTF | PCRE2_FIRSTLINE, CI, 0, 0, 0, 3, 4, { "#", NULL }, "\xe2\x80\xf8#\xe2\x80\xa8#"},
1973 { PCRE2_UTF | PCRE2_FIRSTLINE, CI, 0, 0, 0, -1, -1, { "#", NULL }, "abcd\xc2\x85#"},
1974 { PCRE2_UTF | PCRE2_FIRSTLINE, CI, 0, 0, 0, 1, 2, { "#", NULL }, "\x85#\xc2\x85#"},
1975 { PCRE2_UTF | PCRE2_FIRSTLINE, CI, 0, 0, 0, 5, 6, { "#", NULL }, "\xef,\x80,\xf8#\x0a"},
1976 { PCRE2_UTF | PCRE2_FIRSTLINE, CI, 0, 0, 0, -1, -1, { "#", NULL }, "\xef,\x80,\xf8\x0a#"},
1978 …{ PCRE2_UTF | PCRE2_NO_START_OPTIMIZE, CI, 0, 0, 0, 4, 8, { "#\xc7\x85#", NULL }, "\x80\x80#\xc7#\…
1979 …{ PCRE2_UTF | PCRE2_NO_START_OPTIMIZE, CI, 0, 0, 0, 7, 11, { "#\xc7\x85#", NULL }, "\x80\x80#\xc7\…
1980 { PCRE2_UTF, CI, 0, 0, 0, 4, 8, { "#\xc7\x85#", NULL }, "\x80\x80#\xc7#\xc7\x85#" },
1981 { PCRE2_UTF, CI, 0, 0, 0, 7, 11, { "#\xc7\x85#", NULL }, "\x80\x80#\xc7\x80\x80\x80#\xc7\x85#" },
1983 { PCRE2_UTF | PCRE2_UCP, CI, 0, 0, 0, -1, -1, { "[\\s]", NULL }, "\xed\xa0\x80" },
1986 { 0, PCRE2_JIT_COMPLETE, 0, 0, 1, -1, -1, { "\\X{2}", NULL }, "\r\n\n" },
1987 { 0, PCRE2_JIT_COMPLETE, 0, 0, 1, -1, -1, { "\\R{2}", NULL }, "\r\n\n" },
1989 …{ PCRE2_UTF | PCRE2_MULTILINE, CI, 0, 0, 0, -1, -1, { "^.a", &invalid_utf8_newline_cr }, "\xc3\xa7…
1991 { 0, 0, 0, 0, 0, 0, 0, { NULL, NULL }, NULL }
2013 printf("Pattern[%d:0] cannot be compiled. Error offset: %d\n", pattern_index, (int)erroroffset); in run_invalid_utf8_test()
2014 return 0; in run_invalid_utf8_test()
2017 if (pcre2_jit_compile_8(code, current->jit_compile_options) != 0) { in run_invalid_utf8_test()
2018 printf("Pattern[%d:0] cannot be compiled by the JIT compiler.\n", pattern_index); in run_invalid_utf8_test()
2020 return 0; in run_invalid_utf8_test()
2027 length, current->start_offset - current->skip_left, 0, mdata, NULL); in run_invalid_utf8_test()
2031 return 0; in run_invalid_utf8_test()
2041 return 0; in run_invalid_utf8_test()
2054 int total = 0, successful = 0; in invalid_utf8_regression_tests()
2063 for (current = invalid_utf8_regression_test_cases; current->pattern[0]; current++) { in invalid_utf8_regression_tests()
2070 if (!run_invalid_utf8_test(current, total - 1, 0, ccontext, mdata)) in invalid_utf8_regression_tests()
2071 result = 0; in invalid_utf8_regression_tests()
2073 result = 0; in invalid_utf8_regression_tests()
2076 if (!run_invalid_utf8_test(current, total - 1, 0, ccontext, mdata)) in invalid_utf8_regression_tests()
2077 result = 0; in invalid_utf8_regression_tests()
2086 if ((total % 60) == 0) in invalid_utf8_regression_tests()
2090 if ((total % 60) != 0) in invalid_utf8_regression_tests()
2098 return 0; in invalid_utf8_regression_tests()
2109 return 0; in invalid_utf8_regression_tests()
2132 static PCRE2_UCHAR16 allany16[] = { '.', 0 };
2133 static PCRE2_UCHAR16 non_word_boundary16[] = { '\\', 'B', 0 };
2134 static PCRE2_UCHAR16 word_boundary16[] = { '\\', 'b', 0 };
2135 static PCRE2_UCHAR16 backreference16[] = { '(', '.', ')', '\\', '1', 0 };
2136 static PCRE2_UCHAR16 grapheme16[] = { '\\', 'X', 0 };
2137 static PCRE2_UCHAR16 nothashmark16[] = { '[', '^', '#', ']', 0 };
2138 static PCRE2_UCHAR16 afternl16[] = { '^', '\\', 'W', 0 };
2139 static PCRE2_UCHAR16 generic16[] = { '#', 0xd800, 0xdc00, '#', 0 };
2140 static PCRE2_UCHAR16 test16_1[] = { 0xd7ff, 0xe000, 0xffff, 0x01, '#', 0 };
2141 static PCRE2_UCHAR16 test16_2[] = { 0xd800, 0xdc00, 0xd800, 0xdc00, 0 };
2142 static PCRE2_UCHAR16 test16_3[] = { 0xdbff, 0xdfff, 0xdbff, 0xdfff, 0 };
2143 static PCRE2_UCHAR16 test16_4[] = { 0xd800, 0xdbff, 0xd800, 0xdbff, 0 };
2144 static PCRE2_UCHAR16 test16_5[] = { '#', 0xd800, 0xdc00, '#', 0 };
2145 static PCRE2_UCHAR16 test16_6[] = { 'a', 'A', 0xdc28, 0 };
2146 static PCRE2_UCHAR16 test16_7[] = { 0xd801, 0xdc00, 0xd801, 0xdc28, 0 };
2147 static PCRE2_UCHAR16 test16_8[] = { '#', 0xd800, 0xdc00, 0 };
2148 static PCRE2_UCHAR16 test16_9[] = { ' ', 0x2028, '#', 0 };
2149 static PCRE2_UCHAR16 test16_10[] = { ' ', 0xdc00, 0xd800, 0x2028, '#', 0 };
2150 static PCRE2_UCHAR16 test16_11[] = { 0xdc00, 0xdc00, 0xd800, 0xdc00, 0xdc00, '#', 0xd800, 0xdc00, '…
2151 …E2_UCHAR16 test16_12[] = { '#', 0xd800, 0xdc00, 0xd800, '#', 0xd800, 0xdc00, 0xdc00, 0xdc00, '#', …
2154 { UDA, CI, 0, 0, 0, 0, 1, { allany16, NULL }, test16_1 },
2155 { UDA, CI, 1, 0, 0, 1, 2, { allany16, NULL }, test16_1 },
2156 { UDA, CI, 2, 0, 0, 2, 3, { allany16, NULL }, test16_1 },
2157 { UDA, CI, 3, 0, 0, 3, 4, { allany16, NULL }, test16_1 },
2158 { UDA, CI, 0, 0, 0, 0, 2, { allany16, NULL }, test16_2 },
2159 { UDA, CI, 0, 0, 3, -1, -1, { allany16, NULL }, test16_2 },
2160 { UDA, CI, 1, 0, 0, -1, -1, { allany16, NULL }, test16_2 },
2161 { UDA, CI, 0, 0, 0, 0, 2, { allany16, NULL }, test16_3 },
2162 { UDA, CI, 0, 0, 3, -1, -1, { allany16, NULL }, test16_3 },
2163 { UDA, CI, 1, 0, 0, -1, -1, { allany16, NULL }, test16_3 },
2165 { UDA, CPI, 1, 0, 0, 1, 1, { non_word_boundary16, NULL }, test16_1 },
2166 { UDA, CPI, 2, 0, 0, 2, 2, { non_word_boundary16, NULL }, test16_1 },
2167 { UDA, CPI, 3, 0, 0, 3, 3, { non_word_boundary16, NULL }, test16_1 },
2168 { UDA, CPI, 4, 0, 0, 4, 4, { non_word_boundary16, NULL }, test16_1 },
2169 { UDA, CPI, 2, 0, 0, 2, 2, { non_word_boundary16, NULL }, test16_2 },
2170 { UDA, CPI, 2, 0, 0, 2, 2, { non_word_boundary16, NULL }, test16_3 },
2173 { UDA, CPI, 2, 0, 0, -1, -1, { non_word_boundary16, word_boundary16 }, test16_4 },
2174 { UDA, CPI, 2, 0, 0, -1, -1, { non_word_boundary16, word_boundary16 }, test16_5 },
2176 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, 0, 2, { backreference16, NULL }, test16_6 },
2177 { UDA | PCRE2_CASELESS, CPI, 1, 0, 0, -1, -1, { backreference16, NULL }, test16_6 },
2178 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, 0, 4, { backreference16, NULL }, test16_7 },
2179 { UDA | PCRE2_CASELESS, CPI, 0, 0, 1, -1, -1, { backreference16, NULL }, test16_7 },
2181 { UDA, CPI, 0, 0, 0, 0, 1, { grapheme16, NULL }, test16_6 },
2182 { UDA, CPI, 1, 0, 0, 1, 2, { grapheme16, NULL }, test16_6 },
2183 { UDA, CPI, 2, 0, 0, -1, -1, { grapheme16, NULL }, test16_6 },
2184 { UDA, CPI, 0, 0, 0, 0, 2, { grapheme16, NULL }, test16_7 },
2185 { UDA, CPI, 2, 0, 0, 2, 4, { grapheme16, NULL }, test16_7 },
2186 { UDA, CPI, 1, 0, 0, -1, -1, { grapheme16, NULL }, test16_7 },
2188 { UDA, CPI, 0, 0, 0, -1, -1, { nothashmark16, NULL }, test16_8 },
2189 { UDA, CPI, 1, 0, 0, 1, 3, { nothashmark16, NULL }, test16_8 },
2190 { UDA, CPI, 2, 0, 0, -1, -1, { nothashmark16, NULL }, test16_8 },
2192 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 2, 3, { afternl16, NULL }, test16_9 },
2193 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 4, 5, { afternl16, NULL }, test16_10 },
2195 { PCRE2_UTF | PCRE2_NO_START_OPTIMIZE, CI, 0, 0, 0, 5, 9, { generic16, NULL }, test16_11 },
2196 { PCRE2_UTF | PCRE2_NO_START_OPTIMIZE, CI, 0, 0, 0, 9, 13, { generic16, NULL }, test16_12 },
2197 { PCRE2_UTF, CI, 0, 0, 0, 5, 9, { generic16, NULL }, test16_11 },
2198 { PCRE2_UTF, CI, 0, 0, 0, 9, 13, { generic16, NULL }, test16_12 },
2200 { 0, 0, 0, 0, 0, 0, 0, { NULL, NULL }, NULL }
2223 printf("Pattern[%d:0] cannot be compiled. Error offset: %d\n", pattern_index, (int)erroroffset); in run_invalid_utf16_test()
2224 return 0; in run_invalid_utf16_test()
2227 if (pcre2_jit_compile_16(code, current->jit_compile_options) != 0) { in run_invalid_utf16_test()
2228 printf("Pattern[%d:0] cannot be compiled by the JIT compiler.\n", pattern_index); in run_invalid_utf16_test()
2230 return 0; in run_invalid_utf16_test()
2234 length = 0; in run_invalid_utf16_test()
2236 while (*input++ != 0) in run_invalid_utf16_test()
2243 length, current->start_offset - current->skip_left, 0, mdata, NULL); in run_invalid_utf16_test()
2247 return 0; in run_invalid_utf16_test()
2257 return 0; in run_invalid_utf16_test()
2270 int total = 0, successful = 0; in invalid_utf16_regression_tests()
2279 for (current = invalid_utf16_regression_test_cases; current->pattern[0]; current++) { in invalid_utf16_regression_tests()
2284 if (!run_invalid_utf16_test(current, total - 1, 0, ccontext, mdata)) in invalid_utf16_regression_tests()
2285 result = 0; in invalid_utf16_regression_tests()
2287 result = 0; in invalid_utf16_regression_tests()
2294 if ((total % 60) == 0) in invalid_utf16_regression_tests()
2298 if ((total % 60) != 0) in invalid_utf16_regression_tests()
2306 return 0; in invalid_utf16_regression_tests()
2317 return 0; in invalid_utf16_regression_tests()
2340 static PCRE2_UCHAR32 allany32[] = { '.', 0 };
2341 static PCRE2_UCHAR32 non_word_boundary32[] = { '\\', 'B', 0 };
2342 static PCRE2_UCHAR32 word_boundary32[] = { '\\', 'b', 0 };
2343 static PCRE2_UCHAR32 backreference32[] = { '(', '.', ')', '\\', '1', 0 };
2344 static PCRE2_UCHAR32 grapheme32[] = { '\\', 'X', 0 };
2345 static PCRE2_UCHAR32 nothashmark32[] = { '[', '^', '#', ']', 0 };
2346 static PCRE2_UCHAR32 afternl32[] = { '^', '\\', 'W', 0 };
2347 static PCRE2_UCHAR32 test32_1[] = { 0x10ffff, 0x10ffff, 0x110000, 0x110000, 0x10ffff, 0 };
2348 static PCRE2_UCHAR32 test32_2[] = { 0xd7ff, 0xe000, 0xd800, 0xdfff, 0xe000, 0xdfff, 0xd800, 0 };
2349 static PCRE2_UCHAR32 test32_3[] = { 'a', 'A', 0x110000, 0 };
2350 static PCRE2_UCHAR32 test32_4[] = { '#', 0x10ffff, 0x110000, 0 };
2351 static PCRE2_UCHAR32 test32_5[] = { ' ', 0x2028, '#', 0 };
2352 static PCRE2_UCHAR32 test32_6[] = { ' ', 0x110000, 0x2028, '#', 0 };
2355 { UDA, CI, 0, 0, 0, 0, 1, { allany32, NULL }, test32_1 },
2356 { UDA, CI, 2, 0, 0, -1, -1, { allany32, NULL }, test32_1 },
2357 { UDA, CI, 0, 0, 0, 0, 1, { allany32, NULL }, test32_2 },
2358 { UDA, CI, 1, 0, 0, 1, 2, { allany32, NULL }, test32_2 },
2359 { UDA, CI, 2, 0, 0, -1, -1, { allany32, NULL }, test32_2 },
2360 { UDA, CI, 3, 0, 0, -1, -1, { allany32, NULL }, test32_2 },
2362 { UDA, CPI, 1, 0, 0, 1, 1, { non_word_boundary32, NULL }, test32_1 },
2363 { UDA, CPI, 3, 0, 0, -1, -1, { non_word_boundary32, word_boundary32 }, test32_1 },
2364 { UDA, CPI, 1, 0, 0, 1, 1, { non_word_boundary32, NULL }, test32_2 },
2365 { UDA, CPI, 3, 0, 0, -1, -1, { non_word_boundary32, word_boundary32 }, test32_2 },
2366 { UDA, CPI, 6, 0, 0, -1, -1, { non_word_boundary32, word_boundary32 }, test32_2 },
2368 { UDA | PCRE2_CASELESS, CPI, 0, 0, 0, 0, 2, { backreference32, NULL }, test32_3 },
2369 { UDA | PCRE2_CASELESS, CPI, 1, 0, 0, -1, -1, { backreference32, NULL }, test32_3 },
2371 { UDA, CPI, 0, 0, 0, 0, 1, { grapheme32, NULL }, test32_1 },
2372 { UDA, CPI, 2, 0, 0, -1, -1, { grapheme32, NULL }, test32_1 },
2373 { UDA, CPI, 1, 0, 0, 1, 2, { grapheme32, NULL }, test32_2 },
2374 { UDA, CPI, 2, 0, 0, -1, -1, { grapheme32, NULL }, test32_2 },
2375 { UDA, CPI, 3, 0, 0, -1, -1, { grapheme32, NULL }, test32_2 },
2376 { UDA, CPI, 4, 0, 0, 4, 5, { grapheme32, NULL }, test32_2 },
2378 { UDA, CPI, 0, 0, 0, -1, -1, { nothashmark32, NULL }, test32_4 },
2379 { UDA, CPI, 1, 0, 0, 1, 2, { nothashmark32, NULL }, test32_4 },
2380 { UDA, CPI, 2, 0, 0, -1, -1, { nothashmark32, NULL }, test32_4 },
2381 { UDA, CPI, 1, 0, 0, 1, 2, { nothashmark32, NULL }, test32_2 },
2382 { UDA, CPI, 2, 0, 0, -1, -1, { nothashmark32, NULL }, test32_2 },
2384 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 2, 3, { afternl32, NULL }, test32_5 },
2385 { PCRE2_UTF | PCRE2_MULTILINE, CI, 1, 0, 0, 3, 4, { afternl32, NULL }, test32_6 },
2387 { 0, 0, 0, 0, 0, 0, 0, { NULL, NULL }, NULL }
2410 printf("Pattern[%d:0] cannot be compiled. Error offset: %d\n", pattern_index, (int)erroroffset); in run_invalid_utf32_test()
2411 return 0; in run_invalid_utf32_test()
2414 if (pcre2_jit_compile_32(code, current->jit_compile_options) != 0) { in run_invalid_utf32_test()
2415 printf("Pattern[%d:0] cannot be compiled by the JIT compiler.\n", pattern_index); in run_invalid_utf32_test()
2417 return 0; in run_invalid_utf32_test()
2421 length = 0; in run_invalid_utf32_test()
2423 while (*input++ != 0) in run_invalid_utf32_test()
2430 length, current->start_offset - current->skip_left, 0, mdata, NULL); in run_invalid_utf32_test()
2434 return 0; in run_invalid_utf32_test()
2444 return 0; in run_invalid_utf32_test()
2457 int total = 0, successful = 0; in invalid_utf32_regression_tests()
2466 for (current = invalid_utf32_regression_test_cases; current->pattern[0]; current++) { in invalid_utf32_regression_tests()
2471 if (!run_invalid_utf32_test(current, total - 1, 0, ccontext, mdata)) in invalid_utf32_regression_tests()
2472 result = 0; in invalid_utf32_regression_tests()
2474 result = 0; in invalid_utf32_regression_tests()
2481 if ((total % 60) == 0) in invalid_utf32_regression_tests()
2485 if ((total % 60) != 0) in invalid_utf32_regression_tests()
2493 return 0; in invalid_utf32_regression_tests()
2504 return 0; in invalid_utf32_regression_tests()