1*22dc650dSSadaf Ebrahimi# This set of tests is for UTF-8 support and Unicode property support, with 2*22dc650dSSadaf Ebrahimi# relevance only for the 8-bit library. 3*22dc650dSSadaf Ebrahimi 4*22dc650dSSadaf Ebrahimi#newline_default lf any anycrlf 5*22dc650dSSadaf Ebrahimi 6*22dc650dSSadaf Ebrahimi# The next 5 patterns have UTF-8 errors 7*22dc650dSSadaf Ebrahimi 8*22dc650dSSadaf Ebrahimi/[�]/utf 9*22dc650dSSadaf EbrahimiFailed: error -8 at offset 1: UTF-8 error: byte 2 top bits not 0x80 10*22dc650dSSadaf Ebrahimi 11*22dc650dSSadaf Ebrahimi/�/utf 12*22dc650dSSadaf EbrahimiFailed: error -3 at offset 0: UTF-8 error: 1 byte missing at end 13*22dc650dSSadaf Ebrahimi 14*22dc650dSSadaf Ebrahimi/���xxx/utf 15*22dc650dSSadaf EbrahimiFailed: error -8 at offset 0: UTF-8 error: byte 2 top bits not 0x80 16*22dc650dSSadaf Ebrahimi 17*22dc650dSSadaf Ebrahimi/Â��������/utf 18*22dc650dSSadaf EbrahimiFailed: error -22 at offset 2: UTF-8 error: isolated byte with 0x80 bit set 19*22dc650dSSadaf Ebrahimi 20*22dc650dSSadaf Ebrahimi/Â��������/match_invalid_utf 21*22dc650dSSadaf EbrahimiFailed: error -22 at offset 2: UTF-8 error: isolated byte with 0x80 bit set 22*22dc650dSSadaf Ebrahimi 23*22dc650dSSadaf Ebrahimi# Now test subjects 24*22dc650dSSadaf Ebrahimi 25*22dc650dSSadaf Ebrahimi/badutf/utf 26*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 27*22dc650dSSadaf Ebrahimi X\xdf 28*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 1 29*22dc650dSSadaf Ebrahimi XX\xef 30*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 2 31*22dc650dSSadaf Ebrahimi XXX\xef\x80 32*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 3 33*22dc650dSSadaf Ebrahimi X\xf7 34*22dc650dSSadaf EbrahimiFailed: error -5: UTF-8 error: 3 bytes missing at end at offset 1 35*22dc650dSSadaf Ebrahimi XX\xf7\x80 36*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 2 37*22dc650dSSadaf Ebrahimi XXX\xf7\x80\x80 38*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 3 39*22dc650dSSadaf Ebrahimi \xfb 40*22dc650dSSadaf EbrahimiFailed: error -6: UTF-8 error: 4 bytes missing at end at offset 0 41*22dc650dSSadaf Ebrahimi \xfb\x80 42*22dc650dSSadaf EbrahimiFailed: error -5: UTF-8 error: 3 bytes missing at end at offset 0 43*22dc650dSSadaf Ebrahimi \xfb\x80\x80 44*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 0 45*22dc650dSSadaf Ebrahimi \xfb\x80\x80\x80 46*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 0 47*22dc650dSSadaf Ebrahimi \xfd 48*22dc650dSSadaf EbrahimiFailed: error -7: UTF-8 error: 5 bytes missing at end at offset 0 49*22dc650dSSadaf Ebrahimi \xfd\x80 50*22dc650dSSadaf EbrahimiFailed: error -6: UTF-8 error: 4 bytes missing at end at offset 0 51*22dc650dSSadaf Ebrahimi \xfd\x80\x80 52*22dc650dSSadaf EbrahimiFailed: error -5: UTF-8 error: 3 bytes missing at end at offset 0 53*22dc650dSSadaf Ebrahimi \xfd\x80\x80\x80 54*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 0 55*22dc650dSSadaf Ebrahimi \xfd\x80\x80\x80\x80 56*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 0 57*22dc650dSSadaf Ebrahimi \xdf\x7f 58*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 0 59*22dc650dSSadaf Ebrahimi \xef\x7f\x80 60*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 0 61*22dc650dSSadaf Ebrahimi \xef\x80\x7f 62*22dc650dSSadaf EbrahimiFailed: error -9: UTF-8 error: byte 3 top bits not 0x80 at offset 0 63*22dc650dSSadaf Ebrahimi \xf7\x7f\x80\x80 64*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 0 65*22dc650dSSadaf Ebrahimi \xf7\x80\x7f\x80 66*22dc650dSSadaf EbrahimiFailed: error -9: UTF-8 error: byte 3 top bits not 0x80 at offset 0 67*22dc650dSSadaf Ebrahimi \xf7\x80\x80\x7f 68*22dc650dSSadaf EbrahimiFailed: error -10: UTF-8 error: byte 4 top bits not 0x80 at offset 0 69*22dc650dSSadaf Ebrahimi \xfb\x7f\x80\x80\x80 70*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 0 71*22dc650dSSadaf Ebrahimi \xfb\x80\x7f\x80\x80 72*22dc650dSSadaf EbrahimiFailed: error -9: UTF-8 error: byte 3 top bits not 0x80 at offset 0 73*22dc650dSSadaf Ebrahimi \xfb\x80\x80\x7f\x80 74*22dc650dSSadaf EbrahimiFailed: error -10: UTF-8 error: byte 4 top bits not 0x80 at offset 0 75*22dc650dSSadaf Ebrahimi \xfb\x80\x80\x80\x7f 76*22dc650dSSadaf EbrahimiFailed: error -11: UTF-8 error: byte 5 top bits not 0x80 at offset 0 77*22dc650dSSadaf Ebrahimi \xfd\x7f\x80\x80\x80\x80 78*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 0 79*22dc650dSSadaf Ebrahimi \xfd\x80\x7f\x80\x80\x80 80*22dc650dSSadaf EbrahimiFailed: error -9: UTF-8 error: byte 3 top bits not 0x80 at offset 0 81*22dc650dSSadaf Ebrahimi \xfd\x80\x80\x7f\x80\x80 82*22dc650dSSadaf EbrahimiFailed: error -10: UTF-8 error: byte 4 top bits not 0x80 at offset 0 83*22dc650dSSadaf Ebrahimi \xfd\x80\x80\x80\x7f\x80 84*22dc650dSSadaf EbrahimiFailed: error -11: UTF-8 error: byte 5 top bits not 0x80 at offset 0 85*22dc650dSSadaf Ebrahimi \xfd\x80\x80\x80\x80\x7f 86*22dc650dSSadaf EbrahimiFailed: error -12: UTF-8 error: byte 6 top bits not 0x80 at offset 0 87*22dc650dSSadaf Ebrahimi \xed\xa0\x80 88*22dc650dSSadaf EbrahimiFailed: error -16: UTF-8 error: code points 0xd800-0xdfff are not defined at offset 0 89*22dc650dSSadaf Ebrahimi \xc0\x8f 90*22dc650dSSadaf EbrahimiFailed: error -17: UTF-8 error: overlong 2-byte sequence at offset 0 91*22dc650dSSadaf Ebrahimi \xe0\x80\x8f 92*22dc650dSSadaf EbrahimiFailed: error -18: UTF-8 error: overlong 3-byte sequence at offset 0 93*22dc650dSSadaf Ebrahimi \xf0\x80\x80\x8f 94*22dc650dSSadaf EbrahimiFailed: error -19: UTF-8 error: overlong 4-byte sequence at offset 0 95*22dc650dSSadaf Ebrahimi \xf8\x80\x80\x80\x8f 96*22dc650dSSadaf EbrahimiFailed: error -20: UTF-8 error: overlong 5-byte sequence at offset 0 97*22dc650dSSadaf Ebrahimi \xfc\x80\x80\x80\x80\x8f 98*22dc650dSSadaf EbrahimiFailed: error -21: UTF-8 error: overlong 6-byte sequence at offset 0 99*22dc650dSSadaf Ebrahimi \x80 100*22dc650dSSadaf EbrahimiFailed: error -22: UTF-8 error: isolated byte with 0x80 bit set at offset 0 101*22dc650dSSadaf Ebrahimi \xfe 102*22dc650dSSadaf EbrahimiFailed: error -23: UTF-8 error: illegal byte (0xfe or 0xff) at offset 0 103*22dc650dSSadaf Ebrahimi \xff 104*22dc650dSSadaf EbrahimiFailed: error -23: UTF-8 error: illegal byte (0xfe or 0xff) at offset 0 105*22dc650dSSadaf Ebrahimi 106*22dc650dSSadaf Ebrahimi/badutf/utf 107*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 108*22dc650dSSadaf Ebrahimi XX\xfb\x80\x80\x80\x80 109*22dc650dSSadaf EbrahimiFailed: error -13: UTF-8 error: 5-byte character is not allowed (RFC 3629) at offset 2 110*22dc650dSSadaf Ebrahimi XX\xfd\x80\x80\x80\x80\x80 111*22dc650dSSadaf EbrahimiFailed: error -14: UTF-8 error: 6-byte character is not allowed (RFC 3629) at offset 2 112*22dc650dSSadaf Ebrahimi XX\xf7\xbf\xbf\xbf 113*22dc650dSSadaf EbrahimiFailed: error -15: UTF-8 error: code points greater than 0x10ffff are not defined at offset 2 114*22dc650dSSadaf Ebrahimi 115*22dc650dSSadaf Ebrahimi/shortutf/utf 116*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 117*22dc650dSSadaf Ebrahimi XX\xdf\=ph 118*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 2 119*22dc650dSSadaf Ebrahimi XX\xef\=ph 120*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 2 121*22dc650dSSadaf Ebrahimi XX\xef\x80\=ph 122*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 2 123*22dc650dSSadaf Ebrahimi \xf7\=ph 124*22dc650dSSadaf EbrahimiFailed: error -5: UTF-8 error: 3 bytes missing at end at offset 0 125*22dc650dSSadaf Ebrahimi \xf7\x80\=ph 126*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 0 127*22dc650dSSadaf Ebrahimi \xf7\x80\x80\=ph 128*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 0 129*22dc650dSSadaf Ebrahimi \xfb\=ph 130*22dc650dSSadaf EbrahimiFailed: error -6: UTF-8 error: 4 bytes missing at end at offset 0 131*22dc650dSSadaf Ebrahimi \xfb\x80\=ph 132*22dc650dSSadaf EbrahimiFailed: error -5: UTF-8 error: 3 bytes missing at end at offset 0 133*22dc650dSSadaf Ebrahimi \xfb\x80\x80\=ph 134*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 0 135*22dc650dSSadaf Ebrahimi \xfb\x80\x80\x80\=ph 136*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 0 137*22dc650dSSadaf Ebrahimi \xfd\=ph 138*22dc650dSSadaf EbrahimiFailed: error -7: UTF-8 error: 5 bytes missing at end at offset 0 139*22dc650dSSadaf Ebrahimi \xfd\x80\=ph 140*22dc650dSSadaf EbrahimiFailed: error -6: UTF-8 error: 4 bytes missing at end at offset 0 141*22dc650dSSadaf Ebrahimi \xfd\x80\x80\=ph 142*22dc650dSSadaf EbrahimiFailed: error -5: UTF-8 error: 3 bytes missing at end at offset 0 143*22dc650dSSadaf Ebrahimi \xfd\x80\x80\x80\=ph 144*22dc650dSSadaf EbrahimiFailed: error -4: UTF-8 error: 2 bytes missing at end at offset 0 145*22dc650dSSadaf Ebrahimi \xfd\x80\x80\x80\x80\=ph 146*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 0 147*22dc650dSSadaf Ebrahimi 148*22dc650dSSadaf Ebrahimi/anything/utf 149*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 150*22dc650dSSadaf Ebrahimi X\xc0\x80 151*22dc650dSSadaf EbrahimiFailed: error -17: UTF-8 error: overlong 2-byte sequence at offset 1 152*22dc650dSSadaf Ebrahimi XX\xc1\x8f 153*22dc650dSSadaf EbrahimiFailed: error -17: UTF-8 error: overlong 2-byte sequence at offset 2 154*22dc650dSSadaf Ebrahimi XXX\xe0\x9f\x80 155*22dc650dSSadaf EbrahimiFailed: error -18: UTF-8 error: overlong 3-byte sequence at offset 3 156*22dc650dSSadaf Ebrahimi \xf0\x8f\x80\x80 157*22dc650dSSadaf EbrahimiFailed: error -19: UTF-8 error: overlong 4-byte sequence at offset 0 158*22dc650dSSadaf Ebrahimi \xf8\x87\x80\x80\x80 159*22dc650dSSadaf EbrahimiFailed: error -20: UTF-8 error: overlong 5-byte sequence at offset 0 160*22dc650dSSadaf Ebrahimi \xfc\x83\x80\x80\x80\x80 161*22dc650dSSadaf EbrahimiFailed: error -21: UTF-8 error: overlong 6-byte sequence at offset 0 162*22dc650dSSadaf Ebrahimi \xfe\x80\x80\x80\x80\x80 163*22dc650dSSadaf EbrahimiFailed: error -23: UTF-8 error: illegal byte (0xfe or 0xff) at offset 0 164*22dc650dSSadaf Ebrahimi \xff\x80\x80\x80\x80\x80 165*22dc650dSSadaf EbrahimiFailed: error -23: UTF-8 error: illegal byte (0xfe or 0xff) at offset 0 166*22dc650dSSadaf Ebrahimi \xf8\x88\x80\x80\x80 167*22dc650dSSadaf EbrahimiFailed: error -13: UTF-8 error: 5-byte character is not allowed (RFC 3629) at offset 0 168*22dc650dSSadaf Ebrahimi \xf9\x87\x80\x80\x80 169*22dc650dSSadaf EbrahimiFailed: error -13: UTF-8 error: 5-byte character is not allowed (RFC 3629) at offset 0 170*22dc650dSSadaf Ebrahimi \xfc\x84\x80\x80\x80\x80 171*22dc650dSSadaf EbrahimiFailed: error -14: UTF-8 error: 6-byte character is not allowed (RFC 3629) at offset 0 172*22dc650dSSadaf Ebrahimi \xfd\x83\x80\x80\x80\x80 173*22dc650dSSadaf EbrahimiFailed: error -14: UTF-8 error: 6-byte character is not allowed (RFC 3629) at offset 0 174*22dc650dSSadaf Ebrahimi\= Expect no match 175*22dc650dSSadaf Ebrahimi \xc3\x8f 176*22dc650dSSadaf EbrahimiNo match 177*22dc650dSSadaf Ebrahimi \xe0\xaf\x80 178*22dc650dSSadaf EbrahimiNo match 179*22dc650dSSadaf Ebrahimi \xe1\x80\x80 180*22dc650dSSadaf EbrahimiNo match 181*22dc650dSSadaf Ebrahimi \xf0\x9f\x80\x80 182*22dc650dSSadaf EbrahimiNo match 183*22dc650dSSadaf Ebrahimi \xf1\x8f\x80\x80 184*22dc650dSSadaf EbrahimiNo match 185*22dc650dSSadaf Ebrahimi \xf8\x88\x80\x80\x80\=no_utf_check 186*22dc650dSSadaf EbrahimiNo match 187*22dc650dSSadaf Ebrahimi \xf9\x87\x80\x80\x80\=no_utf_check 188*22dc650dSSadaf EbrahimiNo match 189*22dc650dSSadaf Ebrahimi \xfc\x84\x80\x80\x80\x80\=no_utf_check 190*22dc650dSSadaf EbrahimiNo match 191*22dc650dSSadaf Ebrahimi \xfd\x83\x80\x80\x80\x80\=no_utf_check 192*22dc650dSSadaf EbrahimiNo match 193*22dc650dSSadaf Ebrahimi 194*22dc650dSSadaf Ebrahimi# Similar tests with offsets 195*22dc650dSSadaf Ebrahimi 196*22dc650dSSadaf Ebrahimi/badutf/utf 197*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 198*22dc650dSSadaf Ebrahimi X\xdfabcd 199*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 200*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=1 201*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 202*22dc650dSSadaf Ebrahimi\= Expect no match 203*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=2 204*22dc650dSSadaf EbrahimiNo match 205*22dc650dSSadaf Ebrahimi 206*22dc650dSSadaf Ebrahimi/(?<=x)badutf/utf 207*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 208*22dc650dSSadaf Ebrahimi X\xdfabcd 209*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 210*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=1 211*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 212*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=2 213*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 214*22dc650dSSadaf Ebrahimi X\xdfabcd\xdf\=offset=3 215*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 6 216*22dc650dSSadaf Ebrahimi\= Expect no match 217*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=3 218*22dc650dSSadaf EbrahimiNo match 219*22dc650dSSadaf Ebrahimi 220*22dc650dSSadaf Ebrahimi/(?<=xx)badutf/utf 221*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 222*22dc650dSSadaf Ebrahimi X\xdfabcd 223*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 224*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=1 225*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 226*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=2 227*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 228*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=3 229*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 230*22dc650dSSadaf Ebrahimi 231*22dc650dSSadaf Ebrahimi/(?<=xxxx)badutf/utf 232*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 233*22dc650dSSadaf Ebrahimi X\xdfabcd 234*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 235*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=1 236*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 237*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=2 238*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 239*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=3 240*22dc650dSSadaf EbrahimiFailed: error -8: UTF-8 error: byte 2 top bits not 0x80 at offset 1 241*22dc650dSSadaf Ebrahimi X\xdfabc\xdf\=offset=6 242*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end at offset 5 243*22dc650dSSadaf Ebrahimi X\xdfabc\xdf\=offset=7 244*22dc650dSSadaf EbrahimiFailed: error -33: bad offset value 245*22dc650dSSadaf Ebrahimi\= Expect no match 246*22dc650dSSadaf Ebrahimi X\xdfabcd\=offset=6 247*22dc650dSSadaf EbrahimiNo match 248*22dc650dSSadaf Ebrahimi 249*22dc650dSSadaf Ebrahimi/\x{100}/IB,utf 250*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 251*22dc650dSSadaf Ebrahimi Bra 252*22dc650dSSadaf Ebrahimi \x{100} 253*22dc650dSSadaf Ebrahimi Ket 254*22dc650dSSadaf Ebrahimi End 255*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 256*22dc650dSSadaf EbrahimiCapture group count = 0 257*22dc650dSSadaf EbrahimiOptions: utf 258*22dc650dSSadaf EbrahimiFirst code unit = \xc4 259*22dc650dSSadaf EbrahimiLast code unit = \x80 260*22dc650dSSadaf EbrahimiSubject length lower bound = 1 261*22dc650dSSadaf Ebrahimi 262*22dc650dSSadaf Ebrahimi/\x{1000}/IB,utf 263*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 264*22dc650dSSadaf Ebrahimi Bra 265*22dc650dSSadaf Ebrahimi \x{1000} 266*22dc650dSSadaf Ebrahimi Ket 267*22dc650dSSadaf Ebrahimi End 268*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 269*22dc650dSSadaf EbrahimiCapture group count = 0 270*22dc650dSSadaf EbrahimiOptions: utf 271*22dc650dSSadaf EbrahimiFirst code unit = \xe1 272*22dc650dSSadaf EbrahimiLast code unit = \x80 273*22dc650dSSadaf EbrahimiSubject length lower bound = 1 274*22dc650dSSadaf Ebrahimi 275*22dc650dSSadaf Ebrahimi/\x{10000}/IB,utf 276*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 277*22dc650dSSadaf Ebrahimi Bra 278*22dc650dSSadaf Ebrahimi \x{10000} 279*22dc650dSSadaf Ebrahimi Ket 280*22dc650dSSadaf Ebrahimi End 281*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 282*22dc650dSSadaf EbrahimiCapture group count = 0 283*22dc650dSSadaf EbrahimiOptions: utf 284*22dc650dSSadaf EbrahimiFirst code unit = \xf0 285*22dc650dSSadaf EbrahimiLast code unit = \x80 286*22dc650dSSadaf EbrahimiSubject length lower bound = 1 287*22dc650dSSadaf Ebrahimi 288*22dc650dSSadaf Ebrahimi/\x{100000}/IB,utf 289*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 290*22dc650dSSadaf Ebrahimi Bra 291*22dc650dSSadaf Ebrahimi \x{100000} 292*22dc650dSSadaf Ebrahimi Ket 293*22dc650dSSadaf Ebrahimi End 294*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 295*22dc650dSSadaf EbrahimiCapture group count = 0 296*22dc650dSSadaf EbrahimiOptions: utf 297*22dc650dSSadaf EbrahimiFirst code unit = \xf4 298*22dc650dSSadaf EbrahimiLast code unit = \x80 299*22dc650dSSadaf EbrahimiSubject length lower bound = 1 300*22dc650dSSadaf Ebrahimi 301*22dc650dSSadaf Ebrahimi/\x{10ffff}/IB,utf 302*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 303*22dc650dSSadaf Ebrahimi Bra 304*22dc650dSSadaf Ebrahimi \x{10ffff} 305*22dc650dSSadaf Ebrahimi Ket 306*22dc650dSSadaf Ebrahimi End 307*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 308*22dc650dSSadaf EbrahimiCapture group count = 0 309*22dc650dSSadaf EbrahimiOptions: utf 310*22dc650dSSadaf EbrahimiFirst code unit = \xf4 311*22dc650dSSadaf EbrahimiLast code unit = \xbf 312*22dc650dSSadaf EbrahimiSubject length lower bound = 1 313*22dc650dSSadaf Ebrahimi 314*22dc650dSSadaf Ebrahimi/[\x{ff}]/IB,utf 315*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 316*22dc650dSSadaf Ebrahimi Bra 317*22dc650dSSadaf Ebrahimi \x{ff} 318*22dc650dSSadaf Ebrahimi Ket 319*22dc650dSSadaf Ebrahimi End 320*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 321*22dc650dSSadaf EbrahimiCapture group count = 0 322*22dc650dSSadaf EbrahimiOptions: utf 323*22dc650dSSadaf EbrahimiFirst code unit = \xc3 324*22dc650dSSadaf EbrahimiLast code unit = \xbf 325*22dc650dSSadaf EbrahimiSubject length lower bound = 1 326*22dc650dSSadaf Ebrahimi 327*22dc650dSSadaf Ebrahimi/[\x{100}]/IB,utf 328*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 329*22dc650dSSadaf Ebrahimi Bra 330*22dc650dSSadaf Ebrahimi \x{100} 331*22dc650dSSadaf Ebrahimi Ket 332*22dc650dSSadaf Ebrahimi End 333*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 334*22dc650dSSadaf EbrahimiCapture group count = 0 335*22dc650dSSadaf EbrahimiOptions: utf 336*22dc650dSSadaf EbrahimiFirst code unit = \xc4 337*22dc650dSSadaf EbrahimiLast code unit = \x80 338*22dc650dSSadaf EbrahimiSubject length lower bound = 1 339*22dc650dSSadaf Ebrahimi 340*22dc650dSSadaf Ebrahimi/\x80/IB,utf 341*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 342*22dc650dSSadaf Ebrahimi Bra 343*22dc650dSSadaf Ebrahimi \x{80} 344*22dc650dSSadaf Ebrahimi Ket 345*22dc650dSSadaf Ebrahimi End 346*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 347*22dc650dSSadaf EbrahimiCapture group count = 0 348*22dc650dSSadaf EbrahimiOptions: utf 349*22dc650dSSadaf EbrahimiFirst code unit = \xc2 350*22dc650dSSadaf EbrahimiLast code unit = \x80 351*22dc650dSSadaf EbrahimiSubject length lower bound = 1 352*22dc650dSSadaf Ebrahimi 353*22dc650dSSadaf Ebrahimi/\xff/IB,utf 354*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 355*22dc650dSSadaf Ebrahimi Bra 356*22dc650dSSadaf Ebrahimi \x{ff} 357*22dc650dSSadaf Ebrahimi Ket 358*22dc650dSSadaf Ebrahimi End 359*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 360*22dc650dSSadaf EbrahimiCapture group count = 0 361*22dc650dSSadaf EbrahimiOptions: utf 362*22dc650dSSadaf EbrahimiFirst code unit = \xc3 363*22dc650dSSadaf EbrahimiLast code unit = \xbf 364*22dc650dSSadaf EbrahimiSubject length lower bound = 1 365*22dc650dSSadaf Ebrahimi 366*22dc650dSSadaf Ebrahimi/\x{D55c}\x{ad6d}\x{C5B4}/IB,utf 367*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 368*22dc650dSSadaf Ebrahimi Bra 369*22dc650dSSadaf Ebrahimi \x{d55c}\x{ad6d}\x{c5b4} 370*22dc650dSSadaf Ebrahimi Ket 371*22dc650dSSadaf Ebrahimi End 372*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 373*22dc650dSSadaf EbrahimiCapture group count = 0 374*22dc650dSSadaf EbrahimiOptions: utf 375*22dc650dSSadaf EbrahimiFirst code unit = \xed 376*22dc650dSSadaf EbrahimiLast code unit = \xb4 377*22dc650dSSadaf EbrahimiSubject length lower bound = 3 378*22dc650dSSadaf Ebrahimi \x{D55c}\x{ad6d}\x{C5B4} 379*22dc650dSSadaf Ebrahimi 0: \x{d55c}\x{ad6d}\x{c5b4} 380*22dc650dSSadaf Ebrahimi 381*22dc650dSSadaf Ebrahimi/\x{65e5}\x{672c}\x{8a9e}/IB,utf 382*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 383*22dc650dSSadaf Ebrahimi Bra 384*22dc650dSSadaf Ebrahimi \x{65e5}\x{672c}\x{8a9e} 385*22dc650dSSadaf Ebrahimi Ket 386*22dc650dSSadaf Ebrahimi End 387*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 388*22dc650dSSadaf EbrahimiCapture group count = 0 389*22dc650dSSadaf EbrahimiOptions: utf 390*22dc650dSSadaf EbrahimiFirst code unit = \xe6 391*22dc650dSSadaf EbrahimiLast code unit = \x9e 392*22dc650dSSadaf EbrahimiSubject length lower bound = 3 393*22dc650dSSadaf Ebrahimi \x{65e5}\x{672c}\x{8a9e} 394*22dc650dSSadaf Ebrahimi 0: \x{65e5}\x{672c}\x{8a9e} 395*22dc650dSSadaf Ebrahimi 396*22dc650dSSadaf Ebrahimi/\x{80}/IB,utf 397*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 398*22dc650dSSadaf Ebrahimi Bra 399*22dc650dSSadaf Ebrahimi \x{80} 400*22dc650dSSadaf Ebrahimi Ket 401*22dc650dSSadaf Ebrahimi End 402*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 403*22dc650dSSadaf EbrahimiCapture group count = 0 404*22dc650dSSadaf EbrahimiOptions: utf 405*22dc650dSSadaf EbrahimiFirst code unit = \xc2 406*22dc650dSSadaf EbrahimiLast code unit = \x80 407*22dc650dSSadaf EbrahimiSubject length lower bound = 1 408*22dc650dSSadaf Ebrahimi 409*22dc650dSSadaf Ebrahimi/\x{084}/IB,utf 410*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 411*22dc650dSSadaf Ebrahimi Bra 412*22dc650dSSadaf Ebrahimi \x{84} 413*22dc650dSSadaf Ebrahimi Ket 414*22dc650dSSadaf Ebrahimi End 415*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 416*22dc650dSSadaf EbrahimiCapture group count = 0 417*22dc650dSSadaf EbrahimiOptions: utf 418*22dc650dSSadaf EbrahimiFirst code unit = \xc2 419*22dc650dSSadaf EbrahimiLast code unit = \x84 420*22dc650dSSadaf EbrahimiSubject length lower bound = 1 421*22dc650dSSadaf Ebrahimi 422*22dc650dSSadaf Ebrahimi/\x{104}/IB,utf 423*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 424*22dc650dSSadaf Ebrahimi Bra 425*22dc650dSSadaf Ebrahimi \x{104} 426*22dc650dSSadaf Ebrahimi Ket 427*22dc650dSSadaf Ebrahimi End 428*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 429*22dc650dSSadaf EbrahimiCapture group count = 0 430*22dc650dSSadaf EbrahimiOptions: utf 431*22dc650dSSadaf EbrahimiFirst code unit = \xc4 432*22dc650dSSadaf EbrahimiLast code unit = \x84 433*22dc650dSSadaf EbrahimiSubject length lower bound = 1 434*22dc650dSSadaf Ebrahimi 435*22dc650dSSadaf Ebrahimi/\x{861}/IB,utf 436*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 437*22dc650dSSadaf Ebrahimi Bra 438*22dc650dSSadaf Ebrahimi \x{861} 439*22dc650dSSadaf Ebrahimi Ket 440*22dc650dSSadaf Ebrahimi End 441*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 442*22dc650dSSadaf EbrahimiCapture group count = 0 443*22dc650dSSadaf EbrahimiOptions: utf 444*22dc650dSSadaf EbrahimiFirst code unit = \xe0 445*22dc650dSSadaf EbrahimiLast code unit = \xa1 446*22dc650dSSadaf EbrahimiSubject length lower bound = 1 447*22dc650dSSadaf Ebrahimi 448*22dc650dSSadaf Ebrahimi/\x{212ab}/IB,utf 449*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 450*22dc650dSSadaf Ebrahimi Bra 451*22dc650dSSadaf Ebrahimi \x{212ab} 452*22dc650dSSadaf Ebrahimi Ket 453*22dc650dSSadaf Ebrahimi End 454*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 455*22dc650dSSadaf EbrahimiCapture group count = 0 456*22dc650dSSadaf EbrahimiOptions: utf 457*22dc650dSSadaf EbrahimiFirst code unit = \xf0 458*22dc650dSSadaf EbrahimiLast code unit = \xab 459*22dc650dSSadaf EbrahimiSubject length lower bound = 1 460*22dc650dSSadaf Ebrahimi 461*22dc650dSSadaf Ebrahimi/[^ab\xC0-\xF0]/IB,utf 462*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 463*22dc650dSSadaf Ebrahimi Bra 464*22dc650dSSadaf Ebrahimi [\x00-`c-\xbf\xf1-\xff] (neg) 465*22dc650dSSadaf Ebrahimi Ket 466*22dc650dSSadaf Ebrahimi End 467*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 468*22dc650dSSadaf EbrahimiCapture group count = 0 469*22dc650dSSadaf EbrahimiOptions: utf 470*22dc650dSSadaf EbrahimiStarting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a 471*22dc650dSSadaf Ebrahimi \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 472*22dc650dSSadaf Ebrahimi \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 473*22dc650dSSadaf Ebrahimi 5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y 474*22dc650dSSadaf Ebrahimi Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f 475*22dc650dSSadaf Ebrahimi \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 476*22dc650dSSadaf Ebrahimi \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf 477*22dc650dSSadaf Ebrahimi \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee 478*22dc650dSSadaf Ebrahimi \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd 479*22dc650dSSadaf Ebrahimi \xfe \xff 480*22dc650dSSadaf EbrahimiSubject length lower bound = 1 481*22dc650dSSadaf Ebrahimi \x{f1} 482*22dc650dSSadaf Ebrahimi 0: \x{f1} 483*22dc650dSSadaf Ebrahimi \x{bf} 484*22dc650dSSadaf Ebrahimi 0: \x{bf} 485*22dc650dSSadaf Ebrahimi \x{100} 486*22dc650dSSadaf Ebrahimi 0: \x{100} 487*22dc650dSSadaf Ebrahimi \x{1000} 488*22dc650dSSadaf Ebrahimi 0: \x{1000} 489*22dc650dSSadaf Ebrahimi\= Expect no match 490*22dc650dSSadaf Ebrahimi \x{c0} 491*22dc650dSSadaf EbrahimiNo match 492*22dc650dSSadaf Ebrahimi \x{f0} 493*22dc650dSSadaf EbrahimiNo match 494*22dc650dSSadaf Ebrahimi 495*22dc650dSSadaf Ebrahimi/Ā{3,4}/IB,utf 496*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 497*22dc650dSSadaf Ebrahimi Bra 498*22dc650dSSadaf Ebrahimi \x{100}{3} 499*22dc650dSSadaf Ebrahimi \x{100}?+ 500*22dc650dSSadaf Ebrahimi Ket 501*22dc650dSSadaf Ebrahimi End 502*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 503*22dc650dSSadaf EbrahimiCapture group count = 0 504*22dc650dSSadaf EbrahimiOptions: utf 505*22dc650dSSadaf EbrahimiFirst code unit = \xc4 506*22dc650dSSadaf EbrahimiLast code unit = \x80 507*22dc650dSSadaf EbrahimiSubject length lower bound = 3 508*22dc650dSSadaf Ebrahimi \x{100}\x{100}\x{100}\x{100\x{100} 509*22dc650dSSadaf Ebrahimi 0: \x{100}\x{100}\x{100} 510*22dc650dSSadaf Ebrahimi 511*22dc650dSSadaf Ebrahimi/(\x{100}+|x)/IB,utf 512*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 513*22dc650dSSadaf Ebrahimi Bra 514*22dc650dSSadaf Ebrahimi CBra 1 515*22dc650dSSadaf Ebrahimi \x{100}++ 516*22dc650dSSadaf Ebrahimi Alt 517*22dc650dSSadaf Ebrahimi x 518*22dc650dSSadaf Ebrahimi Ket 519*22dc650dSSadaf Ebrahimi Ket 520*22dc650dSSadaf Ebrahimi End 521*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 522*22dc650dSSadaf EbrahimiCapture group count = 1 523*22dc650dSSadaf EbrahimiOptions: utf 524*22dc650dSSadaf EbrahimiStarting code units: x \xc4 525*22dc650dSSadaf EbrahimiSubject length lower bound = 1 526*22dc650dSSadaf Ebrahimi 527*22dc650dSSadaf Ebrahimi/(\x{100}*a|x)/IB,utf 528*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 529*22dc650dSSadaf Ebrahimi Bra 530*22dc650dSSadaf Ebrahimi CBra 1 531*22dc650dSSadaf Ebrahimi \x{100}*+ 532*22dc650dSSadaf Ebrahimi a 533*22dc650dSSadaf Ebrahimi Alt 534*22dc650dSSadaf Ebrahimi x 535*22dc650dSSadaf Ebrahimi Ket 536*22dc650dSSadaf Ebrahimi Ket 537*22dc650dSSadaf Ebrahimi End 538*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 539*22dc650dSSadaf EbrahimiCapture group count = 1 540*22dc650dSSadaf EbrahimiOptions: utf 541*22dc650dSSadaf EbrahimiStarting code units: a x \xc4 542*22dc650dSSadaf EbrahimiSubject length lower bound = 1 543*22dc650dSSadaf Ebrahimi 544*22dc650dSSadaf Ebrahimi/(\x{100}{0,2}a|x)/IB,utf 545*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 546*22dc650dSSadaf Ebrahimi Bra 547*22dc650dSSadaf Ebrahimi CBra 1 548*22dc650dSSadaf Ebrahimi \x{100}{0,2}+ 549*22dc650dSSadaf Ebrahimi a 550*22dc650dSSadaf Ebrahimi Alt 551*22dc650dSSadaf Ebrahimi x 552*22dc650dSSadaf Ebrahimi Ket 553*22dc650dSSadaf Ebrahimi Ket 554*22dc650dSSadaf Ebrahimi End 555*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 556*22dc650dSSadaf EbrahimiCapture group count = 1 557*22dc650dSSadaf EbrahimiOptions: utf 558*22dc650dSSadaf EbrahimiStarting code units: a x \xc4 559*22dc650dSSadaf EbrahimiSubject length lower bound = 1 560*22dc650dSSadaf Ebrahimi 561*22dc650dSSadaf Ebrahimi/(\x{100}{1,2}a|x)/IB,utf 562*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 563*22dc650dSSadaf Ebrahimi Bra 564*22dc650dSSadaf Ebrahimi CBra 1 565*22dc650dSSadaf Ebrahimi \x{100} 566*22dc650dSSadaf Ebrahimi \x{100}{0,1}+ 567*22dc650dSSadaf Ebrahimi a 568*22dc650dSSadaf Ebrahimi Alt 569*22dc650dSSadaf Ebrahimi x 570*22dc650dSSadaf Ebrahimi Ket 571*22dc650dSSadaf Ebrahimi Ket 572*22dc650dSSadaf Ebrahimi End 573*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 574*22dc650dSSadaf EbrahimiCapture group count = 1 575*22dc650dSSadaf EbrahimiOptions: utf 576*22dc650dSSadaf EbrahimiStarting code units: x \xc4 577*22dc650dSSadaf EbrahimiSubject length lower bound = 1 578*22dc650dSSadaf Ebrahimi 579*22dc650dSSadaf Ebrahimi/\x{100}/IB,utf 580*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 581*22dc650dSSadaf Ebrahimi Bra 582*22dc650dSSadaf Ebrahimi \x{100} 583*22dc650dSSadaf Ebrahimi Ket 584*22dc650dSSadaf Ebrahimi End 585*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 586*22dc650dSSadaf EbrahimiCapture group count = 0 587*22dc650dSSadaf EbrahimiOptions: utf 588*22dc650dSSadaf EbrahimiFirst code unit = \xc4 589*22dc650dSSadaf EbrahimiLast code unit = \x80 590*22dc650dSSadaf EbrahimiSubject length lower bound = 1 591*22dc650dSSadaf Ebrahimi 592*22dc650dSSadaf Ebrahimi/a\x{100}\x{101}*/IB,utf 593*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 594*22dc650dSSadaf Ebrahimi Bra 595*22dc650dSSadaf Ebrahimi a\x{100} 596*22dc650dSSadaf Ebrahimi \x{101}*+ 597*22dc650dSSadaf Ebrahimi Ket 598*22dc650dSSadaf Ebrahimi End 599*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 600*22dc650dSSadaf EbrahimiCapture group count = 0 601*22dc650dSSadaf EbrahimiOptions: utf 602*22dc650dSSadaf EbrahimiFirst code unit = 'a' 603*22dc650dSSadaf EbrahimiLast code unit = \x80 604*22dc650dSSadaf EbrahimiSubject length lower bound = 2 605*22dc650dSSadaf Ebrahimi 606*22dc650dSSadaf Ebrahimi/a\x{100}\x{101}+/IB,utf 607*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 608*22dc650dSSadaf Ebrahimi Bra 609*22dc650dSSadaf Ebrahimi a\x{100} 610*22dc650dSSadaf Ebrahimi \x{101}++ 611*22dc650dSSadaf Ebrahimi Ket 612*22dc650dSSadaf Ebrahimi End 613*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 614*22dc650dSSadaf EbrahimiCapture group count = 0 615*22dc650dSSadaf EbrahimiOptions: utf 616*22dc650dSSadaf EbrahimiFirst code unit = 'a' 617*22dc650dSSadaf EbrahimiLast code unit = \x81 618*22dc650dSSadaf EbrahimiSubject length lower bound = 3 619*22dc650dSSadaf Ebrahimi 620*22dc650dSSadaf Ebrahimi/[^\x{c4}]/IB 621*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 622*22dc650dSSadaf Ebrahimi Bra 623*22dc650dSSadaf Ebrahimi [^\x{c4}] 624*22dc650dSSadaf Ebrahimi Ket 625*22dc650dSSadaf Ebrahimi End 626*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 627*22dc650dSSadaf EbrahimiCapture group count = 0 628*22dc650dSSadaf EbrahimiSubject length lower bound = 1 629*22dc650dSSadaf Ebrahimi 630*22dc650dSSadaf Ebrahimi/[\x{100}]/IB,utf 631*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 632*22dc650dSSadaf Ebrahimi Bra 633*22dc650dSSadaf Ebrahimi \x{100} 634*22dc650dSSadaf Ebrahimi Ket 635*22dc650dSSadaf Ebrahimi End 636*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 637*22dc650dSSadaf EbrahimiCapture group count = 0 638*22dc650dSSadaf EbrahimiOptions: utf 639*22dc650dSSadaf EbrahimiFirst code unit = \xc4 640*22dc650dSSadaf EbrahimiLast code unit = \x80 641*22dc650dSSadaf EbrahimiSubject length lower bound = 1 642*22dc650dSSadaf Ebrahimi \x{100} 643*22dc650dSSadaf Ebrahimi 0: \x{100} 644*22dc650dSSadaf Ebrahimi Z\x{100} 645*22dc650dSSadaf Ebrahimi 0: \x{100} 646*22dc650dSSadaf Ebrahimi \x{100}Z 647*22dc650dSSadaf Ebrahimi 0: \x{100} 648*22dc650dSSadaf Ebrahimi 649*22dc650dSSadaf Ebrahimi/[\xff]/IB,utf 650*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 651*22dc650dSSadaf Ebrahimi Bra 652*22dc650dSSadaf Ebrahimi \x{ff} 653*22dc650dSSadaf Ebrahimi Ket 654*22dc650dSSadaf Ebrahimi End 655*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 656*22dc650dSSadaf EbrahimiCapture group count = 0 657*22dc650dSSadaf EbrahimiOptions: utf 658*22dc650dSSadaf EbrahimiFirst code unit = \xc3 659*22dc650dSSadaf EbrahimiLast code unit = \xbf 660*22dc650dSSadaf EbrahimiSubject length lower bound = 1 661*22dc650dSSadaf Ebrahimi >\x{ff}< 662*22dc650dSSadaf Ebrahimi 0: \x{ff} 663*22dc650dSSadaf Ebrahimi 664*22dc650dSSadaf Ebrahimi/[^\xff]/IB,utf 665*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 666*22dc650dSSadaf Ebrahimi Bra 667*22dc650dSSadaf Ebrahimi [^\x{ff}] 668*22dc650dSSadaf Ebrahimi Ket 669*22dc650dSSadaf Ebrahimi End 670*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 671*22dc650dSSadaf EbrahimiCapture group count = 0 672*22dc650dSSadaf EbrahimiOptions: utf 673*22dc650dSSadaf EbrahimiSubject length lower bound = 1 674*22dc650dSSadaf Ebrahimi 675*22dc650dSSadaf Ebrahimi/\x{100}abc(xyz(?1))/IB,utf 676*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 677*22dc650dSSadaf Ebrahimi Bra 678*22dc650dSSadaf Ebrahimi \x{100}abc 679*22dc650dSSadaf Ebrahimi CBra 1 680*22dc650dSSadaf Ebrahimi xyz 681*22dc650dSSadaf Ebrahimi Recurse 682*22dc650dSSadaf Ebrahimi Ket 683*22dc650dSSadaf Ebrahimi Ket 684*22dc650dSSadaf Ebrahimi End 685*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 686*22dc650dSSadaf EbrahimiCapture group count = 1 687*22dc650dSSadaf EbrahimiOptions: utf 688*22dc650dSSadaf EbrahimiFirst code unit = \xc4 689*22dc650dSSadaf EbrahimiLast code unit = 'z' 690*22dc650dSSadaf EbrahimiSubject length lower bound = 7 691*22dc650dSSadaf Ebrahimi 692*22dc650dSSadaf Ebrahimi/\777/I,utf 693*22dc650dSSadaf EbrahimiCapture group count = 0 694*22dc650dSSadaf EbrahimiOptions: utf 695*22dc650dSSadaf EbrahimiFirst code unit = \xc7 696*22dc650dSSadaf EbrahimiLast code unit = \xbf 697*22dc650dSSadaf EbrahimiSubject length lower bound = 1 698*22dc650dSSadaf Ebrahimi \x{1ff} 699*22dc650dSSadaf Ebrahimi 0: \x{1ff} 700*22dc650dSSadaf Ebrahimi \777 701*22dc650dSSadaf Ebrahimi 0: \x{1ff} 702*22dc650dSSadaf Ebrahimi 703*22dc650dSSadaf Ebrahimi/\x{100}+\x{200}/IB,utf 704*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 705*22dc650dSSadaf Ebrahimi Bra 706*22dc650dSSadaf Ebrahimi \x{100}++ 707*22dc650dSSadaf Ebrahimi \x{200} 708*22dc650dSSadaf Ebrahimi Ket 709*22dc650dSSadaf Ebrahimi End 710*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 711*22dc650dSSadaf EbrahimiCapture group count = 0 712*22dc650dSSadaf EbrahimiOptions: utf 713*22dc650dSSadaf EbrahimiFirst code unit = \xc4 714*22dc650dSSadaf EbrahimiLast code unit = \x80 715*22dc650dSSadaf EbrahimiSubject length lower bound = 2 716*22dc650dSSadaf Ebrahimi 717*22dc650dSSadaf Ebrahimi/\x{100}+X/IB,utf 718*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 719*22dc650dSSadaf Ebrahimi Bra 720*22dc650dSSadaf Ebrahimi \x{100}++ 721*22dc650dSSadaf Ebrahimi X 722*22dc650dSSadaf Ebrahimi Ket 723*22dc650dSSadaf Ebrahimi End 724*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 725*22dc650dSSadaf EbrahimiCapture group count = 0 726*22dc650dSSadaf EbrahimiOptions: utf 727*22dc650dSSadaf EbrahimiFirst code unit = \xc4 728*22dc650dSSadaf EbrahimiLast code unit = 'X' 729*22dc650dSSadaf EbrahimiSubject length lower bound = 2 730*22dc650dSSadaf Ebrahimi 731*22dc650dSSadaf Ebrahimi/^[\QĀ\E-\QŐ\E/B,utf 732*22dc650dSSadaf EbrahimiFailed: error 106 at offset 15: missing terminating ] for character class 733*22dc650dSSadaf Ebrahimi 734*22dc650dSSadaf Ebrahimi# This tests the stricter UTF-8 check according to RFC 3629. 735*22dc650dSSadaf Ebrahimi 736*22dc650dSSadaf Ebrahimi/X/utf 737*22dc650dSSadaf Ebrahimi\= Expect UTF-8 errors 738*22dc650dSSadaf Ebrahimi \x{d800} 739*22dc650dSSadaf EbrahimiFailed: error -16: UTF-8 error: code points 0xd800-0xdfff are not defined at offset 0 740*22dc650dSSadaf Ebrahimi \x{da00} 741*22dc650dSSadaf EbrahimiFailed: error -16: UTF-8 error: code points 0xd800-0xdfff are not defined at offset 0 742*22dc650dSSadaf Ebrahimi \x{dfff} 743*22dc650dSSadaf EbrahimiFailed: error -16: UTF-8 error: code points 0xd800-0xdfff are not defined at offset 0 744*22dc650dSSadaf Ebrahimi \x{110000} 745*22dc650dSSadaf EbrahimiFailed: error -15: UTF-8 error: code points greater than 0x10ffff are not defined at offset 0 746*22dc650dSSadaf Ebrahimi \x{2000000} 747*22dc650dSSadaf EbrahimiFailed: error -13: UTF-8 error: 5-byte character is not allowed (RFC 3629) at offset 0 748*22dc650dSSadaf Ebrahimi \x{7fffffff} 749*22dc650dSSadaf EbrahimiFailed: error -14: UTF-8 error: 6-byte character is not allowed (RFC 3629) at offset 0 750*22dc650dSSadaf Ebrahimi\= Expect no match 751*22dc650dSSadaf Ebrahimi \x{d800}\=no_utf_check 752*22dc650dSSadaf EbrahimiNo match 753*22dc650dSSadaf Ebrahimi \x{da00}\=no_utf_check 754*22dc650dSSadaf EbrahimiNo match 755*22dc650dSSadaf Ebrahimi \x{dfff}\=no_utf_check 756*22dc650dSSadaf EbrahimiNo match 757*22dc650dSSadaf Ebrahimi \x{110000}\=no_utf_check 758*22dc650dSSadaf EbrahimiNo match 759*22dc650dSSadaf Ebrahimi \x{2000000}\=no_utf_check 760*22dc650dSSadaf EbrahimiNo match 761*22dc650dSSadaf Ebrahimi \x{7fffffff}\=no_utf_check 762*22dc650dSSadaf EbrahimiNo match 763*22dc650dSSadaf Ebrahimi 764*22dc650dSSadaf Ebrahimi/(*UTF8)\x{1234}/ 765*22dc650dSSadaf Ebrahimi abcd\x{1234}pqr 766*22dc650dSSadaf Ebrahimi 0: \x{1234} 767*22dc650dSSadaf Ebrahimi 768*22dc650dSSadaf Ebrahimi/(*CRLF)(*UTF)(*BSR_UNICODE)a\Rb/I 769*22dc650dSSadaf EbrahimiCapture group count = 0 770*22dc650dSSadaf EbrahimiCompile options: <none> 771*22dc650dSSadaf EbrahimiOverall options: utf 772*22dc650dSSadaf Ebrahimi\R matches any Unicode newline 773*22dc650dSSadaf EbrahimiForced newline is CRLF 774*22dc650dSSadaf EbrahimiFirst code unit = 'a' 775*22dc650dSSadaf EbrahimiLast code unit = 'b' 776*22dc650dSSadaf EbrahimiSubject length lower bound = 3 777*22dc650dSSadaf Ebrahimi 778*22dc650dSSadaf Ebrahimi/\h/I,utf 779*22dc650dSSadaf EbrahimiCapture group count = 0 780*22dc650dSSadaf EbrahimiOptions: utf 781*22dc650dSSadaf EbrahimiStarting code units: \x09 \x20 \xc2 \xe1 \xe2 \xe3 782*22dc650dSSadaf EbrahimiSubject length lower bound = 1 783*22dc650dSSadaf Ebrahimi ABC\x{09} 784*22dc650dSSadaf Ebrahimi 0: \x{09} 785*22dc650dSSadaf Ebrahimi ABC\x{20} 786*22dc650dSSadaf Ebrahimi 0: 787*22dc650dSSadaf Ebrahimi ABC\x{a0} 788*22dc650dSSadaf Ebrahimi 0: \x{a0} 789*22dc650dSSadaf Ebrahimi ABC\x{1680} 790*22dc650dSSadaf Ebrahimi 0: \x{1680} 791*22dc650dSSadaf Ebrahimi ABC\x{180e} 792*22dc650dSSadaf Ebrahimi 0: \x{180e} 793*22dc650dSSadaf Ebrahimi ABC\x{2000} 794*22dc650dSSadaf Ebrahimi 0: \x{2000} 795*22dc650dSSadaf Ebrahimi ABC\x{202f} 796*22dc650dSSadaf Ebrahimi 0: \x{202f} 797*22dc650dSSadaf Ebrahimi ABC\x{205f} 798*22dc650dSSadaf Ebrahimi 0: \x{205f} 799*22dc650dSSadaf Ebrahimi ABC\x{3000} 800*22dc650dSSadaf Ebrahimi 0: \x{3000} 801*22dc650dSSadaf Ebrahimi 802*22dc650dSSadaf Ebrahimi/\v/I,utf 803*22dc650dSSadaf EbrahimiCapture group count = 0 804*22dc650dSSadaf EbrahimiOptions: utf 805*22dc650dSSadaf EbrahimiStarting code units: \x0a \x0b \x0c \x0d \xc2 \xe2 806*22dc650dSSadaf EbrahimiSubject length lower bound = 1 807*22dc650dSSadaf Ebrahimi ABC\x{0a} 808*22dc650dSSadaf Ebrahimi 0: \x{0a} 809*22dc650dSSadaf Ebrahimi ABC\x{0b} 810*22dc650dSSadaf Ebrahimi 0: \x{0b} 811*22dc650dSSadaf Ebrahimi ABC\x{0c} 812*22dc650dSSadaf Ebrahimi 0: \x{0c} 813*22dc650dSSadaf Ebrahimi ABC\x{0d} 814*22dc650dSSadaf Ebrahimi 0: \x{0d} 815*22dc650dSSadaf Ebrahimi ABC\x{85} 816*22dc650dSSadaf Ebrahimi 0: \x{85} 817*22dc650dSSadaf Ebrahimi ABC\x{2028} 818*22dc650dSSadaf Ebrahimi 0: \x{2028} 819*22dc650dSSadaf Ebrahimi 820*22dc650dSSadaf Ebrahimi/\h*A/I,utf 821*22dc650dSSadaf EbrahimiCapture group count = 0 822*22dc650dSSadaf EbrahimiOptions: utf 823*22dc650dSSadaf EbrahimiStarting code units: \x09 \x20 A \xc2 \xe1 \xe2 \xe3 824*22dc650dSSadaf EbrahimiLast code unit = 'A' 825*22dc650dSSadaf EbrahimiSubject length lower bound = 1 826*22dc650dSSadaf Ebrahimi CDBABC 827*22dc650dSSadaf Ebrahimi 0: A 828*22dc650dSSadaf Ebrahimi 829*22dc650dSSadaf Ebrahimi/\v+A/I,utf 830*22dc650dSSadaf EbrahimiCapture group count = 0 831*22dc650dSSadaf EbrahimiOptions: utf 832*22dc650dSSadaf EbrahimiStarting code units: \x0a \x0b \x0c \x0d \xc2 \xe2 833*22dc650dSSadaf EbrahimiLast code unit = 'A' 834*22dc650dSSadaf EbrahimiSubject length lower bound = 2 835*22dc650dSSadaf Ebrahimi 836*22dc650dSSadaf Ebrahimi/\s?xxx\s/I,utf 837*22dc650dSSadaf EbrahimiCapture group count = 0 838*22dc650dSSadaf EbrahimiOptions: utf 839*22dc650dSSadaf EbrahimiStarting code units: \x09 \x0a \x0b \x0c \x0d \x20 x 840*22dc650dSSadaf EbrahimiLast code unit = 'x' 841*22dc650dSSadaf EbrahimiSubject length lower bound = 4 842*22dc650dSSadaf Ebrahimi 843*22dc650dSSadaf Ebrahimi/\sxxx\s/I,utf,tables=2 844*22dc650dSSadaf EbrahimiCapture group count = 0 845*22dc650dSSadaf EbrahimiOptions: utf 846*22dc650dSSadaf EbrahimiStarting code units: \x09 \x0a \x0b \x0c \x0d \x20 \xc2 847*22dc650dSSadaf EbrahimiLast code unit = 'x' 848*22dc650dSSadaf EbrahimiSubject length lower bound = 5 849*22dc650dSSadaf Ebrahimi AB\x{85}xxx\x{a0}XYZ 850*22dc650dSSadaf Ebrahimi 0: \x{85}xxx\x{a0} 851*22dc650dSSadaf Ebrahimi AB\x{a0}xxx\x{85}XYZ 852*22dc650dSSadaf Ebrahimi 0: \x{a0}xxx\x{85} 853*22dc650dSSadaf Ebrahimi 854*22dc650dSSadaf Ebrahimi/\S \S/I,utf,tables=2 855*22dc650dSSadaf EbrahimiCapture group count = 0 856*22dc650dSSadaf EbrahimiOptions: utf 857*22dc650dSSadaf EbrahimiStarting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0e \x0f 858*22dc650dSSadaf Ebrahimi \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d \x1e 859*22dc650dSSadaf Ebrahimi \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @ A B C 860*22dc650dSSadaf Ebrahimi D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e f g h 861*22dc650dSSadaf Ebrahimi i j k l m n o p q r s t u v w x y z { | } ~ \x7f \xc0 \xc1 \xc2 \xc3 \xc4 862*22dc650dSSadaf Ebrahimi \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2 \xd3 863*22dc650dSSadaf Ebrahimi \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1 \xe2 864*22dc650dSSadaf Ebrahimi \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef \xf0 \xf1 865*22dc650dSSadaf Ebrahimi \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff 866*22dc650dSSadaf EbrahimiLast code unit = ' ' 867*22dc650dSSadaf EbrahimiSubject length lower bound = 3 868*22dc650dSSadaf Ebrahimi \x{a2} \x{84} 869*22dc650dSSadaf Ebrahimi 0: \x{a2} \x{84} 870*22dc650dSSadaf Ebrahimi A Z 871*22dc650dSSadaf Ebrahimi 0: A Z 872*22dc650dSSadaf Ebrahimi 873*22dc650dSSadaf Ebrahimi/a+/utf 874*22dc650dSSadaf Ebrahimi a\x{123}aa\=offset=1 875*22dc650dSSadaf Ebrahimi 0: aa 876*22dc650dSSadaf Ebrahimi a\x{123}aa\=offset=3 877*22dc650dSSadaf Ebrahimi 0: aa 878*22dc650dSSadaf Ebrahimi a\x{123}aa\=offset=4 879*22dc650dSSadaf Ebrahimi 0: a 880*22dc650dSSadaf Ebrahimi\= Expect bad offset value 881*22dc650dSSadaf Ebrahimi a\x{123}aa\=offset=6 882*22dc650dSSadaf EbrahimiFailed: error -33: bad offset value 883*22dc650dSSadaf Ebrahimi\= Expect bad UTF-8 offset 884*22dc650dSSadaf Ebrahimi a\x{123}aa\=offset=2 885*22dc650dSSadaf EbrahimiError -36 (bad UTF-8 offset) 886*22dc650dSSadaf Ebrahimi\= Expect no match 887*22dc650dSSadaf Ebrahimi a\x{123}aa\=offset=5 888*22dc650dSSadaf EbrahimiNo match 889*22dc650dSSadaf Ebrahimi 890*22dc650dSSadaf Ebrahimi/\x{1234}+/Ii,utf 891*22dc650dSSadaf EbrahimiCapture group count = 0 892*22dc650dSSadaf EbrahimiOptions: caseless utf 893*22dc650dSSadaf EbrahimiStarting code units: \xe1 894*22dc650dSSadaf EbrahimiSubject length lower bound = 1 895*22dc650dSSadaf Ebrahimi 896*22dc650dSSadaf Ebrahimi/\x{1234}+?/Ii,utf 897*22dc650dSSadaf EbrahimiCapture group count = 0 898*22dc650dSSadaf EbrahimiOptions: caseless utf 899*22dc650dSSadaf EbrahimiStarting code units: \xe1 900*22dc650dSSadaf EbrahimiSubject length lower bound = 1 901*22dc650dSSadaf Ebrahimi 902*22dc650dSSadaf Ebrahimi/\x{1234}++/Ii,utf 903*22dc650dSSadaf EbrahimiCapture group count = 0 904*22dc650dSSadaf EbrahimiOptions: caseless utf 905*22dc650dSSadaf EbrahimiStarting code units: \xe1 906*22dc650dSSadaf EbrahimiSubject length lower bound = 1 907*22dc650dSSadaf Ebrahimi 908*22dc650dSSadaf Ebrahimi/\x{1234}{2}/Ii,utf 909*22dc650dSSadaf EbrahimiCapture group count = 0 910*22dc650dSSadaf EbrahimiOptions: caseless utf 911*22dc650dSSadaf EbrahimiStarting code units: \xe1 912*22dc650dSSadaf EbrahimiSubject length lower bound = 2 913*22dc650dSSadaf Ebrahimi 914*22dc650dSSadaf Ebrahimi/[^\x{c4}]/IB,utf 915*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 916*22dc650dSSadaf Ebrahimi Bra 917*22dc650dSSadaf Ebrahimi [^\x{c4}] 918*22dc650dSSadaf Ebrahimi Ket 919*22dc650dSSadaf Ebrahimi End 920*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 921*22dc650dSSadaf EbrahimiCapture group count = 0 922*22dc650dSSadaf EbrahimiOptions: utf 923*22dc650dSSadaf EbrahimiSubject length lower bound = 1 924*22dc650dSSadaf Ebrahimi 925*22dc650dSSadaf Ebrahimi/X+\x{200}/IB,utf 926*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 927*22dc650dSSadaf Ebrahimi Bra 928*22dc650dSSadaf Ebrahimi X++ 929*22dc650dSSadaf Ebrahimi \x{200} 930*22dc650dSSadaf Ebrahimi Ket 931*22dc650dSSadaf Ebrahimi End 932*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 933*22dc650dSSadaf EbrahimiCapture group count = 0 934*22dc650dSSadaf EbrahimiOptions: utf 935*22dc650dSSadaf EbrahimiFirst code unit = 'X' 936*22dc650dSSadaf EbrahimiLast code unit = \x80 937*22dc650dSSadaf EbrahimiSubject length lower bound = 2 938*22dc650dSSadaf Ebrahimi 939*22dc650dSSadaf Ebrahimi/\R/I,utf 940*22dc650dSSadaf EbrahimiCapture group count = 0 941*22dc650dSSadaf EbrahimiOptions: utf 942*22dc650dSSadaf EbrahimiStarting code units: \x0a \x0b \x0c \x0d \xc2 \xe2 943*22dc650dSSadaf EbrahimiSubject length lower bound = 1 944*22dc650dSSadaf Ebrahimi 945*22dc650dSSadaf Ebrahimi/\777/IB,utf 946*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 947*22dc650dSSadaf Ebrahimi Bra 948*22dc650dSSadaf Ebrahimi \x{1ff} 949*22dc650dSSadaf Ebrahimi Ket 950*22dc650dSSadaf Ebrahimi End 951*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 952*22dc650dSSadaf EbrahimiCapture group count = 0 953*22dc650dSSadaf EbrahimiOptions: utf 954*22dc650dSSadaf EbrahimiFirst code unit = \xc7 955*22dc650dSSadaf EbrahimiLast code unit = \xbf 956*22dc650dSSadaf EbrahimiSubject length lower bound = 1 957*22dc650dSSadaf Ebrahimi 958*22dc650dSSadaf Ebrahimi/\w+\x{C4}/B,utf 959*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 960*22dc650dSSadaf Ebrahimi Bra 961*22dc650dSSadaf Ebrahimi \w++ 962*22dc650dSSadaf Ebrahimi \x{c4} 963*22dc650dSSadaf Ebrahimi Ket 964*22dc650dSSadaf Ebrahimi End 965*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 966*22dc650dSSadaf Ebrahimi a\x{C4}\x{C4} 967*22dc650dSSadaf Ebrahimi 0: a\x{c4} 968*22dc650dSSadaf Ebrahimi 969*22dc650dSSadaf Ebrahimi/\w+\x{C4}/B,utf,tables=2 970*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 971*22dc650dSSadaf Ebrahimi Bra 972*22dc650dSSadaf Ebrahimi \w+ 973*22dc650dSSadaf Ebrahimi \x{c4} 974*22dc650dSSadaf Ebrahimi Ket 975*22dc650dSSadaf Ebrahimi End 976*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 977*22dc650dSSadaf Ebrahimi a\x{C4}\x{C4} 978*22dc650dSSadaf Ebrahimi 0: a\x{c4}\x{c4} 979*22dc650dSSadaf Ebrahimi 980*22dc650dSSadaf Ebrahimi/\W+\x{C4}/B,utf 981*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 982*22dc650dSSadaf Ebrahimi Bra 983*22dc650dSSadaf Ebrahimi \W+ 984*22dc650dSSadaf Ebrahimi \x{c4} 985*22dc650dSSadaf Ebrahimi Ket 986*22dc650dSSadaf Ebrahimi End 987*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 988*22dc650dSSadaf Ebrahimi !\x{C4} 989*22dc650dSSadaf Ebrahimi 0: !\x{c4} 990*22dc650dSSadaf Ebrahimi 991*22dc650dSSadaf Ebrahimi/\W+\x{C4}/B,utf,tables=2 992*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 993*22dc650dSSadaf Ebrahimi Bra 994*22dc650dSSadaf Ebrahimi \W++ 995*22dc650dSSadaf Ebrahimi \x{c4} 996*22dc650dSSadaf Ebrahimi Ket 997*22dc650dSSadaf Ebrahimi End 998*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 999*22dc650dSSadaf Ebrahimi !\x{C4} 1000*22dc650dSSadaf Ebrahimi 0: !\x{c4} 1001*22dc650dSSadaf Ebrahimi 1002*22dc650dSSadaf Ebrahimi/\W+\x{A1}/B,utf 1003*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1004*22dc650dSSadaf Ebrahimi Bra 1005*22dc650dSSadaf Ebrahimi \W+ 1006*22dc650dSSadaf Ebrahimi \x{a1} 1007*22dc650dSSadaf Ebrahimi Ket 1008*22dc650dSSadaf Ebrahimi End 1009*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1010*22dc650dSSadaf Ebrahimi !\x{A1} 1011*22dc650dSSadaf Ebrahimi 0: !\x{a1} 1012*22dc650dSSadaf Ebrahimi 1013*22dc650dSSadaf Ebrahimi/\W+\x{A1}/B,utf,tables=2 1014*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1015*22dc650dSSadaf Ebrahimi Bra 1016*22dc650dSSadaf Ebrahimi \W+ 1017*22dc650dSSadaf Ebrahimi \x{a1} 1018*22dc650dSSadaf Ebrahimi Ket 1019*22dc650dSSadaf Ebrahimi End 1020*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1021*22dc650dSSadaf Ebrahimi !\x{A1} 1022*22dc650dSSadaf Ebrahimi 0: !\x{a1} 1023*22dc650dSSadaf Ebrahimi 1024*22dc650dSSadaf Ebrahimi/X\s+\x{A0}/B,utf 1025*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1026*22dc650dSSadaf Ebrahimi Bra 1027*22dc650dSSadaf Ebrahimi X 1028*22dc650dSSadaf Ebrahimi \s++ 1029*22dc650dSSadaf Ebrahimi \x{a0} 1030*22dc650dSSadaf Ebrahimi Ket 1031*22dc650dSSadaf Ebrahimi End 1032*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1033*22dc650dSSadaf Ebrahimi X\x20\x{A0}\x{A0} 1034*22dc650dSSadaf Ebrahimi 0: X \x{a0} 1035*22dc650dSSadaf Ebrahimi 1036*22dc650dSSadaf Ebrahimi/X\s+\x{A0}/B,utf,tables=2 1037*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1038*22dc650dSSadaf Ebrahimi Bra 1039*22dc650dSSadaf Ebrahimi X 1040*22dc650dSSadaf Ebrahimi \s+ 1041*22dc650dSSadaf Ebrahimi \x{a0} 1042*22dc650dSSadaf Ebrahimi Ket 1043*22dc650dSSadaf Ebrahimi End 1044*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1045*22dc650dSSadaf Ebrahimi X\x20\x{A0}\x{A0} 1046*22dc650dSSadaf Ebrahimi 0: X \x{a0}\x{a0} 1047*22dc650dSSadaf Ebrahimi 1048*22dc650dSSadaf Ebrahimi/\S+\x{A0}/B,utf 1049*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1050*22dc650dSSadaf Ebrahimi Bra 1051*22dc650dSSadaf Ebrahimi \S+ 1052*22dc650dSSadaf Ebrahimi \x{a0} 1053*22dc650dSSadaf Ebrahimi Ket 1054*22dc650dSSadaf Ebrahimi End 1055*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1056*22dc650dSSadaf Ebrahimi X\x{A0}\x{A0} 1057*22dc650dSSadaf Ebrahimi 0: X\x{a0}\x{a0} 1058*22dc650dSSadaf Ebrahimi 1059*22dc650dSSadaf Ebrahimi/\S+\x{A0}/B,utf,tables=2 1060*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1061*22dc650dSSadaf Ebrahimi Bra 1062*22dc650dSSadaf Ebrahimi \S++ 1063*22dc650dSSadaf Ebrahimi \x{a0} 1064*22dc650dSSadaf Ebrahimi Ket 1065*22dc650dSSadaf Ebrahimi End 1066*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1067*22dc650dSSadaf Ebrahimi X\x{A0}\x{A0} 1068*22dc650dSSadaf Ebrahimi 0: X\x{a0} 1069*22dc650dSSadaf Ebrahimi 1070*22dc650dSSadaf Ebrahimi/\x{a0}+\s!/B,utf 1071*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1072*22dc650dSSadaf Ebrahimi Bra 1073*22dc650dSSadaf Ebrahimi \x{a0}++ 1074*22dc650dSSadaf Ebrahimi \s 1075*22dc650dSSadaf Ebrahimi ! 1076*22dc650dSSadaf Ebrahimi Ket 1077*22dc650dSSadaf Ebrahimi End 1078*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1079*22dc650dSSadaf Ebrahimi \x{a0}\x20! 1080*22dc650dSSadaf Ebrahimi 0: \x{a0} ! 1081*22dc650dSSadaf Ebrahimi 1082*22dc650dSSadaf Ebrahimi/\x{a0}+\s!/B,utf,tables=2 1083*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1084*22dc650dSSadaf Ebrahimi Bra 1085*22dc650dSSadaf Ebrahimi \x{a0}+ 1086*22dc650dSSadaf Ebrahimi \s 1087*22dc650dSSadaf Ebrahimi ! 1088*22dc650dSSadaf Ebrahimi Ket 1089*22dc650dSSadaf Ebrahimi End 1090*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1091*22dc650dSSadaf Ebrahimi \x{a0}\x20! 1092*22dc650dSSadaf Ebrahimi 0: \x{a0} ! 1093*22dc650dSSadaf Ebrahimi 1094*22dc650dSSadaf Ebrahimi/A/utf 1095*22dc650dSSadaf Ebrahimi \x{ff000041} 1096*22dc650dSSadaf Ebrahimi** Character \x{ff000041} is greater than 0x7fffffff and so cannot be converted to UTF-8 1097*22dc650dSSadaf Ebrahimi \x{7f000041} 1098*22dc650dSSadaf EbrahimiFailed: error -14: UTF-8 error: 6-byte character is not allowed (RFC 3629) at offset 0 1099*22dc650dSSadaf Ebrahimi 1100*22dc650dSSadaf Ebrahimi/(*UTF8)abc/never_utf 1101*22dc650dSSadaf EbrahimiFailed: error 174 at offset 7: using UTF is disabled by the application 1102*22dc650dSSadaf Ebrahimi 1103*22dc650dSSadaf Ebrahimi/abc/utf,never_utf 1104*22dc650dSSadaf EbrahimiFailed: error 174 at offset 0: using UTF is disabled by the application 1105*22dc650dSSadaf Ebrahimi 1106*22dc650dSSadaf Ebrahimi/A\x{391}\x{10427}\x{ff3a}\x{1fb0}/IBi,utf 1107*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1108*22dc650dSSadaf Ebrahimi Bra 1109*22dc650dSSadaf Ebrahimi /i A\x{391}\x{10427}\x{ff3a}\x{1fb0} 1110*22dc650dSSadaf Ebrahimi Ket 1111*22dc650dSSadaf Ebrahimi End 1112*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1113*22dc650dSSadaf EbrahimiCapture group count = 0 1114*22dc650dSSadaf EbrahimiOptions: caseless utf 1115*22dc650dSSadaf EbrahimiFirst code unit = 'A' (caseless) 1116*22dc650dSSadaf EbrahimiSubject length lower bound = 5 1117*22dc650dSSadaf Ebrahimi 1118*22dc650dSSadaf Ebrahimi/A\x{391}\x{10427}\x{ff3a}\x{1fb0}/IB,utf 1119*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1120*22dc650dSSadaf Ebrahimi Bra 1121*22dc650dSSadaf Ebrahimi A\x{391}\x{10427}\x{ff3a}\x{1fb0} 1122*22dc650dSSadaf Ebrahimi Ket 1123*22dc650dSSadaf Ebrahimi End 1124*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1125*22dc650dSSadaf EbrahimiCapture group count = 0 1126*22dc650dSSadaf EbrahimiOptions: utf 1127*22dc650dSSadaf EbrahimiFirst code unit = 'A' 1128*22dc650dSSadaf EbrahimiLast code unit = \xb0 1129*22dc650dSSadaf EbrahimiSubject length lower bound = 5 1130*22dc650dSSadaf Ebrahimi 1131*22dc650dSSadaf Ebrahimi/AB\x{1fb0}/IB,utf 1132*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1133*22dc650dSSadaf Ebrahimi Bra 1134*22dc650dSSadaf Ebrahimi AB\x{1fb0} 1135*22dc650dSSadaf Ebrahimi Ket 1136*22dc650dSSadaf Ebrahimi End 1137*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1138*22dc650dSSadaf EbrahimiCapture group count = 0 1139*22dc650dSSadaf EbrahimiOptions: utf 1140*22dc650dSSadaf EbrahimiFirst code unit = 'A' 1141*22dc650dSSadaf EbrahimiLast code unit = \xb0 1142*22dc650dSSadaf EbrahimiSubject length lower bound = 3 1143*22dc650dSSadaf Ebrahimi 1144*22dc650dSSadaf Ebrahimi/AB\x{1fb0}/IBi,utf 1145*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1146*22dc650dSSadaf Ebrahimi Bra 1147*22dc650dSSadaf Ebrahimi /i AB\x{1fb0} 1148*22dc650dSSadaf Ebrahimi Ket 1149*22dc650dSSadaf Ebrahimi End 1150*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1151*22dc650dSSadaf EbrahimiCapture group count = 0 1152*22dc650dSSadaf EbrahimiOptions: caseless utf 1153*22dc650dSSadaf EbrahimiFirst code unit = 'A' (caseless) 1154*22dc650dSSadaf EbrahimiLast code unit = 'B' (caseless) 1155*22dc650dSSadaf EbrahimiSubject length lower bound = 3 1156*22dc650dSSadaf Ebrahimi 1157*22dc650dSSadaf Ebrahimi/\x{401}\x{420}\x{421}\x{422}\x{423}\x{424}\x{425}\x{426}\x{427}\x{428}\x{429}\x{42a}\x{42b}\x{42c}\x{42d}\x{42e}\x{42f}/Ii,utf 1158*22dc650dSSadaf EbrahimiCapture group count = 0 1159*22dc650dSSadaf EbrahimiOptions: caseless utf 1160*22dc650dSSadaf EbrahimiStarting code units: \xd0 \xd1 1161*22dc650dSSadaf EbrahimiSubject length lower bound = 17 1162*22dc650dSSadaf Ebrahimi \x{401}\x{420}\x{421}\x{422}\x{423}\x{424}\x{425}\x{426}\x{427}\x{428}\x{429}\x{42a}\x{42b}\x{42c}\x{42d}\x{42e}\x{42f} 1163*22dc650dSSadaf Ebrahimi 0: \x{401}\x{420}\x{421}\x{422}\x{423}\x{424}\x{425}\x{426}\x{427}\x{428}\x{429}\x{42a}\x{42b}\x{42c}\x{42d}\x{42e}\x{42f} 1164*22dc650dSSadaf Ebrahimi \x{451}\x{440}\x{441}\x{442}\x{443}\x{444}\x{445}\x{446}\x{447}\x{448}\x{449}\x{44a}\x{44b}\x{44c}\x{44d}\x{44e}\x{44f} 1165*22dc650dSSadaf Ebrahimi 0: \x{451}\x{440}\x{441}\x{442}\x{443}\x{444}\x{445}\x{446}\x{447}\x{448}\x{449}\x{44a}\x{44b}\x{44c}\x{44d}\x{44e}\x{44f} 1166*22dc650dSSadaf Ebrahimi 1167*22dc650dSSadaf Ebrahimi/[ⱥ]/Bi,utf 1168*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1169*22dc650dSSadaf Ebrahimi Bra 1170*22dc650dSSadaf Ebrahimi /i \x{2c65} 1171*22dc650dSSadaf Ebrahimi Ket 1172*22dc650dSSadaf Ebrahimi End 1173*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1174*22dc650dSSadaf Ebrahimi 1175*22dc650dSSadaf Ebrahimi/[^ⱥ]/Bi,utf 1176*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1177*22dc650dSSadaf Ebrahimi Bra 1178*22dc650dSSadaf Ebrahimi /i [^\x{2c65}] 1179*22dc650dSSadaf Ebrahimi Ket 1180*22dc650dSSadaf Ebrahimi End 1181*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1182*22dc650dSSadaf Ebrahimi 1183*22dc650dSSadaf Ebrahimi/\h/I 1184*22dc650dSSadaf EbrahimiCapture group count = 0 1185*22dc650dSSadaf EbrahimiStarting code units: \x09 \x20 \xa0 1186*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1187*22dc650dSSadaf Ebrahimi 1188*22dc650dSSadaf Ebrahimi/\v/I 1189*22dc650dSSadaf EbrahimiCapture group count = 0 1190*22dc650dSSadaf EbrahimiStarting code units: \x0a \x0b \x0c \x0d \x85 1191*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1192*22dc650dSSadaf Ebrahimi 1193*22dc650dSSadaf Ebrahimi/\R/I 1194*22dc650dSSadaf EbrahimiCapture group count = 0 1195*22dc650dSSadaf EbrahimiStarting code units: \x0a \x0b \x0c \x0d \x85 1196*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1197*22dc650dSSadaf Ebrahimi 1198*22dc650dSSadaf Ebrahimi/[[:blank:]]/B,ucp 1199*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1200*22dc650dSSadaf Ebrahimi Bra 1201*22dc650dSSadaf Ebrahimi [\x09 \xa0] 1202*22dc650dSSadaf Ebrahimi Ket 1203*22dc650dSSadaf Ebrahimi End 1204*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1205*22dc650dSSadaf Ebrahimi 1206*22dc650dSSadaf Ebrahimi/\x{212a}+/Ii,utf 1207*22dc650dSSadaf EbrahimiCapture group count = 0 1208*22dc650dSSadaf EbrahimiOptions: caseless utf 1209*22dc650dSSadaf EbrahimiStarting code units: K k \xe2 1210*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1211*22dc650dSSadaf Ebrahimi KKkk\x{212a} 1212*22dc650dSSadaf Ebrahimi 0: KKkk\x{212a} 1213*22dc650dSSadaf Ebrahimi 1214*22dc650dSSadaf Ebrahimi/s+/Ii,utf 1215*22dc650dSSadaf EbrahimiCapture group count = 0 1216*22dc650dSSadaf EbrahimiOptions: caseless utf 1217*22dc650dSSadaf EbrahimiStarting code units: S s \xc5 1218*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1219*22dc650dSSadaf Ebrahimi SSss\x{17f} 1220*22dc650dSSadaf Ebrahimi 0: SSss\x{17f} 1221*22dc650dSSadaf Ebrahimi 1222*22dc650dSSadaf Ebrahimi/\x{100}*A/IB,utf 1223*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1224*22dc650dSSadaf Ebrahimi Bra 1225*22dc650dSSadaf Ebrahimi \x{100}*+ 1226*22dc650dSSadaf Ebrahimi A 1227*22dc650dSSadaf Ebrahimi Ket 1228*22dc650dSSadaf Ebrahimi End 1229*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1230*22dc650dSSadaf EbrahimiCapture group count = 0 1231*22dc650dSSadaf EbrahimiOptions: utf 1232*22dc650dSSadaf EbrahimiStarting code units: A \xc4 1233*22dc650dSSadaf EbrahimiLast code unit = 'A' 1234*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1235*22dc650dSSadaf Ebrahimi A 1236*22dc650dSSadaf Ebrahimi 0: A 1237*22dc650dSSadaf Ebrahimi 1238*22dc650dSSadaf Ebrahimi/\x{100}*\d(?R)/IB,utf 1239*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1240*22dc650dSSadaf Ebrahimi Bra 1241*22dc650dSSadaf Ebrahimi \x{100}*+ 1242*22dc650dSSadaf Ebrahimi \d 1243*22dc650dSSadaf Ebrahimi Recurse 1244*22dc650dSSadaf Ebrahimi Ket 1245*22dc650dSSadaf Ebrahimi End 1246*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1247*22dc650dSSadaf EbrahimiCapture group count = 0 1248*22dc650dSSadaf EbrahimiOptions: utf 1249*22dc650dSSadaf EbrahimiStarting code units: 0 1 2 3 4 5 6 7 8 9 \xc4 1250*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1251*22dc650dSSadaf Ebrahimi 1252*22dc650dSSadaf Ebrahimi/[Z\x{100}]/IB,utf 1253*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1254*22dc650dSSadaf Ebrahimi Bra 1255*22dc650dSSadaf Ebrahimi [Z\x{100}] 1256*22dc650dSSadaf Ebrahimi Ket 1257*22dc650dSSadaf Ebrahimi End 1258*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1259*22dc650dSSadaf EbrahimiCapture group count = 0 1260*22dc650dSSadaf EbrahimiOptions: utf 1261*22dc650dSSadaf EbrahimiStarting code units: Z \xc4 1262*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1263*22dc650dSSadaf Ebrahimi Z\x{100} 1264*22dc650dSSadaf Ebrahimi 0: Z 1265*22dc650dSSadaf Ebrahimi \x{100} 1266*22dc650dSSadaf Ebrahimi 0: \x{100} 1267*22dc650dSSadaf Ebrahimi \x{100}Z 1268*22dc650dSSadaf Ebrahimi 0: \x{100} 1269*22dc650dSSadaf Ebrahimi 1270*22dc650dSSadaf Ebrahimi/[z-\x{100}]/IB,utf 1271*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1272*22dc650dSSadaf Ebrahimi Bra 1273*22dc650dSSadaf Ebrahimi [z-\xff\x{100}] 1274*22dc650dSSadaf Ebrahimi Ket 1275*22dc650dSSadaf Ebrahimi End 1276*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1277*22dc650dSSadaf EbrahimiCapture group count = 0 1278*22dc650dSSadaf EbrahimiOptions: utf 1279*22dc650dSSadaf EbrahimiStarting code units: z { | } ~ \x7f \xc2 \xc3 \xc4 1280*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1281*22dc650dSSadaf Ebrahimi 1282*22dc650dSSadaf Ebrahimi/[z\Qa-d]Ā\E]/IB,utf 1283*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1284*22dc650dSSadaf Ebrahimi Bra 1285*22dc650dSSadaf Ebrahimi [\-\]adz\x{100}] 1286*22dc650dSSadaf Ebrahimi Ket 1287*22dc650dSSadaf Ebrahimi End 1288*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1289*22dc650dSSadaf EbrahimiCapture group count = 0 1290*22dc650dSSadaf EbrahimiOptions: utf 1291*22dc650dSSadaf EbrahimiStarting code units: - ] a d z \xc4 1292*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1293*22dc650dSSadaf Ebrahimi \x{100} 1294*22dc650dSSadaf Ebrahimi 0: \x{100} 1295*22dc650dSSadaf Ebrahimi Ā 1296*22dc650dSSadaf Ebrahimi 0: \x{100} 1297*22dc650dSSadaf Ebrahimi 1298*22dc650dSSadaf Ebrahimi/[ab\x{100}]abc(xyz(?1))/IB,utf 1299*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1300*22dc650dSSadaf Ebrahimi Bra 1301*22dc650dSSadaf Ebrahimi [ab\x{100}] 1302*22dc650dSSadaf Ebrahimi abc 1303*22dc650dSSadaf Ebrahimi CBra 1 1304*22dc650dSSadaf Ebrahimi xyz 1305*22dc650dSSadaf Ebrahimi Recurse 1306*22dc650dSSadaf Ebrahimi Ket 1307*22dc650dSSadaf Ebrahimi Ket 1308*22dc650dSSadaf Ebrahimi End 1309*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1310*22dc650dSSadaf EbrahimiCapture group count = 1 1311*22dc650dSSadaf EbrahimiOptions: utf 1312*22dc650dSSadaf EbrahimiStarting code units: a b \xc4 1313*22dc650dSSadaf EbrahimiLast code unit = 'z' 1314*22dc650dSSadaf EbrahimiSubject length lower bound = 7 1315*22dc650dSSadaf Ebrahimi 1316*22dc650dSSadaf Ebrahimi/\x{100}*\s/IB,utf 1317*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1318*22dc650dSSadaf Ebrahimi Bra 1319*22dc650dSSadaf Ebrahimi \x{100}*+ 1320*22dc650dSSadaf Ebrahimi \s 1321*22dc650dSSadaf Ebrahimi Ket 1322*22dc650dSSadaf Ebrahimi End 1323*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1324*22dc650dSSadaf EbrahimiCapture group count = 0 1325*22dc650dSSadaf EbrahimiOptions: utf 1326*22dc650dSSadaf EbrahimiStarting code units: \x09 \x0a \x0b \x0c \x0d \x20 \xc4 1327*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1328*22dc650dSSadaf Ebrahimi 1329*22dc650dSSadaf Ebrahimi/\x{100}*\d/IB,utf 1330*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1331*22dc650dSSadaf Ebrahimi Bra 1332*22dc650dSSadaf Ebrahimi \x{100}*+ 1333*22dc650dSSadaf Ebrahimi \d 1334*22dc650dSSadaf Ebrahimi Ket 1335*22dc650dSSadaf Ebrahimi End 1336*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1337*22dc650dSSadaf EbrahimiCapture group count = 0 1338*22dc650dSSadaf EbrahimiOptions: utf 1339*22dc650dSSadaf EbrahimiStarting code units: 0 1 2 3 4 5 6 7 8 9 \xc4 1340*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1341*22dc650dSSadaf Ebrahimi 1342*22dc650dSSadaf Ebrahimi/\x{100}*\w/IB,utf 1343*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1344*22dc650dSSadaf Ebrahimi Bra 1345*22dc650dSSadaf Ebrahimi \x{100}*+ 1346*22dc650dSSadaf Ebrahimi \w 1347*22dc650dSSadaf Ebrahimi Ket 1348*22dc650dSSadaf Ebrahimi End 1349*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1350*22dc650dSSadaf EbrahimiCapture group count = 0 1351*22dc650dSSadaf EbrahimiOptions: utf 1352*22dc650dSSadaf EbrahimiStarting code units: 0 1 2 3 4 5 6 7 8 9 A B C D E F G H I J K L M N O P 1353*22dc650dSSadaf Ebrahimi Q R S T U V W X Y Z _ a b c d e f g h i j k l m n o p q r s t u v w x y z 1354*22dc650dSSadaf Ebrahimi \xc4 1355*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1356*22dc650dSSadaf Ebrahimi 1357*22dc650dSSadaf Ebrahimi/\x{100}*\D/IB,utf 1358*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1359*22dc650dSSadaf Ebrahimi Bra 1360*22dc650dSSadaf Ebrahimi \x{100}* 1361*22dc650dSSadaf Ebrahimi \D 1362*22dc650dSSadaf Ebrahimi Ket 1363*22dc650dSSadaf Ebrahimi End 1364*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1365*22dc650dSSadaf EbrahimiCapture group count = 0 1366*22dc650dSSadaf EbrahimiOptions: utf 1367*22dc650dSSadaf EbrahimiStarting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a 1368*22dc650dSSadaf Ebrahimi \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 1369*22dc650dSSadaf Ebrahimi \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / : ; < = > 1370*22dc650dSSadaf Ebrahimi ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c 1371*22dc650dSSadaf Ebrahimi d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \xc0 \xc1 \xc2 1372*22dc650dSSadaf Ebrahimi \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 1373*22dc650dSSadaf Ebrahimi \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 1374*22dc650dSSadaf Ebrahimi \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef 1375*22dc650dSSadaf Ebrahimi \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe 1376*22dc650dSSadaf Ebrahimi \xff 1377*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1378*22dc650dSSadaf Ebrahimi 1379*22dc650dSSadaf Ebrahimi/\x{100}*\S/IB,utf 1380*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1381*22dc650dSSadaf Ebrahimi Bra 1382*22dc650dSSadaf Ebrahimi \x{100}* 1383*22dc650dSSadaf Ebrahimi \S 1384*22dc650dSSadaf Ebrahimi Ket 1385*22dc650dSSadaf Ebrahimi End 1386*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1387*22dc650dSSadaf EbrahimiCapture group count = 0 1388*22dc650dSSadaf EbrahimiOptions: utf 1389*22dc650dSSadaf EbrahimiStarting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0e \x0f 1390*22dc650dSSadaf Ebrahimi \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d \x1e 1391*22dc650dSSadaf Ebrahimi \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @ A B C 1392*22dc650dSSadaf Ebrahimi D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e f g h 1393*22dc650dSSadaf Ebrahimi i j k l m n o p q r s t u v w x y z { | } ~ \x7f \xc0 \xc1 \xc2 \xc3 \xc4 1394*22dc650dSSadaf Ebrahimi \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2 \xd3 1395*22dc650dSSadaf Ebrahimi \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1 \xe2 1396*22dc650dSSadaf Ebrahimi \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef \xf0 \xf1 1397*22dc650dSSadaf Ebrahimi \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff 1398*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1399*22dc650dSSadaf Ebrahimi 1400*22dc650dSSadaf Ebrahimi/\x{100}*\W/IB,utf 1401*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1402*22dc650dSSadaf Ebrahimi Bra 1403*22dc650dSSadaf Ebrahimi \x{100}* 1404*22dc650dSSadaf Ebrahimi \W 1405*22dc650dSSadaf Ebrahimi Ket 1406*22dc650dSSadaf Ebrahimi End 1407*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1408*22dc650dSSadaf EbrahimiCapture group count = 0 1409*22dc650dSSadaf EbrahimiOptions: utf 1410*22dc650dSSadaf EbrahimiStarting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a 1411*22dc650dSSadaf Ebrahimi \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 1412*22dc650dSSadaf Ebrahimi \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / : ; < = > 1413*22dc650dSSadaf Ebrahimi ? @ [ \ ] ^ ` { | } ~ \x7f \xc0 \xc1 \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 1414*22dc650dSSadaf Ebrahimi \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 1415*22dc650dSSadaf Ebrahimi \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 1416*22dc650dSSadaf Ebrahimi \xe8 \xe9 \xea \xeb \xec \xed \xee \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 1417*22dc650dSSadaf Ebrahimi \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff 1418*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1419*22dc650dSSadaf Ebrahimi 1420*22dc650dSSadaf Ebrahimi/[\x{105}-\x{109}]/IBi,utf 1421*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1422*22dc650dSSadaf Ebrahimi Bra 1423*22dc650dSSadaf Ebrahimi [\x{104}-\x{109}] 1424*22dc650dSSadaf Ebrahimi Ket 1425*22dc650dSSadaf Ebrahimi End 1426*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1427*22dc650dSSadaf EbrahimiCapture group count = 0 1428*22dc650dSSadaf EbrahimiOptions: caseless utf 1429*22dc650dSSadaf EbrahimiStarting code units: \xc4 1430*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1431*22dc650dSSadaf Ebrahimi \x{104} 1432*22dc650dSSadaf Ebrahimi 0: \x{104} 1433*22dc650dSSadaf Ebrahimi \x{105} 1434*22dc650dSSadaf Ebrahimi 0: \x{105} 1435*22dc650dSSadaf Ebrahimi \x{109} 1436*22dc650dSSadaf Ebrahimi 0: \x{109} 1437*22dc650dSSadaf Ebrahimi\= Expect no match 1438*22dc650dSSadaf Ebrahimi \x{100} 1439*22dc650dSSadaf EbrahimiNo match 1440*22dc650dSSadaf Ebrahimi \x{10a} 1441*22dc650dSSadaf EbrahimiNo match 1442*22dc650dSSadaf Ebrahimi 1443*22dc650dSSadaf Ebrahimi/[z-\x{100}]/IBi,utf 1444*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1445*22dc650dSSadaf Ebrahimi Bra 1446*22dc650dSSadaf Ebrahimi [Zz-\xff\x{39c}\x{3bc}\x{212b}\x{1e9e}\x{212b}\x{178}\x{100}-\x{101}] 1447*22dc650dSSadaf Ebrahimi Ket 1448*22dc650dSSadaf Ebrahimi End 1449*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1450*22dc650dSSadaf EbrahimiCapture group count = 0 1451*22dc650dSSadaf EbrahimiOptions: caseless utf 1452*22dc650dSSadaf EbrahimiStarting code units: Z z { | } ~ \x7f \xc2 \xc3 \xc4 \xc5 \xce \xe1 \xe2 1453*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1454*22dc650dSSadaf Ebrahimi Z 1455*22dc650dSSadaf Ebrahimi 0: Z 1456*22dc650dSSadaf Ebrahimi z 1457*22dc650dSSadaf Ebrahimi 0: z 1458*22dc650dSSadaf Ebrahimi \x{39c} 1459*22dc650dSSadaf Ebrahimi 0: \x{39c} 1460*22dc650dSSadaf Ebrahimi \x{178} 1461*22dc650dSSadaf Ebrahimi 0: \x{178} 1462*22dc650dSSadaf Ebrahimi | 1463*22dc650dSSadaf Ebrahimi 0: | 1464*22dc650dSSadaf Ebrahimi \x{80} 1465*22dc650dSSadaf Ebrahimi 0: \x{80} 1466*22dc650dSSadaf Ebrahimi \x{ff} 1467*22dc650dSSadaf Ebrahimi 0: \x{ff} 1468*22dc650dSSadaf Ebrahimi \x{100} 1469*22dc650dSSadaf Ebrahimi 0: \x{100} 1470*22dc650dSSadaf Ebrahimi \x{101} 1471*22dc650dSSadaf Ebrahimi 0: \x{101} 1472*22dc650dSSadaf Ebrahimi\= Expect no match 1473*22dc650dSSadaf Ebrahimi \x{102} 1474*22dc650dSSadaf EbrahimiNo match 1475*22dc650dSSadaf Ebrahimi Y 1476*22dc650dSSadaf EbrahimiNo match 1477*22dc650dSSadaf Ebrahimi y 1478*22dc650dSSadaf EbrahimiNo match 1479*22dc650dSSadaf Ebrahimi 1480*22dc650dSSadaf Ebrahimi/[z-\x{100}]/IBi,utf 1481*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1482*22dc650dSSadaf Ebrahimi Bra 1483*22dc650dSSadaf Ebrahimi [Zz-\xff\x{39c}\x{3bc}\x{212b}\x{1e9e}\x{212b}\x{178}\x{100}-\x{101}] 1484*22dc650dSSadaf Ebrahimi Ket 1485*22dc650dSSadaf Ebrahimi End 1486*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1487*22dc650dSSadaf EbrahimiCapture group count = 0 1488*22dc650dSSadaf EbrahimiOptions: caseless utf 1489*22dc650dSSadaf EbrahimiStarting code units: Z z { | } ~ \x7f \xc2 \xc3 \xc4 \xc5 \xce \xe1 \xe2 1490*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1491*22dc650dSSadaf Ebrahimi 1492*22dc650dSSadaf Ebrahimi/\x{3a3}B/IBi,utf 1493*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1494*22dc650dSSadaf Ebrahimi Bra 1495*22dc650dSSadaf Ebrahimi clist 03a3 03c2 03c3 1496*22dc650dSSadaf Ebrahimi /i B 1497*22dc650dSSadaf Ebrahimi Ket 1498*22dc650dSSadaf Ebrahimi End 1499*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1500*22dc650dSSadaf EbrahimiCapture group count = 0 1501*22dc650dSSadaf EbrahimiOptions: caseless utf 1502*22dc650dSSadaf EbrahimiStarting code units: \xce \xcf 1503*22dc650dSSadaf EbrahimiLast code unit = 'B' (caseless) 1504*22dc650dSSadaf EbrahimiSubject length lower bound = 2 1505*22dc650dSSadaf Ebrahimi 1506*22dc650dSSadaf Ebrahimi/abc/utf,replace=� 1507*22dc650dSSadaf Ebrahimi abc 1508*22dc650dSSadaf EbrahimiFailed: error -3: UTF-8 error: 1 byte missing at end 1509*22dc650dSSadaf Ebrahimi 1510*22dc650dSSadaf Ebrahimi/(?<=(a)(?-1))x/I,utf 1511*22dc650dSSadaf EbrahimiCapture group count = 1 1512*22dc650dSSadaf EbrahimiMax lookbehind = 2 1513*22dc650dSSadaf EbrahimiOptions: utf 1514*22dc650dSSadaf EbrahimiFirst code unit = 'x' 1515*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1516*22dc650dSSadaf Ebrahimi a\x80zx\=offset=3 1517*22dc650dSSadaf EbrahimiFailed: error -22: UTF-8 error: isolated byte with 0x80 bit set at offset 1 1518*22dc650dSSadaf Ebrahimi 1519*22dc650dSSadaf Ebrahimi/[\W\p{Any}]/B 1520*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1521*22dc650dSSadaf Ebrahimi Bra 1522*22dc650dSSadaf Ebrahimi [\x00-/:-@[-^`{-\xff\p{Any}] 1523*22dc650dSSadaf Ebrahimi Ket 1524*22dc650dSSadaf Ebrahimi End 1525*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1526*22dc650dSSadaf Ebrahimi abc 1527*22dc650dSSadaf Ebrahimi 0: a 1528*22dc650dSSadaf Ebrahimi 123 1529*22dc650dSSadaf Ebrahimi 0: 1 1530*22dc650dSSadaf Ebrahimi 1531*22dc650dSSadaf Ebrahimi/[\W\pL]/B 1532*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1533*22dc650dSSadaf Ebrahimi Bra 1534*22dc650dSSadaf Ebrahimi [\x00-/:-@[-^`{-\xff\p{L}] 1535*22dc650dSSadaf Ebrahimi Ket 1536*22dc650dSSadaf Ebrahimi End 1537*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1538*22dc650dSSadaf Ebrahimi abc 1539*22dc650dSSadaf Ebrahimi 0: a 1540*22dc650dSSadaf Ebrahimi\= Expect no match 1541*22dc650dSSadaf Ebrahimi 123 1542*22dc650dSSadaf EbrahimiNo match 1543*22dc650dSSadaf Ebrahimi 1544*22dc650dSSadaf Ebrahimi/(*:*++++++++++++''''''''''''''''''''+''+++'+++x+++++++++++++++++++++++++++++++++++(++++++++++++++++++++:++++++%++:''''''''''''''''''''''''+++++++++++++++++++++++++++++++++++++++++++++++++++++-++++++++k+++++++''''+++'+++++++++++++++++++++++''''++++++++++++':ƿ)/utf 1545*22dc650dSSadaf EbrahimiFailed: error 176 at offset 259: name is too long in (*MARK), (*PRUNE), (*SKIP), or (*THEN) 1546*22dc650dSSadaf Ebrahimi 1547*22dc650dSSadaf Ebrahimi/[\s[:^ascii:]]/B,ucp 1548*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1549*22dc650dSSadaf Ebrahimi Bra 1550*22dc650dSSadaf Ebrahimi [\x80-\xff\p{Xsp}] 1551*22dc650dSSadaf Ebrahimi Ket 1552*22dc650dSSadaf Ebrahimi End 1553*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1554*22dc650dSSadaf Ebrahimi 1555*22dc650dSSadaf Ebrahimi# A special extra option allows excaped surrogate code points in 8-bit mode, 1556*22dc650dSSadaf Ebrahimi# but subjects containing them must not be UTF-checked. 1557*22dc650dSSadaf Ebrahimi 1558*22dc650dSSadaf Ebrahimi/\x{d800}/I,utf,allow_surrogate_escapes 1559*22dc650dSSadaf EbrahimiCapture group count = 0 1560*22dc650dSSadaf EbrahimiOptions: utf 1561*22dc650dSSadaf EbrahimiExtra options: allow_surrogate_escapes 1562*22dc650dSSadaf EbrahimiFirst code unit = \xed 1563*22dc650dSSadaf EbrahimiLast code unit = \x80 1564*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1565*22dc650dSSadaf Ebrahimi \x{d800}\=no_utf_check 1566*22dc650dSSadaf Ebrahimi 0: \x{d800} 1567*22dc650dSSadaf Ebrahimi 1568*22dc650dSSadaf Ebrahimi/\udfff\o{157401}/utf,alt_bsux,allow_surrogate_escapes 1569*22dc650dSSadaf Ebrahimi \x{dfff}\x{df01}\=no_utf_check 1570*22dc650dSSadaf Ebrahimi 0: \x{dfff}\x{df01} 1571*22dc650dSSadaf Ebrahimi 1572*22dc650dSSadaf Ebrahimi# This has different starting code units in 8-bit mode. 1573*22dc650dSSadaf Ebrahimi 1574*22dc650dSSadaf Ebrahimi/^[^ab]/IB,utf 1575*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1576*22dc650dSSadaf Ebrahimi Bra 1577*22dc650dSSadaf Ebrahimi ^ 1578*22dc650dSSadaf Ebrahimi [\x00-`c-\xff] (neg) 1579*22dc650dSSadaf Ebrahimi Ket 1580*22dc650dSSadaf Ebrahimi End 1581*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1582*22dc650dSSadaf EbrahimiCapture group count = 0 1583*22dc650dSSadaf EbrahimiCompile options: utf 1584*22dc650dSSadaf EbrahimiOverall options: anchored utf 1585*22dc650dSSadaf EbrahimiStarting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a 1586*22dc650dSSadaf Ebrahimi \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 1587*22dc650dSSadaf Ebrahimi \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 1588*22dc650dSSadaf Ebrahimi 5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y 1589*22dc650dSSadaf Ebrahimi Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f 1590*22dc650dSSadaf Ebrahimi \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 1591*22dc650dSSadaf Ebrahimi \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf 1592*22dc650dSSadaf Ebrahimi \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee 1593*22dc650dSSadaf Ebrahimi \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd 1594*22dc650dSSadaf Ebrahimi \xfe \xff 1595*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1596*22dc650dSSadaf Ebrahimi c 1597*22dc650dSSadaf Ebrahimi 0: c 1598*22dc650dSSadaf Ebrahimi \x{ff} 1599*22dc650dSSadaf Ebrahimi 0: \x{ff} 1600*22dc650dSSadaf Ebrahimi \x{100} 1601*22dc650dSSadaf Ebrahimi 0: \x{100} 1602*22dc650dSSadaf Ebrahimi\= Expect no match 1603*22dc650dSSadaf Ebrahimi aaa 1604*22dc650dSSadaf EbrahimiNo match 1605*22dc650dSSadaf Ebrahimi 1606*22dc650dSSadaf Ebrahimi# Offsets are different in 8-bit mode. 1607*22dc650dSSadaf Ebrahimi 1608*22dc650dSSadaf Ebrahimi/(?<=abc)(|def)/g,utf,replace=<$0>,substitute_callout 1609*22dc650dSSadaf Ebrahimi 123abcáyzabcdef789abcሴqr 1610*22dc650dSSadaf Ebrahimi 1(2) Old 6 6 "" New 6 8 "<>" 1611*22dc650dSSadaf Ebrahimi 2(2) Old 13 13 "" New 15 17 "<>" 1612*22dc650dSSadaf Ebrahimi 3(2) Old 13 16 "def" New 17 22 "<def>" 1613*22dc650dSSadaf Ebrahimi 4(2) Old 22 22 "" New 28 30 "<>" 1614*22dc650dSSadaf Ebrahimi 4: 123abc<>\x{e1}yzabc<><def>789abc<>\x{1234}qr 1615*22dc650dSSadaf Ebrahimi 1616*22dc650dSSadaf Ebrahimi# Check name length with non-ASCII characters 1617*22dc650dSSadaf Ebrahimi 1618*22dc650dSSadaf Ebrahimi/(?'ABáC678901234567890123456789012012345678901234567890123456789AB012345678901234567890123456789AB012345678901234567890123456789AB'...)/utf 1619*22dc650dSSadaf Ebrahimi 1620*22dc650dSSadaf Ebrahimi/(?'ABáC6789012345678901234567890123012345678901234567890123456789AB012345678901234567890123456789AB012345678901234567890123456789AB'...)/utf 1621*22dc650dSSadaf EbrahimiFailed: error 148 at offset 132: subpattern name is too long (maximum 128 code units) 1622*22dc650dSSadaf Ebrahimi 1623*22dc650dSSadaf Ebrahimi/(?'ABZC6789012345678901234567890123012345678901234567890123456789AB012345678901234567890123456789AB012345678901234567890123456789AB'...)/utf 1624*22dc650dSSadaf Ebrahimi 1625*22dc650dSSadaf Ebrahimi/(?(n/utf 1626*22dc650dSSadaf EbrahimiFailed: error 142 at offset 4: syntax error in subpattern name (missing terminator?) 1627*22dc650dSSadaf Ebrahimi 1628*22dc650dSSadaf Ebrahimi/(?(á/utf 1629*22dc650dSSadaf EbrahimiFailed: error 142 at offset 5: syntax error in subpattern name (missing terminator?) 1630*22dc650dSSadaf Ebrahimi 1631*22dc650dSSadaf Ebrahimi# Invalid UTF-8 tests 1632*22dc650dSSadaf Ebrahimi 1633*22dc650dSSadaf Ebrahimi/.../g,match_invalid_utf 1634*22dc650dSSadaf Ebrahimi abcd\x80wxzy\x80pqrs 1635*22dc650dSSadaf Ebrahimi 0: abc 1636*22dc650dSSadaf Ebrahimi 0: wxz 1637*22dc650dSSadaf Ebrahimi 0: pqr 1638*22dc650dSSadaf Ebrahimi abcd\x{80}wxzy\x80pqrs 1639*22dc650dSSadaf Ebrahimi 0: abc 1640*22dc650dSSadaf Ebrahimi 0: d\x{80}w 1641*22dc650dSSadaf Ebrahimi 0: xzy 1642*22dc650dSSadaf Ebrahimi 0: pqr 1643*22dc650dSSadaf Ebrahimi 1644*22dc650dSSadaf Ebrahimi/abc/match_invalid_utf 1645*22dc650dSSadaf Ebrahimi ab\x80ab\=ph 1646*22dc650dSSadaf EbrahimiPartial match: ab 1647*22dc650dSSadaf Ebrahimi\= Expect no match 1648*22dc650dSSadaf Ebrahimi ab\x80cdef\=ph 1649*22dc650dSSadaf EbrahimiNo match 1650*22dc650dSSadaf Ebrahimi 1651*22dc650dSSadaf Ebrahimi/.a/match_invalid_utf 1652*22dc650dSSadaf Ebrahimi ab\=ph 1653*22dc650dSSadaf EbrahimiPartial match: b 1654*22dc650dSSadaf Ebrahimi ab\=ps 1655*22dc650dSSadaf EbrahimiPartial match: b 1656*22dc650dSSadaf Ebrahimi b\xf0\x91\x88b\=ph 1657*22dc650dSSadaf EbrahimiPartial match: b 1658*22dc650dSSadaf Ebrahimi b\xf0\x91\x88b\=ps 1659*22dc650dSSadaf EbrahimiPartial match: b 1660*22dc650dSSadaf Ebrahimi b\xf0\x91\x88\xb4a 1661*22dc650dSSadaf Ebrahimi 0: \x{11234}a 1662*22dc650dSSadaf Ebrahimi\= Expect no match 1663*22dc650dSSadaf Ebrahimi b\x80\=ph 1664*22dc650dSSadaf EbrahimiNo match 1665*22dc650dSSadaf Ebrahimi b\x80\=ps 1666*22dc650dSSadaf EbrahimiNo match 1667*22dc650dSSadaf Ebrahimi b\xf0\x91\x88\=ph 1668*22dc650dSSadaf EbrahimiNo match 1669*22dc650dSSadaf Ebrahimi b\xf0\x91\x88\=ps 1670*22dc650dSSadaf EbrahimiNo match 1671*22dc650dSSadaf Ebrahimi 1672*22dc650dSSadaf Ebrahimi/.a$/match_invalid_utf 1673*22dc650dSSadaf Ebrahimi ab\=ph 1674*22dc650dSSadaf EbrahimiPartial match: b 1675*22dc650dSSadaf Ebrahimi ab\=ps 1676*22dc650dSSadaf EbrahimiPartial match: b 1677*22dc650dSSadaf Ebrahimi\= Expect no match 1678*22dc650dSSadaf Ebrahimi b\xf0\x91\x98\=ph 1679*22dc650dSSadaf EbrahimiNo match 1680*22dc650dSSadaf Ebrahimi b\xf0\x91\x98\=ps 1681*22dc650dSSadaf EbrahimiNo match 1682*22dc650dSSadaf Ebrahimi 1683*22dc650dSSadaf Ebrahimi/ab$/match_invalid_utf 1684*22dc650dSSadaf Ebrahimi ab\x80cdeab 1685*22dc650dSSadaf Ebrahimi 0: ab 1686*22dc650dSSadaf Ebrahimi\= Expect no match 1687*22dc650dSSadaf Ebrahimi ab\x80cde 1688*22dc650dSSadaf EbrahimiNo match 1689*22dc650dSSadaf Ebrahimi 1690*22dc650dSSadaf Ebrahimi/.../g,match_invalid_utf 1691*22dc650dSSadaf Ebrahimi abcd\x{80}wxzy\x80pqrs 1692*22dc650dSSadaf Ebrahimi 0: abc 1693*22dc650dSSadaf Ebrahimi 0: d\x{80}w 1694*22dc650dSSadaf Ebrahimi 0: xzy 1695*22dc650dSSadaf Ebrahimi 0: pqr 1696*22dc650dSSadaf Ebrahimi 1697*22dc650dSSadaf Ebrahimi/(?<=x)../g,match_invalid_utf 1698*22dc650dSSadaf Ebrahimi abcd\x{80}wxzy\x80pqrs 1699*22dc650dSSadaf Ebrahimi 0: zy 1700*22dc650dSSadaf Ebrahimi abcd\x{80}wxzy\x80xpqrs 1701*22dc650dSSadaf Ebrahimi 0: zy 1702*22dc650dSSadaf Ebrahimi 0: pq 1703*22dc650dSSadaf Ebrahimi 1704*22dc650dSSadaf Ebrahimi/X$/match_invalid_utf 1705*22dc650dSSadaf Ebrahimi\= Expect no match 1706*22dc650dSSadaf Ebrahimi X\xc4 1707*22dc650dSSadaf EbrahimiNo match 1708*22dc650dSSadaf Ebrahimi 1709*22dc650dSSadaf Ebrahimi/(?<=..)X/match_invalid_utf,aftertext 1710*22dc650dSSadaf Ebrahimi AB\x80AQXYZ 1711*22dc650dSSadaf Ebrahimi 0: X 1712*22dc650dSSadaf Ebrahimi 0+ YZ 1713*22dc650dSSadaf Ebrahimi AB\x80AQXYZ\=offset=5 1714*22dc650dSSadaf Ebrahimi 0: X 1715*22dc650dSSadaf Ebrahimi 0+ YZ 1716*22dc650dSSadaf Ebrahimi AB\x80\x80AXYZXC\=offset=5 1717*22dc650dSSadaf Ebrahimi 0: X 1718*22dc650dSSadaf Ebrahimi 0+ C 1719*22dc650dSSadaf Ebrahimi\= Expect no match 1720*22dc650dSSadaf Ebrahimi AB\x80XYZ 1721*22dc650dSSadaf EbrahimiNo match 1722*22dc650dSSadaf Ebrahimi AB\x80XYZ\=offset=3 1723*22dc650dSSadaf EbrahimiNo match 1724*22dc650dSSadaf Ebrahimi AB\xfeXYZ 1725*22dc650dSSadaf EbrahimiNo match 1726*22dc650dSSadaf Ebrahimi AB\xffXYZ\=offset=3 1727*22dc650dSSadaf EbrahimiNo match 1728*22dc650dSSadaf Ebrahimi AB\x80AXYZ 1729*22dc650dSSadaf EbrahimiNo match 1730*22dc650dSSadaf Ebrahimi AB\x80AXYZ\=offset=4 1731*22dc650dSSadaf EbrahimiNo match 1732*22dc650dSSadaf Ebrahimi AB\x80\x80AXYZ\=offset=5 1733*22dc650dSSadaf EbrahimiNo match 1734*22dc650dSSadaf Ebrahimi 1735*22dc650dSSadaf Ebrahimi/.../match_invalid_utf 1736*22dc650dSSadaf Ebrahimi AB\xc4CCC 1737*22dc650dSSadaf Ebrahimi 0: CCC 1738*22dc650dSSadaf Ebrahimi\= Expect no match 1739*22dc650dSSadaf Ebrahimi A\x{d800}B 1740*22dc650dSSadaf EbrahimiNo match 1741*22dc650dSSadaf Ebrahimi A\x{110000}B 1742*22dc650dSSadaf EbrahimiNo match 1743*22dc650dSSadaf Ebrahimi A\xc4B 1744*22dc650dSSadaf EbrahimiNo match 1745*22dc650dSSadaf Ebrahimi 1746*22dc650dSSadaf Ebrahimi/\bX/match_invalid_utf 1747*22dc650dSSadaf Ebrahimi A\x80X 1748*22dc650dSSadaf Ebrahimi 0: X 1749*22dc650dSSadaf Ebrahimi 1750*22dc650dSSadaf Ebrahimi/\BX/match_invalid_utf 1751*22dc650dSSadaf Ebrahimi\= Expect no match 1752*22dc650dSSadaf Ebrahimi A\x80X 1753*22dc650dSSadaf EbrahimiNo match 1754*22dc650dSSadaf Ebrahimi 1755*22dc650dSSadaf Ebrahimi/(?<=...)X/match_invalid_utf 1756*22dc650dSSadaf Ebrahimi AAA\x80BBBXYZ 1757*22dc650dSSadaf Ebrahimi 0: X 1758*22dc650dSSadaf Ebrahimi\= Expect no match 1759*22dc650dSSadaf Ebrahimi AAA\x80BXYZ 1760*22dc650dSSadaf EbrahimiNo match 1761*22dc650dSSadaf Ebrahimi AAA\x80BBXYZ 1762*22dc650dSSadaf EbrahimiNo match 1763*22dc650dSSadaf Ebrahimi 1764*22dc650dSSadaf Ebrahimi# ------------------------------------- 1765*22dc650dSSadaf Ebrahimi 1766*22dc650dSSadaf Ebrahimi/(*UTF)(?=\x{123})/I 1767*22dc650dSSadaf EbrahimiCapture group count = 0 1768*22dc650dSSadaf EbrahimiMay match empty string 1769*22dc650dSSadaf EbrahimiCompile options: <none> 1770*22dc650dSSadaf EbrahimiOverall options: utf 1771*22dc650dSSadaf EbrahimiFirst code unit = \xc4 1772*22dc650dSSadaf EbrahimiLast code unit = \xa3 1773*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1774*22dc650dSSadaf Ebrahimi 1775*22dc650dSSadaf Ebrahimi/[\x{c1}\x{e1}]X[\x{145}\x{146}]/I,utf 1776*22dc650dSSadaf EbrahimiCapture group count = 0 1777*22dc650dSSadaf EbrahimiOptions: utf 1778*22dc650dSSadaf EbrahimiStarting code units: \xc3 1779*22dc650dSSadaf EbrahimiLast code unit = 'X' 1780*22dc650dSSadaf EbrahimiSubject length lower bound = 3 1781*22dc650dSSadaf Ebrahimi 1782*22dc650dSSadaf Ebrahimi/[,]/BI,utf 1783*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1784*22dc650dSSadaf Ebrahimi Bra 1785*22dc650dSSadaf Ebrahimi [,\x{fff9f}] 1786*22dc650dSSadaf Ebrahimi Ket 1787*22dc650dSSadaf Ebrahimi End 1788*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1789*22dc650dSSadaf EbrahimiCapture group count = 0 1790*22dc650dSSadaf EbrahimiOptions: utf 1791*22dc650dSSadaf EbrahimiStarting code units: , \xf3 1792*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1793*22dc650dSSadaf Ebrahimi 1794*22dc650dSSadaf Ebrahimi/[\x{fff4}-\x{ffff8}]/I,utf 1795*22dc650dSSadaf EbrahimiCapture group count = 0 1796*22dc650dSSadaf EbrahimiOptions: utf 1797*22dc650dSSadaf EbrahimiStarting code units: \xef \xf0 \xf1 \xf2 \xf3 1798*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1799*22dc650dSSadaf Ebrahimi 1800*22dc650dSSadaf Ebrahimi/[\x{fff4}-\x{afff8}\x{10ffff}]/I,utf 1801*22dc650dSSadaf EbrahimiCapture group count = 0 1802*22dc650dSSadaf EbrahimiOptions: utf 1803*22dc650dSSadaf EbrahimiStarting code units: \xef \xf0 \xf1 \xf2 \xf4 1804*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1805*22dc650dSSadaf Ebrahimi 1806*22dc650dSSadaf Ebrahimi/[\xff\x{ffff}]/I,utf 1807*22dc650dSSadaf EbrahimiCapture group count = 0 1808*22dc650dSSadaf EbrahimiOptions: utf 1809*22dc650dSSadaf EbrahimiStarting code units: \xc3 \xef 1810*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1811*22dc650dSSadaf Ebrahimi 1812*22dc650dSSadaf Ebrahimi/[\xff\x{ff}]/I,utf 1813*22dc650dSSadaf EbrahimiCapture group count = 0 1814*22dc650dSSadaf EbrahimiOptions: utf 1815*22dc650dSSadaf EbrahimiStarting code units: \xc3 1816*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1817*22dc650dSSadaf Ebrahimi abc\x{ff}def 1818*22dc650dSSadaf Ebrahimi 0: \x{ff} 1819*22dc650dSSadaf Ebrahimi 1820*22dc650dSSadaf Ebrahimi/[\xff\x{ff}]/I 1821*22dc650dSSadaf EbrahimiCapture group count = 0 1822*22dc650dSSadaf EbrahimiFirst code unit = \xff 1823*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1824*22dc650dSSadaf Ebrahimi abc\x{ff}def 1825*22dc650dSSadaf Ebrahimi 0: \xff 1826*22dc650dSSadaf Ebrahimi 1827*22dc650dSSadaf Ebrahimi/[Ss]/I 1828*22dc650dSSadaf EbrahimiCapture group count = 0 1829*22dc650dSSadaf EbrahimiFirst code unit = 'S' (caseless) 1830*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1831*22dc650dSSadaf Ebrahimi 1832*22dc650dSSadaf Ebrahimi/[Ss]/I,utf 1833*22dc650dSSadaf EbrahimiCapture group count = 0 1834*22dc650dSSadaf EbrahimiOptions: utf 1835*22dc650dSSadaf EbrahimiStarting code units: S s 1836*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1837*22dc650dSSadaf Ebrahimi 1838*22dc650dSSadaf Ebrahimi/(?:\x{ff}|\x{3000})/I,utf 1839*22dc650dSSadaf EbrahimiCapture group count = 0 1840*22dc650dSSadaf EbrahimiOptions: utf 1841*22dc650dSSadaf EbrahimiStarting code units: \xc3 \xe3 1842*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1843*22dc650dSSadaf Ebrahimi 1844*22dc650dSSadaf Ebrahimi/x/utf 1845*22dc650dSSadaf Ebrahimi abxyz 1846*22dc650dSSadaf Ebrahimi 0: x 1847*22dc650dSSadaf Ebrahimi \x80\=startchar 1848*22dc650dSSadaf EbrahimiFailed: error -22: UTF-8 error: isolated byte with 0x80 bit set at offset 0 1849*22dc650dSSadaf Ebrahimi abc\x80\=startchar 1850*22dc650dSSadaf EbrahimiFailed: error -22: UTF-8 error: isolated byte with 0x80 bit set at offset 3 1851*22dc650dSSadaf Ebrahimi abc\x80\=startchar,offset=3 1852*22dc650dSSadaf EbrahimiError -36 (bad UTF-8 offset) 1853*22dc650dSSadaf Ebrahimi 1854*22dc650dSSadaf Ebrahimi/\x{c1}+\x{e1}/iIB,ucp 1855*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1856*22dc650dSSadaf Ebrahimi Bra 1857*22dc650dSSadaf Ebrahimi /i \x{c1}+ 1858*22dc650dSSadaf Ebrahimi /i \x{e1} 1859*22dc650dSSadaf Ebrahimi Ket 1860*22dc650dSSadaf Ebrahimi End 1861*22dc650dSSadaf Ebrahimi------------------------------------------------------------------ 1862*22dc650dSSadaf EbrahimiCapture group count = 0 1863*22dc650dSSadaf EbrahimiOptions: caseless ucp 1864*22dc650dSSadaf EbrahimiFirst code unit = \xc1 (caseless) 1865*22dc650dSSadaf EbrahimiLast code unit = \xe1 (caseless) 1866*22dc650dSSadaf EbrahimiSubject length lower bound = 2 1867*22dc650dSSadaf Ebrahimi \x{c1}\x{c1}\x{c1} 1868*22dc650dSSadaf Ebrahimi 0: \xc1\xc1\xc1 1869*22dc650dSSadaf Ebrahimi \x{e1}\x{e1}\x{e1} 1870*22dc650dSSadaf Ebrahimi 0: \xe1\xe1\xe1 1871*22dc650dSSadaf Ebrahimi 1872*22dc650dSSadaf Ebrahimi/a|\x{c1}/iI,ucp 1873*22dc650dSSadaf EbrahimiCapture group count = 0 1874*22dc650dSSadaf EbrahimiOptions: caseless ucp 1875*22dc650dSSadaf EbrahimiStarting code units: A a \xc1 \xe1 1876*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1877*22dc650dSSadaf Ebrahimi \x{e1}xxx 1878*22dc650dSSadaf Ebrahimi 0: \xe1 1879*22dc650dSSadaf Ebrahimi 1880*22dc650dSSadaf Ebrahimi/a|\x{c1}/iI,utf 1881*22dc650dSSadaf EbrahimiCapture group count = 0 1882*22dc650dSSadaf EbrahimiOptions: caseless utf 1883*22dc650dSSadaf EbrahimiStarting code units: A a \xc3 1884*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1885*22dc650dSSadaf Ebrahimi \x{e1}xxx 1886*22dc650dSSadaf Ebrahimi 0: \x{e1} 1887*22dc650dSSadaf Ebrahimi 1888*22dc650dSSadaf Ebrahimi/\x{c1}|\x{e1}/iI,ucp 1889*22dc650dSSadaf EbrahimiCapture group count = 0 1890*22dc650dSSadaf EbrahimiOptions: caseless ucp 1891*22dc650dSSadaf EbrahimiFirst code unit = \xc1 (caseless) 1892*22dc650dSSadaf EbrahimiSubject length lower bound = 1 1893*22dc650dSSadaf Ebrahimi 1894*22dc650dSSadaf Ebrahimi/X(\x{e1})Y/ucp,replace=>\U$1<,substitute_extended 1895*22dc650dSSadaf Ebrahimi X\x{e1}Y 1896*22dc650dSSadaf Ebrahimi 1: >\xc1< 1897*22dc650dSSadaf Ebrahimi 1898*22dc650dSSadaf Ebrahimi/X(\x{e1})Y/i,ucp,replace=>\L$1<,substitute_extended 1899*22dc650dSSadaf Ebrahimi X\x{c1}Y 1900*22dc650dSSadaf Ebrahimi 1: >\xe1< 1901*22dc650dSSadaf Ebrahimi 1902*22dc650dSSadaf Ebrahimi# Without UTF or UCP characters > 127 have only one case in the default locale. 1903*22dc650dSSadaf Ebrahimi 1904*22dc650dSSadaf Ebrahimi/X(\x{e1})Y/replace=>\U$1<,substitute_extended 1905*22dc650dSSadaf Ebrahimi X\x{e1}Y 1906*22dc650dSSadaf Ebrahimi 1: >\xe1< 1907*22dc650dSSadaf Ebrahimi 1908*22dc650dSSadaf Ebrahimi/A/utf,match_invalid_utf,caseless 1909*22dc650dSSadaf Ebrahimi \xe5A 1910*22dc650dSSadaf Ebrahimi 0: A 1911*22dc650dSSadaf Ebrahimi 1912*22dc650dSSadaf Ebrahimi/\bch\b/utf,match_invalid_utf 1913*22dc650dSSadaf Ebrahimi qchq\=ph 1914*22dc650dSSadaf EbrahimiPartial match: 1915*22dc650dSSadaf Ebrahimi qchq\=ps 1916*22dc650dSSadaf EbrahimiPartial match: 1917*22dc650dSSadaf Ebrahimi 1918*22dc650dSSadaf Ebrahimi/line1\nbreak/firstline,utf,match_invalid_utf 1919*22dc650dSSadaf Ebrahimi line1\nbreak 1920*22dc650dSSadaf Ebrahimi 0: line1\x{0a}break 1921*22dc650dSSadaf Ebrahimi line0\nline1\nbreak 1922*22dc650dSSadaf EbrahimiNo match 1923*22dc650dSSadaf Ebrahimi 1924*22dc650dSSadaf Ebrahimi/A\z/utf,match_invalid_utf 1925*22dc650dSSadaf Ebrahimi A\x80\x42\n 1926*22dc650dSSadaf EbrahimiNo match 1927*22dc650dSSadaf Ebrahimi 1928*22dc650dSSadaf Ebrahimi# End of testinput10 1929