testinput4 57 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865
  1. # This set of tests is for UTF support, including Unicode properties. The
  2. # Unicode tests are all compatible with all versions of Perl >= 5.10, but
  3. # some of the property tests may differ because of different versions of
  4. # Unicode in use by PCRE2 and Perl.
  5. # WARNING: Use only / as the pattern delimiter. Although pcre2test supports
  6. # a number of delimiters, all those other than / give problems with the
  7. # perltest.sh script.
  8. #newline_default lf anycrlf any
  9. #perltest
  10. /a.b/utf
  11. acb
  12. a\x7fb
  13. a\x{100}b
  14. \= Expect no match
  15. a\nb
  16. /a(.{3})b/utf
  17. a\x{4000}xyb
  18. a\x{4000}\x7fyb
  19. a\x{4000}\x{100}yb
  20. \= Expect no match
  21. a\x{4000}b
  22. ac\ncb
  23. /a(.*?)(.)/
  24. a\xc0\x88b
  25. /a(.*?)(.)/utf
  26. a\x{100}b
  27. /a(.*)(.)/
  28. a\xc0\x88b
  29. /a(.*)(.)/utf
  30. a\x{100}b
  31. /a(.)(.)/
  32. a\xc0\x92bcd
  33. /a(.)(.)/utf
  34. a\x{240}bcd
  35. /a(.?)(.)/
  36. a\xc0\x92bcd
  37. /a(.?)(.)/utf
  38. a\x{240}bcd
  39. /a(.??)(.)/
  40. a\xc0\x92bcd
  41. /a(.??)(.)/utf
  42. a\x{240}bcd
  43. /a(.{3})b/utf
  44. a\x{1234}xyb
  45. a\x{1234}\x{4321}yb
  46. a\x{1234}\x{4321}\x{3412}b
  47. \= Expect no match
  48. a\x{1234}b
  49. ac\ncb
  50. /a(.{3,})b/utf
  51. a\x{1234}xyb
  52. a\x{1234}\x{4321}yb
  53. a\x{1234}\x{4321}\x{3412}b
  54. axxxxbcdefghijb
  55. a\x{1234}\x{4321}\x{3412}\x{3421}b
  56. \= Expect no match
  57. a\x{1234}b
  58. /a(.{3,}?)b/utf
  59. a\x{1234}xyb
  60. a\x{1234}\x{4321}yb
  61. a\x{1234}\x{4321}\x{3412}b
  62. axxxxbcdefghijb
  63. a\x{1234}\x{4321}\x{3412}\x{3421}b
  64. \= Expect no match
  65. a\x{1234}b
  66. /a(.{3,5})b/utf
  67. a\x{1234}xyb
  68. a\x{1234}\x{4321}yb
  69. a\x{1234}\x{4321}\x{3412}b
  70. axxxxbcdefghijb
  71. a\x{1234}\x{4321}\x{3412}\x{3421}b
  72. axbxxbcdefghijb
  73. axxxxxbcdefghijb
  74. \= Expect no match
  75. a\x{1234}b
  76. axxxxxxbcdefghijb
  77. /a(.{3,5}?)b/utf
  78. a\x{1234}xyb
  79. a\x{1234}\x{4321}yb
  80. a\x{1234}\x{4321}\x{3412}b
  81. axxxxbcdefghijb
  82. a\x{1234}\x{4321}\x{3412}\x{3421}b
  83. axbxxbcdefghijb
  84. axxxxxbcdefghijb
  85. \= Expect no match
  86. a\x{1234}b
  87. axxxxxxbcdefghijb
  88. /^[a\x{c0}]/utf
  89. \= Expect no match
  90. \x{100}
  91. /(?<=aXb)cd/utf
  92. aXbcd
  93. /(?<=a\x{100}b)cd/utf
  94. a\x{100}bcd
  95. /(?<=a\x{100000}b)cd/utf
  96. a\x{100000}bcd
  97. /(?:\x{100}){3}b/utf
  98. \x{100}\x{100}\x{100}b
  99. \= Expect no match
  100. \x{100}\x{100}b
  101. /\x{ab}/utf
  102. \x{ab}
  103. \xc2\xab
  104. \= Expect no match
  105. \x00{ab}
  106. /(?<=(.))X/utf
  107. WXYZ
  108. \x{256}XYZ
  109. \= Expect no match
  110. XYZ
  111. /[^a]+/g,utf
  112. bcd
  113. \x{100}aY\x{256}Z
  114. /^[^a]{2}/utf
  115. \x{100}bc
  116. /^[^a]{2,}/utf
  117. \x{100}bcAa
  118. /^[^a]{2,}?/utf
  119. \x{100}bca
  120. /[^a]+/gi,utf
  121. bcd
  122. \x{100}aY\x{256}Z
  123. /^[^a]{2}/i,utf
  124. \x{100}bc
  125. /^[^a]{2,}/i,utf
  126. \x{100}bcAa
  127. /^[^a]{2,}?/i,utf
  128. \x{100}bca
  129. /\x{100}{0,0}/utf
  130. abcd
  131. /\x{100}?/utf
  132. abcd
  133. \x{100}\x{100}
  134. /\x{100}{0,3}/utf
  135. \x{100}\x{100}
  136. \x{100}\x{100}\x{100}\x{100}
  137. /\x{100}*/utf
  138. abce
  139. \x{100}\x{100}\x{100}\x{100}
  140. /\x{100}{1,1}/utf
  141. abcd\x{100}\x{100}\x{100}\x{100}
  142. /\x{100}{1,3}/utf
  143. abcd\x{100}\x{100}\x{100}\x{100}
  144. /\x{100}+/utf
  145. abcd\x{100}\x{100}\x{100}\x{100}
  146. /\x{100}{3}/utf
  147. abcd\x{100}\x{100}\x{100}XX
  148. /\x{100}{3,5}/utf
  149. abcd\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}XX
  150. /\x{100}{3,}/utf
  151. abcd\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}XX
  152. /(?<=a\x{100}{2}b)X/utf,aftertext
  153. Xyyya\x{100}\x{100}bXzzz
  154. /\D*/utf
  155. aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa
  156. /\D*/utf
  157. \x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}
  158. /\D/utf
  159. 1X2
  160. 1\x{100}2
  161. />\S/utf
  162. > >X Y
  163. > >\x{100} Y
  164. /\d/utf
  165. \x{100}3
  166. /\s/utf
  167. \x{100} X
  168. /\D+/utf
  169. 12abcd34
  170. \= Expect no match
  171. 1234
  172. /\D{2,3}/utf
  173. 12abcd34
  174. 12ab34
  175. \= Expect no match
  176. 1234
  177. 12a34
  178. /\D{2,3}?/utf
  179. 12abcd34
  180. 12ab34
  181. \= Expect no match
  182. 1234
  183. 12a34
  184. /\d+/utf
  185. 12abcd34
  186. /\d{2,3}/utf
  187. 12abcd34
  188. 1234abcd
  189. \= Expect no match
  190. 1.4
  191. /\d{2,3}?/utf
  192. 12abcd34
  193. 1234abcd
  194. \= Expect no match
  195. 1.4
  196. /\S+/utf
  197. 12abcd34
  198. \= Expect no match
  199. \ \
  200. /\S{2,3}/utf
  201. 12abcd34
  202. 1234abcd
  203. \= Expect no match
  204. \ \
  205. /\S{2,3}?/utf
  206. 12abcd34
  207. 1234abcd
  208. \= Expect no match
  209. \ \
  210. />\s+</utf,aftertext
  211. 12> <34
  212. />\s{2,3}</utf,aftertext
  213. ab> <cd
  214. ab> <ce
  215. \= Expect no match
  216. ab> <cd
  217. />\s{2,3}?</utf,aftertext
  218. ab> <cd
  219. ab> <ce
  220. \= Expect no match
  221. ab> <cd
  222. /\w+/utf
  223. 12 34
  224. \= Expect no match
  225. +++=*!
  226. /\w{2,3}/utf
  227. ab cd
  228. abcd ce
  229. \= Expect no match
  230. a.b.c
  231. /\w{2,3}?/utf
  232. ab cd
  233. abcd ce
  234. \= Expect no match
  235. a.b.c
  236. /\W+/utf
  237. 12====34
  238. \= Expect no match
  239. abcd
  240. /\W{2,3}/utf
  241. ab====cd
  242. ab==cd
  243. \= Expect no match
  244. a.b.c
  245. /\W{2,3}?/utf
  246. ab====cd
  247. ab==cd
  248. \= Expect no match
  249. a.b.c
  250. /[\x{100}]/utf
  251. \x{100}
  252. Z\x{100}
  253. \x{100}Z
  254. /[Z\x{100}]/utf
  255. Z\x{100}
  256. \x{100}
  257. \x{100}Z
  258. /[\x{100}\x{200}]/utf
  259. ab\x{100}cd
  260. ab\x{200}cd
  261. /[\x{100}-\x{200}]/utf
  262. ab\x{100}cd
  263. ab\x{200}cd
  264. ab\x{111}cd
  265. /[z-\x{200}]/utf
  266. ab\x{100}cd
  267. ab\x{200}cd
  268. ab\x{111}cd
  269. abzcd
  270. ab|cd
  271. /[Q\x{100}\x{200}]/utf
  272. ab\x{100}cd
  273. ab\x{200}cd
  274. Q?
  275. /[Q\x{100}-\x{200}]/utf
  276. ab\x{100}cd
  277. ab\x{200}cd
  278. ab\x{111}cd
  279. Q?
  280. /[Qz-\x{200}]/utf
  281. ab\x{100}cd
  282. ab\x{200}cd
  283. ab\x{111}cd
  284. abzcd
  285. ab|cd
  286. Q?
  287. /[\x{100}\x{200}]{1,3}/utf
  288. ab\x{100}cd
  289. ab\x{200}cd
  290. ab\x{200}\x{100}\x{200}\x{100}cd
  291. /[\x{100}\x{200}]{1,3}?/utf
  292. ab\x{100}cd
  293. ab\x{200}cd
  294. ab\x{200}\x{100}\x{200}\x{100}cd
  295. /[Q\x{100}\x{200}]{1,3}/utf
  296. ab\x{100}cd
  297. ab\x{200}cd
  298. ab\x{200}\x{100}\x{200}\x{100}cd
  299. /[Q\x{100}\x{200}]{1,3}?/utf
  300. ab\x{100}cd
  301. ab\x{200}cd
  302. ab\x{200}\x{100}\x{200}\x{100}cd
  303. /(?<=[\x{100}\x{200}])X/utf
  304. abc\x{200}X
  305. abc\x{100}X
  306. \= Expect no match
  307. X
  308. /(?<=[Q\x{100}\x{200}])X/utf
  309. abc\x{200}X
  310. abc\x{100}X
  311. abQX
  312. \= Expect no match
  313. X
  314. /(?<=[\x{100}\x{200}]{3})X/utf
  315. abc\x{100}\x{200}\x{100}X
  316. \= Expect no match
  317. abc\x{200}X
  318. X
  319. /[^\x{100}\x{200}]X/utf
  320. AX
  321. \x{150}X
  322. \x{500}X
  323. \= Expect no match
  324. \x{100}X
  325. \x{200}X
  326. /[^Q\x{100}\x{200}]X/utf
  327. AX
  328. \x{150}X
  329. \x{500}X
  330. \= Expect no match
  331. \x{100}X
  332. \x{200}X
  333. QX
  334. /[^\x{100}-\x{200}]X/utf
  335. AX
  336. \x{500}X
  337. \= Expect no match
  338. \x{100}X
  339. \x{150}X
  340. \x{200}X
  341. /[z-\x{100}]/i,utf
  342. z
  343. Z
  344. \x{100}
  345. \= Expect no match
  346. \x{102}
  347. y
  348. /[\xFF]/
  349. >\xff<
  350. /[\xff]/utf
  351. >\x{ff}<
  352. /[^\xFF]/
  353. XYZ
  354. /[^\xff]/utf
  355. XYZ
  356. \x{123}
  357. /^[ac]*b/utf
  358. \= Expect no match
  359. xb
  360. /^[ac\x{100}]*b/utf
  361. \= Expect no match
  362. xb
  363. /^[^x]*b/i,utf
  364. \= Expect no match
  365. xb
  366. /^[^x]*b/utf
  367. \= Expect no match
  368. xb
  369. /^\d*b/utf
  370. \= Expect no match
  371. xb
  372. /(|a)/g,utf
  373. catac
  374. a\x{256}a
  375. /^\x{85}$/i,utf
  376. \x{85}
  377. /^ሴ/utf
  378. /^\ሴ/utf
  379. /(?s)(.{1,5})/utf
  380. abcdefg
  381. ab
  382. /a*\x{100}*\w/utf
  383. a
  384. /\S\S/g,utf
  385. A\x{a3}BC
  386. /\S{2}/g,utf
  387. A\x{a3}BC
  388. /\W\W/g,utf
  389. +\x{a3}==
  390. /\W{2}/g,utf
  391. +\x{a3}==
  392. /\S/g,utf
  393. \x{442}\x{435}\x{441}\x{442}
  394. /[\S]/g,utf
  395. \x{442}\x{435}\x{441}\x{442}
  396. /\D/g,utf
  397. \x{442}\x{435}\x{441}\x{442}
  398. /[\D]/g,utf
  399. \x{442}\x{435}\x{441}\x{442}
  400. /\W/g,utf
  401. \x{2442}\x{2435}\x{2441}\x{2442}
  402. /[\W]/g,utf
  403. \x{2442}\x{2435}\x{2441}\x{2442}
  404. /[\S\s]*/utf
  405. abc\n\r\x{442}\x{435}\x{441}\x{442}xyz
  406. /[\x{41f}\S]/g,utf
  407. \x{442}\x{435}\x{441}\x{442}
  408. /.[^\S]./g,utf
  409. abc def\x{442}\x{443}xyz\npqr
  410. /.[^\S\n]./g,utf
  411. abc def\x{442}\x{443}xyz\npqr
  412. /[[:^alnum:]]/g,utf
  413. +\x{2442}
  414. /[[:^alpha:]]/g,utf
  415. +\x{2442}
  416. /[[:^ascii:]]/g,utf
  417. A\x{442}
  418. /[[:^blank:]]/g,utf
  419. A\x{442}
  420. /[[:^cntrl:]]/g,utf
  421. A\x{442}
  422. /[[:^digit:]]/g,utf
  423. A\x{442}
  424. /[[:^graph:]]/g,utf
  425. \x19\x{e01ff}
  426. /[[:^lower:]]/g,utf
  427. A\x{422}
  428. /[[:^print:]]/g,utf
  429. \x{19}\x{e01ff}
  430. /[[:^punct:]]/g,utf
  431. A\x{442}
  432. /[[:^space:]]/g,utf
  433. A\x{442}
  434. /[[:^upper:]]/g,utf
  435. a\x{442}
  436. /[[:^word:]]/g,utf
  437. +\x{2442}
  438. /[[:^xdigit:]]/g,utf
  439. M\x{442}
  440. /[^ABCDEFGHIJKLMNOPQRSTUVWXYZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞĀĂĄĆĈĊČĎĐĒĔĖĘĚĜĞĠĢĤĦĨĪĬĮİIJĴĶĹĻĽĿŁŃŅŇŊŌŎŐŒŔŖŘŚŜŞŠŢŤŦŨŪŬŮŰŲŴŶŸŹŻŽƁƂƄƆƇƉƊƋƎƏƐƑƓƔƖƗƘƜƝƟƠƢƤƦƧƩƬƮƯƱƲƳƵƷƸƼDŽLJNJǍǏǑǓǕǗǙǛǞǠǢǤǦǨǪǬǮDZǴǶǷǸǺǼǾȀȂȄȆȈȊȌȎȐȒȔȖȘȚȜȞȠȢȤȦȨȪȬȮȰȲȺȻȽȾɁΆΈΉΊΌΎΏΑΒΓΔΕΖΗΘΙΚΛΜΝΞΟΠΡΣΤΥΦΧΨΩΪΫϒϓϔϘϚϜϞϠϢϤϦϨϪϬϮϴϷϹϺϽϾϿЀЁЂЃЄЅІЇЈЉЊЋЌЍЎЏАБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯѠѢѤѦѨѪѬѮѰѲѴѶѸѺѼѾҀҊҌҎҐҒҔҖҘҚҜҞҠҢҤҦҨҪҬҮҰҲҴҶҸҺҼҾӀӁӃӅӇӉӋӍӐӒӔӖӘӚӜӞӠӢӤӦӨӪӬӮӰӲӴӶӸԀԂԄԆԈԊԌԎԱԲԳԴԵԶԷԸԹԺԻԼԽԾԿՀՁՂՃՄՅՆՇՈՉՊՋՌՍՎՏՐՑՒՓՔՕՖႠႡႢႣႤႥႦႧႨႩႪႫႬႭႮႯႰႱႲႳႴႵႶႷႸႹႺႻႼႽႾႿჀჁჂჃჄჅḀḂḄḆḈḊḌḎḐḒḔḖḘḚḜḞḠḢḤḦḨḪḬḮḰḲḴḶḸḺḼḾṀṂṄṆṈṊṌṎṐṒṔṖṘṚṜṞṠṢṤṦṨṪṬṮṰṲṴṶṸṺṼṾẀẂẄẆẈẊẌẎẐẒẔẠẢẤẦẨẪẬẮẰẲẴẶẸẺẼẾỀỂỄỆỈỊỌỎỐỒỔỖỘỚỜỞỠỢỤỦỨỪỬỮỰỲỴỶỸἈἉἊἋἌἍἎἏἘἙἚἛἜἝἨἩἪἫἬἭἮἯἸἹἺἻἼἽἾἿὈὉὊὋὌὍὙὛὝὟὨὩὪὫὬὭὮὯᾸᾹᾺΆῈΈῊΉῘῙῚΊῨῩῪΎῬῸΌῺΏabcdefghijklmnopqrstuvwxyzªµºßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿāăąćĉċčďđēĕėęěĝğġģĥħĩīĭįıijĵķĸĺļľŀłńņňʼnŋōŏőœŕŗřśŝşšţťŧũūŭůűųŵŷźżžſƀƃƅƈƌƍƒƕƙƚƛƞơƣƥƨƪƫƭưƴƶƹƺƽƾƿdžljnjǎǐǒǔǖǘǚǜǝǟǡǣǥǧǩǫǭǯǰdzǵǹǻǽǿȁȃȅȇȉȋȍȏȑȓȕȗșțȝȟȡȣȥȧȩȫȭȯȱȳȴȵȶȷȸȹȼȿɀɐɑɒɓɔɕɖɗɘəɚɛɜɝɞɟɠɡɢɣɤɥɦɧɨɩɪɫɬɭɮɯɰɱɲɳɴɵɶɷɸɹɺɻɼɽɾɿʀʁʂʃʄʅʆʇʈʉʊʋʌʍʎʏʐʑʒʓʔʕʖʗʘʙʚʛʜʝʞʟʠʡʢʣʤʥʦʧʨʩʪʫʬʭʮʯΐάέήίΰαβγδεζηθικλμνξοπρςστυφχψωϊϋόύώϐϑϕϖϗϙϛϝϟϡϣϥϧϩϫϭϯϰϱϲϳϵϸϻϼабвгдежзийклмнопрстуфхцчшщъыьэюяѐёђѓєѕіїјљњћќѝўџѡѣѥѧѩѫѭѯѱѳѵѷѹѻѽѿҁҋҍҏґғҕҗҙқҝҟҡңҥҧҩҫҭүұҳҵҷҹһҽҿӂӄӆӈӊӌӎӑӓӕӗәӛӝӟӡӣӥӧөӫӭӯӱӳӵӷӹԁԃԅԇԉԋԍԏաբգդեզէըթժիլխծկհձղճմյնշոչպջռսվտրցւփքօֆևᴀᴁᴂᴃᴄᴅᴆᴇᴈᴉᴊᴋᴌᴍᴎᴏᴐᴑᴒᴓᴔᴕᴖᴗᴘᴙᴚᴛᴜᴝᴞᴟᴠᴡᴢᴣᴤᴥᴦᴧᴨᴩᴪᴫᵢᵣᵤᵥᵦᵧᵨᵩᵪᵫᵬᵭᵮᵯᵰᵱᵲᵳᵴᵵᵶᵷᵹᵺᵻᵼᵽᵾᵿᶀᶁᶂᶃᶄᶅᶆᶇᶈᶉᶊᶋᶌᶍᶎᶏᶐᶑᶒᶓᶔᶕᶖᶗᶘᶙᶚḁḃḅḇḉḋḍḏḑḓḕḗḙḛḝḟḡḣḥḧḩḫḭḯḱḳḵḷḹḻḽḿṁṃṅṇṉṋṍṏṑṓṕṗṙṛṝṟṡṣṥṧṩṫṭṯṱṳṵṷṹṻṽṿẁẃẅẇẉẋẍẏẑẓẕẖẗẘẙẚẛạảấầẩẫậắằẳẵặẹẻẽếềểễệỉịọỏốồổỗộớờởỡợụủứừửữựỳỵỷỹἀἁἂἃἄἅἆἇἐἑἒἓἔἕἠἡἢἣἤἥἦἧἰἱἲἳἴἵἶἷὀὁὂὃὄὅὐὑὒὓὔὕὖὗὠὡὢὣὤὥὦὧὰάὲέὴήὶίὸόὺύὼώᾀᾁᾂᾃᾄᾅᾆᾇᾐᾑᾒᾓᾔᾕᾖᾗᾠᾡᾢᾣᾤᾥᾦᾧᾰᾱᾲᾳᾴᾶᾷιῂῃῄῆῇῐῑῒΐῖῗῠῡῢΰῤῥῦῧῲῳῴῶῷⲁⲃⲅⲇⲉⲋⲍⲏⲑⲓⲕⲗⲙⲛⲝⲟⲡⲣⲥⲧⲩⲫⲭⲯⲱⲳⲵⲷⲹⲻⲽⲿⳁⳃⳅⳇⳉⳋⳍⳏⳑⳓⳕⳗⳙⳛⳝⳟⳡⳣⳤⴀⴁⴂⴃⴄⴅⴆⴇⴈⴉⴊⴋⴌⴍⴎⴏⴐⴑⴒⴓⴔⴕⴖⴗⴘⴙⴚⴛⴜⴝⴞⴟⴠⴡⴢⴣⴤⴥfffiflffifflſtstﬓﬔﬕﬖﬗ\d_^]/utf
  441. /^[^d]*?$/
  442. abc
  443. /^[^d]*?$/utf
  444. abc
  445. /^[^d]*?$/i
  446. abc
  447. /^[^d]*?$/i,utf
  448. abc
  449. /(?i)[\xc3\xa9\xc3\xbd]|[\xc3\xa9\xc3\xbdA]/utf
  450. /^[a\x{c0}]b/utf
  451. \x{c0}b
  452. /^([a\x{c0}]*?)aa/utf
  453. a\x{c0}aaaa/
  454. /^([a\x{c0}]*?)aa/utf
  455. a\x{c0}aaaa/
  456. a\x{c0}a\x{c0}aaa/
  457. /^([a\x{c0}]*)aa/utf
  458. a\x{c0}aaaa/
  459. a\x{c0}a\x{c0}aaa/
  460. /^([a\x{c0}]*)a\x{c0}/utf
  461. a\x{c0}aaaa/
  462. a\x{c0}a\x{c0}aaa/
  463. /A*/g,utf
  464. AAB\x{123}BAA
  465. /(abc)\1/i,utf
  466. \= Expect no match
  467. abc
  468. /(abc)\1/utf
  469. \= Expect no match
  470. abc
  471. /a(*:a\x{1234}b)/utf,mark
  472. abc
  473. /a(*:a£b)/utf,mark
  474. abc
  475. # Noncharacters
  476. /./utf
  477. \x{fffe}
  478. \x{ffff}
  479. \x{1fffe}
  480. \x{1ffff}
  481. \x{2fffe}
  482. \x{2ffff}
  483. \x{3fffe}
  484. \x{3ffff}
  485. \x{4fffe}
  486. \x{4ffff}
  487. \x{5fffe}
  488. \x{5ffff}
  489. \x{6fffe}
  490. \x{6ffff}
  491. \x{7fffe}
  492. \x{7ffff}
  493. \x{8fffe}
  494. \x{8ffff}
  495. \x{9fffe}
  496. \x{9ffff}
  497. \x{afffe}
  498. \x{affff}
  499. \x{bfffe}
  500. \x{bffff}
  501. \x{cfffe}
  502. \x{cffff}
  503. \x{dfffe}
  504. \x{dffff}
  505. \x{efffe}
  506. \x{effff}
  507. \x{ffffe}
  508. \x{fffff}
  509. \x{10fffe}
  510. \x{10ffff}
  511. \x{fdd0}
  512. \x{fdd1}
  513. \x{fdd2}
  514. \x{fdd3}
  515. \x{fdd4}
  516. \x{fdd5}
  517. \x{fdd6}
  518. \x{fdd7}
  519. \x{fdd8}
  520. \x{fdd9}
  521. \x{fdda}
  522. \x{fddb}
  523. \x{fddc}
  524. \x{fddd}
  525. \x{fdde}
  526. \x{fddf}
  527. \x{fde0}
  528. \x{fde1}
  529. \x{fde2}
  530. \x{fde3}
  531. \x{fde4}
  532. \x{fde5}
  533. \x{fde6}
  534. \x{fde7}
  535. \x{fde8}
  536. \x{fde9}
  537. \x{fdea}
  538. \x{fdeb}
  539. \x{fdec}
  540. \x{fded}
  541. \x{fdee}
  542. \x{fdef}
  543. /^\d*\w{4}/utf
  544. 1234
  545. \= Expect no match
  546. 123
  547. /^[^b]*\w{4}/utf
  548. aaaa
  549. \= Expect no match
  550. aaa
  551. /^[^b]*\w{4}/i,utf
  552. aaaa
  553. \= Expect no match
  554. aaa
  555. /^\x{100}*.{4}/utf
  556. \x{100}\x{100}\x{100}\x{100}
  557. \= Expect no match
  558. \x{100}\x{100}\x{100}
  559. /^\x{100}*.{4}/i,utf
  560. \x{100}\x{100}\x{100}\x{100}
  561. \= Expect no match
  562. \x{100}\x{100}\x{100}
  563. /^a+[a\x{200}]/utf
  564. aa
  565. /^.\B.\B./utf
  566. \x{10123}\x{10124}\x{10125}
  567. /^#[^\x{ffff}]#[^\x{ffff}]#[^\x{ffff}]#/utf
  568. #\x{10000}#\x{100}#\x{10ffff}#
  569. # Unicode property support tests
  570. /^\pC\pL\pM\pN\pP\pS\pZ</utf
  571. \x7f\x{c0}\x{30f}\x{660}\x{66c}\x{f01}\x{1680}<
  572. \np\x{300}9!\$ <
  573. \= Expect no match
  574. ap\x{300}9!\$ <
  575. /^\PC/utf
  576. X
  577. \= Expect no match
  578. \x7f
  579. /^\PL/utf
  580. 9
  581. \= Expect no match
  582. \x{c0}
  583. /^\PM/utf
  584. X
  585. \= Expect no match
  586. \x{30f}
  587. /^\PN/utf
  588. X
  589. \= Expect no match
  590. \x{660}
  591. /^\PP/utf
  592. X
  593. \= Expect no match
  594. \x{66c}
  595. /^\PS/utf
  596. X
  597. \= Expect no match
  598. \x{f01}
  599. /^\PZ/utf
  600. X
  601. \= Expect no match
  602. \x{1680}
  603. /^\p{Cc}/utf
  604. \x{017}
  605. \x{09f}
  606. \= Expect no match
  607. \x{0600}
  608. /^\p{Cf}/utf
  609. \x{601}
  610. \= Expect no match
  611. \x{09f}
  612. /^\p{Cn}/utf
  613. \x{e0000}
  614. \= Expect no match
  615. \x{09f}
  616. /^\p{Co}/utf
  617. \x{f8ff}
  618. \= Expect no match
  619. \x{09f}
  620. /^\p{Ll}/utf
  621. a
  622. \= Expect no match
  623. Z
  624. \x{e000}
  625. /^\p{Lm}/utf
  626. \x{2b0}
  627. \= Expect no match
  628. a
  629. /^\p{Lo}/utf
  630. \x{1bb}
  631. \x{3400}
  632. \x{3401}
  633. \x{4d00}
  634. \x{4db4}
  635. \x{4db5}
  636. \x{4db6}
  637. \= Expect no match
  638. a
  639. \x{2b0}
  640. /^\p{Lt}/utf
  641. \x{1c5}
  642. \= Expect no match
  643. a
  644. \x{2b0}
  645. /^\p{Lu}/utf
  646. A
  647. \= Expect no match
  648. \x{2b0}
  649. /^\p{Mc}/utf
  650. \x{903}
  651. \= Expect no match
  652. X
  653. \x{300}
  654. /^\p{Me}/utf
  655. \x{488}
  656. \= Expect no match
  657. X
  658. \x{903}
  659. \x{300}
  660. /^\p{Mn}/utf
  661. \x{300}
  662. \= Expect no match
  663. X
  664. \x{903}
  665. /^\p{Nd}+/utf
  666. 0123456789\x{660}\x{661}\x{662}\x{663}\x{664}\x{665}\x{666}\x{667}\x{668}\x{669}\x{66a}
  667. \x{6f0}\x{6f1}\x{6f2}\x{6f3}\x{6f4}\x{6f5}\x{6f6}\x{6f7}\x{6f8}\x{6f9}\x{6fa}
  668. \x{966}\x{967}\x{968}\x{969}\x{96a}\x{96b}\x{96c}\x{96d}\x{96e}\x{96f}\x{970}
  669. \= Expect no match
  670. X
  671. /^\p{Nl}/utf
  672. \x{16ee}
  673. \= Expect no match
  674. X
  675. \x{966}
  676. /^\p{No}/utf
  677. \x{b2}
  678. \x{b3}
  679. \= Expect no match
  680. X
  681. \x{16ee}
  682. /^\p{Pc}/utf
  683. \x5f
  684. \x{203f}
  685. \= Expect no match
  686. X
  687. -
  688. \x{58a}
  689. /^\p{Pd}/utf
  690. -
  691. \x{58a}
  692. \= Expect no match
  693. X
  694. \x{203f}
  695. /^\p{Pe}/utf
  696. )
  697. ]
  698. }
  699. \x{f3b}
  700. \= Expect no match
  701. X
  702. \x{203f}
  703. (
  704. [
  705. {
  706. \x{f3c}
  707. /^\p{Pf}/utf
  708. \x{bb}
  709. \x{2019}
  710. \= Expect no match
  711. X
  712. \x{203f}
  713. /^\p{Pi}/utf
  714. \x{ab}
  715. \x{2018}
  716. \= Expect no match
  717. X
  718. \x{203f}
  719. /^\p{Po}/utf
  720. !
  721. \x{37e}
  722. \= Expect no match
  723. X
  724. \x{203f}
  725. /^\p{Ps}/utf
  726. (
  727. [
  728. {
  729. \x{f3c}
  730. \= Expect no match
  731. X
  732. )
  733. ]
  734. }
  735. \x{f3b}
  736. /^\p{Sk}/utf
  737. \x{2c2}
  738. \= Expect no match
  739. X
  740. \x{9f2}
  741. /^\p{Sm}+/utf
  742. +<|~\x{ac}\x{2044}
  743. \= Expect no match
  744. X
  745. \x{9f2}
  746. /^\p{So}/utf
  747. \x{a6}
  748. \x{482}
  749. \= Expect no match
  750. X
  751. \x{9f2}
  752. /^\p{Zl}/utf
  753. \x{2028}
  754. \= Expect no match
  755. X
  756. \x{2029}
  757. /^\p{Zp}/utf
  758. \x{2029}
  759. \= Expect no match
  760. X
  761. \x{2028}
  762. /\p{Nd}+(..)/utf
  763. \x{660}\x{661}\x{662}ABC
  764. /\p{Nd}+?(..)/utf
  765. \x{660}\x{661}\x{662}ABC
  766. /\p{Nd}{2,}(..)/utf
  767. \x{660}\x{661}\x{662}ABC
  768. /\p{Nd}{2,}?(..)/utf
  769. \x{660}\x{661}\x{662}ABC
  770. /\p{Nd}*(..)/utf
  771. \x{660}\x{661}\x{662}ABC
  772. /\p{Nd}*?(..)/utf
  773. \x{660}\x{661}\x{662}ABC
  774. /\p{Nd}{2}(..)/utf
  775. \x{660}\x{661}\x{662}ABC
  776. /\p{Nd}{2,3}(..)/utf
  777. \x{660}\x{661}\x{662}ABC
  778. /\p{Nd}{2,3}?(..)/utf
  779. \x{660}\x{661}\x{662}ABC
  780. /\p{Nd}?(..)/utf
  781. \x{660}\x{661}\x{662}ABC
  782. /\p{Nd}??(..)/utf
  783. \x{660}\x{661}\x{662}ABC
  784. /\p{Nd}*+(..)/utf
  785. \x{660}\x{661}\x{662}ABC
  786. /\p{Nd}*+(...)/utf
  787. \x{660}\x{661}\x{662}ABC
  788. /\p{Nd}*+(....)/utf
  789. \= Expect no match
  790. \x{660}\x{661}\x{662}ABC
  791. /(?<=A\p{Nd})XYZ/utf
  792. A2XYZ
  793. 123A5XYZPQR
  794. ABA\x{660}XYZpqr
  795. \= Expect no match
  796. AXYZ
  797. XYZ
  798. /(?<!\pL)XYZ/utf
  799. 1XYZ
  800. AB=XYZ..
  801. XYZ
  802. \= Expect no match
  803. WXYZ
  804. /[\P{Nd}]+/utf
  805. abcd
  806. \= Expect no match
  807. 1234
  808. /\D+/utf
  809. aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa
  810. \= Expect no match
  811. 11111111111111111111111111111111111111111111111111111111111111111111111
  812. /\P{Nd}+/utf
  813. aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa
  814. \= Expect no match
  815. 11111111111111111111111111111111111111111111111111111111111111111111111
  816. /[\D]+/utf
  817. aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa
  818. \= Expect no match
  819. 11111111111111111111111111111111111111111111111111111111111111111111111
  820. /[\P{Nd}]+/utf
  821. aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa
  822. \= Expect no match
  823. 11111111111111111111111111111111111111111111111111111111111111111111111
  824. /[\D\P{Nd}]+/utf
  825. aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa
  826. \= Expect no match
  827. 11111111111111111111111111111111111111111111111111111111111111111111111
  828. /\pL/utf
  829. a
  830. A
  831. /\pL/i,utf
  832. a
  833. A
  834. /\p{Lu}/utf
  835. A
  836. aZ
  837. \= Expect no match
  838. abc
  839. /\p{Ll}/utf
  840. a
  841. Az
  842. \= Expect no match
  843. ABC
  844. /A\x{391}\x{10427}\x{ff3a}\x{1fb0}/utf
  845. A\x{391}\x{10427}\x{ff3a}\x{1fb0}
  846. \= Expect no match
  847. a\x{391}\x{10427}\x{ff3a}\x{1fb0}
  848. A\x{3b1}\x{10427}\x{ff3a}\x{1fb0}
  849. A\x{391}\x{1044F}\x{ff3a}\x{1fb0}
  850. A\x{391}\x{10427}\x{ff5a}\x{1fb0}
  851. A\x{391}\x{10427}\x{ff3a}\x{1fb8}
  852. /A\x{391}\x{10427}\x{ff3a}\x{1fb0}/i,utf
  853. A\x{391}\x{10427}\x{ff3a}\x{1fb0}
  854. a\x{391}\x{10427}\x{ff3a}\x{1fb0}
  855. A\x{3b1}\x{10427}\x{ff3a}\x{1fb0}
  856. A\x{391}\x{1044F}\x{ff3a}\x{1fb0}
  857. A\x{391}\x{10427}\x{ff5a}\x{1fb0}
  858. A\x{391}\x{10427}\x{ff3a}\x{1fb8}
  859. /\x{391}+/i,utf
  860. \x{391}\x{3b1}\x{3b1}\x{3b1}\x{391}
  861. /\x{391}{3,5}(.)/i,utf
  862. \x{391}\x{3b1}\x{3b1}\x{3b1}\x{391}X
  863. /\x{391}{3,5}?(.)/i,utf
  864. \x{391}\x{3b1}\x{3b1}\x{3b1}\x{391}X
  865. /[\x{391}\x{ff3a}]/i,utf
  866. \x{391}
  867. \x{ff3a}
  868. \x{3b1}
  869. \x{ff5a}
  870. /^(\X*)C/utf
  871. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}
  872. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}C
  873. /^(\X*?)C/utf
  874. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}
  875. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}C
  876. /^(\X*)(.)/utf
  877. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}
  878. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}C
  879. /^(\X*?)(.)/utf
  880. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}
  881. A\x{300}\x{301}\x{302}BCA\x{300}\x{301}C
  882. /^\X(.)/utf
  883. \= Expect no match
  884. A\x{300}\x{301}\x{302}
  885. /^\X{2,3}(.)/utf
  886. A\x{300}\x{301}B\x{300}X
  887. A\x{300}\x{301}B\x{300}C\x{300}\x{301}
  888. A\x{300}\x{301}B\x{300}C\x{300}\x{301}X
  889. A\x{300}\x{301}B\x{300}C\x{300}\x{301}DA\x{300}X
  890. /^\X{2,3}?(.)/utf
  891. A\x{300}\x{301}B\x{300}X
  892. A\x{300}\x{301}B\x{300}C\x{300}\x{301}
  893. A\x{300}\x{301}B\x{300}C\x{300}\x{301}X
  894. A\x{300}\x{301}B\x{300}C\x{300}\x{301}DA\x{300}X
  895. /^\X/utf
  896. A
  897. A\x{300}BC
  898. A\x{300}\x{301}\x{302}BC
  899. \x{300}
  900. /^\p{Han}+/utf
  901. \x{2e81}\x{3007}\x{2f804}\x{31a0}
  902. \= Expect no match
  903. \x{2e7f}
  904. /^[\p{Arabic}]/utf
  905. \x{06e9}
  906. \x{060b}
  907. \= Expect no match
  908. X\x{06e9}
  909. /^\P{Katakana}+/utf
  910. \x{3105}
  911. \= Expect no match
  912. \x{30ff}
  913. /^[\P{Yi}]/utf
  914. \x{2f800}
  915. \= Expect no match
  916. \x{a014}
  917. \x{a4c6}
  918. /^\p{Any}X/utf
  919. AXYZ
  920. \x{1234}XYZ
  921. \= Expect no match
  922. X
  923. /^\P{Any}X/utf
  924. \= Expect no match
  925. AX
  926. /^\p{Any}?X/utf
  927. XYZ
  928. AXYZ
  929. \x{1234}XYZ
  930. \= Expect no match
  931. ABXYZ
  932. /^\P{Any}?X/utf
  933. XYZ
  934. \= Expect no match
  935. AXYZ
  936. \x{1234}XYZ
  937. ABXYZ
  938. /^\p{Any}+X/utf
  939. AXYZ
  940. \x{1234}XYZ
  941. A\x{1234}XYZ
  942. \= Expect no match
  943. XYZ
  944. /^\P{Any}+X/utf
  945. \= Expect no match
  946. AXYZ
  947. \x{1234}XYZ
  948. A\x{1234}XYZ
  949. XYZ
  950. /^\p{Any}*X/utf
  951. XYZ
  952. AXYZ
  953. \x{1234}XYZ
  954. A\x{1234}XYZ
  955. /^\P{Any}*X/utf
  956. XYZ
  957. \= Expect no match
  958. AXYZ
  959. \x{1234}XYZ
  960. A\x{1234}XYZ
  961. /^[\p{Any}]X/utf
  962. AXYZ
  963. \x{1234}XYZ
  964. \= Expect no match
  965. X
  966. /^[\P{Any}]X/utf
  967. \= Expect no match
  968. AX
  969. /^[\p{Any}]?X/utf
  970. XYZ
  971. AXYZ
  972. \x{1234}XYZ
  973. \= Expect no match
  974. ABXYZ
  975. /^[\P{Any}]?X/utf
  976. XYZ
  977. \= Expect no match
  978. AXYZ
  979. \x{1234}XYZ
  980. ABXYZ
  981. /^[\p{Any}]+X/utf
  982. AXYZ
  983. \x{1234}XYZ
  984. A\x{1234}XYZ
  985. \= Expect no match
  986. XYZ
  987. /^[\P{Any}]+X/utf
  988. \= Expect no match
  989. AXYZ
  990. \x{1234}XYZ
  991. A\x{1234}XYZ
  992. XYZ
  993. /^[\p{Any}]*X/utf
  994. XYZ
  995. AXYZ
  996. \x{1234}XYZ
  997. A\x{1234}XYZ
  998. /^[\P{Any}]*X/utf
  999. XYZ
  1000. \= Expect no match
  1001. AXYZ
  1002. \x{1234}XYZ
  1003. A\x{1234}XYZ
  1004. /^\p{Any}{3,5}?/utf
  1005. abcdefgh
  1006. \x{1234}\n\r\x{3456}xyz
  1007. /^\p{Any}{3,5}/utf
  1008. abcdefgh
  1009. \x{1234}\n\r\x{3456}xyz
  1010. /^\P{Any}{3,5}?/utf
  1011. \= Expect no match
  1012. abcdefgh
  1013. \x{1234}\n\r\x{3456}xyz
  1014. /^\p{L&}X/utf
  1015. AXY
  1016. aXY
  1017. \x{1c5}XY
  1018. \= Expect no match
  1019. \x{1bb}XY
  1020. \x{2b0}XY
  1021. !XY
  1022. /^[\p{L&}]X/utf
  1023. AXY
  1024. aXY
  1025. \x{1c5}XY
  1026. \= Expect no match
  1027. \x{1bb}XY
  1028. \x{2b0}XY
  1029. !XY
  1030. /^\p{L&}+X/utf
  1031. AXY
  1032. aXY
  1033. AbcdeXyz
  1034. \x{1c5}AbXY
  1035. abcDEXypqreXlmn
  1036. \= Expect no match
  1037. \x{1bb}XY
  1038. \x{2b0}XY
  1039. !XY
  1040. /^[\p{L&}]+X/utf
  1041. AXY
  1042. aXY
  1043. AbcdeXyz
  1044. \x{1c5}AbXY
  1045. abcDEXypqreXlmn
  1046. \= Expect no match
  1047. \x{1bb}XY
  1048. \x{2b0}XY
  1049. !XY
  1050. /^\p{L&}+?X/utf
  1051. AXY
  1052. aXY
  1053. AbcdeXyz
  1054. \x{1c5}AbXY
  1055. abcDEXypqreXlmn
  1056. \= Expect no match
  1057. \x{1bb}XY
  1058. \x{2b0}XY
  1059. !XY
  1060. /^[\p{L&}]+?X/utf
  1061. AXY
  1062. aXY
  1063. AbcdeXyz
  1064. \x{1c5}AbXY
  1065. abcDEXypqreXlmn
  1066. \= Expect no match
  1067. \x{1bb}XY
  1068. \x{2b0}XY
  1069. !XY
  1070. /^\P{L&}X/utf
  1071. !XY
  1072. \x{1bb}XY
  1073. \x{2b0}XY
  1074. \= Expect no match
  1075. \x{1c5}XY
  1076. AXY
  1077. /^[\P{L&}]X/utf
  1078. !XY
  1079. \x{1bb}XY
  1080. \x{2b0}XY
  1081. \= Expect no match
  1082. \x{1c5}XY
  1083. AXY
  1084. /^(\p{Z}[^\p{C}\p{Z}]+)*$/
  1085. \xa0!
  1086. /^[\pL](abc)(?1)/
  1087. AabcabcYZ
  1088. /([\pL]=(abc))*X/
  1089. L=abcX
  1090. /^\p{Balinese}\p{Cuneiform}\p{Nko}\p{Phags_Pa}\p{Phoenician}/utf
  1091. \x{1b00}\x{12000}\x{7c0}\x{a840}\x{10900}
  1092. # Check property support in non-UTF mode
  1093. /\p{L}{4}/
  1094. 123abcdefg
  1095. 123abc\xc4\xc5zz
  1096. /\X{1,3}\d/
  1097. \= Expect no match
  1098. \x8aBCD
  1099. /\X?\d/
  1100. \= Expect no match
  1101. \x8aBCD
  1102. /\P{L}?\d/
  1103. \= Expect no match
  1104. \x8aBCD
  1105. /[\PPP\x8a]{1,}\x80/
  1106. A\x80
  1107. /^[\p{Arabic}]/utf
  1108. \x{604}
  1109. \x{60e}
  1110. \x{656}
  1111. \x{657}
  1112. \x{658}
  1113. \x{659}
  1114. \x{65a}
  1115. \x{65b}
  1116. \x{65c}
  1117. \x{65d}
  1118. \x{65e}
  1119. \x{65f}
  1120. \x{66a}
  1121. \x{6e9}
  1122. \x{6ef}
  1123. \x{6fa}
  1124. /^\p{Cyrillic}/utf
  1125. \x{1d2b}
  1126. /^\p{Common}/utf
  1127. \x{2116}
  1128. \x{1D183}
  1129. /^\p{Inherited}/utf
  1130. \x{200c}
  1131. \= Expect no match
  1132. \x{64a}
  1133. \x{656}
  1134. /^\p{Shavian}/utf
  1135. \x{10450}
  1136. \x{1047f}
  1137. /^\p{Deseret}/utf
  1138. \x{10400}
  1139. \x{1044f}
  1140. /^\p{Osmanya}/utf
  1141. \x{10480}
  1142. \x{1049d}
  1143. \x{104a0}
  1144. \x{104a9}
  1145. \= Expect no match
  1146. \x{1049e}
  1147. \x{1049f}
  1148. \x{104aa}
  1149. /\p{katakana}/utf
  1150. \x{30a1}
  1151. \x{3001}
  1152. /\p{scx:katakana}/utf
  1153. \x{30a1}
  1154. \x{3001}
  1155. /\p{script extensions:katakana}/utf
  1156. \x{30a1}
  1157. \x{3001}
  1158. /\p{sc:katakana}/utf
  1159. \x{30a1}
  1160. \= Expect no match
  1161. \x{3001}
  1162. /\p{script:katakana}/utf
  1163. \x{30a1}
  1164. \= Expect no match
  1165. \x{3001}
  1166. /\p{sc:katakana}{3,}/utf
  1167. \x{30a1}\x{30fa}\x{32d0}\x{1b122}\x{ff66}\x{3001}ABC
  1168. /\p{sc:katakana}{3,}?/utf
  1169. \x{30a1}\x{30fa}\x{32d0}\x{1b122}\x{ff66}\x{3001}ABC
  1170. /\p{Carian}\p{Cham}\p{Kayah_Li}\p{Lepcha}\p{Lycian}\p{Lydian}\p{Ol_Chiki}\p{Rejang}\p{Saurashtra}\p{Sundanese}\p{Vai}/utf
  1171. \x{102A4}\x{AA52}\x{A91D}\x{1C46}\x{10283}\x{1092E}\x{1C6B}\x{A93B}\x{A8BF}\x{1BA0}\x{A50A}====
  1172. /\x{a77d}\x{1d79}/i,utf
  1173. \x{a77d}\x{1d79}
  1174. \x{1d79}\x{a77d}
  1175. /\x{a77d}\x{1d79}/utf
  1176. \x{a77d}\x{1d79}
  1177. \= Expect no match
  1178. \x{1d79}\x{a77d}
  1179. /(A)\1/i,utf
  1180. AA
  1181. Aa
  1182. aa
  1183. aA
  1184. /(\x{10a})\1/i,utf
  1185. \x{10a}\x{10a}
  1186. \x{10a}\x{10b}
  1187. \x{10b}\x{10b}
  1188. \x{10b}\x{10a}
  1189. # The next two tests are for property support in non-UTF mode
  1190. /(?:\p{Lu}|\x20)+/
  1191. \x41\x20\x50\xC2\x54\xC9\x20\x54\x4F\x44\x41\x59
  1192. /[\p{Lu}\x20]+/
  1193. \x41\x20\x50\xC2\x54\xC9\x20\x54\x4F\x44\x41\x59
  1194. /\p{Avestan}\p{Bamum}\p{Egyptian_Hieroglyphs}\p{Imperial_Aramaic}\p{Inscriptional_Pahlavi}\p{Inscriptional_Parthian}\p{Javanese}\p{Kaithi}\p{Lisu}\p{Meetei_Mayek}\p{Old_South_Arabian}\p{Old_Turkic}\p{Samaritan}\p{Tai_Tham}\p{Tai_Viet}/utf
  1195. \x{10b00}\x{a6ef}\x{13007}\x{10857}\x{10b78}\x{10b58}\x{a980}\x{110c1}\x{a4ff}\x{abc0}\x{10a7d}\x{10c48}\x{0800}\x{1aad}\x{aac0}
  1196. /^\w+/utf,ucp
  1197. Az_\x{aa}\x{c0}\x{1c5}\x{2b0}\x{3b6}\x{1d7c9}\x{2fa1d}1\x{660}\x{bef}\x{16ee}
  1198. /^[[:xdigit:]]*/utf,ucp
  1199. 1a\x{660}\x{bef}\x{16ee}
  1200. /^\d+/utf,ucp
  1201. 1\x{660}\x{bef}\x{16ee}
  1202. /^[[:digit:]]+/utf,ucp
  1203. 1\x{660}\x{bef}\x{16ee}
  1204. /^>\s+/utf,ucp
  1205. >\x{20}\x{a0}\x{1680}\x{2028}\x{2029}\x{202f}\x{9}\x{b}
  1206. /^>\pZ+/utf,ucp
  1207. >\x{20}\x{a0}\x{1680}\x{2028}\x{2029}\x{202f}\x{9}\x{b}
  1208. /^>[[:space:]]*/utf,ucp
  1209. >\x{20}\x{a0}\x{1680}\x{2028}\x{2029}\x{202f}\x{9}\x{b}
  1210. /^>[[:blank:]]*/utf,ucp
  1211. >\x{20}\x{a0}\x{1680}\x{2000}\x{202f}\x{9}\x{b}\x{2028}
  1212. /^[[:alpha:]]*/utf,ucp
  1213. Az\x{aa}\x{c0}\x{1c5}\x{2b0}\x{3b6}\x{1d7c9}\x{2fa1d}
  1214. /^[[:alnum:]]*/utf,ucp
  1215. Az\x{aa}\x{c0}\x{1c5}\x{2b0}\x{3b6}\x{1d7c9}\x{2fa1d}1\x{660}\x{bef}\x{16ee}
  1216. /^[[:cntrl:]]*/utf,ucp
  1217. \x{0}\x{09}\x{1f}\x{7f}\x{9f}
  1218. /^[[:graph:]]*/utf,ucp
  1219. A\x{a1}\x{a0}
  1220. /^[[:print:]]*/utf,ucp
  1221. A z\x{a0}\x{a1}
  1222. /^[[:punct:]]*/utf,ucp
  1223. .+\x{a1}\x{a0}
  1224. /\p{Zs}*?\R/
  1225. \= Expect no match
  1226. a\xFCb
  1227. /\p{Zs}*\R/
  1228. \= Expect no match
  1229. a\xFCb
  1230. /ⱥ/i,utf
  1231. Ⱥx
  1232. Ⱥ
  1233. /[ⱥ]/i,utf
  1234. Ⱥx
  1235. Ⱥ
  1236. /Ⱥ/i,utf
  1237. Ⱥ
  1238. # These are tests for extended grapheme clusters
  1239. /^\X/utf,aftertext
  1240. G\x{34e}\x{34e}X
  1241. \x{34e}\x{34e}X
  1242. \x04X
  1243. \x{1100}X
  1244. \x{1100}\x{34e}X
  1245. \x{1b04}\x{1b04}X
  1246. *These match up to the roman letters
  1247. \x{1111}\x{1111}L,L
  1248. \x{1111}\x{1111}\x{1169}L,L,V
  1249. \x{1111}\x{ae4c}L, LV
  1250. \x{1111}\x{ad89}L, LVT
  1251. \x{1111}\x{ae4c}\x{1169}L, LV, V
  1252. \x{1111}\x{ae4c}\x{1169}\x{1169}L, LV, V, V
  1253. \x{1111}\x{ae4c}\x{1169}\x{11fe}L, LV, V, T
  1254. \x{1111}\x{ad89}\x{11fe}L, LVT, T
  1255. \x{1111}\x{ad89}\x{11fe}\x{11fe}L, LVT, T, T
  1256. \x{ad89}\x{11fe}\x{11fe}LVT, T, T
  1257. *These match just the first codepoint (invalid sequence)
  1258. \x{1111}\x{11fe}L, T
  1259. \x{ae4c}\x{1111}LV, L
  1260. \x{ae4c}\x{ae4c}LV, LV
  1261. \x{ae4c}\x{ad89}LV, LVT
  1262. \x{1169}\x{1111}V, L
  1263. \x{1169}\x{ae4c}V, LV
  1264. \x{1169}\x{ad89}V, LVT
  1265. \x{ad89}\x{1111}LVT, L
  1266. \x{ad89}\x{1169}LVT, V
  1267. \x{ad89}\x{ae4c}LVT, LV
  1268. \x{ad89}\x{ad89}LVT, LVT
  1269. \x{11fe}\x{1111}T, L
  1270. \x{11fe}\x{1169}T, V
  1271. \x{11fe}\x{ae4c}T, LV
  1272. \x{11fe}\x{ad89}T, LVT
  1273. *Test extend and spacing mark
  1274. \x{1111}\x{ae4c}\x{0711}L, LV, extend
  1275. \x{1111}\x{ae4c}\x{1b04}L, LV, spacing mark
  1276. \x{1111}\x{ae4c}\x{1b04}\x{0711}\x{1b04}L, LV, spacing mark, extend, spacing mark
  1277. *Test CR, LF, and control
  1278. \x0d\x{0711}CR, extend
  1279. \x0d\x{1b04}CR, spacingmark
  1280. \x0a\x{0711}LF, extend
  1281. \x0a\x{1b04}LF, spacingmark
  1282. \x0b\x{0711}Control, extend
  1283. \x09\x{1b04}Control, spacingmark
  1284. *There are no Prepend characters, so we can't test Prepend, CR
  1285. /^(?>\X{2})X/utf,aftertext
  1286. \x{1111}\x{ae4c}\x{1111}\x{ae4c}X
  1287. /^\X{2,4}X/utf,aftertext
  1288. \x{1111}\x{ae4c}\x{1111}\x{ae4c}X
  1289. \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X
  1290. \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X
  1291. /^\X{2,4}?X/utf,aftertext
  1292. \x{1111}\x{ae4c}\x{1111}\x{ae4c}X
  1293. \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X
  1294. \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X
  1295. /\X*Z/utf,no_start_optimize
  1296. \= Expect no match
  1297. A\x{300}
  1298. /\X*(.)/utf,no_start_optimize
  1299. A\x{1111}\x{ae4c}\x{1169}
  1300. # --------------------------------------------
  1301. /\x{1e9e}+/i,utf
  1302. \x{1e9e}\x{00df}
  1303. /[z\x{1e9e}]+/i,utf
  1304. \x{1e9e}\x{00df}
  1305. /\x{00df}+/i,utf
  1306. \x{1e9e}\x{00df}
  1307. /[z\x{00df}]+/i,utf
  1308. \x{1e9e}\x{00df}
  1309. /\x{1f88}+/i,utf
  1310. \x{1f88}\x{1f80}
  1311. /[z\x{1f88}]+/i,utf
  1312. \x{1f88}\x{1f80}
  1313. # Check a reference with more than one other case
  1314. /^(\x{00b5})\1{2}$/i,utf
  1315. \x{00b5}\x{039c}\x{03bc}
  1316. # Characters with more than one other case; test in classes
  1317. /[z\x{00b5}]+/i,utf
  1318. \x{00b5}\x{039c}\x{03bc}
  1319. /[z\x{039c}]+/i,utf
  1320. \x{00b5}\x{039c}\x{03bc}
  1321. /[z\x{03bc}]+/i,utf
  1322. \x{00b5}\x{039c}\x{03bc}
  1323. /[z\x{00c5}]+/i,utf
  1324. \x{00c5}\x{00e5}\x{212b}
  1325. /[z\x{00e5}]+/i,utf
  1326. \x{00c5}\x{00e5}\x{212b}
  1327. /[z\x{212b}]+/i,utf
  1328. \x{00c5}\x{00e5}\x{212b}
  1329. /[z\x{01c4}]+/i,utf
  1330. \x{01c4}\x{01c5}\x{01c6}
  1331. /[z\x{01c5}]+/i,utf
  1332. \x{01c4}\x{01c5}\x{01c6}
  1333. /[z\x{01c6}]+/i,utf
  1334. \x{01c4}\x{01c5}\x{01c6}
  1335. /[z\x{01c7}]+/i,utf
  1336. \x{01c7}\x{01c8}\x{01c9}
  1337. /[z\x{01c8}]+/i,utf
  1338. \x{01c7}\x{01c8}\x{01c9}
  1339. /[z\x{01c9}]+/i,utf
  1340. \x{01c7}\x{01c8}\x{01c9}
  1341. /[z\x{01ca}]+/i,utf
  1342. \x{01ca}\x{01cb}\x{01cc}
  1343. /[z\x{01cb}]+/i,utf
  1344. \x{01ca}\x{01cb}\x{01cc}
  1345. /[z\x{01cc}]+/i,utf
  1346. \x{01ca}\x{01cb}\x{01cc}
  1347. /[z\x{01f1}]+/i,utf
  1348. \x{01f1}\x{01f2}\x{01f3}
  1349. /[z\x{01f2}]+/i,utf
  1350. \x{01f1}\x{01f2}\x{01f3}
  1351. /[z\x{01f3}]+/i,utf
  1352. \x{01f1}\x{01f2}\x{01f3}
  1353. /[z\x{0345}]+/i,utf
  1354. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1355. /[z\x{0399}]+/i,utf
  1356. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1357. /[z\x{03b9}]+/i,utf
  1358. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1359. /[z\x{1fbe}]+/i,utf
  1360. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1361. /[z\x{0392}]+/i,utf
  1362. \x{0392}\x{03b2}\x{03d0}
  1363. /[z\x{03b2}]+/i,utf
  1364. \x{0392}\x{03b2}\x{03d0}
  1365. /[z\x{03d0}]+/i,utf
  1366. \x{0392}\x{03b2}\x{03d0}
  1367. /[z\x{0395}]+/i,utf
  1368. \x{0395}\x{03b5}\x{03f5}
  1369. /[z\x{03b5}]+/i,utf
  1370. \x{0395}\x{03b5}\x{03f5}
  1371. /[z\x{03f5}]+/i,utf
  1372. \x{0395}\x{03b5}\x{03f5}
  1373. /[z\x{0398}]+/i,utf
  1374. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1375. /[z\x{03b8}]+/i,utf
  1376. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1377. /[z\x{03d1}]+/i,utf
  1378. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1379. /[z\x{03f4}]+/i,utf
  1380. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1381. /[z\x{039a}]+/i,utf
  1382. \x{039a}\x{03ba}\x{03f0}
  1383. /[z\x{03ba}]+/i,utf
  1384. \x{039a}\x{03ba}\x{03f0}
  1385. /[z\x{03f0}]+/i,utf
  1386. \x{039a}\x{03ba}\x{03f0}
  1387. /[z\x{03a0}]+/i,utf
  1388. \x{03a0}\x{03c0}\x{03d6}
  1389. /[z\x{03c0}]+/i,utf
  1390. \x{03a0}\x{03c0}\x{03d6}
  1391. /[z\x{03d6}]+/i,utf
  1392. \x{03a0}\x{03c0}\x{03d6}
  1393. /[z\x{03a1}]+/i,utf
  1394. \x{03a1}\x{03c1}\x{03f1}
  1395. /[z\x{03c1}]+/i,utf
  1396. \x{03a1}\x{03c1}\x{03f1}
  1397. /[z\x{03f1}]+/i,utf
  1398. \x{03a1}\x{03c1}\x{03f1}
  1399. /[z\x{03a3}]+/i,utf
  1400. \x{03A3}\x{03C2}\x{03C3}
  1401. /[z\x{03c2}]+/i,utf
  1402. \x{03A3}\x{03C2}\x{03C3}
  1403. /[z\x{03c3}]+/i,utf
  1404. \x{03A3}\x{03C2}\x{03C3}
  1405. /[z\x{03a6}]+/i,utf
  1406. \x{03a6}\x{03c6}\x{03d5}
  1407. /[z\x{03c6}]+/i,utf
  1408. \x{03a6}\x{03c6}\x{03d5}
  1409. /[z\x{03d5}]+/i,utf
  1410. \x{03a6}\x{03c6}\x{03d5}
  1411. /[z\x{03c9}]+/i,utf
  1412. \x{03c9}\x{03a9}\x{2126}
  1413. /[z\x{03a9}]+/i,utf
  1414. \x{03c9}\x{03a9}\x{2126}
  1415. /[z\x{2126}]+/i,utf
  1416. \x{03c9}\x{03a9}\x{2126}
  1417. /[z\x{1e60}]+/i,utf
  1418. \x{1e60}\x{1e61}\x{1e9b}
  1419. /[z\x{1e61}]+/i,utf
  1420. \x{1e60}\x{1e61}\x{1e9b}
  1421. /[z\x{1e9b}]+/i,utf
  1422. \x{1e60}\x{1e61}\x{1e9b}
  1423. # Perl 5.12.4 gets these wrong, but 5.15.3 is OK
  1424. /[z\x{004b}]+/i,utf
  1425. \x{004b}\x{006b}\x{212a}
  1426. /[z\x{006b}]+/i,utf
  1427. \x{004b}\x{006b}\x{212a}
  1428. /[z\x{212a}]+/i,utf
  1429. \x{004b}\x{006b}\x{212a}
  1430. /[z\x{0053}]+/i,utf
  1431. \x{0053}\x{0073}\x{017f}
  1432. /[z\x{0073}]+/i,utf
  1433. \x{0053}\x{0073}\x{017f}
  1434. /[z\x{017f}]+/i,utf
  1435. \x{0053}\x{0073}\x{017f}
  1436. # --------------------------------------
  1437. /(ΣΆΜΟΣ) \1/i,utf
  1438. ΣΆΜΟΣ ΣΆΜΟΣ
  1439. ΣΆΜΟΣ σάμος
  1440. σάμος σάμος
  1441. σάμος σάμοσ
  1442. σάμος ΣΆΜΟΣ
  1443. /(σάμος) \1/i,utf
  1444. ΣΆΜΟΣ ΣΆΜΟΣ
  1445. ΣΆΜΟΣ σάμος
  1446. σάμος σάμος
  1447. σάμος σάμοσ
  1448. σάμος ΣΆΜΟΣ
  1449. /(ΣΆΜΟΣ) \1*/i,utf
  1450. ΣΆΜΟΣ\x20
  1451. ΣΆΜΟΣ ΣΆΜΟΣσάμοςσάμος
  1452. # Perl matches these
  1453. /\x{00b5}+/i,utf
  1454. \x{00b5}\x{039c}\x{03bc}
  1455. /\x{039c}+/i,utf
  1456. \x{00b5}\x{039c}\x{03bc}
  1457. /\x{03bc}+/i,utf
  1458. \x{00b5}\x{039c}\x{03bc}
  1459. /\x{00c5}+/i,utf
  1460. \x{00c5}\x{00e5}\x{212b}
  1461. /\x{00e5}+/i,utf
  1462. \x{00c5}\x{00e5}\x{212b}
  1463. /\x{212b}+/i,utf
  1464. \x{00c5}\x{00e5}\x{212b}
  1465. /\x{01c4}+/i,utf
  1466. \x{01c4}\x{01c5}\x{01c6}
  1467. /\x{01c5}+/i,utf
  1468. \x{01c4}\x{01c5}\x{01c6}
  1469. /\x{01c6}+/i,utf
  1470. \x{01c4}\x{01c5}\x{01c6}
  1471. /\x{01c7}+/i,utf
  1472. \x{01c7}\x{01c8}\x{01c9}
  1473. /\x{01c8}+/i,utf
  1474. \x{01c7}\x{01c8}\x{01c9}
  1475. /\x{01c9}+/i,utf
  1476. \x{01c7}\x{01c8}\x{01c9}
  1477. /\x{01ca}+/i,utf
  1478. \x{01ca}\x{01cb}\x{01cc}
  1479. /\x{01cb}+/i,utf
  1480. \x{01ca}\x{01cb}\x{01cc}
  1481. /\x{01cc}+/i,utf
  1482. \x{01ca}\x{01cb}\x{01cc}
  1483. /\x{01f1}+/i,utf
  1484. \x{01f1}\x{01f2}\x{01f3}
  1485. /\x{01f2}+/i,utf
  1486. \x{01f1}\x{01f2}\x{01f3}
  1487. /\x{01f3}+/i,utf
  1488. \x{01f1}\x{01f2}\x{01f3}
  1489. /\x{0345}+/i,utf
  1490. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1491. /\x{0399}+/i,utf
  1492. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1493. /\x{03b9}+/i,utf
  1494. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1495. /\x{1fbe}+/i,utf
  1496. \x{0345}\x{0399}\x{03b9}\x{1fbe}
  1497. /\x{0392}+/i,utf
  1498. \x{0392}\x{03b2}\x{03d0}
  1499. /\x{03b2}+/i,utf
  1500. \x{0392}\x{03b2}\x{03d0}
  1501. /\x{03d0}+/i,utf
  1502. \x{0392}\x{03b2}\x{03d0}
  1503. /\x{0395}+/i,utf
  1504. \x{0395}\x{03b5}\x{03f5}
  1505. /\x{03b5}+/i,utf
  1506. \x{0395}\x{03b5}\x{03f5}
  1507. /\x{03f5}+/i,utf
  1508. \x{0395}\x{03b5}\x{03f5}
  1509. /\x{0398}+/i,utf
  1510. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1511. /\x{03b8}+/i,utf
  1512. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1513. /\x{03d1}+/i,utf
  1514. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1515. /\x{03f4}+/i,utf
  1516. \x{0398}\x{03b8}\x{03d1}\x{03f4}
  1517. /\x{039a}+/i,utf
  1518. \x{039a}\x{03ba}\x{03f0}
  1519. /\x{03ba}+/i,utf
  1520. \x{039a}\x{03ba}\x{03f0}
  1521. /\x{03f0}+/i,utf
  1522. \x{039a}\x{03ba}\x{03f0}
  1523. /\x{03a0}+/i,utf
  1524. \x{03a0}\x{03c0}\x{03d6}
  1525. /\x{03c0}+/i,utf
  1526. \x{03a0}\x{03c0}\x{03d6}
  1527. /\x{03d6}+/i,utf
  1528. \x{03a0}\x{03c0}\x{03d6}
  1529. /\x{03a1}+/i,utf
  1530. \x{03a1}\x{03c1}\x{03f1}
  1531. /\x{03c1}+/i,utf
  1532. \x{03a1}\x{03c1}\x{03f1}
  1533. /\x{03f1}+/i,utf
  1534. \x{03a1}\x{03c1}\x{03f1}
  1535. /\x{03a3}+/i,utf
  1536. \x{03A3}\x{03C2}\x{03C3}
  1537. /\x{03c2}+/i,utf
  1538. \x{03A3}\x{03C2}\x{03C3}
  1539. /\x{03c3}+/i,utf
  1540. \x{03A3}\x{03C2}\x{03C3}
  1541. /\x{03a6}+/i,utf
  1542. \x{03a6}\x{03c6}\x{03d5}
  1543. /\x{03c6}+/i,utf
  1544. \x{03a6}\x{03c6}\x{03d5}
  1545. /\x{03d5}+/i,utf
  1546. \x{03a6}\x{03c6}\x{03d5}
  1547. /\x{03c9}+/i,utf
  1548. \x{03c9}\x{03a9}\x{2126}
  1549. /\x{03a9}+/i,utf
  1550. \x{03c9}\x{03a9}\x{2126}
  1551. /\x{2126}+/i,utf
  1552. \x{03c9}\x{03a9}\x{2126}
  1553. /\x{1e60}+/i,utf
  1554. \x{1e60}\x{1e61}\x{1e9b}
  1555. /\x{1e61}+/i,utf
  1556. \x{1e60}\x{1e61}\x{1e9b}
  1557. /\x{1e9b}+/i,utf
  1558. \x{1e60}\x{1e61}\x{1e9b}
  1559. /\x{1e9e}+/i,utf
  1560. \x{1e9e}\x{00df}
  1561. /\x{00df}+/i,utf
  1562. \x{1e9e}\x{00df}
  1563. /\x{1f88}+/i,utf
  1564. \x{1f88}\x{1f80}
  1565. /\x{1f80}+/i,utf
  1566. \x{1f88}\x{1f80}
  1567. # Perl 5.12.4 gets these wrong, but 5.15.3 is OK
  1568. /\x{004b}+/i,utf
  1569. \x{004b}\x{006b}\x{212a}
  1570. /\x{006b}+/i,utf
  1571. \x{004b}\x{006b}\x{212a}
  1572. /\x{212a}+/i,utf
  1573. \x{004b}\x{006b}\x{212a}
  1574. /\x{0053}+/i,utf
  1575. \x{0053}\x{0073}\x{017f}
  1576. /\x{0073}+/i,utf
  1577. \x{0053}\x{0073}\x{017f}
  1578. /\x{017f}+/i,utf
  1579. \x{0053}\x{0073}\x{017f}
  1580. /^\p{Any}*\d{4}/utf
  1581. 1234
  1582. \= Expect no match
  1583. 123
  1584. /^\X*\w{4}/utf
  1585. 1234
  1586. \= Expect no match
  1587. 123
  1588. /^A\s+Z/utf,ucp
  1589. A\x{2005}Z
  1590. A\x{85}\x{2005}Z
  1591. /^A[\s]+Z/utf,ucp
  1592. A\x{2005}Z
  1593. A\x{85}\x{2005}Z
  1594. /^[[:graph:]]+$/utf,ucp
  1595. Letter:ABC
  1596. Mark:\x{300}\x{1d172}\x{1d17b}
  1597. Number:9\x{660}
  1598. Punctuation:\x{66a},;
  1599. Symbol:\x{6de}<>\x{fffc}
  1600. Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f}
  1601. \x{200b}\x{200c}\x{200d}\x{200e}\x{200f}
  1602. \x{202a}\x{202b}\x{202c}\x{202d}\x{202e}
  1603. \x{2060}\x{2061}\x{2062}\x{2063}\x{2064}
  1604. \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f}
  1605. \x{feff}
  1606. \x{fff9}\x{fffa}\x{fffb}
  1607. \x{110bd}
  1608. \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a}
  1609. \x{e0001}
  1610. \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f}
  1611. \= Expect no match
  1612. \x{09}
  1613. \x{0a}
  1614. \x{1D}
  1615. \x{20}
  1616. \x{85}
  1617. \x{a0}
  1618. \x{1680}
  1619. \x{2028}
  1620. \x{2029}
  1621. \x{202f}
  1622. \x{2065}
  1623. \x{3000}
  1624. \x{e0002}
  1625. \x{e001f}
  1626. \x{e0080}
  1627. /^[[:print:]]+$/utf,ucp
  1628. Space: \x{a0}
  1629. \x{1680}\x{2000}\x{2001}\x{2002}\x{2003}\x{2004}\x{2005}
  1630. \x{2006}\x{2007}\x{2008}\x{2009}\x{200a}
  1631. \x{202f}\x{205f}
  1632. \x{3000}
  1633. Letter:ABC
  1634. Mark:\x{300}\x{1d172}\x{1d17b}
  1635. Number:9\x{660}
  1636. Punctuation:\x{66a},;
  1637. Symbol:\x{6de}<>\x{fffc}
  1638. Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f}
  1639. \x{200b}\x{200c}\x{200d}\x{200e}\x{200f}
  1640. \x{202a}\x{202b}\x{202c}\x{202d}\x{202e}
  1641. \x{202f}
  1642. \x{2060}\x{2061}\x{2062}\x{2063}\x{2064}
  1643. \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f}
  1644. \x{feff}
  1645. \x{fff9}\x{fffa}\x{fffb}
  1646. \x{110bd}
  1647. \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a}
  1648. \x{e0001}
  1649. \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f}
  1650. \= Expect no match
  1651. \x{09}
  1652. \x{1D}
  1653. \x{85}
  1654. \x{2028}
  1655. \x{2029}
  1656. \x{2065}
  1657. \x{e0002}
  1658. \x{e001f}
  1659. \x{e0080}
  1660. /^[[:punct:]]+$/utf,ucp
  1661. \$+<=>^`|~
  1662. !\"#%&'()*,-./:;?@[\\]_{}
  1663. \x{a1}\x{a7}
  1664. \x{37e}
  1665. \= Expect no match
  1666. abcde
  1667. /^[[:^graph:]]+$/utf,ucp
  1668. \x{09}\x{0a}\x{1D}\x{20}\x{85}\x{a0}\x{1680}
  1669. \x{2028}\x{2029}\x{202f}\x{2065}
  1670. \x{3000}\x{e0002}\x{e001f}\x{e0080}
  1671. \= Expect no match
  1672. Letter:ABC
  1673. Mark:\x{300}\x{1d172}\x{1d17b}
  1674. Number:9\x{660}
  1675. Punctuation:\x{66a},;
  1676. Symbol:\x{6de}<>\x{fffc}
  1677. Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f}
  1678. \x{200b}\x{200c}\x{200d}\x{200e}\x{200f}
  1679. \x{202a}\x{202b}\x{202c}\x{202d}\x{202e}
  1680. \x{2060}\x{2061}\x{2062}\x{2063}\x{2064}
  1681. \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f}
  1682. \x{feff}
  1683. \x{fff9}\x{fffa}\x{fffb}
  1684. \x{110bd}
  1685. \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a}
  1686. \x{e0001}
  1687. \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f}
  1688. /^[[:^print:]]+$/utf,ucp
  1689. \x{09}\x{1D}\x{85}\x{2028}\x{2029}\x{2065}
  1690. \x{e0002}\x{e001f}\x{e0080}
  1691. \= Expect no match
  1692. Space: \x{a0}
  1693. \x{1680}\x{2000}\x{2001}\x{2002}\x{2003}\x{2004}\x{2005}
  1694. \x{2006}\x{2007}\x{2008}\x{2009}\x{200a}
  1695. \x{202f}\x{205f}
  1696. \x{3000}
  1697. Letter:ABC
  1698. Mark:\x{300}\x{1d172}\x{1d17b}
  1699. Number:9\x{660}
  1700. Punctuation:\x{66a},;
  1701. Symbol:\x{6de}<>\x{fffc}
  1702. Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f}
  1703. \x{200b}\x{200c}\x{200d}\x{200e}\x{200f}
  1704. \x{202a}\x{202b}\x{202c}\x{202d}\x{202e}
  1705. \x{202f}
  1706. \x{2060}\x{2061}\x{2062}\x{2063}\x{2064}
  1707. \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f}
  1708. \x{feff}
  1709. \x{fff9}\x{fffa}\x{fffb}
  1710. \x{110bd}
  1711. \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a}
  1712. \x{e0001}
  1713. \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f}
  1714. /^[[:^punct:]]+$/utf,ucp
  1715. abcde
  1716. \= Expect no match
  1717. \$+<=>^`|~
  1718. !\"#%&'()*,-./:;?@[\\]_{}
  1719. \x{a1}\x{a7}
  1720. \x{37e}
  1721. /[RST]+/i,utf,ucp
  1722. Ss\x{17f}
  1723. /[R-T]+/i,utf,ucp
  1724. Ss\x{17f}
  1725. /[q-u]+/i,utf,ucp
  1726. Ss\x{17f}
  1727. /^s?c/im,utf
  1728. scat
  1729. # The next four tests are for repeated caseless back references when the
  1730. # code unit length of the matched text is different to that of the original
  1731. # group in the UTF-8 case.
  1732. /^(\x{23a})\1*(.)/i,utf
  1733. \x{23a}\x{23a}\x{23a}\x{23a}
  1734. \x{23a}\x{2c65}\x{2c65}\x{2c65}
  1735. \x{23a}\x{23a}\x{2c65}\x{23a}
  1736. /^(\x{23a})\1*(..)/i,utf
  1737. \x{23a}\x{2c65}\x{2c65}\x{2c65}
  1738. \x{23a}\x{23a}\x{2c65}\x{23a}
  1739. /^(\x{23a})\1*(...)/i,utf
  1740. \x{23a}\x{2c65}\x{2c65}\x{2c65}
  1741. \x{23a}\x{23a}\x{2c65}\x{23a}
  1742. /^(\x{23a})\1*(....)/i,utf
  1743. \= Expect no match
  1744. \x{23a}\x{2c65}\x{2c65}\x{2c65}
  1745. \x{23a}\x{23a}\x{2c65}\x{23a}
  1746. /[A-`]/i,utf
  1747. abcdefghijklmno
  1748. /[\S\V\H]/utf
  1749. /[^\p{Any}]*+x/utf
  1750. x
  1751. /[[:punct:]]/utf,ucp
  1752. \x{b4}
  1753. /[[:^ascii:]]/utf,ucp
  1754. \x{100}
  1755. \x{200}
  1756. \x{300}
  1757. \x{37e}
  1758. \= Expect no match
  1759. aa
  1760. 99
  1761. /[[:^ascii:]\w]/utf,ucp
  1762. aa
  1763. 99
  1764. gg
  1765. \x{100}
  1766. \x{200}
  1767. \x{300}
  1768. \x{37e}
  1769. /[\w[:^ascii:]]/utf,ucp
  1770. aa
  1771. 99
  1772. gg
  1773. \x{100}
  1774. \x{200}
  1775. \x{300}
  1776. \x{37e}
  1777. /[^[:ascii:]\W]/utf,ucp
  1778. \x{100}
  1779. \x{200}
  1780. \= Expect no match
  1781. aa
  1782. 99
  1783. gg
  1784. \x{37e}
  1785. /[^[:^ascii:]\d]/utf,ucp
  1786. a
  1787. ~
  1788. \a
  1789. \x{7f}
  1790. \= Expect no match
  1791. 0
  1792. \x{389}
  1793. \x{20ac}
  1794. /(?=.*b)\pL/
  1795. 11bb
  1796. /(?(?=.*b)(?=.*b)\pL|.*c)/
  1797. 11bb
  1798. /^\x{123}+?$/utf,no_auto_possess
  1799. \x{123}\x{123}\x{123}
  1800. /^\x{123}+?$/i,utf,no_auto_possess
  1801. \x{123}\x{122}\x{123}
  1802. \= Expect no match
  1803. \x{123}\x{124}\x{123}
  1804. /\N{U+1234}/utf
  1805. \x{1234}
  1806. /[\N{U+1234}]/utf
  1807. \x{1234}
  1808. # Test the full list of Unicode "Pattern White Space" characters that are to
  1809. # be ignored by /x. The pattern lines below may show up oddly in text editors
  1810. # or when listed to the screen. Note that characters such as U+2002, which are
  1811. # matched as space by \h and \v are *not* "Pattern White Space".
  1812. /A…‎‏

B/x,utf
  1813. AB
  1814. /A B/x,utf
  1815. A\x{2002}B
  1816. \= Expect no match
  1817. AB
  1818. # -------
  1819. /[^\x{100}-\x{ffff}]*[\x80-\xff]/utf
  1820. \x{99}\x{99}\x{99}
  1821. /[^\x{100}-\x{ffff}ABC]*[\x80-\xff]/utf
  1822. \x{99}\x{99}\x{99}
  1823. /[^\x{100}-\x{ffff}]*[\x80-\xff]/i,utf
  1824. \x{99}\x{99}\x{99}
  1825. # Script run tests
  1826. /^(*script_run:.{4})/utf
  1827. abcd Latin x4
  1828. \x{2e80}\x{2fa1d}\x{3041}\x{30a1} Han Han Hiragana Katakana
  1829. \x{3041}\x{30a1}\x{3007}\x{3007} Hiragana Katakana Han Han
  1830. \x{30a1}\x{3041}\x{3007}\x{3007} Katakana Hiragana Han Han
  1831. \x{1100}\x{2e80}\x{2e80}\x{1101} Hangul Han Han Hangul
  1832. \x{2e80}\x{3105}\x{2e80}\x{3105} Han Bopomofo Han Bopomofo
  1833. \x{02ea}\x{2e80}\x{2e80}\x{3105} Bopomofo-Sk Han Han Bopomofo
  1834. \x{3105}\x{2e80}\x{2e80}\x{3105} Bopomofo Han Han Bopomofo
  1835. \x{0300}cd! Inherited Latin Latin Common
  1836. \x{0391}12\x{03a9} Greek Common-digits Greek
  1837. \x{0400}12\x{fe2f} Cyrillic Common-digits Cyrillic
  1838. \x{0531}12\x{fb17} Armenian Common-digits Armenian
  1839. \x{0591}12\x{fb4f} Hebrew Common-digits Hebrew
  1840. \x{0600}12\x{1eef1} Arabic Common-digits Arabic
  1841. \x{0600}\x{0660}\x{0669}\x{1eef1} Arabic Arabic-digits Arabic
  1842. \x{0700}12\x{086a} Syriac Common-digits Syriac
  1843. \x{1200}12\x{ab2e} Ethiopic Common-digits Ethiopic
  1844. \x{1680}12\x{169c} Ogham Common-digits Ogham
  1845. \x{3041}12\x{3041} Hiragana Common-digits Hiragana
  1846. \x{0980}\x{09e6}\x{09e7}\x{0993} Bengali Bengali-digits Bengali
  1847. !cde Common Latin Latin Latin
  1848. A..B Latin Common Common Latin
  1849. 0abc Ascii-digit Latin Latin Latin
  1850. 1\x{0700}\x{0700}\x{0700} Ascii-digit Syriac x 3
  1851. \x{1A80}\x{1A80}\x{1a40}\x{1a41} Tai Tham Hora digits, letters
  1852. \= Expect no match
  1853. a\x{370}bcd Latin Greek Latin Latin
  1854. \x{1100}\x{02ea}\x{02ea}\x{02ea} Hangul Bopomofo x3
  1855. \x{02ea}\x{02ea}\x{02ea}\x{1100} Bopomofo x3 Hangul
  1856. \x{1100}\x{2e80}\x{3041}\x{1101} Hangul Han Hiragana Hangul
  1857. \x{0391}\x{09e6}\x{09e7}\x{03a9} Greek Bengali digits Greek
  1858. \x{0600}7\x{0669}\x{1eef1} Arabic ascii-digit Arabic-digit Arabic
  1859. \x{0600}\x{0669}7\x{1eef1} Arabic Arabic-digit ascii-digit Arabic
  1860. A5\x{ff19}B Latin Common-ascii/notascii-digits Latin
  1861. \x{0300}cd\x{0391} Inherited Latin Latin Greek
  1862. !cd\x{0391} Common Latin Latin Greek
  1863. \x{1A80}\x{1A90}\x{1a40}\x{1a41} Tai Tham Hora digit, Tham digit, letters
  1864. A\x{1d7ce}\x{1d7ff}B Common fancy-common-2-sets-digits Common
  1865. \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana
  1866. /^(*sr:.{4}|..)/utf
  1867. \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana
  1868. /^(*atomic_script_run:.{4}|..)/utf
  1869. \= Expect no match
  1870. \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana
  1871. /^(*asr:.*)/utf
  1872. \= Expect no match
  1873. \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana
  1874. /^(?>(*sr:.*))/utf
  1875. \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana
  1876. /^(*sr:.*)/utf
  1877. \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana
  1878. \x{10fffd}\x{10fffd}\x{10fffd} Private use (Unknown)
  1879. /^(*sr:\x{2e80}*)/utf
  1880. \x{2e80}\x{2e80}\x{3105} Han Han Bopomofo
  1881. /^(*sr:\x{2e80}*)\x{2e80}/utf
  1882. \x{2e80}\x{2e80}\x{3105} Han Han Bopomofo
  1883. /^(*sr:.*)Test/utf
  1884. Test script run on an empty string
  1885. /^(*sr:(.{2})){2}/utf
  1886. \x{0600}7\x{0669}\x{1eef1} Arabic ascii-digit Arabic-digit Arabic
  1887. \x{1A80}\x{1A80}\x{1a40}\x{1a41} Tai Tham Hora digits, letters
  1888. \x{1A80}\x{1a40}\x{1A90}\x{1a41} Tai Tham Hora digit, letter, Tham digit, letter
  1889. \= Expect no match
  1890. \x{1100}\x{2e80}\x{3041}\x{1101} Hangul Han Hiragana Hangul
  1891. /^(*sr:\S*)/utf
  1892. \x{1cf4}\x{20f0}\x{900}\x{11305} [Dev,Gran,Kan] [Dev,Gran,Lat] Dev Gran
  1893. \x{1cf4}\x{20f0}\x{11305}\x{900} [Dev,Gran,Kan] [Dev,Gran,Lat] Gran Dev
  1894. \x{1cf4}\x{20f0}\x{900}ABC [Dev,Gran,Kan] [Dev,Gran,Lat] Dev Lat
  1895. \x{1cf4}\x{20f0}ABC [Dev,Gran,Kan] [Dev,Gran,Lat] Lat
  1896. \x{20f0}ABC [Dev,Gran,Lat] Lat
  1897. XYZ\x{20f0}ABC Lat [Dev,Gran,Lat] Lat
  1898. \x{a36}\x{a33}\x{900} [Dev,...] [Dev,...] Dev
  1899. \x{3001}\x{2e80}\x{3041}\x{30a1} [Bopo, Han, etc] Han Hira Kata
  1900. \x{3001}\x{30a1}\x{2e80}\x{3041} [Bopo, Han, etc] Kata Han Hira
  1901. \x{3001}\x{3105}\x{2e80}\x{1101} [Bopo, Han, etc] Bopomofo Han Hangul
  1902. \x{3105}\x{3001}\x{2e80}\x{1101} Bopomofo [Bopo, Han, etc] Han Hangul
  1903. \x{3031}\x{3041}\x{30a1}\x{2e80} [Hira Kata] Hira Kata Han
  1904. \x{060c}\x{06d4}\x{0600}\x{10d00}\x{0700} [Arab Rohg Syrc Thaa] [Arab Rohg] Arab Rohg Syrc
  1905. \x{060c}\x{06d4}\x{0700}\x{0600}\x{10d00} [Arab Rohg Syrc Thaa] [Arab Rohg] Syrc Arab Rohg
  1906. \x{2e80}\x{3041}\x{3001}\x{3031}\x{2e80} Han Hira [Bopo, Han, etc] [Hira Kata] Han
  1907. /(?<!)(*sr:)/
  1908. /(?<!X(*sr:B)C)/
  1909. /(?<=abc(?=X(*sr:BCY)Z)XBCYZ)./
  1910. abcXBCYZ!
  1911. /(?<=abc(?=X(*sr:BXY)CCC)XBXYCCC)./
  1912. abcXBXYCCC!
  1913. /^(*sr:\S*)/utf
  1914. \x{10d00}\x{10d00}\x{06d4} Rohingya Rohingya Arabic-full-stop
  1915. \x{06d4}\x{10d00}\x{10d00} Arabic-full-stop Rohingya Rohingya
  1916. \x{10d00}\x{10d00}\x{0363} Rohingya Rohingya Inherited-extend-Latin
  1917. \x{0363}\x{10d00}\x{10d00} Inherited-extend-Latin Rohingya Rohingya
  1918. AB\x{0363} Latin Latin Inherited-extend-Latin
  1919. \x{0363}AB Inherited-extend-Latin Latin Latin
  1920. AB\x{1cf7} Latin Latin Common-extended-Beng
  1921. \x{1cf7}AB Common-extend-Beng Latin Latin
  1922. \x{1cf7}\x{0993} Common-extend-Beng Bengali
  1923. A\x{1abe}BC Test enclosing mark
  1924. \x{0370}\x{1abe}\x{0371} Which can occur with any script (Greek here)
  1925. \x{3001}\x{adf9}\x{3001} [.. Hangul ..] Hangul [.. Hangul ..]
  1926. \x{3400}\x{3001}XXX Han [Han etc.]
  1927. \x{3400}\x{1cd5} Han [Bengali Devanagari]
  1928. \x{ac01}\x{3400} Hangul [.. Hangul ..]
  1929. \x{ac01}\x{1cd5} Hangul [Bengali Devanagari]
  1930. \x{102e0}\x{06d4}\x{1ee4d} [Arabic Coptic] [Arab Rohingya] Arabic
  1931. \x{102e0}\x{06d4}\x{2cc9} [Arabic Coptic] [Arab Rohingya] Coptic
  1932. \x{102e0}\x{06d4}\x{10d30} [Arabic Coptic] [Arab Rohingya] Rohingya
  1933. # Test loop breaking for empty string match
  1934. /^(*sr:A|)*BCD/utf
  1935. AABCD
  1936. ABCD
  1937. BCD
  1938. # The use of (*ACCEPT) breaks script run checking
  1939. /^(*sr:.*(*ACCEPT)ZZ)/utf
  1940. \x{1100}\x{2e80}\x{3041}\x{1101} Hangul Han Hiragana Hangul
  1941. # -------
  1942. # Test group names containing non-ASCII letters and digits
  1943. /(?'ABáC'...)\g{ABáC}/utf
  1944. abcabcdefg
  1945. /(?'XʰABC'...)/utf
  1946. xyzpq
  1947. /(?'XאABC'...)/utf
  1948. 12345
  1949. /(?'XᾈABC'...)/utf
  1950. %^&*(...
  1951. /(?'𐨐ABC'...)/utf
  1952. abcde
  1953. /^(?'אABC'...)(?&אABC)(?P=אABC)/utf
  1954. 123123123456
  1955. /^(?'אABC'...)(?&אABC)/utf
  1956. 123123123456
  1957. /\X*/
  1958. \xF3aaa\xE4\xEA\xEB\xFEa
  1959. /Я/i,utf
  1960. \x{42f}
  1961. \x{44f}
  1962. /(?=Я)/i,utf
  1963. \x{42f}
  1964. \x{44f}
  1965. # -----------------------------------------------------------------------------
  1966. # Tests for bidi control and bidi class properties.
  1967. /\p{ bidi_control }/utf
  1968. -->\x{202c}<--
  1969. /\p{bidicontrol}+/utf
  1970. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1971. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1972. /\p{bidic}+?/utf
  1973. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1974. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1975. /\p{bidi_control}++/utf
  1976. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1977. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1978. /[\p{bidi_c}]/utf
  1979. -->\x{202c}<--
  1980. /[\p{bidicontrol}]+/utf
  1981. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1982. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1983. /[\p{bidicontrol}]+?/utf
  1984. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1985. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1986. /[\p{bidicontrol}]++/utf
  1987. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1988. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1989. /[\p{bidicontrol}<>]+/utf
  1990. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1991. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1992. /\P{bidicontrol}+/g,utf
  1993. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1994. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1995. /\p{^bidicontrol}+/g,utf
  1996. -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<--
  1997. -->\x{2066}\x{2067}\x{2068}\x{2069}<--
  1998. /\p{bidi class = al}/utf
  1999. -->\x{061D}<--
  2000. /\p{bc = al}+/utf
  2001. -->\x{061D}\x{061e}\x{061f}<--
  2002. /\p{bidi_class : AL}+?/utf
  2003. -->\x{061D}\x{061e}\x{061f}<--
  2004. /\p{Bidi_Class : AL}++/utf
  2005. -->\x{061D}\x{061e}\x{061f}<--
  2006. /\p{b_c = aN}+/utf
  2007. -->\x{061D}\x{0602}\x{0604}\x{061f}<--
  2008. /\p{bidi class = B}+/utf
  2009. -->\x{0a}\x{0d}\x{01c}\x{01e}\x{085}\x{2029}<--
  2010. /\p{bidi class:BN}+/utf
  2011. -->\x{0}\x{08}\x{200c}\x{fffe}\x{dfffe}\x{10ffff}<--
  2012. /\p{bidiclass:cs}+/utf
  2013. -->,.\x{060c}\x{ff1a}<--
  2014. /\p{bidiclass:En}+/utf
  2015. -->09\x{b2}\x{2074}\x{1fbf9}<--
  2016. /\p{bidiclass:es}+/utf
  2017. ==>+-\x{207a}\x{ff0d}<==
  2018. /\p{bidiclass:et}+/utf
  2019. -->#\{24}%\x{a2}\x{A838}\x{1e2ff}<--
  2020. /\p{bidiclass:FSI}+/utf
  2021. -->\x{2068}<--
  2022. /\p{bidi class:L}+/utf
  2023. -->ABC<--
  2024. /\P{bidi class:L}+/utf
  2025. -->ABC<--
  2026. /\p{bidi class:LRE}+\p{bidiclass=lri}*\p{bidiclass:lro}/utf
  2027. -->\x{202a}\x{2066}\x{202d}<--
  2028. /\p{bidi class:NSM}+/utf
  2029. -->\x{9bc}\x{a71}\x{e31}<--
  2030. /\p{bidi class:ON}+/utf
  2031. -->\x{21}'()*;@\x{384}\x{2039}<=-
  2032. /\p{bidiclass:pdf}\p{bidiclass:pdi}/utf
  2033. -->\x{202c}\x{2069}<--
  2034. /\p{bidi class:R}+/utf
  2035. -->\x{590}\x{5c6}\x{200f}\x{10805}<--
  2036. /\p{bidi class:RLE}+\p{bidi class:RLI}*\p{bidi class:RLO}+/utf
  2037. -->\x{202b}\x{2067}\x{202e}<--
  2038. /\p{bidi class:S}+\p{bidiclass:WS}+/utf
  2039. -->\x{9}\x{b}\x{1f} \x{c} \x{2000} \x{3000}<--
  2040. # -----------------------------------------------------------------------------
  2041. /[\p{taml}\p{sc:ugar}]+/utf
  2042. \x{0b82}\x{10380}
  2043. /^[\p{sc:Arabic}]/utf
  2044. \= Expect no match
  2045. \x{650}
  2046. \x{651}
  2047. \x{652}
  2048. \x{653}
  2049. \x{654}
  2050. \x{655}
  2051. # -----------------------------------------------------------------------------
  2052. # Tests for newly-added Boolean Properties
  2053. /\p{ahex}\p{asciihexdigit}/utf
  2054. >4F<
  2055. /\p{alpha}\p{alphabetic}/g,utf
  2056. >AB<>\x{148}\x{1234}
  2057. /\p{ascii}\p{ascii}/g,utf
  2058. >AB<>\x{148}\x{1234}
  2059. /\p{Bidi_C}\p{bidicontrol}/g,utf
  2060. >\x{202d}\x{2069}<
  2061. /\p{Bidi_M}\p{bidimirrored}/g,utf
  2062. >\x{202d}\x{2069}<>\x{298b}\x{bb}<
  2063. /\p{cased}\p{cased}/g,utf
  2064. >AN<>\x{149}\x{120}<
  2065. /\p{caseignorable}\p{ci}/g,utf
  2066. >AN<>\x{60}\x{859}<
  2067. /\p{changeswhencasefolded}\p{cwcf}/g,utf
  2068. >AN<>\x{149}\x{120}<
  2069. /\p{changeswhencasemapped}\p{cwcm}/g,utf
  2070. >AN<>\x{149}\x{120}<
  2071. /\p{changeswhenlowercased}\p{cwl}/g,utf
  2072. >AN<>\x{149}\x{120}<>yz<
  2073. /\p{changeswhenuppercased}\p{cwu}/g,utf
  2074. >AN<>\x{149}\x{120}<>yz<
  2075. /\p{changeswhentitlecased}\p{cwt}/g,utf
  2076. >AN<>\x{149}\x{120}<>yz<
  2077. /\p{dash}\p{dash}/g,utf
  2078. >\x{2d}\x{1400}<>yz<
  2079. /\p{defaultignorablecodepoint}\p{di}/g,utf
  2080. >AN<>\x{ad}\x{e0fff}<>yz<
  2081. /\p{deprecated}\p{dep}/g,utf
  2082. >AN<>\x{149}\x{e0001}<>yz<
  2083. /\p{diacritic}\p{dia}/g,utf
  2084. >AN<>\x{f84}\x{5e}<>yz<
  2085. /\p{emojicomponent}\p{ecomp}/g,utf
  2086. >AN<>\x{200d}\x{e007f}<>yz<
  2087. /\p{emojimodifier}\p{emod}/g,utf
  2088. >AN<>\x{1f3fb}\x{1f3ff}<>yz<
  2089. /\p{emojipresentation}\p{epres}/g,utf
  2090. >AN<>\x{2653}\x{1f6d2}<>yz<
  2091. /\p{extender}\p{ext}/g,utf
  2092. >AN<>\x{1e944}\x{b7}<>yz<
  2093. /\p{extendedpictographic}\p{extpict}/g,utf
  2094. >AN<>\x{26cf}\x{ae}<>yz<
  2095. /\p{graphemebase}\p{grbase}/g,utf
  2096. >AN<>\x{10f}\x{60}<>yz<
  2097. /\p{graphemeextend}\p{grext}/g,utf
  2098. >AN<>\x{300}\x{b44}<>yz<
  2099. /\p{hexdigit}\p{hex}/g,utf
  2100. >AF23<>\x{ff46}\x{ff10}<>yz<
  2101. /\p{idcontinue}\p{idc}/g,utf
  2102. >AF23<>\x{146}\x{7a}<>yz<
  2103. /\p{ideographic}\p{ideo}/g,utf
  2104. >AF23<>\x{30000}\x{3006}<>yz<
  2105. /\p{idstart}\p{ids}/g,utf
  2106. >AF23<>\x{146}\x{7a}<>yz<
  2107. /\p{idsbinaryoperator}\p{idsb}/g,utf
  2108. >AF23<>\x{2ff0}\x{2ffb}<>yz<\x{2ff2}\x{2ff1}
  2109. /\p{idstrinaryoperator}\p{idst}/g,utf
  2110. >AF23<>\x{2ff2}\x{2ff3}<>yz<
  2111. /\p{Join Control}\p{joinc}/g,utf
  2112. >AF23<>\x{200c}\x{200d}<>yz<
  2113. /\p{logical_order_exception}\p{loe}/g,utf
  2114. >AF23<>\x{e40}\x{aabc}<>yz<
  2115. /\p{Lowercase}\p{lower}/g,utf
  2116. >AF23<>\x{146}\x{7a}<>yz<
  2117. /\p{math}\p{math}/g,utf
  2118. >AF23<>\x{2215}\x{2b}<>yz<
  2119. /\p{Non Character Code Point}\p{nchar}/g,utf
  2120. >AF23<>\x{10ffff}\x{fdd0}<>yz<
  2121. /\p{patternsyntax}\p{patsyn}/g,utf
  2122. >AF23<>\x{21cd}\x{21}<>yz<
  2123. /\p{patternwhitespace}\p{patws}/g,utf
  2124. >AF23<>\x{2029}\x{85}<>yz<
  2125. /\p{prependedconcatenationmark}\p{pcm}/g,utf
  2126. >AF23<>\x{600}\x{110cd}<>yz<
  2127. /\p{quotationmark}\p{qmark}/g,utf
  2128. >AF23<>\x{ff63}\x{22}<>yz<
  2129. /\p{radical}\p{radical}/g,utf
  2130. >AF23<>\x{2fd5}\x{2e80}<>yz<
  2131. /\p{regionalindicator}\p{ri}/g,utf
  2132. >AF23<>\x{1f1e6}\x{1f1ff}<>yz<
  2133. /=\p{whitespace}\p{space}\p{wspace}=/g,utf
  2134. >AF23<=\x{d}\x{1680}\x{3000}=>yz<
  2135. /\p{sentenceterminal}\p{sterm}/g,utf
  2136. >AF23<>\x{1da88}\x{2e}<>yz<
  2137. /\p{terminalpunctuation}\p{term}/g,utf
  2138. >AF23<>\x{1da88}\x{2e}<>yz<
  2139. /\p{unified ideograph}\p{uideo}/g,utf
  2140. >AF23<>\x{30000}\x{3400}<>yz<
  2141. /\p{UPPERcase}\p{upper}/g,utf
  2142. >AF23<>\x{146}\x{7a}<>yz<
  2143. /\p{variationselector}\p{vs}/g,utf
  2144. >AF23<>\x{180b}\x{e01ef}<>yz<
  2145. /\p{xidcontinue}\p{xidc}/g,utf
  2146. >AF23<>\x{146}\x{30}<>yz<
  2147. # -----------------------------------------------------------------------------
  2148. # Variable-length lookbehinds.
  2149. /(?<=áb?c).../g,utf
  2150. ábcdèfgácxyz
  2151. /(?<=PQR|áb?c).../g,utf
  2152. ábcdèfgácxyzPQR123
  2153. /(?<=áb?c|PQR).../g,utf
  2154. ábcdèfgácxyzPQR123
  2155. /(?<=PQ|áb?c).../g,utf
  2156. ábcdèfgácxyzPQR123
  2157. /(?<=áb?c|PQ).../g,utf
  2158. ábcdèfgácxyzPQR123
  2159. /(?<=á(b?c|d?è?è)f)X./g,utf
  2160. ácfX1zzzáèfX2zzzádèèfX3zzzX4zzz
  2161. /(?<!á(b?c|d?è?è)f)X./g,utf
  2162. ácfX1zzzáèfX2zzzádèèfX3zzzX4zzz
  2163. /(?(?<=áb?c)d|è)/utf
  2164. ábcdèfg
  2165. ácdèfg
  2166. áxdèfg
  2167. /(?<=\d{2,3}|áBC)./utf
  2168. áBCD
  2169. /(?<=á(b?c){3}d)X/utf
  2170. ZXácbccdXYZ
  2171. /(?<=á(b?c){0}d)X/utf
  2172. ZXádXYZ
  2173. /(?<=á?(b?c){0}d)X./utf
  2174. ZXádXYZ
  2175. # --------------------------------------------------------------------------
  2176. /\N{ U+1234 }/utf
  2177. \x{1234}
  2178. /\o{ 1234 }/utf
  2179. x\o{1234}y
  2180. /\x{ 1234 }/utf
  2181. x\x{1234}y
  2182. /\p{ L }/
  2183. 23AB56
  2184. /\w+/utf,ucp
  2185. --cafe\x{300}_au\x{203f}lait!
  2186. /[\w]+/utf,ucp
  2187. --cafe\x{300}_au\x{203f}lait!
  2188. /[[:word:]]+/utf,ucp
  2189. --cafe\x{300}_au\x{203f}lait!
  2190. /[[:xdigit:]]+/utf,ucp
  2191. --123ef\x{ff10}\x{ff19}\x{ff21}\x{ff26}\x{ff1a}
  2192. /\b.+?\b/utf,ucp
  2193. --cafe\x{300}_au\x{203f}lait!
  2194. /caf\B.+?\B/utf,ucp
  2195. --cafe\x{300}_au\x{203f}lait!
  2196. # End of testinput4