# This set of tests is for UTF support, including Unicode properties. The # Unicode tests are all compatible with all versions of Perl >= 5.10, but # some of the property tests may differ because of different versions of # Unicode in use by PCRE2 and Perl. # WARNING: Use only / as the pattern delimiter. Although pcre2test supports # a number of delimiters, all those other than / give problems with the # perltest.sh script. #newline_default lf anycrlf any #perltest /a.b/utf acb a\x7fb a\x{100}b \= Expect no match a\nb /a(.{3})b/utf a\x{4000}xyb a\x{4000}\x7fyb a\x{4000}\x{100}yb \= Expect no match a\x{4000}b ac\ncb /a(.*?)(.)/ a\xc0\x88b /a(.*?)(.)/utf a\x{100}b /a(.*)(.)/ a\xc0\x88b /a(.*)(.)/utf a\x{100}b /a(.)(.)/ a\xc0\x92bcd /a(.)(.)/utf a\x{240}bcd /a(.?)(.)/ a\xc0\x92bcd /a(.?)(.)/utf a\x{240}bcd /a(.??)(.)/ a\xc0\x92bcd /a(.??)(.)/utf a\x{240}bcd /a(.{3})b/utf a\x{1234}xyb a\x{1234}\x{4321}yb a\x{1234}\x{4321}\x{3412}b \= Expect no match a\x{1234}b ac\ncb /a(.{3,})b/utf a\x{1234}xyb a\x{1234}\x{4321}yb a\x{1234}\x{4321}\x{3412}b axxxxbcdefghijb a\x{1234}\x{4321}\x{3412}\x{3421}b \= Expect no match a\x{1234}b /a(.{3,}?)b/utf a\x{1234}xyb a\x{1234}\x{4321}yb a\x{1234}\x{4321}\x{3412}b axxxxbcdefghijb a\x{1234}\x{4321}\x{3412}\x{3421}b \= Expect no match a\x{1234}b /a(.{3,5})b/utf a\x{1234}xyb a\x{1234}\x{4321}yb a\x{1234}\x{4321}\x{3412}b axxxxbcdefghijb a\x{1234}\x{4321}\x{3412}\x{3421}b axbxxbcdefghijb axxxxxbcdefghijb \= Expect no match a\x{1234}b axxxxxxbcdefghijb /a(.{3,5}?)b/utf a\x{1234}xyb a\x{1234}\x{4321}yb a\x{1234}\x{4321}\x{3412}b axxxxbcdefghijb a\x{1234}\x{4321}\x{3412}\x{3421}b axbxxbcdefghijb axxxxxbcdefghijb \= Expect no match a\x{1234}b axxxxxxbcdefghijb /^[a\x{c0}]/utf \= Expect no match \x{100} /(?<=aXb)cd/utf aXbcd /(?<=a\x{100}b)cd/utf a\x{100}bcd /(?<=a\x{100000}b)cd/utf a\x{100000}bcd /(?:\x{100}){3}b/utf \x{100}\x{100}\x{100}b \= Expect no match \x{100}\x{100}b /\x{ab}/utf \x{ab} \xc2\xab \= Expect no match \x00{ab} /(?<=(.))X/utf WXYZ \x{256}XYZ \= Expect no match XYZ /[^a]+/g,utf bcd \x{100}aY\x{256}Z /^[^a]{2}/utf \x{100}bc /^[^a]{2,}/utf \x{100}bcAa /^[^a]{2,}?/utf \x{100}bca /[^a]+/gi,utf bcd \x{100}aY\x{256}Z /^[^a]{2}/i,utf \x{100}bc /^[^a]{2,}/i,utf \x{100}bcAa /^[^a]{2,}?/i,utf \x{100}bca /\x{100}{0,0}/utf abcd /\x{100}?/utf abcd \x{100}\x{100} /\x{100}{0,3}/utf \x{100}\x{100} \x{100}\x{100}\x{100}\x{100} /\x{100}*/utf abce \x{100}\x{100}\x{100}\x{100} /\x{100}{1,1}/utf abcd\x{100}\x{100}\x{100}\x{100} /\x{100}{1,3}/utf abcd\x{100}\x{100}\x{100}\x{100} /\x{100}+/utf abcd\x{100}\x{100}\x{100}\x{100} /\x{100}{3}/utf abcd\x{100}\x{100}\x{100}XX /\x{100}{3,5}/utf abcd\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}XX /\x{100}{3,}/utf abcd\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}XX /(?<=a\x{100}{2}b)X/utf,aftertext Xyyya\x{100}\x{100}bXzzz /\D*/utf aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa /\D*/utf \x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100}\x{100} /\D/utf 1X2 1\x{100}2 />\S/utf > >X Y > >\x{100} Y /\d/utf \x{100}3 /\s/utf \x{100} X /\D+/utf 12abcd34 \= Expect no match 1234 /\D{2,3}/utf 12abcd34 12ab34 \= Expect no match 1234 12a34 /\D{2,3}?/utf 12abcd34 12ab34 \= Expect no match 1234 12a34 /\d+/utf 12abcd34 /\d{2,3}/utf 12abcd34 1234abcd \= Expect no match 1.4 /\d{2,3}?/utf 12abcd34 1234abcd \= Expect no match 1.4 /\S+/utf 12abcd34 \= Expect no match \ \ /\S{2,3}/utf 12abcd34 1234abcd \= Expect no match \ \ /\S{2,3}?/utf 12abcd34 1234abcd \= Expect no match \ \ />\s+ <34 />\s{2,3} \s{2,3}? \xff< /[\xff]/utf >\x{ff}< /[^\xFF]/ XYZ /[^\xff]/utf XYZ \x{123} /^[ac]*b/utf \= Expect no match xb /^[ac\x{100}]*b/utf \= Expect no match xb /^[^x]*b/i,utf \= Expect no match xb /^[^x]*b/utf \= Expect no match xb /^\d*b/utf \= Expect no match xb /(|a)/g,utf catac a\x{256}a /^\x{85}$/i,utf \x{85} /^ሴ/utf ሴ /^\ሴ/utf ሴ /(?s)(.{1,5})/utf abcdefg ab /a*\x{100}*\w/utf a /\S\S/g,utf A\x{a3}BC /\S{2}/g,utf A\x{a3}BC /\W\W/g,utf +\x{a3}== /\W{2}/g,utf +\x{a3}== /\S/g,utf \x{442}\x{435}\x{441}\x{442} /[\S]/g,utf \x{442}\x{435}\x{441}\x{442} /\D/g,utf \x{442}\x{435}\x{441}\x{442} /[\D]/g,utf \x{442}\x{435}\x{441}\x{442} /\W/g,utf \x{2442}\x{2435}\x{2441}\x{2442} /[\W]/g,utf \x{2442}\x{2435}\x{2441}\x{2442} /[\S\s]*/utf abc\n\r\x{442}\x{435}\x{441}\x{442}xyz /[\x{41f}\S]/g,utf \x{442}\x{435}\x{441}\x{442} /.[^\S]./g,utf abc def\x{442}\x{443}xyz\npqr /.[^\S\n]./g,utf abc def\x{442}\x{443}xyz\npqr /[[:^alnum:]]/g,utf +\x{2442} /[[:^alpha:]]/g,utf +\x{2442} /[[:^ascii:]]/g,utf A\x{442} /[[:^blank:]]/g,utf A\x{442} /[[:^cntrl:]]/g,utf A\x{442} /[[:^digit:]]/g,utf A\x{442} /[[:^graph:]]/g,utf \x19\x{e01ff} /[[:^lower:]]/g,utf A\x{422} /[[:^print:]]/g,utf \x{19}\x{e01ff} /[[:^punct:]]/g,utf A\x{442} /[[:^space:]]/g,utf A\x{442} /[[:^upper:]]/g,utf a\x{442} /[[:^word:]]/g,utf +\x{2442} /[[:^xdigit:]]/g,utf M\x{442} /[^ABCDEFGHIJKLMNOPQRSTUVWXYZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞĀĂĄĆĈĊČĎĐĒĔĖĘĚĜĞĠĢĤĦĨĪĬĮİIJĴĶĹĻĽĿŁŃŅŇŊŌŎŐŒŔŖŘŚŜŞŠŢŤŦŨŪŬŮŰŲŴŶŸŹŻŽƁƂƄƆƇƉƊƋƎƏƐƑƓƔƖƗƘƜƝƟƠƢƤƦƧƩƬƮƯƱƲƳƵƷƸƼDŽLJNJǍǏǑǓǕǗǙǛǞǠǢǤǦǨǪǬǮDZǴǶǷǸǺǼǾȀȂȄȆȈȊȌȎȐȒȔȖȘȚȜȞȠȢȤȦȨȪȬȮȰȲȺȻȽȾɁΆΈΉΊΌΎΏΑΒΓΔΕΖΗΘΙΚΛΜΝΞΟΠΡΣΤΥΦΧΨΩΪΫϒϓϔϘϚϜϞϠϢϤϦϨϪϬϮϴϷϹϺϽϾϿЀЁЂЃЄЅІЇЈЉЊЋЌЍЎЏАБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯѠѢѤѦѨѪѬѮѰѲѴѶѸѺѼѾҀҊҌҎҐҒҔҖҘҚҜҞҠҢҤҦҨҪҬҮҰҲҴҶҸҺҼҾӀӁӃӅӇӉӋӍӐӒӔӖӘӚӜӞӠӢӤӦӨӪӬӮӰӲӴӶӸԀԂԄԆԈԊԌԎԱԲԳԴԵԶԷԸԹԺԻԼԽԾԿՀՁՂՃՄՅՆՇՈՉՊՋՌՍՎՏՐՑՒՓՔՕՖႠႡႢႣႤႥႦႧႨႩႪႫႬႭႮႯႰႱႲႳႴႵႶႷႸႹႺႻႼႽႾႿჀჁჂჃჄჅḀḂḄḆḈḊḌḎḐḒḔḖḘḚḜḞḠḢḤḦḨḪḬḮḰḲḴḶḸḺḼḾṀṂṄṆṈṊṌṎṐṒṔṖṘṚṜṞṠṢṤṦṨṪṬṮṰṲṴṶṸṺṼṾẀẂẄẆẈẊẌẎẐẒẔẠẢẤẦẨẪẬẮẰẲẴẶẸẺẼẾỀỂỄỆỈỊỌỎỐỒỔỖỘỚỜỞỠỢỤỦỨỪỬỮỰỲỴỶỸἈἉἊἋἌἍἎἏἘἙἚἛἜἝἨἩἪἫἬἭἮἯἸἹἺἻἼἽἾἿὈὉὊὋὌὍὙὛὝὟὨὩὪὫὬὭὮὯᾸᾹᾺΆῈΈῊΉῘῙῚΊῨῩῪΎῬῸΌῺΏabcdefghijklmnopqrstuvwxyzªµºßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿāăąćĉċčďđēĕėęěĝğġģĥħĩīĭįıijĵķĸĺļľŀłńņňʼnŋōŏőœŕŗřśŝşšţťŧũūŭůűųŵŷźżžſƀƃƅƈƌƍƒƕƙƚƛƞơƣƥƨƪƫƭưƴƶƹƺƽƾƿdžljnjǎǐǒǔǖǘǚǜǝǟǡǣǥǧǩǫǭǯǰdzǵǹǻǽǿȁȃȅȇȉȋȍȏȑȓȕȗșțȝȟȡȣȥȧȩȫȭȯȱȳȴȵȶȷȸȹȼȿɀɐɑɒɓɔɕɖɗɘəɚɛɜɝɞɟɠɡɢɣɤɥɦɧɨɩɪɫɬɭɮɯɰɱɲɳɴɵɶɷɸɹɺɻɼɽɾɿʀʁʂʃʄʅʆʇʈʉʊʋʌʍʎʏʐʑʒʓʔʕʖʗʘʙʚʛʜʝʞʟʠʡʢʣʤʥʦʧʨʩʪʫʬʭʮʯΐάέήίΰαβγδεζηθικλμνξοπρςστυφχψωϊϋόύώϐϑϕϖϗϙϛϝϟϡϣϥϧϩϫϭϯϰϱϲϳϵϸϻϼабвгдежзийклмнопрстуфхцчшщъыьэюяѐёђѓєѕіїјљњћќѝўџѡѣѥѧѩѫѭѯѱѳѵѷѹѻѽѿҁҋҍҏґғҕҗҙқҝҟҡңҥҧҩҫҭүұҳҵҷҹһҽҿӂӄӆӈӊӌӎӑӓӕӗәӛӝӟӡӣӥӧөӫӭӯӱӳӵӷӹԁԃԅԇԉԋԍԏաբգդեզէըթժիլխծկհձղճմյնշոչպջռսվտրցւփքօֆևᴀᴁᴂᴃᴄᴅᴆᴇᴈᴉᴊᴋᴌᴍᴎᴏᴐᴑᴒᴓᴔᴕᴖᴗᴘᴙᴚᴛᴜᴝᴞᴟᴠᴡᴢᴣᴤᴥᴦᴧᴨᴩᴪᴫᵢᵣᵤᵥᵦᵧᵨᵩᵪᵫᵬᵭᵮᵯᵰᵱᵲᵳᵴᵵᵶᵷᵹᵺᵻᵼᵽᵾᵿᶀᶁᶂᶃᶄᶅᶆᶇᶈᶉᶊᶋᶌᶍᶎᶏᶐᶑᶒᶓᶔᶕᶖᶗᶘᶙᶚḁḃḅḇḉḋḍḏḑḓḕḗḙḛḝḟḡḣḥḧḩḫḭḯḱḳḵḷḹḻḽḿṁṃṅṇṉṋṍṏṑṓṕṗṙṛṝṟṡṣṥṧṩṫṭṯṱṳṵṷṹṻṽṿẁẃẅẇẉẋẍẏẑẓẕẖẗẘẙẚẛạảấầẩẫậắằẳẵặẹẻẽếềểễệỉịọỏốồổỗộớờởỡợụủứừửữựỳỵỷỹἀἁἂἃἄἅἆἇἐἑἒἓἔἕἠἡἢἣἤἥἦἧἰἱἲἳἴἵἶἷὀὁὂὃὄὅὐὑὒὓὔὕὖὗὠὡὢὣὤὥὦὧὰάὲέὴήὶίὸόὺύὼώᾀᾁᾂᾃᾄᾅᾆᾇᾐᾑᾒᾓᾔᾕᾖᾗᾠᾡᾢᾣᾤᾥᾦᾧᾰᾱᾲᾳᾴᾶᾷιῂῃῄῆῇῐῑῒΐῖῗῠῡῢΰῤῥῦῧῲῳῴῶῷⲁⲃⲅⲇⲉⲋⲍⲏⲑⲓⲕⲗⲙⲛⲝⲟⲡⲣⲥⲧⲩⲫⲭⲯⲱⲳⲵⲷⲹⲻⲽⲿⳁⳃⳅⳇⳉⳋⳍⳏⳑⳓⳕⳗⳙⳛⳝⳟⳡⳣⳤⴀⴁⴂⴃⴄⴅⴆⴇⴈⴉⴊⴋⴌⴍⴎⴏⴐⴑⴒⴓⴔⴕⴖⴗⴘⴙⴚⴛⴜⴝⴞⴟⴠⴡⴢⴣⴤⴥfffiflffifflſtstﬓﬔﬕﬖﬗ\d_^]/utf /^[^d]*?$/ abc /^[^d]*?$/utf abc /^[^d]*?$/i abc /^[^d]*?$/i,utf abc /(?i)[\xc3\xa9\xc3\xbd]|[\xc3\xa9\xc3\xbdA]/utf /^[a\x{c0}]b/utf \x{c0}b /^([a\x{c0}]*?)aa/utf a\x{c0}aaaa/ /^([a\x{c0}]*?)aa/utf a\x{c0}aaaa/ a\x{c0}a\x{c0}aaa/ /^([a\x{c0}]*)aa/utf a\x{c0}aaaa/ a\x{c0}a\x{c0}aaa/ /^([a\x{c0}]*)a\x{c0}/utf a\x{c0}aaaa/ a\x{c0}a\x{c0}aaa/ /A*/g,utf AAB\x{123}BAA /(abc)\1/i,utf \= Expect no match abc /(abc)\1/utf \= Expect no match abc /a(*:a\x{1234}b)/utf,mark abc /a(*:a£b)/utf,mark abc # Noncharacters /./utf \x{fffe} \x{ffff} \x{1fffe} \x{1ffff} \x{2fffe} \x{2ffff} \x{3fffe} \x{3ffff} \x{4fffe} \x{4ffff} \x{5fffe} \x{5ffff} \x{6fffe} \x{6ffff} \x{7fffe} \x{7ffff} \x{8fffe} \x{8ffff} \x{9fffe} \x{9ffff} \x{afffe} \x{affff} \x{bfffe} \x{bffff} \x{cfffe} \x{cffff} \x{dfffe} \x{dffff} \x{efffe} \x{effff} \x{ffffe} \x{fffff} \x{10fffe} \x{10ffff} \x{fdd0} \x{fdd1} \x{fdd2} \x{fdd3} \x{fdd4} \x{fdd5} \x{fdd6} \x{fdd7} \x{fdd8} \x{fdd9} \x{fdda} \x{fddb} \x{fddc} \x{fddd} \x{fdde} \x{fddf} \x{fde0} \x{fde1} \x{fde2} \x{fde3} \x{fde4} \x{fde5} \x{fde6} \x{fde7} \x{fde8} \x{fde9} \x{fdea} \x{fdeb} \x{fdec} \x{fded} \x{fdee} \x{fdef} /^\d*\w{4}/utf 1234 \= Expect no match 123 /^[^b]*\w{4}/utf aaaa \= Expect no match aaa /^[^b]*\w{4}/i,utf aaaa \= Expect no match aaa /^\x{100}*.{4}/utf \x{100}\x{100}\x{100}\x{100} \= Expect no match \x{100}\x{100}\x{100} /^\x{100}*.{4}/i,utf \x{100}\x{100}\x{100}\x{100} \= Expect no match \x{100}\x{100}\x{100} /^a+[a\x{200}]/utf aa /^.\B.\B./utf \x{10123}\x{10124}\x{10125} /^#[^\x{ffff}]#[^\x{ffff}]#[^\x{ffff}]#/utf #\x{10000}#\x{100}#\x{10ffff}# # Unicode property support tests /^\pC\pL\pM\pN\pP\pS\pZ\s+/utf,ucp >\x{20}\x{a0}\x{1680}\x{2028}\x{2029}\x{202f}\x{9}\x{b} /^>\pZ+/utf,ucp >\x{20}\x{a0}\x{1680}\x{2028}\x{2029}\x{202f}\x{9}\x{b} /^>[[:space:]]*/utf,ucp >\x{20}\x{a0}\x{1680}\x{2028}\x{2029}\x{202f}\x{9}\x{b} /^>[[:blank:]]*/utf,ucp >\x{20}\x{a0}\x{1680}\x{2000}\x{202f}\x{9}\x{b}\x{2028} /^[[:alpha:]]*/utf,ucp Az\x{aa}\x{c0}\x{1c5}\x{2b0}\x{3b6}\x{1d7c9}\x{2fa1d} /^[[:alnum:]]*/utf,ucp Az\x{aa}\x{c0}\x{1c5}\x{2b0}\x{3b6}\x{1d7c9}\x{2fa1d}1\x{660}\x{bef}\x{16ee} /^[[:cntrl:]]*/utf,ucp \x{0}\x{09}\x{1f}\x{7f}\x{9f} /^[[:graph:]]*/utf,ucp A\x{a1}\x{a0} /^[[:print:]]*/utf,ucp A z\x{a0}\x{a1} /^[[:punct:]]*/utf,ucp .+\x{a1}\x{a0} /\p{Zs}*?\R/ \= Expect no match a\xFCb /\p{Zs}*\R/ \= Expect no match a\xFCb /ⱥ/i,utf ⱥ Ⱥx Ⱥ /[ⱥ]/i,utf ⱥ Ⱥx Ⱥ /Ⱥ/i,utf Ⱥ ⱥ # These are tests for extended grapheme clusters /^\X/utf,aftertext G\x{34e}\x{34e}X \x{34e}\x{34e}X \x04X \x{1100}X \x{1100}\x{34e}X \x{1b04}\x{1b04}X *These match up to the roman letters \x{1111}\x{1111}L,L \x{1111}\x{1111}\x{1169}L,L,V \x{1111}\x{ae4c}L, LV \x{1111}\x{ad89}L, LVT \x{1111}\x{ae4c}\x{1169}L, LV, V \x{1111}\x{ae4c}\x{1169}\x{1169}L, LV, V, V \x{1111}\x{ae4c}\x{1169}\x{11fe}L, LV, V, T \x{1111}\x{ad89}\x{11fe}L, LVT, T \x{1111}\x{ad89}\x{11fe}\x{11fe}L, LVT, T, T \x{ad89}\x{11fe}\x{11fe}LVT, T, T *These match just the first codepoint (invalid sequence) \x{1111}\x{11fe}L, T \x{ae4c}\x{1111}LV, L \x{ae4c}\x{ae4c}LV, LV \x{ae4c}\x{ad89}LV, LVT \x{1169}\x{1111}V, L \x{1169}\x{ae4c}V, LV \x{1169}\x{ad89}V, LVT \x{ad89}\x{1111}LVT, L \x{ad89}\x{1169}LVT, V \x{ad89}\x{ae4c}LVT, LV \x{ad89}\x{ad89}LVT, LVT \x{11fe}\x{1111}T, L \x{11fe}\x{1169}T, V \x{11fe}\x{ae4c}T, LV \x{11fe}\x{ad89}T, LVT *Test extend and spacing mark \x{1111}\x{ae4c}\x{0711}L, LV, extend \x{1111}\x{ae4c}\x{1b04}L, LV, spacing mark \x{1111}\x{ae4c}\x{1b04}\x{0711}\x{1b04}L, LV, spacing mark, extend, spacing mark *Test CR, LF, and control \x0d\x{0711}CR, extend \x0d\x{1b04}CR, spacingmark \x0a\x{0711}LF, extend \x0a\x{1b04}LF, spacingmark \x0b\x{0711}Control, extend \x09\x{1b04}Control, spacingmark *Test Extended Pictographic after bug fix \x{261d}\x{261d}B Extended_Pictographic Extended_Pictographic \x{261D}\x{1F3FB}\x{261d}B Extended_Pictographic Extend E-P \x{261D}\x{1F3FB}\x{200d}\x{261d}B Extended_Pictographic Extend ZWJ E-P \x{1f3f3}\x{fe0f}\x{200d}\x{1f308}\x{1f3f4}\x{200d}\x{2620}\x{fe0f}\x{1f3f3}\x{fe0f}\x{200d}\x{1f308}\x{1f3f4}\x{200d}\x{2620}\x{fe0f} A\x{200d}\x{1f308}B A\x{200d}B A ZWJ \x{261D}\x{1F3FB}B Extended_Pictographic Extend \x{1F1E6}\x{1F1E7}B RegionalIndicator RegionalIndicator *There are no Prepend characters, so we can't test Prepend, CR /^(?>\X{2})X/utf,aftertext \x{1111}\x{ae4c}\x{1111}\x{ae4c}X /^\X{2,4}X/utf,aftertext \x{1111}\x{ae4c}\x{1111}\x{ae4c}X \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X /^\X{2,4}?X/utf,aftertext \x{1111}\x{ae4c}\x{1111}\x{ae4c}X \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X \x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}\x{1111}\x{ae4c}X /\X*Z/utf,no_start_optimize \= Expect no match A\x{300} /\X*(.)/utf,no_start_optimize A\x{1111}\x{ae4c}\x{1169} # -------------------------------------------- /\x{1e9e}+/i,utf \x{1e9e}\x{00df} /[z\x{1e9e}]+/i,utf \x{1e9e}\x{00df} /\x{00df}+/i,utf \x{1e9e}\x{00df} /[z\x{00df}]+/i,utf \x{1e9e}\x{00df} /\x{1f88}+/i,utf \x{1f88}\x{1f80} /[z\x{1f88}]+/i,utf \x{1f88}\x{1f80} # Check a reference with more than one other case /^(\x{00b5})\1{2}$/i,utf \x{00b5}\x{039c}\x{03bc} # Characters with more than one other case; test in classes /[z\x{00b5}]+/i,utf \x{00b5}\x{039c}\x{03bc} /[z\x{039c}]+/i,utf \x{00b5}\x{039c}\x{03bc} /[z\x{03bc}]+/i,utf \x{00b5}\x{039c}\x{03bc} /[z\x{00c5}]+/i,utf \x{00c5}\x{00e5}\x{212b} /[z\x{00e5}]+/i,utf \x{00c5}\x{00e5}\x{212b} /[z\x{212b}]+/i,utf \x{00c5}\x{00e5}\x{212b} /[z\x{01c4}]+/i,utf \x{01c4}\x{01c5}\x{01c6} /[z\x{01c5}]+/i,utf \x{01c4}\x{01c5}\x{01c6} /[z\x{01c6}]+/i,utf \x{01c4}\x{01c5}\x{01c6} /[z\x{01c7}]+/i,utf \x{01c7}\x{01c8}\x{01c9} /[z\x{01c8}]+/i,utf \x{01c7}\x{01c8}\x{01c9} /[z\x{01c9}]+/i,utf \x{01c7}\x{01c8}\x{01c9} /[z\x{01ca}]+/i,utf \x{01ca}\x{01cb}\x{01cc} /[z\x{01cb}]+/i,utf \x{01ca}\x{01cb}\x{01cc} /[z\x{01cc}]+/i,utf \x{01ca}\x{01cb}\x{01cc} /[z\x{01f1}]+/i,utf \x{01f1}\x{01f2}\x{01f3} /[z\x{01f2}]+/i,utf \x{01f1}\x{01f2}\x{01f3} /[z\x{01f3}]+/i,utf \x{01f1}\x{01f2}\x{01f3} /[z\x{0345}]+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /[z\x{0399}]+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /[z\x{03b9}]+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /[z\x{1fbe}]+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /[z\x{0392}]+/i,utf \x{0392}\x{03b2}\x{03d0} /[z\x{03b2}]+/i,utf \x{0392}\x{03b2}\x{03d0} /[z\x{03d0}]+/i,utf \x{0392}\x{03b2}\x{03d0} /[z\x{0395}]+/i,utf \x{0395}\x{03b5}\x{03f5} /[z\x{03b5}]+/i,utf \x{0395}\x{03b5}\x{03f5} /[z\x{03f5}]+/i,utf \x{0395}\x{03b5}\x{03f5} /[z\x{0398}]+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /[z\x{03b8}]+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /[z\x{03d1}]+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /[z\x{03f4}]+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /[z\x{039a}]+/i,utf \x{039a}\x{03ba}\x{03f0} /[z\x{03ba}]+/i,utf \x{039a}\x{03ba}\x{03f0} /[z\x{03f0}]+/i,utf \x{039a}\x{03ba}\x{03f0} /[z\x{03a0}]+/i,utf \x{03a0}\x{03c0}\x{03d6} /[z\x{03c0}]+/i,utf \x{03a0}\x{03c0}\x{03d6} /[z\x{03d6}]+/i,utf \x{03a0}\x{03c0}\x{03d6} /[z\x{03a1}]+/i,utf \x{03a1}\x{03c1}\x{03f1} /[z\x{03c1}]+/i,utf \x{03a1}\x{03c1}\x{03f1} /[z\x{03f1}]+/i,utf \x{03a1}\x{03c1}\x{03f1} /[z\x{03a3}]+/i,utf \x{03A3}\x{03C2}\x{03C3} /[z\x{03c2}]+/i,utf \x{03A3}\x{03C2}\x{03C3} /[z\x{03c3}]+/i,utf \x{03A3}\x{03C2}\x{03C3} /[z\x{03a6}]+/i,utf \x{03a6}\x{03c6}\x{03d5} /[z\x{03c6}]+/i,utf \x{03a6}\x{03c6}\x{03d5} /[z\x{03d5}]+/i,utf \x{03a6}\x{03c6}\x{03d5} /[z\x{03c9}]+/i,utf \x{03c9}\x{03a9}\x{2126} /[z\x{03a9}]+/i,utf \x{03c9}\x{03a9}\x{2126} /[z\x{2126}]+/i,utf \x{03c9}\x{03a9}\x{2126} /[z\x{1e60}]+/i,utf \x{1e60}\x{1e61}\x{1e9b} /[z\x{1e61}]+/i,utf \x{1e60}\x{1e61}\x{1e9b} /[z\x{1e9b}]+/i,utf \x{1e60}\x{1e61}\x{1e9b} # Perl 5.12.4 gets these wrong, but 5.15.3 is OK /[z\x{004b}]+/i,utf \x{004b}\x{006b}\x{212a} /[z\x{006b}]+/i,utf \x{004b}\x{006b}\x{212a} /[z\x{212a}]+/i,utf \x{004b}\x{006b}\x{212a} /[z\x{0053}]+/i,utf \x{0053}\x{0073}\x{017f} /[z\x{0073}]+/i,utf \x{0053}\x{0073}\x{017f} /[z\x{017f}]+/i,utf \x{0053}\x{0073}\x{017f} # -------------------------------------- /(ΣΆΜΟΣ) \1/i,utf ΣΆΜΟΣ ΣΆΜΟΣ ΣΆΜΟΣ σάμος σάμος σάμος σάμος σάμοσ σάμος ΣΆΜΟΣ /(σάμος) \1/i,utf ΣΆΜΟΣ ΣΆΜΟΣ ΣΆΜΟΣ σάμος σάμος σάμος σάμος σάμοσ σάμος ΣΆΜΟΣ /(ΣΆΜΟΣ) \1*/i,utf ΣΆΜΟΣ\x20 ΣΆΜΟΣ ΣΆΜΟΣσάμοςσάμος # Perl matches these /\x{00b5}+/i,utf \x{00b5}\x{039c}\x{03bc} /\x{039c}+/i,utf \x{00b5}\x{039c}\x{03bc} /\x{03bc}+/i,utf \x{00b5}\x{039c}\x{03bc} /\x{00c5}+/i,utf \x{00c5}\x{00e5}\x{212b} /\x{00e5}+/i,utf \x{00c5}\x{00e5}\x{212b} /\x{212b}+/i,utf \x{00c5}\x{00e5}\x{212b} /\x{01c4}+/i,utf \x{01c4}\x{01c5}\x{01c6} /\x{01c5}+/i,utf \x{01c4}\x{01c5}\x{01c6} /\x{01c6}+/i,utf \x{01c4}\x{01c5}\x{01c6} /\x{01c7}+/i,utf \x{01c7}\x{01c8}\x{01c9} /\x{01c8}+/i,utf \x{01c7}\x{01c8}\x{01c9} /\x{01c9}+/i,utf \x{01c7}\x{01c8}\x{01c9} /\x{01ca}+/i,utf \x{01ca}\x{01cb}\x{01cc} /\x{01cb}+/i,utf \x{01ca}\x{01cb}\x{01cc} /\x{01cc}+/i,utf \x{01ca}\x{01cb}\x{01cc} /\x{01f1}+/i,utf \x{01f1}\x{01f2}\x{01f3} /\x{01f2}+/i,utf \x{01f1}\x{01f2}\x{01f3} /\x{01f3}+/i,utf \x{01f1}\x{01f2}\x{01f3} /\x{0345}+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /\x{0399}+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /\x{03b9}+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /\x{1fbe}+/i,utf \x{0345}\x{0399}\x{03b9}\x{1fbe} /\x{0392}+/i,utf \x{0392}\x{03b2}\x{03d0} /\x{03b2}+/i,utf \x{0392}\x{03b2}\x{03d0} /\x{03d0}+/i,utf \x{0392}\x{03b2}\x{03d0} /\x{0395}+/i,utf \x{0395}\x{03b5}\x{03f5} /\x{03b5}+/i,utf \x{0395}\x{03b5}\x{03f5} /\x{03f5}+/i,utf \x{0395}\x{03b5}\x{03f5} /\x{0398}+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /\x{03b8}+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /\x{03d1}+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /\x{03f4}+/i,utf \x{0398}\x{03b8}\x{03d1}\x{03f4} /\x{039a}+/i,utf \x{039a}\x{03ba}\x{03f0} /\x{03ba}+/i,utf \x{039a}\x{03ba}\x{03f0} /\x{03f0}+/i,utf \x{039a}\x{03ba}\x{03f0} /\x{03a0}+/i,utf \x{03a0}\x{03c0}\x{03d6} /\x{03c0}+/i,utf \x{03a0}\x{03c0}\x{03d6} /\x{03d6}+/i,utf \x{03a0}\x{03c0}\x{03d6} /\x{03a1}+/i,utf \x{03a1}\x{03c1}\x{03f1} /\x{03c1}+/i,utf \x{03a1}\x{03c1}\x{03f1} /\x{03f1}+/i,utf \x{03a1}\x{03c1}\x{03f1} /\x{03a3}+/i,utf \x{03A3}\x{03C2}\x{03C3} /\x{03c2}+/i,utf \x{03A3}\x{03C2}\x{03C3} /\x{03c3}+/i,utf \x{03A3}\x{03C2}\x{03C3} /\x{03a6}+/i,utf \x{03a6}\x{03c6}\x{03d5} /\x{03c6}+/i,utf \x{03a6}\x{03c6}\x{03d5} /\x{03d5}+/i,utf \x{03a6}\x{03c6}\x{03d5} /\x{03c9}+/i,utf \x{03c9}\x{03a9}\x{2126} /\x{03a9}+/i,utf \x{03c9}\x{03a9}\x{2126} /\x{2126}+/i,utf \x{03c9}\x{03a9}\x{2126} /\x{1e60}+/i,utf \x{1e60}\x{1e61}\x{1e9b} /\x{1e61}+/i,utf \x{1e60}\x{1e61}\x{1e9b} /\x{1e9b}+/i,utf \x{1e60}\x{1e61}\x{1e9b} /\x{1e9e}+/i,utf \x{1e9e}\x{00df} /\x{00df}+/i,utf \x{1e9e}\x{00df} /\x{1f88}+/i,utf \x{1f88}\x{1f80} /\x{1f80}+/i,utf \x{1f88}\x{1f80} # Perl 5.12.4 gets these wrong, but 5.15.3 is OK /\x{004b}+/i,utf \x{004b}\x{006b}\x{212a} /\x{006b}+/i,utf \x{004b}\x{006b}\x{212a} /\x{212a}+/i,utf \x{004b}\x{006b}\x{212a} /\x{0053}+/i,utf \x{0053}\x{0073}\x{017f} /\x{0073}+/i,utf \x{0053}\x{0073}\x{017f} /\x{017f}+/i,utf \x{0053}\x{0073}\x{017f} /^\p{Any}*\d{4}/utf 1234 \= Expect no match 123 /^\X*\w{4}/utf 1234 \= Expect no match 123 /^A\s+Z/utf,ucp A\x{2005}Z A\x{85}\x{2005}Z /^A[\s]+Z/utf,ucp A\x{2005}Z A\x{85}\x{2005}Z /^[[:graph:]]+$/utf,ucp Letter:ABC Mark:\x{300}\x{1d172}\x{1d17b} Number:9\x{660} Punctuation:\x{66a},; Symbol:\x{6de}<>\x{fffc} Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f} \x{200b}\x{200c}\x{200d}\x{200e}\x{200f} \x{202a}\x{202b}\x{202c}\x{202d}\x{202e} \x{2060}\x{2061}\x{2062}\x{2063}\x{2064} \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f} \x{feff} \x{fff9}\x{fffa}\x{fffb} \x{110bd} \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a} \x{e0001} \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f} \= Expect no match \x{09} \x{0a} \x{1D} \x{20} \x{85} \x{a0} \x{1680} \x{2028} \x{2029} \x{202f} \x{2065} \x{3000} \x{e0002} \x{e001f} \x{e0080} /^[[:print:]]+$/utf,ucp Space: \x{a0} \x{1680}\x{2000}\x{2001}\x{2002}\x{2003}\x{2004}\x{2005} \x{2006}\x{2007}\x{2008}\x{2009}\x{200a} \x{202f}\x{205f} \x{3000} Letter:ABC Mark:\x{300}\x{1d172}\x{1d17b} Number:9\x{660} Punctuation:\x{66a},; Symbol:\x{6de}<>\x{fffc} Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f} \x{200b}\x{200c}\x{200d}\x{200e}\x{200f} \x{202a}\x{202b}\x{202c}\x{202d}\x{202e} \x{202f} \x{2060}\x{2061}\x{2062}\x{2063}\x{2064} \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f} \x{feff} \x{fff9}\x{fffa}\x{fffb} \x{110bd} \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a} \x{e0001} \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f} \= Expect no match \x{09} \x{1D} \x{85} \x{2028} \x{2029} \x{2065} \x{e0002} \x{e001f} \x{e0080} /^[[:punct:]]+$/utf,ucp \$+<=>^`|~ !\"#%&'()*,-./:;?@[\\]_{} \x{a1}\x{a7} \x{37e} \= Expect no match abcde /^[[:^graph:]]+$/utf,ucp \x{09}\x{0a}\x{1D}\x{20}\x{85}\x{a0}\x{1680} \x{2028}\x{2029}\x{202f}\x{2065} \x{3000}\x{e0002}\x{e001f}\x{e0080} \= Expect no match Letter:ABC Mark:\x{300}\x{1d172}\x{1d17b} Number:9\x{660} Punctuation:\x{66a},; Symbol:\x{6de}<>\x{fffc} Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f} \x{200b}\x{200c}\x{200d}\x{200e}\x{200f} \x{202a}\x{202b}\x{202c}\x{202d}\x{202e} \x{2060}\x{2061}\x{2062}\x{2063}\x{2064} \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f} \x{feff} \x{fff9}\x{fffa}\x{fffb} \x{110bd} \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a} \x{e0001} \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f} /^[[:^print:]]+$/utf,ucp \x{09}\x{1D}\x{85}\x{2028}\x{2029}\x{2065} \x{e0002}\x{e001f}\x{e0080} \= Expect no match Space: \x{a0} \x{1680}\x{2000}\x{2001}\x{2002}\x{2003}\x{2004}\x{2005} \x{2006}\x{2007}\x{2008}\x{2009}\x{200a} \x{202f}\x{205f} \x{3000} Letter:ABC Mark:\x{300}\x{1d172}\x{1d17b} Number:9\x{660} Punctuation:\x{66a},; Symbol:\x{6de}<>\x{fffc} Cf-property:\x{ad}\x{600}\x{601}\x{602}\x{603}\x{604}\x{6dd}\x{70f} \x{200b}\x{200c}\x{200d}\x{200e}\x{200f} \x{202a}\x{202b}\x{202c}\x{202d}\x{202e} \x{202f} \x{2060}\x{2061}\x{2062}\x{2063}\x{2064} \x{206a}\x{206b}\x{206c}\x{206d}\x{206e}\x{206f} \x{feff} \x{fff9}\x{fffa}\x{fffb} \x{110bd} \x{1d173}\x{1d174}\x{1d175}\x{1d176}\x{1d177}\x{1d178}\x{1d179}\x{1d17a} \x{e0001} \x{e0020}\x{e0030}\x{e0040}\x{e0050}\x{e0060}\x{e0070}\x{e007f} /^[[:^punct:]]+$/utf,ucp abcde \= Expect no match \$+<=>^`|~ !\"#%&'()*,-./:;?@[\\]_{} \x{a1}\x{a7} \x{37e} /[RST]+/i,utf,ucp Ss\x{17f} /[R-T]+/i,utf,ucp Ss\x{17f} /[q-u]+/i,utf,ucp Ss\x{17f} /^s?c/im,utf scat # The next four tests are for repeated caseless back references when the # code unit length of the matched text is different to that of the original # group in the UTF-8 case. /^(\x{23a})\1*(.)/i,utf \x{23a}\x{23a}\x{23a}\x{23a} \x{23a}\x{2c65}\x{2c65}\x{2c65} \x{23a}\x{23a}\x{2c65}\x{23a} /^(\x{23a})\1*(..)/i,utf \x{23a}\x{2c65}\x{2c65}\x{2c65} \x{23a}\x{23a}\x{2c65}\x{23a} /^(\x{23a})\1*(...)/i,utf \x{23a}\x{2c65}\x{2c65}\x{2c65} \x{23a}\x{23a}\x{2c65}\x{23a} /^(\x{23a})\1*(....)/i,utf \= Expect no match \x{23a}\x{2c65}\x{2c65}\x{2c65} \x{23a}\x{23a}\x{2c65}\x{23a} /[A-`]/i,utf abcdefghijklmno /[\S\V\H]/utf /[^\p{Any}]*+x/utf x /[[:punct:]]/utf,ucp \x{b4} /[[:^ascii:]]/utf,ucp \x{100} \x{200} \x{300} \x{37e} \= Expect no match aa 99 /[[:^ascii:]\w]/utf,ucp aa 99 gg \x{100} \x{200} \x{300} \x{37e} /[\w[:^ascii:]]/utf,ucp aa 99 gg \x{100} \x{200} \x{300} \x{37e} /[^[:ascii:]\W]/utf,ucp \x{100} \x{200} \= Expect no match aa 99 gg \x{37e} /[^[:^ascii:]\d]/utf,ucp a ~ \a \x{7f} \= Expect no match 0 \x{389} \x{20ac} /(?=.*b)\pL/ 11bb /(?(?=.*b)(?=.*b)\pL|.*c)/ 11bb /^\x{123}+?$/utf,no_auto_possess \x{123}\x{123}\x{123} /^\x{123}+?$/i,utf,no_auto_possess \x{123}\x{122}\x{123} \= Expect no match \x{123}\x{124}\x{123} /\N{U+1234}/utf \x{1234} /[\N{U+1234}]/utf \x{1234} # Test the full list of Unicode "Pattern White Space" characters that are to # be ignored by /x. The pattern lines below may show up oddly in text editors # or when listed to the screen. Note that characters such as U+2002, which are # matched as space by \h and \v are *not* "Pattern White Space". /A…‎‏

B/x,utf AB /A B/x,utf A\x{2002}B \= Expect no match AB # ------- /[^\x{100}-\x{ffff}]*[\x80-\xff]/utf \x{99}\x{99}\x{99} /[^\x{100}-\x{ffff}ABC]*[\x80-\xff]/utf \x{99}\x{99}\x{99} /[^\x{100}-\x{ffff}]*[\x80-\xff]/i,utf \x{99}\x{99}\x{99} # Script run tests /^(*script_run:.{4})/utf abcd Latin x4 \x{2e80}\x{2fa1d}\x{3041}\x{30a1} Han Han Hiragana Katakana \x{3041}\x{30a1}\x{3007}\x{3007} Hiragana Katakana Han Han \x{30a1}\x{3041}\x{3007}\x{3007} Katakana Hiragana Han Han \x{1100}\x{2e80}\x{2e80}\x{1101} Hangul Han Han Hangul \x{2e80}\x{3105}\x{2e80}\x{3105} Han Bopomofo Han Bopomofo \x{02ea}\x{2e80}\x{2e80}\x{3105} Bopomofo-Sk Han Han Bopomofo \x{3105}\x{2e80}\x{2e80}\x{3105} Bopomofo Han Han Bopomofo \x{0300}cd! Inherited Latin Latin Common \x{0391}12\x{03a9} Greek Common-digits Greek \x{0400}12\x{fe2f} Cyrillic Common-digits Cyrillic \x{0531}12\x{fb17} Armenian Common-digits Armenian \x{0591}12\x{fb4f} Hebrew Common-digits Hebrew \x{0600}12\x{1eef1} Arabic Common-digits Arabic \x{0600}\x{0660}\x{0669}\x{1eef1} Arabic Arabic-digits Arabic \x{0700}12\x{086a} Syriac Common-digits Syriac \x{1200}12\x{ab2e} Ethiopic Common-digits Ethiopic \x{1680}12\x{169c} Ogham Common-digits Ogham \x{3041}12\x{3041} Hiragana Common-digits Hiragana \x{0980}\x{09e6}\x{09e7}\x{0993} Bengali Bengali-digits Bengali !cde Common Latin Latin Latin A..B Latin Common Common Latin 0abc Ascii-digit Latin Latin Latin 1\x{0700}\x{0700}\x{0700} Ascii-digit Syriac x 3 \x{1A80}\x{1A80}\x{1a40}\x{1a41} Tai Tham Hora digits, letters \= Expect no match a\x{370}bcd Latin Greek Latin Latin \x{1100}\x{02ea}\x{02ea}\x{02ea} Hangul Bopomofo x3 \x{02ea}\x{02ea}\x{02ea}\x{1100} Bopomofo x3 Hangul \x{1100}\x{2e80}\x{3041}\x{1101} Hangul Han Hiragana Hangul \x{0391}\x{09e6}\x{09e7}\x{03a9} Greek Bengali digits Greek \x{0600}7\x{0669}\x{1eef1} Arabic ascii-digit Arabic-digit Arabic \x{0600}\x{0669}7\x{1eef1} Arabic Arabic-digit ascii-digit Arabic A5\x{ff19}B Latin Common-ascii/notascii-digits Latin \x{0300}cd\x{0391} Inherited Latin Latin Greek !cd\x{0391} Common Latin Latin Greek \x{1A80}\x{1A90}\x{1a40}\x{1a41} Tai Tham Hora digit, Tham digit, letters A\x{1d7ce}\x{1d7ff}B Common fancy-common-2-sets-digits Common \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana /^(*sr:.{4}|..)/utf \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana /^(*atomic_script_run:.{4}|..)/utf \= Expect no match \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana /^(*asr:.*)/utf \= Expect no match \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana /^(?>(*sr:.*))/utf \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana /^(*sr:.*)/utf \x{2e80}\x{3105}\x{2e80}\x{30a1} Han Bopomofo Han Katakana \x{10fffd}\x{10fffd}\x{10fffd} Private use (Unknown) /^(*sr:\x{2e80}*)/utf \x{2e80}\x{2e80}\x{3105} Han Han Bopomofo /^(*sr:\x{2e80}*)\x{2e80}/utf \x{2e80}\x{2e80}\x{3105} Han Han Bopomofo /^(*sr:.*)Test/utf Test script run on an empty string /^(*sr:(.{2})){2}/utf \x{0600}7\x{0669}\x{1eef1} Arabic ascii-digit Arabic-digit Arabic \x{1A80}\x{1A80}\x{1a40}\x{1a41} Tai Tham Hora digits, letters \x{1A80}\x{1a40}\x{1A90}\x{1a41} Tai Tham Hora digit, letter, Tham digit, letter \= Expect no match \x{1100}\x{2e80}\x{3041}\x{1101} Hangul Han Hiragana Hangul /^(*sr:\S*)/utf \x{1cf4}\x{20f0}\x{900}\x{11305} [Dev,Gran,Kan] [Dev,Gran,Lat] Dev Gran \x{1cf4}\x{20f0}\x{11305}\x{900} [Dev,Gran,Kan] [Dev,Gran,Lat] Gran Dev \x{1cf4}\x{20f0}\x{900}ABC [Dev,Gran,Kan] [Dev,Gran,Lat] Dev Lat \x{1cf4}\x{20f0}ABC [Dev,Gran,Kan] [Dev,Gran,Lat] Lat \x{20f0}ABC [Dev,Gran,Lat] Lat XYZ\x{20f0}ABC Lat [Dev,Gran,Lat] Lat \x{a36}\x{a33}\x{900} [Dev,...] [Dev,...] Dev \x{3001}\x{2e80}\x{3041}\x{30a1} [Bopo, Han, etc] Han Hira Kata \x{3001}\x{30a1}\x{2e80}\x{3041} [Bopo, Han, etc] Kata Han Hira \x{3001}\x{3105}\x{2e80}\x{1101} [Bopo, Han, etc] Bopomofo Han Hangul \x{3105}\x{3001}\x{2e80}\x{1101} Bopomofo [Bopo, Han, etc] Han Hangul \x{3031}\x{3041}\x{30a1}\x{2e80} [Hira Kata] Hira Kata Han \x{060c}\x{06d4}\x{0600}\x{10d00}\x{0700} [Arab Rohg Syrc Thaa] [Arab Rohg] Arab Rohg Syrc \x{060c}\x{06d4}\x{0700}\x{0600}\x{10d00} [Arab Rohg Syrc Thaa] [Arab Rohg] Syrc Arab Rohg \x{2e80}\x{3041}\x{3001}\x{3031}\x{2e80} Han Hira [Bopo, Han, etc] [Hira Kata] Han /(?\x{202c}<-- /\p{bidicontrol}+/utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /\p{bidic}+?/utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /\p{bidi_control}++/utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /[\p{bidi_c}]/utf -->\x{202c}<-- /[\p{bidicontrol}]+/utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /[\p{bidicontrol}]+?/utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /[\p{bidicontrol}]++/utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /[\p{bidicontrol}<>]+/utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /\P{bidicontrol}+/g,utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /\p{^bidicontrol}+/g,utf -->\x{061c}\x{200e}\x{200f}\x{202a}\x{202b}\x{202c}\x{202d}<-- -->\x{2066}\x{2067}\x{2068}\x{2069}<-- /\p{bidi class = al}/utf -->\x{061D}<-- /\p{bc = al}+/utf -->\x{061D}\x{061e}\x{061f}<-- /\p{bidi_class : AL}+?/utf -->\x{061D}\x{061e}\x{061f}<-- /\p{Bidi_Class : AL}++/utf -->\x{061D}\x{061e}\x{061f}<-- /\p{b_c = aN}+/utf -->\x{061D}\x{0602}\x{0604}\x{061f}<-- /\p{bidi class = B}+/utf -->\x{0a}\x{0d}\x{01c}\x{01e}\x{085}\x{2029}<-- /\p{bidi class:BN}+/utf -->\x{0}\x{08}\x{200c}\x{fffe}\x{dfffe}\x{10ffff}<-- /\p{bidiclass:cs}+/utf -->,.\x{060c}\x{ff1a}<-- /\p{bidiclass:En}+/utf -->09\x{b2}\x{2074}\x{1fbf9}<-- /\p{bidiclass:es}+/utf ==>+-\x{207a}\x{ff0d}<== /\p{bidiclass:et}+/utf -->#\{24}%\x{a2}\x{A838}\x{1e2ff}<-- /\p{bidiclass:FSI}+/utf -->\x{2068}<-- /\p{bidi class:L}+/utf -->ABC<-- /\P{bidi class:L}+/utf -->ABC<-- /\p{bidi class:LRE}+\p{bidiclass=lri}*\p{bidiclass:lro}/utf -->\x{202a}\x{2066}\x{202d}<-- /\p{bidi class:NSM}+/utf -->\x{9bc}\x{a71}\x{e31}<-- /\p{bidi class:ON}+/utf -->\x{21}'()*;@\x{384}\x{2039}<=- /\p{bidiclass:pdf}\p{bidiclass:pdi}/utf -->\x{202c}\x{2069}<-- /\p{bidi class:R}+/utf -->\x{590}\x{5c6}\x{200f}\x{10805}<-- /\p{bidi class:RLE}+\p{bidi class:RLI}*\p{bidi class:RLO}+/utf -->\x{202b}\x{2067}\x{202e}<-- /\p{bidi class:S}+\p{bidiclass:WS}+/utf -->\x{9}\x{b}\x{1f} \x{c} \x{2000} \x{3000}<-- # ----------------------------------------------------------------------------- /[\p{taml}\p{sc:ugar}]+/utf \x{0b82}\x{10380} /^[\p{sc:Arabic}]/utf \= Expect no match \x{650} \x{651} \x{652} \x{653} \x{654} \x{655} # ----------------------------------------------------------------------------- # Tests for newly-added Boolean Properties /\p{ahex}\p{asciihexdigit}/utf >4F< /\p{alpha}\p{alphabetic}/g,utf >AB<>\x{148}\x{1234} /\p{ascii}\p{ascii}/g,utf >AB<>\x{148}\x{1234} /\p{Bidi_C}\p{bidicontrol}/g,utf >\x{202d}\x{2069}< /\p{Bidi_M}\p{bidimirrored}/g,utf >\x{202d}\x{2069}<>\x{298b}\x{bb}< /\p{cased}\p{cased}/g,utf >AN<>\x{149}\x{120}< /\p{caseignorable}\p{ci}/g,utf >AN<>\x{60}\x{859}< /\p{changeswhencasefolded}\p{cwcf}/g,utf >AN<>\x{149}\x{120}< /\p{changeswhencasemapped}\p{cwcm}/g,utf >AN<>\x{149}\x{120}< /\p{changeswhenlowercased}\p{cwl}/g,utf >AN<>\x{149}\x{120}<>yz< /\p{changeswhenuppercased}\p{cwu}/g,utf >AN<>\x{149}\x{120}<>yz< /\p{changeswhentitlecased}\p{cwt}/g,utf >AN<>\x{149}\x{120}<>yz< /\p{dash}\p{dash}/g,utf >\x{2d}\x{1400}<>yz< /\p{defaultignorablecodepoint}\p{di}/g,utf >AN<>\x{ad}\x{e0fff}<>yz< /\p{deprecated}\p{dep}/g,utf >AN<>\x{149}\x{e0001}<>yz< /\p{diacritic}\p{dia}/g,utf >AN<>\x{f84}\x{5e}<>yz< /\p{emojicomponent}\p{ecomp}/g,utf >AN<>\x{200d}\x{e007f}<>yz< /\p{emojimodifier}\p{emod}/g,utf >AN<>\x{1f3fb}\x{1f3ff}<>yz< /\p{emojipresentation}\p{epres}/g,utf >AN<>\x{2653}\x{1f6d2}<>yz< /\p{extender}\p{ext}/g,utf >AN<>\x{1e944}\x{b7}<>yz< /\p{extendedpictographic}\p{extpict}/g,utf >AN<>\x{26cf}\x{ae}<>yz< /\p{graphemebase}\p{grbase}/g,utf >AN<>\x{10f}\x{60}<>yz< /\p{graphemeextend}\p{grext}/g,utf >AN<>\x{300}\x{b44}<>yz< /\p{hexdigit}\p{hex}/g,utf >AF23<>\x{ff46}\x{ff10}<>yz< /\p{idcontinue}\p{idc}/g,utf >AF23<>\x{146}\x{7a}<>yz< /\p{ideographic}\p{ideo}/g,utf >AF23<>\x{30000}\x{3006}<>yz< /\p{idstart}\p{ids}/g,utf >AF23<>\x{146}\x{7a}<>yz< /\p{idsbinaryoperator}\p{idsb}/g,utf >AF23<>\x{2ff0}\x{2ffb}<>yz<\x{2ff2}\x{2ff1} /\p{idstrinaryoperator}\p{idst}/g,utf >AF23<>\x{2ff2}\x{2ff3}<>yz< /\p{Join Control}\p{joinc}/g,utf >AF23<>\x{200c}\x{200d}<>yz< /\p{logical_order_exception}\p{loe}/g,utf >AF23<>\x{e40}\x{aabc}<>yz< /\p{Lowercase}\p{lower}/g,utf >AF23<>\x{146}\x{7a}<>yz< /\p{math}\p{math}/g,utf >AF23<>\x{2215}\x{2b}<>yz< /\p{Non Character Code Point}\p{nchar}/g,utf >AF23<>\x{10ffff}\x{fdd0}<>yz< /\p{patternsyntax}\p{patsyn}/g,utf >AF23<>\x{21cd}\x{21}<>yz< /\p{patternwhitespace}\p{patws}/g,utf >AF23<>\x{2029}\x{85}<>yz< /\p{prependedconcatenationmark}\p{pcm}/g,utf >AF23<>\x{600}\x{110cd}<>yz< /\p{quotationmark}\p{qmark}/g,utf >AF23<>\x{ff63}\x{22}<>yz< /\p{radical}\p{radical}/g,utf >AF23<>\x{2fd5}\x{2e80}<>yz< /\p{regionalindicator}\p{ri}/g,utf >AF23<>\x{1f1e6}\x{1f1ff}<>yz< /=\p{whitespace}\p{space}\p{wspace}=/g,utf >AF23<=\x{d}\x{1680}\x{3000}=>yz< /\p{sentenceterminal}\p{sterm}/g,utf >AF23<>\x{1da88}\x{2e}<>yz< /\p{terminalpunctuation}\p{term}/g,utf >AF23<>\x{1da88}\x{2e}<>yz< /\p{unified ideograph}\p{uideo}/g,utf >AF23<>\x{30000}\x{3400}<>yz< /\p{UPPERcase}\p{upper}/g,utf >AF23<>\x{146}\x{7a}<>yz< /\p{variationselector}\p{vs}/g,utf >AF23<>\x{180b}\x{e01ef}<>yz< /\p{xidcontinue}\p{xidc}/g,utf >AF23<>\x{146}\x{30}<>yz< # ----------------------------------------------------------------------------- # Variable-length lookbehinds. /(?<=áb?c).../g,utf ábcdèfgácxyz /(?<=PQR|áb?c).../g,utf ábcdèfgácxyzPQR123 /(?<=áb?c|PQR).../g,utf ábcdèfgácxyzPQR123 /(?<=PQ|áb?c).../g,utf ábcdèfgácxyzPQR123 /(?<=áb?c|PQ).../g,utf ábcdèfgácxyzPQR123 /(?<=á(b?c|d?è?è)f)X./g,utf ácfX1zzzáèfX2zzzádèèfX3zzzX4zzz /(?