github的一些开源项目
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

2750 lines
36 KiB

  1. # These tests are generated by maint/GenerateTest26.py, do not edit.
  2. # Unicode Script Extension tests.
  3. # Base script check
  4. /^\p{sc=Latin}/utf
  5. A
  6. /^\p{Script=Latn}/utf
  7. \x{1df2a}
  8. # Script extension check
  9. /^\p{Latin}/utf
  10. \x{363}
  11. /^\p{scx=Latn}/utf
  12. \x{a92e}
  13. # Script extension only character
  14. /^\p{Latin}/utf
  15. \x{363}
  16. /^\p{sc=Latin}/utf
  17. \x{363}
  18. # Character not in script
  19. /^\p{Latin}/utf
  20. \x{1df2b}
  21. # Base script check
  22. /^\p{sc=Greek}/utf
  23. \x{370}
  24. /^\p{Script=Grek}/utf
  25. \x{1d245}
  26. # Script extension check
  27. /^\p{Greek}/utf
  28. \x{342}
  29. /^\p{Script_Extensions=Grek}/utf
  30. \x{1dc1}
  31. # Script extension only character
  32. /^\p{Greek}/utf
  33. \x{342}
  34. /^\p{sc=Greek}/utf
  35. \x{342}
  36. # Character not in script
  37. /^\p{Greek}/utf
  38. \x{1d246}
  39. # Base script check
  40. /^\p{sc=Cyrillic}/utf
  41. \x{400}
  42. /^\p{Script=Cyrl}/utf
  43. \x{1e08f}
  44. # Script extension check
  45. /^\p{Cyrillic}/utf
  46. \x{483}
  47. /^\p{scx=Cyrl}/utf
  48. \x{a66f}
  49. # Script extension only character
  50. /^\p{Cyrillic}/utf
  51. \x{2e43}
  52. /^\p{sc=Cyrillic}/utf
  53. \x{2e43}
  54. # Character not in script
  55. /^\p{Cyrillic}/utf
  56. \x{1e090}
  57. # Base script check
  58. /^\p{sc=Arabic}/utf
  59. \x{600}
  60. /^\p{Script=Arab}/utf
  61. \x{1eef1}
  62. # Script extension check
  63. /^\p{Arabic}/utf
  64. \x{60c}
  65. /^\p{Script_Extensions=Arab}/utf
  66. \x{102fb}
  67. # Script extension only character
  68. /^\p{Arabic}/utf
  69. \x{102e0}
  70. /^\p{sc=Arabic}/utf
  71. \x{102e0}
  72. # Character not in script
  73. /^\p{Arabic}/utf
  74. \x{1eef2}
  75. # Base script check
  76. /^\p{sc=Syriac}/utf
  77. \x{700}
  78. /^\p{Script=Syrc}/utf
  79. \x{86a}
  80. # Script extension check
  81. /^\p{Syriac}/utf
  82. \x{60c}
  83. /^\p{scx=Syrc}/utf
  84. \x{1dfa}
  85. # Script extension only character
  86. /^\p{Syriac}/utf
  87. \x{1dfa}
  88. /^\p{sc=Syriac}/utf
  89. \x{1dfa}
  90. # Character not in script
  91. /^\p{Syriac}/utf
  92. \x{1dfb}
  93. # Base script check
  94. /^\p{sc=Thaana}/utf
  95. \x{780}
  96. /^\p{Script=Thaa}/utf
  97. \x{7b1}
  98. # Script extension check
  99. /^\p{Thaana}/utf
  100. \x{60c}
  101. /^\p{Script_Extensions=Thaa}/utf
  102. \x{fdfd}
  103. # Script extension only character
  104. /^\p{Thaana}/utf
  105. \x{fdf2}
  106. /^\p{sc=Thaana}/utf
  107. \x{fdf2}
  108. # Character not in script
  109. /^\p{Thaana}/utf
  110. \x{fdfe}
  111. # Base script check
  112. /^\p{sc=Devanagari}/utf
  113. \x{900}
  114. /^\p{Script=Deva}/utf
  115. \x{11b09}
  116. # Script extension check
  117. /^\p{Devanagari}/utf
  118. \x{951}
  119. /^\p{scx=Deva}/utf
  120. \x{a8f3}
  121. # Script extension only character
  122. /^\p{Devanagari}/utf
  123. \x{1cd1}
  124. /^\p{sc=Devanagari}/utf
  125. \x{1cd1}
  126. # Character not in script
  127. /^\p{Devanagari}/utf
  128. \x{11b0a}
  129. # Base script check
  130. /^\p{sc=Bengali}/utf
  131. \x{980}
  132. /^\p{Script=Beng}/utf
  133. \x{9fe}
  134. # Script extension check
  135. /^\p{Bengali}/utf
  136. \x{951}
  137. /^\p{Script_Extensions=Beng}/utf
  138. \x{a8f1}
  139. # Script extension only character
  140. /^\p{Bengali}/utf
  141. \x{1cf7}
  142. /^\p{sc=Bengali}/utf
  143. \x{1cf7}
  144. # Character not in script
  145. /^\p{Bengali}/utf
  146. \x{a8f2}
  147. # Base script check
  148. /^\p{sc=Gurmukhi}/utf
  149. \x{a01}
  150. /^\p{Script=Guru}/utf
  151. \x{a76}
  152. # Script extension check
  153. /^\p{Gurmukhi}/utf
  154. \x{951}
  155. /^\p{scx=Guru}/utf
  156. \x{a839}
  157. # Script extension only character
  158. /^\p{Gurmukhi}/utf
  159. \x{a836}
  160. /^\p{sc=Gurmukhi}/utf
  161. \x{a836}
  162. # Character not in script
  163. /^\p{Gurmukhi}/utf
  164. \x{a83a}
  165. # Base script check
  166. /^\p{sc=Gujarati}/utf
  167. \x{a81}
  168. /^\p{Script=Gujr}/utf
  169. \x{aff}
  170. # Script extension check
  171. /^\p{Gujarati}/utf
  172. \x{951}
  173. /^\p{Script_Extensions=Gujr}/utf
  174. \x{a839}
  175. # Script extension only character
  176. /^\p{Gujarati}/utf
  177. \x{a836}
  178. /^\p{sc=Gujarati}/utf
  179. \x{a836}
  180. # Character not in script
  181. /^\p{Gujarati}/utf
  182. \x{a83a}
  183. # Base script check
  184. /^\p{sc=Oriya}/utf
  185. \x{b01}
  186. /^\p{Script=Orya}/utf
  187. \x{b77}
  188. # Script extension check
  189. /^\p{Oriya}/utf
  190. \x{951}
  191. /^\p{scx=Orya}/utf
  192. \x{1cf2}
  193. # Script extension only character
  194. /^\p{Oriya}/utf
  195. \x{1cda}
  196. /^\p{sc=Oriya}/utf
  197. \x{1cda}
  198. # Character not in script
  199. /^\p{Oriya}/utf
  200. \x{1cf3}
  201. # Base script check
  202. /^\p{sc=Tamil}/utf
  203. \x{b82}
  204. /^\p{Script=Taml}/utf
  205. \x{11fff}
  206. # Script extension check
  207. /^\p{Tamil}/utf
  208. \x{951}
  209. /^\p{Script_Extensions=Taml}/utf
  210. \x{11fd3}
  211. # Script extension only character
  212. /^\p{Tamil}/utf
  213. \x{a8f3}
  214. /^\p{sc=Tamil}/utf
  215. \x{a8f3}
  216. # Character not in script
  217. /^\p{Tamil}/utf
  218. \x{12000}
  219. # Base script check
  220. /^\p{sc=Telugu}/utf
  221. \x{c00}
  222. /^\p{Script=Telu}/utf
  223. \x{c7f}
  224. # Script extension check
  225. /^\p{Telugu}/utf
  226. \x{951}
  227. /^\p{scx=Telu}/utf
  228. \x{1cf2}
  229. # Script extension only character
  230. /^\p{Telugu}/utf
  231. \x{1cda}
  232. /^\p{sc=Telugu}/utf
  233. \x{1cda}
  234. # Character not in script
  235. /^\p{Telugu}/utf
  236. \x{1cf3}
  237. # Base script check
  238. /^\p{sc=Kannada}/utf
  239. \x{c80}
  240. /^\p{Script=Knda}/utf
  241. \x{cf3}
  242. # Script extension check
  243. /^\p{Kannada}/utf
  244. \x{951}
  245. /^\p{Script_Extensions=Knda}/utf
  246. \x{a835}
  247. # Script extension only character
  248. /^\p{Kannada}/utf
  249. \x{1cf4}
  250. /^\p{sc=Kannada}/utf
  251. \x{1cf4}
  252. # Character not in script
  253. /^\p{Kannada}/utf
  254. \x{a836}
  255. # Base script check
  256. /^\p{sc=Malayalam}/utf
  257. \x{d00}
  258. /^\p{Script=Mlym}/utf
  259. \x{d7f}
  260. # Script extension check
  261. /^\p{Malayalam}/utf
  262. \x{951}
  263. /^\p{scx=Mlym}/utf
  264. \x{a832}
  265. # Script extension only character
  266. /^\p{Malayalam}/utf
  267. \x{1cda}
  268. /^\p{sc=Malayalam}/utf
  269. \x{1cda}
  270. # Character not in script
  271. /^\p{Malayalam}/utf
  272. \x{a833}
  273. # Base script check
  274. /^\p{sc=Sinhala}/utf
  275. \x{d81}
  276. /^\p{Script=Sinh}/utf
  277. \x{111f4}
  278. # Script extension check
  279. /^\p{Sinhala}/utf
  280. \x{964}
  281. /^\p{Script_Extensions=Sinh}/utf
  282. \x{965}
  283. # Script extension only character
  284. /^\p{Sinhala}/utf
  285. \x{964}
  286. /^\p{sc=Sinhala}/utf
  287. \x{964}
  288. # Character not in script
  289. /^\p{Sinhala}/utf
  290. \x{111f5}
  291. # Base script check
  292. /^\p{sc=Myanmar}/utf
  293. \x{1000}
  294. /^\p{Script=Mymr}/utf
  295. \x{aa7f}
  296. # Script extension check
  297. /^\p{Myanmar}/utf
  298. \x{1040}
  299. /^\p{scx=Mymr}/utf
  300. \x{a92e}
  301. # Script extension only character
  302. /^\p{Myanmar}/utf
  303. \x{a92e}
  304. /^\p{sc=Myanmar}/utf
  305. \x{a92e}
  306. # Character not in script
  307. /^\p{Myanmar}/utf
  308. \x{aa80}
  309. # Base script check
  310. /^\p{sc=Georgian}/utf
  311. \x{10a0}
  312. /^\p{Script=Geor}/utf
  313. \x{2d2d}
  314. # Script extension check
  315. /^\p{Georgian}/utf
  316. \x{10fb}
  317. /^\p{Script_Extensions=Geor}/utf
  318. \x{10fb}
  319. # Script extension only character
  320. /^\p{Georgian}/utf
  321. \x{10fb}
  322. /^\p{sc=Georgian}/utf
  323. \x{10fb}
  324. # Character not in script
  325. /^\p{Georgian}/utf
  326. \x{2d2e}
  327. # Base script check
  328. /^\p{sc=Hangul}/utf
  329. \x{1100}
  330. /^\p{Script=Hang}/utf
  331. \x{ffdc}
  332. # Script extension check
  333. /^\p{Hangul}/utf
  334. \x{3001}
  335. /^\p{scx=Hang}/utf
  336. \x{ff65}
  337. # Script extension only character
  338. /^\p{Hangul}/utf
  339. \x{3003}
  340. /^\p{sc=Hangul}/utf
  341. \x{3003}
  342. # Character not in script
  343. /^\p{Hangul}/utf
  344. \x{ffdd}
  345. # Base script check
  346. /^\p{sc=Mongolian}/utf
  347. \x{1800}
  348. /^\p{Script=Mong}/utf
  349. \x{1166c}
  350. # Script extension check
  351. /^\p{Mongolian}/utf
  352. \x{1802}
  353. /^\p{Script_Extensions=Mong}/utf
  354. \x{202f}
  355. # Script extension only character
  356. /^\p{Mongolian}/utf
  357. \x{202f}
  358. /^\p{sc=Mongolian}/utf
  359. \x{202f}
  360. # Character not in script
  361. /^\p{Mongolian}/utf
  362. \x{1166d}
  363. # Base script check
  364. /^\p{sc=Hiragana}/utf
  365. \x{3041}
  366. /^\p{Script=Hira}/utf
  367. \x{1f200}
  368. # Script extension check
  369. /^\p{Hiragana}/utf
  370. \x{3001}
  371. /^\p{scx=Hira}/utf
  372. \x{ff9f}
  373. # Script extension only character
  374. /^\p{Hiragana}/utf
  375. \x{3031}
  376. /^\p{sc=Hiragana}/utf
  377. \x{3031}
  378. # Character not in script
  379. /^\p{Hiragana}/utf
  380. \x{1f201}
  381. # Base script check
  382. /^\p{sc=Katakana}/utf
  383. \x{30a1}
  384. /^\p{Script=Kana}/utf
  385. \x{1b167}
  386. # Script extension check
  387. /^\p{Katakana}/utf
  388. \x{3001}
  389. /^\p{Script_Extensions=Kana}/utf
  390. \x{ff9f}
  391. # Script extension only character
  392. /^\p{Katakana}/utf
  393. \x{3031}
  394. /^\p{sc=Katakana}/utf
  395. \x{3031}
  396. # Character not in script
  397. /^\p{Katakana}/utf
  398. \x{1b168}
  399. # Base script check
  400. /^\p{sc=Bopomofo}/utf
  401. \x{2ea}
  402. /^\p{Script=Bopo}/utf
  403. \x{31bf}
  404. # Script extension check
  405. /^\p{Bopomofo}/utf
  406. \x{3001}
  407. /^\p{scx=Bopo}/utf
  408. \x{ff65}
  409. # Script extension only character
  410. /^\p{Bopomofo}/utf
  411. \x{302a}
  412. /^\p{sc=Bopomofo}/utf
  413. \x{302a}
  414. # Character not in script
  415. /^\p{Bopomofo}/utf
  416. \x{ff66}
  417. # Base script check
  418. /^\p{sc=Han}/utf
  419. \x{2e80}
  420. /^\p{Script=Hani}/utf
  421. \x{323af}
  422. # Script extension check
  423. /^\p{Han}/utf
  424. \x{3001}
  425. /^\p{Script_Extensions=Hani}/utf
  426. \x{1f251}
  427. # Script extension only character
  428. /^\p{Han}/utf
  429. \x{3006}
  430. /^\p{sc=Han}/utf
  431. \x{3006}
  432. # Character not in script
  433. /^\p{Han}/utf
  434. \x{323b0}
  435. # Base script check
  436. /^\p{sc=Yi}/utf
  437. \x{a000}
  438. /^\p{Script=Yiii}/utf
  439. \x{a4c6}
  440. # Script extension check
  441. /^\p{Yi}/utf
  442. \x{3001}
  443. /^\p{scx=Yiii}/utf
  444. \x{ff65}
  445. # Script extension only character
  446. /^\p{Yi}/utf
  447. \x{3001}
  448. /^\p{sc=Yi}/utf
  449. \x{3001}
  450. # Character not in script
  451. /^\p{Yi}/utf
  452. \x{ff66}
  453. # Base script check
  454. /^\p{sc=Tagalog}/utf
  455. \x{1700}
  456. /^\p{Script=Tglg}/utf
  457. \x{171f}
  458. # Script extension check
  459. /^\p{Tagalog}/utf
  460. \x{1735}
  461. /^\p{Script_Extensions=Tglg}/utf
  462. \x{1736}
  463. # Script extension only character
  464. /^\p{Tagalog}/utf
  465. \x{1735}
  466. /^\p{sc=Tagalog}/utf
  467. \x{1735}
  468. # Character not in script
  469. /^\p{Tagalog}/utf
  470. \x{1737}
  471. # Base script check
  472. /^\p{sc=Hanunoo}/utf
  473. \x{1720}
  474. /^\p{Script=Hano}/utf
  475. \x{1734}
  476. # Script extension check
  477. /^\p{Hanunoo}/utf
  478. \x{1735}
  479. /^\p{scx=Hano}/utf
  480. \x{1736}
  481. # Script extension only character
  482. /^\p{Hanunoo}/utf
  483. \x{1735}
  484. /^\p{sc=Hanunoo}/utf
  485. \x{1735}
  486. # Character not in script
  487. /^\p{Hanunoo}/utf
  488. \x{1737}
  489. # Base script check
  490. /^\p{sc=Buhid}/utf
  491. \x{1740}
  492. /^\p{Script=Buhd}/utf
  493. \x{1753}
  494. # Script extension check
  495. /^\p{Buhid}/utf
  496. \x{1735}
  497. /^\p{Script_Extensions=Buhd}/utf
  498. \x{1736}
  499. # Script extension only character
  500. /^\p{Buhid}/utf
  501. \x{1735}
  502. /^\p{sc=Buhid}/utf
  503. \x{1735}
  504. # Character not in script
  505. /^\p{Buhid}/utf
  506. \x{1754}
  507. # Base script check
  508. /^\p{sc=Tagbanwa}/utf
  509. \x{1760}
  510. /^\p{Script=Tagb}/utf
  511. \x{1773}
  512. # Script extension check
  513. /^\p{Tagbanwa}/utf
  514. \x{1735}
  515. /^\p{scx=Tagb}/utf
  516. \x{1736}
  517. # Script extension only character
  518. /^\p{Tagbanwa}/utf
  519. \x{1735}
  520. /^\p{sc=Tagbanwa}/utf
  521. \x{1735}
  522. # Character not in script
  523. /^\p{Tagbanwa}/utf
  524. \x{1774}
  525. # Base script check
  526. /^\p{sc=Limbu}/utf
  527. \x{1900}
  528. /^\p{Script=Limb}/utf
  529. \x{194f}
  530. # Script extension check
  531. /^\p{Limbu}/utf
  532. \x{965}
  533. /^\p{Script_Extensions=Limb}/utf
  534. \x{965}
  535. # Script extension only character
  536. /^\p{Limbu}/utf
  537. \x{965}
  538. /^\p{sc=Limbu}/utf
  539. \x{965}
  540. # Character not in script
  541. /^\p{Limbu}/utf
  542. \x{1950}
  543. # Base script check
  544. /^\p{sc=Tai_Le}/utf
  545. \x{1950}
  546. /^\p{Script=Tale}/utf
  547. \x{1974}
  548. # Script extension check
  549. /^\p{Tai_Le}/utf
  550. \x{1040}
  551. /^\p{scx=Tale}/utf
  552. \x{1049}
  553. # Script extension only character
  554. /^\p{Tai_Le}/utf
  555. \x{1040}
  556. /^\p{sc=Tai_Le}/utf
  557. \x{1040}
  558. # Character not in script
  559. /^\p{Tai_Le}/utf
  560. \x{1975}
  561. # Base script check
  562. /^\p{sc=Linear_B}/utf
  563. \x{10000}
  564. /^\p{Script=Linb}/utf
  565. \x{100fa}
  566. # Script extension check
  567. /^\p{Linear_B}/utf
  568. \x{10100}
  569. /^\p{Script_Extensions=Linb}/utf
  570. \x{1013f}
  571. # Script extension only character
  572. /^\p{Linear_B}/utf
  573. \x{10102}
  574. /^\p{sc=Linear_B}/utf
  575. \x{10102}
  576. # Character not in script
  577. /^\p{Linear_B}/utf
  578. \x{10140}
  579. # Base script check
  580. /^\p{sc=Cypriot}/utf
  581. \x{10800}
  582. /^\p{Script=Cprt}/utf
  583. \x{1083f}
  584. # Script extension check
  585. /^\p{Cypriot}/utf
  586. \x{10100}
  587. /^\p{scx=Cprt}/utf
  588. \x{1013f}
  589. # Script extension only character
  590. /^\p{Cypriot}/utf
  591. \x{10102}
  592. /^\p{sc=Cypriot}/utf
  593. \x{10102}
  594. # Character not in script
  595. /^\p{Cypriot}/utf
  596. \x{10840}
  597. # Base script check
  598. /^\p{sc=Buginese}/utf
  599. \x{1a00}
  600. /^\p{Script=Bugi}/utf
  601. \x{1a1f}
  602. # Script extension check
  603. /^\p{Buginese}/utf
  604. \x{a9cf}
  605. /^\p{Script_Extensions=Bugi}/utf
  606. \x{a9cf}
  607. # Script extension only character
  608. /^\p{Buginese}/utf
  609. \x{a9cf}
  610. /^\p{sc=Buginese}/utf
  611. \x{a9cf}
  612. # Character not in script
  613. /^\p{Buginese}/utf
  614. \x{a9d0}
  615. # Base script check
  616. /^\p{sc=Coptic}/utf
  617. \x{3e2}
  618. /^\p{Script=Copt}/utf
  619. \x{2cff}
  620. # Script extension check
  621. /^\p{Coptic}/utf
  622. \x{102e0}
  623. /^\p{scx=Copt}/utf
  624. \x{102fb}
  625. # Script extension only character
  626. /^\p{Coptic}/utf
  627. \x{102e0}
  628. /^\p{sc=Coptic}/utf
  629. \x{102e0}
  630. # Character not in script
  631. /^\p{Coptic}/utf
  632. \x{102fc}
  633. # Base script check
  634. /^\p{sc=Glagolitic}/utf
  635. \x{2c00}
  636. /^\p{Script=Glag}/utf
  637. \x{1e02a}
  638. # Script extension check
  639. /^\p{Glagolitic}/utf
  640. \x{484}
  641. /^\p{Script_Extensions=Glag}/utf
  642. \x{a66f}
  643. # Script extension only character
  644. /^\p{Glagolitic}/utf
  645. \x{484}
  646. /^\p{sc=Glagolitic}/utf
  647. \x{484}
  648. # Character not in script
  649. /^\p{Glagolitic}/utf
  650. \x{1e02b}
  651. # Base script check
  652. /^\p{sc=Syloti_Nagri}/utf
  653. \x{a800}
  654. /^\p{Script=Sylo}/utf
  655. \x{a82c}
  656. # Script extension check
  657. /^\p{Syloti_Nagri}/utf
  658. \x{964}
  659. /^\p{scx=Sylo}/utf
  660. \x{9ef}
  661. # Script extension only character
  662. /^\p{Syloti_Nagri}/utf
  663. \x{9e6}
  664. /^\p{sc=Syloti_Nagri}/utf
  665. \x{9e6}
  666. # Character not in script
  667. /^\p{Syloti_Nagri}/utf
  668. \x{a82d}
  669. # Base script check
  670. /^\p{sc=Phags_Pa}/utf
  671. \x{a840}
  672. /^\p{Script=Phag}/utf
  673. \x{a877}
  674. # Script extension check
  675. /^\p{Phags_Pa}/utf
  676. \x{1802}
  677. /^\p{Script_Extensions=Phag}/utf
  678. \x{1805}
  679. # Script extension only character
  680. /^\p{Phags_Pa}/utf
  681. \x{1802}
  682. /^\p{sc=Phags_Pa}/utf
  683. \x{1802}
  684. # Character not in script
  685. /^\p{Phags_Pa}/utf
  686. \x{a878}
  687. # Base script check
  688. /^\p{sc=Nko}/utf
  689. \x{7c0}
  690. /^\p{Script=Nkoo}/utf
  691. \x{7ff}
  692. # Script extension check
  693. /^\p{Nko}/utf
  694. \x{60c}
  695. /^\p{scx=Nkoo}/utf
  696. \x{fd3f}
  697. # Script extension only character
  698. /^\p{Nko}/utf
  699. \x{fd3e}
  700. /^\p{sc=Nko}/utf
  701. \x{fd3e}
  702. # Character not in script
  703. /^\p{Nko}/utf
  704. \x{fd40}
  705. # Base script check
  706. /^\p{sc=Kayah_Li}/utf
  707. \x{a900}
  708. /^\p{Script=Kali}/utf
  709. \x{a92f}
  710. # Script extension check
  711. /^\p{Kayah_Li}/utf
  712. \x{a92e}
  713. /^\p{Script_Extensions=Kali}/utf
  714. \x{a92e}
  715. # Script extension only character
  716. /^\p{Kayah_Li}/utf
  717. \x{a92e}
  718. /^\p{sc=Kayah_Li}/utf
  719. \x{a92e}
  720. # Character not in script
  721. /^\p{Kayah_Li}/utf
  722. \x{a930}
  723. # Base script check
  724. /^\p{sc=Javanese}/utf
  725. \x{a980}
  726. /^\p{Script=Java}/utf
  727. \x{a9df}
  728. # Script extension check
  729. /^\p{Javanese}/utf
  730. \x{a9cf}
  731. /^\p{scx=Java}/utf
  732. \x{a9cf}
  733. # Script extension only character
  734. /^\p{Javanese}/utf
  735. \x{a9cf}
  736. /^\p{sc=Javanese}/utf
  737. \x{a9cf}
  738. # Character not in script
  739. /^\p{Javanese}/utf
  740. \x{a9e0}
  741. # Base script check
  742. /^\p{sc=Kaithi}/utf
  743. \x{11080}
  744. /^\p{Script=Kthi}/utf
  745. \x{110cd}
  746. # Script extension check
  747. /^\p{Kaithi}/utf
  748. \x{966}
  749. /^\p{Script_Extensions=Kthi}/utf
  750. \x{a839}
  751. # Script extension only character
  752. /^\p{Kaithi}/utf
  753. \x{966}
  754. /^\p{sc=Kaithi}/utf
  755. \x{966}
  756. # Character not in script
  757. /^\p{Kaithi}/utf
  758. \x{110ce}
  759. # Base script check
  760. /^\p{sc=Mandaic}/utf
  761. \x{840}
  762. /^\p{Script=Mand}/utf
  763. \x{85e}
  764. # Script extension check
  765. /^\p{Mandaic}/utf
  766. \x{640}
  767. /^\p{scx=Mand}/utf
  768. \x{640}
  769. # Script extension only character
  770. /^\p{Mandaic}/utf
  771. \x{640}
  772. /^\p{sc=Mandaic}/utf
  773. \x{640}
  774. # Character not in script
  775. /^\p{Mandaic}/utf
  776. \x{85f}
  777. # Base script check
  778. /^\p{sc=Chakma}/utf
  779. \x{11100}
  780. /^\p{Script=Cakm}/utf
  781. \x{11147}
  782. # Script extension check
  783. /^\p{Chakma}/utf
  784. \x{9e6}
  785. /^\p{Script_Extensions=Cakm}/utf
  786. \x{1049}
  787. # Script extension only character
  788. /^\p{Chakma}/utf
  789. \x{9e6}
  790. /^\p{sc=Chakma}/utf
  791. \x{9e6}
  792. # Character not in script
  793. /^\p{Chakma}/utf
  794. \x{11148}
  795. # Base script check
  796. /^\p{sc=Sharada}/utf
  797. \x{11180}
  798. /^\p{Script=Shrd}/utf
  799. \x{111df}
  800. # Script extension check
  801. /^\p{Sharada}/utf
  802. \x{951}
  803. /^\p{scx=Shrd}/utf
  804. \x{1ce0}
  805. # Script extension only character
  806. /^\p{Sharada}/utf
  807. \x{1cd7}
  808. /^\p{sc=Sharada}/utf
  809. \x{1cd7}
  810. # Character not in script
  811. /^\p{Sharada}/utf
  812. \x{111e0}
  813. # Base script check
  814. /^\p{sc=Takri}/utf
  815. \x{11680}
  816. /^\p{Script=Takr}/utf
  817. \x{116c9}
  818. # Script extension check
  819. /^\p{Takri}/utf
  820. \x{964}
  821. /^\p{Script_Extensions=Takr}/utf
  822. \x{a839}
  823. # Script extension only character
  824. /^\p{Takri}/utf
  825. \x{a836}
  826. /^\p{sc=Takri}/utf
  827. \x{a836}
  828. # Character not in script
  829. /^\p{Takri}/utf
  830. \x{116ca}
  831. # Base script check
  832. /^\p{sc=Duployan}/utf
  833. \x{1bc00}
  834. /^\p{Script=Dupl}/utf
  835. \x{1bc9f}
  836. # Script extension check
  837. /^\p{Duployan}/utf
  838. \x{1bca0}
  839. /^\p{scx=Dupl}/utf
  840. \x{1bca3}
  841. # Script extension only character
  842. /^\p{Duployan}/utf
  843. \x{1bca0}
  844. /^\p{sc=Duployan}/utf
  845. \x{1bca0}
  846. # Character not in script
  847. /^\p{Duployan}/utf
  848. \x{1bca4}
  849. # Base script check
  850. /^\p{sc=Grantha}/utf
  851. \x{11300}
  852. /^\p{Script=Gran}/utf
  853. \x{11374}
  854. # Script extension check
  855. /^\p{Grantha}/utf
  856. \x{951}
  857. /^\p{Script_Extensions=Gran}/utf
  858. \x{11fd3}
  859. # Script extension only character
  860. /^\p{Grantha}/utf
  861. \x{1cd3}
  862. /^\p{sc=Grantha}/utf
  863. \x{1cd3}
  864. # Character not in script
  865. /^\p{Grantha}/utf
  866. \x{11fd4}
  867. # Base script check
  868. /^\p{sc=Khojki}/utf
  869. \x{11200}
  870. /^\p{Script=Khoj}/utf
  871. \x{11241}
  872. # Script extension check
  873. /^\p{Khojki}/utf
  874. \x{ae6}
  875. /^\p{scx=Khoj}/utf
  876. \x{a839}
  877. # Script extension only character
  878. /^\p{Khojki}/utf
  879. \x{ae6}
  880. /^\p{sc=Khojki}/utf
  881. \x{ae6}
  882. # Character not in script
  883. /^\p{Khojki}/utf
  884. \x{11242}
  885. # Base script check
  886. /^\p{sc=Linear_A}/utf
  887. \x{10600}
  888. /^\p{Script=Lina}/utf
  889. \x{10767}
  890. # Script extension check
  891. /^\p{Linear_A}/utf
  892. \x{10107}
  893. /^\p{Script_Extensions=Lina}/utf
  894. \x{10133}
  895. # Script extension only character
  896. /^\p{Linear_A}/utf
  897. \x{10107}
  898. /^\p{sc=Linear_A}/utf
  899. \x{10107}
  900. # Character not in script
  901. /^\p{Linear_A}/utf
  902. \x{10768}
  903. # Base script check
  904. /^\p{sc=Mahajani}/utf
  905. \x{11150}
  906. /^\p{Script=Mahj}/utf
  907. \x{11176}
  908. # Script extension check
  909. /^\p{Mahajani}/utf
  910. \x{964}
  911. /^\p{scx=Mahj}/utf
  912. \x{a839}
  913. # Script extension only character
  914. /^\p{Mahajani}/utf
  915. \x{966}
  916. /^\p{sc=Mahajani}/utf
  917. \x{966}
  918. # Character not in script
  919. /^\p{Mahajani}/utf
  920. \x{11177}
  921. # Base script check
  922. /^\p{sc=Manichaean}/utf
  923. \x{10ac0}
  924. /^\p{Script=Mani}/utf
  925. \x{10af6}
  926. # Script extension check
  927. /^\p{Manichaean}/utf
  928. \x{640}
  929. /^\p{Script_Extensions=Mani}/utf
  930. \x{10af2}
  931. # Script extension only character
  932. /^\p{Manichaean}/utf
  933. \x{640}
  934. /^\p{sc=Manichaean}/utf
  935. \x{640}
  936. # Character not in script
  937. /^\p{Manichaean}/utf
  938. \x{10af7}
  939. # Base script check
  940. /^\p{sc=Modi}/utf
  941. \x{11600}
  942. /^\p{Script=Modi}/utf
  943. \x{11659}
  944. # Script extension check
  945. /^\p{Modi}/utf
  946. \x{a830}
  947. /^\p{scx=Modi}/utf
  948. \x{a839}
  949. # Script extension only character
  950. /^\p{Modi}/utf
  951. \x{a836}
  952. /^\p{sc=Modi}/utf
  953. \x{a836}
  954. # Character not in script
  955. /^\p{Modi}/utf
  956. \x{1165a}
  957. # Base script check
  958. /^\p{sc=Old_Permic}/utf
  959. \x{10350}
  960. /^\p{Script=Perm}/utf
  961. \x{1037a}
  962. # Script extension check
  963. /^\p{Old_Permic}/utf
  964. \x{483}
  965. /^\p{Script_Extensions=Perm}/utf
  966. \x{483}
  967. # Script extension only character
  968. /^\p{Old_Permic}/utf
  969. \x{483}
  970. /^\p{sc=Old_Permic}/utf
  971. \x{483}
  972. # Character not in script
  973. /^\p{Old_Permic}/utf
  974. \x{1037b}
  975. # Base script check
  976. /^\p{sc=Psalter_Pahlavi}/utf
  977. \x{10b80}
  978. /^\p{Script=Phlp}/utf
  979. \x{10baf}
  980. # Script extension check
  981. /^\p{Psalter_Pahlavi}/utf
  982. \x{640}
  983. /^\p{scx=Phlp}/utf
  984. \x{640}
  985. # Script extension only character
  986. /^\p{Psalter_Pahlavi}/utf
  987. \x{640}
  988. /^\p{sc=Psalter_Pahlavi}/utf
  989. \x{640}
  990. # Character not in script
  991. /^\p{Psalter_Pahlavi}/utf
  992. \x{10bb0}
  993. # Base script check
  994. /^\p{sc=Khudawadi}/utf
  995. \x{112b0}
  996. /^\p{Script=Sind}/utf
  997. \x{112f9}
  998. # Script extension check
  999. /^\p{Khudawadi}/utf
  1000. \x{964}
  1001. /^\p{Script_Extensions=Sind}/utf
  1002. \x{a839}
  1003. # Script extension only character
  1004. /^\p{Khudawadi}/utf
  1005. \x{a836}
  1006. /^\p{sc=Khudawadi}/utf
  1007. \x{a836}
  1008. # Character not in script
  1009. /^\p{Khudawadi}/utf
  1010. \x{112fa}
  1011. # Base script check
  1012. /^\p{sc=Tirhuta}/utf
  1013. \x{11480}
  1014. /^\p{Script=Tirh}/utf
  1015. \x{114d9}
  1016. # Script extension check
  1017. /^\p{Tirhuta}/utf
  1018. \x{951}
  1019. /^\p{scx=Tirh}/utf
  1020. \x{a839}
  1021. # Script extension only character
  1022. /^\p{Tirhuta}/utf
  1023. \x{1cf2}
  1024. /^\p{sc=Tirhuta}/utf
  1025. \x{1cf2}
  1026. # Character not in script
  1027. /^\p{Tirhuta}/utf
  1028. \x{114da}
  1029. # Base script check
  1030. /^\p{sc=Multani}/utf
  1031. \x{11280}
  1032. /^\p{Script=Mult}/utf
  1033. \x{112a9}
  1034. # Script extension check
  1035. /^\p{Multani}/utf
  1036. \x{a66}
  1037. /^\p{Script_Extensions=Mult}/utf
  1038. \x{a6f}
  1039. # Script extension only character
  1040. /^\p{Multani}/utf
  1041. \x{a66}
  1042. /^\p{sc=Multani}/utf
  1043. \x{a66}
  1044. # Character not in script
  1045. /^\p{Multani}/utf
  1046. \x{112aa}
  1047. # Base script check
  1048. /^\p{sc=Adlam}/utf
  1049. \x{1e900}
  1050. /^\p{Script=Adlm}/utf
  1051. \x{1e95f}
  1052. # Script extension check
  1053. /^\p{Adlam}/utf
  1054. \x{61f}
  1055. /^\p{scx=Adlm}/utf
  1056. \x{640}
  1057. # Script extension only character
  1058. /^\p{Adlam}/utf
  1059. \x{61f}
  1060. /^\p{sc=Adlam}/utf
  1061. \x{61f}
  1062. # Character not in script
  1063. /^\p{Adlam}/utf
  1064. \x{1e960}
  1065. # Base script check
  1066. /^\p{sc=Masaram_Gondi}/utf
  1067. \x{11d00}
  1068. /^\p{Script=Gonm}/utf
  1069. \x{11d59}
  1070. # Script extension check
  1071. /^\p{Masaram_Gondi}/utf
  1072. \x{964}
  1073. /^\p{Script_Extensions=Gonm}/utf
  1074. \x{965}
  1075. # Script extension only character
  1076. /^\p{Masaram_Gondi}/utf
  1077. \x{964}
  1078. /^\p{sc=Masaram_Gondi}/utf
  1079. \x{964}
  1080. # Character not in script
  1081. /^\p{Masaram_Gondi}/utf
  1082. \x{11d5a}
  1083. # Base script check
  1084. /^\p{sc=Dogra}/utf
  1085. \x{11800}
  1086. /^\p{Script=Dogr}/utf
  1087. \x{1183b}
  1088. # Script extension check
  1089. /^\p{Dogra}/utf
  1090. \x{964}
  1091. /^\p{scx=Dogr}/utf
  1092. \x{a839}
  1093. # Script extension only character
  1094. /^\p{Dogra}/utf
  1095. \x{966}
  1096. /^\p{sc=Dogra}/utf
  1097. \x{966}
  1098. # Character not in script
  1099. /^\p{Dogra}/utf
  1100. \x{1183c}
  1101. # Base script check
  1102. /^\p{sc=Gunjala_Gondi}/utf
  1103. \x{11d60}
  1104. /^\p{Script=Gong}/utf
  1105. \x{11da9}
  1106. # Script extension check
  1107. /^\p{Gunjala_Gondi}/utf
  1108. \x{964}
  1109. /^\p{Script_Extensions=Gong}/utf
  1110. \x{965}
  1111. # Script extension only character
  1112. /^\p{Gunjala_Gondi}/utf
  1113. \x{964}
  1114. /^\p{sc=Gunjala_Gondi}/utf
  1115. \x{964}
  1116. # Character not in script
  1117. /^\p{Gunjala_Gondi}/utf
  1118. \x{11daa}
  1119. # Base script check
  1120. /^\p{sc=Hanifi_Rohingya}/utf
  1121. \x{10d00}
  1122. /^\p{Script=Rohg}/utf
  1123. \x{10d39}
  1124. # Script extension check
  1125. /^\p{Hanifi_Rohingya}/utf
  1126. \x{60c}
  1127. /^\p{scx=Rohg}/utf
  1128. \x{6d4}
  1129. # Script extension only character
  1130. /^\p{Hanifi_Rohingya}/utf
  1131. \x{6d4}
  1132. /^\p{sc=Hanifi_Rohingya}/utf
  1133. \x{6d4}
  1134. # Character not in script
  1135. /^\p{Hanifi_Rohingya}/utf
  1136. \x{10d3a}
  1137. # Base script check
  1138. /^\p{sc=Sogdian}/utf
  1139. \x{10f30}
  1140. /^\p{Script=Sogd}/utf
  1141. \x{10f59}
  1142. # Script extension check
  1143. /^\p{Sogdian}/utf
  1144. \x{640}
  1145. /^\p{Script_Extensions=Sogd}/utf
  1146. \x{640}
  1147. # Script extension only character
  1148. /^\p{Sogdian}/utf
  1149. \x{640}
  1150. /^\p{sc=Sogdian}/utf
  1151. \x{640}
  1152. # Character not in script
  1153. /^\p{Sogdian}/utf
  1154. \x{10f5a}
  1155. # Base script check
  1156. /^\p{sc=Nandinagari}/utf
  1157. \x{119a0}
  1158. /^\p{Script=Nand}/utf
  1159. \x{119e4}
  1160. # Script extension check
  1161. /^\p{Nandinagari}/utf
  1162. \x{964}
  1163. /^\p{scx=Nand}/utf
  1164. \x{a835}
  1165. # Script extension only character
  1166. /^\p{Nandinagari}/utf
  1167. \x{1cfa}
  1168. /^\p{sc=Nandinagari}/utf
  1169. \x{1cfa}
  1170. # Character not in script
  1171. /^\p{Nandinagari}/utf
  1172. \x{119e5}
  1173. # Base script check
  1174. /^\p{sc=Yezidi}/utf
  1175. \x{10e80}
  1176. /^\p{Script=Yezi}/utf
  1177. \x{10eb1}
  1178. # Script extension check
  1179. /^\p{Yezidi}/utf
  1180. \x{60c}
  1181. /^\p{Script_Extensions=Yezi}/utf
  1182. \x{669}
  1183. # Script extension only character
  1184. /^\p{Yezidi}/utf
  1185. \x{660}
  1186. /^\p{sc=Yezidi}/utf
  1187. \x{660}
  1188. # Character not in script
  1189. /^\p{Yezidi}/utf
  1190. \x{10eb2}
  1191. # Base script check
  1192. /^\p{sc=Cypro_Minoan}/utf
  1193. \x{12f90}
  1194. /^\p{Script=Cpmn}/utf
  1195. \x{12ff2}
  1196. # Script extension check
  1197. /^\p{Cypro_Minoan}/utf
  1198. \x{10100}
  1199. /^\p{scx=Cpmn}/utf
  1200. \x{10101}
  1201. # Script extension only character
  1202. /^\p{Cypro_Minoan}/utf
  1203. \x{10100}
  1204. /^\p{sc=Cypro_Minoan}/utf
  1205. \x{10100}
  1206. # Character not in script
  1207. /^\p{Cypro_Minoan}/utf
  1208. \x{12ff3}
  1209. # Base script check
  1210. /^\p{sc=Old_Uyghur}/utf
  1211. \x{10f70}
  1212. /^\p{Script=Ougr}/utf
  1213. \x{10f89}
  1214. # Script extension check
  1215. /^\p{Old_Uyghur}/utf
  1216. \x{640}
  1217. /^\p{Script_Extensions=Ougr}/utf
  1218. \x{10af2}
  1219. # Script extension only character
  1220. /^\p{Old_Uyghur}/utf
  1221. \x{10af2}
  1222. /^\p{sc=Old_Uyghur}/utf
  1223. \x{10af2}
  1224. # Character not in script
  1225. /^\p{Old_Uyghur}/utf
  1226. \x{10f8a}
  1227. # Base script check
  1228. /^\p{sc=Common}/utf
  1229. \x{00}
  1230. /^\p{Script=Zyyy}/utf
  1231. \x{e007f}
  1232. # Character not in script
  1233. /^\p{Common}/utf
  1234. \x{e0080}
  1235. # Base script check
  1236. /^\p{sc=Armenian}/utf
  1237. \x{531}
  1238. /^\p{Script=Armn}/utf
  1239. \x{fb17}
  1240. # Character not in script
  1241. /^\p{Armenian}/utf
  1242. \x{fb18}
  1243. # Base script check
  1244. /^\p{sc=Hebrew}/utf
  1245. \x{591}
  1246. /^\p{Script=Hebr}/utf
  1247. \x{fb4f}
  1248. # Character not in script
  1249. /^\p{Hebrew}/utf
  1250. \x{fb50}
  1251. # Base script check
  1252. /^\p{sc=Thai}/utf
  1253. \x{e01}
  1254. /^\p{Script=Thai}/utf
  1255. \x{e5b}
  1256. # Character not in script
  1257. /^\p{Thai}/utf
  1258. \x{e5c}
  1259. # Base script check
  1260. /^\p{sc=Lao}/utf
  1261. \x{e81}
  1262. /^\p{Script=Laoo}/utf
  1263. \x{edf}
  1264. # Character not in script
  1265. /^\p{Lao}/utf
  1266. \x{ee0}
  1267. # Base script check
  1268. /^\p{sc=Tibetan}/utf
  1269. \x{f00}
  1270. /^\p{Script=Tibt}/utf
  1271. \x{fda}
  1272. # Character not in script
  1273. /^\p{Tibetan}/utf
  1274. \x{fdb}
  1275. # Base script check
  1276. /^\p{sc=Ethiopic}/utf
  1277. \x{1200}
  1278. /^\p{Script=Ethi}/utf
  1279. \x{1e7fe}
  1280. # Character not in script
  1281. /^\p{Ethiopic}/utf
  1282. \x{1e7ff}
  1283. # Base script check
  1284. /^\p{sc=Cherokee}/utf
  1285. \x{13a0}
  1286. /^\p{Script=Cher}/utf
  1287. \x{abbf}
  1288. # Character not in script
  1289. /^\p{Cherokee}/utf
  1290. \x{abc0}
  1291. # Base script check
  1292. /^\p{sc=Canadian_Aboriginal}/utf
  1293. \x{1400}
  1294. /^\p{Script=Cans}/utf
  1295. \x{11abf}
  1296. # Character not in script
  1297. /^\p{Canadian_Aboriginal}/utf
  1298. \x{11ac0}
  1299. # Base script check
  1300. /^\p{sc=Ogham}/utf
  1301. \x{1680}
  1302. /^\p{Script=Ogam}/utf
  1303. \x{169c}
  1304. # Character not in script
  1305. /^\p{Ogham}/utf
  1306. \x{169d}
  1307. # Base script check
  1308. /^\p{sc=Runic}/utf
  1309. \x{16a0}
  1310. /^\p{Script=Runr}/utf
  1311. \x{16f8}
  1312. # Character not in script
  1313. /^\p{Runic}/utf
  1314. \x{16f9}
  1315. # Base script check
  1316. /^\p{sc=Khmer}/utf
  1317. \x{1780}
  1318. /^\p{Script=Khmr}/utf
  1319. \x{19ff}
  1320. # Character not in script
  1321. /^\p{Khmer}/utf
  1322. \x{1a00}
  1323. # Base script check
  1324. /^\p{sc=Old_Italic}/utf
  1325. \x{10300}
  1326. /^\p{Script=Ital}/utf
  1327. \x{1032f}
  1328. # Character not in script
  1329. /^\p{Old_Italic}/utf
  1330. \x{10330}
  1331. # Base script check
  1332. /^\p{sc=Gothic}/utf
  1333. \x{10330}
  1334. /^\p{Script=Goth}/utf
  1335. \x{1034a}
  1336. # Character not in script
  1337. /^\p{Gothic}/utf
  1338. \x{1034b}
  1339. # Base script check
  1340. /^\p{sc=Deseret}/utf
  1341. \x{10400}
  1342. /^\p{Script=Dsrt}/utf
  1343. \x{1044f}
  1344. # Character not in script
  1345. /^\p{Deseret}/utf
  1346. \x{10450}
  1347. # Base script check
  1348. /^\p{sc=Inherited}/utf
  1349. \x{300}
  1350. /^\p{Script=Zinh}/utf
  1351. \x{e01ef}
  1352. # Character not in script
  1353. /^\p{Inherited}/utf
  1354. \x{e01f0}
  1355. # Base script check
  1356. /^\p{sc=Ugaritic}/utf
  1357. \x{10380}
  1358. /^\p{Script=Ugar}/utf
  1359. \x{1039f}
  1360. # Character not in script
  1361. /^\p{Ugaritic}/utf
  1362. \x{103a0}
  1363. # Base script check
  1364. /^\p{sc=Shavian}/utf
  1365. \x{10450}
  1366. /^\p{Script=Shaw}/utf
  1367. \x{1047f}
  1368. # Character not in script
  1369. /^\p{Shavian}/utf
  1370. \x{10480}
  1371. # Base script check
  1372. /^\p{sc=Osmanya}/utf
  1373. \x{10480}
  1374. /^\p{Script=Osma}/utf
  1375. \x{104a9}
  1376. # Character not in script
  1377. /^\p{Osmanya}/utf
  1378. \x{104aa}
  1379. # Base script check
  1380. /^\p{sc=Braille}/utf
  1381. \x{2800}
  1382. /^\p{Script=Brai}/utf
  1383. \x{28ff}
  1384. # Character not in script
  1385. /^\p{Braille}/utf
  1386. \x{2900}
  1387. # Base script check
  1388. /^\p{sc=New_Tai_Lue}/utf
  1389. \x{1980}
  1390. /^\p{Script=Talu}/utf
  1391. \x{19df}
  1392. # Character not in script
  1393. /^\p{New_Tai_Lue}/utf
  1394. \x{19e0}
  1395. # Base script check
  1396. /^\p{sc=Tifinagh}/utf
  1397. \x{2d30}
  1398. /^\p{Script=Tfng}/utf
  1399. \x{2d7f}
  1400. # Character not in script
  1401. /^\p{Tifinagh}/utf
  1402. \x{2d80}
  1403. # Base script check
  1404. /^\p{sc=Old_Persian}/utf
  1405. \x{103a0}
  1406. /^\p{Script=Xpeo}/utf
  1407. \x{103d5}
  1408. # Character not in script
  1409. /^\p{Old_Persian}/utf
  1410. \x{103d6}
  1411. # Base script check
  1412. /^\p{sc=Kharoshthi}/utf
  1413. \x{10a00}
  1414. /^\p{Script=Khar}/utf
  1415. \x{10a58}
  1416. # Character not in script
  1417. /^\p{Kharoshthi}/utf
  1418. \x{10a59}
  1419. # Base script check
  1420. /^\p{sc=Balinese}/utf
  1421. \x{1b00}
  1422. /^\p{Script=Bali}/utf
  1423. \x{1b7e}
  1424. # Character not in script
  1425. /^\p{Balinese}/utf
  1426. \x{1b7f}
  1427. # Base script check
  1428. /^\p{sc=Cuneiform}/utf
  1429. \x{12000}
  1430. /^\p{Script=Xsux}/utf
  1431. \x{12543}
  1432. # Character not in script
  1433. /^\p{Cuneiform}/utf
  1434. \x{12544}
  1435. # Base script check
  1436. /^\p{sc=Phoenician}/utf
  1437. \x{10900}
  1438. /^\p{Script=Phnx}/utf
  1439. \x{1091f}
  1440. # Character not in script
  1441. /^\p{Phoenician}/utf
  1442. \x{10920}
  1443. # Base script check
  1444. /^\p{sc=Sundanese}/utf
  1445. \x{1b80}
  1446. /^\p{Script=Sund}/utf
  1447. \x{1cc7}
  1448. # Character not in script
  1449. /^\p{Sundanese}/utf
  1450. \x{1cc8}
  1451. # Base script check
  1452. /^\p{sc=Lepcha}/utf
  1453. \x{1c00}
  1454. /^\p{Script=Lepc}/utf
  1455. \x{1c4f}
  1456. # Character not in script
  1457. /^\p{Lepcha}/utf
  1458. \x{1c50}
  1459. # Base script check
  1460. /^\p{sc=Ol_Chiki}/utf
  1461. \x{1c50}
  1462. /^\p{Script=Olck}/utf
  1463. \x{1c7f}
  1464. # Character not in script
  1465. /^\p{Ol_Chiki}/utf
  1466. \x{1c80}
  1467. # Base script check
  1468. /^\p{sc=Vai}/utf
  1469. \x{a500}
  1470. /^\p{Script=Vaii}/utf
  1471. \x{a62b}
  1472. # Character not in script
  1473. /^\p{Vai}/utf
  1474. \x{a62c}
  1475. # Base script check
  1476. /^\p{sc=Saurashtra}/utf
  1477. \x{a880}
  1478. /^\p{Script=Saur}/utf
  1479. \x{a8d9}
  1480. # Character not in script
  1481. /^\p{Saurashtra}/utf
  1482. \x{a8da}
  1483. # Base script check
  1484. /^\p{sc=Rejang}/utf
  1485. \x{a930}
  1486. /^\p{Script=Rjng}/utf
  1487. \x{a95f}
  1488. # Character not in script
  1489. /^\p{Rejang}/utf
  1490. \x{a960}
  1491. # Base script check
  1492. /^\p{sc=Lycian}/utf
  1493. \x{10280}
  1494. /^\p{Script=Lyci}/utf
  1495. \x{1029c}
  1496. # Character not in script
  1497. /^\p{Lycian}/utf
  1498. \x{1029d}
  1499. # Base script check
  1500. /^\p{sc=Carian}/utf
  1501. \x{102a0}
  1502. /^\p{Script=Cari}/utf
  1503. \x{102d0}
  1504. # Character not in script
  1505. /^\p{Carian}/utf
  1506. \x{102d1}
  1507. # Base script check
  1508. /^\p{sc=Lydian}/utf
  1509. \x{10920}
  1510. /^\p{Script=Lydi}/utf
  1511. \x{1093f}
  1512. # Character not in script
  1513. /^\p{Lydian}/utf
  1514. \x{10940}
  1515. # Base script check
  1516. /^\p{sc=Cham}/utf
  1517. \x{aa00}
  1518. /^\p{Script=Cham}/utf
  1519. \x{aa5f}
  1520. # Character not in script
  1521. /^\p{Cham}/utf
  1522. \x{aa60}
  1523. # Base script check
  1524. /^\p{sc=Tai_Tham}/utf
  1525. \x{1a20}
  1526. /^\p{Script=Lana}/utf
  1527. \x{1aad}
  1528. # Character not in script
  1529. /^\p{Tai_Tham}/utf
  1530. \x{1aae}
  1531. # Base script check
  1532. /^\p{sc=Tai_Viet}/utf
  1533. \x{aa80}
  1534. /^\p{Script=Tavt}/utf
  1535. \x{aadf}
  1536. # Character not in script
  1537. /^\p{Tai_Viet}/utf
  1538. \x{aae0}
  1539. # Base script check
  1540. /^\p{sc=Avestan}/utf
  1541. \x{10b00}
  1542. /^\p{Script=Avst}/utf
  1543. \x{10b3f}
  1544. # Character not in script
  1545. /^\p{Avestan}/utf
  1546. \x{10b40}
  1547. # Base script check
  1548. /^\p{sc=Egyptian_Hieroglyphs}/utf
  1549. \x{13000}
  1550. /^\p{Script=Egyp}/utf
  1551. \x{13455}
  1552. # Character not in script
  1553. /^\p{Egyptian_Hieroglyphs}/utf
  1554. \x{13456}
  1555. # Base script check
  1556. /^\p{sc=Samaritan}/utf
  1557. \x{800}
  1558. /^\p{Script=Samr}/utf
  1559. \x{83e}
  1560. # Character not in script
  1561. /^\p{Samaritan}/utf
  1562. \x{83f}
  1563. # Base script check
  1564. /^\p{sc=Lisu}/utf
  1565. \x{a4d0}
  1566. /^\p{Script=Lisu}/utf
  1567. \x{11fb0}
  1568. # Character not in script
  1569. /^\p{Lisu}/utf
  1570. \x{11fb1}
  1571. # Base script check
  1572. /^\p{sc=Bamum}/utf
  1573. \x{a6a0}
  1574. /^\p{Script=Bamu}/utf
  1575. \x{16a38}
  1576. # Character not in script
  1577. /^\p{Bamum}/utf
  1578. \x{16a39}
  1579. # Base script check
  1580. /^\p{sc=Meetei_Mayek}/utf
  1581. \x{aae0}
  1582. /^\p{Script=Mtei}/utf
  1583. \x{abf9}
  1584. # Character not in script
  1585. /^\p{Meetei_Mayek}/utf
  1586. \x{abfa}
  1587. # Base script check
  1588. /^\p{sc=Imperial_Aramaic}/utf
  1589. \x{10840}
  1590. /^\p{Script=Armi}/utf
  1591. \x{1085f}
  1592. # Character not in script
  1593. /^\p{Imperial_Aramaic}/utf
  1594. \x{10860}
  1595. # Base script check
  1596. /^\p{sc=Old_South_Arabian}/utf
  1597. \x{10a60}
  1598. /^\p{Script=Sarb}/utf
  1599. \x{10a7f}
  1600. # Character not in script
  1601. /^\p{Old_South_Arabian}/utf
  1602. \x{10a80}
  1603. # Base script check
  1604. /^\p{sc=Inscriptional_Parthian}/utf
  1605. \x{10b40}
  1606. /^\p{Script=Prti}/utf
  1607. \x{10b5f}
  1608. # Character not in script
  1609. /^\p{Inscriptional_Parthian}/utf
  1610. \x{10b60}
  1611. # Base script check
  1612. /^\p{sc=Inscriptional_Pahlavi}/utf
  1613. \x{10b60}
  1614. /^\p{Script=Phli}/utf
  1615. \x{10b7f}
  1616. # Character not in script
  1617. /^\p{Inscriptional_Pahlavi}/utf
  1618. \x{10b80}
  1619. # Base script check
  1620. /^\p{sc=Old_Turkic}/utf
  1621. \x{10c00}
  1622. /^\p{Script=Orkh}/utf
  1623. \x{10c48}
  1624. # Character not in script
  1625. /^\p{Old_Turkic}/utf
  1626. \x{10c49}
  1627. # Base script check
  1628. /^\p{sc=Batak}/utf
  1629. \x{1bc0}
  1630. /^\p{Script=Batk}/utf
  1631. \x{1bff}
  1632. # Character not in script
  1633. /^\p{Batak}/utf
  1634. \x{1c00}
  1635. # Base script check
  1636. /^\p{sc=Brahmi}/utf
  1637. \x{11000}
  1638. /^\p{Script=Brah}/utf
  1639. \x{1107f}
  1640. # Character not in script
  1641. /^\p{Brahmi}/utf
  1642. \x{11080}
  1643. # Base script check
  1644. /^\p{sc=Meroitic_Cursive}/utf
  1645. \x{109a0}
  1646. /^\p{Script=Merc}/utf
  1647. \x{109ff}
  1648. # Character not in script
  1649. /^\p{Meroitic_Cursive}/utf
  1650. \x{10a00}
  1651. # Base script check
  1652. /^\p{sc=Meroitic_Hieroglyphs}/utf
  1653. \x{10980}
  1654. /^\p{Script=Mero}/utf
  1655. \x{1099f}
  1656. # Character not in script
  1657. /^\p{Meroitic_Hieroglyphs}/utf
  1658. \x{109a0}
  1659. # Base script check
  1660. /^\p{sc=Miao}/utf
  1661. \x{16f00}
  1662. /^\p{Script=Plrd}/utf
  1663. \x{16f9f}
  1664. # Character not in script
  1665. /^\p{Miao}/utf
  1666. \x{16fa0}
  1667. # Base script check
  1668. /^\p{sc=Sora_Sompeng}/utf
  1669. \x{110d0}
  1670. /^\p{Script=Sora}/utf
  1671. \x{110f9}
  1672. # Character not in script
  1673. /^\p{Sora_Sompeng}/utf
  1674. \x{110fa}
  1675. # Base script check
  1676. /^\p{sc=Caucasian_Albanian}/utf
  1677. \x{10530}
  1678. /^\p{Script=Aghb}/utf
  1679. \x{1056f}
  1680. # Character not in script
  1681. /^\p{Caucasian_Albanian}/utf
  1682. \x{10570}
  1683. # Base script check
  1684. /^\p{sc=Bassa_Vah}/utf
  1685. \x{16ad0}
  1686. /^\p{Script=Bass}/utf
  1687. \x{16af5}
  1688. # Character not in script
  1689. /^\p{Bassa_Vah}/utf
  1690. \x{16af6}
  1691. # Base script check
  1692. /^\p{sc=Elbasan}/utf
  1693. \x{10500}
  1694. /^\p{Script=Elba}/utf
  1695. \x{10527}
  1696. # Character not in script
  1697. /^\p{Elbasan}/utf
  1698. \x{10528}
  1699. # Base script check
  1700. /^\p{sc=Pahawh_Hmong}/utf
  1701. \x{16b00}
  1702. /^\p{Script=Hmng}/utf
  1703. \x{16b8f}
  1704. # Character not in script
  1705. /^\p{Pahawh_Hmong}/utf
  1706. \x{16b90}
  1707. # Base script check
  1708. /^\p{sc=Mende_Kikakui}/utf
  1709. \x{1e800}
  1710. /^\p{Script=Mend}/utf
  1711. \x{1e8d6}
  1712. # Character not in script
  1713. /^\p{Mende_Kikakui}/utf
  1714. \x{1e8d7}
  1715. # Base script check
  1716. /^\p{sc=Mro}/utf
  1717. \x{16a40}
  1718. /^\p{Script=Mroo}/utf
  1719. \x{16a6f}
  1720. # Character not in script
  1721. /^\p{Mro}/utf
  1722. \x{16a70}
  1723. # Base script check
  1724. /^\p{sc=Old_North_Arabian}/utf
  1725. \x{10a80}
  1726. /^\p{Script=Narb}/utf
  1727. \x{10a9f}
  1728. # Character not in script
  1729. /^\p{Old_North_Arabian}/utf
  1730. \x{10aa0}
  1731. # Base script check
  1732. /^\p{sc=Nabataean}/utf
  1733. \x{10880}
  1734. /^\p{Script=Nbat}/utf
  1735. \x{108af}
  1736. # Character not in script
  1737. /^\p{Nabataean}/utf
  1738. \x{108b0}
  1739. # Base script check
  1740. /^\p{sc=Palmyrene}/utf
  1741. \x{10860}
  1742. /^\p{Script=Palm}/utf
  1743. \x{1087f}
  1744. # Character not in script
  1745. /^\p{Palmyrene}/utf
  1746. \x{10880}
  1747. # Base script check
  1748. /^\p{sc=Pau_Cin_Hau}/utf
  1749. \x{11ac0}
  1750. /^\p{Script=Pauc}/utf
  1751. \x{11af8}
  1752. # Character not in script
  1753. /^\p{Pau_Cin_Hau}/utf
  1754. \x{11af9}
  1755. # Base script check
  1756. /^\p{sc=Siddham}/utf
  1757. \x{11580}
  1758. /^\p{Script=Sidd}/utf
  1759. \x{115dd}
  1760. # Character not in script
  1761. /^\p{Siddham}/utf
  1762. \x{115de}
  1763. # Base script check
  1764. /^\p{sc=Warang_Citi}/utf
  1765. \x{118a0}
  1766. /^\p{Script=Wara}/utf
  1767. \x{118ff}
  1768. # Character not in script
  1769. /^\p{Warang_Citi}/utf
  1770. \x{11900}
  1771. # Base script check
  1772. /^\p{sc=Ahom}/utf
  1773. \x{11700}
  1774. /^\p{Script=Ahom}/utf
  1775. \x{11746}
  1776. # Character not in script
  1777. /^\p{Ahom}/utf
  1778. \x{11747}
  1779. # Base script check
  1780. /^\p{sc=Anatolian_Hieroglyphs}/utf
  1781. \x{14400}
  1782. /^\p{Script=Hluw}/utf
  1783. \x{14646}
  1784. # Character not in script
  1785. /^\p{Anatolian_Hieroglyphs}/utf
  1786. \x{14647}
  1787. # Base script check
  1788. /^\p{sc=Hatran}/utf
  1789. \x{108e0}
  1790. /^\p{Script=Hatr}/utf
  1791. \x{108ff}
  1792. # Character not in script
  1793. /^\p{Hatran}/utf
  1794. \x{10900}
  1795. # Base script check
  1796. /^\p{sc=Old_Hungarian}/utf
  1797. \x{10c80}
  1798. /^\p{Script=Hung}/utf
  1799. \x{10cff}
  1800. # Character not in script
  1801. /^\p{Old_Hungarian}/utf
  1802. \x{10d00}
  1803. # Base script check
  1804. /^\p{sc=SignWriting}/utf
  1805. \x{1d800}
  1806. /^\p{Script=Sgnw}/utf
  1807. \x{1daaf}
  1808. # Character not in script
  1809. /^\p{SignWriting}/utf
  1810. \x{1dab0}
  1811. # Base script check
  1812. /^\p{sc=Bhaiksuki}/utf
  1813. \x{11c00}
  1814. /^\p{Script=Bhks}/utf
  1815. \x{11c6c}
  1816. # Character not in script
  1817. /^\p{Bhaiksuki}/utf
  1818. \x{11c6d}
  1819. # Base script check
  1820. /^\p{sc=Marchen}/utf
  1821. \x{11c70}
  1822. /^\p{Script=Marc}/utf
  1823. \x{11cb6}
  1824. # Character not in script
  1825. /^\p{Marchen}/utf
  1826. \x{11cb7}
  1827. # Base script check
  1828. /^\p{sc=Newa}/utf
  1829. \x{11400}
  1830. /^\p{Script=Newa}/utf
  1831. \x{11461}
  1832. # Character not in script
  1833. /^\p{Newa}/utf
  1834. \x{11462}
  1835. # Base script check
  1836. /^\p{sc=Osage}/utf
  1837. \x{104b0}
  1838. /^\p{Script=Osge}/utf
  1839. \x{104fb}
  1840. # Character not in script
  1841. /^\p{Osage}/utf
  1842. \x{104fc}
  1843. # Base script check
  1844. /^\p{sc=Tangut}/utf
  1845. \x{16fe0}
  1846. /^\p{Script=Tang}/utf
  1847. \x{18d08}
  1848. # Character not in script
  1849. /^\p{Tangut}/utf
  1850. \x{18d09}
  1851. # Base script check
  1852. /^\p{sc=Nushu}/utf
  1853. \x{16fe1}
  1854. /^\p{Script=Nshu}/utf
  1855. \x{1b2fb}
  1856. # Character not in script
  1857. /^\p{Nushu}/utf
  1858. \x{1b2fc}
  1859. # Base script check
  1860. /^\p{sc=Soyombo}/utf
  1861. \x{11a50}
  1862. /^\p{Script=Soyo}/utf
  1863. \x{11aa2}
  1864. # Character not in script
  1865. /^\p{Soyombo}/utf
  1866. \x{11aa3}
  1867. # Base script check
  1868. /^\p{sc=Zanabazar_Square}/utf
  1869. \x{11a00}
  1870. /^\p{Script=Zanb}/utf
  1871. \x{11a47}
  1872. # Character not in script
  1873. /^\p{Zanabazar_Square}/utf
  1874. \x{11a48}
  1875. # Base script check
  1876. /^\p{sc=Makasar}/utf
  1877. \x{11ee0}
  1878. /^\p{Script=Maka}/utf
  1879. \x{11ef8}
  1880. # Character not in script
  1881. /^\p{Makasar}/utf
  1882. \x{11ef9}
  1883. # Base script check
  1884. /^\p{sc=Medefaidrin}/utf
  1885. \x{16e40}
  1886. /^\p{Script=Medf}/utf
  1887. \x{16e9a}
  1888. # Character not in script
  1889. /^\p{Medefaidrin}/utf
  1890. \x{16e9b}
  1891. # Base script check
  1892. /^\p{sc=Old_Sogdian}/utf
  1893. \x{10f00}
  1894. /^\p{Script=Sogo}/utf
  1895. \x{10f27}
  1896. # Character not in script
  1897. /^\p{Old_Sogdian}/utf
  1898. \x{10f28}
  1899. # Base script check
  1900. /^\p{sc=Elymaic}/utf
  1901. \x{10fe0}
  1902. /^\p{Script=Elym}/utf
  1903. \x{10ff6}
  1904. # Character not in script
  1905. /^\p{Elymaic}/utf
  1906. \x{10ff7}
  1907. # Base script check
  1908. /^\p{sc=Nyiakeng_Puachue_Hmong}/utf
  1909. \x{1e100}
  1910. /^\p{Script=Hmnp}/utf
  1911. \x{1e14f}
  1912. # Character not in script
  1913. /^\p{Nyiakeng_Puachue_Hmong}/utf
  1914. \x{1e150}
  1915. # Base script check
  1916. /^\p{sc=Wancho}/utf
  1917. \x{1e2c0}
  1918. /^\p{Script=Wcho}/utf
  1919. \x{1e2ff}
  1920. # Character not in script
  1921. /^\p{Wancho}/utf
  1922. \x{1e300}
  1923. # Base script check
  1924. /^\p{sc=Chorasmian}/utf
  1925. \x{10fb0}
  1926. /^\p{Script=Chrs}/utf
  1927. \x{10fcb}
  1928. # Character not in script
  1929. /^\p{Chorasmian}/utf
  1930. \x{10fcc}
  1931. # Base script check
  1932. /^\p{sc=Dives_Akuru}/utf
  1933. \x{11900}
  1934. /^\p{Script=Diak}/utf
  1935. \x{11959}
  1936. # Character not in script
  1937. /^\p{Dives_Akuru}/utf
  1938. \x{1195a}
  1939. # Base script check
  1940. /^\p{sc=Khitan_Small_Script}/utf
  1941. \x{16fe4}
  1942. /^\p{Script=Kits}/utf
  1943. \x{18cd5}
  1944. # Character not in script
  1945. /^\p{Khitan_Small_Script}/utf
  1946. \x{18cd6}
  1947. # Base script check
  1948. /^\p{sc=Tangsa}/utf
  1949. \x{16a70}
  1950. /^\p{Script=Tnsa}/utf
  1951. \x{16ac9}
  1952. # Character not in script
  1953. /^\p{Tangsa}/utf
  1954. \x{16aca}
  1955. # Base script check
  1956. /^\p{sc=Toto}/utf
  1957. \x{1e290}
  1958. /^\p{Script=Toto}/utf
  1959. \x{1e2ae}
  1960. # Character not in script
  1961. /^\p{Toto}/utf
  1962. \x{1e2af}
  1963. # Base script check
  1964. /^\p{sc=Vithkuqi}/utf
  1965. \x{10570}
  1966. /^\p{Script=Vith}/utf
  1967. \x{105bc}
  1968. # Character not in script
  1969. /^\p{Vithkuqi}/utf
  1970. \x{105bd}
  1971. # Base script check
  1972. /^\p{sc=Kawi}/utf
  1973. \x{11f00}
  1974. /^\p{Script=Kawi}/utf
  1975. \x{11f59}
  1976. # Character not in script
  1977. /^\p{Kawi}/utf
  1978. \x{11f5a}
  1979. # Base script check
  1980. /^\p{sc=Nag_Mundari}/utf
  1981. \x{1e4d0}
  1982. /^\p{Script=Nagm}/utf
  1983. \x{1e4f9}
  1984. # Character not in script
  1985. /^\p{Nag_Mundari}/utf
  1986. \x{1e4fa}
  1987. # End of testinput26