mirror of
https://github.com/PCRE2Project/pcre2.git
synced 2025-10-17 15:25:55 +08:00

UCD 16 makes a lot of changes to scripts, so make sure that we have sufficient coverage by also keeping the original autogenerated tests. Complete the code updates for the changes to ScriptExtensions.txt, which is no longer sorted by script, and allow for multiple Unicode property test files, depending on the Unicode version.
2755 lines
38 KiB
Plaintext
2755 lines
38 KiB
Plaintext
# These tests were generated by maint/GenerateTest.py using PCRE2's UCP
|
|
# data. Do not edit them unless that data has changed and the tests still
|
|
# reflect a previous version.
|
|
|
|
# Unicode Script Extension tests for version 15.0.0
|
|
|
|
#perltest
|
|
|
|
# Base script check
|
|
/^\p{sc=Latin}/utf
|
|
A
|
|
|
|
/^\p{Script=Latn}/utf
|
|
\x{1df2a}
|
|
|
|
# Script extension check
|
|
/^\p{Latin}/utf
|
|
\x{363}
|
|
|
|
/^\p{scx=Latn}/utf
|
|
\x{a92e}
|
|
|
|
# Script extension only character
|
|
/^\p{Latin}/utf
|
|
\x{363}
|
|
|
|
/^\p{sc=Latin}/utf
|
|
\x{363}
|
|
|
|
# Character not in script
|
|
/^\p{Latin}/utf
|
|
\x{1df2b}
|
|
|
|
# Base script check
|
|
/^\p{sc=Greek}/utf
|
|
\x{370}
|
|
|
|
/^\p{Script=Grek}/utf
|
|
\x{1d245}
|
|
|
|
# Script extension check
|
|
/^\p{Greek}/utf
|
|
\x{342}
|
|
|
|
/^\p{Script_Extensions=Grek}/utf
|
|
\x{1dc1}
|
|
|
|
# Script extension only character
|
|
/^\p{Greek}/utf
|
|
\x{342}
|
|
|
|
/^\p{sc=Greek}/utf
|
|
\x{342}
|
|
|
|
# Character not in script
|
|
/^\p{Greek}/utf
|
|
\x{1d246}
|
|
|
|
# Base script check
|
|
/^\p{sc=Cyrillic}/utf
|
|
\x{400}
|
|
|
|
/^\p{Script=Cyrl}/utf
|
|
\x{1e08f}
|
|
|
|
# Script extension check
|
|
/^\p{Cyrillic}/utf
|
|
\x{483}
|
|
|
|
/^\p{scx=Cyrl}/utf
|
|
\x{a66f}
|
|
|
|
# Script extension only character
|
|
/^\p{Cyrillic}/utf
|
|
\x{2e43}
|
|
|
|
/^\p{sc=Cyrillic}/utf
|
|
\x{2e43}
|
|
|
|
# Character not in script
|
|
/^\p{Cyrillic}/utf
|
|
\x{1e090}
|
|
|
|
# Base script check
|
|
/^\p{sc=Arabic}/utf
|
|
\x{600}
|
|
|
|
/^\p{Script=Arab}/utf
|
|
\x{1eef1}
|
|
|
|
# Script extension check
|
|
/^\p{Arabic}/utf
|
|
\x{60c}
|
|
|
|
/^\p{Script_Extensions=Arab}/utf
|
|
\x{102fb}
|
|
|
|
# Script extension only character
|
|
/^\p{Arabic}/utf
|
|
\x{102e0}
|
|
|
|
/^\p{sc=Arabic}/utf
|
|
\x{102e0}
|
|
|
|
# Character not in script
|
|
/^\p{Arabic}/utf
|
|
\x{1eef2}
|
|
|
|
# Base script check
|
|
/^\p{sc=Syriac}/utf
|
|
\x{700}
|
|
|
|
/^\p{Script=Syrc}/utf
|
|
\x{86a}
|
|
|
|
# Script extension check
|
|
/^\p{Syriac}/utf
|
|
\x{60c}
|
|
|
|
/^\p{scx=Syrc}/utf
|
|
\x{1dfa}
|
|
|
|
# Script extension only character
|
|
/^\p{Syriac}/utf
|
|
\x{1dfa}
|
|
|
|
/^\p{sc=Syriac}/utf
|
|
\x{1dfa}
|
|
|
|
# Character not in script
|
|
/^\p{Syriac}/utf
|
|
\x{1dfb}
|
|
|
|
# Base script check
|
|
/^\p{sc=Thaana}/utf
|
|
\x{780}
|
|
|
|
/^\p{Script=Thaa}/utf
|
|
\x{7b1}
|
|
|
|
# Script extension check
|
|
/^\p{Thaana}/utf
|
|
\x{60c}
|
|
|
|
/^\p{Script_Extensions=Thaa}/utf
|
|
\x{fdfd}
|
|
|
|
# Script extension only character
|
|
/^\p{Thaana}/utf
|
|
\x{fdf2}
|
|
|
|
/^\p{sc=Thaana}/utf
|
|
\x{fdf2}
|
|
|
|
# Character not in script
|
|
/^\p{Thaana}/utf
|
|
\x{fdfe}
|
|
|
|
# Base script check
|
|
/^\p{sc=Devanagari}/utf
|
|
\x{900}
|
|
|
|
/^\p{Script=Deva}/utf
|
|
\x{11b09}
|
|
|
|
# Script extension check
|
|
/^\p{Devanagari}/utf
|
|
\x{951}
|
|
|
|
/^\p{scx=Deva}/utf
|
|
\x{a8f3}
|
|
|
|
# Script extension only character
|
|
/^\p{Devanagari}/utf
|
|
\x{1cd1}
|
|
|
|
/^\p{sc=Devanagari}/utf
|
|
\x{1cd1}
|
|
|
|
# Character not in script
|
|
/^\p{Devanagari}/utf
|
|
\x{11b0a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Bengali}/utf
|
|
\x{980}
|
|
|
|
/^\p{Script=Beng}/utf
|
|
\x{9fe}
|
|
|
|
# Script extension check
|
|
/^\p{Bengali}/utf
|
|
\x{951}
|
|
|
|
/^\p{Script_Extensions=Beng}/utf
|
|
\x{a8f1}
|
|
|
|
# Script extension only character
|
|
/^\p{Bengali}/utf
|
|
\x{1cf7}
|
|
|
|
/^\p{sc=Bengali}/utf
|
|
\x{1cf7}
|
|
|
|
# Character not in script
|
|
/^\p{Bengali}/utf
|
|
\x{a8f2}
|
|
|
|
# Base script check
|
|
/^\p{sc=Gurmukhi}/utf
|
|
\x{a01}
|
|
|
|
/^\p{Script=Guru}/utf
|
|
\x{a76}
|
|
|
|
# Script extension check
|
|
/^\p{Gurmukhi}/utf
|
|
\x{951}
|
|
|
|
/^\p{scx=Guru}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Gurmukhi}/utf
|
|
\x{a836}
|
|
|
|
/^\p{sc=Gurmukhi}/utf
|
|
\x{a836}
|
|
|
|
# Character not in script
|
|
/^\p{Gurmukhi}/utf
|
|
\x{a83a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Gujarati}/utf
|
|
\x{a81}
|
|
|
|
/^\p{Script=Gujr}/utf
|
|
\x{aff}
|
|
|
|
# Script extension check
|
|
/^\p{Gujarati}/utf
|
|
\x{951}
|
|
|
|
/^\p{Script_Extensions=Gujr}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Gujarati}/utf
|
|
\x{a836}
|
|
|
|
/^\p{sc=Gujarati}/utf
|
|
\x{a836}
|
|
|
|
# Character not in script
|
|
/^\p{Gujarati}/utf
|
|
\x{a83a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Oriya}/utf
|
|
\x{b01}
|
|
|
|
/^\p{Script=Orya}/utf
|
|
\x{b77}
|
|
|
|
# Script extension check
|
|
/^\p{Oriya}/utf
|
|
\x{951}
|
|
|
|
/^\p{scx=Orya}/utf
|
|
\x{1cf2}
|
|
|
|
# Script extension only character
|
|
/^\p{Oriya}/utf
|
|
\x{1cda}
|
|
|
|
/^\p{sc=Oriya}/utf
|
|
\x{1cda}
|
|
|
|
# Character not in script
|
|
/^\p{Oriya}/utf
|
|
\x{1cf3}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tamil}/utf
|
|
\x{b82}
|
|
|
|
/^\p{Script=Taml}/utf
|
|
\x{11fff}
|
|
|
|
# Script extension check
|
|
/^\p{Tamil}/utf
|
|
\x{951}
|
|
|
|
/^\p{Script_Extensions=Taml}/utf
|
|
\x{11fd3}
|
|
|
|
# Script extension only character
|
|
/^\p{Tamil}/utf
|
|
\x{a8f3}
|
|
|
|
/^\p{sc=Tamil}/utf
|
|
\x{a8f3}
|
|
|
|
# Character not in script
|
|
/^\p{Tamil}/utf
|
|
\x{12000}
|
|
|
|
# Base script check
|
|
/^\p{sc=Telugu}/utf
|
|
\x{c00}
|
|
|
|
/^\p{Script=Telu}/utf
|
|
\x{c7f}
|
|
|
|
# Script extension check
|
|
/^\p{Telugu}/utf
|
|
\x{951}
|
|
|
|
/^\p{scx=Telu}/utf
|
|
\x{1cf2}
|
|
|
|
# Script extension only character
|
|
/^\p{Telugu}/utf
|
|
\x{1cda}
|
|
|
|
/^\p{sc=Telugu}/utf
|
|
\x{1cda}
|
|
|
|
# Character not in script
|
|
/^\p{Telugu}/utf
|
|
\x{1cf3}
|
|
|
|
# Base script check
|
|
/^\p{sc=Kannada}/utf
|
|
\x{c80}
|
|
|
|
/^\p{Script=Knda}/utf
|
|
\x{cf3}
|
|
|
|
# Script extension check
|
|
/^\p{Kannada}/utf
|
|
\x{951}
|
|
|
|
/^\p{Script_Extensions=Knda}/utf
|
|
\x{a835}
|
|
|
|
# Script extension only character
|
|
/^\p{Kannada}/utf
|
|
\x{1cf4}
|
|
|
|
/^\p{sc=Kannada}/utf
|
|
\x{1cf4}
|
|
|
|
# Character not in script
|
|
/^\p{Kannada}/utf
|
|
\x{a836}
|
|
|
|
# Base script check
|
|
/^\p{sc=Malayalam}/utf
|
|
\x{d00}
|
|
|
|
/^\p{Script=Mlym}/utf
|
|
\x{d7f}
|
|
|
|
# Script extension check
|
|
/^\p{Malayalam}/utf
|
|
\x{951}
|
|
|
|
/^\p{scx=Mlym}/utf
|
|
\x{a832}
|
|
|
|
# Script extension only character
|
|
/^\p{Malayalam}/utf
|
|
\x{1cda}
|
|
|
|
/^\p{sc=Malayalam}/utf
|
|
\x{1cda}
|
|
|
|
# Character not in script
|
|
/^\p{Malayalam}/utf
|
|
\x{a833}
|
|
|
|
# Base script check
|
|
/^\p{sc=Sinhala}/utf
|
|
\x{d81}
|
|
|
|
/^\p{Script=Sinh}/utf
|
|
\x{111f4}
|
|
|
|
# Script extension check
|
|
/^\p{Sinhala}/utf
|
|
\x{964}
|
|
|
|
/^\p{Script_Extensions=Sinh}/utf
|
|
\x{965}
|
|
|
|
# Script extension only character
|
|
/^\p{Sinhala}/utf
|
|
\x{964}
|
|
|
|
/^\p{sc=Sinhala}/utf
|
|
\x{964}
|
|
|
|
# Character not in script
|
|
/^\p{Sinhala}/utf
|
|
\x{111f5}
|
|
|
|
# Base script check
|
|
/^\p{sc=Myanmar}/utf
|
|
\x{1000}
|
|
|
|
/^\p{Script=Mymr}/utf
|
|
\x{aa7f}
|
|
|
|
# Script extension check
|
|
/^\p{Myanmar}/utf
|
|
\x{1040}
|
|
|
|
/^\p{scx=Mymr}/utf
|
|
\x{a92e}
|
|
|
|
# Script extension only character
|
|
/^\p{Myanmar}/utf
|
|
\x{a92e}
|
|
|
|
/^\p{sc=Myanmar}/utf
|
|
\x{a92e}
|
|
|
|
# Character not in script
|
|
/^\p{Myanmar}/utf
|
|
\x{aa80}
|
|
|
|
# Base script check
|
|
/^\p{sc=Georgian}/utf
|
|
\x{10a0}
|
|
|
|
/^\p{Script=Geor}/utf
|
|
\x{2d2d}
|
|
|
|
# Script extension check
|
|
/^\p{Georgian}/utf
|
|
\x{10fb}
|
|
|
|
/^\p{Script_Extensions=Geor}/utf
|
|
\x{10fb}
|
|
|
|
# Script extension only character
|
|
/^\p{Georgian}/utf
|
|
\x{10fb}
|
|
|
|
/^\p{sc=Georgian}/utf
|
|
\x{10fb}
|
|
|
|
# Character not in script
|
|
/^\p{Georgian}/utf
|
|
\x{2d2e}
|
|
|
|
# Base script check
|
|
/^\p{sc=Hangul}/utf
|
|
\x{1100}
|
|
|
|
/^\p{Script=Hang}/utf
|
|
\x{ffdc}
|
|
|
|
# Script extension check
|
|
/^\p{Hangul}/utf
|
|
\x{3001}
|
|
|
|
/^\p{scx=Hang}/utf
|
|
\x{ff65}
|
|
|
|
# Script extension only character
|
|
/^\p{Hangul}/utf
|
|
\x{3003}
|
|
|
|
/^\p{sc=Hangul}/utf
|
|
\x{3003}
|
|
|
|
# Character not in script
|
|
/^\p{Hangul}/utf
|
|
\x{ffdd}
|
|
|
|
# Base script check
|
|
/^\p{sc=Mongolian}/utf
|
|
\x{1800}
|
|
|
|
/^\p{Script=Mong}/utf
|
|
\x{1166c}
|
|
|
|
# Script extension check
|
|
/^\p{Mongolian}/utf
|
|
\x{1802}
|
|
|
|
/^\p{Script_Extensions=Mong}/utf
|
|
\x{202f}
|
|
|
|
# Script extension only character
|
|
/^\p{Mongolian}/utf
|
|
\x{202f}
|
|
|
|
/^\p{sc=Mongolian}/utf
|
|
\x{202f}
|
|
|
|
# Character not in script
|
|
/^\p{Mongolian}/utf
|
|
\x{1166d}
|
|
|
|
# Base script check
|
|
/^\p{sc=Hiragana}/utf
|
|
\x{3041}
|
|
|
|
/^\p{Script=Hira}/utf
|
|
\x{1f200}
|
|
|
|
# Script extension check
|
|
/^\p{Hiragana}/utf
|
|
\x{3001}
|
|
|
|
/^\p{scx=Hira}/utf
|
|
\x{ff9f}
|
|
|
|
# Script extension only character
|
|
/^\p{Hiragana}/utf
|
|
\x{3031}
|
|
|
|
/^\p{sc=Hiragana}/utf
|
|
\x{3031}
|
|
|
|
# Character not in script
|
|
/^\p{Hiragana}/utf
|
|
\x{1f201}
|
|
|
|
# Base script check
|
|
/^\p{sc=Katakana}/utf
|
|
\x{30a1}
|
|
|
|
/^\p{Script=Kana}/utf
|
|
\x{1b167}
|
|
|
|
# Script extension check
|
|
/^\p{Katakana}/utf
|
|
\x{3001}
|
|
|
|
/^\p{Script_Extensions=Kana}/utf
|
|
\x{ff9f}
|
|
|
|
# Script extension only character
|
|
/^\p{Katakana}/utf
|
|
\x{3031}
|
|
|
|
/^\p{sc=Katakana}/utf
|
|
\x{3031}
|
|
|
|
# Character not in script
|
|
/^\p{Katakana}/utf
|
|
\x{1b168}
|
|
|
|
# Base script check
|
|
/^\p{sc=Bopomofo}/utf
|
|
\x{2ea}
|
|
|
|
/^\p{Script=Bopo}/utf
|
|
\x{31bf}
|
|
|
|
# Script extension check
|
|
/^\p{Bopomofo}/utf
|
|
\x{3001}
|
|
|
|
/^\p{scx=Bopo}/utf
|
|
\x{ff65}
|
|
|
|
# Script extension only character
|
|
/^\p{Bopomofo}/utf
|
|
\x{302a}
|
|
|
|
/^\p{sc=Bopomofo}/utf
|
|
\x{302a}
|
|
|
|
# Character not in script
|
|
/^\p{Bopomofo}/utf
|
|
\x{ff66}
|
|
|
|
# Base script check
|
|
/^\p{sc=Han}/utf
|
|
\x{2e80}
|
|
|
|
/^\p{Script=Hani}/utf
|
|
\x{323af}
|
|
|
|
# Script extension check
|
|
/^\p{Han}/utf
|
|
\x{3001}
|
|
|
|
/^\p{Script_Extensions=Hani}/utf
|
|
\x{1f251}
|
|
|
|
# Script extension only character
|
|
/^\p{Han}/utf
|
|
\x{3006}
|
|
|
|
/^\p{sc=Han}/utf
|
|
\x{3006}
|
|
|
|
# Character not in script
|
|
/^\p{Han}/utf
|
|
\x{323b0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Yi}/utf
|
|
\x{a000}
|
|
|
|
/^\p{Script=Yiii}/utf
|
|
\x{a4c6}
|
|
|
|
# Script extension check
|
|
/^\p{Yi}/utf
|
|
\x{3001}
|
|
|
|
/^\p{scx=Yiii}/utf
|
|
\x{ff65}
|
|
|
|
# Script extension only character
|
|
/^\p{Yi}/utf
|
|
\x{3001}
|
|
|
|
/^\p{sc=Yi}/utf
|
|
\x{3001}
|
|
|
|
# Character not in script
|
|
/^\p{Yi}/utf
|
|
\x{ff66}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tagalog}/utf
|
|
\x{1700}
|
|
|
|
/^\p{Script=Tglg}/utf
|
|
\x{171f}
|
|
|
|
# Script extension check
|
|
/^\p{Tagalog}/utf
|
|
\x{1735}
|
|
|
|
/^\p{Script_Extensions=Tglg}/utf
|
|
\x{1736}
|
|
|
|
# Script extension only character
|
|
/^\p{Tagalog}/utf
|
|
\x{1735}
|
|
|
|
/^\p{sc=Tagalog}/utf
|
|
\x{1735}
|
|
|
|
# Character not in script
|
|
/^\p{Tagalog}/utf
|
|
\x{1737}
|
|
|
|
# Base script check
|
|
/^\p{sc=Hanunoo}/utf
|
|
\x{1720}
|
|
|
|
/^\p{Script=Hano}/utf
|
|
\x{1734}
|
|
|
|
# Script extension check
|
|
/^\p{Hanunoo}/utf
|
|
\x{1735}
|
|
|
|
/^\p{scx=Hano}/utf
|
|
\x{1736}
|
|
|
|
# Script extension only character
|
|
/^\p{Hanunoo}/utf
|
|
\x{1735}
|
|
|
|
/^\p{sc=Hanunoo}/utf
|
|
\x{1735}
|
|
|
|
# Character not in script
|
|
/^\p{Hanunoo}/utf
|
|
\x{1737}
|
|
|
|
# Base script check
|
|
/^\p{sc=Buhid}/utf
|
|
\x{1740}
|
|
|
|
/^\p{Script=Buhd}/utf
|
|
\x{1753}
|
|
|
|
# Script extension check
|
|
/^\p{Buhid}/utf
|
|
\x{1735}
|
|
|
|
/^\p{Script_Extensions=Buhd}/utf
|
|
\x{1736}
|
|
|
|
# Script extension only character
|
|
/^\p{Buhid}/utf
|
|
\x{1735}
|
|
|
|
/^\p{sc=Buhid}/utf
|
|
\x{1735}
|
|
|
|
# Character not in script
|
|
/^\p{Buhid}/utf
|
|
\x{1754}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tagbanwa}/utf
|
|
\x{1760}
|
|
|
|
/^\p{Script=Tagb}/utf
|
|
\x{1773}
|
|
|
|
# Script extension check
|
|
/^\p{Tagbanwa}/utf
|
|
\x{1735}
|
|
|
|
/^\p{scx=Tagb}/utf
|
|
\x{1736}
|
|
|
|
# Script extension only character
|
|
/^\p{Tagbanwa}/utf
|
|
\x{1735}
|
|
|
|
/^\p{sc=Tagbanwa}/utf
|
|
\x{1735}
|
|
|
|
# Character not in script
|
|
/^\p{Tagbanwa}/utf
|
|
\x{1774}
|
|
|
|
# Base script check
|
|
/^\p{sc=Limbu}/utf
|
|
\x{1900}
|
|
|
|
/^\p{Script=Limb}/utf
|
|
\x{194f}
|
|
|
|
# Script extension check
|
|
/^\p{Limbu}/utf
|
|
\x{965}
|
|
|
|
/^\p{Script_Extensions=Limb}/utf
|
|
\x{965}
|
|
|
|
# Script extension only character
|
|
/^\p{Limbu}/utf
|
|
\x{965}
|
|
|
|
/^\p{sc=Limbu}/utf
|
|
\x{965}
|
|
|
|
# Character not in script
|
|
/^\p{Limbu}/utf
|
|
\x{1950}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tai_Le}/utf
|
|
\x{1950}
|
|
|
|
/^\p{Script=Tale}/utf
|
|
\x{1974}
|
|
|
|
# Script extension check
|
|
/^\p{Tai_Le}/utf
|
|
\x{1040}
|
|
|
|
/^\p{scx=Tale}/utf
|
|
\x{1049}
|
|
|
|
# Script extension only character
|
|
/^\p{Tai_Le}/utf
|
|
\x{1040}
|
|
|
|
/^\p{sc=Tai_Le}/utf
|
|
\x{1040}
|
|
|
|
# Character not in script
|
|
/^\p{Tai_Le}/utf
|
|
\x{1975}
|
|
|
|
# Base script check
|
|
/^\p{sc=Linear_B}/utf
|
|
\x{10000}
|
|
|
|
/^\p{Script=Linb}/utf
|
|
\x{100fa}
|
|
|
|
# Script extension check
|
|
/^\p{Linear_B}/utf
|
|
\x{10100}
|
|
|
|
/^\p{Script_Extensions=Linb}/utf
|
|
\x{1013f}
|
|
|
|
# Script extension only character
|
|
/^\p{Linear_B}/utf
|
|
\x{10102}
|
|
|
|
/^\p{sc=Linear_B}/utf
|
|
\x{10102}
|
|
|
|
# Character not in script
|
|
/^\p{Linear_B}/utf
|
|
\x{10140}
|
|
|
|
# Base script check
|
|
/^\p{sc=Cypriot}/utf
|
|
\x{10800}
|
|
|
|
/^\p{Script=Cprt}/utf
|
|
\x{1083f}
|
|
|
|
# Script extension check
|
|
/^\p{Cypriot}/utf
|
|
\x{10100}
|
|
|
|
/^\p{scx=Cprt}/utf
|
|
\x{1013f}
|
|
|
|
# Script extension only character
|
|
/^\p{Cypriot}/utf
|
|
\x{10102}
|
|
|
|
/^\p{sc=Cypriot}/utf
|
|
\x{10102}
|
|
|
|
# Character not in script
|
|
/^\p{Cypriot}/utf
|
|
\x{10840}
|
|
|
|
# Base script check
|
|
/^\p{sc=Buginese}/utf
|
|
\x{1a00}
|
|
|
|
/^\p{Script=Bugi}/utf
|
|
\x{1a1f}
|
|
|
|
# Script extension check
|
|
/^\p{Buginese}/utf
|
|
\x{a9cf}
|
|
|
|
/^\p{Script_Extensions=Bugi}/utf
|
|
\x{a9cf}
|
|
|
|
# Script extension only character
|
|
/^\p{Buginese}/utf
|
|
\x{a9cf}
|
|
|
|
/^\p{sc=Buginese}/utf
|
|
\x{a9cf}
|
|
|
|
# Character not in script
|
|
/^\p{Buginese}/utf
|
|
\x{a9d0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Coptic}/utf
|
|
\x{3e2}
|
|
|
|
/^\p{Script=Copt}/utf
|
|
\x{2cff}
|
|
|
|
# Script extension check
|
|
/^\p{Coptic}/utf
|
|
\x{102e0}
|
|
|
|
/^\p{scx=Copt}/utf
|
|
\x{102fb}
|
|
|
|
# Script extension only character
|
|
/^\p{Coptic}/utf
|
|
\x{102e0}
|
|
|
|
/^\p{sc=Coptic}/utf
|
|
\x{102e0}
|
|
|
|
# Character not in script
|
|
/^\p{Coptic}/utf
|
|
\x{102fc}
|
|
|
|
# Base script check
|
|
/^\p{sc=Glagolitic}/utf
|
|
\x{2c00}
|
|
|
|
/^\p{Script=Glag}/utf
|
|
\x{1e02a}
|
|
|
|
# Script extension check
|
|
/^\p{Glagolitic}/utf
|
|
\x{484}
|
|
|
|
/^\p{Script_Extensions=Glag}/utf
|
|
\x{a66f}
|
|
|
|
# Script extension only character
|
|
/^\p{Glagolitic}/utf
|
|
\x{484}
|
|
|
|
/^\p{sc=Glagolitic}/utf
|
|
\x{484}
|
|
|
|
# Character not in script
|
|
/^\p{Glagolitic}/utf
|
|
\x{1e02b}
|
|
|
|
# Base script check
|
|
/^\p{sc=Syloti_Nagri}/utf
|
|
\x{a800}
|
|
|
|
/^\p{Script=Sylo}/utf
|
|
\x{a82c}
|
|
|
|
# Script extension check
|
|
/^\p{Syloti_Nagri}/utf
|
|
\x{964}
|
|
|
|
/^\p{scx=Sylo}/utf
|
|
\x{9ef}
|
|
|
|
# Script extension only character
|
|
/^\p{Syloti_Nagri}/utf
|
|
\x{9e6}
|
|
|
|
/^\p{sc=Syloti_Nagri}/utf
|
|
\x{9e6}
|
|
|
|
# Character not in script
|
|
/^\p{Syloti_Nagri}/utf
|
|
\x{a82d}
|
|
|
|
# Base script check
|
|
/^\p{sc=Phags_Pa}/utf
|
|
\x{a840}
|
|
|
|
/^\p{Script=Phag}/utf
|
|
\x{a877}
|
|
|
|
# Script extension check
|
|
/^\p{Phags_Pa}/utf
|
|
\x{1802}
|
|
|
|
/^\p{Script_Extensions=Phag}/utf
|
|
\x{1805}
|
|
|
|
# Script extension only character
|
|
/^\p{Phags_Pa}/utf
|
|
\x{1802}
|
|
|
|
/^\p{sc=Phags_Pa}/utf
|
|
\x{1802}
|
|
|
|
# Character not in script
|
|
/^\p{Phags_Pa}/utf
|
|
\x{a878}
|
|
|
|
# Base script check
|
|
/^\p{sc=Nko}/utf
|
|
\x{7c0}
|
|
|
|
/^\p{Script=Nkoo}/utf
|
|
\x{7ff}
|
|
|
|
# Script extension check
|
|
/^\p{Nko}/utf
|
|
\x{60c}
|
|
|
|
/^\p{scx=Nkoo}/utf
|
|
\x{fd3f}
|
|
|
|
# Script extension only character
|
|
/^\p{Nko}/utf
|
|
\x{fd3e}
|
|
|
|
/^\p{sc=Nko}/utf
|
|
\x{fd3e}
|
|
|
|
# Character not in script
|
|
/^\p{Nko}/utf
|
|
\x{fd40}
|
|
|
|
# Base script check
|
|
/^\p{sc=Kayah_Li}/utf
|
|
\x{a900}
|
|
|
|
/^\p{Script=Kali}/utf
|
|
\x{a92f}
|
|
|
|
# Script extension check
|
|
/^\p{Kayah_Li}/utf
|
|
\x{a92e}
|
|
|
|
/^\p{Script_Extensions=Kali}/utf
|
|
\x{a92e}
|
|
|
|
# Script extension only character
|
|
/^\p{Kayah_Li}/utf
|
|
\x{a92e}
|
|
|
|
/^\p{sc=Kayah_Li}/utf
|
|
\x{a92e}
|
|
|
|
# Character not in script
|
|
/^\p{Kayah_Li}/utf
|
|
\x{a930}
|
|
|
|
# Base script check
|
|
/^\p{sc=Javanese}/utf
|
|
\x{a980}
|
|
|
|
/^\p{Script=Java}/utf
|
|
\x{a9df}
|
|
|
|
# Script extension check
|
|
/^\p{Javanese}/utf
|
|
\x{a9cf}
|
|
|
|
/^\p{scx=Java}/utf
|
|
\x{a9cf}
|
|
|
|
# Script extension only character
|
|
/^\p{Javanese}/utf
|
|
\x{a9cf}
|
|
|
|
/^\p{sc=Javanese}/utf
|
|
\x{a9cf}
|
|
|
|
# Character not in script
|
|
/^\p{Javanese}/utf
|
|
\x{a9e0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Kaithi}/utf
|
|
\x{11080}
|
|
|
|
/^\p{Script=Kthi}/utf
|
|
\x{110cd}
|
|
|
|
# Script extension check
|
|
/^\p{Kaithi}/utf
|
|
\x{966}
|
|
|
|
/^\p{Script_Extensions=Kthi}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Kaithi}/utf
|
|
\x{966}
|
|
|
|
/^\p{sc=Kaithi}/utf
|
|
\x{966}
|
|
|
|
# Character not in script
|
|
/^\p{Kaithi}/utf
|
|
\x{110ce}
|
|
|
|
# Base script check
|
|
/^\p{sc=Mandaic}/utf
|
|
\x{840}
|
|
|
|
/^\p{Script=Mand}/utf
|
|
\x{85e}
|
|
|
|
# Script extension check
|
|
/^\p{Mandaic}/utf
|
|
\x{640}
|
|
|
|
/^\p{scx=Mand}/utf
|
|
\x{640}
|
|
|
|
# Script extension only character
|
|
/^\p{Mandaic}/utf
|
|
\x{640}
|
|
|
|
/^\p{sc=Mandaic}/utf
|
|
\x{640}
|
|
|
|
# Character not in script
|
|
/^\p{Mandaic}/utf
|
|
\x{85f}
|
|
|
|
# Base script check
|
|
/^\p{sc=Chakma}/utf
|
|
\x{11100}
|
|
|
|
/^\p{Script=Cakm}/utf
|
|
\x{11147}
|
|
|
|
# Script extension check
|
|
/^\p{Chakma}/utf
|
|
\x{9e6}
|
|
|
|
/^\p{Script_Extensions=Cakm}/utf
|
|
\x{1049}
|
|
|
|
# Script extension only character
|
|
/^\p{Chakma}/utf
|
|
\x{9e6}
|
|
|
|
/^\p{sc=Chakma}/utf
|
|
\x{9e6}
|
|
|
|
# Character not in script
|
|
/^\p{Chakma}/utf
|
|
\x{11148}
|
|
|
|
# Base script check
|
|
/^\p{sc=Sharada}/utf
|
|
\x{11180}
|
|
|
|
/^\p{Script=Shrd}/utf
|
|
\x{111df}
|
|
|
|
# Script extension check
|
|
/^\p{Sharada}/utf
|
|
\x{951}
|
|
|
|
/^\p{scx=Shrd}/utf
|
|
\x{1ce0}
|
|
|
|
# Script extension only character
|
|
/^\p{Sharada}/utf
|
|
\x{1cd7}
|
|
|
|
/^\p{sc=Sharada}/utf
|
|
\x{1cd7}
|
|
|
|
# Character not in script
|
|
/^\p{Sharada}/utf
|
|
\x{111e0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Takri}/utf
|
|
\x{11680}
|
|
|
|
/^\p{Script=Takr}/utf
|
|
\x{116c9}
|
|
|
|
# Script extension check
|
|
/^\p{Takri}/utf
|
|
\x{964}
|
|
|
|
/^\p{Script_Extensions=Takr}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Takri}/utf
|
|
\x{a836}
|
|
|
|
/^\p{sc=Takri}/utf
|
|
\x{a836}
|
|
|
|
# Character not in script
|
|
/^\p{Takri}/utf
|
|
\x{116ca}
|
|
|
|
# Base script check
|
|
/^\p{sc=Duployan}/utf
|
|
\x{1bc00}
|
|
|
|
/^\p{Script=Dupl}/utf
|
|
\x{1bc9f}
|
|
|
|
# Script extension check
|
|
/^\p{Duployan}/utf
|
|
\x{1bca0}
|
|
|
|
/^\p{scx=Dupl}/utf
|
|
\x{1bca3}
|
|
|
|
# Script extension only character
|
|
/^\p{Duployan}/utf
|
|
\x{1bca0}
|
|
|
|
/^\p{sc=Duployan}/utf
|
|
\x{1bca0}
|
|
|
|
# Character not in script
|
|
/^\p{Duployan}/utf
|
|
\x{1bca4}
|
|
|
|
# Base script check
|
|
/^\p{sc=Grantha}/utf
|
|
\x{11300}
|
|
|
|
/^\p{Script=Gran}/utf
|
|
\x{11374}
|
|
|
|
# Script extension check
|
|
/^\p{Grantha}/utf
|
|
\x{951}
|
|
|
|
/^\p{Script_Extensions=Gran}/utf
|
|
\x{11fd3}
|
|
|
|
# Script extension only character
|
|
/^\p{Grantha}/utf
|
|
\x{1cd3}
|
|
|
|
/^\p{sc=Grantha}/utf
|
|
\x{1cd3}
|
|
|
|
# Character not in script
|
|
/^\p{Grantha}/utf
|
|
\x{11fd4}
|
|
|
|
# Base script check
|
|
/^\p{sc=Khojki}/utf
|
|
\x{11200}
|
|
|
|
/^\p{Script=Khoj}/utf
|
|
\x{11241}
|
|
|
|
# Script extension check
|
|
/^\p{Khojki}/utf
|
|
\x{ae6}
|
|
|
|
/^\p{scx=Khoj}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Khojki}/utf
|
|
\x{ae6}
|
|
|
|
/^\p{sc=Khojki}/utf
|
|
\x{ae6}
|
|
|
|
# Character not in script
|
|
/^\p{Khojki}/utf
|
|
\x{11242}
|
|
|
|
# Base script check
|
|
/^\p{sc=Linear_A}/utf
|
|
\x{10600}
|
|
|
|
/^\p{Script=Lina}/utf
|
|
\x{10767}
|
|
|
|
# Script extension check
|
|
/^\p{Linear_A}/utf
|
|
\x{10107}
|
|
|
|
/^\p{Script_Extensions=Lina}/utf
|
|
\x{10133}
|
|
|
|
# Script extension only character
|
|
/^\p{Linear_A}/utf
|
|
\x{10107}
|
|
|
|
/^\p{sc=Linear_A}/utf
|
|
\x{10107}
|
|
|
|
# Character not in script
|
|
/^\p{Linear_A}/utf
|
|
\x{10768}
|
|
|
|
# Base script check
|
|
/^\p{sc=Mahajani}/utf
|
|
\x{11150}
|
|
|
|
/^\p{Script=Mahj}/utf
|
|
\x{11176}
|
|
|
|
# Script extension check
|
|
/^\p{Mahajani}/utf
|
|
\x{964}
|
|
|
|
/^\p{scx=Mahj}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Mahajani}/utf
|
|
\x{966}
|
|
|
|
/^\p{sc=Mahajani}/utf
|
|
\x{966}
|
|
|
|
# Character not in script
|
|
/^\p{Mahajani}/utf
|
|
\x{11177}
|
|
|
|
# Base script check
|
|
/^\p{sc=Manichaean}/utf
|
|
\x{10ac0}
|
|
|
|
/^\p{Script=Mani}/utf
|
|
\x{10af6}
|
|
|
|
# Script extension check
|
|
/^\p{Manichaean}/utf
|
|
\x{640}
|
|
|
|
/^\p{Script_Extensions=Mani}/utf
|
|
\x{10af2}
|
|
|
|
# Script extension only character
|
|
/^\p{Manichaean}/utf
|
|
\x{640}
|
|
|
|
/^\p{sc=Manichaean}/utf
|
|
\x{640}
|
|
|
|
# Character not in script
|
|
/^\p{Manichaean}/utf
|
|
\x{10af7}
|
|
|
|
# Base script check
|
|
/^\p{sc=Modi}/utf
|
|
\x{11600}
|
|
|
|
/^\p{Script=Modi}/utf
|
|
\x{11659}
|
|
|
|
# Script extension check
|
|
/^\p{Modi}/utf
|
|
\x{a830}
|
|
|
|
/^\p{scx=Modi}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Modi}/utf
|
|
\x{a836}
|
|
|
|
/^\p{sc=Modi}/utf
|
|
\x{a836}
|
|
|
|
# Character not in script
|
|
/^\p{Modi}/utf
|
|
\x{1165a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_Permic}/utf
|
|
\x{10350}
|
|
|
|
/^\p{Script=Perm}/utf
|
|
\x{1037a}
|
|
|
|
# Script extension check
|
|
/^\p{Old_Permic}/utf
|
|
\x{483}
|
|
|
|
/^\p{Script_Extensions=Perm}/utf
|
|
\x{483}
|
|
|
|
# Script extension only character
|
|
/^\p{Old_Permic}/utf
|
|
\x{483}
|
|
|
|
/^\p{sc=Old_Permic}/utf
|
|
\x{483}
|
|
|
|
# Character not in script
|
|
/^\p{Old_Permic}/utf
|
|
\x{1037b}
|
|
|
|
# Base script check
|
|
/^\p{sc=Psalter_Pahlavi}/utf
|
|
\x{10b80}
|
|
|
|
/^\p{Script=Phlp}/utf
|
|
\x{10baf}
|
|
|
|
# Script extension check
|
|
/^\p{Psalter_Pahlavi}/utf
|
|
\x{640}
|
|
|
|
/^\p{scx=Phlp}/utf
|
|
\x{640}
|
|
|
|
# Script extension only character
|
|
/^\p{Psalter_Pahlavi}/utf
|
|
\x{640}
|
|
|
|
/^\p{sc=Psalter_Pahlavi}/utf
|
|
\x{640}
|
|
|
|
# Character not in script
|
|
/^\p{Psalter_Pahlavi}/utf
|
|
\x{10bb0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Khudawadi}/utf
|
|
\x{112b0}
|
|
|
|
/^\p{Script=Sind}/utf
|
|
\x{112f9}
|
|
|
|
# Script extension check
|
|
/^\p{Khudawadi}/utf
|
|
\x{964}
|
|
|
|
/^\p{Script_Extensions=Sind}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Khudawadi}/utf
|
|
\x{a836}
|
|
|
|
/^\p{sc=Khudawadi}/utf
|
|
\x{a836}
|
|
|
|
# Character not in script
|
|
/^\p{Khudawadi}/utf
|
|
\x{112fa}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tirhuta}/utf
|
|
\x{11480}
|
|
|
|
/^\p{Script=Tirh}/utf
|
|
\x{114d9}
|
|
|
|
# Script extension check
|
|
/^\p{Tirhuta}/utf
|
|
\x{951}
|
|
|
|
/^\p{scx=Tirh}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Tirhuta}/utf
|
|
\x{1cf2}
|
|
|
|
/^\p{sc=Tirhuta}/utf
|
|
\x{1cf2}
|
|
|
|
# Character not in script
|
|
/^\p{Tirhuta}/utf
|
|
\x{114da}
|
|
|
|
# Base script check
|
|
/^\p{sc=Multani}/utf
|
|
\x{11280}
|
|
|
|
/^\p{Script=Mult}/utf
|
|
\x{112a9}
|
|
|
|
# Script extension check
|
|
/^\p{Multani}/utf
|
|
\x{a66}
|
|
|
|
/^\p{Script_Extensions=Mult}/utf
|
|
\x{a6f}
|
|
|
|
# Script extension only character
|
|
/^\p{Multani}/utf
|
|
\x{a66}
|
|
|
|
/^\p{sc=Multani}/utf
|
|
\x{a66}
|
|
|
|
# Character not in script
|
|
/^\p{Multani}/utf
|
|
\x{112aa}
|
|
|
|
# Base script check
|
|
/^\p{sc=Adlam}/utf
|
|
\x{1e900}
|
|
|
|
/^\p{Script=Adlm}/utf
|
|
\x{1e95f}
|
|
|
|
# Script extension check
|
|
/^\p{Adlam}/utf
|
|
\x{61f}
|
|
|
|
/^\p{scx=Adlm}/utf
|
|
\x{640}
|
|
|
|
# Script extension only character
|
|
/^\p{Adlam}/utf
|
|
\x{61f}
|
|
|
|
/^\p{sc=Adlam}/utf
|
|
\x{61f}
|
|
|
|
# Character not in script
|
|
/^\p{Adlam}/utf
|
|
\x{1e960}
|
|
|
|
# Base script check
|
|
/^\p{sc=Masaram_Gondi}/utf
|
|
\x{11d00}
|
|
|
|
/^\p{Script=Gonm}/utf
|
|
\x{11d59}
|
|
|
|
# Script extension check
|
|
/^\p{Masaram_Gondi}/utf
|
|
\x{964}
|
|
|
|
/^\p{Script_Extensions=Gonm}/utf
|
|
\x{965}
|
|
|
|
# Script extension only character
|
|
/^\p{Masaram_Gondi}/utf
|
|
\x{964}
|
|
|
|
/^\p{sc=Masaram_Gondi}/utf
|
|
\x{964}
|
|
|
|
# Character not in script
|
|
/^\p{Masaram_Gondi}/utf
|
|
\x{11d5a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Dogra}/utf
|
|
\x{11800}
|
|
|
|
/^\p{Script=Dogr}/utf
|
|
\x{1183b}
|
|
|
|
# Script extension check
|
|
/^\p{Dogra}/utf
|
|
\x{964}
|
|
|
|
/^\p{scx=Dogr}/utf
|
|
\x{a839}
|
|
|
|
# Script extension only character
|
|
/^\p{Dogra}/utf
|
|
\x{966}
|
|
|
|
/^\p{sc=Dogra}/utf
|
|
\x{966}
|
|
|
|
# Character not in script
|
|
/^\p{Dogra}/utf
|
|
\x{1183c}
|
|
|
|
# Base script check
|
|
/^\p{sc=Gunjala_Gondi}/utf
|
|
\x{11d60}
|
|
|
|
/^\p{Script=Gong}/utf
|
|
\x{11da9}
|
|
|
|
# Script extension check
|
|
/^\p{Gunjala_Gondi}/utf
|
|
\x{964}
|
|
|
|
/^\p{Script_Extensions=Gong}/utf
|
|
\x{965}
|
|
|
|
# Script extension only character
|
|
/^\p{Gunjala_Gondi}/utf
|
|
\x{964}
|
|
|
|
/^\p{sc=Gunjala_Gondi}/utf
|
|
\x{964}
|
|
|
|
# Character not in script
|
|
/^\p{Gunjala_Gondi}/utf
|
|
\x{11daa}
|
|
|
|
# Base script check
|
|
/^\p{sc=Hanifi_Rohingya}/utf
|
|
\x{10d00}
|
|
|
|
/^\p{Script=Rohg}/utf
|
|
\x{10d39}
|
|
|
|
# Script extension check
|
|
/^\p{Hanifi_Rohingya}/utf
|
|
\x{60c}
|
|
|
|
/^\p{scx=Rohg}/utf
|
|
\x{6d4}
|
|
|
|
# Script extension only character
|
|
/^\p{Hanifi_Rohingya}/utf
|
|
\x{6d4}
|
|
|
|
/^\p{sc=Hanifi_Rohingya}/utf
|
|
\x{6d4}
|
|
|
|
# Character not in script
|
|
/^\p{Hanifi_Rohingya}/utf
|
|
\x{10d3a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Sogdian}/utf
|
|
\x{10f30}
|
|
|
|
/^\p{Script=Sogd}/utf
|
|
\x{10f59}
|
|
|
|
# Script extension check
|
|
/^\p{Sogdian}/utf
|
|
\x{640}
|
|
|
|
/^\p{Script_Extensions=Sogd}/utf
|
|
\x{640}
|
|
|
|
# Script extension only character
|
|
/^\p{Sogdian}/utf
|
|
\x{640}
|
|
|
|
/^\p{sc=Sogdian}/utf
|
|
\x{640}
|
|
|
|
# Character not in script
|
|
/^\p{Sogdian}/utf
|
|
\x{10f5a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Nandinagari}/utf
|
|
\x{119a0}
|
|
|
|
/^\p{Script=Nand}/utf
|
|
\x{119e4}
|
|
|
|
# Script extension check
|
|
/^\p{Nandinagari}/utf
|
|
\x{964}
|
|
|
|
/^\p{scx=Nand}/utf
|
|
\x{a835}
|
|
|
|
# Script extension only character
|
|
/^\p{Nandinagari}/utf
|
|
\x{1cfa}
|
|
|
|
/^\p{sc=Nandinagari}/utf
|
|
\x{1cfa}
|
|
|
|
# Character not in script
|
|
/^\p{Nandinagari}/utf
|
|
\x{119e5}
|
|
|
|
# Base script check
|
|
/^\p{sc=Yezidi}/utf
|
|
\x{10e80}
|
|
|
|
/^\p{Script=Yezi}/utf
|
|
\x{10eb1}
|
|
|
|
# Script extension check
|
|
/^\p{Yezidi}/utf
|
|
\x{60c}
|
|
|
|
/^\p{Script_Extensions=Yezi}/utf
|
|
\x{669}
|
|
|
|
# Script extension only character
|
|
/^\p{Yezidi}/utf
|
|
\x{660}
|
|
|
|
/^\p{sc=Yezidi}/utf
|
|
\x{660}
|
|
|
|
# Character not in script
|
|
/^\p{Yezidi}/utf
|
|
\x{10eb2}
|
|
|
|
# Base script check
|
|
/^\p{sc=Cypro_Minoan}/utf
|
|
\x{12f90}
|
|
|
|
/^\p{Script=Cpmn}/utf
|
|
\x{12ff2}
|
|
|
|
# Script extension check
|
|
/^\p{Cypro_Minoan}/utf
|
|
\x{10100}
|
|
|
|
/^\p{scx=Cpmn}/utf
|
|
\x{10101}
|
|
|
|
# Script extension only character
|
|
/^\p{Cypro_Minoan}/utf
|
|
\x{10100}
|
|
|
|
/^\p{sc=Cypro_Minoan}/utf
|
|
\x{10100}
|
|
|
|
# Character not in script
|
|
/^\p{Cypro_Minoan}/utf
|
|
\x{12ff3}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_Uyghur}/utf
|
|
\x{10f70}
|
|
|
|
/^\p{Script=Ougr}/utf
|
|
\x{10f89}
|
|
|
|
# Script extension check
|
|
/^\p{Old_Uyghur}/utf
|
|
\x{640}
|
|
|
|
/^\p{Script_Extensions=Ougr}/utf
|
|
\x{10af2}
|
|
|
|
# Script extension only character
|
|
/^\p{Old_Uyghur}/utf
|
|
\x{10af2}
|
|
|
|
/^\p{sc=Old_Uyghur}/utf
|
|
\x{10af2}
|
|
|
|
# Character not in script
|
|
/^\p{Old_Uyghur}/utf
|
|
\x{10f8a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Common}/utf
|
|
\x{00}
|
|
|
|
/^\p{Script=Zyyy}/utf
|
|
\x{e007f}
|
|
|
|
# Character not in script
|
|
/^\p{Common}/utf
|
|
\x{e0080}
|
|
|
|
# Base script check
|
|
/^\p{sc=Armenian}/utf
|
|
\x{531}
|
|
|
|
/^\p{Script=Armn}/utf
|
|
\x{fb17}
|
|
|
|
# Character not in script
|
|
/^\p{Armenian}/utf
|
|
\x{fb18}
|
|
|
|
# Base script check
|
|
/^\p{sc=Hebrew}/utf
|
|
\x{591}
|
|
|
|
/^\p{Script=Hebr}/utf
|
|
\x{fb4f}
|
|
|
|
# Character not in script
|
|
/^\p{Hebrew}/utf
|
|
\x{fb50}
|
|
|
|
# Base script check
|
|
/^\p{sc=Thai}/utf
|
|
\x{e01}
|
|
|
|
/^\p{Script=Thai}/utf
|
|
\x{e5b}
|
|
|
|
# Character not in script
|
|
/^\p{Thai}/utf
|
|
\x{e5c}
|
|
|
|
# Base script check
|
|
/^\p{sc=Lao}/utf
|
|
\x{e81}
|
|
|
|
/^\p{Script=Laoo}/utf
|
|
\x{edf}
|
|
|
|
# Character not in script
|
|
/^\p{Lao}/utf
|
|
\x{ee0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tibetan}/utf
|
|
\x{f00}
|
|
|
|
/^\p{Script=Tibt}/utf
|
|
\x{fda}
|
|
|
|
# Character not in script
|
|
/^\p{Tibetan}/utf
|
|
\x{fdb}
|
|
|
|
# Base script check
|
|
/^\p{sc=Ethiopic}/utf
|
|
\x{1200}
|
|
|
|
/^\p{Script=Ethi}/utf
|
|
\x{1e7fe}
|
|
|
|
# Character not in script
|
|
/^\p{Ethiopic}/utf
|
|
\x{1e7ff}
|
|
|
|
# Base script check
|
|
/^\p{sc=Cherokee}/utf
|
|
\x{13a0}
|
|
|
|
/^\p{Script=Cher}/utf
|
|
\x{abbf}
|
|
|
|
# Character not in script
|
|
/^\p{Cherokee}/utf
|
|
\x{abc0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Canadian_Aboriginal}/utf
|
|
\x{1400}
|
|
|
|
/^\p{Script=Cans}/utf
|
|
\x{11abf}
|
|
|
|
# Character not in script
|
|
/^\p{Canadian_Aboriginal}/utf
|
|
\x{11ac0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Ogham}/utf
|
|
\x{1680}
|
|
|
|
/^\p{Script=Ogam}/utf
|
|
\x{169c}
|
|
|
|
# Character not in script
|
|
/^\p{Ogham}/utf
|
|
\x{169d}
|
|
|
|
# Base script check
|
|
/^\p{sc=Runic}/utf
|
|
\x{16a0}
|
|
|
|
/^\p{Script=Runr}/utf
|
|
\x{16f8}
|
|
|
|
# Character not in script
|
|
/^\p{Runic}/utf
|
|
\x{16f9}
|
|
|
|
# Base script check
|
|
/^\p{sc=Khmer}/utf
|
|
\x{1780}
|
|
|
|
/^\p{Script=Khmr}/utf
|
|
\x{19ff}
|
|
|
|
# Character not in script
|
|
/^\p{Khmer}/utf
|
|
\x{1a00}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_Italic}/utf
|
|
\x{10300}
|
|
|
|
/^\p{Script=Ital}/utf
|
|
\x{1032f}
|
|
|
|
# Character not in script
|
|
/^\p{Old_Italic}/utf
|
|
\x{10330}
|
|
|
|
# Base script check
|
|
/^\p{sc=Gothic}/utf
|
|
\x{10330}
|
|
|
|
/^\p{Script=Goth}/utf
|
|
\x{1034a}
|
|
|
|
# Character not in script
|
|
/^\p{Gothic}/utf
|
|
\x{1034b}
|
|
|
|
# Base script check
|
|
/^\p{sc=Deseret}/utf
|
|
\x{10400}
|
|
|
|
/^\p{Script=Dsrt}/utf
|
|
\x{1044f}
|
|
|
|
# Character not in script
|
|
/^\p{Deseret}/utf
|
|
\x{10450}
|
|
|
|
# Base script check
|
|
/^\p{sc=Inherited}/utf
|
|
\x{300}
|
|
|
|
/^\p{Script=Zinh}/utf
|
|
\x{e01ef}
|
|
|
|
# Character not in script
|
|
/^\p{Inherited}/utf
|
|
\x{e01f0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Ugaritic}/utf
|
|
\x{10380}
|
|
|
|
/^\p{Script=Ugar}/utf
|
|
\x{1039f}
|
|
|
|
# Character not in script
|
|
/^\p{Ugaritic}/utf
|
|
\x{103a0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Shavian}/utf
|
|
\x{10450}
|
|
|
|
/^\p{Script=Shaw}/utf
|
|
\x{1047f}
|
|
|
|
# Character not in script
|
|
/^\p{Shavian}/utf
|
|
\x{10480}
|
|
|
|
# Base script check
|
|
/^\p{sc=Osmanya}/utf
|
|
\x{10480}
|
|
|
|
/^\p{Script=Osma}/utf
|
|
\x{104a9}
|
|
|
|
# Character not in script
|
|
/^\p{Osmanya}/utf
|
|
\x{104aa}
|
|
|
|
# Base script check
|
|
/^\p{sc=Braille}/utf
|
|
\x{2800}
|
|
|
|
/^\p{Script=Brai}/utf
|
|
\x{28ff}
|
|
|
|
# Character not in script
|
|
/^\p{Braille}/utf
|
|
\x{2900}
|
|
|
|
# Base script check
|
|
/^\p{sc=New_Tai_Lue}/utf
|
|
\x{1980}
|
|
|
|
/^\p{Script=Talu}/utf
|
|
\x{19df}
|
|
|
|
# Character not in script
|
|
/^\p{New_Tai_Lue}/utf
|
|
\x{19e0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tifinagh}/utf
|
|
\x{2d30}
|
|
|
|
/^\p{Script=Tfng}/utf
|
|
\x{2d7f}
|
|
|
|
# Character not in script
|
|
/^\p{Tifinagh}/utf
|
|
\x{2d80}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_Persian}/utf
|
|
\x{103a0}
|
|
|
|
/^\p{Script=Xpeo}/utf
|
|
\x{103d5}
|
|
|
|
# Character not in script
|
|
/^\p{Old_Persian}/utf
|
|
\x{103d6}
|
|
|
|
# Base script check
|
|
/^\p{sc=Kharoshthi}/utf
|
|
\x{10a00}
|
|
|
|
/^\p{Script=Khar}/utf
|
|
\x{10a58}
|
|
|
|
# Character not in script
|
|
/^\p{Kharoshthi}/utf
|
|
\x{10a59}
|
|
|
|
# Base script check
|
|
/^\p{sc=Balinese}/utf
|
|
\x{1b00}
|
|
|
|
/^\p{Script=Bali}/utf
|
|
\x{1b7e}
|
|
|
|
# Character not in script
|
|
/^\p{Balinese}/utf
|
|
\x{1b8f}
|
|
|
|
# Base script check
|
|
/^\p{sc=Cuneiform}/utf
|
|
\x{12000}
|
|
|
|
/^\p{Script=Xsux}/utf
|
|
\x{12543}
|
|
|
|
# Character not in script
|
|
/^\p{Cuneiform}/utf
|
|
\x{12544}
|
|
|
|
# Base script check
|
|
/^\p{sc=Phoenician}/utf
|
|
\x{10900}
|
|
|
|
/^\p{Script=Phnx}/utf
|
|
\x{1091f}
|
|
|
|
# Character not in script
|
|
/^\p{Phoenician}/utf
|
|
\x{10920}
|
|
|
|
# Base script check
|
|
/^\p{sc=Sundanese}/utf
|
|
\x{1b80}
|
|
|
|
/^\p{Script=Sund}/utf
|
|
\x{1cc7}
|
|
|
|
# Character not in script
|
|
/^\p{Sundanese}/utf
|
|
\x{1cc8}
|
|
|
|
# Base script check
|
|
/^\p{sc=Lepcha}/utf
|
|
\x{1c00}
|
|
|
|
/^\p{Script=Lepc}/utf
|
|
\x{1c4f}
|
|
|
|
# Character not in script
|
|
/^\p{Lepcha}/utf
|
|
\x{1c50}
|
|
|
|
# Base script check
|
|
/^\p{sc=Ol_Chiki}/utf
|
|
\x{1c50}
|
|
|
|
/^\p{Script=Olck}/utf
|
|
\x{1c7f}
|
|
|
|
# Character not in script
|
|
/^\p{Ol_Chiki}/utf
|
|
\x{1c80}
|
|
|
|
# Base script check
|
|
/^\p{sc=Vai}/utf
|
|
\x{a500}
|
|
|
|
/^\p{Script=Vaii}/utf
|
|
\x{a62b}
|
|
|
|
# Character not in script
|
|
/^\p{Vai}/utf
|
|
\x{a62c}
|
|
|
|
# Base script check
|
|
/^\p{sc=Saurashtra}/utf
|
|
\x{a880}
|
|
|
|
/^\p{Script=Saur}/utf
|
|
\x{a8d9}
|
|
|
|
# Character not in script
|
|
/^\p{Saurashtra}/utf
|
|
\x{a8da}
|
|
|
|
# Base script check
|
|
/^\p{sc=Rejang}/utf
|
|
\x{a930}
|
|
|
|
/^\p{Script=Rjng}/utf
|
|
\x{a95f}
|
|
|
|
# Character not in script
|
|
/^\p{Rejang}/utf
|
|
\x{a960}
|
|
|
|
# Base script check
|
|
/^\p{sc=Lycian}/utf
|
|
\x{10280}
|
|
|
|
/^\p{Script=Lyci}/utf
|
|
\x{1029c}
|
|
|
|
# Character not in script
|
|
/^\p{Lycian}/utf
|
|
\x{1029d}
|
|
|
|
# Base script check
|
|
/^\p{sc=Carian}/utf
|
|
\x{102a0}
|
|
|
|
/^\p{Script=Cari}/utf
|
|
\x{102d0}
|
|
|
|
# Character not in script
|
|
/^\p{Carian}/utf
|
|
\x{102d1}
|
|
|
|
# Base script check
|
|
/^\p{sc=Lydian}/utf
|
|
\x{10920}
|
|
|
|
/^\p{Script=Lydi}/utf
|
|
\x{1093f}
|
|
|
|
# Character not in script
|
|
/^\p{Lydian}/utf
|
|
\x{10940}
|
|
|
|
# Base script check
|
|
/^\p{sc=Cham}/utf
|
|
\x{aa00}
|
|
|
|
/^\p{Script=Cham}/utf
|
|
\x{aa5f}
|
|
|
|
# Character not in script
|
|
/^\p{Cham}/utf
|
|
\x{aa60}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tai_Tham}/utf
|
|
\x{1a20}
|
|
|
|
/^\p{Script=Lana}/utf
|
|
\x{1aad}
|
|
|
|
# Character not in script
|
|
/^\p{Tai_Tham}/utf
|
|
\x{1aae}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tai_Viet}/utf
|
|
\x{aa80}
|
|
|
|
/^\p{Script=Tavt}/utf
|
|
\x{aadf}
|
|
|
|
# Character not in script
|
|
/^\p{Tai_Viet}/utf
|
|
\x{aae0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Avestan}/utf
|
|
\x{10b00}
|
|
|
|
/^\p{Script=Avst}/utf
|
|
\x{10b3f}
|
|
|
|
# Character not in script
|
|
/^\p{Avestan}/utf
|
|
\x{10b40}
|
|
|
|
# Base script check
|
|
/^\p{sc=Egyptian_Hieroglyphs}/utf
|
|
\x{13000}
|
|
|
|
/^\p{Script=Egyp}/utf
|
|
\x{13455}
|
|
|
|
# Character not in script
|
|
/^\p{Egyptian_Hieroglyphs}/utf
|
|
\x{13456}
|
|
|
|
# Base script check
|
|
/^\p{sc=Samaritan}/utf
|
|
\x{800}
|
|
|
|
/^\p{Script=Samr}/utf
|
|
\x{83e}
|
|
|
|
# Character not in script
|
|
/^\p{Samaritan}/utf
|
|
\x{83f}
|
|
|
|
# Base script check
|
|
/^\p{sc=Lisu}/utf
|
|
\x{a4d0}
|
|
|
|
/^\p{Script=Lisu}/utf
|
|
\x{11fb0}
|
|
|
|
# Character not in script
|
|
/^\p{Lisu}/utf
|
|
\x{11fb1}
|
|
|
|
# Base script check
|
|
/^\p{sc=Bamum}/utf
|
|
\x{a6a0}
|
|
|
|
/^\p{Script=Bamu}/utf
|
|
\x{16a38}
|
|
|
|
# Character not in script
|
|
/^\p{Bamum}/utf
|
|
\x{16a39}
|
|
|
|
# Base script check
|
|
/^\p{sc=Meetei_Mayek}/utf
|
|
\x{aae0}
|
|
|
|
/^\p{Script=Mtei}/utf
|
|
\x{abf9}
|
|
|
|
# Character not in script
|
|
/^\p{Meetei_Mayek}/utf
|
|
\x{abfa}
|
|
|
|
# Base script check
|
|
/^\p{sc=Imperial_Aramaic}/utf
|
|
\x{10840}
|
|
|
|
/^\p{Script=Armi}/utf
|
|
\x{1085f}
|
|
|
|
# Character not in script
|
|
/^\p{Imperial_Aramaic}/utf
|
|
\x{10860}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_South_Arabian}/utf
|
|
\x{10a60}
|
|
|
|
/^\p{Script=Sarb}/utf
|
|
\x{10a7f}
|
|
|
|
# Character not in script
|
|
/^\p{Old_South_Arabian}/utf
|
|
\x{10a80}
|
|
|
|
# Base script check
|
|
/^\p{sc=Inscriptional_Parthian}/utf
|
|
\x{10b40}
|
|
|
|
/^\p{Script=Prti}/utf
|
|
\x{10b5f}
|
|
|
|
# Character not in script
|
|
/^\p{Inscriptional_Parthian}/utf
|
|
\x{10b60}
|
|
|
|
# Base script check
|
|
/^\p{sc=Inscriptional_Pahlavi}/utf
|
|
\x{10b60}
|
|
|
|
/^\p{Script=Phli}/utf
|
|
\x{10b7f}
|
|
|
|
# Character not in script
|
|
/^\p{Inscriptional_Pahlavi}/utf
|
|
\x{10b80}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_Turkic}/utf
|
|
\x{10c00}
|
|
|
|
/^\p{Script=Orkh}/utf
|
|
\x{10c48}
|
|
|
|
# Character not in script
|
|
/^\p{Old_Turkic}/utf
|
|
\x{10c49}
|
|
|
|
# Base script check
|
|
/^\p{sc=Batak}/utf
|
|
\x{1bc0}
|
|
|
|
/^\p{Script=Batk}/utf
|
|
\x{1bff}
|
|
|
|
# Character not in script
|
|
/^\p{Batak}/utf
|
|
\x{1c00}
|
|
|
|
# Base script check
|
|
/^\p{sc=Brahmi}/utf
|
|
\x{11000}
|
|
|
|
/^\p{Script=Brah}/utf
|
|
\x{1107f}
|
|
|
|
# Character not in script
|
|
/^\p{Brahmi}/utf
|
|
\x{11080}
|
|
|
|
# Base script check
|
|
/^\p{sc=Meroitic_Cursive}/utf
|
|
\x{109a0}
|
|
|
|
/^\p{Script=Merc}/utf
|
|
\x{109ff}
|
|
|
|
# Character not in script
|
|
/^\p{Meroitic_Cursive}/utf
|
|
\x{10a00}
|
|
|
|
# Base script check
|
|
/^\p{sc=Meroitic_Hieroglyphs}/utf
|
|
\x{10980}
|
|
|
|
/^\p{Script=Mero}/utf
|
|
\x{1099f}
|
|
|
|
# Character not in script
|
|
/^\p{Meroitic_Hieroglyphs}/utf
|
|
\x{109a0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Miao}/utf
|
|
\x{16f00}
|
|
|
|
/^\p{Script=Plrd}/utf
|
|
\x{16f9f}
|
|
|
|
# Character not in script
|
|
/^\p{Miao}/utf
|
|
\x{16fa0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Sora_Sompeng}/utf
|
|
\x{110d0}
|
|
|
|
/^\p{Script=Sora}/utf
|
|
\x{110f9}
|
|
|
|
# Character not in script
|
|
/^\p{Sora_Sompeng}/utf
|
|
\x{110fa}
|
|
|
|
# Base script check
|
|
/^\p{sc=Caucasian_Albanian}/utf
|
|
\x{10530}
|
|
|
|
/^\p{Script=Aghb}/utf
|
|
\x{1056f}
|
|
|
|
# Character not in script
|
|
/^\p{Caucasian_Albanian}/utf
|
|
\x{10570}
|
|
|
|
# Base script check
|
|
/^\p{sc=Bassa_Vah}/utf
|
|
\x{16ad0}
|
|
|
|
/^\p{Script=Bass}/utf
|
|
\x{16af5}
|
|
|
|
# Character not in script
|
|
/^\p{Bassa_Vah}/utf
|
|
\x{16af6}
|
|
|
|
# Base script check
|
|
/^\p{sc=Elbasan}/utf
|
|
\x{10500}
|
|
|
|
/^\p{Script=Elba}/utf
|
|
\x{10527}
|
|
|
|
# Character not in script
|
|
/^\p{Elbasan}/utf
|
|
\x{10528}
|
|
|
|
# Base script check
|
|
/^\p{sc=Pahawh_Hmong}/utf
|
|
\x{16b00}
|
|
|
|
/^\p{Script=Hmng}/utf
|
|
\x{16b8f}
|
|
|
|
# Character not in script
|
|
/^\p{Pahawh_Hmong}/utf
|
|
\x{16b90}
|
|
|
|
# Base script check
|
|
/^\p{sc=Mende_Kikakui}/utf
|
|
\x{1e800}
|
|
|
|
/^\p{Script=Mend}/utf
|
|
\x{1e8d6}
|
|
|
|
# Character not in script
|
|
/^\p{Mende_Kikakui}/utf
|
|
\x{1e8d7}
|
|
|
|
# Base script check
|
|
/^\p{sc=Mro}/utf
|
|
\x{16a40}
|
|
|
|
/^\p{Script=Mroo}/utf
|
|
\x{16a6f}
|
|
|
|
# Character not in script
|
|
/^\p{Mro}/utf
|
|
\x{16a70}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_North_Arabian}/utf
|
|
\x{10a80}
|
|
|
|
/^\p{Script=Narb}/utf
|
|
\x{10a9f}
|
|
|
|
# Character not in script
|
|
/^\p{Old_North_Arabian}/utf
|
|
\x{10aa0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Nabataean}/utf
|
|
\x{10880}
|
|
|
|
/^\p{Script=Nbat}/utf
|
|
\x{108af}
|
|
|
|
# Character not in script
|
|
/^\p{Nabataean}/utf
|
|
\x{108b0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Palmyrene}/utf
|
|
\x{10860}
|
|
|
|
/^\p{Script=Palm}/utf
|
|
\x{1087f}
|
|
|
|
# Character not in script
|
|
/^\p{Palmyrene}/utf
|
|
\x{10880}
|
|
|
|
# Base script check
|
|
/^\p{sc=Pau_Cin_Hau}/utf
|
|
\x{11ac0}
|
|
|
|
/^\p{Script=Pauc}/utf
|
|
\x{11af8}
|
|
|
|
# Character not in script
|
|
/^\p{Pau_Cin_Hau}/utf
|
|
\x{11af9}
|
|
|
|
# Base script check
|
|
/^\p{sc=Siddham}/utf
|
|
\x{11580}
|
|
|
|
/^\p{Script=Sidd}/utf
|
|
\x{115dd}
|
|
|
|
# Character not in script
|
|
/^\p{Siddham}/utf
|
|
\x{115de}
|
|
|
|
# Base script check
|
|
/^\p{sc=Warang_Citi}/utf
|
|
\x{118a0}
|
|
|
|
/^\p{Script=Wara}/utf
|
|
\x{118ff}
|
|
|
|
# Character not in script
|
|
/^\p{Warang_Citi}/utf
|
|
\x{11900}
|
|
|
|
# Base script check
|
|
/^\p{sc=Ahom}/utf
|
|
\x{11700}
|
|
|
|
/^\p{Script=Ahom}/utf
|
|
\x{11746}
|
|
|
|
# Character not in script
|
|
/^\p{Ahom}/utf
|
|
\x{11747}
|
|
|
|
# Base script check
|
|
/^\p{sc=Anatolian_Hieroglyphs}/utf
|
|
\x{14400}
|
|
|
|
/^\p{Script=Hluw}/utf
|
|
\x{14646}
|
|
|
|
# Character not in script
|
|
/^\p{Anatolian_Hieroglyphs}/utf
|
|
\x{14647}
|
|
|
|
# Base script check
|
|
/^\p{sc=Hatran}/utf
|
|
\x{108e0}
|
|
|
|
/^\p{Script=Hatr}/utf
|
|
\x{108ff}
|
|
|
|
# Character not in script
|
|
/^\p{Hatran}/utf
|
|
\x{10900}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_Hungarian}/utf
|
|
\x{10c80}
|
|
|
|
/^\p{Script=Hung}/utf
|
|
\x{10cff}
|
|
|
|
# Character not in script
|
|
/^\p{Old_Hungarian}/utf
|
|
\x{10d00}
|
|
|
|
# Base script check
|
|
/^\p{sc=SignWriting}/utf
|
|
\x{1d800}
|
|
|
|
/^\p{Script=Sgnw}/utf
|
|
\x{1daaf}
|
|
|
|
# Character not in script
|
|
/^\p{SignWriting}/utf
|
|
\x{1dab0}
|
|
|
|
# Base script check
|
|
/^\p{sc=Bhaiksuki}/utf
|
|
\x{11c00}
|
|
|
|
/^\p{Script=Bhks}/utf
|
|
\x{11c6c}
|
|
|
|
# Character not in script
|
|
/^\p{Bhaiksuki}/utf
|
|
\x{11c6d}
|
|
|
|
# Base script check
|
|
/^\p{sc=Marchen}/utf
|
|
\x{11c70}
|
|
|
|
/^\p{Script=Marc}/utf
|
|
\x{11cb6}
|
|
|
|
# Character not in script
|
|
/^\p{Marchen}/utf
|
|
\x{11cb7}
|
|
|
|
# Base script check
|
|
/^\p{sc=Newa}/utf
|
|
\x{11400}
|
|
|
|
/^\p{Script=Newa}/utf
|
|
\x{11461}
|
|
|
|
# Character not in script
|
|
/^\p{Newa}/utf
|
|
\x{11462}
|
|
|
|
# Base script check
|
|
/^\p{sc=Osage}/utf
|
|
\x{104b0}
|
|
|
|
/^\p{Script=Osge}/utf
|
|
\x{104fb}
|
|
|
|
# Character not in script
|
|
/^\p{Osage}/utf
|
|
\x{104fc}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tangut}/utf
|
|
\x{16fe0}
|
|
|
|
/^\p{Script=Tang}/utf
|
|
\x{18d08}
|
|
|
|
# Character not in script
|
|
/^\p{Tangut}/utf
|
|
\x{18d09}
|
|
|
|
# Base script check
|
|
/^\p{sc=Nushu}/utf
|
|
\x{16fe1}
|
|
|
|
/^\p{Script=Nshu}/utf
|
|
\x{1b2fb}
|
|
|
|
# Character not in script
|
|
/^\p{Nushu}/utf
|
|
\x{1b2fc}
|
|
|
|
# Base script check
|
|
/^\p{sc=Soyombo}/utf
|
|
\x{11a50}
|
|
|
|
/^\p{Script=Soyo}/utf
|
|
\x{11aa2}
|
|
|
|
# Character not in script
|
|
/^\p{Soyombo}/utf
|
|
\x{11aa3}
|
|
|
|
# Base script check
|
|
/^\p{sc=Zanabazar_Square}/utf
|
|
\x{11a00}
|
|
|
|
/^\p{Script=Zanb}/utf
|
|
\x{11a47}
|
|
|
|
# Character not in script
|
|
/^\p{Zanabazar_Square}/utf
|
|
\x{11a48}
|
|
|
|
# Base script check
|
|
/^\p{sc=Makasar}/utf
|
|
\x{11ee0}
|
|
|
|
/^\p{Script=Maka}/utf
|
|
\x{11ef8}
|
|
|
|
# Character not in script
|
|
/^\p{Makasar}/utf
|
|
\x{11ef9}
|
|
|
|
# Base script check
|
|
/^\p{sc=Medefaidrin}/utf
|
|
\x{16e40}
|
|
|
|
/^\p{Script=Medf}/utf
|
|
\x{16e9a}
|
|
|
|
# Character not in script
|
|
/^\p{Medefaidrin}/utf
|
|
\x{16e9b}
|
|
|
|
# Base script check
|
|
/^\p{sc=Old_Sogdian}/utf
|
|
\x{10f00}
|
|
|
|
/^\p{Script=Sogo}/utf
|
|
\x{10f27}
|
|
|
|
# Character not in script
|
|
/^\p{Old_Sogdian}/utf
|
|
\x{10f28}
|
|
|
|
# Base script check
|
|
/^\p{sc=Elymaic}/utf
|
|
\x{10fe0}
|
|
|
|
/^\p{Script=Elym}/utf
|
|
\x{10ff6}
|
|
|
|
# Character not in script
|
|
/^\p{Elymaic}/utf
|
|
\x{10ff7}
|
|
|
|
# Base script check
|
|
/^\p{sc=Nyiakeng_Puachue_Hmong}/utf
|
|
\x{1e100}
|
|
|
|
/^\p{Script=Hmnp}/utf
|
|
\x{1e14f}
|
|
|
|
# Character not in script
|
|
/^\p{Nyiakeng_Puachue_Hmong}/utf
|
|
\x{1e150}
|
|
|
|
# Base script check
|
|
/^\p{sc=Wancho}/utf
|
|
\x{1e2c0}
|
|
|
|
/^\p{Script=Wcho}/utf
|
|
\x{1e2ff}
|
|
|
|
# Character not in script
|
|
/^\p{Wancho}/utf
|
|
\x{1e300}
|
|
|
|
# Base script check
|
|
/^\p{sc=Chorasmian}/utf
|
|
\x{10fb0}
|
|
|
|
/^\p{Script=Chrs}/utf
|
|
\x{10fcb}
|
|
|
|
# Character not in script
|
|
/^\p{Chorasmian}/utf
|
|
\x{10fcc}
|
|
|
|
# Base script check
|
|
/^\p{sc=Dives_Akuru}/utf
|
|
\x{11900}
|
|
|
|
/^\p{Script=Diak}/utf
|
|
\x{11959}
|
|
|
|
# Character not in script
|
|
/^\p{Dives_Akuru}/utf
|
|
\x{1195a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Khitan_Small_Script}/utf
|
|
\x{16fe4}
|
|
|
|
/^\p{Script=Kits}/utf
|
|
\x{18cd5}
|
|
|
|
# Character not in script
|
|
/^\p{Khitan_Small_Script}/utf
|
|
\x{18cd6}
|
|
|
|
# Base script check
|
|
/^\p{sc=Tangsa}/utf
|
|
\x{16a70}
|
|
|
|
/^\p{Script=Tnsa}/utf
|
|
\x{16ac9}
|
|
|
|
# Character not in script
|
|
/^\p{Tangsa}/utf
|
|
\x{16aca}
|
|
|
|
# Base script check
|
|
/^\p{sc=Toto}/utf
|
|
\x{1e290}
|
|
|
|
/^\p{Script=Toto}/utf
|
|
\x{1e2ae}
|
|
|
|
# Character not in script
|
|
/^\p{Toto}/utf
|
|
\x{1e2af}
|
|
|
|
# Base script check
|
|
/^\p{sc=Vithkuqi}/utf
|
|
\x{10570}
|
|
|
|
/^\p{Script=Vith}/utf
|
|
\x{105bc}
|
|
|
|
# Character not in script
|
|
/^\p{Vithkuqi}/utf
|
|
\x{105bd}
|
|
|
|
# Base script check
|
|
/^\p{sc=Kawi}/utf
|
|
\x{11f00}
|
|
|
|
/^\p{Script=Kawi}/utf
|
|
\x{11f59}
|
|
|
|
# Character not in script
|
|
/^\p{Kawi}/utf
|
|
\x{11f6a}
|
|
|
|
# Base script check
|
|
/^\p{sc=Nag_Mundari}/utf
|
|
\x{1e4d0}
|
|
|
|
/^\p{Script=Nagm}/utf
|
|
\x{1e4f9}
|
|
|
|
# Character not in script
|
|
/^\p{Nag_Mundari}/utf
|
|
\x{1e4fa}
|
|
|
|
# End of testinput26
|