diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index cb883bc800..0accb3731f 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -30,47 +30,45 @@ jobs: - win-gnu include: - build: pinned - os: ubuntu-18.04 + os: ubuntu-latest rust: 1.41.1 - build: stable - os: ubuntu-18.04 + os: ubuntu-latest rust: stable - build: stable-32 - os: ubuntu-18.04 + os: ubuntu-latest rust: stable target: i686-unknown-linux-gnu - build: stable-mips - os: ubuntu-18.04 + os: ubuntu-latest rust: stable target: mips64-unknown-linux-gnuabi64 - build: beta - os: ubuntu-18.04 + os: ubuntu-latest rust: beta - build: nightly - os: ubuntu-18.04 + os: ubuntu-latest rust: nightly - build: macos os: macos-latest rust: stable - build: win-msvc - os: windows-2019 + os: windows-latest rust: stable - build: win-gnu - os: windows-2019 + os: windows-latest rust: stable-x86_64-gnu steps: - name: Checkout repository - uses: actions/checkout@v1 - with: - fetch-depth: 1 + uses: actions/checkout@v3 - name: Install Rust uses: actions-rs/toolchain@v1 with: + override: true toolchain: ${{ matrix.rust }} profile: minimal - override: true - name: Install and configure Cross if: matrix.target != '' @@ -89,7 +87,7 @@ jobs: echo "target flag is: ${{ env.TARGET }}" - name: Show CPU info for debugging - if: matrix.os == 'ubuntu-18.04' + if: matrix.os == 'ubuntu-latest' run: lscpu - name: Basic build @@ -163,18 +161,14 @@ jobs: runs-on: ubuntu-18.04 steps: - name: Checkout repository - uses: actions/checkout@v1 - with: - fetch-depth: 1 + uses: actions/checkout@v3 - name: Install Rust uses: actions-rs/toolchain@v1 with: + override: true toolchain: stable profile: minimal - override: true components: rustfmt - - name: Install rustfmt - run: rustup component add rustfmt - name: Check formatting run: | cargo fmt --all -- --check diff --git a/regex-syntax/src/unicode.rs b/regex-syntax/src/unicode.rs index b894c7db22..f0358e949d 100644 --- a/regex-syntax/src/unicode.rs +++ b/regex-syntax/src/unicode.rs @@ -604,6 +604,7 @@ fn ages(canonical_age: &str) -> Result> { ("V12_0", age::V12_0), ("V12_1", age::V12_1), ("V13_0", age::V13_0), + ("V14_0", age::V14_0), ]; assert_eq!(AGES.len(), age::BY_NAME.len(), "ages are out of sync"); diff --git a/regex-syntax/src/unicode_tables/age.rs b/regex-syntax/src/unicode_tables/age.rs index 7772919ebe..ffdfef316c 100644 --- a/regex-syntax/src/unicode_tables/age.rs +++ b/regex-syntax/src/unicode_tables/age.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate age ucd-13.0.0 --chars +// ucd-generate age /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("V10_0", V10_0), @@ -12,6 +12,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("V12_0", V12_0), ("V12_1", V12_1), ("V13_0", V13_0), + ("V14_0", V14_0), ("V1_1", V1_1), ("V2_0", V2_0), ("V2_1", V2_1), @@ -203,69 +204,150 @@ pub const V12_0: &'static [(char, char)] = &[ pub const V12_1: &'static [(char, char)] = &[('㋿', '㋿')]; pub const V13_0: &'static [(char, char)] = &[ - ('\u{8be}', '\u{8c7}'), + ('ࢾ', 'ࣇ'), ('\u{b55}', '\u{b55}'), - ('\u{d04}', '\u{d04}'), + ('ഄ', 'ഄ'), ('\u{d81}', '\u{d81}'), ('\u{1abf}', '\u{1ac0}'), - ('\u{2b97}', '\u{2b97}'), - ('\u{2e50}', '\u{2e52}'), - ('\u{31bb}', '\u{31bf}'), - ('\u{4db6}', '\u{4dbf}'), - ('\u{9ff0}', '\u{9ffc}'), - ('\u{a7c7}', '\u{a7ca}'), - ('\u{a7f5}', '\u{a7f6}'), + ('⮗', '⮗'), + ('⹐', '⹒'), + ('ㆻ', 'ㆿ'), + ('䶶', '䶿'), + ('鿰', '鿼'), + ('Ꟈ', 'ꟊ'), + ('Ꟶ', 'ꟶ'), ('\u{a82c}', '\u{a82c}'), - ('\u{ab68}', '\u{ab6b}'), - ('\u{1019c}', '\u{1019c}'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eab}', '\u{10ead}'), - ('\u{10eb0}', '\u{10eb1}'), - ('\u{10fb0}', '\u{10fcb}'), - ('\u{11147}', '\u{11147}'), - ('\u{111ce}', '\u{111cf}'), - ('\u{1145a}', '\u{1145a}'), - ('\u{11460}', '\u{11461}'), - ('\u{11900}', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), - ('\u{1193b}', '\u{11946}'), - ('\u{11950}', '\u{11959}'), - ('\u{11fb0}', '\u{11fb0}'), + ('ꭨ', '꭫'), + ('𐆜', '𐆜'), + ('𐺀', '𐺩'), + ('\u{10eab}', '𐺭'), + ('𐺰', '𐺱'), + ('𐾰', '𐿋'), + ('𑅇', '𑅇'), + ('𑇎', '\u{111cf}'), + ('𑑚', '𑑚'), + ('𑑠', '𑑡'), + ('𑤀', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤵'), + ('𑤷', '𑤸'), + ('\u{1193b}', '𑥆'), + ('𑥐', '𑥙'), + ('𑾰', '𑾰'), ('\u{16fe4}', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), - ('\u{18af3}', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('\u{1f10d}', '\u{1f10f}'), - ('\u{1f16d}', '\u{1f16f}'), - ('\u{1f1ad}', '\u{1f1ad}'), - ('\u{1f6d6}', '\u{1f6d7}'), - ('\u{1f6fb}', '\u{1f6fc}'), - ('\u{1f8b0}', '\u{1f8b1}'), - ('\u{1f90c}', '\u{1f90c}'), - ('\u{1f972}', '\u{1f972}'), - ('\u{1f977}', '\u{1f978}'), - ('\u{1f9a3}', '\u{1f9a4}'), - ('\u{1f9ab}', '\u{1f9ad}'), - ('\u{1f9cb}', '\u{1f9cb}'), - ('\u{1fa74}', '\u{1fa74}'), - ('\u{1fa83}', '\u{1fa86}'), - ('\u{1fa96}', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), - ('\u{1fb00}', '\u{1fb92}'), - ('\u{1fb94}', '\u{1fbca}'), - ('\u{1fbf0}', '\u{1fbf9}'), - ('\u{2a6d7}', '\u{2a6dd}'), - ('\u{30000}', '\u{3134a}'), + ('𖿰', '𖿱'), + ('𘫳', '𘳕'), + ('𘴀', '𘴈'), + ('🄍', '🄏'), + ('🅭', '🅯'), + ('🆭', '🆭'), + ('🛖', '🛗'), + ('🛻', '🛼'), + ('🢰', '🢱'), + ('🤌', '🤌'), + ('🥲', '🥲'), + ('🥷', '🥸'), + ('🦣', '🦤'), + ('🦫', '🦭'), + ('🧋', '🧋'), + ('🩴', '🩴'), + ('🪃', '🪆'), + ('🪖', '🪨'), + ('🪰', '🪶'), + ('🫀', '🫂'), + ('🫐', '🫖'), + ('🬀', '🮒'), + ('🮔', '🯊'), + ('🯰', '🯹'), + ('𪛗', '𪛝'), + ('𰀀', '𱍊'), +]; + +pub const V14_0: &'static [(char, char)] = &[ + ('؝', '؝'), + ('ࡰ', 'ࢎ'), + ('\u{890}', '\u{891}'), + ('\u{898}', '\u{89f}'), + ('ࢵ', 'ࢵ'), + ('ࣈ', '\u{8d2}'), + ('\u{c3c}', '\u{c3c}'), + ('ౝ', 'ౝ'), + ('ೝ', 'ೝ'), + ('ᜍ', 'ᜍ'), + ('᜕', '᜕'), + ('ᜟ', 'ᜟ'), + ('\u{180f}', '\u{180f}'), + ('\u{1ac1}', '\u{1ace}'), + ('ᭌ', 'ᭌ'), + ('᭽', '᭾'), + ('\u{1dfa}', '\u{1dfa}'), + ('⃀', '⃀'), + ('Ⱟ', 'Ⱟ'), + ('ⱟ', 'ⱟ'), + ('⹓', '⹝'), + ('鿽', '鿿'), + ('Ꟁ', 'ꟁ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꟴ'), + ('﯂', '﯂'), + ('﵀', '﵏'), + ('﷏', '﷏'), + ('﷾', '﷿'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), + ('𐽰', '𐾉'), + ('\u{11070}', '𑁵'), + ('\u{110c2}', '\u{110c2}'), + ('𑚹', '𑚹'), + ('𑝀', '𑝆'), + ('𑪰', '𑪿'), + ('𒾐', '𒿲'), + ('𖩰', '𖪾'), + ('𖫀', '𖫉'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛄟', '𛄢'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), + ('𜽐', '𜿃'), + ('𝇩', '𝇪'), + ('𝼀', '𝼞'), + ('𞊐', '\u{1e2ae}'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), + ('🛝', '🛟'), + ('🟰', '🟰'), + ('🥹', '🥹'), + ('🧌', '🧌'), + ('🩻', '🩼'), + ('🪩', '🪬'), + ('🪷', '🪺'), + ('🫃', '🫅'), + ('🫗', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), + ('𪛞', '𪛟'), + ('𫜵', '𫜸'), ]; pub const V1_1: &'static [(char, char)] = &[ - ('\u{0}', 'ǵ'), + ('\0', 'ǵ'), ('Ǻ', 'ȗ'), ('ɐ', 'ʨ'), ('ʰ', '˞'), diff --git a/regex-syntax/src/unicode_tables/case_folding_simple.rs b/regex-syntax/src/unicode_tables/case_folding_simple.rs index cfb83f363a..766d21b487 100644 --- a/regex-syntax/src/unicode_tables/case_folding_simple.rs +++ b/regex-syntax/src/unicode_tables/case_folding_simple.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate case-folding-simple ucd-13.0.0 --chars --all-pairs +// ucd-generate case-folding-simple /tmp/ucd --chars --all-pairs // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('A', &['a']), @@ -1781,6 +1781,7 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('Ⱜ', &['ⱜ']), ('Ⱝ', &['ⱝ']), ('Ⱞ', &['ⱞ']), + ('Ⱟ', &['ⱟ']), ('ⰰ', &['Ⰰ']), ('ⰱ', &['Ⰱ']), ('ⰲ', &['Ⰲ']), @@ -1828,6 +1829,7 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('ⱜ', &['Ⱜ']), ('ⱝ', &['Ⱝ']), ('ⱞ', &['Ⱞ']), + ('ⱟ', &['Ⱟ']), ('Ⱡ', &['ⱡ']), ('ⱡ', &['Ⱡ']), ('Ɫ', &['ɫ']), @@ -2211,17 +2213,25 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('ꞽ', &['Ꞽ']), ('Ꞿ', &['ꞿ']), ('ꞿ', &['Ꞿ']), + ('Ꟁ', &['ꟁ']), + ('ꟁ', &['Ꟁ']), ('Ꟃ', &['ꟃ']), ('ꟃ', &['Ꟃ']), ('Ꞔ', &['ꞔ']), ('Ʂ', &['ʂ']), ('Ᶎ', &['ᶎ']), - ('\u{a7c7}', &['\u{a7c8}']), - ('\u{a7c8}', &['\u{a7c7}']), - ('\u{a7c9}', &['\u{a7ca}']), - ('\u{a7ca}', &['\u{a7c9}']), - ('\u{a7f5}', &['\u{a7f6}']), - ('\u{a7f6}', &['\u{a7f5}']), + ('Ꟈ', &['ꟈ']), + ('ꟈ', &['Ꟈ']), + ('Ꟊ', &['ꟊ']), + ('ꟊ', &['Ꟊ']), + ('Ꟑ', &['ꟑ']), + ('ꟑ', &['Ꟑ']), + ('Ꟗ', &['ꟗ']), + ('ꟗ', &['Ꟗ']), + ('Ꟙ', &['ꟙ']), + ('ꟙ', &['Ꟙ']), + ('Ꟶ', &['ꟶ']), + ('ꟶ', &['Ꟶ']), ('ꭓ', &['Ꭓ']), ('ꭰ', &['Ꭰ']), ('ꭱ', &['Ꭱ']), @@ -2507,6 +2517,76 @@ pub const CASE_FOLDING_SIMPLE: &'static [(char, &'static [char])] = &[ ('𐓹', &['𐓑']), ('𐓺', &['𐓒']), ('𐓻', &['𐓓']), + ('𐕰', &['𐖗']), + ('𐕱', &['𐖘']), + ('𐕲', &['𐖙']), + ('𐕳', &['𐖚']), + ('𐕴', &['𐖛']), + ('𐕵', &['𐖜']), + ('𐕶', &['𐖝']), + ('𐕷', &['𐖞']), + ('𐕸', &['𐖟']), + ('𐕹', &['𐖠']), + ('𐕺', &['𐖡']), + ('𐕼', &['𐖣']), + ('𐕽', &['𐖤']), + ('𐕾', &['𐖥']), + ('𐕿', &['𐖦']), + ('𐖀', &['𐖧']), + ('𐖁', &['𐖨']), + ('𐖂', &['𐖩']), + ('𐖃', &['𐖪']), + ('𐖄', &['𐖫']), + ('𐖅', &['𐖬']), + ('𐖆', &['𐖭']), + ('𐖇', &['𐖮']), + ('𐖈', &['𐖯']), + ('𐖉', &['𐖰']), + ('𐖊', &['𐖱']), + ('𐖌', &['𐖳']), + ('𐖍', &['𐖴']), + ('𐖎', &['𐖵']), + ('𐖏', &['𐖶']), + ('𐖐', &['𐖷']), + ('𐖑', &['𐖸']), + ('𐖒', &['𐖹']), + ('𐖔', &['𐖻']), + ('𐖕', &['𐖼']), + ('𐖗', &['𐕰']), + ('𐖘', &['𐕱']), + ('𐖙', &['𐕲']), + ('𐖚', &['𐕳']), + ('𐖛', &['𐕴']), + ('𐖜', &['𐕵']), + ('𐖝', &['𐕶']), + ('𐖞', &['𐕷']), + ('𐖟', &['𐕸']), + ('𐖠', &['𐕹']), + ('𐖡', &['𐕺']), + ('𐖣', &['𐕼']), + ('𐖤', &['𐕽']), + ('𐖥', &['𐕾']), + ('𐖦', &['𐕿']), + ('𐖧', &['𐖀']), + ('𐖨', &['𐖁']), + ('𐖩', &['𐖂']), + ('𐖪', &['𐖃']), + ('𐖫', &['𐖄']), + ('𐖬', &['𐖅']), + ('𐖭', &['𐖆']), + ('𐖮', &['𐖇']), + ('𐖯', &['𐖈']), + ('𐖰', &['𐖉']), + ('𐖱', &['𐖊']), + ('𐖳', &['𐖌']), + ('𐖴', &['𐖍']), + ('𐖵', &['𐖎']), + ('𐖶', &['𐖏']), + ('𐖷', &['𐖐']), + ('𐖸', &['𐖑']), + ('𐖹', &['𐖒']), + ('𐖻', &['𐖔']), + ('𐖼', &['𐖕']), ('𐲀', &['𐳀']), ('𐲁', &['𐳁']), ('𐲂', &['𐳂']), diff --git a/regex-syntax/src/unicode_tables/general_category.rs b/regex-syntax/src/unicode_tables/general_category.rs index 33b7b7e6e1..8aa6b00788 100644 --- a/regex-syntax/src/unicode_tables/general_category.rs +++ b/regex-syntax/src/unicode_tables/general_category.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate general-category ucd-13.0.0 --chars --exclude surrogate +// ucd-generate general-category /tmp/ucd --chars --exclude surrogate // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Cased_Letter", CASED_LETTER), @@ -116,9 +116,7 @@ pub const CASED_LETTER: &'static [(char, char)] = &[ ('ⅅ', 'ⅉ'), ('ⅎ', 'ⅎ'), ('Ↄ', 'ↄ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⱻ'), + ('Ⰰ', 'ⱻ'), ('Ȿ', 'ⳤ'), ('Ⳬ', 'ⳮ'), ('Ⳳ', 'ⳳ'), @@ -130,12 +128,14 @@ pub const CASED_LETTER: &'static [(char, char)] = &[ ('Ꜣ', 'ꝯ'), ('ꝱ', 'ꞇ'), ('Ꞌ', 'ꞎ'), - ('Ꞑ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', '\u{a7f6}'), + ('Ꞑ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('Ꟶ', 'ꟶ'), ('ꟺ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭠ', '\u{ab68}'), + ('ꭠ', 'ꭨ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -144,6 +144,14 @@ pub const CASED_LETTER: &'static [(char, char)] = &[ ('𐐀', '𐑏'), ('𐒰', '𐓓'), ('𐓘', '𐓻'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𑢠', '𑣟'), @@ -178,6 +186,8 @@ pub const CASED_LETTER: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), + ('𝼀', '𝼉'), + ('𝼋', '𝼞'), ('𞤀', '𞥃'), ]; @@ -225,6 +235,10 @@ pub const CLOSE_PUNCTUATION: &'static [(char, char)] = &[ ('⸥', '⸥'), ('⸧', '⸧'), ('⸩', '⸩'), + ('⹖', '⹖'), + ('⹘', '⹘'), + ('⹚', '⹚'), + ('⹜', '⹜'), ('〉', '〉'), ('》', '》'), ('」', '」'), @@ -266,7 +280,7 @@ pub const CONNECTOR_PUNCTUATION: &'static [(char, char)] = &[ ]; pub const CONTROL: &'static [(char, char)] = - &[('\u{0}', '\u{1f}'), ('\u{7f}', '\u{9f}')]; + &[('\0', '\u{1f}'), ('\u{7f}', '\u{9f}')]; pub const CURRENCY_SYMBOL: &'static [(char, char)] = &[ ('$', '$'), @@ -280,7 +294,7 @@ pub const CURRENCY_SYMBOL: &'static [(char, char)] = &[ ('௹', '௹'), ('฿', '฿'), ('៛', '៛'), - ('₠', '₿'), + ('₠', '⃀'), ('꠸', '꠸'), ('﷼', '﷼'), ('﹩', '﹩'), @@ -303,6 +317,7 @@ pub const DASH_PUNCTUATION: &'static [(char, char)] = &[ ('⸚', '⸚'), ('⸺', '⸻'), ('⹀', '⹀'), + ('⹝', '⹝'), ('〜', '〜'), ('〰', '〰'), ('゠', '゠'), @@ -310,7 +325,7 @@ pub const DASH_PUNCTUATION: &'static [(char, char)] = &[ ('﹘', '﹘'), ('﹣', '﹣'), ('-', '-'), - ('\u{10ead}', '\u{10ead}'), + ('𐺭', '𐺭'), ]; pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ @@ -364,17 +379,18 @@ pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), + ('𖫀', '𖫉'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), ('𞅀', '𞅉'), ('𞋰', '𞋹'), ('𞥐', '𞥙'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🯰', '🯹'), ]; pub const ENCLOSING_MARK: &'static [(char, char)] = &[ @@ -404,6 +420,7 @@ pub const FORMAT: &'static [(char, char)] = &[ ('\u{61c}', '\u{61c}'), ('\u{6dd}', '\u{6dd}'), ('\u{70f}', '\u{70f}'), + ('\u{890}', '\u{891}'), ('\u{8e2}', '\u{8e2}'), ('\u{180e}', '\u{180e}'), ('\u{200b}', '\u{200f}'), @@ -485,8 +502,9 @@ pub const LETTER: &'static [(char, char)] = &[ ('ࠨ', 'ࠨ'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -551,6 +569,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ప', 'హ'), ('ఽ', 'ఽ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('ಀ', 'ಀ'), ('ಅ', 'ಌ'), @@ -559,10 +578,10 @@ pub const LETTER: &'static [(char, char)] = &[ ('ಪ', 'ಳ'), ('ವ', 'ಹ'), ('ಽ', 'ಽ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('\u{d04}', 'ഌ'), + ('ഄ', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -630,9 +649,8 @@ pub const LETTER: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛱ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), + ('ᜀ', 'ᜑ'), + ('ᜟ', 'ᜱ'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -653,7 +671,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ᨠ', 'ᩔ'), ('ᪧ', 'ᪧ'), ('ᬅ', 'ᬳ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('ᮃ', 'ᮠ'), ('ᮮ', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -704,9 +722,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ⅅ', 'ⅉ'), ('ⅎ', 'ⅎ'), ('Ↄ', 'ↄ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳮ'), ('Ⳳ', 'ⳳ'), ('ⴀ', 'ⴥ'), @@ -733,11 +749,10 @@ pub const LETTER: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘟ'), @@ -747,9 +762,11 @@ pub const LETTER: &'static [(char, char)] = &[ ('ꚠ', 'ꛥ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠁ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -786,7 +803,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab69}'), + ('ꭜ', 'ꭩ'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -837,9 +854,20 @@ pub const LETTER: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -870,19 +898,22 @@ pub const LETTER: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀃', '𑀷'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), - ('\u{11147}', '\u{11147}'), + ('𑅇', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -908,7 +939,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -919,15 +950,16 @@ pub const LETTER: &'static [(char, char)] = &[ ('𑚀', '𑚪'), ('𑚸', '𑚸'), ('𑜀', '𑜚'), + ('𑝀', '𑝆'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑦠', '𑦧'), ('𑦪', '𑧐'), ('𑧡', '𑧡'), @@ -938,7 +970,7 @@ pub const LETTER: &'static [(char, char)] = &[ ('𑩐', '𑩐'), ('𑩜', '𑪉'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰮'), ('𑱀', '𑱀'), @@ -952,13 +984,15 @@ pub const LETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭀', '𖭃'), @@ -971,9 +1005,12 @@ pub const LETTER: &'static [(char, char)] = &[ ('𖿠', '𖿡'), ('𖿣', '𖿣'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -1011,10 +1048,16 @@ pub const LETTER: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), + ('𝼀', '𝼞'), ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), ('𞥋', '𞥋'), @@ -1051,13 +1094,13 @@ pub const LETTER: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const LETTER_NUMBER: &'static [(char, char)] = &[ @@ -1510,7 +1553,7 @@ pub const LOWERCASE_LETTER: &'static [(char, char)] = &[ ('ⅆ', 'ⅉ'), ('ⅎ', 'ⅎ'), ('ↄ', 'ↄ'), - ('ⰰ', 'ⱞ'), + ('ⰰ', 'ⱟ'), ('ⱡ', 'ⱡ'), ('ⱥ', 'ⱦ'), ('ⱨ', 'ⱨ'), @@ -1679,19 +1722,29 @@ pub const LOWERCASE_LETTER: &'static [(char, char)] = &[ ('ꞻ', 'ꞻ'), ('ꞽ', 'ꞽ'), ('ꞿ', 'ꞿ'), + ('ꟁ', 'ꟁ'), ('ꟃ', 'ꟃ'), - ('\u{a7c8}', '\u{a7c8}'), - ('\u{a7ca}', '\u{a7ca}'), - ('\u{a7f6}', '\u{a7f6}'), + ('ꟈ', 'ꟈ'), + ('ꟊ', 'ꟊ'), + ('ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟕ'), + ('ꟗ', 'ꟗ'), + ('ꟙ', 'ꟙ'), + ('ꟶ', 'ꟶ'), ('ꟺ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭠ', '\u{ab68}'), + ('ꭠ', 'ꭨ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), ('a', 'z'), ('𐐨', '𐑏'), ('𐓘', '𐓻'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐳀', '𐳲'), ('𑣀', '𑣟'), ('𖹠', '𖹿'), @@ -1723,6 +1776,8 @@ pub const LOWERCASE_LETTER: &'static [(char, char)] = &[ ('𝞪', '𝟂'), ('𝟄', '𝟉'), ('𝟋', '𝟋'), + ('𝼀', '𝼉'), + ('𝼋', '𝼞'), ('𞤢', '𞥃'), ]; @@ -1751,7 +1806,8 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{825}', '\u{827}'), ('\u{829}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{8e1}'), + ('\u{898}', '\u{89f}'), + ('\u{8ca}', '\u{8e1}'), ('\u{8e3}', 'ः'), ('\u{93a}', '\u{93c}'), ('ा', 'ॏ'), @@ -1793,6 +1849,7 @@ pub const MARK: &'static [(char, char)] = &[ ('ொ', '\u{bcd}'), ('\u{bd7}', '\u{bd7}'), ('\u{c00}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -1844,13 +1901,14 @@ pub const MARK: &'static [(char, char)] = &[ ('ႏ', 'ႏ'), ('ႚ', '\u{109d}'), ('\u{135d}', '\u{135f}'), - ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1712}', '᜕'), + ('\u{1732}', '᜴'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), ('\u{1920}', 'ᤫ'), @@ -1859,7 +1917,7 @@ pub const MARK: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('\u{1a60}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1b00}', 'ᬄ'), ('\u{1b34}', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -1872,8 +1930,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('᳷', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{20d0}', '\u{20f0}'), ('\u{2cef}', '\u{2cf1}'), ('\u{2d7f}', '\u{2d7f}'), @@ -1926,10 +1983,14 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '𑂂'), ('𑂰', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{11134}'), ('𑅅', '𑅆'), @@ -1937,7 +1998,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{11180}', '𑆂'), ('𑆳', '𑇀'), ('\u{111c9}', '\u{111cc}'), - ('\u{111ce}', '\u{111cf}'), + ('𑇎', '\u{111cf}'), ('𑈬', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), ('\u{112df}', '\u{112ea}'), @@ -1960,11 +2021,11 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b7}'), ('\u{1171d}', '\u{1172b}'), ('𑠬', '\u{1183a}'), - ('\u{11930}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('\u{11930}', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{1193e}'), - ('\u{11940}', '\u{11940}'), - ('\u{11942}', '\u{11943}'), + ('𑥀', '𑥀'), + ('𑥂', '\u{11943}'), ('𑧑', '\u{119d7}'), ('\u{119da}', '\u{119e0}'), ('𑧤', '𑧤'), @@ -1993,8 +2054,10 @@ pub const MARK: &'static [(char, char)] = &[ ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), ('\u{16fe4}', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -2013,6 +2076,7 @@ pub const MARK: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), @@ -2102,6 +2166,7 @@ pub const MODIFIER_LETTER: &'static [(char, char)] = &[ ('ࠚ', 'ࠚ'), ('ࠤ', 'ࠤ'), ('ࠨ', 'ࠨ'), + ('ࣉ', 'ࣉ'), ('ॱ', 'ॱ'), ('ๆ', 'ๆ'), ('ໆ', 'ໆ'), @@ -2132,6 +2197,7 @@ pub const MODIFIER_LETTER: &'static [(char, char)] = &[ ('ꜗ', 'ꜟ'), ('ꝰ', 'ꝰ'), ('ꞈ', 'ꞈ'), + ('ꟲ', 'ꟴ'), ('ꟸ', 'ꟹ'), ('ꧏ', 'ꧏ'), ('ꧦ', 'ꧦ'), @@ -2139,13 +2205,19 @@ pub const MODIFIER_LETTER: &'static [(char, char)] = &[ ('ꫝ', 'ꫝ'), ('ꫳ', 'ꫴ'), ('ꭜ', 'ꭟ'), - ('\u{ab69}', '\u{ab69}'), + ('ꭩ', 'ꭩ'), ('ー', 'ー'), ('\u{ff9e}', '\u{ff9f}'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𖭀', '𖭃'), ('𖾓', '𖾟'), ('𖿠', '𖿡'), ('𖿣', '𖿣'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), ('𞄷', '𞄽'), ('𞥋', '𞥋'), ]; @@ -2164,6 +2236,7 @@ pub const MODIFIER_SYMBOL: &'static [(char, char)] = &[ ('˯', '˿'), ('͵', '͵'), ('΄', '΅'), + ('࢈', '࢈'), ('᾽', '᾽'), ('᾿', '῁'), ('῍', '῏'), @@ -2175,8 +2248,8 @@ pub const MODIFIER_SYMBOL: &'static [(char, char)] = &[ ('꜠', '꜡'), ('꞉', '꞊'), ('꭛', '꭛'), - ('\u{ab6a}', '\u{ab6b}'), - ('﮲', '﯁'), + ('꭪', '꭫'), + ('﮲', '﯂'), ('^', '^'), ('`', '`'), (' ̄', ' ̄'), @@ -2208,7 +2281,8 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{825}', '\u{827}'), ('\u{829}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{8e1}'), + ('\u{898}', '\u{89f}'), + ('\u{8ca}', '\u{8e1}'), ('\u{8e3}', '\u{902}'), ('\u{93a}', '\u{93a}'), ('\u{93c}', '\u{93c}'), @@ -2249,6 +2323,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{bcd}', '\u{bcd}'), ('\u{c00}', '\u{c00}'), ('\u{c04}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', '\u{c40}'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -2298,7 +2373,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{109d}', '\u{109d}'), ('\u{135d}', '\u{135f}'), ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1732}', '\u{1733}'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17b5}'), @@ -2307,6 +2382,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{17c9}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), ('\u{1920}', '\u{1922}'), @@ -2323,7 +2399,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), ('\u{1ab0}', '\u{1abd}'), - ('\u{1abf}', '\u{1ac0}'), + ('\u{1abf}', '\u{1ace}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b34}'), ('\u{1b36}', '\u{1b3a}'), @@ -2346,8 +2422,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('\u{1cf8}', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{20d0}', '\u{20dc}'), ('\u{20e1}', '\u{20e1}'), ('\u{20e5}', '\u{20f0}'), @@ -2406,11 +2481,15 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '\u{11081}'), ('\u{110b3}', '\u{110b6}'), ('\u{110b9}', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{1112b}'), ('\u{1112d}', '\u{11134}'), @@ -2490,6 +2569,8 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{16f8f}', '\u{16f92}'), ('\u{16fe4}', '\u{16fe4}'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d167}', '\u{1d169}'), ('\u{1d17b}', '\u{1d182}'), ('\u{1d185}', '\u{1d18b}'), @@ -2507,6 +2588,7 @@ pub const NONSPACING_MARK: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), @@ -2610,7 +2692,7 @@ pub const NUMBER: &'static [(char, char)] = &[ ('𐹠', '𐹾'), ('𐼝', '𐼦'), ('𐽑', '𐽔'), - ('\u{10fc5}', '\u{10fcb}'), + ('𐿅', '𐿋'), ('𑁒', '𑁯'), ('𑃰', '𑃹'), ('𑄶', '𑄿'), @@ -2623,13 +2705,14 @@ pub const NUMBER: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜻'), ('𑣠', '𑣲'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑱐', '𑱬'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𑿀', '𑿔'), ('𒐀', '𒑮'), ('𖩠', '𖩩'), + ('𖫀', '𖫉'), ('𖭐', '𖭙'), ('𖭛', '𖭡'), ('𖺀', '𖺖'), @@ -2646,7 +2729,7 @@ pub const NUMBER: &'static [(char, char)] = &[ ('𞴁', '𞴭'), ('𞴯', '𞴽'), ('🄀', '🄌'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🯰', '🯹'), ]; pub const OPEN_PUNCTUATION: &'static [(char, char)] = &[ @@ -2696,6 +2779,10 @@ pub const OPEN_PUNCTUATION: &'static [(char, char)] = &[ ('⸦', '⸦'), ('⸨', '⸨'), ('⹂', '⹂'), + ('⹕', '⹕'), + ('⹗', '⹗'), + ('⹙', '⹙'), + ('⹛', '⹛'), ('〈', '〈'), ('《', '《'), ('「', '「'), @@ -2728,7 +2815,7 @@ pub const OPEN_PUNCTUATION: &'static [(char, char)] = &[ ]; pub const OTHER: &'static [(char, char)] = &[ - ('\u{0}', '\u{1f}'), + ('\0', '\u{1f}'), ('\u{7f}', '\u{9f}'), ('\u{ad}', '\u{ad}'), ('\u{378}', '\u{379}'), @@ -2743,7 +2830,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{5c8}', '\u{5cf}'), ('\u{5eb}', '\u{5ee}'), ('\u{5f5}', '\u{605}'), - ('\u{61c}', '\u{61d}'), + ('\u{61c}', '\u{61c}'), ('\u{6dd}', '\u{6dd}'), ('\u{70e}', '\u{70f}'), ('\u{74b}', '\u{74c}'), @@ -2753,9 +2840,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{83f}', '\u{83f}'), ('\u{85c}', '\u{85d}'), ('\u{85f}', '\u{85f}'), - ('\u{86b}', '\u{89f}'), - ('\u{8b5}', '\u{8b5}'), - ('\u{8c8}', '\u{8d2}'), + ('\u{86b}', '\u{86f}'), + ('\u{88f}', '\u{897}'), ('\u{8e2}', '\u{8e2}'), ('\u{984}', '\u{984}'), ('\u{98d}', '\u{98e}'), @@ -2834,12 +2920,13 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{c0d}', '\u{c0d}'), ('\u{c11}', '\u{c11}'), ('\u{c29}', '\u{c29}'), - ('\u{c3a}', '\u{c3c}'), + ('\u{c3a}', '\u{c3b}'), ('\u{c45}', '\u{c45}'), ('\u{c49}', '\u{c49}'), ('\u{c4e}', '\u{c54}'), ('\u{c57}', '\u{c57}'), - ('\u{c5b}', '\u{c5f}'), + ('\u{c5b}', '\u{c5c}'), + ('\u{c5e}', '\u{c5f}'), ('\u{c64}', '\u{c65}'), ('\u{c70}', '\u{c76}'), ('\u{c8d}', '\u{c8d}'), @@ -2850,7 +2937,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{cc5}', '\u{cc5}'), ('\u{cc9}', '\u{cc9}'), ('\u{cce}', '\u{cd4}'), - ('\u{cd7}', '\u{cdd}'), + ('\u{cd7}', '\u{cdc}'), ('\u{cdf}', '\u{cdf}'), ('\u{ce4}', '\u{ce5}'), ('\u{cf0}', '\u{cf0}'), @@ -2918,8 +3005,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{13fe}', '\u{13ff}'), ('\u{169d}', '\u{169f}'), ('\u{16f9}', '\u{16ff}'), - ('\u{170d}', '\u{170d}'), - ('\u{1715}', '\u{171f}'), + ('\u{1716}', '\u{171e}'), ('\u{1737}', '\u{173f}'), ('\u{1754}', '\u{175f}'), ('\u{176d}', '\u{176d}'), @@ -2928,7 +3014,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{17de}', '\u{17df}'), ('\u{17ea}', '\u{17ef}'), ('\u{17fa}', '\u{17ff}'), - ('\u{180e}', '\u{180f}'), + ('\u{180e}', '\u{180e}'), ('\u{181a}', '\u{181f}'), ('\u{1879}', '\u{187f}'), ('\u{18ab}', '\u{18af}'), @@ -2948,9 +3034,9 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1a8a}', '\u{1a8f}'), ('\u{1a9a}', '\u{1a9f}'), ('\u{1aae}', '\u{1aaf}'), - ('\u{1ac1}', '\u{1aff}'), - ('\u{1b4c}', '\u{1b4f}'), - ('\u{1b7d}', '\u{1b7f}'), + ('\u{1acf}', '\u{1aff}'), + ('\u{1b4d}', '\u{1b4f}'), + ('\u{1b7f}', '\u{1b7f}'), ('\u{1bf4}', '\u{1bfb}'), ('\u{1c38}', '\u{1c3a}'), ('\u{1c4a}', '\u{1c4c}'), @@ -2958,7 +3044,6 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1cbb}', '\u{1cbc}'), ('\u{1cc8}', '\u{1ccf}'), ('\u{1cfb}', '\u{1cff}'), - ('\u{1dfa}', '\u{1dfa}'), ('\u{1f16}', '\u{1f17}'), ('\u{1f1e}', '\u{1f1f}'), ('\u{1f46}', '\u{1f47}'), @@ -2981,15 +3066,13 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{2072}', '\u{2073}'), ('\u{208f}', '\u{208f}'), ('\u{209d}', '\u{209f}'), - ('\u{20c0}', '\u{20cf}'), + ('\u{20c1}', '\u{20cf}'), ('\u{20f1}', '\u{20ff}'), ('\u{218c}', '\u{218f}'), ('\u{2427}', '\u{243f}'), ('\u{244b}', '\u{245f}'), ('\u{2b74}', '\u{2b75}'), ('\u{2b96}', '\u{2b96}'), - ('\u{2c2f}', '\u{2c2f}'), - ('\u{2c5f}', '\u{2c5f}'), ('\u{2cf4}', '\u{2cf8}'), ('\u{2d26}', '\u{2d26}'), ('\u{2d28}', '\u{2d2c}'), @@ -3005,7 +3088,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{2dcf}', '\u{2dcf}'), ('\u{2dd7}', '\u{2dd7}'), ('\u{2ddf}', '\u{2ddf}'), - ('\u{2e53}', '\u{2e7f}'), + ('\u{2e5e}', '\u{2e7f}'), ('\u{2e9a}', '\u{2e9a}'), ('\u{2ef4}', '\u{2eff}'), ('\u{2fd6}', '\u{2fef}'), @@ -3017,13 +3100,14 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{318f}', '\u{318f}'), ('\u{31e4}', '\u{31ef}'), ('\u{321f}', '\u{321f}'), - ('\u{9ffd}', '\u{9fff}'), ('\u{a48d}', '\u{a48f}'), ('\u{a4c7}', '\u{a4cf}'), ('\u{a62c}', '\u{a63f}'), ('\u{a6f8}', '\u{a6ff}'), - ('\u{a7c0}', '\u{a7c1}'), - ('\u{a7cb}', '\u{a7f4}'), + ('\u{a7cb}', '\u{a7cf}'), + ('\u{a7d2}', '\u{a7d2}'), + ('\u{a7d4}', '\u{a7d4}'), + ('\u{a7da}', '\u{a7f1}'), ('\u{a82d}', '\u{a82f}'), ('\u{a83a}', '\u{a83f}'), ('\u{a878}', '\u{a87f}'), @@ -3059,11 +3143,10 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{fb3f}', '\u{fb3f}'), ('\u{fb42}', '\u{fb42}'), ('\u{fb45}', '\u{fb45}'), - ('\u{fbc2}', '\u{fbd2}'), - ('\u{fd40}', '\u{fd4f}'), + ('\u{fbc3}', '\u{fbd2}'), ('\u{fd90}', '\u{fd91}'), - ('\u{fdc8}', '\u{fdef}'), - ('\u{fdfe}', '\u{fdff}'), + ('\u{fdc8}', '\u{fdce}'), + ('\u{fdd0}', '\u{fdef}'), ('\u{fe1a}', '\u{fe1f}'), ('\u{fe53}', '\u{fe53}'), ('\u{fe67}', '\u{fe67}'), @@ -3106,10 +3189,20 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{104fc}', '\u{104ff}'), ('\u{10528}', '\u{1052f}'), ('\u{10564}', '\u{1056e}'), - ('\u{10570}', '\u{105ff}'), + ('\u{1057b}', '\u{1057b}'), + ('\u{1058b}', '\u{1058b}'), + ('\u{10593}', '\u{10593}'), + ('\u{10596}', '\u{10596}'), + ('\u{105a2}', '\u{105a2}'), + ('\u{105b2}', '\u{105b2}'), + ('\u{105ba}', '\u{105ba}'), + ('\u{105bd}', '\u{105ff}'), ('\u{10737}', '\u{1073f}'), ('\u{10756}', '\u{1075f}'), - ('\u{10768}', '\u{107ff}'), + ('\u{10768}', '\u{1077f}'), + ('\u{10786}', '\u{10786}'), + ('\u{107b1}', '\u{107b1}'), + ('\u{107bb}', '\u{107ff}'), ('\u{10806}', '\u{10807}'), ('\u{10809}', '\u{10809}'), ('\u{10836}', '\u{10836}'), @@ -3152,13 +3245,14 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{10eae}', '\u{10eaf}'), ('\u{10eb2}', '\u{10eff}'), ('\u{10f28}', '\u{10f2f}'), - ('\u{10f5a}', '\u{10faf}'), + ('\u{10f5a}', '\u{10f6f}'), + ('\u{10f8a}', '\u{10faf}'), ('\u{10fcc}', '\u{10fdf}'), ('\u{10ff7}', '\u{10fff}'), ('\u{1104e}', '\u{11051}'), - ('\u{11070}', '\u{1107e}'), + ('\u{11076}', '\u{1107e}'), ('\u{110bd}', '\u{110bd}'), - ('\u{110c2}', '\u{110cf}'), + ('\u{110c3}', '\u{110cf}'), ('\u{110e9}', '\u{110ef}'), ('\u{110fa}', '\u{110ff}'), ('\u{11135}', '\u{11135}'), @@ -3199,11 +3293,11 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{11645}', '\u{1164f}'), ('\u{1165a}', '\u{1165f}'), ('\u{1166d}', '\u{1167f}'), - ('\u{116b9}', '\u{116bf}'), + ('\u{116ba}', '\u{116bf}'), ('\u{116ca}', '\u{116ff}'), ('\u{1171b}', '\u{1171c}'), ('\u{1172c}', '\u{1172f}'), - ('\u{11740}', '\u{117ff}'), + ('\u{11747}', '\u{117ff}'), ('\u{1183c}', '\u{1189f}'), ('\u{118f3}', '\u{118fe}'), ('\u{11907}', '\u{11908}'), @@ -3218,7 +3312,7 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{119d8}', '\u{119d9}'), ('\u{119e5}', '\u{119ff}'), ('\u{11a48}', '\u{11a4f}'), - ('\u{11aa3}', '\u{11abf}'), + ('\u{11aa3}', '\u{11aaf}'), ('\u{11af9}', '\u{11bff}'), ('\u{11c09}', '\u{11c09}'), ('\u{11c37}', '\u{11c37}'), @@ -3246,13 +3340,15 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1239a}', '\u{123ff}'), ('\u{1246f}', '\u{1246f}'), ('\u{12475}', '\u{1247f}'), - ('\u{12544}', '\u{12fff}'), + ('\u{12544}', '\u{12f8f}'), + ('\u{12ff3}', '\u{12fff}'), ('\u{1342f}', '\u{143ff}'), ('\u{14647}', '\u{167ff}'), ('\u{16a39}', '\u{16a3f}'), ('\u{16a5f}', '\u{16a5f}'), ('\u{16a6a}', '\u{16a6d}'), - ('\u{16a70}', '\u{16acf}'), + ('\u{16abf}', '\u{16abf}'), + ('\u{16aca}', '\u{16acf}'), ('\u{16aee}', '\u{16aef}'), ('\u{16af6}', '\u{16aff}'), ('\u{16b46}', '\u{16b4f}'), @@ -3268,8 +3364,11 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{16ff2}', '\u{16fff}'), ('\u{187f8}', '\u{187ff}'), ('\u{18cd6}', '\u{18cff}'), - ('\u{18d09}', '\u{1afff}'), - ('\u{1b11f}', '\u{1b14f}'), + ('\u{18d09}', '\u{1afef}'), + ('\u{1aff4}', '\u{1aff4}'), + ('\u{1affc}', '\u{1affc}'), + ('\u{1afff}', '\u{1afff}'), + ('\u{1b123}', '\u{1b14f}'), ('\u{1b153}', '\u{1b163}'), ('\u{1b168}', '\u{1b16f}'), ('\u{1b2fc}', '\u{1bbff}'), @@ -3277,11 +3376,14 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1bc7d}', '\u{1bc7f}'), ('\u{1bc89}', '\u{1bc8f}'), ('\u{1bc9a}', '\u{1bc9b}'), - ('\u{1bca0}', '\u{1cfff}'), + ('\u{1bca0}', '\u{1ceff}'), + ('\u{1cf2e}', '\u{1cf2f}'), + ('\u{1cf47}', '\u{1cf4f}'), + ('\u{1cfc4}', '\u{1cfff}'), ('\u{1d0f6}', '\u{1d0ff}'), ('\u{1d127}', '\u{1d128}'), ('\u{1d173}', '\u{1d17a}'), - ('\u{1d1e9}', '\u{1d1ff}'), + ('\u{1d1eb}', '\u{1d1ff}'), ('\u{1d246}', '\u{1d2df}'), ('\u{1d2f4}', '\u{1d2ff}'), ('\u{1d357}', '\u{1d35f}'), @@ -3308,7 +3410,8 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1d7cc}', '\u{1d7cd}'), ('\u{1da8c}', '\u{1da9a}'), ('\u{1daa0}', '\u{1daa0}'), - ('\u{1dab0}', '\u{1dfff}'), + ('\u{1dab0}', '\u{1deff}'), + ('\u{1df1f}', '\u{1dfff}'), ('\u{1e007}', '\u{1e007}'), ('\u{1e019}', '\u{1e01a}'), ('\u{1e022}', '\u{1e022}'), @@ -3317,9 +3420,14 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1e12d}', '\u{1e12f}'), ('\u{1e13e}', '\u{1e13f}'), ('\u{1e14a}', '\u{1e14d}'), - ('\u{1e150}', '\u{1e2bf}'), + ('\u{1e150}', '\u{1e28f}'), + ('\u{1e2af}', '\u{1e2bf}'), ('\u{1e2fa}', '\u{1e2fe}'), - ('\u{1e300}', '\u{1e7ff}'), + ('\u{1e300}', '\u{1e7df}'), + ('\u{1e7e7}', '\u{1e7e7}'), + ('\u{1e7ec}', '\u{1e7ec}'), + ('\u{1e7ef}', '\u{1e7ef}'), + ('\u{1e7ff}', '\u{1e7ff}'), ('\u{1e8c5}', '\u{1e8c6}'), ('\u{1e8d7}', '\u{1e8ff}'), ('\u{1e94c}', '\u{1e94f}'), @@ -3373,34 +3481,35 @@ pub const OTHER: &'static [(char, char)] = &[ ('\u{1f249}', '\u{1f24f}'), ('\u{1f252}', '\u{1f25f}'), ('\u{1f266}', '\u{1f2ff}'), - ('\u{1f6d8}', '\u{1f6df}'), + ('\u{1f6d8}', '\u{1f6dc}'), ('\u{1f6ed}', '\u{1f6ef}'), ('\u{1f6fd}', '\u{1f6ff}'), ('\u{1f774}', '\u{1f77f}'), ('\u{1f7d9}', '\u{1f7df}'), - ('\u{1f7ec}', '\u{1f7ff}'), + ('\u{1f7ec}', '\u{1f7ef}'), + ('\u{1f7f1}', '\u{1f7ff}'), ('\u{1f80c}', '\u{1f80f}'), ('\u{1f848}', '\u{1f84f}'), ('\u{1f85a}', '\u{1f85f}'), ('\u{1f888}', '\u{1f88f}'), ('\u{1f8ae}', '\u{1f8af}'), ('\u{1f8b2}', '\u{1f8ff}'), - ('\u{1f979}', '\u{1f979}'), - ('\u{1f9cc}', '\u{1f9cc}'), ('\u{1fa54}', '\u{1fa5f}'), ('\u{1fa6e}', '\u{1fa6f}'), ('\u{1fa75}', '\u{1fa77}'), - ('\u{1fa7b}', '\u{1fa7f}'), + ('\u{1fa7d}', '\u{1fa7f}'), ('\u{1fa87}', '\u{1fa8f}'), - ('\u{1faa9}', '\u{1faaf}'), - ('\u{1fab7}', '\u{1fabf}'), - ('\u{1fac3}', '\u{1facf}'), - ('\u{1fad7}', '\u{1faff}'), + ('\u{1faad}', '\u{1faaf}'), + ('\u{1fabb}', '\u{1fabf}'), + ('\u{1fac6}', '\u{1facf}'), + ('\u{1fada}', '\u{1fadf}'), + ('\u{1fae8}', '\u{1faef}'), + ('\u{1faf7}', '\u{1faff}'), ('\u{1fb93}', '\u{1fb93}'), ('\u{1fbcb}', '\u{1fbef}'), ('\u{1fbfa}', '\u{1ffff}'), - ('\u{2a6de}', '\u{2a6ff}'), - ('\u{2b735}', '\u{2b73f}'), + ('\u{2a6e0}', '\u{2a6ff}'), + ('\u{2b739}', '\u{2b73f}'), ('\u{2b81e}', '\u{2b81f}'), ('\u{2cea2}', '\u{2ceaf}'), ('\u{2ebe1}', '\u{2f7ff}'), @@ -3433,8 +3542,9 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ࠀ', 'ࠕ'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣈ'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -3499,6 +3609,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ప', 'హ'), ('ఽ', 'ఽ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('ಀ', 'ಀ'), ('ಅ', 'ಌ'), @@ -3507,10 +3618,10 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ಪ', 'ಳ'), ('ವ', 'ಹ'), ('ಽ', 'ಽ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('\u{d04}', 'ഌ'), + ('ഄ', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -3571,9 +3682,8 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛱ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), + ('ᜀ', 'ᜑ'), + ('ᜟ', 'ᜱ'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -3593,7 +3703,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ᨀ', 'ᨖ'), ('ᨠ', 'ᩔ'), ('ᬅ', 'ᬳ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('ᮃ', 'ᮠ'), ('ᮮ', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -3623,11 +3733,10 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('ヿ', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꀔ'), + ('㐀', '䶿'), + ('一', 'ꀔ'), ('ꀖ', 'ꒌ'), ('ꓐ', 'ꓷ'), ('ꔀ', 'ꘋ'), @@ -3750,19 +3859,22 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𐮀', '𐮑'), ('𐰀', '𐱈'), ('𐴀', '𐴣'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀃', '𑀷'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), - ('\u{11147}', '\u{11147}'), + ('𑅇', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -3788,7 +3900,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -3799,14 +3911,15 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𑚀', '𑚪'), ('𑚸', '𑚸'), ('𑜀', '𑜚'), + ('𑝀', '𑝆'), ('𑠀', '𑠫'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑦠', '𑦧'), ('𑦪', '𑧐'), ('𑧡', '𑧡'), @@ -3817,7 +3930,7 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𑩐', '𑩐'), ('𑩜', '𑪉'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰮'), ('𑱀', '𑱀'), @@ -3831,13 +3944,15 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭣', '𖭷'), @@ -3845,9 +3960,9 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𖼀', '𖽊'), ('𖽐', '𖽐'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -3855,9 +3970,15 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𛱰', '𛱼'), ('𛲀', '𛲈'), ('𛲐', '𛲙'), + ('𝼊', '𝼊'), ('𞄀', '𞄬'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞸀', '𞸃'), ('𞸅', '𞸟'), @@ -3892,13 +4013,13 @@ pub const OTHER_LETTER: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const OTHER_NUMBER: &'static [(char, char)] = &[ @@ -3955,7 +4076,7 @@ pub const OTHER_NUMBER: &'static [(char, char)] = &[ ('𐹠', '𐹾'), ('𐼝', '𐼦'), ('𐽑', '𐽔'), - ('\u{10fc5}', '\u{10fcb}'), + ('𐿅', '𐿋'), ('𑁒', '𑁥'), ('𑇡', '𑇴'), ('𑜺', '𑜻'), @@ -3999,7 +4120,7 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('؉', '؊'), ('،', '؍'), ('؛', '؛'), - ('؞', '؟'), + ('؝', '؟'), ('٪', '٭'), ('۔', '۔'), ('܀', '܍'), @@ -4036,6 +4157,7 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('᪠', '᪦'), ('᪨', '᪭'), ('᭚', '᭠'), + ('᭽', '᭾'), ('᯼', '᯿'), ('᰻', '᰿'), ('᱾', '᱿'), @@ -4064,7 +4186,7 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('⸼', '⸿'), ('⹁', '⹁'), ('⹃', '⹏'), - ('\u{2e52}', '\u{2e52}'), + ('⹒', '⹔'), ('、', '〃'), ('〽', '〽'), ('・', '・'), @@ -4118,6 +4240,7 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('𐬹', '𐬿'), ('𐮙', '𐮜'), ('𐽕', '𐽙'), + ('𐾆', '𐾉'), ('𑁇', '𑁍'), ('𑂻', '𑂼'), ('𑂾', '𑃁'), @@ -4130,15 +4253,16 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('𑈸', '𑈽'), ('𑊩', '𑊩'), ('𑑋', '𑑏'), - ('\u{1145a}', '𑑛'), + ('𑑚', '𑑛'), ('𑑝', '𑑝'), ('𑓆', '𑓆'), ('𑗁', '𑗗'), ('𑙁', '𑙃'), ('𑙠', '𑙬'), + ('𑚹', '𑚹'), ('𑜼', '𑜾'), ('𑠻', '𑠻'), - ('\u{11944}', '\u{11946}'), + ('𑥄', '𑥆'), ('𑧢', '𑧢'), ('𑨿', '𑩆'), ('𑪚', '𑪜'), @@ -4148,6 +4272,7 @@ pub const OTHER_PUNCTUATION: &'static [(char, char)] = &[ ('𑻷', '𑻸'), ('𑿿', '𑿿'), ('𒑰', '𒑴'), + ('𒿱', '𒿲'), ('𖩮', '𖩯'), ('𖫵', '𖫵'), ('𖬷', '𖬻'), @@ -4240,9 +4365,9 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('⭅', '⭆'), ('⭍', '⭳'), ('⭶', '⮕'), - ('\u{2b97}', '⯿'), + ('⮗', '⯿'), ('⳥', '⳪'), - ('\u{2e50}', '\u{2e51}'), + ('⹐', '⹑'), ('⺀', '⺙'), ('⺛', '⻳'), ('⼀', '⿕'), @@ -4267,7 +4392,9 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('꠶', '꠷'), ('꠹', '꠹'), ('꩷', '꩹'), - ('﷽', '﷽'), + ('﵀', '﵏'), + ('﷏', '﷏'), + ('﷽', '﷿'), ('¦', '¦'), ('│', '│'), ('■', '○'), @@ -4275,7 +4402,7 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('𐄷', '𐄿'), ('𐅹', '𐆉'), ('𐆌', '𐆎'), - ('𐆐', '\u{1019c}'), + ('𐆐', '𐆜'), ('𐆠', '𐆠'), ('𐇐', '𐇼'), ('𐡷', '𐡸'), @@ -4286,13 +4413,14 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('𖬼', '𖬿'), ('𖭅', '𖭅'), ('𛲜', '𛲜'), + ('𜽐', '𜿃'), ('𝀀', '𝃵'), ('𝄀', '𝄦'), ('𝄩', '𝅘𝅥𝅲'), ('𝅪', '𝅬'), ('𝆃', '𝆄'), ('𝆌', '𝆩'), - ('𝆮', '𝇨'), + ('𝆮', '𝇪'), ('𝈀', '𝉁'), ('𝉅', '𝉅'), ('𝌀', '𝍖'), @@ -4310,38 +4438,39 @@ pub const OTHER_SYMBOL: &'static [(char, char)] = &[ ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('\u{1f10d}', '\u{1f1ad}'), + ('🄍', '🆭'), ('🇦', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), ('🌀', '🏺'), - ('🐀', '\u{1f6d7}'), - ('🛠', '🛬'), - ('🛰', '\u{1f6fc}'), + ('🐀', '🛗'), + ('🛝', '🛬'), + ('🛰', '🛼'), ('🜀', '🝳'), ('🞀', '🟘'), ('🟠', '🟫'), + ('🟰', '🟰'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('\u{1f8b0}', '\u{1f8b1}'), - ('🤀', '\u{1f978}'), - ('🥺', '\u{1f9cb}'), - ('🧍', '🩓'), + ('🢰', '🢱'), + ('🤀', '🩓'), ('🩠', '🩭'), - ('🩰', '\u{1fa74}'), - ('🩸', '🩺'), - ('🪀', '\u{1fa86}'), - ('🪐', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), - ('\u{1fb00}', '\u{1fb92}'), - ('\u{1fb94}', '\u{1fbca}'), + ('🩰', '🩴'), + ('🩸', '🩼'), + ('🪀', '🪆'), + ('🪐', '🪬'), + ('🪰', '🪺'), + ('🫀', '🫅'), + ('🫐', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), + ('🬀', '🮒'), + ('🮔', '🯊'), ]; pub const PARAGRAPH_SEPARATOR: &'static [(char, char)] = @@ -4381,7 +4510,7 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('؉', '؊'), ('،', '؍'), ('؛', '؛'), - ('؞', '؟'), + ('؝', '؟'), ('٪', '٭'), ('۔', '۔'), ('܀', '܍'), @@ -4420,6 +4549,7 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('᪠', '᪦'), ('᪨', '᪭'), ('᭚', '᭠'), + ('᭽', '᭾'), ('᯼', '᯿'), ('᰻', '᰿'), ('᱾', '᱿'), @@ -4444,7 +4574,7 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('⵰', '⵰'), ('⸀', '⸮'), ('⸰', '⹏'), - ('\u{2e52}', '\u{2e52}'), + ('⹒', '⹝'), ('、', '〃'), ('〈', '】'), ('〔', '〟'), @@ -4498,8 +4628,9 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('𐫰', '𐫶'), ('𐬹', '𐬿'), ('𐮙', '𐮜'), - ('\u{10ead}', '\u{10ead}'), + ('𐺭', '𐺭'), ('𐽕', '𐽙'), + ('𐾆', '𐾉'), ('𑁇', '𑁍'), ('𑂻', '𑂼'), ('𑂾', '𑃁'), @@ -4512,15 +4643,16 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('𑈸', '𑈽'), ('𑊩', '𑊩'), ('𑑋', '𑑏'), - ('\u{1145a}', '𑑛'), + ('𑑚', '𑑛'), ('𑑝', '𑑝'), ('𑓆', '𑓆'), ('𑗁', '𑗗'), ('𑙁', '𑙃'), ('𑙠', '𑙬'), + ('𑚹', '𑚹'), ('𑜼', '𑜾'), ('𑠻', '𑠻'), - ('\u{11944}', '\u{11946}'), + ('𑥄', '𑥆'), ('𑧢', '𑧢'), ('𑨿', '𑩆'), ('𑪚', '𑪜'), @@ -4530,6 +4662,7 @@ pub const PUNCTUATION: &'static [(char, char)] = &[ ('𑻷', '𑻸'), ('𑿿', '𑿿'), ('𒑰', '𒑴'), + ('𒿱', '𒿲'), ('𖩮', '𖩯'), ('𖫵', '𖫵'), ('𖬷', '𖬻'), @@ -4620,6 +4753,8 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('ႇ', 'ႌ'), ('ႏ', 'ႏ'), ('ႚ', 'ႜ'), + ('᜕', '᜕'), + ('᜴', '᜴'), ('ា', 'ា'), ('ើ', 'ៅ'), ('ះ', 'ៈ'), @@ -4682,7 +4817,7 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('𑆂', '𑆂'), ('𑆳', '𑆵'), ('𑆿', '𑇀'), - ('\u{111ce}', '\u{111ce}'), + ('𑇎', '𑇎'), ('𑈬', '𑈮'), ('𑈲', '𑈳'), ('𑈵', '𑈵'), @@ -4714,11 +4849,11 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('𑜦', '𑜦'), ('𑠬', '𑠮'), ('𑠸', '𑠸'), - ('\u{11930}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), - ('\u{1193d}', '\u{1193d}'), - ('\u{11940}', '\u{11940}'), - ('\u{11942}', '\u{11942}'), + ('\u{11930}', '𑤵'), + ('𑤷', '𑤸'), + ('𑤽', '𑤽'), + ('𑥀', '𑥀'), + ('𑥂', '𑥂'), ('𑧑', '𑧓'), ('𑧜', '𑧟'), ('𑧤', '𑧤'), @@ -4735,7 +4870,7 @@ pub const SPACING_MARK: &'static [(char, char)] = &[ ('𑶖', '𑶖'), ('𑻵', '𑻶'), ('𖽑', '𖾇'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('\u{1d165}', '𝅦'), ('𝅭', '\u{1d172}'), ]; @@ -4774,6 +4909,7 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('۽', '۾'), ('߶', '߶'), ('߾', '߿'), + ('࢈', '࢈'), ('৲', '৳'), ('৺', '৻'), ('૱', '૱'), @@ -4812,7 +4948,7 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('⁒', '⁒'), ('⁺', '⁼'), ('₊', '₌'), - ('₠', '₿'), + ('₠', '⃀'), ('℀', '℁'), ('℃', '℆'), ('℈', '℉'), @@ -4841,9 +4977,9 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('⧜', '⧻'), ('⧾', '⭳'), ('⭶', '⮕'), - ('\u{2b97}', '⯿'), + ('⮗', '⯿'), ('⳥', '⳪'), - ('\u{2e50}', '\u{2e51}'), + ('⹐', '⹑'), ('⺀', '⺙'), ('⺛', '⻳'), ('⼀', '⿕'), @@ -4872,10 +5008,12 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('꠶', '꠹'), ('꩷', '꩹'), ('꭛', '꭛'), - ('\u{ab6a}', '\u{ab6b}'), + ('꭪', '꭫'), ('﬩', '﬩'), - ('﮲', '﯁'), - ('﷼', '﷽'), + ('﮲', '﯂'), + ('﵀', '﵏'), + ('﷏', '﷏'), + ('﷼', '﷿'), ('﹢', '﹢'), ('﹤', '﹦'), ('﹩', '﹩'), @@ -4892,7 +5030,7 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('𐄷', '𐄿'), ('𐅹', '𐆉'), ('𐆌', '𐆎'), - ('𐆐', '\u{1019c}'), + ('𐆐', '𐆜'), ('𐆠', '𐆠'), ('𐇐', '𐇼'), ('𐡷', '𐡸'), @@ -4902,13 +5040,14 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('𖬼', '𖬿'), ('𖭅', '𖭅'), ('𛲜', '𛲜'), + ('𜽐', '𜿃'), ('𝀀', '𝃵'), ('𝄀', '𝄦'), ('𝄩', '𝅘𝅥𝅲'), ('𝅪', '𝅬'), ('𝆃', '𝆄'), ('𝆌', '𝆩'), - ('𝆮', '𝇨'), + ('𝆮', '𝇪'), ('𝈀', '𝉁'), ('𝉅', '𝉅'), ('𝌀', '𝍖'), @@ -4939,37 +5078,38 @@ pub const SYMBOL: &'static [(char, char)] = &[ ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('\u{1f10d}', '\u{1f1ad}'), + ('🄍', '🆭'), ('🇦', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), - ('🌀', '\u{1f6d7}'), - ('🛠', '🛬'), - ('🛰', '\u{1f6fc}'), + ('🌀', '🛗'), + ('🛝', '🛬'), + ('🛰', '🛼'), ('🜀', '🝳'), ('🞀', '🟘'), ('🟠', '🟫'), + ('🟰', '🟰'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('\u{1f8b0}', '\u{1f8b1}'), - ('🤀', '\u{1f978}'), - ('🥺', '\u{1f9cb}'), - ('🧍', '🩓'), + ('🢰', '🢱'), + ('🤀', '🩓'), ('🩠', '🩭'), - ('🩰', '\u{1fa74}'), - ('🩸', '🩺'), - ('🪀', '\u{1fa86}'), - ('🪐', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), - ('\u{1fb00}', '\u{1fb92}'), - ('\u{1fb94}', '\u{1fbca}'), + ('🩰', '🩴'), + ('🩸', '🩼'), + ('🪀', '🪆'), + ('🪐', '🪬'), + ('🪰', '🪺'), + ('🫀', '🫅'), + ('🫐', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), + ('🬀', '🮒'), + ('🮔', '🯊'), ]; pub const TITLECASE_LETTER: &'static [(char, char)] = &[ @@ -4998,7 +5138,6 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{5c8}', '\u{5cf}'), ('\u{5eb}', '\u{5ee}'), ('\u{5f5}', '\u{5ff}'), - ('\u{61d}', '\u{61d}'), ('\u{70e}', '\u{70e}'), ('\u{74b}', '\u{74c}'), ('\u{7b2}', '\u{7bf}'), @@ -5007,9 +5146,9 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{83f}', '\u{83f}'), ('\u{85c}', '\u{85d}'), ('\u{85f}', '\u{85f}'), - ('\u{86b}', '\u{89f}'), - ('\u{8b5}', '\u{8b5}'), - ('\u{8c8}', '\u{8d2}'), + ('\u{86b}', '\u{86f}'), + ('\u{88f}', '\u{88f}'), + ('\u{892}', '\u{897}'), ('\u{984}', '\u{984}'), ('\u{98d}', '\u{98e}'), ('\u{991}', '\u{992}'), @@ -5087,12 +5226,13 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{c0d}', '\u{c0d}'), ('\u{c11}', '\u{c11}'), ('\u{c29}', '\u{c29}'), - ('\u{c3a}', '\u{c3c}'), + ('\u{c3a}', '\u{c3b}'), ('\u{c45}', '\u{c45}'), ('\u{c49}', '\u{c49}'), ('\u{c4e}', '\u{c54}'), ('\u{c57}', '\u{c57}'), - ('\u{c5b}', '\u{c5f}'), + ('\u{c5b}', '\u{c5c}'), + ('\u{c5e}', '\u{c5f}'), ('\u{c64}', '\u{c65}'), ('\u{c70}', '\u{c76}'), ('\u{c8d}', '\u{c8d}'), @@ -5103,7 +5243,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{cc5}', '\u{cc5}'), ('\u{cc9}', '\u{cc9}'), ('\u{cce}', '\u{cd4}'), - ('\u{cd7}', '\u{cdd}'), + ('\u{cd7}', '\u{cdc}'), ('\u{cdf}', '\u{cdf}'), ('\u{ce4}', '\u{ce5}'), ('\u{cf0}', '\u{cf0}'), @@ -5171,8 +5311,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{13fe}', '\u{13ff}'), ('\u{169d}', '\u{169f}'), ('\u{16f9}', '\u{16ff}'), - ('\u{170d}', '\u{170d}'), - ('\u{1715}', '\u{171f}'), + ('\u{1716}', '\u{171e}'), ('\u{1737}', '\u{173f}'), ('\u{1754}', '\u{175f}'), ('\u{176d}', '\u{176d}'), @@ -5181,7 +5320,6 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{17de}', '\u{17df}'), ('\u{17ea}', '\u{17ef}'), ('\u{17fa}', '\u{17ff}'), - ('\u{180f}', '\u{180f}'), ('\u{181a}', '\u{181f}'), ('\u{1879}', '\u{187f}'), ('\u{18ab}', '\u{18af}'), @@ -5201,9 +5339,9 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1a8a}', '\u{1a8f}'), ('\u{1a9a}', '\u{1a9f}'), ('\u{1aae}', '\u{1aaf}'), - ('\u{1ac1}', '\u{1aff}'), - ('\u{1b4c}', '\u{1b4f}'), - ('\u{1b7d}', '\u{1b7f}'), + ('\u{1acf}', '\u{1aff}'), + ('\u{1b4d}', '\u{1b4f}'), + ('\u{1b7f}', '\u{1b7f}'), ('\u{1bf4}', '\u{1bfb}'), ('\u{1c38}', '\u{1c3a}'), ('\u{1c4a}', '\u{1c4c}'), @@ -5211,7 +5349,6 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1cbb}', '\u{1cbc}'), ('\u{1cc8}', '\u{1ccf}'), ('\u{1cfb}', '\u{1cff}'), - ('\u{1dfa}', '\u{1dfa}'), ('\u{1f16}', '\u{1f17}'), ('\u{1f1e}', '\u{1f1f}'), ('\u{1f46}', '\u{1f47}'), @@ -5232,15 +5369,13 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{2072}', '\u{2073}'), ('\u{208f}', '\u{208f}'), ('\u{209d}', '\u{209f}'), - ('\u{20c0}', '\u{20cf}'), + ('\u{20c1}', '\u{20cf}'), ('\u{20f1}', '\u{20ff}'), ('\u{218c}', '\u{218f}'), ('\u{2427}', '\u{243f}'), ('\u{244b}', '\u{245f}'), ('\u{2b74}', '\u{2b75}'), ('\u{2b96}', '\u{2b96}'), - ('\u{2c2f}', '\u{2c2f}'), - ('\u{2c5f}', '\u{2c5f}'), ('\u{2cf4}', '\u{2cf8}'), ('\u{2d26}', '\u{2d26}'), ('\u{2d28}', '\u{2d2c}'), @@ -5256,7 +5391,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{2dcf}', '\u{2dcf}'), ('\u{2dd7}', '\u{2dd7}'), ('\u{2ddf}', '\u{2ddf}'), - ('\u{2e53}', '\u{2e7f}'), + ('\u{2e5e}', '\u{2e7f}'), ('\u{2e9a}', '\u{2e9a}'), ('\u{2ef4}', '\u{2eff}'), ('\u{2fd6}', '\u{2fef}'), @@ -5268,13 +5403,14 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{318f}', '\u{318f}'), ('\u{31e4}', '\u{31ef}'), ('\u{321f}', '\u{321f}'), - ('\u{9ffd}', '\u{9fff}'), ('\u{a48d}', '\u{a48f}'), ('\u{a4c7}', '\u{a4cf}'), ('\u{a62c}', '\u{a63f}'), ('\u{a6f8}', '\u{a6ff}'), - ('\u{a7c0}', '\u{a7c1}'), - ('\u{a7cb}', '\u{a7f4}'), + ('\u{a7cb}', '\u{a7cf}'), + ('\u{a7d2}', '\u{a7d2}'), + ('\u{a7d4}', '\u{a7d4}'), + ('\u{a7da}', '\u{a7f1}'), ('\u{a82d}', '\u{a82f}'), ('\u{a83a}', '\u{a83f}'), ('\u{a878}', '\u{a87f}'), @@ -5310,11 +5446,10 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{fb3f}', '\u{fb3f}'), ('\u{fb42}', '\u{fb42}'), ('\u{fb45}', '\u{fb45}'), - ('\u{fbc2}', '\u{fbd2}'), - ('\u{fd40}', '\u{fd4f}'), + ('\u{fbc3}', '\u{fbd2}'), ('\u{fd90}', '\u{fd91}'), - ('\u{fdc8}', '\u{fdef}'), - ('\u{fdfe}', '\u{fdff}'), + ('\u{fdc8}', '\u{fdce}'), + ('\u{fdd0}', '\u{fdef}'), ('\u{fe1a}', '\u{fe1f}'), ('\u{fe53}', '\u{fe53}'), ('\u{fe67}', '\u{fe67}'), @@ -5358,10 +5493,20 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{104fc}', '\u{104ff}'), ('\u{10528}', '\u{1052f}'), ('\u{10564}', '\u{1056e}'), - ('\u{10570}', '\u{105ff}'), + ('\u{1057b}', '\u{1057b}'), + ('\u{1058b}', '\u{1058b}'), + ('\u{10593}', '\u{10593}'), + ('\u{10596}', '\u{10596}'), + ('\u{105a2}', '\u{105a2}'), + ('\u{105b2}', '\u{105b2}'), + ('\u{105ba}', '\u{105ba}'), + ('\u{105bd}', '\u{105ff}'), ('\u{10737}', '\u{1073f}'), ('\u{10756}', '\u{1075f}'), - ('\u{10768}', '\u{107ff}'), + ('\u{10768}', '\u{1077f}'), + ('\u{10786}', '\u{10786}'), + ('\u{107b1}', '\u{107b1}'), + ('\u{107bb}', '\u{107ff}'), ('\u{10806}', '\u{10807}'), ('\u{10809}', '\u{10809}'), ('\u{10836}', '\u{10836}'), @@ -5404,12 +5549,13 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{10eae}', '\u{10eaf}'), ('\u{10eb2}', '\u{10eff}'), ('\u{10f28}', '\u{10f2f}'), - ('\u{10f5a}', '\u{10faf}'), + ('\u{10f5a}', '\u{10f6f}'), + ('\u{10f8a}', '\u{10faf}'), ('\u{10fcc}', '\u{10fdf}'), ('\u{10ff7}', '\u{10fff}'), ('\u{1104e}', '\u{11051}'), - ('\u{11070}', '\u{1107e}'), - ('\u{110c2}', '\u{110cc}'), + ('\u{11076}', '\u{1107e}'), + ('\u{110c3}', '\u{110cc}'), ('\u{110ce}', '\u{110cf}'), ('\u{110e9}', '\u{110ef}'), ('\u{110fa}', '\u{110ff}'), @@ -5451,11 +5597,11 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{11645}', '\u{1164f}'), ('\u{1165a}', '\u{1165f}'), ('\u{1166d}', '\u{1167f}'), - ('\u{116b9}', '\u{116bf}'), + ('\u{116ba}', '\u{116bf}'), ('\u{116ca}', '\u{116ff}'), ('\u{1171b}', '\u{1171c}'), ('\u{1172c}', '\u{1172f}'), - ('\u{11740}', '\u{117ff}'), + ('\u{11747}', '\u{117ff}'), ('\u{1183c}', '\u{1189f}'), ('\u{118f3}', '\u{118fe}'), ('\u{11907}', '\u{11908}'), @@ -5470,7 +5616,7 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{119d8}', '\u{119d9}'), ('\u{119e5}', '\u{119ff}'), ('\u{11a48}', '\u{11a4f}'), - ('\u{11aa3}', '\u{11abf}'), + ('\u{11aa3}', '\u{11aaf}'), ('\u{11af9}', '\u{11bff}'), ('\u{11c09}', '\u{11c09}'), ('\u{11c37}', '\u{11c37}'), @@ -5498,14 +5644,16 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1239a}', '\u{123ff}'), ('\u{1246f}', '\u{1246f}'), ('\u{12475}', '\u{1247f}'), - ('\u{12544}', '\u{12fff}'), + ('\u{12544}', '\u{12f8f}'), + ('\u{12ff3}', '\u{12fff}'), ('\u{1342f}', '\u{1342f}'), ('\u{13439}', '\u{143ff}'), ('\u{14647}', '\u{167ff}'), ('\u{16a39}', '\u{16a3f}'), ('\u{16a5f}', '\u{16a5f}'), ('\u{16a6a}', '\u{16a6d}'), - ('\u{16a70}', '\u{16acf}'), + ('\u{16abf}', '\u{16abf}'), + ('\u{16aca}', '\u{16acf}'), ('\u{16aee}', '\u{16aef}'), ('\u{16af6}', '\u{16aff}'), ('\u{16b46}', '\u{16b4f}'), @@ -5521,8 +5669,11 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{16ff2}', '\u{16fff}'), ('\u{187f8}', '\u{187ff}'), ('\u{18cd6}', '\u{18cff}'), - ('\u{18d09}', '\u{1afff}'), - ('\u{1b11f}', '\u{1b14f}'), + ('\u{18d09}', '\u{1afef}'), + ('\u{1aff4}', '\u{1aff4}'), + ('\u{1affc}', '\u{1affc}'), + ('\u{1afff}', '\u{1afff}'), + ('\u{1b123}', '\u{1b14f}'), ('\u{1b153}', '\u{1b163}'), ('\u{1b168}', '\u{1b16f}'), ('\u{1b2fc}', '\u{1bbff}'), @@ -5530,10 +5681,13 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1bc7d}', '\u{1bc7f}'), ('\u{1bc89}', '\u{1bc8f}'), ('\u{1bc9a}', '\u{1bc9b}'), - ('\u{1bca4}', '\u{1cfff}'), + ('\u{1bca4}', '\u{1ceff}'), + ('\u{1cf2e}', '\u{1cf2f}'), + ('\u{1cf47}', '\u{1cf4f}'), + ('\u{1cfc4}', '\u{1cfff}'), ('\u{1d0f6}', '\u{1d0ff}'), ('\u{1d127}', '\u{1d128}'), - ('\u{1d1e9}', '\u{1d1ff}'), + ('\u{1d1eb}', '\u{1d1ff}'), ('\u{1d246}', '\u{1d2df}'), ('\u{1d2f4}', '\u{1d2ff}'), ('\u{1d357}', '\u{1d35f}'), @@ -5560,7 +5714,8 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1d7cc}', '\u{1d7cd}'), ('\u{1da8c}', '\u{1da9a}'), ('\u{1daa0}', '\u{1daa0}'), - ('\u{1dab0}', '\u{1dfff}'), + ('\u{1dab0}', '\u{1deff}'), + ('\u{1df1f}', '\u{1dfff}'), ('\u{1e007}', '\u{1e007}'), ('\u{1e019}', '\u{1e01a}'), ('\u{1e022}', '\u{1e022}'), @@ -5569,9 +5724,14 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1e12d}', '\u{1e12f}'), ('\u{1e13e}', '\u{1e13f}'), ('\u{1e14a}', '\u{1e14d}'), - ('\u{1e150}', '\u{1e2bf}'), + ('\u{1e150}', '\u{1e28f}'), + ('\u{1e2af}', '\u{1e2bf}'), ('\u{1e2fa}', '\u{1e2fe}'), - ('\u{1e300}', '\u{1e7ff}'), + ('\u{1e300}', '\u{1e7df}'), + ('\u{1e7e7}', '\u{1e7e7}'), + ('\u{1e7ec}', '\u{1e7ec}'), + ('\u{1e7ef}', '\u{1e7ef}'), + ('\u{1e7ff}', '\u{1e7ff}'), ('\u{1e8c5}', '\u{1e8c6}'), ('\u{1e8d7}', '\u{1e8ff}'), ('\u{1e94c}', '\u{1e94f}'), @@ -5625,34 +5785,35 @@ pub const UNASSIGNED: &'static [(char, char)] = &[ ('\u{1f249}', '\u{1f24f}'), ('\u{1f252}', '\u{1f25f}'), ('\u{1f266}', '\u{1f2ff}'), - ('\u{1f6d8}', '\u{1f6df}'), + ('\u{1f6d8}', '\u{1f6dc}'), ('\u{1f6ed}', '\u{1f6ef}'), ('\u{1f6fd}', '\u{1f6ff}'), ('\u{1f774}', '\u{1f77f}'), ('\u{1f7d9}', '\u{1f7df}'), - ('\u{1f7ec}', '\u{1f7ff}'), + ('\u{1f7ec}', '\u{1f7ef}'), + ('\u{1f7f1}', '\u{1f7ff}'), ('\u{1f80c}', '\u{1f80f}'), ('\u{1f848}', '\u{1f84f}'), ('\u{1f85a}', '\u{1f85f}'), ('\u{1f888}', '\u{1f88f}'), ('\u{1f8ae}', '\u{1f8af}'), ('\u{1f8b2}', '\u{1f8ff}'), - ('\u{1f979}', '\u{1f979}'), - ('\u{1f9cc}', '\u{1f9cc}'), ('\u{1fa54}', '\u{1fa5f}'), ('\u{1fa6e}', '\u{1fa6f}'), ('\u{1fa75}', '\u{1fa77}'), - ('\u{1fa7b}', '\u{1fa7f}'), + ('\u{1fa7d}', '\u{1fa7f}'), ('\u{1fa87}', '\u{1fa8f}'), - ('\u{1faa9}', '\u{1faaf}'), - ('\u{1fab7}', '\u{1fabf}'), - ('\u{1fac3}', '\u{1facf}'), - ('\u{1fad7}', '\u{1faff}'), + ('\u{1faad}', '\u{1faaf}'), + ('\u{1fabb}', '\u{1fabf}'), + ('\u{1fac6}', '\u{1facf}'), + ('\u{1fada}', '\u{1fadf}'), + ('\u{1fae8}', '\u{1faef}'), + ('\u{1faf7}', '\u{1faff}'), ('\u{1fb93}', '\u{1fb93}'), ('\u{1fbcb}', '\u{1fbef}'), ('\u{1fbfa}', '\u{1ffff}'), - ('\u{2a6de}', '\u{2a6ff}'), - ('\u{2b735}', '\u{2b73f}'), + ('\u{2a6e0}', '\u{2a6ff}'), + ('\u{2b739}', '\u{2b73f}'), ('\u{2b81e}', '\u{2b81f}'), ('\u{2cea2}', '\u{2ceaf}'), ('\u{2ebe1}', '\u{2f7ff}'), @@ -6097,7 +6258,7 @@ pub const UPPERCASE_LETTER: &'static [(char, char)] = &[ ('ℾ', 'ℿ'), ('ⅅ', 'ⅅ'), ('Ↄ', 'Ↄ'), - ('Ⰰ', 'Ⱞ'), + ('Ⰰ', 'Ⱟ'), ('Ⱡ', 'Ⱡ'), ('Ɫ', 'Ɽ'), ('Ⱨ', 'Ⱨ'), @@ -6262,13 +6423,21 @@ pub const UPPERCASE_LETTER: &'static [(char, char)] = &[ ('Ꞻ', 'Ꞻ'), ('Ꞽ', 'Ꞽ'), ('Ꞿ', 'Ꞿ'), + ('Ꟁ', 'Ꟁ'), ('Ꟃ', 'Ꟃ'), - ('Ꞔ', '\u{a7c7}'), - ('\u{a7c9}', '\u{a7c9}'), - ('\u{a7f5}', '\u{a7f5}'), + ('Ꞔ', 'Ꟈ'), + ('Ꟊ', 'Ꟊ'), + ('Ꟑ', 'Ꟑ'), + ('Ꟗ', 'Ꟗ'), + ('Ꟙ', 'Ꟙ'), + ('Ꟶ', 'Ꟶ'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), ('𐲀', '𐲲'), ('𑢠', '𑢿'), ('𖹀', '𖹟'), diff --git a/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs b/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs index 7df9d2b937..38cfc73afb 100644 --- a/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs +++ b/regex-syntax/src/unicode_tables/grapheme_cluster_break.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate grapheme-cluster-break ucd-13.0.0 --chars +// ucd-generate grapheme-cluster-break /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("CR", CR), @@ -25,7 +25,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ pub const CR: &'static [(char, char)] = &[('\r', '\r')]; pub const CONTROL: &'static [(char, char)] = &[ - ('\u{0}', '\t'), + ('\0', '\t'), ('\u{b}', '\u{c}'), ('\u{e}', '\u{1f}'), ('\u{7f}', '\u{9f}'), @@ -71,7 +71,8 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{825}', '\u{827}'), ('\u{829}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{8e1}'), + ('\u{898}', '\u{89f}'), + ('\u{8ca}', '\u{8e1}'), ('\u{8e3}', '\u{902}'), ('\u{93a}', '\u{93a}'), ('\u{93c}', '\u{93c}'), @@ -116,6 +117,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{bd7}', '\u{bd7}'), ('\u{c00}', '\u{c00}'), ('\u{c04}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', '\u{c40}'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -171,7 +173,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{109d}', '\u{109d}'), ('\u{135d}', '\u{135f}'), ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1732}', '\u{1733}'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17b5}'), @@ -180,6 +182,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{17c9}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), ('\u{1920}', '\u{1922}'), @@ -195,7 +198,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1a65}', '\u{1a6c}'), ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b3a}'), ('\u{1b3c}', '\u{1b3c}'), @@ -217,8 +220,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('\u{1cf8}', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{200c}', '\u{200c}'), ('\u{20d0}', '\u{20f0}'), ('\u{2cef}', '\u{2cf1}'), @@ -277,11 +279,15 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '\u{11081}'), ('\u{110b3}', '\u{110b6}'), ('\u{110b9}', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{1112b}'), ('\u{1112d}', '\u{11134}'), @@ -367,6 +373,8 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{16f8f}', '\u{16f92}'), ('\u{16fe4}', '\u{16fe4}'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d165}'), ('\u{1d167}', '\u{1d169}'), ('\u{1d16e}', '\u{1d172}'), @@ -386,6 +394,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), @@ -1206,13 +1215,14 @@ pub const PREPEND: &'static [(char, char)] = &[ ('\u{600}', '\u{605}'), ('\u{6dd}', '\u{6dd}'), ('\u{70f}', '\u{70f}'), + ('\u{890}', '\u{891}'), ('\u{8e2}', '\u{8e2}'), ('ൎ', 'ൎ'), ('\u{110bd}', '\u{110bd}'), ('\u{110cd}', '\u{110cd}'), ('𑇂', '𑇃'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑨺', '𑨺'), ('𑪄', '𑪉'), ('𑵆', '𑵆'), @@ -1268,6 +1278,8 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('ျ', 'ြ'), ('ၖ', 'ၗ'), ('ႄ', 'ႄ'), + ('᜕', '᜕'), + ('᜴', '᜴'), ('ា', 'ា'), ('ើ', 'ៅ'), ('ះ', 'ៈ'), @@ -1324,7 +1336,7 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('𑆂', '𑆂'), ('𑆳', '𑆵'), ('𑆿', '𑇀'), - ('\u{111ce}', '\u{111ce}'), + ('𑇎', '𑇎'), ('𑈬', '𑈮'), ('𑈲', '𑈳'), ('𑈵', '𑈵'), @@ -1352,15 +1364,14 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('𑚬', '𑚬'), ('𑚮', '𑚯'), ('𑚶', '𑚶'), - ('𑜠', '𑜡'), ('𑜦', '𑜦'), ('𑠬', '𑠮'), ('𑠸', '𑠸'), - ('\u{11931}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), - ('\u{1193d}', '\u{1193d}'), - ('\u{11940}', '\u{11940}'), - ('\u{11942}', '\u{11942}'), + ('𑤱', '𑤵'), + ('𑤷', '𑤸'), + ('𑤽', '𑤽'), + ('𑥀', '𑥀'), + ('𑥂', '𑥂'), ('𑧑', '𑧓'), ('𑧜', '𑧟'), ('𑧤', '𑧤'), @@ -1377,7 +1388,7 @@ pub const SPACINGMARK: &'static [(char, char)] = &[ ('𑶖', '𑶖'), ('𑻵', '𑻶'), ('𖽑', '𖾇'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('𝅦', '𝅦'), ('𝅭', '𝅭'), ]; diff --git a/regex-syntax/src/unicode_tables/perl_decimal.rs b/regex-syntax/src/unicode_tables/perl_decimal.rs index 2a09259fc3..9a14e43952 100644 --- a/regex-syntax/src/unicode_tables/perl_decimal.rs +++ b/regex-syntax/src/unicode_tables/perl_decimal.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate general-category ucd-13.0.0 --chars --include decimalnumber +// ucd-generate general-category /tmp/ucd --chars --include decimalnumber // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[("Decimal_Number", DECIMAL_NUMBER)]; @@ -60,15 +60,16 @@ pub const DECIMAL_NUMBER: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), + ('𖫀', '𖫉'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), ('𞅀', '𞅉'), ('𞋰', '𞋹'), ('𞥐', '𞥙'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🯰', '🯹'), ]; diff --git a/regex-syntax/src/unicode_tables/perl_space.rs b/regex-syntax/src/unicode_tables/perl_space.rs index c112dd1263..bb69ce1ba8 100644 --- a/regex-syntax/src/unicode_tables/perl_space.rs +++ b/regex-syntax/src/unicode_tables/perl_space.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-bool ucd-13.0.0 --chars --include whitespace +// ucd-generate property-bool /tmp/ucd --chars --include whitespace // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[("White_Space", WHITE_SPACE)]; diff --git a/regex-syntax/src/unicode_tables/perl_word.rs b/regex-syntax/src/unicode_tables/perl_word.rs index df9eac7d75..2c8171b2ba 100644 --- a/regex-syntax/src/unicode_tables/perl_word.rs +++ b/regex-syntax/src/unicode_tables/perl_word.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate perl-word ucd-13.0.0 --chars +// ucd-generate perl-word /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const PERL_WORD: &'static [(char, char)] = &[ ('0', '9'), @@ -57,9 +57,9 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ࠀ', '\u{82d}'), ('ࡀ', '\u{85b}'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), - ('\u{8d3}', '\u{8e1}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('\u{898}', '\u{8e1}'), ('\u{8e3}', '\u{963}'), ('०', '९'), ('ॱ', 'ঃ'), @@ -143,11 +143,12 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ఎ', 'ఐ'), ('ఒ', 'న'), ('ప', 'హ'), - ('ఽ', 'ౄ'), + ('\u{c3c}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), ('\u{c55}', '\u{c56}'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', '\u{c63}'), ('౦', '౯'), ('ಀ', 'ಃ'), @@ -160,7 +161,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{cc6}', 'ೈ'), ('ೊ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), @@ -242,9 +243,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', '\u{1714}'), - ('ᜠ', '\u{1734}'), + ('ᜀ', '᜕'), + ('ᜟ', '᜴'), ('ᝀ', '\u{1753}'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -254,7 +254,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ៜ', '\u{17dd}'), ('០', '៩'), ('\u{180b}', '\u{180d}'), - ('᠐', '᠙'), + ('\u{180f}', '᠙'), ('ᠠ', 'ᡸ'), ('ᢀ', 'ᢪ'), ('ᢰ', 'ᣵ'), @@ -272,8 +272,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{1a7f}', '᪉'), ('᪐', '᪙'), ('ᪧ', 'ᪧ'), - ('\u{1ab0}', '\u{1ac0}'), - ('\u{1b00}', 'ᭋ'), + ('\u{1ab0}', '\u{1ace}'), + ('\u{1b00}', 'ᭌ'), ('᭐', '᭙'), ('\u{1b6b}', '\u{1b73}'), ('\u{1b80}', '᯳'), @@ -285,8 +285,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('Ჽ', 'Ჿ'), ('\u{1cd0}', '\u{1cd2}'), ('\u{1cd4}', 'ᳺ'), - ('ᴀ', '\u{1df9}'), - ('\u{1dfb}', 'ἕ'), + ('ᴀ', 'ἕ'), ('Ἐ', 'Ἕ'), ('ἠ', 'ὅ'), ('Ὀ', 'Ὅ'), @@ -327,9 +326,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), ('Ⓐ', 'ⓩ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳳ'), ('ⴀ', 'ⴥ'), ('ⴧ', 'ⴧ'), @@ -358,11 +355,10 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘫ'), @@ -371,9 +367,11 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ꙿ', '\u{a6f1}'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠧ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠧ'), ('\u{a82c}', '\u{a82c}'), ('ꡀ', 'ꡳ'), ('ꢀ', '\u{a8c5}'), @@ -400,7 +398,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab69}'), + ('ꭜ', 'ꭩ'), ('ꭰ', 'ꯪ'), ('꯬', '\u{abed}'), ('꯰', '꯹'), @@ -462,9 +460,20 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -499,27 +508,29 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), ('𐴰', '𐴹'), - ('\u{10e80}', '\u{10ea9}'), + ('𐺀', '𐺩'), ('\u{10eab}', '\u{10eac}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '\u{10f50}'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '\u{10f85}'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀀', '\u{11046}'), - ('𑁦', '𑁯'), + ('𑁦', '𑁵'), ('\u{1107f}', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('𑃐', '𑃨'), ('𑃰', '𑃹'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑄿'), - ('𑅄', '\u{11147}'), + ('𑅄', '𑅇'), ('𑅐', '\u{11173}'), ('𑅶', '𑅶'), ('\u{11180}', '𑇄'), ('\u{111c9}', '\u{111cc}'), - ('\u{111ce}', '𑇚'), + ('𑇎', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), ('𑈓', '\u{11237}'), @@ -548,7 +559,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{11370}', '\u{11374}'), ('𑐀', '𑑊'), ('𑑐', '𑑙'), - ('\u{1145e}', '\u{11461}'), + ('\u{1145e}', '𑑡'), ('𑒀', '𑓅'), ('𑓇', '𑓇'), ('𑓐', '𑓙'), @@ -563,16 +574,17 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜹'), + ('𑝀', '𑝆'), ('𑠀', '\u{1183a}'), ('𑢠', '𑣩'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{11943}'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑦠', '𑦧'), ('𑦪', '\u{119d7}'), ('\u{119da}', '𑧡'), @@ -581,7 +593,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{11a47}', '\u{11a47}'), ('𑩐', '\u{11a99}'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '\u{11c36}'), ('\u{11c38}', '𑱀'), @@ -603,15 +615,18 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𑶓', '𑶘'), ('𑶠', '𑶩'), ('𑻠', '𑻶'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), ('𖩠', '𖩩'), + ('𖩰', '𖪾'), + ('𖫀', '𖫉'), ('𖫐', '𖫭'), ('\u{16af0}', '\u{16af4}'), ('𖬀', '\u{16b36}'), @@ -625,11 +640,14 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), ('𖿣', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -638,6 +656,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('𛲀', '𛲈'), ('𛲐', '𛲙'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -681,6 +701,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{1da84}', '\u{1da84}'), ('\u{1da9b}', '\u{1da9f}'), ('\u{1daa1}', '\u{1daaf}'), + ('𝼀', '𝼞'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), @@ -690,7 +711,12 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('\u{1e130}', '𞄽'), ('𞅀', '𞅉'), ('𞅎', '𞅎'), + ('𞊐', '\u{1e2ae}'), ('𞋀', '𞋹'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('\u{1e8d0}', '\u{1e8d6}'), ('𞤀', '𞥋'), @@ -731,13 +757,13 @@ pub const PERL_WORD: &'static [(char, char)] = &[ ('🄰', '🅉'), ('🅐', '🅩'), ('🅰', '🆉'), - ('\u{1fbf0}', '\u{1fbf9}'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('🯰', '🯹'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ('\u{e0100}', '\u{e01ef}'), ]; diff --git a/regex-syntax/src/unicode_tables/property_bool.rs b/regex-syntax/src/unicode_tables/property_bool.rs index 21cbaf9aee..8fb2110307 100644 --- a/regex-syntax/src/unicode_tables/property_bool.rs +++ b/regex-syntax/src/unicode_tables/property_bool.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-bool ucd-13.0.0 --chars +// ucd-generate property-bool /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ASCII_Hex_Digit", ASCII_HEX_DIGIT), @@ -125,8 +125,9 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ࠚ', '\u{82c}'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('\u{8d4}', '\u{8df}'), ('\u{8e3}', '\u{8e9}'), ('\u{8f0}', 'ऻ'), @@ -216,6 +217,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{c4a}', '\u{c4c}'), ('\u{c55}', '\u{c56}'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', '\u{c63}'), ('ಀ', 'ಃ'), ('ಅ', 'ಌ'), @@ -227,7 +229,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{cc6}', 'ೈ'), ('ೊ', '\u{ccc}'), ('\u{cd5}', '\u{cd6}'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', '\u{ce3}'), ('ೱ', 'ೲ'), ('\u{d00}', 'ഌ'), @@ -303,9 +305,8 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', '\u{1713}'), - ('ᜠ', '\u{1733}'), + ('ᜀ', '\u{1713}'), + ('ᜟ', '\u{1733}'), ('ᝀ', '\u{1753}'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -329,9 +330,10 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ᩡ', '\u{1a74}'), ('ᪧ', 'ᪧ'), ('\u{1abf}', '\u{1ac0}'), + ('\u{1acc}', '\u{1ace}'), ('\u{1b00}', 'ᬳ'), ('\u{1b35}', 'ᭃ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('\u{1b80}', '\u{1ba9}'), ('\u{1bac}', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -385,9 +387,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), ('Ⓐ', 'ⓩ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳮ'), ('Ⳳ', 'ⳳ'), ('ⴀ', 'ⴥ'), @@ -416,11 +416,10 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘟ'), @@ -430,9 +429,11 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ꙿ', 'ꛯ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠅ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠅ'), ('ꠇ', 'ꠧ'), ('ꡀ', 'ꡳ'), ('ꢀ', 'ꣃ'), @@ -463,7 +464,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab69}'), + ('ꭜ', 'ꭩ'), ('ꭰ', 'ꯪ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -514,9 +515,20 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -548,24 +560,27 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), - ('\u{10e80}', '\u{10ea9}'), + ('𐺀', '𐺩'), ('\u{10eab}', '\u{10eac}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀀', '\u{11045}'), + ('𑁱', '𑁵'), ('𑂂', '𑂸'), + ('\u{110c2}', '\u{110c2}'), ('𑃐', '𑃨'), ('\u{11100}', '\u{11132}'), - ('𑅄', '\u{11147}'), + ('𑅄', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('\u{11180}', '𑆿'), ('𑇁', '𑇄'), - ('\u{111ce}', '\u{111cf}'), + ('𑇎', '\u{111cf}'), ('𑇚', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), @@ -594,7 +609,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𑐀', '𑑁'), ('\u{11443}', '𑑅'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑓁'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -608,16 +623,17 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𑚸', '𑚸'), ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172a}'), + ('𑝀', '𑝆'), ('𑠀', '𑠸'), ('𑢠', '𑣟'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{1193c}'), - ('\u{1193f}', '\u{11942}'), + ('𑤿', '𑥂'), ('𑦠', '𑦧'), ('𑦪', '\u{119d7}'), ('\u{119da}', '𑧟'), @@ -627,7 +643,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{11a35}', '\u{11a3e}'), ('𑩐', '𑪗'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '\u{11c36}'), ('\u{11c38}', '𑰾'), @@ -650,14 +666,16 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𑶓', '𑶖'), ('𑶘', '𑶘'), ('𑻠', '𑻶'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭀', '𖭃'), @@ -669,11 +687,14 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), ('𖿣', '𖿣'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -712,6 +733,7 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), + ('𝼀', '𝼞'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), @@ -720,7 +742,12 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), ('\u{1e947}', '\u{1e947}'), @@ -761,13 +788,13 @@ pub const ALPHABETIC: &'static [(char, char)] = &[ ('🄰', '🅉'), ('🅐', '🅩'), ('🅰', '🆉'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const BIDI_CONTROL: &'static [(char, char)] = &[ @@ -873,6 +900,7 @@ pub const BIDI_MIRRORED: &'static [(char, char)] = &[ ('⸌', '⸍'), ('⸜', '⸝'), ('⸠', '⸩'), + ('⹕', '⹜'), ('〈', '】'), ('〔', '〛'), ('﹙', '﹞'), @@ -936,7 +964,10 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{7fd}', '\u{7fd}'), ('\u{816}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{902}'), + ('࢈', '࢈'), + ('\u{890}', '\u{891}'), + ('\u{898}', '\u{89f}'), + ('ࣉ', '\u{902}'), ('\u{93a}', '\u{93a}'), ('\u{93c}', '\u{93c}'), ('\u{941}', '\u{948}'), @@ -977,6 +1008,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{bcd}', '\u{bcd}'), ('\u{c00}', '\u{c00}'), ('\u{c04}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', '\u{c40}'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -1028,7 +1060,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('ჼ', 'ჼ'), ('\u{135d}', '\u{135f}'), ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1732}', '\u{1733}'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17b5}'), @@ -1037,7 +1069,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{17c9}', '\u{17d3}'), ('ៗ', 'ៗ'), ('\u{17dd}', '\u{17dd}'), - ('\u{180b}', '\u{180e}'), + ('\u{180b}', '\u{180f}'), ('ᡃ', 'ᡃ'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), @@ -1055,7 +1087,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), ('ᪧ', 'ᪧ'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b34}'), ('\u{1b36}', '\u{1b3a}'), @@ -1081,8 +1113,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{1cf8}', '\u{1cf9}'), ('ᴬ', 'ᵪ'), ('ᵸ', 'ᵸ'), - ('ᶛ', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('ᶛ', '\u{1dff}'), ('᾽', '᾽'), ('᾿', '῁'), ('῍', '῏'), @@ -1123,6 +1154,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('꜀', '꜡'), ('ꝰ', 'ꝰ'), ('ꞈ', '꞊'), + ('ꟲ', 'ꟴ'), ('ꟸ', 'ꟹ'), ('\u{a802}', '\u{a802}'), ('\u{a806}', '\u{a806}'), @@ -1157,12 +1189,12 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('ꫳ', 'ꫴ'), ('\u{aaf6}', '\u{aaf6}'), ('꭛', 'ꭟ'), - ('\u{ab69}', '\u{ab6b}'), + ('ꭩ', '꭫'), ('\u{abe5}', '\u{abe5}'), ('\u{abe8}', '\u{abe8}'), ('\u{abed}', '\u{abed}'), ('\u{fb1e}', '\u{fb1e}'), - ('﮲', '﯁'), + ('﮲', '﯂'), ('\u{fe00}', '\u{fe0f}'), ('︓', '︓'), ('\u{fe20}', '\u{fe2f}'), @@ -1181,6 +1213,9 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{101fd}', '\u{101fd}'), ('\u{102e0}', '\u{102e0}'), ('\u{10376}', '\u{1037a}'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('\u{10a01}', '\u{10a03}'), ('\u{10a05}', '\u{10a06}'), ('\u{10a0c}', '\u{10a0f}'), @@ -1190,12 +1225,16 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '\u{11081}'), ('\u{110b3}', '\u{110b6}'), ('\u{110b9}', '\u{110ba}'), ('\u{110bd}', '\u{110bd}'), + ('\u{110c2}', '\u{110c2}'), ('\u{110cd}', '\u{110cd}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{1112b}'), @@ -1278,8 +1317,13 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), ('𖿣', '\u{16fe4}'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), ('\u{1bc9d}', '\u{1bc9e}'), ('\u{1bca0}', '\u{1bca3}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d167}', '\u{1d169}'), ('\u{1d173}', '\u{1d182}'), ('\u{1d185}', '\u{1d18b}'), @@ -1297,6 +1341,7 @@ pub const CASE_IGNORABLE: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '𞄽'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '𞥋'), @@ -1384,9 +1429,7 @@ pub const CASED: &'static [(char, char)] = &[ ('Ⅰ', 'ⅿ'), ('Ↄ', 'ↄ'), ('Ⓐ', 'ⓩ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳮ'), ('Ⳳ', 'ⳳ'), ('ⴀ', 'ⴥ'), @@ -1396,12 +1439,14 @@ pub const CASED: &'static [(char, char)] = &[ ('Ꚁ', 'ꚝ'), ('Ꜣ', 'ꞇ'), ('Ꞌ', 'ꞎ'), - ('Ꞑ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', '\u{a7f6}'), + ('Ꞑ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('Ꟶ', 'ꟶ'), ('ꟸ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab68}'), + ('ꭜ', 'ꭨ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), @@ -1410,6 +1455,18 @@ pub const CASED: &'static [(char, char)] = &[ ('𐐀', '𐑏'), ('𐒰', '𐓓'), ('𐓘', '𐓻'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), + ('𐞀', '𐞀'), + ('𐞃', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𑢠', '𑣟'), @@ -1444,6 +1501,8 @@ pub const CASED: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), + ('𝼀', '𝼉'), + ('𝼋', '𝼞'), ('𞤀', '𞥃'), ('🄰', '🅉'), ('🅐', '🅩'), @@ -1886,7 +1945,7 @@ pub const CHANGES_WHEN_CASEFOLDED: &'static [(char, char)] = &[ ('Ⅰ', 'Ⅿ'), ('Ↄ', 'Ↄ'), ('Ⓐ', 'Ⓩ'), - ('Ⰰ', 'Ⱞ'), + ('Ⰰ', 'Ⱟ'), ('Ⱡ', 'Ⱡ'), ('Ɫ', 'Ɽ'), ('Ⱨ', 'Ⱨ'), @@ -2051,16 +2110,24 @@ pub const CHANGES_WHEN_CASEFOLDED: &'static [(char, char)] = &[ ('Ꞻ', 'Ꞻ'), ('Ꞽ', 'Ꞽ'), ('Ꞿ', 'Ꞿ'), + ('Ꟁ', 'Ꟁ'), ('Ꟃ', 'Ꟃ'), - ('Ꞔ', '\u{a7c7}'), - ('\u{a7c9}', '\u{a7c9}'), - ('\u{a7f5}', '\u{a7f5}'), + ('Ꞔ', 'Ꟈ'), + ('Ꟊ', 'Ꟊ'), + ('Ꟑ', 'Ꟑ'), + ('Ꟗ', 'Ꟗ'), + ('Ꟙ', 'Ꟙ'), + ('Ꟶ', 'Ꟶ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), ('𐲀', '𐲲'), ('𑢠', '𑢿'), ('𖹀', '𖹟'), @@ -2156,9 +2223,7 @@ pub const CHANGES_WHEN_CASEMAPPED: &'static [(char, char)] = &[ ('Ⅰ', 'ⅿ'), ('Ↄ', 'ↄ'), ('Ⓐ', 'ⓩ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'Ɒ'), + ('Ⰰ', 'Ɒ'), ('Ⱳ', 'ⱳ'), ('Ⱶ', 'ⱶ'), ('Ȿ', 'ⳣ'), @@ -2175,9 +2240,10 @@ pub const CHANGES_WHEN_CASEMAPPED: &'static [(char, char)] = &[ ('Ꞌ', 'Ɥ'), ('Ꞑ', 'ꞔ'), ('Ꞗ', 'Ɪ'), - ('Ʞ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', '\u{a7f6}'), + ('Ʞ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('Ꟗ', 'ꟙ'), + ('Ꟶ', 'ꟶ'), ('ꭓ', 'ꭓ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), @@ -2187,6 +2253,14 @@ pub const CHANGES_WHEN_CASEMAPPED: &'static [(char, char)] = &[ ('𐐀', '𐑏'), ('𐒰', '𐓓'), ('𐓘', '𐓻'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𑢠', '𑣟'), @@ -2620,7 +2694,7 @@ pub const CHANGES_WHEN_LOWERCASED: &'static [(char, char)] = &[ ('Ⅰ', 'Ⅿ'), ('Ↄ', 'Ↄ'), ('Ⓐ', 'Ⓩ'), - ('Ⰰ', 'Ⱞ'), + ('Ⰰ', 'Ⱟ'), ('Ⱡ', 'Ⱡ'), ('Ɫ', 'Ɽ'), ('Ⱨ', 'Ⱨ'), @@ -2785,13 +2859,21 @@ pub const CHANGES_WHEN_LOWERCASED: &'static [(char, char)] = &[ ('Ꞻ', 'Ꞻ'), ('Ꞽ', 'Ꞽ'), ('Ꞿ', 'Ꞿ'), + ('Ꟁ', 'Ꟁ'), ('Ꟃ', 'Ꟃ'), - ('Ꞔ', '\u{a7c7}'), - ('\u{a7c9}', '\u{a7c9}'), - ('\u{a7f5}', '\u{a7f5}'), + ('Ꞔ', 'Ꟈ'), + ('Ꟊ', 'Ꟊ'), + ('Ꟑ', 'Ꟑ'), + ('Ꟗ', 'Ꟗ'), + ('Ꟙ', 'Ꟙ'), + ('Ꟶ', 'Ꟶ'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), ('𐲀', '𐲲'), ('𑢠', '𑢿'), ('𖹀', '𖹟'), @@ -3237,7 +3319,7 @@ pub const CHANGES_WHEN_TITLECASED: &'static [(char, char)] = &[ ('ⅰ', 'ⅿ'), ('ↄ', 'ↄ'), ('ⓐ', 'ⓩ'), - ('ⰰ', 'ⱞ'), + ('ⰰ', 'ⱟ'), ('ⱡ', 'ⱡ'), ('ⱥ', 'ⱦ'), ('ⱨ', 'ⱨ'), @@ -3402,10 +3484,14 @@ pub const CHANGES_WHEN_TITLECASED: &'static [(char, char)] = &[ ('ꞻ', 'ꞻ'), ('ꞽ', 'ꞽ'), ('ꞿ', 'ꞿ'), + ('ꟁ', 'ꟁ'), ('ꟃ', 'ꟃ'), - ('\u{a7c8}', '\u{a7c8}'), - ('\u{a7ca}', '\u{a7ca}'), - ('\u{a7f6}', '\u{a7f6}'), + ('ꟈ', 'ꟈ'), + ('ꟊ', 'ꟊ'), + ('ꟑ', 'ꟑ'), + ('ꟗ', 'ꟗ'), + ('ꟙ', 'ꟙ'), + ('ꟶ', 'ꟶ'), ('ꭓ', 'ꭓ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), @@ -3413,6 +3499,10 @@ pub const CHANGES_WHEN_TITLECASED: &'static [(char, char)] = &[ ('a', 'z'), ('𐐨', '𐑏'), ('𐓘', '𐓻'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐳀', '𐳲'), ('𑣀', '𑣟'), ('𖹠', '𖹿'), @@ -3859,7 +3949,7 @@ pub const CHANGES_WHEN_UPPERCASED: &'static [(char, char)] = &[ ('ⅰ', 'ⅿ'), ('ↄ', 'ↄ'), ('ⓐ', 'ⓩ'), - ('ⰰ', 'ⱞ'), + ('ⰰ', 'ⱟ'), ('ⱡ', 'ⱡ'), ('ⱥ', 'ⱦ'), ('ⱨ', 'ⱨ'), @@ -4024,10 +4114,14 @@ pub const CHANGES_WHEN_UPPERCASED: &'static [(char, char)] = &[ ('ꞻ', 'ꞻ'), ('ꞽ', 'ꞽ'), ('ꞿ', 'ꞿ'), + ('ꟁ', 'ꟁ'), ('ꟃ', 'ꟃ'), - ('\u{a7c8}', '\u{a7c8}'), - ('\u{a7ca}', '\u{a7ca}'), - ('\u{a7f6}', '\u{a7f6}'), + ('ꟈ', 'ꟈ'), + ('ꟊ', 'ꟊ'), + ('ꟑ', 'ꟑ'), + ('ꟗ', 'ꟗ'), + ('ꟙ', 'ꟙ'), + ('ꟶ', 'ꟶ'), ('ꭓ', 'ꭓ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), @@ -4035,6 +4129,10 @@ pub const CHANGES_WHEN_UPPERCASED: &'static [(char, char)] = &[ ('a', 'z'), ('𐐨', '𐑏'), ('𐓘', '𐓻'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐳀', '𐳲'), ('𑣀', '𑣟'), ('𖹠', '𖹿'), @@ -4056,6 +4154,7 @@ pub const DASH: &'static [(char, char)] = &[ ('⸚', '⸚'), ('⸺', '⸻'), ('⹀', '⹀'), + ('⹝', '⹝'), ('〜', '〜'), ('〰', '〰'), ('゠', '゠'), @@ -4063,7 +4162,7 @@ pub const DASH: &'static [(char, char)] = &[ ('﹘', '﹘'), ('﹣', '﹣'), ('-', '-'), - ('\u{10ead}', '\u{10ead}'), + ('𐺭', '𐺭'), ]; pub const DEFAULT_IGNORABLE_CODE_POINT: &'static [(char, char)] = &[ @@ -4072,7 +4171,7 @@ pub const DEFAULT_IGNORABLE_CODE_POINT: &'static [(char, char)] = &[ ('\u{61c}', '\u{61c}'), ('ᅟ', 'ᅠ'), ('\u{17b4}', '\u{17b5}'), - ('\u{180b}', '\u{180e}'), + ('\u{180b}', '\u{180f}'), ('\u{200b}', '\u{200f}'), ('\u{202a}', '\u{202e}'), ('\u{2060}', '\u{206f}'), @@ -4126,6 +4225,8 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{7a6}', '\u{7b0}'), ('\u{7eb}', 'ߵ'), ('\u{818}', '\u{819}'), + ('\u{898}', '\u{89f}'), + ('ࣉ', '\u{8d2}'), ('\u{8e3}', '\u{8fe}'), ('\u{93c}', '\u{93c}'), ('\u{94d}', '\u{94d}'), @@ -4142,6 +4243,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{b4d}', '\u{b4d}'), ('\u{b55}', '\u{b55}'), ('\u{bcd}', '\u{bcd}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c4d}', '\u{c4d}'), ('\u{cbc}', '\u{cbc}'), ('\u{ccd}', '\u{ccd}'), @@ -4168,12 +4270,14 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('ႏ', 'ႏ'), ('ႚ', 'ႛ'), ('\u{135d}', '\u{135f}'), + ('\u{1714}', '᜕'), ('\u{17c9}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{1939}', '\u{193b}'), ('\u{1a75}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1abd}'), + ('\u{1ab0}', '\u{1abe}'), + ('\u{1ac1}', '\u{1acb}'), ('\u{1b34}', '\u{1b34}'), ('᭄', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -4186,8 +4290,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('᳷', '\u{1cf9}'), ('ᴬ', 'ᵪ'), ('\u{1dc4}', '\u{1dcf}'), - ('\u{1df5}', '\u{1df9}'), - ('\u{1dfd}', '\u{1dff}'), + ('\u{1df5}', '\u{1dff}'), ('᾽', '᾽'), ('᾿', '῁'), ('῍', '῏'), @@ -4218,7 +4321,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{aabf}', 'ꫂ'), ('\u{aaf6}', '\u{aaf6}'), ('꭛', 'ꭟ'), - ('\u{ab69}', '\u{ab6b}'), + ('ꭩ', '꭫'), ('꯬', '\u{abed}'), ('\u{fb1e}', '\u{fb1e}'), ('\u{fe20}', '\u{fe2f}'), @@ -4228,9 +4331,15 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{ff9e}', '\u{ff9f}'), (' ̄', ' ̄'), ('\u{102e0}', '\u{102e0}'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('\u{10ae5}', '\u{10ae6}'), ('𐴢', '\u{10d27}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), + ('\u{11046}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), ('\u{110b9}', '\u{110ba}'), ('\u{11133}', '\u{11134}'), ('\u{11173}', '\u{11173}'), @@ -4250,7 +4359,7 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('𑚶', '\u{116b7}'), ('\u{1172b}', '\u{1172b}'), ('\u{11839}', '\u{1183a}'), - ('\u{1193d}', '\u{1193e}'), + ('𑤽', '\u{1193e}'), ('\u{11943}', '\u{11943}'), ('\u{119e0}', '\u{119e0}'), ('\u{11a34}', '\u{11a34}'), @@ -4263,13 +4372,19 @@ pub const DIACRITIC: &'static [(char, char)] = &[ ('\u{16af0}', '\u{16af4}'), ('\u{16b30}', '\u{16b36}'), ('\u{16f8f}', '𖾟'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d167}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), ('\u{1d185}', '\u{1d18b}'), ('\u{1d1aa}', '\u{1d1ad}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e946}'), @@ -4410,25 +4525,26 @@ pub const EMOJI: &'static [(char, char)] = &[ ('🗺', '🙏'), ('🚀', '🛅'), ('🛋', '🛒'), - ('🛕', '\u{1f6d7}'), - ('🛠', '🛥'), + ('🛕', '🛗'), + ('🛝', '🛥'), ('🛩', '🛩'), ('🛫', '🛬'), ('🛰', '🛰'), - ('🛳', '\u{1f6fc}'), + ('🛳', '🛼'), ('🟠', '🟫'), - ('\u{1f90c}', '🤺'), + ('🟰', '🟰'), + ('🤌', '🤺'), ('🤼', '🥅'), - ('🥇', '\u{1f978}'), - ('🥺', '\u{1f9cb}'), - ('🧍', '🧿'), - ('🩰', '\u{1fa74}'), - ('🩸', '🩺'), - ('🪀', '\u{1fa86}'), - ('🪐', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), + ('🥇', '🧿'), + ('🩰', '🩴'), + ('🩸', '🩼'), + ('🪀', '🪆'), + ('🪐', '🪬'), + ('🪰', '🪺'), + ('🫀', '🫅'), + ('🫐', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), ]; pub const EMOJI_COMPONENT: &'static [(char, char)] = &[ @@ -4473,18 +4589,20 @@ pub const EMOJI_MODIFIER_BASE: &'static [(char, char)] = &[ ('🚴', '🚶'), ('🛀', '🛀'), ('🛌', '🛌'), - ('\u{1f90c}', '\u{1f90c}'), + ('🤌', '🤌'), ('🤏', '🤏'), ('🤘', '🤟'), ('🤦', '🤦'), ('🤰', '🤹'), ('🤼', '🤾'), - ('\u{1f977}', '\u{1f977}'), + ('🥷', '🥷'), ('🦵', '🦶'), ('🦸', '🦹'), ('🦻', '🦻'), ('🧍', '🧏'), ('🧑', '🧝'), + ('🫃', '🫅'), + ('🫰', '🫶'), ]; pub const EMOJI_PRESENTATION: &'static [(char, char)] = &[ @@ -4553,22 +4671,24 @@ pub const EMOJI_PRESENTATION: &'static [(char, char)] = &[ ('🚀', '🛅'), ('🛌', '🛌'), ('🛐', '🛒'), - ('🛕', '\u{1f6d7}'), + ('🛕', '🛗'), + ('🛝', '🛟'), ('🛫', '🛬'), - ('🛴', '\u{1f6fc}'), + ('🛴', '🛼'), ('🟠', '🟫'), - ('\u{1f90c}', '🤺'), + ('🟰', '🟰'), + ('🤌', '🤺'), ('🤼', '🥅'), - ('🥇', '\u{1f978}'), - ('🥺', '\u{1f9cb}'), - ('🧍', '🧿'), - ('🩰', '\u{1fa74}'), - ('🩸', '🩺'), - ('🪀', '\u{1fa86}'), - ('🪐', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), + ('🥇', '🧿'), + ('🩰', '🩴'), + ('🩸', '🩼'), + ('🪀', '🪆'), + ('🪐', '🪬'), + ('🪰', '🪺'), + ('🫀', '🫅'), + ('🫐', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), ]; pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ @@ -4623,13 +4743,13 @@ pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ ('㊗', '㊗'), ('㊙', '㊙'), ('🀀', '\u{1f0ff}'), - ('\u{1f10d}', '\u{1f10f}'), + ('🄍', '🄏'), ('🄯', '🄯'), ('🅬', '🅱'), ('🅾', '🅿'), ('🆎', '🆎'), ('🆑', '🆚'), - ('\u{1f1ad}', '\u{1f1e5}'), + ('🆭', '\u{1f1e5}'), ('🈁', '\u{1f20f}'), ('🈚', '🈚'), ('🈯', '🈯'), @@ -4646,7 +4766,7 @@ pub const EXTENDED_PICTOGRAPHIC: &'static [(char, char)] = &[ ('\u{1f85a}', '\u{1f85f}'), ('\u{1f888}', '\u{1f88f}'), ('\u{1f8ae}', '\u{1f8ff}'), - ('\u{1f90c}', '🤺'), + ('🤌', '🤺'), ('🤼', '🥅'), ('🥇', '\u{1faff}'), ('\u{1fc00}', '\u{1fffd}'), @@ -4677,6 +4797,7 @@ pub const EXTENDER: &'static [(char, char)] = &[ ('ꫝ', 'ꫝ'), ('ꫳ', 'ꫴ'), ('ー', 'ー'), + ('𐞁', '𐞂'), ('𑍝', '𑍝'), ('𑗆', '𑗈'), ('\u{11a98}', '\u{11a98}'), @@ -4709,7 +4830,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ׯ', '״'), ('؆', '؏'), ('؛', '؛'), - ('؞', 'ي'), + ('؝', 'ي'), ('٠', 'ٯ'), ('ٱ', 'ە'), ('۞', '۞'), @@ -4730,8 +4851,8 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ࡀ', 'ࡘ'), ('࡞', '࡞'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('ः', 'ह'), ('ऻ', 'ऻ'), ('ऽ', 'ी'), @@ -4820,6 +4941,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ఽ', 'ఽ'), ('ు', 'ౄ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('౦', '౯'), ('౷', 'ಀ'), @@ -4833,7 +4955,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ೃ', 'ೄ'), ('ೇ', 'ೈ'), ('ೊ', 'ೋ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('೦', '೯'), ('ೱ', 'ೲ'), @@ -4922,10 +5044,10 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ᏸ', 'ᏽ'), ('᐀', '᚜'), ('ᚠ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), - ('᜵', '᜶'), + ('ᜀ', 'ᜑ'), + ('᜕', '᜕'), + ('ᜟ', 'ᜱ'), + ('᜴', '᜶'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -4967,9 +5089,9 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ᬄ', 'ᬳ'), ('ᬻ', 'ᬻ'), ('ᬽ', 'ᭁ'), - ('ᭃ', 'ᭋ'), + ('ᭃ', 'ᭌ'), ('᭐', '᭪'), - ('᭴', '᭼'), + ('᭴', '᭾'), ('ᮂ', 'ᮡ'), ('ᮦ', 'ᮧ'), ('᮪', '᮪'), @@ -5013,15 +5135,13 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('⁰', 'ⁱ'), ('⁴', '₎'), ('ₐ', 'ₜ'), - ('₠', '₿'), + ('₠', '⃀'), ('℀', '↋'), ('←', '␦'), ('⑀', '⑊'), ('①', '⭳'), ('⭶', '⮕'), - ('\u{2b97}', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳮ'), + ('⮗', 'ⳮ'), ('Ⳳ', 'ⳳ'), ('⳹', 'ⴥ'), ('ⴧ', 'ⴧ'), @@ -5037,7 +5157,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ⷈ', 'ⷎ'), ('ⷐ', 'ⷖ'), ('ⷘ', 'ⷞ'), - ('⸀', '\u{2e52}'), + ('⸀', '⹝'), ('⺀', '⺙'), ('⺛', '⻳'), ('⼀', '⿕'), @@ -5050,8 +5170,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ㄱ', 'ㆎ'), ('㆐', '㇣'), ('ㇰ', '㈞'), - ('㈠', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㈠', 'ꒌ'), ('꒐', '꓆'), ('ꓐ', 'ꘫ'), ('Ꙁ', 'ꙮ'), @@ -5059,9 +5178,11 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('꙾', 'ꚝ'), ('ꚠ', 'ꛯ'), ('꛲', '꛷'), - ('꜀', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠁ'), + ('꜀', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠤ'), @@ -5103,7 +5224,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), - ('ꬰ', '\u{ab6b}'), + ('ꬰ', '꭫'), ('ꭰ', 'ꯤ'), ('ꯦ', 'ꯧ'), ('ꯩ', '꯬'), @@ -5121,11 +5242,11 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('מּ', 'מּ'), ('נּ', 'סּ'), ('ףּ', 'פּ'), - ('צּ', '﯁'), - ('ﯓ', '﴿'), - ('ﵐ', 'ﶏ'), + ('צּ', '﯂'), + ('ﯓ', 'ﶏ'), ('ﶒ', 'ﷇ'), - ('ﷰ', '﷽'), + ('﷏', '﷏'), + ('ﷰ', '﷿'), ('︐', '︙'), ('︰', '﹒'), ('﹔', '﹦'), @@ -5151,7 +5272,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𐄀', '𐄂'), ('𐄇', '𐄳'), ('𐄷', '𐆎'), - ('𐆐', '\u{1019c}'), + ('𐆐', '𐆜'), ('𐆠', '𐆠'), ('𐇐', '𐇼'), ('𐊀', '𐊜'), @@ -5169,10 +5290,20 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), - ('𐕯', '𐕯'), + ('𐕯', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -5209,18 +5340,22 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𐳺', '𐴣'), ('𐴰', '𐴹'), ('𐹠', '𐹾'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10ead}', '\u{10ead}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺭', '𐺭'), + ('𐺰', '𐺱'), ('𐼀', '𐼧'), ('𐼰', '𐽅'), ('𐽑', '𐽙'), - ('\u{10fb0}', '\u{10fcb}'), + ('𐽰', '𐾁'), + ('𐾆', '𐾉'), + ('𐾰', '𐿋'), ('𐿠', '𐿶'), ('𑀀', '𑀀'), ('𑀂', '𑀷'), ('𑁇', '𑁍'), ('𑁒', '𑁯'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂂', '𑂲'), ('𑂷', '𑂸'), ('𑂻', '𑂼'), @@ -5229,12 +5364,12 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑃰', '𑃹'), ('𑄃', '𑄦'), ('𑄬', '𑄬'), - ('𑄶', '\u{11147}'), + ('𑄶', '𑅇'), ('𑅐', '𑅲'), ('𑅴', '𑅶'), ('𑆂', '𑆵'), ('𑆿', '𑇈'), - ('𑇍', '\u{111ce}'), + ('𑇍', '𑇎'), ('𑇐', '𑇟'), ('𑇡', '𑇴'), ('𑈀', '𑈑'), @@ -5269,7 +5404,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑑅', '𑑅'), ('𑑇', '𑑛'), ('𑑝', '𑑝'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑒱', '𑒲'), ('𑒹', '𑒹'), @@ -5293,27 +5428,27 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑚬', '𑚬'), ('𑚮', '𑚯'), ('𑚶', '𑚶'), - ('𑚸', '𑚸'), + ('𑚸', '𑚹'), ('𑛀', '𑛉'), ('𑜀', '𑜚'), ('𑜠', '𑜡'), ('𑜦', '𑜦'), - ('𑜰', '𑜿'), + ('𑜰', '𑝆'), ('𑠀', '𑠮'), ('𑠸', '𑠸'), ('𑠻', '𑠻'), ('𑢠', '𑣲'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{11931}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), - ('\u{1193d}', '\u{1193d}'), - ('\u{1193f}', '\u{11942}'), - ('\u{11944}', '\u{11946}'), - ('\u{11950}', '\u{11959}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤱', '𑤵'), + ('𑤷', '𑤸'), + ('𑤽', '𑤽'), + ('𑤿', '𑥂'), + ('𑥄', '𑥆'), + ('𑥐', '𑥙'), ('𑦠', '𑦧'), ('𑦪', '𑧓'), ('𑧜', '𑧟'), @@ -5327,7 +5462,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑩜', '𑪉'), ('𑪗', '𑪗'), ('𑪚', '𑪢'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰯'), ('𑰾', '𑰾'), @@ -5351,18 +5486,20 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𑶠', '𑶩'), ('𑻠', '𑻲'), ('𑻵', '𑻸'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𑿀', '𑿱'), ('𑿿', '𒎙'), ('𒐀', '𒑮'), ('𒑰', '𒑴'), ('𒒀', '𒕃'), + ('𒾐', '𒿲'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), ('𖩠', '𖩩'), - ('𖩮', '𖩯'), + ('𖩮', '𖪾'), + ('𖫀', '𖫉'), ('𖫐', '𖫭'), ('𖫵', '𖫵'), ('𖬀', '𖬯'), @@ -5376,11 +5513,14 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𖽐', '𖾇'), ('𖾓', '𖾟'), ('𖿠', '𖿣'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -5390,6 +5530,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𛲐', '𛲙'), ('𛲜', '𛲜'), ('𛲟', '𛲟'), + ('𜽐', '𜿃'), ('𝀀', '𝃵'), ('𝄀', '𝄦'), ('𝄩', '𝅘𝅥𝅲'), @@ -5397,7 +5538,7 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𝅪', '𝅭'), ('𝆃', '𝆄'), ('𝆌', '𝆩'), - ('𝆮', '𝇨'), + ('𝆮', '𝇪'), ('𝈀', '𝉁'), ('𝉅', '𝉅'), ('𝋠', '𝋳'), @@ -5428,13 +5569,19 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('𝩭', '𝩴'), ('𝩶', '𝪃'), ('𝪅', '𝪋'), + ('𝼀', '𝼞'), ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅀', '𞅉'), ('𞅎', '𞅏'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), ('𞋰', '𞋹'), ('𞋿', '𞋿'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞣇', '𞣏'), ('𞤀', '𞥃'), @@ -5483,45 +5630,46 @@ pub const GRAPHEME_BASE: &'static [(char, char)] = &[ ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄀', '\u{1f1ad}'), + ('🄀', '🆭'), ('🇦', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), - ('🌀', '\u{1f6d7}'), - ('🛠', '🛬'), - ('🛰', '\u{1f6fc}'), + ('🌀', '🛗'), + ('🛝', '🛬'), + ('🛰', '🛼'), ('🜀', '🝳'), ('🞀', '🟘'), ('🟠', '🟫'), + ('🟰', '🟰'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('\u{1f8b0}', '\u{1f8b1}'), - ('🤀', '\u{1f978}'), - ('🥺', '\u{1f9cb}'), - ('🧍', '🩓'), + ('🢰', '🢱'), + ('🤀', '🩓'), ('🩠', '🩭'), - ('🩰', '\u{1fa74}'), - ('🩸', '🩺'), - ('🪀', '\u{1fa86}'), - ('🪐', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), - ('\u{1fb00}', '\u{1fb92}'), - ('\u{1fb94}', '\u{1fbca}'), - ('\u{1fbf0}', '\u{1fbf9}'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('🩰', '🩴'), + ('🩸', '🩼'), + ('🪀', '🪆'), + ('🪐', '🪬'), + ('🪰', '🪺'), + ('🫀', '🫅'), + ('🫐', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), + ('🬀', '🮒'), + ('🮔', '🯊'), + ('🯰', '🯹'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ @@ -5549,7 +5697,8 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{825}', '\u{827}'), ('\u{829}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{8e1}'), + ('\u{898}', '\u{89f}'), + ('\u{8ca}', '\u{8e1}'), ('\u{8e3}', '\u{902}'), ('\u{93a}', '\u{93a}'), ('\u{93c}', '\u{93c}'), @@ -5594,6 +5743,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{bd7}', '\u{bd7}'), ('\u{c00}', '\u{c00}'), ('\u{c04}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', '\u{c40}'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -5649,7 +5799,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{109d}', '\u{109d}'), ('\u{135d}', '\u{135f}'), ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1732}', '\u{1733}'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17b5}'), @@ -5658,6 +5808,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{17c9}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), ('\u{1920}', '\u{1922}'), @@ -5673,7 +5824,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{1a65}', '\u{1a6c}'), ('\u{1a73}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1b00}', '\u{1b03}'), ('\u{1b34}', '\u{1b3a}'), ('\u{1b3c}', '\u{1b3c}'), @@ -5695,8 +5846,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('\u{1cf8}', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{200c}', '\u{200c}'), ('\u{20d0}', '\u{20f0}'), ('\u{2cef}', '\u{2cf1}'), @@ -5755,11 +5905,15 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('\u{11001}', '\u{11001}'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '\u{11081}'), ('\u{110b3}', '\u{110b6}'), ('\u{110b9}', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{1112b}'), ('\u{1112d}', '\u{11134}'), @@ -5845,6 +5999,8 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{16f8f}', '\u{16f92}'), ('\u{16fe4}', '\u{16fe4}'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d165}'), ('\u{1d167}', '\u{1d169}'), ('\u{1d16e}', '\u{1d172}'), @@ -5864,6 +6020,7 @@ pub const GRAPHEME_EXTEND: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), @@ -5887,8 +6044,8 @@ pub const GRAPHEME_LINK: &'static [(char, char)] = &[ ('\u{eba}', '\u{eba}'), ('\u{f84}', '\u{f84}'), ('\u{1039}', '\u{103a}'), - ('\u{1714}', '\u{1714}'), - ('\u{1734}', '\u{1734}'), + ('\u{1714}', '᜕'), + ('᜴', '᜴'), ('\u{17d2}', '\u{17d2}'), ('\u{1a60}', '\u{1a60}'), ('᭄', '᭄'), @@ -5904,6 +6061,7 @@ pub const GRAPHEME_LINK: &'static [(char, char)] = &[ ('\u{abed}', '\u{abed}'), ('\u{10a3f}', '\u{10a3f}'), ('\u{11046}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), ('\u{1107f}', '\u{1107f}'), ('\u{110b9}', '\u{110b9}'), ('\u{11133}', '\u{11134}'), @@ -5918,7 +6076,7 @@ pub const GRAPHEME_LINK: &'static [(char, char)] = &[ ('𑚶', '𑚶'), ('\u{1172b}', '\u{1172b}'), ('\u{11839}', '\u{11839}'), - ('\u{1193d}', '\u{1193e}'), + ('𑤽', '\u{1193e}'), ('\u{119e0}', '\u{119e0}'), ('\u{11a34}', '\u{11a34}'), ('\u{11a47}', '\u{11a47}'), @@ -6007,9 +6165,9 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ࠀ', '\u{82d}'), ('ࡀ', '\u{85b}'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), - ('\u{8d3}', '\u{8e1}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('\u{898}', '\u{8e1}'), ('\u{8e3}', '\u{963}'), ('०', '९'), ('ॱ', 'ঃ'), @@ -6093,11 +6251,12 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ఎ', 'ఐ'), ('ఒ', 'న'), ('ప', 'హ'), - ('ఽ', 'ౄ'), + ('\u{c3c}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), ('\u{c55}', '\u{c56}'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', '\u{c63}'), ('౦', '౯'), ('ಀ', 'ಃ'), @@ -6110,7 +6269,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{cc6}', 'ೈ'), ('ೊ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), @@ -6193,9 +6352,8 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', '\u{1714}'), - ('ᜠ', '\u{1734}'), + ('ᜀ', '᜕'), + ('ᜟ', '᜴'), ('ᝀ', '\u{1753}'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -6205,7 +6363,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ៜ', '\u{17dd}'), ('០', '៩'), ('\u{180b}', '\u{180d}'), - ('᠐', '᠙'), + ('\u{180f}', '᠙'), ('ᠠ', 'ᡸ'), ('ᢀ', 'ᢪ'), ('ᢰ', 'ᣵ'), @@ -6224,8 +6382,8 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('᪐', '᪙'), ('ᪧ', 'ᪧ'), ('\u{1ab0}', '\u{1abd}'), - ('\u{1abf}', '\u{1ac0}'), - ('\u{1b00}', 'ᭋ'), + ('\u{1abf}', '\u{1ace}'), + ('\u{1b00}', 'ᭌ'), ('᭐', '᭙'), ('\u{1b6b}', '\u{1b73}'), ('\u{1b80}', '᯳'), @@ -6237,8 +6395,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('Ჽ', 'Ჿ'), ('\u{1cd0}', '\u{1cd2}'), ('\u{1cd4}', 'ᳺ'), - ('ᴀ', '\u{1df9}'), - ('\u{1dfb}', 'ἕ'), + ('ᴀ', 'ἕ'), ('Ἐ', 'Ἕ'), ('ἠ', 'ὅ'), ('Ὀ', 'Ὅ'), @@ -6278,9 +6435,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ⅅ', 'ⅉ'), ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳳ'), ('ⴀ', 'ⴥ'), ('ⴧ', 'ⴧ'), @@ -6307,11 +6462,10 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘫ'), @@ -6320,9 +6474,11 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ꙿ', '\u{a6f1}'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠧ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠧ'), ('\u{a82c}', '\u{a82c}'), ('ꡀ', 'ꡳ'), ('ꢀ', '\u{a8c5}'), @@ -6349,7 +6505,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab69}'), + ('ꭜ', 'ꭩ'), ('ꭰ', 'ꯪ'), ('꯬', '\u{abed}'), ('꯰', '꯹'), @@ -6411,9 +6567,20 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -6448,27 +6615,29 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), ('𐴰', '𐴹'), - ('\u{10e80}', '\u{10ea9}'), + ('𐺀', '𐺩'), ('\u{10eab}', '\u{10eac}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '\u{10f50}'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '\u{10f85}'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀀', '\u{11046}'), - ('𑁦', '𑁯'), + ('𑁦', '𑁵'), ('\u{1107f}', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('𑃐', '𑃨'), ('𑃰', '𑃹'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑄿'), - ('𑅄', '\u{11147}'), + ('𑅄', '𑅇'), ('𑅐', '\u{11173}'), ('𑅶', '𑅶'), ('\u{11180}', '𑇄'), ('\u{111c9}', '\u{111cc}'), - ('\u{111ce}', '𑇚'), + ('𑇎', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), ('𑈓', '\u{11237}'), @@ -6497,7 +6666,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{11370}', '\u{11374}'), ('𑐀', '𑑊'), ('𑑐', '𑑙'), - ('\u{1145e}', '\u{11461}'), + ('\u{1145e}', '𑑡'), ('𑒀', '𑓅'), ('𑓇', '𑓇'), ('𑓐', '𑓙'), @@ -6512,16 +6681,17 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜹'), + ('𑝀', '𑝆'), ('𑠀', '\u{1183a}'), ('𑢠', '𑣩'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{11943}'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑦠', '𑦧'), ('𑦪', '\u{119d7}'), ('\u{119da}', '𑧡'), @@ -6530,7 +6700,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{11a47}', '\u{11a47}'), ('𑩐', '\u{11a99}'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '\u{11c36}'), ('\u{11c38}', '𑱀'), @@ -6552,15 +6722,18 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𑶓', '𑶘'), ('𑶠', '𑶩'), ('𑻠', '𑻶'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), ('𖩠', '𖩩'), + ('𖩰', '𖪾'), + ('𖫀', '𖫉'), ('𖫐', '𖫭'), ('\u{16af0}', '\u{16af4}'), ('𖬀', '\u{16b36}'), @@ -6574,11 +6747,14 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), ('𖿣', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -6587,6 +6763,8 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𛲀', '𛲈'), ('𛲐', '𛲙'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -6630,6 +6808,7 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{1da84}', '\u{1da84}'), ('\u{1da9b}', '\u{1da9f}'), ('\u{1daa1}', '\u{1daaf}'), + ('𝼀', '𝼞'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), @@ -6639,7 +6818,12 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('\u{1e130}', '𞄽'), ('𞅀', '𞅉'), ('𞅎', '𞅎'), + ('𞊐', '\u{1e2ae}'), ('𞋀', '𞋹'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('\u{1e8d0}', '\u{1e8d6}'), ('𞤀', '𞥋'), @@ -6677,14 +6861,14 @@ pub const ID_CONTINUE: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('\u{1fbf0}', '\u{1fbf9}'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('🯰', '🯹'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ('\u{e0100}', '\u{e01ef}'), ]; @@ -6738,8 +6922,9 @@ pub const ID_START: &'static [(char, char)] = &[ ('ࠨ', 'ࠨ'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -6804,6 +6989,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ప', 'హ'), ('ఽ', 'ఽ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('ಀ', 'ಀ'), ('ಅ', 'ಌ'), @@ -6812,10 +6998,10 @@ pub const ID_START: &'static [(char, char)] = &[ ('ಪ', 'ಳ'), ('ವ', 'ಹ'), ('ಽ', 'ಽ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('\u{d04}', 'ഌ'), + ('ഄ', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -6883,9 +7069,8 @@ pub const ID_START: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), + ('ᜀ', 'ᜑ'), + ('ᜟ', 'ᜱ'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -6905,7 +7090,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ᨠ', 'ᩔ'), ('ᪧ', 'ᪧ'), ('ᬅ', 'ᬳ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('ᮃ', 'ᮠ'), ('ᮮ', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -6955,9 +7140,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ⅅ', 'ⅉ'), ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳮ'), ('Ⳳ', 'ⳳ'), ('ⴀ', 'ⴥ'), @@ -6984,11 +7167,10 @@ pub const ID_START: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘟ'), @@ -6998,9 +7180,11 @@ pub const ID_START: &'static [(char, char)] = &[ ('ꚠ', 'ꛯ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠁ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -7037,7 +7221,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab69}'), + ('ꭜ', 'ꭩ'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -7089,9 +7273,20 @@ pub const ID_START: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -7122,19 +7317,22 @@ pub const ID_START: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀃', '𑀷'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), - ('\u{11147}', '\u{11147}'), + ('𑅇', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -7160,7 +7358,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -7171,15 +7369,16 @@ pub const ID_START: &'static [(char, char)] = &[ ('𑚀', '𑚪'), ('𑚸', '𑚸'), ('𑜀', '𑜚'), + ('𑝀', '𑝆'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑦠', '𑦧'), ('𑦪', '𑧐'), ('𑧡', '𑧡'), @@ -7190,7 +7389,7 @@ pub const ID_START: &'static [(char, char)] = &[ ('𑩐', '𑩐'), ('𑩜', '𑪉'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰮'), ('𑱀', '𑱀'), @@ -7204,14 +7403,16 @@ pub const ID_START: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭀', '𖭃'), @@ -7224,9 +7425,12 @@ pub const ID_START: &'static [(char, char)] = &[ ('𖿠', '𖿡'), ('𖿣', '𖿣'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -7264,10 +7468,16 @@ pub const ID_START: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), + ('𝼀', '𝼞'), ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), ('𞥋', '𞥋'), @@ -7304,35 +7514,35 @@ pub const ID_START: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const IDEOGRAPHIC: &'static [(char, char)] = &[ ('〆', '〇'), ('〡', '〩'), ('〸', '〺'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), + ('㐀', '䶿'), + ('一', '鿿'), ('豈', '舘'), ('並', '龎'), ('\u{16fe4}', '\u{16fe4}'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), ('𛅰', '𛋻'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const JOIN_CONTROL: &'static [(char, char)] = &[('\u{200c}', '\u{200d}')]; @@ -7787,7 +7997,7 @@ pub const LOWERCASE: &'static [(char, char)] = &[ ('ⅰ', 'ⅿ'), ('ↄ', 'ↄ'), ('ⓐ', 'ⓩ'), - ('ⰰ', 'ⱞ'), + ('ⰰ', 'ⱟ'), ('ⱡ', 'ⱡ'), ('ⱥ', 'ⱦ'), ('ⱨ', 'ⱨ'), @@ -7955,19 +8165,33 @@ pub const LOWERCASE: &'static [(char, char)] = &[ ('ꞻ', 'ꞻ'), ('ꞽ', 'ꞽ'), ('ꞿ', 'ꞿ'), + ('ꟁ', 'ꟁ'), ('ꟃ', 'ꟃ'), - ('\u{a7c8}', '\u{a7c8}'), - ('\u{a7ca}', '\u{a7ca}'), - ('\u{a7f6}', '\u{a7f6}'), + ('ꟈ', 'ꟈ'), + ('ꟊ', 'ꟊ'), + ('ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟕ'), + ('ꟗ', 'ꟗ'), + ('ꟙ', 'ꟙ'), + ('ꟶ', 'ꟶ'), ('ꟸ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab68}'), + ('ꭜ', 'ꭨ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), ('a', 'z'), ('𐐨', '𐑏'), ('𐓘', '𐓻'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), + ('𐞀', '𐞀'), + ('𐞃', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐳀', '𐳲'), ('𑣀', '𑣟'), ('𖹠', '𖹿'), @@ -7999,6 +8223,8 @@ pub const LOWERCASE: &'static [(char, char)] = &[ ('𝞪', '𝟂'), ('𝟄', '𝟉'), ('𝟋', '𝟋'), + ('𝼀', '𝼉'), + ('𝼋', '𝼞'), ('𞤢', '𞥃'), ]; @@ -8281,6 +8507,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('ᩡ', '\u{1a74}'), ('\u{1abf}', '\u{1ac0}'), + ('\u{1acc}', '\u{1ace}'), ('\u{1b00}', 'ᬄ'), ('\u{1b35}', 'ᭃ'), ('\u{1b80}', 'ᮂ'), @@ -8325,14 +8552,16 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{10eab}', '\u{10eac}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11045}'), + ('\u{11073}', '\u{11074}'), ('𑂂', '𑂂'), ('𑂰', '𑂸'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{11132}'), ('𑅅', '𑅆'), ('\u{11180}', '𑆂'), ('𑆳', '𑆿'), - ('\u{111ce}', '\u{111cf}'), + ('𑇎', '\u{111cf}'), ('𑈬', '\u{11234}'), ('\u{11237}', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), @@ -8354,11 +8583,11 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b5}'), ('\u{1171d}', '\u{1172a}'), ('𑠬', '𑠸'), - ('\u{11930}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('\u{11930}', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{1193c}'), - ('\u{11940}', '\u{11940}'), - ('\u{11942}', '\u{11942}'), + ('𑥀', '𑥀'), + ('𑥂', '𑥂'), ('𑧑', '\u{119d7}'), ('\u{119da}', '𑧟'), ('𑧤', '𑧤'), @@ -8384,7 +8613,7 @@ pub const OTHER_ALPHABETIC: &'static [(char, char)] = &[ ('\u{16f4f}', '\u{16f4f}'), ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('\u{1bc9e}', '\u{1bc9e}'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), @@ -8466,6 +8695,10 @@ pub const OTHER_LOWERCASE: &'static [(char, char)] = &[ ('ꝰ', 'ꝰ'), ('ꟸ', 'ꟹ'), ('ꭜ', 'ꭟ'), + ('𐞀', '𐞀'), + ('𐞃', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ]; pub const OTHER_MATH: &'static [(char, char)] = &[ @@ -8651,13 +8884,14 @@ pub const PREPENDED_CONCATENATION_MARK: &'static [(char, char)] = &[ ('\u{600}', '\u{605}'), ('\u{6dd}', '\u{6dd}'), ('\u{70f}', '\u{70f}'), + ('\u{890}', '\u{891}'), ('\u{8e2}', '\u{8e2}'), ('\u{110bd}', '\u{110bd}'), ('\u{110cd}', '\u{110cd}'), ]; pub const QUOTATION_MARK: &'static [(char, char)] = &[ - ('\"', '\"'), + ('"', '"'), ('\'', '\''), ('«', '«'), ('»', '»'), @@ -8682,7 +8916,7 @@ pub const SENTENCE_TERMINAL: &'static [(char, char)] = &[ ('.', '.'), ('?', '?'), ('։', '։'), - ('؞', '؟'), + ('؝', '؟'), ('۔', '۔'), ('܀', '܂'), ('߹', '߹'), @@ -8701,12 +8935,14 @@ pub const SENTENCE_TERMINAL: &'static [(char, char)] = &[ ('᪨', '᪫'), ('᭚', '᭛'), ('᭞', '᭟'), + ('᭽', '᭾'), ('᰻', '᰼'), ('᱾', '᱿'), ('‼', '‽'), ('⁇', '⁉'), ('⸮', '⸮'), ('⸼', '⸼'), + ('⹓', '⹔'), ('。', '。'), ('꓿', '꓿'), ('꘎', '꘏'), @@ -8727,6 +8963,7 @@ pub const SENTENCE_TERMINAL: &'static [(char, char)] = &[ ('。', '。'), ('𐩖', '𐩗'), ('𐽕', '𐽙'), + ('𐾆', '𐾉'), ('𑁇', '𑁈'), ('𑂾', '𑃁'), ('𑅁', '𑅃'), @@ -8741,8 +8978,8 @@ pub const SENTENCE_TERMINAL: &'static [(char, char)] = &[ ('𑗉', '𑗗'), ('𑙁', '𑙂'), ('𑜼', '𑜾'), - ('\u{11944}', '\u{11944}'), - ('\u{11946}', '\u{11946}'), + ('𑥄', '𑥄'), + ('𑥆', '𑥆'), ('𑩂', '𑩃'), ('𑪛', '𑪜'), ('𑱁', '𑱂'), @@ -8788,6 +9025,7 @@ pub const SOFT_DOTTED: &'static [(char, char)] = &[ ('𝘪', '𝘫'), ('𝙞', '𝙟'), ('𝚒', '𝚓'), + ('𝼚', '𝼚'), ]; pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ @@ -8802,7 +9040,7 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('׃', '׃'), ('،', '،'), ('؛', '؛'), - ('؞', '؟'), + ('؝', '؟'), ('۔', '۔'), ('܀', '܊'), ('܌', '܌'), @@ -8826,6 +9064,7 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('᪨', '᪫'), ('᭚', '᭛'), ('᭝', '᭟'), + ('᭽', '᭾'), ('᰻', '᰿'), ('᱾', '᱿'), ('‼', '‽'), @@ -8835,6 +9074,7 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('⹁', '⹁'), ('⹌', '⹌'), ('⹎', '⹏'), + ('⹓', '⹔'), ('、', '。'), ('꓾', '꓿'), ('꘍', '꘏'), @@ -8865,6 +9105,7 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('𐬺', '𐬿'), ('𐮙', '𐮜'), ('𐽕', '𐽙'), + ('𐾆', '𐾉'), ('𑁇', '𑁍'), ('𑂾', '𑃁'), ('𑅁', '𑅃'), @@ -8874,13 +9115,13 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ('𑈸', '𑈼'), ('𑊩', '𑊩'), ('𑑋', '𑑍'), - ('\u{1145a}', '𑑛'), + ('𑑚', '𑑛'), ('𑗂', '𑗅'), ('𑗉', '𑗗'), ('𑙁', '𑙂'), ('𑜼', '𑜾'), - ('\u{11944}', '\u{11944}'), - ('\u{11946}', '\u{11946}'), + ('𑥄', '𑥄'), + ('𑥆', '𑥆'), ('𑩂', '𑩃'), ('𑪛', '𑪜'), ('𑪡', '𑪢'), @@ -8898,8 +9139,8 @@ pub const TERMINAL_PUNCTUATION: &'static [(char, char)] = &[ ]; pub const UNIFIED_IDEOGRAPH: &'static [(char, char)] = &[ - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), + ('㐀', '䶿'), + ('一', '鿿'), ('﨎', '﨏'), ('﨑', '﨑'), ('﨓', '﨔'), @@ -8907,12 +9148,12 @@ pub const UNIFIED_IDEOGRAPH: &'static [(char, char)] = &[ ('﨡', '﨡'), ('﨣', '﨤'), ('﨧', '﨩'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const UPPERCASE: &'static [(char, char)] = &[ @@ -9349,7 +9590,7 @@ pub const UPPERCASE: &'static [(char, char)] = &[ ('Ⅰ', 'Ⅿ'), ('Ↄ', 'Ↄ'), ('Ⓐ', 'Ⓩ'), - ('Ⰰ', 'Ⱞ'), + ('Ⰰ', 'Ⱟ'), ('Ⱡ', 'Ⱡ'), ('Ɫ', 'Ɽ'), ('Ⱨ', 'Ⱨ'), @@ -9514,13 +9755,21 @@ pub const UPPERCASE: &'static [(char, char)] = &[ ('Ꞻ', 'Ꞻ'), ('Ꞽ', 'Ꞽ'), ('Ꞿ', 'Ꞿ'), + ('Ꟁ', 'Ꟁ'), ('Ꟃ', 'Ꟃ'), - ('Ꞔ', '\u{a7c7}'), - ('\u{a7c9}', '\u{a7c9}'), - ('\u{a7f5}', '\u{a7f5}'), + ('Ꞔ', 'Ꟈ'), + ('Ꟊ', 'Ꟊ'), + ('Ꟑ', 'Ꟑ'), + ('Ꟗ', 'Ꟗ'), + ('Ꟙ', 'Ꟙ'), + ('Ꟶ', 'Ꟶ'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), ('𐲀', '𐲲'), ('𑢠', '𑢿'), ('𖹀', '𖹟'), @@ -9563,6 +9812,7 @@ pub const UPPERCASE: &'static [(char, char)] = &[ pub const VARIATION_SELECTOR: &'static [(char, char)] = &[ ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{fe00}', '\u{fe0f}'), ('\u{e0100}', '\u{e01ef}'), ]; @@ -9632,9 +9882,9 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ࠀ', '\u{82d}'), ('ࡀ', '\u{85b}'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), - ('\u{8d3}', '\u{8e1}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('\u{898}', '\u{8e1}'), ('\u{8e3}', '\u{963}'), ('०', '९'), ('ॱ', 'ঃ'), @@ -9718,11 +9968,12 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ఎ', 'ఐ'), ('ఒ', 'న'), ('ప', 'హ'), - ('ఽ', 'ౄ'), + ('\u{c3c}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), ('\u{c55}', '\u{c56}'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', '\u{c63}'), ('౦', '౯'), ('ಀ', 'ಃ'), @@ -9735,7 +9986,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{cc6}', 'ೈ'), ('ೊ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), @@ -9818,9 +10069,8 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', '\u{1714}'), - ('ᜠ', '\u{1734}'), + ('ᜀ', '᜕'), + ('ᜟ', '᜴'), ('ᝀ', '\u{1753}'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -9830,7 +10080,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ៜ', '\u{17dd}'), ('០', '៩'), ('\u{180b}', '\u{180d}'), - ('᠐', '᠙'), + ('\u{180f}', '᠙'), ('ᠠ', 'ᡸ'), ('ᢀ', 'ᢪ'), ('ᢰ', 'ᣵ'), @@ -9849,8 +10099,8 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('᪐', '᪙'), ('ᪧ', 'ᪧ'), ('\u{1ab0}', '\u{1abd}'), - ('\u{1abf}', '\u{1ac0}'), - ('\u{1b00}', 'ᭋ'), + ('\u{1abf}', '\u{1ace}'), + ('\u{1b00}', 'ᭌ'), ('᭐', '᭙'), ('\u{1b6b}', '\u{1b73}'), ('\u{1b80}', '᯳'), @@ -9862,8 +10112,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('Ჽ', 'Ჿ'), ('\u{1cd0}', '\u{1cd2}'), ('\u{1cd4}', 'ᳺ'), - ('ᴀ', '\u{1df9}'), - ('\u{1dfb}', 'ἕ'), + ('ᴀ', 'ἕ'), ('Ἐ', 'Ἕ'), ('ἠ', 'ὅ'), ('Ὀ', 'Ὅ'), @@ -9903,9 +10152,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ⅅ', 'ⅉ'), ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳳ'), ('ⴀ', 'ⴥ'), ('ⴧ', 'ⴧ'), @@ -9933,11 +10180,10 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘫ'), @@ -9946,9 +10192,11 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ꙿ', '\u{a6f1}'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠧ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠧ'), ('\u{a82c}', '\u{a82c}'), ('ꡀ', 'ꡳ'), ('ꢀ', '\u{a8c5}'), @@ -9975,7 +10223,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab69}'), + ('ꭜ', 'ꭩ'), ('ꭰ', 'ꯪ'), ('꯬', '\u{abed}'), ('꯰', '꯹'), @@ -10043,9 +10291,20 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -10080,27 +10339,29 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𐳀', '𐳲'), ('𐴀', '\u{10d27}'), ('𐴰', '𐴹'), - ('\u{10e80}', '\u{10ea9}'), + ('𐺀', '𐺩'), ('\u{10eab}', '\u{10eac}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '\u{10f50}'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '\u{10f85}'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀀', '\u{11046}'), - ('𑁦', '𑁯'), + ('𑁦', '𑁵'), ('\u{1107f}', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('𑃐', '𑃨'), ('𑃰', '𑃹'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑄿'), - ('𑅄', '\u{11147}'), + ('𑅄', '𑅇'), ('𑅐', '\u{11173}'), ('𑅶', '𑅶'), ('\u{11180}', '𑇄'), ('\u{111c9}', '\u{111cc}'), - ('\u{111ce}', '𑇚'), + ('𑇎', '𑇚'), ('𑇜', '𑇜'), ('𑈀', '𑈑'), ('𑈓', '\u{11237}'), @@ -10129,7 +10390,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{11370}', '\u{11374}'), ('𑐀', '𑑊'), ('𑑐', '𑑙'), - ('\u{1145e}', '\u{11461}'), + ('\u{1145e}', '𑑡'), ('𑒀', '𑓅'), ('𑓇', '𑓇'), ('𑓐', '𑓙'), @@ -10144,16 +10405,17 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜹'), + ('𑝀', '𑝆'), ('𑠀', '\u{1183a}'), ('𑢠', '𑣩'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{11943}'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑦠', '𑦧'), ('𑦪', '\u{119d7}'), ('\u{119da}', '𑧡'), @@ -10162,7 +10424,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{11a47}', '\u{11a47}'), ('𑩐', '\u{11a99}'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '\u{11c36}'), ('\u{11c38}', '𑱀'), @@ -10184,15 +10446,18 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𑶓', '𑶘'), ('𑶠', '𑶩'), ('𑻠', '𑻶'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), ('𖩠', '𖩩'), + ('𖩰', '𖪾'), + ('𖫀', '𖫉'), ('𖫐', '𖫭'), ('\u{16af0}', '\u{16af4}'), ('𖬀', '\u{16b36}'), @@ -10206,11 +10471,14 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{16f8f}', '𖾟'), ('𖿠', '𖿡'), ('𖿣', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -10219,6 +10487,8 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𛲀', '𛲈'), ('𛲐', '𛲙'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -10262,6 +10532,7 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{1da84}', '\u{1da84}'), ('\u{1da9b}', '\u{1da9f}'), ('\u{1daa1}', '\u{1daaf}'), + ('𝼀', '𝼞'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), @@ -10271,7 +10542,12 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('\u{1e130}', '𞄽'), ('𞅀', '𞅉'), ('𞅎', '𞅎'), + ('𞊐', '\u{1e2ae}'), ('𞋀', '𞋹'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('\u{1e8d0}', '\u{1e8d6}'), ('𞤀', '𞥋'), @@ -10309,14 +10585,14 @@ pub const XID_CONTINUE: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('\u{1fbf0}', '\u{1fbf9}'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('🯰', '🯹'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ('\u{e0100}', '\u{e01ef}'), ]; @@ -10370,8 +10646,9 @@ pub const XID_START: &'static [(char, char)] = &[ ('ࠨ', 'ࠨ'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -10436,6 +10713,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ప', 'హ'), ('ఽ', 'ఽ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('ಀ', 'ಀ'), ('ಅ', 'ಌ'), @@ -10444,10 +10722,10 @@ pub const XID_START: &'static [(char, char)] = &[ ('ಪ', 'ಳ'), ('ವ', 'ಹ'), ('ಽ', 'ಽ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('\u{d04}', 'ഌ'), + ('ഄ', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -10515,9 +10793,8 @@ pub const XID_START: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), + ('ᜀ', 'ᜑ'), + ('ᜟ', 'ᜱ'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -10537,7 +10814,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ᨠ', 'ᩔ'), ('ᪧ', 'ᪧ'), ('ᬅ', 'ᬳ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('ᮃ', 'ᮠ'), ('ᮮ', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -10587,9 +10864,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ⅅ', 'ⅉ'), ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳮ'), ('Ⳳ', 'ⳳ'), ('ⴀ', 'ⴥ'), @@ -10616,11 +10891,10 @@ pub const XID_START: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘟ'), @@ -10630,9 +10904,11 @@ pub const XID_START: &'static [(char, char)] = &[ ('ꚠ', 'ꛯ'), ('ꜗ', 'ꜟ'), ('Ꜣ', 'ꞈ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠁ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -10669,7 +10945,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab69}'), + ('ꭜ', 'ꭩ'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -10728,9 +11004,20 @@ pub const XID_START: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -10761,19 +11048,22 @@ pub const XID_START: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀃', '𑀷'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), - ('\u{11147}', '\u{11147}'), + ('𑅇', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -10799,7 +11089,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -10810,15 +11100,16 @@ pub const XID_START: &'static [(char, char)] = &[ ('𑚀', '𑚪'), ('𑚸', '𑚸'), ('𑜀', '𑜚'), + ('𑝀', '𑝆'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑦠', '𑦧'), ('𑦪', '𑧐'), ('𑧡', '𑧡'), @@ -10829,7 +11120,7 @@ pub const XID_START: &'static [(char, char)] = &[ ('𑩐', '𑩐'), ('𑩜', '𑪉'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰮'), ('𑱀', '𑱀'), @@ -10843,14 +11134,16 @@ pub const XID_START: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭀', '𖭃'), @@ -10863,9 +11156,12 @@ pub const XID_START: &'static [(char, char)] = &[ ('𖿠', '𖿡'), ('𖿣', '𖿣'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -10903,10 +11199,16 @@ pub const XID_START: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), + ('𝼀', '𝼞'), ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), ('𞥋', '𞥋'), @@ -10943,11 +11245,11 @@ pub const XID_START: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; diff --git a/regex-syntax/src/unicode_tables/property_names.rs b/regex-syntax/src/unicode_tables/property_names.rs index 6393df2f86..3fce1bf032 100644 --- a/regex-syntax/src/unicode_tables/property_names.rs +++ b/regex-syntax/src/unicode_tables/property_names.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-names ucd-13.0.0 +// ucd-generate property-names /tmp/ucd // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const PROPERTY_NAMES: &'static [(&'static str, &'static str)] = &[ ("age", "Age"), diff --git a/regex-syntax/src/unicode_tables/property_values.rs b/regex-syntax/src/unicode_tables/property_values.rs index c46653a7b8..08a91477bf 100644 --- a/regex-syntax/src/unicode_tables/property_values.rs +++ b/regex-syntax/src/unicode_tables/property_values.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate property-values ucd-13.0.0 --include gc,script,scx,age,gcb,wb,sb +// ucd-generate property-values /tmp/ucd --include gc,script,scx,age,gcb,wb,sb // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const PROPERTY_VALUES: &'static [( &'static str, @@ -19,6 +19,7 @@ pub const PROPERTY_VALUES: &'static [( ("12.0", "V12_0"), ("12.1", "V12_1"), ("13.0", "V13_0"), + ("14.0", "V14_0"), ("2.0", "V2_0"), ("2.1", "V2_1"), ("3.0", "V3_0"), @@ -44,6 +45,7 @@ pub const PROPERTY_VALUES: &'static [( ("v120", "V12_0"), ("v121", "V12_1"), ("v130", "V13_0"), + ("v140", "V14_0"), ("v20", "V2_0"), ("v21", "V2_1"), ("v30", "V3_0"), @@ -233,9 +235,11 @@ pub const PROPERTY_VALUES: &'static [( ("common", "Common"), ("copt", "Coptic"), ("coptic", "Coptic"), + ("cpmn", "Cypro_Minoan"), ("cprt", "Cypriot"), ("cuneiform", "Cuneiform"), ("cypriot", "Cypriot"), + ("cyprominoan", "Cypro_Minoan"), ("cyrillic", "Cyrillic"), ("cyrl", "Cyrillic"), ("deseret", "Deseret"), @@ -391,6 +395,7 @@ pub const PROPERTY_VALUES: &'static [( ("oldsogdian", "Old_Sogdian"), ("oldsoutharabian", "Old_South_Arabian"), ("oldturkic", "Old_Turkic"), + ("olduyghur", "Old_Uyghur"), ("oriya", "Oriya"), ("orkh", "Old_Turkic"), ("orya", "Oriya"), @@ -398,6 +403,7 @@ pub const PROPERTY_VALUES: &'static [( ("osge", "Osage"), ("osma", "Osmanya"), ("osmanya", "Osmanya"), + ("ougr", "Old_Uyghur"), ("pahawhhmong", "Pahawh_Hmong"), ("palm", "Palmyrene"), ("palmyrene", "Palmyrene"), @@ -462,6 +468,7 @@ pub const PROPERTY_VALUES: &'static [( ("tamil", "Tamil"), ("taml", "Tamil"), ("tang", "Tangut"), + ("tangsa", "Tangsa"), ("tangut", "Tangut"), ("tavt", "Tai_Viet"), ("telu", "Telugu"), @@ -476,11 +483,15 @@ pub const PROPERTY_VALUES: &'static [( ("tifinagh", "Tifinagh"), ("tirh", "Tirhuta"), ("tirhuta", "Tirhuta"), + ("tnsa", "Tangsa"), + ("toto", "Toto"), ("ugar", "Ugaritic"), ("ugaritic", "Ugaritic"), ("unknown", "Unknown"), ("vai", "Vai"), ("vaii", "Vai"), + ("vith", "Vithkuqi"), + ("vithkuqi", "Vithkuqi"), ("wancho", "Wancho"), ("wara", "Warang_Citi"), ("warangciti", "Warang_Citi"), @@ -550,9 +561,11 @@ pub const PROPERTY_VALUES: &'static [( ("common", "Common"), ("copt", "Coptic"), ("coptic", "Coptic"), + ("cpmn", "Cypro_Minoan"), ("cprt", "Cypriot"), ("cuneiform", "Cuneiform"), ("cypriot", "Cypriot"), + ("cyprominoan", "Cypro_Minoan"), ("cyrillic", "Cyrillic"), ("cyrl", "Cyrillic"), ("deseret", "Deseret"), @@ -708,6 +721,7 @@ pub const PROPERTY_VALUES: &'static [( ("oldsogdian", "Old_Sogdian"), ("oldsoutharabian", "Old_South_Arabian"), ("oldturkic", "Old_Turkic"), + ("olduyghur", "Old_Uyghur"), ("oriya", "Oriya"), ("orkh", "Old_Turkic"), ("orya", "Oriya"), @@ -715,6 +729,7 @@ pub const PROPERTY_VALUES: &'static [( ("osge", "Osage"), ("osma", "Osmanya"), ("osmanya", "Osmanya"), + ("ougr", "Old_Uyghur"), ("pahawhhmong", "Pahawh_Hmong"), ("palm", "Palmyrene"), ("palmyrene", "Palmyrene"), @@ -779,6 +794,7 @@ pub const PROPERTY_VALUES: &'static [( ("tamil", "Tamil"), ("taml", "Tamil"), ("tang", "Tangut"), + ("tangsa", "Tangsa"), ("tangut", "Tangut"), ("tavt", "Tai_Viet"), ("telu", "Telugu"), @@ -793,11 +809,15 @@ pub const PROPERTY_VALUES: &'static [( ("tifinagh", "Tifinagh"), ("tirh", "Tirhuta"), ("tirhuta", "Tirhuta"), + ("tnsa", "Tangsa"), + ("toto", "Toto"), ("ugar", "Ugaritic"), ("ugaritic", "Ugaritic"), ("unknown", "Unknown"), ("vai", "Vai"), ("vaii", "Vai"), + ("vith", "Vithkuqi"), + ("vithkuqi", "Vithkuqi"), ("wancho", "Wancho"), ("wara", "Warang_Citi"), ("warangciti", "Warang_Citi"), diff --git a/regex-syntax/src/unicode_tables/script.rs b/regex-syntax/src/unicode_tables/script.rs index cd86cba0d0..3327b76aed 100644 --- a/regex-syntax/src/unicode_tables/script.rs +++ b/regex-syntax/src/unicode_tables/script.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate script ucd-13.0.0 --chars +// ucd-generate script /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Adlam", ADLAM), @@ -35,6 +35,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Coptic", COPTIC), ("Cuneiform", CUNEIFORM), ("Cypriot", CYPRIOT), + ("Cypro_Minoan", CYPRO_MINOAN), ("Cyrillic", CYRILLIC), ("Deseret", DESERET), ("Devanagari", DEVANAGARI), @@ -118,6 +119,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Old_Sogdian", OLD_SOGDIAN), ("Old_South_Arabian", OLD_SOUTH_ARABIAN), ("Old_Turkic", OLD_TURKIC), + ("Old_Uyghur", OLD_UYGHUR), ("Oriya", ORIYA), ("Osage", OSAGE), ("Osmanya", OSMANYA), @@ -149,6 +151,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Tai_Viet", TAI_VIET), ("Takri", TAKRI), ("Tamil", TAMIL), + ("Tangsa", TANGSA), ("Tangut", TANGUT), ("Telugu", TELUGU), ("Thaana", THAANA), @@ -156,8 +159,10 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Tibetan", TIBETAN), ("Tifinagh", TIFINAGH), ("Tirhuta", TIRHUTA), + ("Toto", TOTO), ("Ugaritic", UGARITIC), ("Vai", VAI), + ("Vithkuqi", VITHKUQI), ("Wancho", WANCHO), ("Warang_Citi", WARANG_CITI), ("Yezidi", YEZIDI), @@ -169,7 +174,7 @@ pub const ADLAM: &'static [(char, char)] = &[('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞥞', '𞥟')]; pub const AHOM: &'static [(char, char)] = - &[('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜿')]; + &[('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑝆')]; pub const ANATOLIAN_HIEROGLYPHS: &'static [(char, char)] = &[('𔐀', '𔙆')]; @@ -177,23 +182,23 @@ pub const ARABIC: &'static [(char, char)] = &[ ('\u{600}', '\u{604}'), ('؆', '؋'), ('؍', '\u{61a}'), - ('\u{61c}', '\u{61c}'), - ('؞', '؞'), + ('\u{61c}', '؞'), ('ؠ', 'ؿ'), ('ف', 'ي'), ('\u{656}', 'ٯ'), ('ٱ', '\u{6dc}'), ('۞', 'ۿ'), ('ݐ', 'ݿ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), - ('\u{8d3}', '\u{8e1}'), + ('ࡰ', 'ࢎ'), + ('\u{890}', '\u{891}'), + ('\u{898}', '\u{8e1}'), ('\u{8e3}', '\u{8ff}'), - ('ﭐ', '﯁'), + ('ﭐ', '﯂'), ('ﯓ', 'ﴽ'), - ('ﵐ', 'ﶏ'), + ('﵀', 'ﶏ'), ('ﶒ', 'ﷇ'), - ('ﷰ', '﷽'), + ('﷏', '﷏'), + ('ﷰ', '﷿'), ('ﹰ', 'ﹴ'), ('ﹶ', 'ﻼ'), ('𐹠', '𐹾'), @@ -238,7 +243,7 @@ pub const ARMENIAN: &'static [(char, char)] = pub const AVESTAN: &'static [(char, char)] = &[('𐬀', '𐬵'), ('𐬹', '𐬿')]; -pub const BALINESE: &'static [(char, char)] = &[('\u{1b00}', 'ᭋ'), ('᭐', '᭼')]; +pub const BALINESE: &'static [(char, char)] = &[('\u{1b00}', 'ᭌ'), ('᭐', '᭾')]; pub const BAMUM: &'static [(char, char)] = &[('ꚠ', '꛷'), ('𖠀', '𖨸')]; @@ -268,10 +273,10 @@ pub const BHAIKSUKI: &'static [(char, char)] = &[('𑰀', '𑰈'), ('𑰊', '\u{11c36}'), ('\u{11c38}', '𑱅'), ('𑱐', '𑱬')]; pub const BOPOMOFO: &'static [(char, char)] = - &[('˪', '˫'), ('ㄅ', 'ㄯ'), ('ㆠ', '\u{31bf}')]; + &[('˪', '˫'), ('ㄅ', 'ㄯ'), ('ㆠ', 'ㆿ')]; pub const BRAHMI: &'static [(char, char)] = - &[('𑀀', '𑁍'), ('𑁒', '𑁯'), ('\u{1107f}', '\u{1107f}')]; + &[('𑀀', '𑁍'), ('𑁒', '𑁵'), ('\u{1107f}', '\u{1107f}')]; pub const BRAILLE: &'static [(char, char)] = &[('⠀', '⣿')]; @@ -280,7 +285,7 @@ pub const BUGINESE: &'static [(char, char)] = &[('ᨀ', '\u{1a1b}'), ('᨞', ' pub const BUHID: &'static [(char, char)] = &[('ᝀ', '\u{1753}')]; pub const CANADIAN_ABORIGINAL: &'static [(char, char)] = - &[('᐀', 'ᙿ'), ('ᢰ', 'ᣵ')]; + &[('᐀', 'ᙿ'), ('ᢰ', 'ᣵ'), ('𑪰', '𑪿')]; pub const CARIAN: &'static [(char, char)] = &[('𐊠', '𐋐')]; @@ -288,7 +293,7 @@ pub const CAUCASIAN_ALBANIAN: &'static [(char, char)] = &[('𐔰', '𐕣'), ('𐕯', '𐕯')]; pub const CHAKMA: &'static [(char, char)] = - &[('\u{11100}', '\u{11134}'), ('𑄶', '\u{11147}')]; + &[('\u{11100}', '\u{11134}'), ('𑄶', '𑅇')]; pub const CHAM: &'static [(char, char)] = &[('ꨀ', '\u{aa36}'), ('ꩀ', 'ꩍ'), ('꩐', '꩙'), ('꩜', '꩟')]; @@ -296,10 +301,10 @@ pub const CHAM: &'static [(char, char)] = pub const CHEROKEE: &'static [(char, char)] = &[('Ꭰ', 'Ᏽ'), ('ᏸ', 'ᏽ'), ('ꭰ', 'ꮿ')]; -pub const CHORASMIAN: &'static [(char, char)] = &[('\u{10fb0}', '\u{10fcb}')]; +pub const CHORASMIAN: &'static [(char, char)] = &[('𐾰', '𐿋')]; pub const COMMON: &'static [(char, char)] = &[ - ('\u{0}', '@'), + ('\0', '@'), ('[', '`'), ('{', '©'), ('«', '¹'), @@ -339,7 +344,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('\u{2066}', '⁰'), ('⁴', '⁾'), ('₀', '₎'), - ('₠', '₿'), + ('₠', '⃀'), ('℀', '℥'), ('℧', '℩'), ('ℬ', 'ℱ'), @@ -351,8 +356,8 @@ pub const COMMON: &'static [(char, char)] = &[ ('①', '⟿'), ('⤀', '⭳'), ('⭶', '⮕'), - ('\u{2b97}', '⯿'), - ('⸀', '\u{2e52}'), + ('⮗', '⯿'), + ('⸀', '⹝'), ('⿰', '⿻'), ('\u{3000}', '〄'), ('〆', '〆'), @@ -375,7 +380,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('꤮', '꤮'), ('ꧏ', 'ꧏ'), ('꭛', '꭛'), - ('\u{ab6a}', '\u{ab6b}'), + ('꭪', '꭫'), ('﴾', '﴿'), ('︐', '︙'), ('︰', '﹒'), @@ -393,18 +398,18 @@ pub const COMMON: &'static [(char, char)] = &[ ('𐄀', '𐄂'), ('𐄇', '𐄳'), ('𐄷', '𐄿'), - ('𐆐', '\u{1019c}'), + ('𐆐', '𐆜'), ('𐇐', '𐇼'), ('𐋡', '𐋻'), - ('𖿢', '𖿣'), ('\u{1bca0}', '\u{1bca3}'), + ('𜽐', '𜿃'), ('𝀀', '𝃵'), ('𝄀', '𝄦'), ('𝄩', '𝅦'), ('𝅪', '\u{1d17a}'), ('𝆃', '𝆄'), ('𝆌', '𝆩'), - ('𝆮', '𝇨'), + ('𝆮', '𝇪'), ('𝋠', '𝋳'), ('𝌀', '𝍖'), ('𝍠', '𝍸'), @@ -437,39 +442,40 @@ pub const COMMON: &'static [(char, char)] = &[ ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄀', '\u{1f1ad}'), + ('🄀', '🆭'), ('🇦', '🇿'), ('🈁', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉐', '🉑'), ('🉠', '🉥'), - ('🌀', '\u{1f6d7}'), - ('🛠', '🛬'), - ('🛰', '\u{1f6fc}'), + ('🌀', '🛗'), + ('🛝', '🛬'), + ('🛰', '🛼'), ('🜀', '🝳'), ('🞀', '🟘'), ('🟠', '🟫'), + ('🟰', '🟰'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('\u{1f8b0}', '\u{1f8b1}'), - ('🤀', '\u{1f978}'), - ('🥺', '\u{1f9cb}'), - ('🧍', '🩓'), + ('🢰', '🢱'), + ('🤀', '🩓'), ('🩠', '🩭'), - ('🩰', '\u{1fa74}'), - ('🩸', '🩺'), - ('🪀', '\u{1fa86}'), - ('🪐', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), - ('\u{1fb00}', '\u{1fb92}'), - ('\u{1fb94}', '\u{1fbca}'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🩰', '🩴'), + ('🩸', '🩼'), + ('🪀', '🪆'), + ('🪐', '🪬'), + ('🪰', '🪺'), + ('🫀', '🫅'), + ('🫐', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), + ('🬀', '🮒'), + ('🮔', '🯊'), + ('🯰', '🯹'), ('\u{e0001}', '\u{e0001}'), ('\u{e0020}', '\u{e007f}'), ]; @@ -483,6 +489,8 @@ pub const CUNEIFORM: &'static [(char, char)] = pub const CYPRIOT: &'static [(char, char)] = &[('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), ('𐠷', '𐠸'), ('𐠼', '𐠼'), ('𐠿', '𐠿')]; +pub const CYPRO_MINOAN: &'static [(char, char)] = &[('𒾐', '𒿲')]; + pub const CYRILLIC: &'static [(char, char)] = &[ ('Ѐ', '\u{484}'), ('\u{487}', 'ԯ'), @@ -504,14 +512,14 @@ pub const DEVANAGARI: &'static [(char, char)] = &[ ]; pub const DIVES_AKURU: &'static [(char, char)] = &[ - ('\u{11900}', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), - ('\u{1193b}', '\u{11946}'), - ('\u{11950}', '\u{11959}'), + ('𑤀', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤵'), + ('𑤷', '𑤸'), + ('\u{1193b}', '𑥆'), + ('𑥐', '𑥙'), ]; pub const DOGRA: &'static [(char, char)] = &[('𑠀', '𑠻')]; @@ -559,6 +567,10 @@ pub const ETHIOPIC: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ]; pub const GEORGIAN: &'static [(char, char)] = &[ @@ -575,8 +587,7 @@ pub const GEORGIAN: &'static [(char, char)] = &[ ]; pub const GLAGOLITIC: &'static [(char, char)] = &[ - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), + ('Ⰰ', 'ⱟ'), ('\u{1e000}', '\u{1e006}'), ('\u{1e008}', '\u{1e018}'), ('\u{1e01b}', '\u{1e021}'), @@ -696,18 +707,19 @@ pub const HAN: &'static [(char, char)] = &[ ('〇', '〇'), ('〡', '〩'), ('〸', '〻'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), + ('㐀', '䶿'), + ('一', '鿿'), ('豈', '舘'), ('並', '龎'), - ('\u{16ff0}', '\u{16ff1}'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𖿢', '𖿣'), + ('𖿰', '𖿱'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const HANGUL: &'static [(char, char)] = &[ @@ -730,7 +742,7 @@ pub const HANGUL: &'static [(char, char)] = &[ pub const HANIFI_ROHINGYA: &'static [(char, char)] = &[('𐴀', '\u{10d27}'), ('𐴰', '𐴹')]; -pub const HANUNOO: &'static [(char, char)] = &[('ᜠ', '\u{1734}')]; +pub const HANUNOO: &'static [(char, char)] = &[('ᜠ', '᜴')]; pub const HATRAN: &'static [(char, char)] = &[('𐣠', '𐣲'), ('𐣴', '𐣵'), ('𐣻', '𐣿')]; @@ -748,7 +760,7 @@ pub const HEBREW: &'static [(char, char)] = &[ ]; pub const HIRAGANA: &'static [(char, char)] = - &[('ぁ', 'ゖ'), ('ゝ', 'ゟ'), ('𛀁', '𛄞'), ('𛅐', '𛅒'), ('🈀', '🈀')]; + &[('ぁ', 'ゖ'), ('ゝ', 'ゟ'), ('𛀁', '𛄟'), ('𛅐', '𛅒'), ('🈀', '🈀')]; pub const IMPERIAL_ARAMAIC: &'static [(char, char)] = &[('𐡀', '𐡕'), ('𐡗', '𐡟')]; @@ -759,15 +771,14 @@ pub const INHERITED: &'static [(char, char)] = &[ ('\u{64b}', '\u{655}'), ('\u{670}', '\u{670}'), ('\u{951}', '\u{954}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1cd0}', '\u{1cd2}'), ('\u{1cd4}', '\u{1ce0}'), ('\u{1ce2}', '\u{1ce8}'), ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('\u{1cf8}', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{200c}', '\u{200d}'), ('\u{20d0}', '\u{20f0}'), ('\u{302a}', '\u{302d}'), @@ -777,6 +788,8 @@ pub const INHERITED: &'static [(char, char)] = &[ ('\u{101fd}', '\u{101fd}'), ('\u{102e0}', '\u{102e0}'), ('\u{1133b}', '\u{1133b}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d167}', '\u{1d169}'), ('\u{1d17b}', '\u{1d182}'), ('\u{1d185}', '\u{1d18b}'), @@ -794,7 +807,7 @@ pub const JAVANESE: &'static [(char, char)] = &[('\u{a980}', '꧍'), ('꧐', '꧙'), ('꧞', '꧟')]; pub const KAITHI: &'static [(char, char)] = - &[('\u{11080}', '𑃁'), ('\u{110cd}', '\u{110cd}')]; + &[('\u{11080}', '\u{110c2}'), ('\u{110cd}', '\u{110cd}')]; pub const KANNADA: &'static [(char, char)] = &[ ('ಀ', 'ಌ'), @@ -806,7 +819,7 @@ pub const KANNADA: &'static [(char, char)] = &[ ('\u{cc6}', 'ೈ'), ('ೊ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), @@ -820,7 +833,11 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('㌀', '㍗'), ('ヲ', 'ッ'), ('ア', 'ン'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), ('𛀀', '𛀀'), + ('𛄠', '𛄢'), ('𛅤', '𛅧'), ]; @@ -838,7 +855,7 @@ pub const KHAROSHTHI: &'static [(char, char)] = &[ ]; pub const KHITAN_SMALL_SCRIPT: &'static [(char, char)] = - &[('\u{16fe4}', '\u{16fe4}'), ('\u{18b00}', '\u{18cd5}')]; + &[('\u{16fe4}', '\u{16fe4}'), ('𘬀', '𘳕')]; pub const KHMER: &'static [(char, char)] = &[('ក', '\u{17dd}'), ('០', '៩'), ('៰', '៹'), ('᧠', '᧿')]; @@ -886,15 +903,21 @@ pub const LATIN: &'static [(char, char)] = &[ ('Ⅰ', 'ↈ'), ('Ⱡ', 'Ɀ'), ('Ꜣ', 'ꞇ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꟿ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꟿ'), ('ꬰ', 'ꭚ'), ('ꭜ', 'ꭤ'), - ('ꭦ', '\u{ab69}'), + ('ꭦ', 'ꭩ'), ('ff', 'st'), ('A', 'Z'), ('a', 'z'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), + ('𝼀', '𝼞'), ]; pub const LEPCHA: &'static [(char, char)] = @@ -921,8 +944,7 @@ pub const LINEAR_B: &'static [(char, char)] = &[ ('𐂀', '𐃺'), ]; -pub const LISU: &'static [(char, char)] = - &[('ꓐ', '꓿'), ('\u{11fb0}', '\u{11fb0}')]; +pub const LISU: &'static [(char, char)] = &[('ꓐ', '꓿'), ('𑾰', '𑾰')]; pub const LYCIAN: &'static [(char, char)] = &[('𐊀', '𐊜')]; @@ -978,15 +1000,8 @@ pub const MIAO: &'static [(char, char)] = pub const MODI: &'static [(char, char)] = &[('𑘀', '𑙄'), ('𑙐', '𑙙')]; -pub const MONGOLIAN: &'static [(char, char)] = &[ - ('᠀', '᠁'), - ('᠄', '᠄'), - ('᠆', '\u{180e}'), - ('᠐', '᠙'), - ('ᠠ', 'ᡸ'), - ('ᢀ', 'ᢪ'), - ('𑙠', '𑙬'), -]; +pub const MONGOLIAN: &'static [(char, char)] = + &[('᠀', '᠁'), ('᠄', '᠄'), ('᠆', '᠙'), ('ᠠ', 'ᡸ'), ('ᢀ', 'ᢪ'), ('𑙠', '𑙬')]; pub const MRO: &'static [(char, char)] = &[('𖩀', '𖩞'), ('𖩠', '𖩩'), ('𖩮', '𖩯')]; @@ -1004,7 +1019,7 @@ pub const NANDINAGARI: &'static [(char, char)] = pub const NEW_TAI_LUE: &'static [(char, char)] = &[('ᦀ', 'ᦫ'), ('ᦰ', 'ᧉ'), ('᧐', '᧚'), ('᧞', '᧟')]; -pub const NEWA: &'static [(char, char)] = &[('𑐀', '𑑛'), ('𑑝', '\u{11461}')]; +pub const NEWA: &'static [(char, char)] = &[('𑐀', '𑑛'), ('𑑝', '𑑡')]; pub const NKO: &'static [(char, char)] = &[('߀', 'ߺ'), ('\u{7fd}', '߿')]; @@ -1034,6 +1049,8 @@ pub const OLD_SOUTH_ARABIAN: &'static [(char, char)] = &[('𐩠', '𐩿')]; pub const OLD_TURKIC: &'static [(char, char)] = &[('𐰀', '𐱈')]; +pub const OLD_UYGHUR: &'static [(char, char)] = &[('𐽰', '𐾉')]; + pub const ORIYA: &'static [(char, char)] = &[ ('\u{b01}', 'ଃ'), ('ଅ', 'ଌ'), @@ -1118,7 +1135,7 @@ pub const SYLOTI_NAGRI: &'static [(char, char)] = &[('ꠀ', '\u{a82c}')]; pub const SYRIAC: &'static [(char, char)] = &[('܀', '܍'), ('\u{70f}', '\u{74a}'), ('ݍ', 'ݏ'), ('ࡠ', 'ࡪ')]; -pub const TAGALOG: &'static [(char, char)] = &[('ᜀ', 'ᜌ'), ('ᜎ', '\u{1714}')]; +pub const TAGALOG: &'static [(char, char)] = &[('ᜀ', '᜕'), ('ᜟ', 'ᜟ')]; pub const TAGBANWA: &'static [(char, char)] = &[('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), ('\u{1772}', '\u{1773}')]; @@ -1135,7 +1152,7 @@ pub const TAI_THAM: &'static [(char, char)] = &[ pub const TAI_VIET: &'static [(char, char)] = &[('ꪀ', 'ꫂ'), ('ꫛ', '꫟')]; -pub const TAKRI: &'static [(char, char)] = &[('𑚀', '𑚸'), ('𑛀', '𑛉')]; +pub const TAKRI: &'static [(char, char)] = &[('𑚀', '𑚹'), ('𑛀', '𑛉')]; pub const TAMIL: &'static [(char, char)] = &[ ('\u{b82}', 'ஃ'), @@ -1158,23 +1175,22 @@ pub const TAMIL: &'static [(char, char)] = &[ ('𑿿', '𑿿'), ]; -pub const TANGUT: &'static [(char, char)] = &[ - ('𖿠', '𖿠'), - ('𗀀', '𘟷'), - ('𘠀', '\u{18aff}'), - ('\u{18d00}', '\u{18d08}'), -]; +pub const TANGSA: &'static [(char, char)] = &[('𖩰', '𖪾'), ('𖫀', '𖫉')]; + +pub const TANGUT: &'static [(char, char)] = + &[('𖿠', '𖿠'), ('𗀀', '𘟷'), ('𘠀', '𘫿'), ('𘴀', '𘴈')]; pub const TELUGU: &'static [(char, char)] = &[ ('\u{c00}', 'ఌ'), ('ఎ', 'ఐ'), ('ఒ', 'న'), ('ప', 'హ'), - ('ఽ', 'ౄ'), + ('\u{c3c}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), ('\u{c55}', '\u{c56}'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', '\u{c63}'), ('౦', '౯'), ('౷', '౿'), @@ -1199,19 +1215,29 @@ pub const TIFINAGH: &'static [(char, char)] = pub const TIRHUTA: &'static [(char, char)] = &[('𑒀', '𑓇'), ('𑓐', '𑓙')]; +pub const TOTO: &'static [(char, char)] = &[('𞊐', '\u{1e2ae}')]; + pub const UGARITIC: &'static [(char, char)] = &[('𐎀', '𐎝'), ('𐎟', '𐎟')]; pub const VAI: &'static [(char, char)] = &[('ꔀ', 'ꘫ')]; +pub const VITHKUQI: &'static [(char, char)] = &[ + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), +]; + pub const WANCHO: &'static [(char, char)] = &[('𞋀', '𞋹'), ('𞋿', '𞋿')]; pub const WARANG_CITI: &'static [(char, char)] = &[('𑢠', '𑣲'), ('𑣿', '𑣿')]; -pub const YEZIDI: &'static [(char, char)] = &[ - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eab}', '\u{10ead}'), - ('\u{10eb0}', '\u{10eb1}'), -]; +pub const YEZIDI: &'static [(char, char)] = + &[('𐺀', '𐺩'), ('\u{10eab}', '𐺭'), ('𐺰', '𐺱')]; pub const YI: &'static [(char, char)] = &[('ꀀ', 'ꒌ'), ('꒐', '꓆')]; diff --git a/regex-syntax/src/unicode_tables/script_extension.rs b/regex-syntax/src/unicode_tables/script_extension.rs index 7fca2af9d0..c970e01046 100644 --- a/regex-syntax/src/unicode_tables/script_extension.rs +++ b/regex-syntax/src/unicode_tables/script_extension.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate script-extension ucd-13.0.0 --chars +// ucd-generate script-extension /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Adlam", ADLAM), @@ -35,6 +35,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Coptic", COPTIC), ("Cuneiform", CUNEIFORM), ("Cypriot", CYPRIOT), + ("Cypro_Minoan", CYPRO_MINOAN), ("Cyrillic", CYRILLIC), ("Deseret", DESERET), ("Devanagari", DEVANAGARI), @@ -118,6 +119,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Old_Sogdian", OLD_SOGDIAN), ("Old_South_Arabian", OLD_SOUTH_ARABIAN), ("Old_Turkic", OLD_TURKIC), + ("Old_Uyghur", OLD_UYGHUR), ("Oriya", ORIYA), ("Osage", OSAGE), ("Osmanya", OSMANYA), @@ -149,6 +151,7 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Tai_Viet", TAI_VIET), ("Takri", TAKRI), ("Tamil", TAMIL), + ("Tangsa", TANGSA), ("Tangut", TANGUT), ("Telugu", TELUGU), ("Thaana", THAANA), @@ -156,8 +159,10 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("Tibetan", TIBETAN), ("Tifinagh", TIFINAGH), ("Tirhuta", TIRHUTA), + ("Toto", TOTO), ("Ugaritic", UGARITIC), ("Vai", VAI), + ("Vithkuqi", VITHKUQI), ("Wancho", WANCHO), ("Warang_Citi", WARANG_CITI), ("Yezidi", YEZIDI), @@ -166,28 +171,27 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ]; pub const ADLAM: &'static [(char, char)] = - &[('ـ', 'ـ'), ('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞥞', '𞥟')]; + &[('؟', '؟'), ('ـ', 'ـ'), ('𞤀', '𞥋'), ('𞥐', '𞥙'), ('𞥞', '𞥟')]; pub const AHOM: &'static [(char, char)] = - &[('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑜿')]; + &[('𑜀', '𑜚'), ('\u{1171d}', '\u{1172b}'), ('𑜰', '𑝆')]; pub const ANATOLIAN_HIEROGLYPHS: &'static [(char, char)] = &[('𔐀', '𔙆')]; pub const ARABIC: &'static [(char, char)] = &[ ('\u{600}', '\u{604}'), - ('؆', '\u{61c}'), - ('؞', '\u{6dc}'), + ('؆', '\u{6dc}'), ('۞', 'ۿ'), ('ݐ', 'ݿ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), - ('\u{8d3}', '\u{8e1}'), + ('ࡰ', 'ࢎ'), + ('\u{890}', '\u{891}'), + ('\u{898}', '\u{8e1}'), ('\u{8e3}', '\u{8ff}'), - ('ﭐ', '﯁'), - ('ﯓ', 'ﴽ'), - ('ﵐ', 'ﶏ'), + ('ﭐ', '﯂'), + ('ﯓ', 'ﶏ'), ('ﶒ', 'ﷇ'), - ('ﷰ', '﷽'), + ('﷏', '﷏'), + ('ﷰ', '﷿'), ('ﹰ', 'ﹴ'), ('ﹶ', 'ﻼ'), ('\u{102e0}', '𐋻'), @@ -233,7 +237,7 @@ pub const ARMENIAN: &'static [(char, char)] = pub const AVESTAN: &'static [(char, char)] = &[('𐬀', '𐬵'), ('𐬹', '𐬿')]; -pub const BALINESE: &'static [(char, char)] = &[('\u{1b00}', 'ᭋ'), ('᭐', '᭼')]; +pub const BALINESE: &'static [(char, char)] = &[('\u{1b00}', 'ᭌ'), ('᭐', '᭾')]; pub const BAMUM: &'static [(char, char)] = &[('ꚠ', '꛷'), ('𖠀', '𖨸')]; @@ -284,13 +288,13 @@ pub const BOPOMOFO: &'static [(char, char)] = &[ ('〷', '〷'), ('・', '・'), ('ㄅ', 'ㄯ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('﹅', '﹆'), ('。', '・'), ]; pub const BRAHMI: &'static [(char, char)] = - &[('𑀀', '𑁍'), ('𑁒', '𑁯'), ('\u{1107f}', '\u{1107f}')]; + &[('𑀀', '𑁍'), ('𑁒', '𑁵'), ('\u{1107f}', '\u{1107f}')]; pub const BRAILLE: &'static [(char, char)] = &[('⠀', '⣿')]; @@ -300,7 +304,7 @@ pub const BUGINESE: &'static [(char, char)] = pub const BUHID: &'static [(char, char)] = &[('᜵', '᜶'), ('ᝀ', '\u{1753}')]; pub const CANADIAN_ABORIGINAL: &'static [(char, char)] = - &[('᐀', 'ᙿ'), ('ᢰ', 'ᣵ')]; + &[('᐀', 'ᙿ'), ('ᢰ', 'ᣵ'), ('𑪰', '𑪿')]; pub const CARIAN: &'static [(char, char)] = &[('𐊠', '𐋐')]; @@ -308,7 +312,7 @@ pub const CAUCASIAN_ALBANIAN: &'static [(char, char)] = &[('𐔰', '𐕣'), ('𐕯', '𐕯')]; pub const CHAKMA: &'static [(char, char)] = - &[('০', '৯'), ('၀', '၉'), ('\u{11100}', '\u{11134}'), ('𑄶', '\u{11147}')]; + &[('০', '৯'), ('၀', '၉'), ('\u{11100}', '\u{11134}'), ('𑄶', '𑅇')]; pub const CHAM: &'static [(char, char)] = &[('ꨀ', '\u{aa36}'), ('ꩀ', 'ꩍ'), ('꩐', '꩙'), ('꩜', '꩟')]; @@ -316,10 +320,10 @@ pub const CHAM: &'static [(char, char)] = pub const CHEROKEE: &'static [(char, char)] = &[('Ꭰ', 'Ᏽ'), ('ᏸ', 'ᏽ'), ('ꭰ', 'ꮿ')]; -pub const CHORASMIAN: &'static [(char, char)] = &[('\u{10fb0}', '\u{10fcb}')]; +pub const CHORASMIAN: &'static [(char, char)] = &[('𐾰', '𐿋')]; pub const COMMON: &'static [(char, char)] = &[ - ('\u{0}', '@'), + ('\0', '@'), ('[', '`'), ('{', '©'), ('«', '¹'), @@ -345,7 +349,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('\u{2066}', '⁰'), ('⁴', '⁾'), ('₀', '₎'), - ('₠', '₿'), + ('₠', '⃀'), ('℀', '℥'), ('℧', '℩'), ('ℬ', 'ℱ'), @@ -357,9 +361,9 @@ pub const COMMON: &'static [(char, char)] = &[ ('①', '⟿'), ('⤀', '⭳'), ('⭶', '⮕'), - ('\u{2b97}', '⯿'), + ('⮗', '⯿'), ('⸀', '⹂'), - ('⹄', '\u{2e52}'), + ('⹄', '⹝'), ('⿰', '⿻'), ('\u{3000}', '\u{3000}'), ('〄', '〄'), @@ -377,8 +381,7 @@ pub const COMMON: &'static [(char, char)] = &[ ('꜈', '꜡'), ('ꞈ', '꞊'), ('꭛', '꭛'), - ('\u{ab6a}', '\u{ab6b}'), - ('﴾', '﴿'), + ('꭪', '꭫'), ('︐', '︙'), ('︰', '﹄'), ('﹇', '﹒'), @@ -391,16 +394,16 @@ pub const COMMON: &'static [(char, char)] = &[ ('¢', '₩'), ('│', '○'), ('\u{fff9}', '�'), - ('𐆐', '\u{1019c}'), + ('𐆐', '𐆜'), ('𐇐', '𐇼'), - ('𖿢', '𖿣'), + ('𜽐', '𜿃'), ('𝀀', '𝃵'), ('𝄀', '𝄦'), ('𝄩', '𝅦'), ('𝅪', '\u{1d17a}'), ('𝆃', '𝆄'), ('𝆌', '𝆩'), - ('𝆮', '𝇨'), + ('𝆮', '𝇪'), ('𝋠', '𝋳'), ('𝌀', '𝍖'), ('𝍲', '𝍸'), @@ -433,38 +436,39 @@ pub const COMMON: &'static [(char, char)] = &[ ('🂱', '🂿'), ('🃁', '🃏'), ('🃑', '🃵'), - ('🄀', '\u{1f1ad}'), + ('🄀', '🆭'), ('🇦', '🇿'), ('🈁', '🈂'), ('🈐', '🈻'), ('🉀', '🉈'), ('🉠', '🉥'), - ('🌀', '\u{1f6d7}'), - ('🛠', '🛬'), - ('🛰', '\u{1f6fc}'), + ('🌀', '🛗'), + ('🛝', '🛬'), + ('🛰', '🛼'), ('🜀', '🝳'), ('🞀', '🟘'), ('🟠', '🟫'), + ('🟰', '🟰'), ('🠀', '🠋'), ('🠐', '🡇'), ('🡐', '🡙'), ('🡠', '🢇'), ('🢐', '🢭'), - ('\u{1f8b0}', '\u{1f8b1}'), - ('🤀', '\u{1f978}'), - ('🥺', '\u{1f9cb}'), - ('🧍', '🩓'), + ('🢰', '🢱'), + ('🤀', '🩓'), ('🩠', '🩭'), - ('🩰', '\u{1fa74}'), - ('🩸', '🩺'), - ('🪀', '\u{1fa86}'), - ('🪐', '\u{1faa8}'), - ('\u{1fab0}', '\u{1fab6}'), - ('\u{1fac0}', '\u{1fac2}'), - ('\u{1fad0}', '\u{1fad6}'), - ('\u{1fb00}', '\u{1fb92}'), - ('\u{1fb94}', '\u{1fbca}'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🩰', '🩴'), + ('🩸', '🩼'), + ('🪀', '🪆'), + ('🪐', '🪬'), + ('🪰', '🪺'), + ('🫀', '🫅'), + ('🫐', '🫙'), + ('🫠', '🫧'), + ('🫰', '🫶'), + ('🬀', '🮒'), + ('🮔', '🯊'), + ('🯰', '🯹'), ('\u{e0001}', '\u{e0001}'), ('\u{e0020}', '\u{e007f}'), ]; @@ -487,6 +491,8 @@ pub const CYPRIOT: &'static [(char, char)] = &[ ('𐠿', '𐠿'), ]; +pub const CYPRO_MINOAN: &'static [(char, char)] = &[('𐄀', '𐄁'), ('𒾐', '𒿲')]; + pub const CYRILLIC: &'static [(char, char)] = &[ ('Ѐ', 'ԯ'), ('ᲀ', 'ᲈ'), @@ -512,14 +518,14 @@ pub const DEVANAGARI: &'static [(char, char)] = &[ ]; pub const DIVES_AKURU: &'static [(char, char)] = &[ - ('\u{11900}', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), - ('\u{1193b}', '\u{11946}'), - ('\u{11950}', '\u{11959}'), + ('𑤀', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤵'), + ('𑤷', '𑤸'), + ('\u{1193b}', '𑥆'), + ('𑥐', '𑥙'), ]; pub const DOGRA: &'static [(char, char)] = @@ -568,6 +574,10 @@ pub const ETHIOPIC: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ]; pub const GEORGIAN: &'static [(char, char)] = &[ @@ -585,8 +595,7 @@ pub const GEORGIAN: &'static [(char, char)] = &[ pub const GLAGOLITIC: &'static [(char, char)] = &[ ('\u{484}', '\u{484}'), ('\u{487}', '\u{487}'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), + ('Ⰰ', 'ⱟ'), ('⹃', '⹃'), ('\u{a66f}', '\u{a66f}'), ('\u{1e000}', '\u{1e006}'), @@ -739,23 +748,24 @@ pub const HAN: &'static [(char, char)] = &[ ('㍘', '㍰'), ('㍻', '㍿'), ('㏠', '㏾'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), + ('㐀', '䶿'), + ('一', '鿿'), ('꜀', '꜇'), ('豈', '舘'), ('並', '龎'), ('﹅', '﹆'), ('。', '・'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿢', '𖿣'), + ('𖿰', '𖿱'), ('𝍠', '𝍱'), ('🉐', '🉑'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const HANGUL: &'static [(char, char)] = &[ @@ -823,7 +833,7 @@ pub const HIRAGANA: &'static [(char, char)] = &[ ('。', '・'), ('ー', 'ー'), ('\u{ff9e}', '\u{ff9f}'), - ('𛀁', '𛄞'), + ('𛀁', '𛄟'), ('𛅐', '𛅒'), ('🈀', '🈀'), ]; @@ -836,7 +846,7 @@ pub const INHERITED: &'static [(char, char)] = &[ ('\u{343}', '\u{344}'), ('\u{346}', '\u{362}'), ('\u{953}', '\u{954}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1dc2}', '\u{1df7}'), ('\u{1df9}', '\u{1df9}'), ('\u{1dfb}', '\u{1dff}'), @@ -845,6 +855,8 @@ pub const INHERITED: &'static [(char, char)] = &[ ('\u{fe00}', '\u{fe0f}'), ('\u{fe20}', '\u{fe2d}'), ('\u{101fd}', '\u{101fd}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d167}', '\u{1d169}'), ('\u{1d17b}', '\u{1d182}'), ('\u{1d185}', '\u{1d18b}'), @@ -861,8 +873,12 @@ pub const INSCRIPTIONAL_PARTHIAN: &'static [(char, char)] = pub const JAVANESE: &'static [(char, char)] = &[('\u{a980}', '꧍'), ('ꧏ', '꧙'), ('꧞', '꧟')]; -pub const KAITHI: &'static [(char, char)] = - &[('०', '९'), ('꠰', '꠹'), ('\u{11080}', '𑃁'), ('\u{110cd}', '\u{110cd}')]; +pub const KAITHI: &'static [(char, char)] = &[ + ('०', '९'), + ('꠰', '꠹'), + ('\u{11080}', '\u{110c2}'), + ('\u{110cd}', '\u{110cd}'), +]; pub const KANNADA: &'static [(char, char)] = &[ ('\u{951}', '\u{952}'), @@ -876,7 +892,7 @@ pub const KANNADA: &'static [(char, char)] = &[ ('\u{cc6}', 'ೈ'), ('ೊ', '\u{ccd}'), ('\u{cd5}', '\u{cd6}'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', '\u{ce3}'), ('೦', '೯'), ('ೱ', 'ೲ'), @@ -902,7 +918,11 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('㌀', '㍗'), ('﹅', '﹆'), ('。', '\u{ff9f}'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), ('𛀀', '𛀀'), + ('𛄠', '𛄢'), ('𛅤', '𛅧'), ]; @@ -920,7 +940,7 @@ pub const KHAROSHTHI: &'static [(char, char)] = &[ ]; pub const KHITAN_SMALL_SCRIPT: &'static [(char, char)] = - &[('\u{16fe4}', '\u{16fe4}'), ('\u{18b00}', '\u{18cd5}')]; + &[('\u{16fe4}', '\u{16fe4}'), ('𘬀', '𘳕')]; pub const KHMER: &'static [(char, char)] = &[('ក', '\u{17dd}'), ('០', '៩'), ('៰', '៹'), ('᧠', '᧿')]; @@ -976,16 +996,22 @@ pub const LATIN: &'static [(char, char)] = &[ ('Ⱡ', 'Ɀ'), ('꜀', '꜇'), ('Ꜣ', 'ꞇ'), - ('Ꞌ', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꟿ'), + ('Ꞌ', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꟿ'), ('꤮', '꤮'), ('ꬰ', 'ꭚ'), ('ꭜ', 'ꭤ'), - ('ꭦ', '\u{ab69}'), + ('ꭦ', 'ꭩ'), ('ff', 'st'), ('A', 'Z'), ('a', 'z'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), + ('𝼀', '𝼞'), ]; pub const LEPCHA: &'static [(char, char)] = @@ -1016,8 +1042,7 @@ pub const LINEAR_B: &'static [(char, char)] = &[ ('𐄷', '𐄿'), ]; -pub const LISU: &'static [(char, char)] = - &[('ꓐ', '꓿'), ('\u{11fb0}', '\u{11fb0}')]; +pub const LISU: &'static [(char, char)] = &[('ꓐ', '꓿'), ('𑾰', '𑾰')]; pub const LYCIAN: &'static [(char, char)] = &[('𐊀', '𐊜')]; @@ -1082,8 +1107,7 @@ pub const MODI: &'static [(char, char)] = &[('꠰', '꠹'), ('𑘀', '𑙄'), ('𑙐', '𑙙')]; pub const MONGOLIAN: &'static [(char, char)] = &[ - ('᠀', '\u{180e}'), - ('᠐', '᠙'), + ('᠀', '᠙'), ('ᠠ', 'ᡸ'), ('ᢀ', 'ᢪ'), ('\u{202f}', '\u{202f}'), @@ -1115,9 +1139,16 @@ pub const NANDINAGARI: &'static [(char, char)] = &[ pub const NEW_TAI_LUE: &'static [(char, char)] = &[('ᦀ', 'ᦫ'), ('ᦰ', 'ᧉ'), ('᧐', '᧚'), ('᧞', '᧟')]; -pub const NEWA: &'static [(char, char)] = &[('𑐀', '𑑛'), ('𑑝', '\u{11461}')]; +pub const NEWA: &'static [(char, char)] = &[('𑐀', '𑑛'), ('𑑝', '𑑡')]; -pub const NKO: &'static [(char, char)] = &[('߀', 'ߺ'), ('\u{7fd}', '߿')]; +pub const NKO: &'static [(char, char)] = &[ + ('،', '،'), + ('؛', '؛'), + ('؟', '؟'), + ('߀', 'ߺ'), + ('\u{7fd}', '߿'), + ('﴾', '﴿'), +]; pub const NUSHU: &'static [(char, char)] = &[('𖿡', '𖿡'), ('𛅰', '𛋻')]; @@ -1146,6 +1177,9 @@ pub const OLD_SOUTH_ARABIAN: &'static [(char, char)] = &[('𐩠', '𐩿')]; pub const OLD_TURKIC: &'static [(char, char)] = &[('𐰀', '𐱈')]; +pub const OLD_UYGHUR: &'static [(char, char)] = + &[('ـ', 'ـ'), ('𐫲', '𐫲'), ('𐽰', '𐾉')]; + pub const ORIYA: &'static [(char, char)] = &[ ('\u{951}', '\u{952}'), ('।', '॥'), @@ -1253,10 +1287,11 @@ pub const SYRIAC: &'static [(char, char)] = &[ ('ݍ', 'ݏ'), ('ࡠ', 'ࡪ'), ('\u{1df8}', '\u{1df8}'), + ('\u{1dfa}', '\u{1dfa}'), ]; pub const TAGALOG: &'static [(char, char)] = - &[('ᜀ', 'ᜌ'), ('ᜎ', '\u{1714}'), ('᜵', '᜶')]; + &[('ᜀ', '᜕'), ('ᜟ', 'ᜟ'), ('᜵', '᜶')]; pub const TAGBANWA: &'static [(char, char)] = &[('᜵', '᜶'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), ('\u{1772}', '\u{1773}')]; @@ -1275,7 +1310,7 @@ pub const TAI_THAM: &'static [(char, char)] = &[ pub const TAI_VIET: &'static [(char, char)] = &[('ꪀ', 'ꫂ'), ('ꫛ', '꫟')]; pub const TAKRI: &'static [(char, char)] = - &[('।', '॥'), ('꠰', '꠹'), ('𑚀', '𑚸'), ('𑛀', '𑛉')]; + &[('।', '॥'), ('꠰', '꠹'), ('𑚀', '𑚹'), ('𑛀', '𑛉')]; pub const TAMIL: &'static [(char, char)] = &[ ('\u{951}', '\u{952}'), @@ -1305,12 +1340,10 @@ pub const TAMIL: &'static [(char, char)] = &[ ('𑿿', '𑿿'), ]; -pub const TANGUT: &'static [(char, char)] = &[ - ('𖿠', '𖿠'), - ('𗀀', '𘟷'), - ('𘠀', '\u{18aff}'), - ('\u{18d00}', '\u{18d08}'), -]; +pub const TANGSA: &'static [(char, char)] = &[('𖩰', '𖪾'), ('𖫀', '𖫉')]; + +pub const TANGUT: &'static [(char, char)] = + &[('𖿠', '𖿠'), ('𗀀', '𘟷'), ('𘠀', '𘫿'), ('𘴀', '𘴈')]; pub const TELUGU: &'static [(char, char)] = &[ ('\u{951}', '\u{952}'), @@ -1319,11 +1352,12 @@ pub const TELUGU: &'static [(char, char)] = &[ ('ఎ', 'ఐ'), ('ఒ', 'న'), ('ప', 'హ'), - ('ఽ', 'ౄ'), + ('\u{c3c}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), ('\u{c55}', '\u{c56}'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', '\u{c63}'), ('౦', '౯'), ('౷', '౿'), @@ -1365,10 +1399,23 @@ pub const TIRHUTA: &'static [(char, char)] = &[ ('𑓐', '𑓙'), ]; +pub const TOTO: &'static [(char, char)] = &[('𞊐', '\u{1e2ae}')]; + pub const UGARITIC: &'static [(char, char)] = &[('𐎀', '𐎝'), ('𐎟', '𐎟')]; pub const VAI: &'static [(char, char)] = &[('ꔀ', 'ꘫ')]; +pub const VITHKUQI: &'static [(char, char)] = &[ + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), +]; + pub const WANCHO: &'static [(char, char)] = &[('𞋀', '𞋹'), ('𞋿', '𞋿')]; pub const WARANG_CITI: &'static [(char, char)] = &[('𑢠', '𑣲'), ('𑣿', '𑣿')]; @@ -1378,9 +1425,9 @@ pub const YEZIDI: &'static [(char, char)] = &[ ('؛', '؛'), ('؟', '؟'), ('٠', '٩'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eab}', '\u{10ead}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('\u{10eab}', '𐺭'), + ('𐺰', '𐺱'), ]; pub const YI: &'static [(char, char)] = &[ diff --git a/regex-syntax/src/unicode_tables/sentence_break.rs b/regex-syntax/src/unicode_tables/sentence_break.rs index 67d830f74b..db8ad282bb 100644 --- a/regex-syntax/src/unicode_tables/sentence_break.rs +++ b/regex-syntax/src/unicode_tables/sentence_break.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate sentence-break ucd-13.0.0 --chars +// ucd-generate sentence-break /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ATerm", ATERM), @@ -29,7 +29,7 @@ pub const ATERM: &'static [(char, char)] = pub const CR: &'static [(char, char)] = &[('\r', '\r')]; pub const CLOSE: &'static [(char, char)] = &[ - ('\"', '\"'), + ('"', '"'), ('\'', ')'), ('[', '['), (']', ']'), @@ -57,6 +57,7 @@ pub const CLOSE: &'static [(char, char)] = &[ ('⸜', '⸝'), ('⸠', '⸩'), ('⹂', '⹂'), + ('⹕', '⹜'), ('〈', '】'), ('〔', '〛'), ('〝', '〟'), @@ -100,7 +101,8 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{825}', '\u{827}'), ('\u{829}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{8e1}'), + ('\u{898}', '\u{89f}'), + ('\u{8ca}', '\u{8e1}'), ('\u{8e3}', 'ः'), ('\u{93a}', '\u{93c}'), ('ा', 'ॏ'), @@ -142,6 +144,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ொ', '\u{bcd}'), ('\u{bd7}', '\u{bd7}'), ('\u{c00}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -193,13 +196,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ႏ', 'ႏ'), ('ႚ', '\u{109d}'), ('\u{135d}', '\u{135f}'), - ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1712}', '᜕'), + ('\u{1732}', '᜴'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), ('\u{1920}', 'ᤫ'), @@ -208,7 +212,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('\u{1a60}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1b00}', 'ᬄ'), ('\u{1b34}', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -221,8 +225,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('᳷', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{200c}', '\u{200d}'), ('\u{20d0}', '\u{20f0}'), ('\u{2cef}', '\u{2cf1}'), @@ -277,10 +280,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '𑂂'), ('𑂰', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{11134}'), ('𑅅', '𑅆'), @@ -288,7 +295,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11180}', '𑆂'), ('𑆳', '𑇀'), ('\u{111c9}', '\u{111cc}'), - ('\u{111ce}', '\u{111cf}'), + ('𑇎', '\u{111cf}'), ('𑈬', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), ('\u{112df}', '\u{112ea}'), @@ -311,11 +318,11 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b7}'), ('\u{1171d}', '\u{1172b}'), ('𑠬', '\u{1183a}'), - ('\u{11930}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('\u{11930}', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{1193e}'), - ('\u{11940}', '\u{11940}'), - ('\u{11942}', '\u{11943}'), + ('𑥀', '𑥀'), + ('𑥂', '\u{11943}'), ('𑧑', '\u{119d7}'), ('\u{119da}', '\u{119e0}'), ('𑧤', '𑧤'), @@ -344,8 +351,10 @@ pub const EXTEND: &'static [(char, char)] = &[ ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), ('\u{16fe4}', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -364,6 +373,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), @@ -377,6 +387,7 @@ pub const FORMAT: &'static [(char, char)] = &[ ('\u{61c}', '\u{61c}'), ('\u{6dd}', '\u{6dd}'), ('\u{70f}', '\u{70f}'), + ('\u{890}', '\u{891}'), ('\u{8e2}', '\u{8e2}'), ('\u{180e}', '\u{180e}'), ('\u{200b}', '\u{200b}'), @@ -833,7 +844,7 @@ pub const LOWER: &'static [(char, char)] = &[ ('ⅰ', 'ⅿ'), ('ↄ', 'ↄ'), ('ⓐ', 'ⓩ'), - ('ⰰ', 'ⱞ'), + ('ⰰ', 'ⱟ'), ('ⱡ', 'ⱡ'), ('ⱥ', 'ⱦ'), ('ⱨ', 'ⱨ'), @@ -1001,19 +1012,33 @@ pub const LOWER: &'static [(char, char)] = &[ ('ꞻ', 'ꞻ'), ('ꞽ', 'ꞽ'), ('ꞿ', 'ꞿ'), + ('ꟁ', 'ꟁ'), ('ꟃ', 'ꟃ'), - ('\u{a7c8}', '\u{a7c8}'), - ('\u{a7ca}', '\u{a7ca}'), - ('\u{a7f6}', '\u{a7f6}'), + ('ꟈ', 'ꟈ'), + ('ꟊ', 'ꟊ'), + ('ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟕ'), + ('ꟗ', 'ꟗ'), + ('ꟙ', 'ꟙ'), + ('ꟶ', 'ꟶ'), ('ꟸ', 'ꟺ'), ('ꬰ', 'ꭚ'), - ('ꭜ', '\u{ab68}'), + ('ꭜ', 'ꭨ'), ('ꭰ', 'ꮿ'), ('ff', 'st'), ('ﬓ', 'ﬗ'), ('a', 'z'), ('𐐨', '𐑏'), ('𐓘', '𐓻'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), + ('𐞀', '𐞀'), + ('𐞃', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐳀', '𐳲'), ('𑣀', '𑣟'), ('𖹠', '𖹿'), @@ -1045,6 +1070,8 @@ pub const LOWER: &'static [(char, char)] = &[ ('𝞪', '𝟂'), ('𝟄', '𝟉'), ('𝟋', '𝟋'), + ('𝼀', '𝼉'), + ('𝼋', '𝼞'), ('𞤢', '𞥃'), ]; @@ -1100,17 +1127,18 @@ pub const NUMERIC: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), + ('𖫀', '𖫉'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), ('𞅀', '𞅉'), ('𞋰', '𞋹'), ('𞥐', '𞥙'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🯰', '🯹'), ]; pub const OLETTER: &'static [(char, char)] = &[ @@ -1146,8 +1174,9 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ࠨ', 'ࠨ'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -1212,6 +1241,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ప', 'హ'), ('ఽ', 'ఽ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('ಀ', 'ಀ'), ('ಅ', 'ಌ'), @@ -1220,10 +1250,10 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ಪ', 'ಳ'), ('ವ', 'ಹ'), ('ಽ', 'ಽ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('\u{d04}', 'ഌ'), + ('ഄ', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -1286,9 +1316,8 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), + ('ᜀ', 'ᜑ'), + ('ᜟ', 'ᜱ'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -1309,7 +1338,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ᨠ', 'ᩔ'), ('ᪧ', 'ᪧ'), ('ᬅ', 'ᬳ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('ᮃ', 'ᮠ'), ('ᮮ', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -1347,11 +1376,10 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ー', 'ヿ'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ㇰ', 'ㇿ'), - ('㐀', '\u{4dbf}'), - ('一', '\u{9ffc}'), - ('ꀀ', 'ꒌ'), + ('㐀', '䶿'), + ('一', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), ('ꘐ', 'ꘟ'), @@ -1362,6 +1390,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ꜗ', 'ꜟ'), ('ꞈ', 'ꞈ'), ('ꞏ', 'ꞏ'), + ('ꟲ', 'ꟴ'), ('ꟷ', 'ꟷ'), ('ꟻ', 'ꠁ'), ('ꠃ', 'ꠅ'), @@ -1399,7 +1428,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), - ('\u{ab69}', '\u{ab69}'), + ('ꭩ', 'ꭩ'), ('ꯀ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -1449,6 +1478,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞁', '𐞂'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -1477,19 +1507,22 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𐮀', '𐮑'), ('𐰀', '𐱈'), ('𐴀', '𐴣'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀃', '𑀷'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), - ('\u{11147}', '\u{11147}'), + ('𑅇', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -1515,7 +1548,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -1526,14 +1559,15 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑚀', '𑚪'), ('𑚸', '𑚸'), ('𑜀', '𑜚'), + ('𑝀', '𑝆'), ('𑠀', '𑠫'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑦠', '𑦧'), ('𑦪', '𑧐'), ('𑧡', '𑧡'), @@ -1544,7 +1578,7 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑩐', '𑩐'), ('𑩜', '𑪉'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰮'), ('𑱀', '𑱀'), @@ -1558,14 +1592,16 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭀', '𖭃'), @@ -1577,9 +1613,12 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𖿠', '𖿡'), ('𖿣', '𖿣'), ('𗀀', '𘟷'), - ('𘠀', '\u{18cd5}'), - ('\u{18d00}', '\u{18d08}'), - ('𛀀', '𛄞'), + ('𘠀', '𘳕'), + ('𘴀', '𘴈'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), + ('𛀀', '𛄢'), ('𛅐', '𛅒'), ('𛅤', '𛅧'), ('𛅰', '𛋻'), @@ -1587,10 +1626,16 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𛱰', '𛱼'), ('𛲀', '𛲈'), ('𛲐', '𛲙'), + ('𝼊', '𝼊'), ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞥋', '𞥋'), ('𞸀', '𞸃'), @@ -1626,13 +1671,13 @@ pub const OLETTER: &'static [(char, char)] = &[ ('𞺡', '𞺣'), ('𞺥', '𞺩'), ('𞺫', '𞺻'), - ('𠀀', '\u{2a6dd}'), - ('𪜀', '𫜴'), + ('𠀀', '𪛟'), + ('𪜀', '𫜸'), ('𫝀', '𫠝'), ('𫠠', '𬺡'), ('𬺰', '𮯠'), ('丽', '𪘀'), - ('\u{30000}', '\u{3134a}'), + ('𰀀', '𱍊'), ]; pub const SCONTINUE: &'static [(char, char)] = &[ @@ -1661,7 +1706,7 @@ pub const STERM: &'static [(char, char)] = &[ ('!', '!'), ('?', '?'), ('։', '։'), - ('؞', '؟'), + ('؝', '؟'), ('۔', '۔'), ('܀', '܂'), ('߹', '߹'), @@ -1680,12 +1725,14 @@ pub const STERM: &'static [(char, char)] = &[ ('᪨', '᪫'), ('᭚', '᭛'), ('᭞', '᭟'), + ('᭽', '᭾'), ('᰻', '᰼'), ('᱾', '᱿'), ('‼', '‽'), ('⁇', '⁉'), ('⸮', '⸮'), ('⸼', '⸼'), + ('⹓', '⹔'), ('。', '。'), ('꓿', '꓿'), ('꘎', '꘏'), @@ -1704,6 +1751,7 @@ pub const STERM: &'static [(char, char)] = &[ ('。', '。'), ('𐩖', '𐩗'), ('𐽕', '𐽙'), + ('𐾆', '𐾉'), ('𑁇', '𑁈'), ('𑂾', '𑃁'), ('𑅁', '𑅃'), @@ -1718,8 +1766,8 @@ pub const STERM: &'static [(char, char)] = &[ ('𑗉', '𑗗'), ('𑙁', '𑙂'), ('𑜼', '𑜾'), - ('\u{11944}', '\u{11944}'), - ('\u{11946}', '\u{11946}'), + ('𑥄', '𑥄'), + ('𑥆', '𑥆'), ('𑩂', '𑩃'), ('𑪛', '𑪜'), ('𑱁', '𑱂'), @@ -2183,7 +2231,7 @@ pub const UPPER: &'static [(char, char)] = &[ ('Ⅰ', 'Ⅿ'), ('Ↄ', 'Ↄ'), ('Ⓐ', 'Ⓩ'), - ('Ⰰ', 'Ⱞ'), + ('Ⰰ', 'Ⱟ'), ('Ⱡ', 'Ⱡ'), ('Ɫ', 'Ɽ'), ('Ⱨ', 'Ⱨ'), @@ -2348,13 +2396,21 @@ pub const UPPER: &'static [(char, char)] = &[ ('Ꞻ', 'Ꞻ'), ('Ꞽ', 'Ꞽ'), ('Ꞿ', 'Ꞿ'), + ('Ꟁ', 'Ꟁ'), ('Ꟃ', 'Ꟃ'), - ('Ꞔ', '\u{a7c7}'), - ('\u{a7c9}', '\u{a7c9}'), - ('\u{a7f5}', '\u{a7f5}'), + ('Ꞔ', 'Ꟈ'), + ('Ꟊ', 'Ꟊ'), + ('Ꟑ', 'Ꟑ'), + ('Ꟗ', 'Ꟗ'), + ('Ꟙ', 'Ꟙ'), + ('Ꟶ', 'Ꟶ'), ('A', 'Z'), ('𐐀', '𐐧'), ('𐒰', '𐓓'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), ('𐲀', '𐲲'), ('𑢠', '𑢿'), ('𖹀', '𖹟'), diff --git a/regex-syntax/src/unicode_tables/word_break.rs b/regex-syntax/src/unicode_tables/word_break.rs index bd23e00a87..19b2a1c64e 100644 --- a/regex-syntax/src/unicode_tables/word_break.rs +++ b/regex-syntax/src/unicode_tables/word_break.rs @@ -1,10 +1,10 @@ // DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY: // -// ucd-generate word-break ucd-13.0.0 --chars +// ucd-generate word-break /tmp/ucd --chars // -// Unicode version: 13.0.0. +// Unicode version: 14.0.0. // -// ucd-generate 0.2.8 is available on crates.io. +// ucd-generate 0.2.11 is available on crates.io. pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[ ("ALetter", ALETTER), @@ -75,8 +75,9 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ࠨ', 'ࠨ'), ('ࡀ', 'ࡘ'), ('ࡠ', 'ࡪ'), - ('ࢠ', 'ࢴ'), - ('ࢶ', '\u{8c7}'), + ('ࡰ', 'ࢇ'), + ('ࢉ', 'ࢎ'), + ('ࢠ', 'ࣉ'), ('ऄ', 'ह'), ('ऽ', 'ऽ'), ('ॐ', 'ॐ'), @@ -141,6 +142,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ప', 'హ'), ('ఽ', 'ఽ'), ('ౘ', 'ౚ'), + ('ౝ', 'ౝ'), ('ౠ', 'ౡ'), ('ಀ', 'ಀ'), ('ಅ', 'ಌ'), @@ -149,10 +151,10 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ಪ', 'ಳ'), ('ವ', 'ಹ'), ('ಽ', 'ಽ'), - ('ೞ', 'ೞ'), + ('ೝ', 'ೞ'), ('ೠ', 'ೡ'), ('ೱ', 'ೲ'), - ('\u{d04}', 'ഌ'), + ('ഄ', 'ഌ'), ('എ', 'ഐ'), ('ഒ', 'ഺ'), ('ഽ', 'ഽ'), @@ -197,9 +199,8 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ᚁ', 'ᚚ'), ('ᚠ', 'ᛪ'), ('ᛮ', 'ᛸ'), - ('ᜀ', 'ᜌ'), - ('ᜎ', 'ᜑ'), - ('ᜠ', 'ᜱ'), + ('ᜀ', 'ᜑ'), + ('ᜟ', 'ᜱ'), ('ᝀ', 'ᝑ'), ('ᝠ', 'ᝬ'), ('ᝮ', 'ᝰ'), @@ -211,7 +212,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ᤀ', 'ᤞ'), ('ᨀ', 'ᨖ'), ('ᬅ', 'ᬳ'), - ('ᭅ', 'ᭋ'), + ('ᭅ', 'ᭌ'), ('ᮃ', 'ᮠ'), ('ᮮ', 'ᮯ'), ('ᮺ', 'ᯥ'), @@ -263,9 +264,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ⅎ', 'ⅎ'), ('Ⅰ', 'ↈ'), ('Ⓐ', 'ⓩ'), - ('Ⰰ', 'Ⱞ'), - ('ⰰ', 'ⱞ'), - ('Ⱡ', 'ⳤ'), + ('Ⰰ', 'ⳤ'), ('Ⳬ', 'ⳮ'), ('Ⳳ', 'ⳳ'), ('ⴀ', 'ⴥ'), @@ -287,7 +286,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('〻', '〼'), ('ㄅ', 'ㄯ'), ('ㄱ', 'ㆎ'), - ('ㆠ', '\u{31bf}'), + ('ㆠ', 'ㆿ'), ('ꀀ', 'ꒌ'), ('ꓐ', 'ꓽ'), ('ꔀ', 'ꘌ'), @@ -296,9 +295,11 @@ pub const ALETTER: &'static [(char, char)] = &[ ('Ꙁ', 'ꙮ'), ('ꙿ', 'ꚝ'), ('ꚠ', 'ꛯ'), - ('꜈', 'ꞿ'), - ('Ꟃ', '\u{a7ca}'), - ('\u{a7f5}', 'ꠁ'), + ('꜈', 'ꟊ'), + ('Ꟑ', 'ꟑ'), + ('ꟓ', 'ꟓ'), + ('ꟕ', 'ꟙ'), + ('ꟲ', 'ꠁ'), ('ꠃ', 'ꠅ'), ('ꠇ', 'ꠊ'), ('ꠌ', 'ꠢ'), @@ -322,7 +323,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('ꬑ', 'ꬖ'), ('ꬠ', 'ꬦ'), ('ꬨ', 'ꬮ'), - ('ꬰ', '\u{ab69}'), + ('ꬰ', 'ꭩ'), ('ꭰ', 'ꯢ'), ('가', '힣'), ('ힰ', 'ퟆ'), @@ -365,9 +366,20 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𐓘', '𐓻'), ('𐔀', '𐔧'), ('𐔰', '𐕣'), + ('𐕰', '𐕺'), + ('𐕼', '𐖊'), + ('𐖌', '𐖒'), + ('𐖔', '𐖕'), + ('𐖗', '𐖡'), + ('𐖣', '𐖱'), + ('𐖳', '𐖹'), + ('𐖻', '𐖼'), ('𐘀', '𐜶'), ('𐝀', '𐝕'), ('𐝠', '𐝧'), + ('𐞀', '𐞅'), + ('𐞇', '𐞰'), + ('𐞲', '𐞺'), ('𐠀', '𐠅'), ('𐠈', '𐠈'), ('𐠊', '𐠵'), @@ -398,19 +410,22 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𐲀', '𐲲'), ('𐳀', '𐳲'), ('𐴀', '𐴣'), - ('\u{10e80}', '\u{10ea9}'), - ('\u{10eb0}', '\u{10eb1}'), + ('𐺀', '𐺩'), + ('𐺰', '𐺱'), ('𐼀', '𐼜'), ('𐼧', '𐼧'), ('𐼰', '𐽅'), - ('\u{10fb0}', '\u{10fc4}'), + ('𐽰', '𐾁'), + ('𐾰', '𐿄'), ('𐿠', '𐿶'), ('𑀃', '𑀷'), + ('𑁱', '𑁲'), + ('𑁵', '𑁵'), ('𑂃', '𑂯'), ('𑃐', '𑃨'), ('𑄃', '𑄦'), ('𑅄', '𑅄'), - ('\u{11147}', '\u{11147}'), + ('𑅇', '𑅇'), ('𑅐', '𑅲'), ('𑅶', '𑅶'), ('𑆃', '𑆲'), @@ -436,7 +451,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𑍝', '𑍡'), ('𑐀', '𑐴'), ('𑑇', '𑑊'), - ('𑑟', '\u{11461}'), + ('𑑟', '𑑡'), ('𑒀', '𑒯'), ('𑓄', '𑓅'), ('𑓇', '𑓇'), @@ -448,13 +463,13 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𑚸', '𑚸'), ('𑠀', '𑠫'), ('𑢠', '𑣟'), - ('𑣿', '\u{11906}'), - ('\u{11909}', '\u{11909}'), - ('\u{1190c}', '\u{11913}'), - ('\u{11915}', '\u{11916}'), - ('\u{11918}', '\u{1192f}'), - ('\u{1193f}', '\u{1193f}'), - ('\u{11941}', '\u{11941}'), + ('𑣿', '𑤆'), + ('𑤉', '𑤉'), + ('𑤌', '𑤓'), + ('𑤕', '𑤖'), + ('𑤘', '𑤯'), + ('𑤿', '𑤿'), + ('𑥁', '𑥁'), ('𑦠', '𑦧'), ('𑦪', '𑧐'), ('𑧡', '𑧡'), @@ -465,7 +480,7 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𑩐', '𑩐'), ('𑩜', '𑪉'), ('𑪝', '𑪝'), - ('𑫀', '𑫸'), + ('𑪰', '𑫸'), ('𑰀', '𑰈'), ('𑰊', '𑰮'), ('𑱀', '𑱀'), @@ -479,14 +494,16 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𑵪', '𑶉'), ('𑶘', '𑶘'), ('𑻠', '𑻲'), - ('\u{11fb0}', '\u{11fb0}'), + ('𑾰', '𑾰'), ('𒀀', '𒎙'), ('𒐀', '𒑮'), ('𒒀', '𒕃'), + ('𒾐', '𒿰'), ('𓀀', '𓐮'), ('𔐀', '𔙆'), ('𖠀', '𖨸'), ('𖩀', '𖩞'), + ('𖩰', '𖪾'), ('𖫐', '𖫭'), ('𖬀', '𖬯'), ('𖭀', '𖭃'), @@ -532,10 +549,16 @@ pub const ALETTER: &'static [(char, char)] = &[ ('𝞊', '𝞨'), ('𝞪', '𝟂'), ('𝟄', '𝟋'), + ('𝼀', '𝼞'), ('𞄀', '𞄬'), ('𞄷', '𞄽'), ('𞅎', '𞅎'), + ('𞊐', '𞊭'), ('𞋀', '𞋫'), + ('𞟠', '𞟦'), + ('𞟨', '𞟫'), + ('𞟭', '𞟮'), + ('𞟰', '𞟾'), ('𞠀', '𞣄'), ('𞤀', '𞥃'), ('𞥋', '𞥋'), @@ -579,7 +602,7 @@ pub const ALETTER: &'static [(char, char)] = &[ pub const CR: &'static [(char, char)] = &[('\r', '\r')]; -pub const DOUBLE_QUOTE: &'static [(char, char)] = &[('\"', '\"')]; +pub const DOUBLE_QUOTE: &'static [(char, char)] = &[('"', '"')]; pub const EXTEND: &'static [(char, char)] = &[ ('\u{300}', '\u{36f}'), @@ -606,7 +629,8 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{825}', '\u{827}'), ('\u{829}', '\u{82d}'), ('\u{859}', '\u{85b}'), - ('\u{8d3}', '\u{8e1}'), + ('\u{898}', '\u{89f}'), + ('\u{8ca}', '\u{8e1}'), ('\u{8e3}', 'ः'), ('\u{93a}', '\u{93c}'), ('ा', 'ॏ'), @@ -648,6 +672,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ொ', '\u{bcd}'), ('\u{bd7}', '\u{bd7}'), ('\u{c00}', '\u{c04}'), + ('\u{c3c}', '\u{c3c}'), ('\u{c3e}', 'ౄ'), ('\u{c46}', '\u{c48}'), ('\u{c4a}', '\u{c4d}'), @@ -699,13 +724,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ႏ', 'ႏ'), ('ႚ', '\u{109d}'), ('\u{135d}', '\u{135f}'), - ('\u{1712}', '\u{1714}'), - ('\u{1732}', '\u{1734}'), + ('\u{1712}', '᜕'), + ('\u{1732}', '᜴'), ('\u{1752}', '\u{1753}'), ('\u{1772}', '\u{1773}'), ('\u{17b4}', '\u{17d3}'), ('\u{17dd}', '\u{17dd}'), ('\u{180b}', '\u{180d}'), + ('\u{180f}', '\u{180f}'), ('\u{1885}', '\u{1886}'), ('\u{18a9}', '\u{18a9}'), ('\u{1920}', 'ᤫ'), @@ -714,7 +740,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('ᩕ', '\u{1a5e}'), ('\u{1a60}', '\u{1a7c}'), ('\u{1a7f}', '\u{1a7f}'), - ('\u{1ab0}', '\u{1ac0}'), + ('\u{1ab0}', '\u{1ace}'), ('\u{1b00}', 'ᬄ'), ('\u{1b34}', '᭄'), ('\u{1b6b}', '\u{1b73}'), @@ -727,8 +753,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1ced}', '\u{1ced}'), ('\u{1cf4}', '\u{1cf4}'), ('᳷', '\u{1cf9}'), - ('\u{1dc0}', '\u{1df9}'), - ('\u{1dfb}', '\u{1dff}'), + ('\u{1dc0}', '\u{1dff}'), ('\u{200c}', '\u{200c}'), ('\u{20d0}', '\u{20f0}'), ('\u{2cef}', '\u{2cf1}'), @@ -783,10 +808,14 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{10d24}', '\u{10d27}'), ('\u{10eab}', '\u{10eac}'), ('\u{10f46}', '\u{10f50}'), + ('\u{10f82}', '\u{10f85}'), ('𑀀', '𑀂'), ('\u{11038}', '\u{11046}'), + ('\u{11070}', '\u{11070}'), + ('\u{11073}', '\u{11074}'), ('\u{1107f}', '𑂂'), ('𑂰', '\u{110ba}'), + ('\u{110c2}', '\u{110c2}'), ('\u{11100}', '\u{11102}'), ('\u{11127}', '\u{11134}'), ('𑅅', '𑅆'), @@ -794,7 +823,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{11180}', '𑆂'), ('𑆳', '𑇀'), ('\u{111c9}', '\u{111cc}'), - ('\u{111ce}', '\u{111cf}'), + ('𑇎', '\u{111cf}'), ('𑈬', '\u{11237}'), ('\u{1123e}', '\u{1123e}'), ('\u{112df}', '\u{112ea}'), @@ -817,11 +846,11 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{116ab}', '\u{116b7}'), ('\u{1171d}', '\u{1172b}'), ('𑠬', '\u{1183a}'), - ('\u{11930}', '\u{11935}'), - ('\u{11937}', '\u{11938}'), + ('\u{11930}', '𑤵'), + ('𑤷', '𑤸'), ('\u{1193b}', '\u{1193e}'), - ('\u{11940}', '\u{11940}'), - ('\u{11942}', '\u{11943}'), + ('𑥀', '𑥀'), + ('𑥂', '\u{11943}'), ('𑧑', '\u{119d7}'), ('\u{119da}', '\u{119e0}'), ('𑧤', '𑧤'), @@ -850,8 +879,10 @@ pub const EXTEND: &'static [(char, char)] = &[ ('𖽑', '𖾇'), ('\u{16f8f}', '\u{16f92}'), ('\u{16fe4}', '\u{16fe4}'), - ('\u{16ff0}', '\u{16ff1}'), + ('𖿰', '𖿱'), ('\u{1bc9d}', '\u{1bc9e}'), + ('\u{1cf00}', '\u{1cf2d}'), + ('\u{1cf30}', '\u{1cf46}'), ('\u{1d165}', '\u{1d169}'), ('𝅭', '\u{1d172}'), ('\u{1d17b}', '\u{1d182}'), @@ -870,6 +901,7 @@ pub const EXTEND: &'static [(char, char)] = &[ ('\u{1e023}', '\u{1e024}'), ('\u{1e026}', '\u{1e02a}'), ('\u{1e130}', '\u{1e136}'), + ('\u{1e2ae}', '\u{1e2ae}'), ('\u{1e2ec}', '\u{1e2ef}'), ('\u{1e8d0}', '\u{1e8d6}'), ('\u{1e944}', '\u{1e94a}'), @@ -894,6 +926,7 @@ pub const FORMAT: &'static [(char, char)] = &[ ('\u{61c}', '\u{61c}'), ('\u{6dd}', '\u{6dd}'), ('\u{70f}', '\u{70f}'), + ('\u{890}', '\u{891}'), ('\u{8e2}', '\u{8e2}'), ('\u{180e}', '\u{180e}'), ('\u{200e}', '\u{200f}'), @@ -932,7 +965,11 @@ pub const KATAKANA: &'static [(char, char)] = &[ ('㋐', '㋾'), ('㌀', '㍗'), ('ヲ', 'ン'), + ('𚿰', '𚿳'), + ('𚿵', '𚿻'), + ('𚿽', '𚿾'), ('𛀀', '𛀀'), + ('𛄠', '𛄢'), ('𛅤', '𛅧'), ]; @@ -1031,17 +1068,18 @@ pub const NUMERIC: &'static [(char, char)] = &[ ('𑛀', '𑛉'), ('𑜰', '𑜹'), ('𑣠', '𑣩'), - ('\u{11950}', '\u{11959}'), + ('𑥐', '𑥙'), ('𑱐', '𑱙'), ('𑵐', '𑵙'), ('𑶠', '𑶩'), ('𖩠', '𖩩'), + ('𖫀', '𖫉'), ('𖭐', '𖭙'), ('𝟎', '𝟿'), ('𞅀', '𞅉'), ('𞋰', '𞋹'), ('𞥐', '𞥙'), - ('\u{1fbf0}', '\u{1fbf9}'), + ('🯰', '🯹'), ]; pub const REGIONAL_INDICATOR: &'static [(char, char)] = &[('🇦', '🇿')]; diff --git a/scripts/generate-unicode-tables b/scripts/generate-unicode-tables index c01df16e7e..a670cb404f 100755 --- a/scripts/generate-unicode-tables +++ b/scripts/generate-unicode-tables @@ -7,14 +7,17 @@ # # $ mkdir ucd # $ cd ucd -# $ curl -LO https://www.unicode.org/Public/zipped/12.1.0/UCD.zip +# $ curl -LO https://www.unicode.org/Public/zipped/14.0.0/UCD.zip # $ unzip UCD.zip -# $ curl -LO https://unicode.org/Public/emoji/12.0/emoji-data.txt # # And then run this script from the root of this repository by pointing it at # the data directory downloaded above: # # $ ./scripts/generate-unicode-tables path/to/ucd +# +# Once complete, if you are upgrading to a new version of Unicode, +# you'll need to add a new "age" value to the 'ages' routine in +# regex-syntax/src/unicode.rs. if [ $# != 1 ]; then echo "Usage: $(basename "$0") " >&2 diff --git a/tests/unicode.rs b/tests/unicode.rs index 9f1cd0c01f..9b32286247 100644 --- a/tests/unicode.rs +++ b/tests/unicode.rs @@ -232,3 +232,20 @@ mat!(uni_class_sb2, r"\p{sb=lower}", "\u{0469}", Some((0, 2))); mat!(uni_class_sb3, r"\p{sb=Close}", "\u{FF60}", Some((0, 3))); mat!(uni_class_sb4, r"\p{sb=Close}", "\u{1F677}", Some((0, 4))); mat!(uni_class_sb5, r"\p{sb=SContinue}", "\u{FF64}", Some((0, 3))); + +// Test 'Vithkuqi' support, which was added in Unicode 14. +// See: https://github.com/rust-lang/regex/issues/877 +mat!( + uni_vithkuqi_literal_upper, + r"(?i)^\u{10570}$", + "\u{10570}", + Some((0, 4)) +); +mat!( + uni_vithkuqi_literal_lower, + r"(?i)^\u{10570}$", + "\u{10597}", + Some((0, 4)) +); +mat!(uni_vithkuqi_word_upper, r"^\w$", "\u{10570}", Some((0, 4))); +mat!(uni_vithkuqi_word_lower, r"^\w$", "\u{10597}", Some((0, 4)));