Skip to content

Commit

Permalink
data: update to UCD 16
Browse files Browse the repository at this point in the history
  • Loading branch information
BurntSushi committed Sep 29, 2024
1 parent d3d3ff7 commit 8bcdbe3
Show file tree
Hide file tree
Showing 12 changed files with 2,064 additions and 595 deletions.
65 changes: 45 additions & 20 deletions regex-automata/src/util/unicode_data/perl_word.rs
Original file line number Diff line number Diff line change
@@ -1,10 +1,10 @@
// DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY:
//
// ucd-generate perl-word tmp/ucd-15.0.0/ --chars
// ucd-generate perl-word ucd-16.0.0 --chars
//
// Unicode version: 15.0.0.
// Unicode version: 16.0.0.
//
// ucd-generate 0.2.15 is available on crates.io.
// ucd-generate 0.3.1 is available on crates.io.

pub const PERL_WORD: &'static [(char, char)] = &[
('0', '9'),
Expand Down Expand Up @@ -59,7 +59,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('ࡠ', 'ࡪ'),
('ࡰ', 'ࢇ'),
('ࢉ', 'ࢎ'),
('\u{898}', '\u{8e1}'),
('\u{897}', '\u{8e1}'),
('\u{8e3}', '\u{963}'),
('०', '९'),
('ॱ', 'ঃ'),
Expand Down Expand Up @@ -158,8 +158,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('ಪ', 'ಳ'),
('ವ', 'ಹ'),
('\u{cbc}', 'ೄ'),
('\u{cc6}', ''),
('', '\u{ccd}'),
('\u{cc6}', '\u{cc8}'),
('\u{cca}', '\u{ccd}'),
('\u{cd5}', '\u{cd6}'),
('ೝ', 'ೞ'),
('ೠ', '\u{ce3}'),
Expand Down Expand Up @@ -243,8 +243,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('ᚁ', 'ᚚ'),
('ᚠ', 'ᛪ'),
('ᛮ', 'ᛸ'),
('ᜀ', ''),
('ᜟ', ''),
('ᜀ', '\u{1715}'),
('ᜟ', '\u{1734}'),
('ᝀ', '\u{1753}'),
('ᝠ', 'ᝬ'),
('ᝮ', 'ᝰ'),
Expand Down Expand Up @@ -276,11 +276,11 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('\u{1b00}', 'ᭌ'),
('᭐', '᭙'),
('\u{1b6b}', '\u{1b73}'),
('\u{1b80}', ''),
('\u{1b80}', '\u{1bf3}'),
('ᰀ', '\u{1c37}'),
('᱀', '᱉'),
('ᱍ', 'ᱽ'),
('ᲀ', ''),
('ᲀ', ''),
('Ა', 'Ჺ'),
('Ჽ', 'Ჿ'),
('\u{1cd0}', '\u{1cd2}'),
Expand Down Expand Up @@ -367,10 +367,10 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('ꙿ', '\u{a6f1}'),
('ꜗ', 'ꜟ'),
('Ꜣ', 'ꞈ'),
('Ꞌ', ''),
('Ꞌ', ''),
('Ꟑ', 'ꟑ'),
('ꟓ', 'ꟓ'),
('ꟕ', ''),
('ꟕ', ''),
('ꟲ', 'ꠧ'),
('\u{a82c}', '\u{a82c}'),
('ꡀ', 'ꡳ'),
Expand All @@ -379,9 +379,9 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('\u{a8e0}', 'ꣷ'),
('ꣻ', 'ꣻ'),
('ꣽ', '\u{a92d}'),
('ꤰ', ''),
('ꤰ', '\u{a953}'),
('ꥠ', 'ꥼ'),
('\u{a980}', ''),
('\u{a980}', '\u{a9c0}'),
('ꧏ', '꧙'),
('ꧠ', 'ꧾ'),
('ꨀ', '\u{aa36}'),
Expand Down Expand Up @@ -468,6 +468,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𐖣', '𐖱'),
('𐖳', '𐖹'),
('𐖻', '𐖼'),
('𐗀', '𐗳'),
('𐘀', '𐜶'),
('𐝀', '𐝕'),
('𐝠', '𐝧'),
Expand Down Expand Up @@ -508,10 +509,14 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𐳀', '𐳲'),
('𐴀', '\u{10d27}'),
('𐴰', '𐴹'),
('𐵀', '𐵥'),
('\u{10d69}', '\u{10d6d}'),
('𐵯', '𐶅'),
('𐺀', '𐺩'),
('\u{10eab}', '\u{10eac}'),
('𐺰', '𐺱'),
('\u{10efd}', '𐼜'),
('𐻂', '𐻄'),
('\u{10efc}', '𐼜'),
('𐼧', '𐼧'),
('𐼰', '\u{10f50}'),
('𐽰', '\u{10f85}'),
Expand Down Expand Up @@ -551,12 +556,22 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𑌵', '𑌹'),
('\u{1133b}', '𑍄'),
('𑍇', '𑍈'),
('𑍋', '𑍍'),
('𑍋', '\u{1134d}'),
('𑍐', '𑍐'),
('\u{11357}', '\u{11357}'),
('𑍝', '𑍣'),
('\u{11366}', '\u{1136c}'),
('\u{11370}', '\u{11374}'),
('𑎀', '𑎉'),
('𑎋', '𑎋'),
('𑎎', '𑎎'),
('𑎐', '𑎵'),
('𑎷', '\u{113c0}'),
('\u{113c2}', '\u{113c2}'),
('\u{113c5}', '\u{113c5}'),
('\u{113c7}', '𑏊'),
('𑏌', '𑏓'),
('\u{113e1}', '\u{113e2}'),
('𑐀', '𑑊'),
('𑑐', '𑑙'),
('\u{1145e}', '𑑡'),
Expand All @@ -571,6 +586,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𑙐', '𑙙'),
('𑚀', '𑚸'),
('𑛀', '𑛉'),
('𑛐', '𑛣'),
('𑜀', '𑜚'),
('\u{1171d}', '\u{1172b}'),
('𑜰', '𑜹'),
Expand All @@ -594,6 +610,8 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𑩐', '\u{11a99}'),
('𑪝', '𑪝'),
('𑪰', '𑫸'),
('𑯀', '𑯠'),
('𑯰', '𑯹'),
('𑰀', '𑰈'),
('𑰊', '\u{11c36}'),
('\u{11c38}', '𑱀'),
Expand All @@ -618,15 +636,17 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('\u{11f00}', '𑼐'),
('𑼒', '\u{11f3a}'),
('𑼾', '\u{11f42}'),
('𑽐', '𑽙'),
('𑽐', '\u{11f5a}'),
('𑾰', '𑾰'),
('𒀀', '𒎙'),
('𒐀', '𒑮'),
('𒒀', '𒕃'),
('𒾐', '𒿰'),
('𓀀', '𓐯'),
('\u{13440}', '\u{13455}'),
('𓑠', '𔏺'),
('𔐀', '𔙆'),
('𖄀', '𖄹'),
('𖠀', '𖨸'),
('𖩀', '𖩞'),
('𖩠', '𖩩'),
Expand All @@ -639,16 +659,18 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𖭐', '𖭙'),
('𖭣', '𖭷'),
('𖭽', '𖮏'),
('𖵀', '𖵬'),
('𖵰', '𖵹'),
('𖹀', '𖹿'),
('𖼀', '𖽊'),
('\u{16f4f}', '𖾇'),
('\u{16f8f}', '𖾟'),
('𖿠', '𖿡'),
('𖿣', '\u{16fe4}'),
('𖿰', '𖿱'),
('\u{16ff0}', '\u{16ff1}'),
('𗀀', '𘟷'),
('𘠀', '𘳕'),
('𘴀', '𘴈'),
('𘳿', '𘴈'),
('𚿰', '𚿳'),
('𚿵', '𚿻'),
('𚿽', '𚿾'),
Expand All @@ -663,10 +685,11 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𛲀', '𛲈'),
('𛲐', '𛲙'),
('\u{1bc9d}', '\u{1bc9e}'),
('𜳰', '𜳹'),
('\u{1cf00}', '\u{1cf2d}'),
('\u{1cf30}', '\u{1cf46}'),
('\u{1d165}', '\u{1d169}'),
('𝅭', '\u{1d172}'),
('\u{1d16d}', '\u{1d172}'),
('\u{1d17b}', '\u{1d182}'),
('\u{1d185}', '\u{1d18b}'),
('\u{1d1aa}', '\u{1d1ad}'),
Expand Down Expand Up @@ -724,6 +747,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𞊐', '\u{1e2ae}'),
('𞋀', '𞋹'),
('𞓐', '𞓹'),
('𞗐', '𞗺'),
('𞟠', '𞟦'),
('𞟨', '𞟫'),
('𞟭', '𞟮'),
Expand Down Expand Up @@ -774,6 +798,7 @@ pub const PERL_WORD: &'static [(char, char)] = &[
('𫝀', '𫠝'),
('𫠠', '𬺡'),
('𬺰', '𮯠'),
('𮯰', '𮹝'),
('丽', '𪘀'),
('𰀀', '𱍊'),
('𱍐', '𲎯'),
Expand Down
77 changes: 66 additions & 11 deletions regex-syntax/src/unicode_tables/age.rs
Original file line number Diff line number Diff line change
@@ -1,10 +1,10 @@
// DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY:
//
// ucd-generate age ucd-15.0.0 --chars
// ucd-generate age ucd-16.0.0 --chars
//
// Unicode version: 15.0.0.
// Unicode version: 16.0.0.
//
// ucd-generate 0.2.14 is available on crates.io.
// ucd-generate 0.3.1 is available on crates.io.

pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[
("V10_0", V10_0),
Expand All @@ -14,6 +14,8 @@ pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[
("V13_0", V13_0),
("V14_0", V14_0),
("V15_0", V15_0),
("V15_1", V15_1),
("V16_0", V16_0),
("V1_1", V1_1),
("V2_0", V2_0),
("V2_1", V2_1),
Expand Down Expand Up @@ -238,7 +240,7 @@ pub const V13_0: &'static [(char, char)] = &[
('𑥐', '𑥙'),
('𑾰', '𑾰'),
('\u{16fe4}', '\u{16fe4}'),
('𖿰', '𖿱'),
('\u{16ff0}', '\u{16ff1}'),
('𘫳', '𘳕'),
('𘴀', '𘴈'),
('🄍', '🄏'),
Expand Down Expand Up @@ -277,7 +279,7 @@ pub const V14_0: &'static [(char, char)] = &[
('ౝ', 'ౝ'),
('ೝ', 'ೝ'),
('ᜍ', 'ᜍ'),
('', ''),
('\u{1715}', '\u{1715}'),
('ᜟ', 'ᜟ'),
('\u{180f}', '\u{180f}'),
('\u{1ac1}', '\u{1ace}'),
Expand Down Expand Up @@ -382,6 +384,59 @@ pub const V15_0: &'static [(char, char)] = &[
('𱍐', '𲎯'),
];

pub const V15_1: &'static [(char, char)] =
&[('⿼', '⿿'), ('㇯', '㇯'), ('𮯰', '𮹝')];

pub const V16_0: &'static [(char, char)] = &[
('\u{897}', '\u{897}'),
('᭎', '᭏'),
('᭿', '᭿'),
('Ᲊ', 'ᲊ'),
('␧', '␩'),
('㇤', '㇥'),
('Ɤ', 'ꟍ'),
('Ꟛ', 'Ƛ'),
('𐗀', '𐗳'),
('𐵀', '𐵥'),
('\u{10d69}', '𐶅'),
('𐶎', '𐶏'),
('𐻂', '𐻄'),
('\u{10efc}', '\u{10efc}'),
('𑎀', '𑎉'),
('𑎋', '𑎋'),
('𑎎', '𑎎'),
('𑎐', '𑎵'),
('𑎷', '\u{113c0}'),
('\u{113c2}', '\u{113c2}'),
('\u{113c5}', '\u{113c5}'),
('\u{113c7}', '𑏊'),
('𑏌', '𑏕'),
('𑏗', '𑏘'),
('\u{113e1}', '\u{113e2}'),
('𑛐', '𑛣'),
('𑯀', '𑯡'),
('𑯰', '𑯹'),
('\u{11f5a}', '\u{11f5a}'),
('𓑠', '𔏺'),
('𖄀', '𖄹'),
('𖵀', '𖵹'),
('𘳿', '𘳿'),
('𜰀', '𜳹'),
('𜴀', '𜺳'),
('𞗐', '𞗺'),
('𞗿', '𞗿'),
('🢲', '🢻'),
('🣀', '🣁'),
('🪉', '🪉'),
('🪏', '🪏'),
('🪾', '🪾'),
('🫆', '🫆'),
('🫜', '🫜'),
('🫟', '🫟'),
('🫩', '🫩'),
('🯋', '🯯'),
];

pub const V1_1: &'static [(char, char)] = &[
('\0', 'ǵ'),
('Ǻ', 'ȗ'),
Expand Down Expand Up @@ -530,8 +585,8 @@ pub const V1_1: &'static [(char, char)] = &[
('ಪ', 'ಳ'),
('ವ', 'ಹ'),
('ಾ', 'ೄ'),
('\u{cc6}', ''),
('', '\u{ccd}'),
('\u{cc6}', '\u{cc8}'),
('\u{cca}', '\u{ccd}'),
('\u{cd5}', '\u{cd6}'),
('ೞ', 'ೞ'),
('ೠ', 'ೡ'),
Expand Down Expand Up @@ -1174,7 +1229,7 @@ pub const V5_1: &'static [(char, char)] = &[
('ၚ', '႙'),
('႞', '႟'),
('ᢪ', 'ᢪ'),
('\u{1b80}', ''),
('\u{1b80}', '\u{1baa}'),
('ᮮ', '᮹'),
('ᰀ', '\u{1c37}'),
('᰻', '᱉'),
Expand Down Expand Up @@ -1212,7 +1267,7 @@ pub const V5_1: &'static [(char, char)] = &[
('ꟻ', 'ꟿ'),
('ꢀ', '\u{a8c4}'),
('꣎', '꣙'),
('꤀', ''),
('꤀', '\u{a953}'),
('꥟', '꥟'),
('ꨀ', '\u{aa36}'),
('ꩀ', 'ꩍ'),
Expand Down Expand Up @@ -1340,7 +1395,7 @@ pub const V6_0: &'static [(char, char)] = &[
('ྌ', '\u{f8f}'),
('࿙', '࿚'),
('\u{135d}', '\u{135e}'),
('ᯀ', ''),
('ᯀ', '\u{1bf3}'),
('᯼', '᯿'),
('\u{1dfc}', '\u{1dfc}'),
('ₕ', 'ₜ'),
Expand Down Expand Up @@ -1606,7 +1661,7 @@ pub const V7_0: &'static [(char, char)] = &[
('𑌵', '𑌹'),
('\u{1133c}', '𑍄'),
('𑍇', '𑍈'),
('𑍋', '𑍍'),
('𑍋', '\u{1134d}'),
('\u{11357}', '\u{11357}'),
('𑍝', '𑍣'),
('\u{11366}', '\u{1136c}'),
Expand Down
Loading

0 comments on commit 8bcdbe3

Please sign in to comment.