Skip to content

Commit 20e0388

Browse files
committed
✨ add ecmaVersion:2021
1 parent 2e46e8a commit 20e0388

File tree

5 files changed

+32
-7
lines changed

5 files changed

+32
-7
lines changed

scripts/update-unicode-properties.ts

Lines changed: 8 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -18,12 +18,19 @@ const DataSources = [
1818
scValues: "#table-unicode-script-values",
1919
},
2020
{
21-
url: "https://tc39.es/ecma262/",
21+
url: "https://www.ecma-international.org/ecma-262/11.0/",
2222
version: 2020,
2323
binProperties: "#table-binary-unicode-properties",
2424
gcValues: "#table-unicode-general-category-values",
2525
scValues: "#table-unicode-script-values",
2626
},
27+
{
28+
url: "https://tc39.es/ecma262/",
29+
version: 2021,
30+
binProperties: "#table-binary-unicode-properties",
31+
gcValues: "#table-unicode-general-category-values",
32+
scValues: "#table-unicode-script-values",
33+
},
2734
]
2835
const FILE_PATH = "src/unicode/properties.ts"
2936
const logger = console

src/ecma-versions.ts

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1 +1 @@
1-
export type EcmaVersion = 5 | 2015 | 2016 | 2017 | 2018 | 2019 | 2020
1+
export type EcmaVersion = 5 | 2015 | 2016 | 2017 | 2018 | 2019 | 2020 | 2021

src/parser.ts

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -506,7 +506,7 @@ export namespace RegExpParser {
506506
* - `2015` added `u` and `y` flags.
507507
* - `2018` added `s` flag, Named Capturing Group, Lookbehind Assertion,
508508
* and Unicode Property Escape.
509-
* - `2019` and `2020` added more valid Unicode Property Escapes.
509+
* - `2019`, `2020`, and `2021` added more valid Unicode Property Escapes.
510510
*/
511511
ecmaVersion?: EcmaVersion
512512
}

src/unicode/properties.ts

Lines changed: 21 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -7,10 +7,18 @@ class DataSet {
77
private _set2019: Set<string> | undefined
88
private _raw2020: string
99
private _set2020: Set<string> | undefined
10-
public constructor(raw2018: string, raw2019: string, raw2020: string) {
10+
private _raw2021: string
11+
private _set2021: Set<string> | undefined
12+
public constructor(
13+
raw2018: string,
14+
raw2019: string,
15+
raw2020: string,
16+
raw2021: string,
17+
) {
1118
this._raw2018 = raw2018
1219
this._raw2019 = raw2019
1320
this._raw2020 = raw2020
21+
this._raw2021 = raw2021
1422
}
1523
public get es2018(): Set<string> {
1624
return (
@@ -27,6 +35,11 @@ class DataSet {
2735
this._set2020 || (this._set2020 = new Set(this._raw2020.split(" ")))
2836
)
2937
}
38+
public get es2021(): Set<string> {
39+
return (
40+
this._set2021 || (this._set2021 = new Set(this._raw2021.split(" ")))
41+
)
42+
}
3043
}
3144

3245
const gcNameSet = new Set(["General_Category", "gc"])
@@ -35,16 +48,19 @@ const gcValueSets = new DataSet(
3548
"C Cased_Letter Cc Cf Close_Punctuation Cn Co Combining_Mark Connector_Punctuation Control Cs Currency_Symbol Dash_Punctuation Decimal_Number Enclosing_Mark Final_Punctuation Format Initial_Punctuation L LC Letter Letter_Number Line_Separator Ll Lm Lo Lowercase_Letter Lt Lu M Mark Math_Symbol Mc Me Mn Modifier_Letter Modifier_Symbol N Nd Nl No Nonspacing_Mark Number Open_Punctuation Other Other_Letter Other_Number Other_Punctuation Other_Symbol P Paragraph_Separator Pc Pd Pe Pf Pi Po Private_Use Ps Punctuation S Sc Separator Sk Sm So Space_Separator Spacing_Mark Surrogate Symbol Titlecase_Letter Unassigned Uppercase_Letter Z Zl Zp Zs cntrl digit punct",
3649
"",
3750
"",
51+
"",
3852
)
3953
const scValueSets = new DataSet(
4054
"Adlam Adlm Aghb Ahom Anatolian_Hieroglyphs Arab Arabic Armenian Armi Armn Avestan Avst Bali Balinese Bamu Bamum Bass Bassa_Vah Batak Batk Beng Bengali Bhaiksuki Bhks Bopo Bopomofo Brah Brahmi Brai Braille Bugi Buginese Buhd Buhid Cakm Canadian_Aboriginal Cans Cari Carian Caucasian_Albanian Chakma Cham Cher Cherokee Common Copt Coptic Cprt Cuneiform Cypriot Cyrillic Cyrl Deseret Deva Devanagari Dsrt Dupl Duployan Egyp Egyptian_Hieroglyphs Elba Elbasan Ethi Ethiopic Geor Georgian Glag Glagolitic Gonm Goth Gothic Gran Grantha Greek Grek Gujarati Gujr Gurmukhi Guru Han Hang Hangul Hani Hano Hanunoo Hatr Hatran Hebr Hebrew Hira Hiragana Hluw Hmng Hung Imperial_Aramaic Inherited Inscriptional_Pahlavi Inscriptional_Parthian Ital Java Javanese Kaithi Kali Kana Kannada Katakana Kayah_Li Khar Kharoshthi Khmer Khmr Khoj Khojki Khudawadi Knda Kthi Lana Lao Laoo Latin Latn Lepc Lepcha Limb Limbu Lina Linb Linear_A Linear_B Lisu Lyci Lycian Lydi Lydian Mahajani Mahj Malayalam Mand Mandaic Mani Manichaean Marc Marchen Masaram_Gondi Meetei_Mayek Mend Mende_Kikakui Merc Mero Meroitic_Cursive Meroitic_Hieroglyphs Miao Mlym Modi Mong Mongolian Mro Mroo Mtei Mult Multani Myanmar Mymr Nabataean Narb Nbat New_Tai_Lue Newa Nko Nkoo Nshu Nushu Ogam Ogham Ol_Chiki Olck Old_Hungarian Old_Italic Old_North_Arabian Old_Permic Old_Persian Old_South_Arabian Old_Turkic Oriya Orkh Orya Osage Osge Osma Osmanya Pahawh_Hmong Palm Palmyrene Pau_Cin_Hau Pauc Perm Phag Phags_Pa Phli Phlp Phnx Phoenician Plrd Prti Psalter_Pahlavi Qaac Qaai Rejang Rjng Runic Runr Samaritan Samr Sarb Saur Saurashtra Sgnw Sharada Shavian Shaw Shrd Sidd Siddham SignWriting Sind Sinh Sinhala Sora Sora_Sompeng Soyo Soyombo Sund Sundanese Sylo Syloti_Nagri Syrc Syriac Tagalog Tagb Tagbanwa Tai_Le Tai_Tham Tai_Viet Takr Takri Tale Talu Tamil Taml Tang Tangut Tavt Telu Telugu Tfng Tglg Thaa Thaana Thai Tibetan Tibt Tifinagh Tirh Tirhuta Ugar Ugaritic Vai Vaii Wara Warang_Citi Xpeo Xsux Yi Yiii Zanabazar_Square Zanb Zinh Zyyy",
4155
"Dogr Dogra Gong Gunjala_Gondi Hanifi_Rohingya Maka Makasar Medefaidrin Medf Old_Sogdian Rohg Sogd Sogdian Sogo",
4256
"Elym Elymaic Hmnp Nand Nandinagari Nyiakeng_Puachue_Hmong Wancho Wcho",
57+
"Chorasmian Chrs Diak Dives_Akuru Khitan_Small_Script Kits Yezi Yezidi",
4358
)
4459
const binPropertySets = new DataSet(
4560
"AHex ASCII ASCII_Hex_Digit Alpha Alphabetic Any Assigned Bidi_C Bidi_Control Bidi_M Bidi_Mirrored CI CWCF CWCM CWKCF CWL CWT CWU Case_Ignorable Cased Changes_When_Casefolded Changes_When_Casemapped Changes_When_Lowercased Changes_When_NFKC_Casefolded Changes_When_Titlecased Changes_When_Uppercased DI Dash Default_Ignorable_Code_Point Dep Deprecated Dia Diacritic Emoji Emoji_Component Emoji_Modifier Emoji_Modifier_Base Emoji_Presentation Ext Extender Gr_Base Gr_Ext Grapheme_Base Grapheme_Extend Hex Hex_Digit IDC IDS IDSB IDST IDS_Binary_Operator IDS_Trinary_Operator ID_Continue ID_Start Ideo Ideographic Join_C Join_Control LOE Logical_Order_Exception Lower Lowercase Math NChar Noncharacter_Code_Point Pat_Syn Pat_WS Pattern_Syntax Pattern_White_Space QMark Quotation_Mark RI Radical Regional_Indicator SD STerm Sentence_Terminal Soft_Dotted Term Terminal_Punctuation UIdeo Unified_Ideograph Upper Uppercase VS Variation_Selector White_Space XIDC XIDS XID_Continue XID_Start space",
4661
"Extended_Pictographic",
4762
"",
63+
"EBase EComp EMod EPres ExtPict",
4864
)
4965

5066
export function isValidUnicodeProperty(
@@ -59,7 +75,8 @@ export function isValidUnicodeProperty(
5975
return (
6076
(version >= 2018 && scValueSets.es2018.has(value)) ||
6177
(version >= 2019 && scValueSets.es2019.has(value)) ||
62-
(version >= 2020 && scValueSets.es2020.has(value))
78+
(version >= 2020 && scValueSets.es2020.has(value)) ||
79+
(version >= 2021 && scValueSets.es2021.has(value))
6380
)
6481
}
6582
return false
@@ -71,6 +88,7 @@ export function isValidLoneUnicodeProperty(
7188
): boolean {
7289
return (
7390
(version >= 2018 && binPropertySets.es2018.has(value)) ||
74-
(version >= 2019 && binPropertySets.es2019.has(value))
91+
(version >= 2019 && binPropertySets.es2019.has(value)) ||
92+
(version >= 2021 && binPropertySets.es2021.has(value))
7593
)
7694
}

src/validator.ts

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -131,7 +131,7 @@ export namespace RegExpValidator {
131131
* - `2015` added `u` and `y` flags.
132132
* - `2018` added `s` flag, Named Capturing Group, Lookbehind Assertion,
133133
* and Unicode Property Escape.
134-
* - `2019` and `2020` added more valid Unicode Property Escapes.
134+
* - `2019`, `2020`, and `2021` added more valid Unicode Property Escapes.
135135
*/
136136
ecmaVersion?: EcmaVersion
137137

0 commit comments

Comments
 (0)