-
Notifications
You must be signed in to change notification settings - Fork 34
/
Copy pathgenerate-regex.js
59 lines (48 loc) · 1.43 KB
/
generate-regex.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
import { promises as fs } from 'node:fs'
import regenerate from 'regenerate'
// @ts-expect-error: untyped
import alphabetics from '@unicode/unicode-13.0.0/Binary_Property/Alphabetic/code-points.js'
const categoryBase = new URL('../node_modules/@unicode/unicode-13.0.0/General_Category/', import.meta.url)
// Unicode General Categories to remove.
const ranges = [
// Some numbers:
'Other_Number',
// Some punctuation:
'Close_Punctuation',
'Final_Punctuation',
'Initial_Punctuation',
'Open_Punctuation',
'Other_Punctuation',
// All except a normal `-` (dash)
'Dash_Punctuation',
// All:
'Symbol',
'Control',
'Private_Use',
'Format',
'Unassigned',
// All except a normal ` ` (space)
'Separator'
]
const generator = regenerate()
let index = -1
// Add code points to strip.
while (++index < ranges.length) {
const name = ranges[index]
/** @type {{default: Array<number>}} */
const { default: codePoints } = await import(new URL(name + '/code-points.js', categoryBase).href)
generator.add(codePoints)
}
generator
// Some overlap between letters and Other Symbol.
.remove(alphabetics)
// Spaces are turned to `-`
.remove(' ')
// Dash is kept.
.remove('-')
await fs.writeFile('regex.js', [
'// This module is generated by `script/`.',
'/* eslint-disable no-control-regex, no-misleading-character-class, no-useless-escape */',
'export const regex = ' + generator.toRegExp() + 'g',
''
].join('\n'))