|
|
|
|
|
|
|
const posixClasses = { |
|
'[:alnum:]': ['\\p{L}\\p{Nl}\\p{Nd}', true], |
|
'[:alpha:]': ['\\p{L}\\p{Nl}', true], |
|
'[:ascii:]': ['\\x' + '00-\\x' + '7f', false], |
|
'[:blank:]': ['\\p{Zs}\\t', true], |
|
'[:cntrl:]': ['\\p{Cc}', true], |
|
'[:digit:]': ['\\p{Nd}', true], |
|
'[:graph:]': ['\\p{Z}\\p{C}', true, true], |
|
'[:lower:]': ['\\p{Ll}', true], |
|
'[:print:]': ['\\p{C}', true], |
|
'[:punct:]': ['\\p{P}', true], |
|
'[:space:]': ['\\p{Z}\\t\\r\\n\\v\\f', true], |
|
'[:upper:]': ['\\p{Lu}', true], |
|
'[:word:]': ['\\p{L}\\p{Nl}\\p{Nd}\\p{Pc}', true], |
|
'[:xdigit:]': ['A-Fa-f0-9', false], |
|
}; |
|
|
|
|
|
const braceEscape = (s) => s.replace(/[[\]\\-]/g, '\\$&'); |
|
|
|
const regexpEscape = (s) => s.replace(/[-[\]{}()*+?.,\\^$|#\s]/g, '\\$&'); |
|
|
|
const rangesToString = (ranges) => ranges.join(''); |
|
|
|
|
|
|
|
|
|
|
|
|
|
export const parseClass = (glob, position) => { |
|
const pos = position; |
|
|
|
if (glob.charAt(pos) !== '[') { |
|
throw new Error('not in a brace expression'); |
|
} |
|
|
|
const ranges = []; |
|
const negs = []; |
|
let i = pos + 1; |
|
let sawStart = false; |
|
let uflag = false; |
|
let escaping = false; |
|
let negate = false; |
|
let endPos = pos; |
|
let rangeStart = ''; |
|
WHILE: while (i < glob.length) { |
|
const c = glob.charAt(i); |
|
if ((c === '!' || c === '^') && i === pos + 1) { |
|
negate = true; |
|
i++; |
|
continue; |
|
} |
|
if (c === ']' && sawStart && !escaping) { |
|
endPos = i + 1; |
|
break; |
|
} |
|
sawStart = true; |
|
if (c === '\\') { |
|
if (!escaping) { |
|
escaping = true; |
|
i++; |
|
continue; |
|
} |
|
|
|
} |
|
if (c === '[' && !escaping) { |
|
|
|
for (const [cls, [unip, u, neg]] of Object.entries(posixClasses)) { |
|
if (glob.startsWith(cls, i)) { |
|
|
|
if (rangeStart) { |
|
return ['$.', false, glob.length - pos, true]; |
|
} |
|
i += cls.length; |
|
if (neg) |
|
negs.push(unip); |
|
else |
|
ranges.push(unip); |
|
uflag = uflag || u; |
|
continue WHILE; |
|
} |
|
} |
|
} |
|
|
|
escaping = false; |
|
if (rangeStart) { |
|
|
|
|
|
if (c > rangeStart) { |
|
ranges.push(braceEscape(rangeStart) + '-' + braceEscape(c)); |
|
} |
|
else if (c === rangeStart) { |
|
ranges.push(braceEscape(c)); |
|
} |
|
rangeStart = ''; |
|
i++; |
|
continue; |
|
} |
|
|
|
|
|
if (glob.startsWith('-]', i + 1)) { |
|
ranges.push(braceEscape(c + '-')); |
|
i += 2; |
|
continue; |
|
} |
|
if (glob.startsWith('-', i + 1)) { |
|
rangeStart = c; |
|
i += 2; |
|
continue; |
|
} |
|
|
|
ranges.push(braceEscape(c)); |
|
i++; |
|
} |
|
if (endPos < i) { |
|
|
|
|
|
return ['', false, 0, false]; |
|
} |
|
|
|
|
|
if (!ranges.length && !negs.length) { |
|
return ['$.', false, glob.length - pos, true]; |
|
} |
|
|
|
|
|
|
|
|
|
if (negs.length === 0 && |
|
ranges.length === 1 && |
|
/^\\?.$/.test(ranges[0]) && |
|
!negate) { |
|
const r = ranges[0].length === 2 ? ranges[0].slice(-1) : ranges[0]; |
|
return [regexpEscape(r), false, endPos - pos, false]; |
|
} |
|
const sranges = '[' + (negate ? '^' : '') + rangesToString(ranges) + ']'; |
|
const snegs = '[' + (negate ? '' : '^') + rangesToString(negs) + ']'; |
|
const comb = ranges.length && negs.length |
|
? '(' + sranges + '|' + snegs + ')' |
|
: ranges.length |
|
? sranges |
|
: snegs; |
|
return [comb, uflag, endPos - pos, true]; |
|
}; |
|
|