@fable-org/fable-library-js
Version:
Core library used by F# projects compiled with fable.io
203 lines (202 loc) • 6.98 kB
JavaScript
import * as Unicode from "./Unicode.13.0.0.js";
import { Exception } from "./Util.js";
function getCategoryFunc() {
// unpack Unicode codepoint ranges (delta encoded) and general categories
const offset = 35; // offsets unprintable characters
const a1 = [...Unicode.rangeDeltas].map((ch) => (ch.codePointAt(0) ?? 0) - offset);
const a2 = [...Unicode.categories].map((ch) => (ch.codePointAt(0) ?? 0) - offset);
const codepoints = new Uint32Array(a1);
const categories = new Uint8Array(a2);
for (let i = 1; i < codepoints.length; ++i) {
codepoints[i] += codepoints[i - 1];
}
// binary search in unicode ranges
return (cp) => {
let hi = codepoints.length;
let lo = 0;
while (hi - lo > 1) {
const mid = Math.floor((hi + lo) / 2);
const test = codepoints[mid];
if (cp < test) {
hi = mid;
}
else if (cp === test) {
hi = lo = mid;
break;
}
else if (test < cp) {
lo = mid;
}
}
return categories[lo];
};
}
export const UnicodeCategory = {
UppercaseLetter: 0,
LowercaseLetter: 1,
TitlecaseLetter: 2,
ModifierLetter: 3,
OtherLetter: 4,
NonSpacingMark: 5,
SpacingCombiningMark: 6,
EnclosingMark: 7,
DecimalDigitNumber: 8,
LetterNumber: 9,
OtherNumber: 10,
SpaceSeparator: 11,
LineSeparator: 12,
ParagraphSeparator: 13,
Control: 14,
Format: 15,
Surrogate: 16,
PrivateUse: 17,
ConnectorPunctuation: 18,
DashPunctuation: 19,
OpenPunctuation: 20,
ClosePunctuation: 21,
InitialQuotePunctuation: 22,
FinalQuotePunctuation: 23,
OtherPunctuation: 24,
MathSymbol: 25,
CurrencySymbol: 26,
ModifierSymbol: 27,
OtherSymbol: 28,
OtherNotAssigned: 29,
};
const isControlMask = 1 << UnicodeCategory.Control;
const isDigitMask = 1 << UnicodeCategory.DecimalDigitNumber;
const isLetterMask = 0
| 1 << UnicodeCategory.UppercaseLetter
| 1 << UnicodeCategory.LowercaseLetter
| 1 << UnicodeCategory.TitlecaseLetter
| 1 << UnicodeCategory.ModifierLetter
| 1 << UnicodeCategory.OtherLetter;
const isLetterOrDigitMask = isLetterMask | isDigitMask;
const isUpperMask = 1 << UnicodeCategory.UppercaseLetter;
const isLowerMask = 1 << UnicodeCategory.LowercaseLetter;
const isNumberMask = 0
| 1 << UnicodeCategory.DecimalDigitNumber
| 1 << UnicodeCategory.LetterNumber
| 1 << UnicodeCategory.OtherNumber;
const isPunctuationMask = 0
| 1 << UnicodeCategory.ConnectorPunctuation
| 1 << UnicodeCategory.DashPunctuation
| 1 << UnicodeCategory.OpenPunctuation
| 1 << UnicodeCategory.ClosePunctuation
| 1 << UnicodeCategory.InitialQuotePunctuation
| 1 << UnicodeCategory.FinalQuotePunctuation
| 1 << UnicodeCategory.OtherPunctuation;
const isSeparatorMask = 0
| 1 << UnicodeCategory.SpaceSeparator
| 1 << UnicodeCategory.LineSeparator
| 1 << UnicodeCategory.ParagraphSeparator;
const isSymbolMask = 0
| 1 << UnicodeCategory.MathSymbol
| 1 << UnicodeCategory.CurrencySymbol
| 1 << UnicodeCategory.ModifierSymbol
| 1 << UnicodeCategory.OtherSymbol;
const isWhiteSpaceMask = 0
| 1 << UnicodeCategory.SpaceSeparator
| 1 << UnicodeCategory.LineSeparator
| 1 << UnicodeCategory.ParagraphSeparator;
const unicodeCategoryFunc = getCategoryFunc();
function charCodeAt(s, index) {
if (index >= 0 && index < s.length) {
return s.charCodeAt(index);
}
else {
throw new Exception("Index out of range.");
}
}
export const getUnicodeCategory = (s) => getUnicodeCategory2(s, 0);
export const isControl = (s) => isControl2(s, 0);
export const isDigit = (s) => isDigit2(s, 0);
export const isLetter = (s) => isLetter2(s, 0);
export const isLetterOrDigit = (s) => isLetterOrDigit2(s, 0);
export const isUpper = (s) => isUpper2(s, 0);
export const isLower = (s) => isLower2(s, 0);
export const isNumber = (s) => isNumber2(s, 0);
export const isPunctuation = (s) => isPunctuation2(s, 0);
export const isSeparator = (s) => isSeparator2(s, 0);
export const isSymbol = (s) => isSymbol2(s, 0);
export const isWhiteSpace = (s) => isWhiteSpace2(s, 0);
export const isHighSurrogate = (s) => isHighSurrogate2(s, 0);
export const isLowSurrogate = (s) => isLowSurrogate2(s, 0);
export const isSurrogate = (s) => isSurrogate2(s, 0);
export function getUnicodeCategory2(s, index) {
const cp = charCodeAt(s, index);
return unicodeCategoryFunc(cp);
}
export function isControl2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isControlMask) !== 0;
}
export function isDigit2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isDigitMask) !== 0;
}
export function isLetter2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isLetterMask) !== 0;
}
export function isLetterOrDigit2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isLetterOrDigitMask) !== 0;
}
export function isUpper2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isUpperMask) !== 0;
}
export function isLower2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isLowerMask) !== 0;
}
export function isNumber2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isNumberMask) !== 0;
}
export function isPunctuation2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isPunctuationMask) !== 0;
}
export function isSeparator2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isSeparatorMask) !== 0;
}
export function isSymbol2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
return (test & isSymbolMask) !== 0;
}
export function isWhiteSpace2(s, index) {
const test = 1 << getUnicodeCategory2(s, index);
if ((test & isWhiteSpaceMask) !== 0) {
return true;
}
const cp = charCodeAt(s, index);
return (0x09 <= cp && cp <= 0x0D) || cp === 0x85 || cp === 0xA0;
}
export function isHighSurrogate2(s, index) {
const cp = charCodeAt(s, index);
return (0xD800 <= cp && cp <= 0xDBFF);
}
export function isLowSurrogate2(s, index) {
const cp = charCodeAt(s, index);
return (0xDC00 <= cp && cp <= 0xDFFF);
}
export function isSurrogate2(s, index) {
const cp = charCodeAt(s, index);
return (0xD800 <= cp && cp <= 0xDFFF);
}
export function isSurrogatePair(s, index) {
return typeof index === "number"
? isHighSurrogate2(s, index) && isLowSurrogate2(s, index + 1)
: isHighSurrogate(s) && isLowSurrogate(index);
}
export function parse(input) {
if (input.length === 1) {
return input[0];
}
else {
throw new Exception("String must be exactly one character long.");
}
}