@atproto/api
Version:
Client library for atproto and Bluesky
212 lines (195 loc) • 8.76 kB
text/typescript
import { Facet, RichText, UnicodeString, sanitizeRichText } from '../src'
/**
 * Specs for `sanitizeRichText(..., { cleanNewlines: true })` on plain text
 * (no facets).
 *
 * Every spec feeds a string into a `RichText`, sanitizes it, and compares the
 * resulting `unicodeText` with the expected string. The expectations show
 * runs of more than two line breaks (optionally interleaved with spaces or
 * invisible characters) being reduced to exactly `\n\n`.
 */
describe('sanitizeRichText: cleanNewlines', () => {
  // Family emoji (man, woman, girl, girl joined by ZWJ), written with escapes
  // so that a file-encoding mishap cannot silently corrupt the fixture.
  const FAMILY = '\u{1F468}\u200D\u{1F469}\u200D\u{1F467}\u200D\u{1F467}'

  // Expected result shared by most specs: five words separated by "\n\n".
  const COLLAPSED = 'test\n\ntest\n\ntest\n\ntest\n\ntest'

  /**
   * Builds a RichText from `text`, sanitizes it with `cleanNewlines`, and
   * returns the stringified text before and after sanitization.
   */
  const clean = (text: string) => {
    const input = new RichText({ text })
    const output = sanitizeRichText(input, { cleanNewlines: true })
    return {
      before: String(input.unicodeText),
      after: String(output.unicodeText),
    }
  }

  it('removes more than two consecutive new lines', () => {
    const { after } = clean(
      'test\n\n\n\n\ntest\n\n\n\n\n\n\ntest\n\n\n\n\n\n\ntest\n\n\n\n\n\n\ntest',
    )
    expect(after).toEqual(COLLAPSED)
  })

  it('removes more than two consecutive new lines w/fat unicode', () => {
    const { after } = clean(
      `test${FAMILY}\n\n\n\n\n${FAMILY}test\n\n\n\n\n\n\ntest${FAMILY}\n\n\n\n\n\n\ntest\n\n\n\n\n\n\n${FAMILY}test`,
    )
    expect(after).toEqual(
      `test${FAMILY}\n\n${FAMILY}test\n\ntest${FAMILY}\n\ntest\n\n${FAMILY}test`,
    )
  })

  it('removes more than two consecutive new lines with spaces', () => {
    const { after } = clean(
      'test\n\n\n\n\ntest\n \n \n \n \n\n\ntest\n\n\n\n\n\n\ntest\n\n\n\n\n \n\ntest',
    )
    expect(after).toEqual(COLLAPSED)
  })

  // NOTE: despite the title, the input does contain consecutive new lines;
  // it contains runs of exactly two, which is the allowed maximum. The title
  // is kept unchanged so test reports stay stable.
  it('returns original string if there are no consecutive new lines', () => {
    const { before, after } = clean('test\n\ntest\n\ntest\n\ntest\n\ntest')
    expect(after).toEqual(before)
  })

  it('returns original string if there are no new lines', () => {
    const { before, after } = clean('test test test test test')
    expect(after).toEqual(before)
  })

  it('returns empty string if input is empty', () => {
    const { after } = clean('')
    expect(after).toEqual('')
  })

  it('works with different types of new line characters', () => {
    const { after } = clean(
      'test\r\ntest\n\rtest\rtest\n\n\n\ntest\n\r \n \n \n \n\n\ntest',
    )
    // Single "\r\n", "\n\r" and "\r" separators are expected to be untouched.
    expect(after).toEqual('test\r\ntest\n\rtest\rtest\n\ntest\n\ntest')
  })

  // Invisible characters that may sit between line breaks. Each one gets its
  // own spec, registered in this order, with the same input shape.
  const INVISIBLE_CHARS: ReadonlyArray<readonly [string, string]> = [
    ['zero width space', '\u200B'],
    ['zero width non-joiner', '\u200C'],
    ['zero width joiner', '\u200D'],
    ['soft hyphen', '\u00AD'],
    ['word joiner', '\u2060'],
  ]

  for (const [name, ch] of INVISIBLE_CHARS) {
    it(`removes more than two consecutive new lines with ${name}`, () => {
      const { after } = clean(
        `test\n\n\n\n\ntest\n${ch}${ch}\n\n\n\ntest\n ${ch}${ch} \n\n\n\ntest\n\n\n\n\n\n\ntest`,
      )
      expect(after).toEqual(COLLAPSED)
    })
  }
})
/**
 * Specs for `sanitizeRichText(..., { cleanNewlines: true })` on text that
 * carries facets.
 *
 * Each spec first checks which substring every input facet covers, then
 * checks the sanitized text and the substrings covered by the output facets.
 */
describe('sanitizeRichText w/facets: cleanNewlines', () => {
  // Family emoji (man, woman, girl, girl joined by ZWJ), written with escapes
  // so that a file-encoding mishap cannot silently corrupt the fixture.
  const FAMILY = '\u{1F468}\u200D\u{1F469}\u200D\u{1F467}\u200D\u{1F467}'

  it('preserves entities as expected', () => {
    const input = new RichText({
      text: 'test\n\n\n\n\ntest\n\n\n\n\n\n\ntest\n\n\n\n\n\n\ntest\n\n\n\n\n\n\ntest',
      facets: [
        { index: { byteStart: 0, byteEnd: 13 }, features: [{ $type: '' }] },
        { index: { byteStart: 13, byteEnd: 24 }, features: [{ $type: '' }] },
        { index: { byteStart: 9, byteEnd: 15 }, features: [{ $type: '' }] },
        { index: { byteStart: 4, byteEnd: 9 }, features: [{ $type: '' }] },
      ],
    })
    const output = sanitizeRichText(input, { cleanNewlines: true })

    // NOTE(review): the expectations below read `input.facets` in ascending
    // byteStart order (0, 4, 9, 13), not in the order declared above.
    // Presumably RichText sorts facets on construction; confirm against the
    // RichText implementation.
    expect(facetToStr(String(input.unicodeText), input.facets?.[0])).toEqual(
      'test\n\n\n\n\ntest',
    )
    expect(facetToStr(String(input.unicodeText), input.facets?.[1])).toEqual(
      '\n\n\n\n\n',
    )
    expect(facetToStr(String(input.unicodeText), input.facets?.[2])).toEqual(
      'test\n\n',
    )
    expect(facetToStr(String(input.unicodeText), input.facets?.[3])).toEqual(
      '\n\n\n\n\n\n\ntest',
    )

    expect(String(output.unicodeText)).toEqual(
      'test\n\ntest\n\ntest\n\ntest\n\ntest',
    )
    expect(facetToStr(String(output.unicodeText), output.facets?.[0])).toEqual(
      'test\n\ntest',
    )
    expect(facetToStr(String(output.unicodeText), output.facets?.[1])).toEqual(
      'test',
    )
    expect(facetToStr(String(output.unicodeText), output.facets?.[2])).toEqual(
      'test',
    )
    // Only three facets are expected to remain after sanitization.
    expect(output.facets?.[3]).toEqual(undefined)
  })

  it('preserves entities as expected w/fat unicode', () => {
    const word = `${FAMILY}test`
    // Seven emoji-prefixed words, each followed by five line breaks.
    const str = new UnicodeString(`${word}\n\n\n\n\n`.repeat(7))

    // Search cursor (UTF-16 index): each facet is located after the previous
    // match, so facets are produced in ascending position.
    let lastI = 0

    /**
     * Locates the next occurrence of `match` in the fixture and returns a
     * facet whose byte range covers it.
     */
    const makeFacet = (match: string) => {
      const i = str.utf16.indexOf(match, lastI)
      if (i === -1) {
        // Fail loudly instead of deriving byte offsets from a -1 index.
        throw new Error(
          `makeFacet: ${JSON.stringify(match)} not found at or after UTF-16 index ${lastI}`,
        )
      }
      lastI = i + match.length
      const byteStart = str.utf16IndexToUtf8Index(i)
      const byteEnd = byteStart + new UnicodeString(match).length
      return {
        index: { byteStart, byteEnd },
        features: [{ $type: '' }],
      }
    }

    const input = new RichText({
      text: str.utf16,
      facets: [
        makeFacet(`${word}\n\n\n\n\n${word}`),
        makeFacet(`\n\n\n\n\n${word}`),
        makeFacet(`${word}\n\n`),
        makeFacet('\n\n'),
      ],
    })
    const output = sanitizeRichText(input, { cleanNewlines: true })

    expect(facetToStr(String(input.unicodeText), input.facets?.[0])).toEqual(
      `${word}\n\n\n\n\n${word}`,
    )
    expect(facetToStr(String(input.unicodeText), input.facets?.[1])).toEqual(
      `\n\n\n\n\n${word}`,
    )
    expect(facetToStr(String(input.unicodeText), input.facets?.[2])).toEqual(
      `${word}\n\n`,
    )
    expect(facetToStr(String(input.unicodeText), input.facets?.[3])).toEqual(
      '\n\n',
    )

    expect(String(output.unicodeText)).toEqual(`${word}\n\n`.repeat(7))
    expect(facetToStr(String(output.unicodeText), output.facets?.[0])).toEqual(
      `${word}\n\n${word}`,
    )
    expect(facetToStr(String(output.unicodeText), output.facets?.[1])).toEqual(
      word,
    )
    expect(facetToStr(String(output.unicodeText), output.facets?.[2])).toEqual(
      word,
    )
    // Only three facets are expected to remain after sanitization.
    expect(output.facets?.[3]).toEqual(undefined)
  })
})
/**
 * Returns the part of `str` covered by a facet's byte range.
 *
 * The text is wrapped in a `UnicodeString` and sliced from
 * `ent.index.byteStart` to `ent.index.byteEnd`. When no facet is supplied,
 * the result is the empty string, so callers can pass `facets?.[i]` directly.
 *
 * @param str - Full text the facet refers to.
 * @param ent - Facet whose `index` range selects the slice; may be omitted.
 * @returns The selected slice, or `''` when `ent` is missing.
 */
function facetToStr(str: string, ent?: Facet) {
  return ent
    ? new UnicodeString(str).slice(ent.index.byteStart, ent.index.byteEnd)
    : ''
}