UNPKG

spacy

Version:

JavaScript API for spaCy with Python REST API

63 lines (53 loc) 1.79 kB
import spacy from '../src'; import { Doc, Token, Span } from '../src/tokens'; import { text, words, spaces, attrs } from './util' jest.mock('../src/language'); const nlp = spacy.load('en_core_web_sm'); test('allows manual construction', async () => { const doc = await nlp(text); const span = new Span(doc, 6, 9); expect(span).toBeInstanceOf(Span); expect(span.text).toBe('sentence about Facebook'); }); test('allows being sliced off Doc', async () => { const doc = await nlp(text); const span = doc.slice(6, 9); expect(span).toBeInstanceOf(Span); expect(span.text).toBe('sentence about Facebook'); }); test('has Span attributes', async () => { const doc = await nlp(text); const span = doc.slice(6, 9); expect(span.toString()).toBe('sentence about Facebook'); expect(span.length).toBe(3); expect(span.start).toBe(6); expect(span.end).toBe(9); expect(span.label).toBeUndefined(); }); test('has parent Doc', async() => { const doc = await nlp(text); const span = doc.slice(6, 9); expect(span.doc).toBeInstanceOf(Doc); expect(span.doc).toBe(doc); }); test('has entity label', async () => { const doc = await nlp(text); const span = doc.slice(8, 9); expect(span.toString()).toBe('Facebook'); expect(span.label).toBe('ORG'); }); test('allows token indexing', async () => { const doc = await nlp(text); const span = doc.slice(6, 9); for (let i = 0; i < span.length; i++) { expect(span[i]).toBeInstanceOf(Token); } expect(span[span.length + 1]).toBeUndefined(); }); test('allows token iteration', async () => { const doc = await nlp(text); const span = doc.slice(6, 9); for (let token of span) { expect(token).toBeInstanceOf(Token); } });