UNPKG

spacy

Version:

JavaScript API for spaCy with Python REST API

418 lines (417 loc) 11.9 kB
/** Raw text of the sample document that the other fixtures describe. */
export const text = 'Hello world! This is a sentence about Facebook.';

/** Token texts of `text`, in document order (one entry per item of `attrs.tokens`). */
export const words = [
  'Hello',
  'world',
  '!',
  'This',
  'is',
  'a',
  'sentence',
  'about',
  'Facebook',
  '.',
];

/**
 * One flag per entry of `words`: `true` where the matching token in
 * `attrs.tokens` has `whitespace: ' '`, `false` where it is `''`.
 */
export const spaces = [
  true,
  false,
  true,
  true,
  true,
  true,
  true,
  true,
  false,
  false,
];

/**
 * Key order of a token record, plus the values of the flags that are the same
 * for all ten tokens in this fixture. Keys set to `undefined` are placeholders
 * that only pin the key position; every token passed to `buildFixtureToken`
 * overwrites all of them.
 */
const TOKEN_FIELD_TEMPLATE = {
  text: undefined,
  text_with_ws: undefined,
  whitespace: undefined,
  orth: undefined,
  i: undefined,
  ent_type: undefined,
  ent_iob: undefined,
  lemma: undefined,
  norm: undefined,
  lower: undefined,
  shape: undefined,
  prefix: undefined,
  suffix: undefined,
  pos: undefined,
  tag: undefined,
  dep: undefined,
  is_alpha: undefined,
  is_ascii: true,
  is_digit: false,
  is_lower: undefined,
  is_upper: false,
  is_title: undefined,
  is_punct: undefined,
  is_left_punct: false,
  is_right_punct: false,
  is_space: false,
  is_bracket: false,
  is_currency: false,
  like_url: false,
  like_num: false,
  like_email: false,
  is_oov: true,
  is_stop: undefined,
  is_sent_start: undefined,
  head: undefined,
};

/**
 * Builds one complete token record.
 *
 * @param {object} fields - The token-specific attributes (all template keys
 *   whose placeholder is `undefined`).
 * @returns {object} A fresh object with the template's key order, the shared
 *   flag values, and `fields` applied on top.
 */
function buildFixtureToken(fields) {
  // Overwriting a key that already exists keeps its position, so the result
  // has the template's key order regardless of the order used in `fields`.
  return Object.assign({}, TOKEN_FIELD_TEMPLATE, fields);
}

/**
 * Parsed-document payload for `text`: the model name, document-level info,
 * entity / sentence / noun-chunk spans, and one attribute record per token.
 *
 * NOTE(review): span `start`/`end` look like token offsets with an exclusive
 * end (the ORG entity 8-9 lines up with token 8, "Facebook") - confirm against
 * the producer of this payload.
 *
 * Every `orth` literal below is larger than Number.MAX_SAFE_INTEGER, so the
 * value held at runtime is the nearest double, not the exact integer written.
 * The literals are kept exactly as they were so the runtime values do not
 * change.
 */
export const attrs = {
  model: 'en_core_web_sm',
  doc: {
    text,
    text_with_ws: text,
    cats: {},
    is_tagged: true,
    is_parsed: true,
    is_sentenced: true,
  },
  ents: [{ start: 8, end: 9, label: 'ORG' }],
  sents: [
    { start: 0, end: 3 },
    { start: 3, end: 10 },
  ],
  noun_chunks: [
    { start: 0, end: 2 },
    { start: 5, end: 7 },
    { start: 8, end: 9 },
  ],
  tokens: [
    {
      text: 'Hello',
      text_with_ws: 'Hello ',
      whitespace: ' ',
      orth: 15777305708150031551,
      i: 0,
      ent_type: '',
      ent_iob: 'O',
      lemma: 'hello',
      norm: 'hello',
      lower: 'hello',
      shape: 'Xxxxx',
      prefix: 'H',
      suffix: 'llo',
      pos: 'INTJ',
      tag: 'UH',
      dep: 'intj',
      is_alpha: true,
      is_lower: false,
      is_title: true,
      is_punct: false,
      is_stop: false,
      is_sent_start: null,
      head: 1,
    },
    {
      text: 'world',
      text_with_ws: 'world',
      whitespace: '',
      orth: 1703489418272052182,
      i: 1,
      ent_type: '',
      ent_iob: 'O',
      lemma: 'world',
      norm: 'world',
      lower: 'world',
      shape: 'xxxx',
      prefix: 'w',
      suffix: 'rld',
      pos: 'NOUN',
      tag: 'NN',
      dep: 'ROOT',
      is_alpha: true,
      is_lower: true,
      is_title: false,
      is_punct: false,
      is_stop: false,
      is_sent_start: null,
      head: 1,
    },
    {
      text: '!',
      text_with_ws: '! ',
      whitespace: ' ',
      orth: 17494803046312582752,
      i: 2,
      ent_type: '',
      ent_iob: 'O',
      lemma: '!',
      norm: '!',
      lower: '!',
      shape: '!',
      prefix: '!',
      suffix: '!',
      pos: 'PUNCT',
      tag: '.',
      dep: 'punct',
      is_alpha: false,
      is_lower: false,
      is_title: false,
      is_punct: true,
      is_stop: false,
      is_sent_start: null,
      head: 1,
    },
    {
      text: 'This',
      text_with_ws: 'This ',
      whitespace: ' ',
      orth: 12943039165150086467,
      i: 3,
      ent_type: '',
      ent_iob: 'O',
      lemma: 'this',
      norm: 'this',
      lower: 'this',
      shape: 'Xxxx',
      prefix: 'T',
      suffix: 'his',
      pos: 'DET',
      tag: 'DT',
      dep: 'nsubj',
      is_alpha: true,
      is_lower: false,
      is_title: true,
      is_punct: false,
      is_stop: false,
      is_sent_start: true,
      head: 4,
    },
    {
      text: 'is',
      text_with_ws: 'is ',
      whitespace: ' ',
      orth: 3411606890003347522,
      i: 4,
      ent_type: '',
      ent_iob: 'O',
      lemma: 'be',
      norm: 'is',
      lower: 'is',
      shape: 'xx',
      prefix: 'i',
      suffix: 'is',
      pos: 'VERB',
      tag: 'VBZ',
      dep: 'ROOT',
      is_alpha: true,
      is_lower: true,
      is_title: false,
      is_punct: false,
      is_stop: true,
      is_sent_start: null,
      head: 4,
    },
    {
      text: 'a',
      text_with_ws: 'a ',
      whitespace: ' ',
      orth: 11901859001352538922,
      i: 5,
      ent_type: '',
      ent_iob: 'O',
      lemma: 'a',
      norm: 'gonna',
      lower: 'a',
      shape: 'x',
      prefix: 'a',
      suffix: 'a',
      pos: 'DET',
      tag: 'DT',
      dep: 'det',
      is_alpha: true,
      is_lower: true,
      is_title: false,
      is_punct: false,
      is_stop: true,
      is_sent_start: null,
      head: 6,
    },
    {
      text: 'sentence',
      text_with_ws: 'sentence ',
      whitespace: ' ',
      orth: 18108853898452662235,
      i: 6,
      ent_type: '',
      ent_iob: 'O',
      lemma: 'sentence',
      norm: 'sentence',
      lower: 'sentence',
      shape: 'xxxx',
      prefix: 's',
      suffix: 'nce',
      pos: 'NOUN',
      tag: 'NN',
      dep: 'attr',
      is_alpha: true,
      is_lower: true,
      is_title: false,
      is_punct: false,
      is_stop: false,
      is_sent_start: null,
      head: 4,
    },
    {
      text: 'about',
      text_with_ws: 'about ',
      whitespace: ' ',
      orth: 942632335873952620,
      i: 7,
      ent_type: '',
      ent_iob: 'O',
      lemma: 'about',
      norm: 'about',
      lower: 'about',
      shape: 'xxxx',
      prefix: 'a',
      suffix: 'out',
      pos: 'ADP',
      tag: 'IN',
      dep: 'prep',
      is_alpha: true,
      is_lower: true,
      is_title: false,
      is_punct: false,
      is_stop: true,
      is_sent_start: null,
      head: 6,
    },
    {
      text: 'Facebook',
      text_with_ws: 'Facebook',
      whitespace: '',
      orth: 8081970590932371665,
      i: 8,
      ent_type: 'ORG',
      ent_iob: 'B',
      lemma: 'facebook',
      norm: 'facebook',
      lower: 'facebook',
      shape: 'Xxxxx',
      prefix: 'F',
      suffix: 'ook',
      pos: 'PROPN',
      tag: 'NNP',
      dep: 'pobj',
      is_alpha: true,
      is_lower: false,
      is_title: true,
      is_punct: false,
      is_stop: false,
      is_sent_start: null,
      head: 7,
    },
    {
      text: '.',
      text_with_ws: '.',
      whitespace: '',
      orth: 12646065887601541794,
      i: 9,
      ent_type: '',
      ent_iob: 'O',
      lemma: '.',
      norm: '.',
      lower: '.',
      shape: '.',
      prefix: '.',
      suffix: '.',
      pos: 'PUNCT',
      tag: '.',
      dep: 'punct',
      is_alpha: false,
      is_lower: false,
      is_title: false,
      is_punct: true,
      is_stop: false,
      is_sent_start: null,
      head: 4,
    },
  ].map(buildFixtureToken),
};