UNPKG

sbd-fork

Version:

Split text into sentences with Sentence Boundary Detection (SBD).

47 lines (46 loc) 2.32 kB
/*jshint node:true, laxcomma:true */ /*global describe:true, it:true */ "use strict"; var assert = require('assert'); var tokenizer = require('../lib/tokenizer'); describe('Save newlines', function () { describe('Basic', function () { var entry = "First sentence... Another list: \n - green \n - blue \n - red"; var sentences = tokenizer.sentences(entry); it('second sentence should have newlines', function () { assert.equal(sentences[1], "Another list: \n - green \n - blue \n - red"); }); }); describe('Sentence without lists', function () { var entry = "First sentence... Another sentence.\nThis is a new paragraph."; var sentences = tokenizer.sentences(entry); it('second sentence should have newlines', function () { assert.equal(sentences.length, 3); }); }); describe('With option to use newlines as sentence boundaries', function () { var entry = "First sentence... Another list: \n - green \n - blue \n - red"; var sentences = tokenizer.sentences(entry, { "newline_boundaries": true }); it('second sentence should have newlines', function () { assert.equal(sentences.length, 5); }); }); describe('Multiline strings', function () { var entry = "How now brown cow.\ \ Peter Piper Picked a peck of pickled peppers. A peck of pickled peppers peter piper picked."; var sentences = tokenizer.sentences(entry); it('Should have 3 sentences ending in periods', function () { assert.equal(sentences[0], "How now brown cow."); assert.equal(sentences[1], "Peter Piper Picked a peck of pickled peppers."); }); }); describe('Template multiline strings', function () { var entry = "How now brown cow.\n\n Peter Piper Picked a peck of pickled peppers. A peck of pickled peppers peter piper picked."; var sentences = tokenizer.sentences(entry, { "newline_boundaries": true }); it('Should have 3 sentences ending in periods', function () { assert.equal(sentences[0], "How now brown cow."); assert.equal(sentences[1], "Peter Piper Picked a peck of pickled peppers."); }); }); });