chinese-tokenizer
Version: 2.4.0
Simple algorithm to tokenize Chinese texts into words using CC-CEDICT.
33 lines (32 loc) • 721 B
JSON
{
"name": "chinese-tokenizer",
"version": "2.4.0",
"description": "Simple algorithm to tokenize Chinese texts into words using CC-CEDICT.",
"main": "./src/main.js",
"repository": {
"type": "git",
"url": "git+https://github.com/yishn/chinese-tokenizer.git"
},
"keywords": [
"chinese",
"text",
"tokenizer",
"words",
"language"
],
"author": "Yichuan Shen",
"license": "MIT",
"bugs": {
"url": "https://github.com/yishn/chinese-tokenizer/issues"
},
"homepage": "https://github.com/yishn/chinese-tokenizer",
"scripts": {
"test": "tap tests/*.test.js"
},
"dependencies": {
"prettify-pinyin": "^0.1.5"
},
"devDependencies": {
"tap": "^14.2.0"
}
}