UNPKG

@thi.ng/text-analysis

Version:

Text tokenization, transformation & analysis transducers, utilities, stop words, porter stemming, vector encodings, similarities

145 lines 3.37 kB
{ "name": "@thi.ng/text-analysis", "version": "0.4.16", "description": "Text tokenization, transformation & analysis transducers, utilities, stop words, porter stemming, vector encodings, similarities", "type": "module", "module": "./index.js", "typings": "./index.d.ts", "sideEffects": false, "repository": { "type": "git", "url": "https://github.com/thi-ng/umbrella.git" }, "homepage": "https://thi.ng/text-analysis", "funding": [ { "type": "github", "url": "https://github.com/sponsors/postspectacular" }, { "type": "patreon", "url": "https://patreon.com/thing_umbrella" }, { "type": "liberapay", "url": "https://liberapay.com/thi.ng" } ], "author": "Karsten Schmidt (https://thi.ng)", "license": "Apache-2.0", "scripts": { "build": "yarn build:esbuild && yarn build:decl", "build:decl": "tsc --declaration --emitDeclarationOnly", "build:esbuild": "esbuild --format=esm --platform=neutral --target=es2022 --tsconfig=tsconfig.json --outdir=. src/**/*.ts", "clean": "bun ../../tools/src/clean-package.ts", "doc": "typedoc --options ../../typedoc.json --out doc src/index.ts", "doc:readme": "bun ../../tools/src/module-stats.ts && bun ../../tools/src/readme.ts", "pub": "yarn npm publish --access public", "test": "bun test", "tool:tangle": "../../node_modules/.bin/tangle src/**/*.ts" }, "dependencies": { "@thi.ng/api": "^8.12.1", "@thi.ng/arrays": "^2.13.9", "@thi.ng/bidir-index": "^1.3.6", "@thi.ng/checks": "^3.7.16", "@thi.ng/distance": "^3.0.14", "@thi.ng/k-means": "^2.0.12", "@thi.ng/strings": "^3.9.21", "@thi.ng/transducers": "^9.6.7", "@thi.ng/vectors": "^8.6.4" }, "devDependencies": { "esbuild": "^0.25.8", "typedoc": "^0.28.9", "typescript": "^5.9.2" }, "keywords": [ "analysis", "centroid", "cluster", "composition", "decode", "dense", "encode", "frequency", "functional", "histogram", "k-means", "ngram", "pipeline", "similarity", "sparse", "stem", "text", "tf-idf", "tokenizer", "transducer", "typescript", "vocabulary", "vector" ], "publishConfig": { "access": "public" }, "browser": { "process": false, "setTimeout": false }, "engines": { "node": ">=18" }, "files": [ "./*.js", "./*.d.ts" ], "exports": { ".": { "default": "./index.js" }, "./api": { "default": "./api.js" }, "./cluster": { "default": "./cluster.js" }, "./frequencies": { "default": "./frequencies.js" }, "./ngrams": { "default": "./ngrams.js" }, "./replace": { "default": "./replace.js" }, "./similarity": { "default": "./similarity.js" }, "./stem": { "default": "./stem.js" }, "./stop-words": { "default": "./stop-words.js" }, "./tf-idf": { "default": "./tf-idf.js" }, "./tokenize": { "default": "./tokenize.js" }, "./vec": { "default": "./vec.js" }, "./vocab": { "default": "./vocab.js" }, "./xform": { "default": "./xform.js" } }, "thi.ng": { "status": "alpha", "year": 2021 }, "gitHead": "9a998c33c7a524c95b552b9cbdc2734d28a5dafc\n" }