UNPKG

contacted-chunking

Version: 2.4.1

Semantically create chunks from large texts. Useful for workflows involving large language models (LLMs).

51 lines (50 loc) 1.44 kB
{
  "name": "contacted-chunking",
  "version": "2.4.1",
  "description": "Semantically create chunks from large texts. Useful for workflows involving large language models (LLMs).",
  "homepage": "https://www.equilllabs.com/projects/semantic-chunking",
  "repository": {
    "type": "git",
    "url": "https://github.com/jparkerweb/semantic-chunking.git"
  },
  "bugs": {
    "url": "https://github.com/jparkerweb/semantic-chunking/issues",
    "email": "equilllabs@gmail.com"
  },
  "main": "chunkit.js",
  "type": "module",
  "keywords": [
    "semantic",
    "chunking",
    "sentence",
    "similarity",
    "cosine",
    "chunk",
    "rag",
    "splitting",
    "transformers",
    "transformers.js",
    "embeddings",
    "onnx",
    "xenova",
    "text-processing",
    "nlp",
    "webui",
    "ml",
    "BERT"
  ],
  "author": "jparkerweb@gmail.com",
  "license": "ISC",
  "scripts": {
    "clean-models": "find ./models -type f ! -name '*.url' -delete",
    "clean-models-win": "powershell -Command \"Get-ChildItem -Path ./models -Recurse | Where-Object { !$_.PSIsContainer -and $_.Extension -ne '.url' } | Remove-Item\"",
    "download-models": "node ./tools/download-models.js"
  },
  "dependencies": {
    "@huggingface/transformers": "^3.2.0",
    "@stdlib/nlp-sentencize": "^0.2.2",
    "cli-progress": "^3.12.0",
    "lru-cache": "^11.0.2"
  }
}