multi-voice-sdk
Version: 1.1.0
A universal Text-to-Speech (TTS) and Speech-to-Text (STT) SDK supporting multiple providers (OpenAI, Google Gemini, Deepgram, Groq PlayAI, Cartesia, AssemblyAI) with audio merging capabilities
61 lines (60 loc) • 1.35 kB
JSON
{
"name": "multi-voice-sdk",
"version": "1.1.0",
"description": "A universal Text-to-Speech (TTS) and Speech-to-Text (STT) SDK supporting multiple providers (OpenAI, Google Gemini, Deepgram, Groq PlayAI, Cartesia, AssemblyAI) with audio merging capabilities",
"main": "index.js",
"type": "module",
"exports": {
".": {
"import": "./index.js",
"types": "./index.d.ts"
}
},
"files": [
"index.js",
"index.d.ts",
"src/",
"README.md",
"LICENSE"
],
"scripts": {
"dev": "node example.js",
"test": "echo \"Error: no test specified\" && exit 1"
},
"keywords": [
"tts",
"text-to-speech",
"stt",
"speech-to-text",
"transcription",
"audio",
"openai",
"gemini",
"deepgram",
"assemblyai",
"groq",
"playai",
"cartesia",
"voice",
"speech-synthesis",
"speech-recognition",
"ai",
"audio-processing"
],
"author": "Akshay Kambli (https://github.com/ARK018)",
"license": "ISC",
"dependencies": {
"@cartesia/cartesia-js": "^2.2.4",
"@deepgram/sdk": "^4.2.0",
"@google/genai": "^1.4.0",
"assemblyai": "^4.13.3",
"ffmpeg-static": "^5.2.0",
"fluent-ffmpeg": "^2.1.3",
"groq-sdk": "^0.25.0",
"openai": "^5.1.1",
"wav": "^1.0.2"
},
"devDependencies": {
"dotenv": "^16.5.0"
}
}