Skip to content

Commit

Permalink
Migrate TTS/ASR to @Davi-ai fork; Support visemes (#7)
Browse files Browse the repository at this point in the history
* This change switches the TTS ponyfill to the @Davi-ai fork. The reasons for creating the fork are given here: compulim/web-speech-cognitive-services#173 (comment)

* The @Davi-ai fork was modified to adjust typing and ASR final results; additionally, excessive logging was removed.

* This change enables sending VISEME events inside SpeechState to control external avatars. For now, the VISEME events get transformed into a stream of FURHAT_BLENDSHAPES events, which control Furhat lipsync.

* Extensive test coverage for ASR and TTS (including streaming). To test streaming, one needs to run the SSE server (`test/server.js`).
  • Loading branch information
vladmaraev committed Oct 24, 2024
1 parent 0fee799 commit 48781a4
Show file tree
Hide file tree
Showing 15 changed files with 5,627 additions and 2,400 deletions.

Large diffs are not rendered by default.

35 changes: 27 additions & 8 deletions package.json
Original file line number Diff line number Diff line change
@@ -1,27 +1,37 @@
{
"name": "speechstate",
"version": "2.6.0",
"version": "2.7.0",
"license": "GPL-3.0",
"type": "module",
"homepage": "http://localhost/speechstate",
"main": "./dist/index.js",
"types": "./dist/index.d.ts",
"files": ["/dist"],
"files": [
"/dist"
],
"dependencies": {
"microsoft-cognitiveservices-speech-sdk": "^1.31.0",
"web-speech-cognitive-services": "^7.1.3",
"@vladmaraev/web-speech-cognitive-services-davi": "^2.0.16",
"xstate": "^5.17.4"
},
"scripts": {
"dev": "vite",
"compile": "tsc",
"test": "vitest",
"test:browser": "vitest"
"test:browser": "vitest",
"sse": "node test/server"
},
"eslintConfig": {
"extends": ["react-app", "react-app/jest"]
"extends": [
"react-app",
"react-app/jest"
]
},
"browserslist": {
"production": [">0.2%", "not dead", "not op_mini all"],
"production": [
">0.2%",
"not dead",
"not op_mini all"
],
"development": [
"last 1 chrome version",
"last 1 firefox version",
Expand All @@ -35,6 +45,8 @@
"@types/webspeechapi": "^0.0.29",
"@vitest/browser": "^2.0.5",
"buffer": "^5.5.0||^6.0.0",
"cors": "^2.8.5",
"express": "^4.19.2",
"jest": "^29.5.0",
"jest-environment-jsdom": "^29.5.0",
"ts-jest": "^29.1.0",
Expand All @@ -44,7 +56,11 @@
"webdriverio": "^9.0.7",
"ws": "^8.16.0"
},
"trustedDependencies": ["p-defer-es5", "edgedriver", "core-js-pure"],
"trustedDependencies": [
"p-defer-es5",
"edgedriver",
"core-js-pure"
],
"packageManager": "[email protected]",
"description": "* SDK",
"directories": {
Expand All @@ -58,5 +74,8 @@
"author": "Vlad Maraev",
"bugs": {
"url": "https://github.com/vladmaraev/speechstate/issues"
},
"resolutions": {
"@davi-ai/web-speech-cognitive-services-davi@^2.0.8": "patch:@davi-ai/web-speech-cognitive-services-davi@npm%3A2.0.8#./.yarn/patches/@davi-ai-web-speech-cognitive-services-davi-npm-2.0.8-c22c46cebd.patch"
}
}
Loading

0 comments on commit 48781a4

Please sign in to comment.