-
Notifications
You must be signed in to change notification settings - Fork 493
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[DOW-101] LiveKit integration (#591)
* checkpoint * livekit v0 * in progress changes * integrate with worker * fix import * update deps and remove unneeded files * integrate it properly into app * fix interrupts * make transcript publish work * a confounding fix * isort * constants, some cleanup --------- Co-authored-by: Kian <[email protected]>
- Loading branch information
Showing
14 changed files
with
3,854 additions
and
303 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,3 @@ | ||
``` | ||
poetry run python app.py dev | ||
``` |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,107 @@ | ||
import asyncio | ||
import os | ||
|
||
from livekit.agents import JobContext, JobRequest, WorkerOptions, cli | ||
from loguru import logger | ||
from pydantic_settings import BaseSettings, SettingsConfigDict | ||
|
||
from vocode.logging import configure_pretty_logging | ||
from vocode.streaming.action.end_conversation import EndConversationVocodeActionConfig | ||
from vocode.streaming.agent.chat_gpt_agent import ChatGPTAgent | ||
from vocode.streaming.livekit.livekit_conversation import LiveKitConversation | ||
from vocode.streaming.models.actions import ( | ||
PhraseBasedActionTrigger, | ||
PhraseBasedActionTriggerConfig, | ||
PhraseTrigger, | ||
) | ||
from vocode.streaming.models.agent import ChatGPTAgentConfig | ||
from vocode.streaming.models.message import BaseMessage | ||
from vocode.streaming.models.synthesizer import AzureSynthesizerConfig | ||
from vocode.streaming.models.transcriber import ( | ||
DeepgramTranscriberConfig, | ||
PunctuationEndpointingConfig, | ||
) | ||
from vocode.streaming.output_device.livekit_output_device import LiveKitOutputDevice | ||
from vocode.streaming.synthesizer.azure_synthesizer import AzureSynthesizer | ||
from vocode.streaming.transcriber.deepgram_transcriber import DeepgramTranscriber | ||
|
||
|
||
class Settings(BaseSettings): | ||
|
||
livekit_api_key: str = "ENTER_YOUR_LIVE_KIT_API_KEY" | ||
livekit_api_secret: str = "ENTER_YOUR_LIVE_KIT_API_SECRET" | ||
livekit_ws_url: str = "ENTER_YOUR_LIVE_KIT_WS_URL" | ||
|
||
# This means a .env file can be used to overload these settings | ||
# ex: "OPENAI_API_KEY=my_key" will set openai_api_key over the default above | ||
model_config = SettingsConfigDict( | ||
env_file=".env", | ||
env_file_encoding="utf-8", | ||
extra="ignore", | ||
) | ||
|
||
|
||
async def wait_for_termination(conversation: LiveKitConversation, ctx: JobContext): | ||
await conversation.wait_for_termination() | ||
await conversation.terminate() | ||
await ctx.room.disconnect() | ||
|
||
|
||
async def entrypoint(ctx: JobContext): | ||
configure_pretty_logging() | ||
output_device = LiveKitOutputDevice() | ||
conversation = LiveKitConversation( | ||
output_device=output_device, | ||
transcriber=DeepgramTranscriber( | ||
DeepgramTranscriberConfig.from_livekit_input_device( | ||
endpointing_config=PunctuationEndpointingConfig(), | ||
api_key=os.getenv("DEEPGRAM_API_KEY"), | ||
), | ||
), | ||
agent=ChatGPTAgent( | ||
ChatGPTAgentConfig( | ||
openai_api_key=os.getenv("OPENAI_API_KEY"), | ||
initial_message=BaseMessage(text="What up"), | ||
prompt_preamble="""The AI is having a pleasant conversation about life""", | ||
actions=[ | ||
EndConversationVocodeActionConfig( | ||
action_trigger=PhraseBasedActionTrigger( | ||
config=PhraseBasedActionTriggerConfig( | ||
phrase_triggers=[ | ||
PhraseTrigger( | ||
phrase="goodbye", | ||
conditions=["phrase_condition_type_contains"], | ||
) | ||
] | ||
) | ||
) | ||
) | ||
], | ||
) | ||
), | ||
synthesizer=AzureSynthesizer( | ||
synthesizer_config=AzureSynthesizerConfig.from_output_device( | ||
output_device=output_device, | ||
voice_name="en-US-AriaNeural", | ||
) | ||
), | ||
) | ||
await conversation.start_room(ctx.room) | ||
asyncio.create_task(wait_for_termination(conversation, ctx)) | ||
|
||
|
||
async def request_fnc(req: JobRequest) -> None: | ||
logger.info("received request %s", req) | ||
await req.accept(entrypoint) | ||
|
||
|
||
if __name__ == "__main__": | ||
settings = Settings() | ||
cli.run_app( | ||
WorkerOptions( | ||
request_fnc, | ||
api_key=settings.livekit_api_key, | ||
api_secret=settings.livekit_api_secret, | ||
ws_url=settings.livekit_ws_url, | ||
) | ||
) |
Large diffs are not rendered by default.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,19 @@ | ||
[tool.poetry] | ||
name = "livekit_app" | ||
version = "0.1.0" | ||
description = "" | ||
authors = ["Your Name <[email protected]>"] | ||
readme = "README.md" | ||
package-mode = false | ||
|
||
[tool.poetry.dependencies] | ||
python = "^3.11" | ||
livekit = "^0.11.1" | ||
livekit-api = "^0.5.0" | ||
vocode = { path = "../..", develop = true } | ||
livekit-agents = "^0.7.2" | ||
|
||
|
||
[build-system] | ||
requires = ["poetry-core"] | ||
build-backend = "poetry.core.masonry.api" |
Oops, something went wrong.