|
6 | 6 |
|
7 | 7 | """Gemini Travel Companion |
8 | 8 |
|
9 | | -This module implements a chatbot using Google's Gemini Multimodal Live model. |
| 9 | +This module implements a chatbot using Google's Gemini Live model. |
10 | 10 | It includes: |
11 | 11 | - Real-time audio interaction through Daily |
12 | 12 | - Function calling |
|
32 | 32 | from pipecat.processors.frameworks.rtvi import RTVIConfig, RTVIObserver, RTVIProcessor |
33 | 33 | from pipecat.runner.types import RunnerArguments |
34 | 34 | from pipecat.runner.utils import create_transport |
35 | | -from pipecat.services.gemini_multimodal_live.gemini import GeminiMultimodalLiveLLMService |
| 35 | +from pipecat.services.google.gemini_live.llm import GeminiLiveLLMService |
36 | 36 | from pipecat.transports.base_transport import BaseTransport, TransportParams |
37 | 37 | from pipecat.transports.daily.transport import DailyParams |
38 | 38 |
|
|
47 | 47 | audio_out_enabled=True, |
48 | 48 | video_in_enabled=True, |
49 | 49 | # set stop_secs to something roughly similar to the internal setting |
50 | | - # of the Multimodal Live api, just to align events. This doesn't really |
51 | | - # matter because we can only use the Multimodal Live API's phrase |
| 50 | + # of the Gemini Live API, just to align events. This doesn't really |
| 51 | + # matter because we can only use the Gemini Live API's phrase |
52 | 52 | # endpointing, for now. |
53 | 53 | vad_analyzer=SileroVADAnalyzer(params=VADParams(stop_secs=0.5)), |
54 | 54 | ), |
55 | 55 | } |
56 | 56 |
|
57 | | -# Search tool can only be used together with other tools when using the Multimodal Live API |
| 57 | +# The search tool can only be combined with other tools when using the Gemini Live API. |
58 | 58 | # Otherwise, it should be used alone. |
59 | 59 | # We register the tools here, but the RTVI client is what actually handles them |
60 | 60 | get_location_function = FunctionSchema( |
@@ -113,14 +113,14 @@ async def run_bot(transport: BaseTransport, runner_args: RunnerArguments): |
113 | 113 | """Main bot execution function. |
114 | 114 |
|
115 | 115 | Sets up and runs the bot pipeline including: |
116 | | - - Gemini Live multimodal model integration |
| 116 | + - Gemini Live model integration |
117 | 117 | - Voice activity detection |
118 | 118 | - Animation processing |
119 | 119 | - RTVI event handling |
120 | 120 | """ |
121 | 121 |
|
122 | | - # Initialize the Gemini Multimodal Live model |
123 | | - llm = GeminiMultimodalLiveLLMService( |
| 122 | + # Initialize the Gemini Live model |
| 123 | + llm = GeminiLiveLLMService( |
124 | 124 | api_key=os.getenv("GOOGLE_API_KEY"), |
125 | 125 | voice_id="Puck", # Aoede, Charon, Fenrir, Kore, Puck |
126 | 126 | system_instruction=system_instruction, |
|
0 commit comments