update libs

Picovoice · bejager · May 10, 2024 · Apr 9, 2024 · Apr 9, 2024 · Apr 9, 2024
commit 9126b618c3e756be02f8e0eca04605e06f261748
diff --git a/binding/python/_orca.py b/binding/python/_orca.py
@@ -141,16 +141,31 @@ class COrcaStream(Structure):
 
     class Stream:
         """
-        TODO
+        Orca Stream object that converts a stream of text into a stream of audio.
         """
+
         def __init__(self, handle: POINTER('Orca.COrcaStream'), orca: 'Orca') -> None:
             self._handle = handle
             self._orca = orca
 
         def synthesize(self, text: str) -> Optional[Sequence[int]]:
             """
-            TODO
+            Adds a chunk of text to the OrcaStream object and generates audio if enough text has been added.
+            This function is expected to be called multiple times with consecutive chunks of text from a text stream.
+            The incoming text is buffered as it arrives until the length is long enough to convert a chunk of the
+            buffered text into audio. The caller needs to use `flush()` to generate the audio chunk
+            for the remaining text that has not yet been synthesized.
+            The caller is responsible for deleting the generated audio with `pv_orca_pcm_delete()`.
+
+            :param text: A chunk of text from a text input stream, comprised of valid characters.
+            Valid characters can be retrieved by calling `pv_orca_valid_characters()`.
+            Custom pronunciations can be embedded in the text via the syntax `{word|pronunciation}`.
+            They need to be added in a single call to this function.
+            The pronunciation is expressed in ARPAbet format, e.g.: `I {liv|L IH V} in {Sevilla|S EH V IY Y AH}`.
+            :return: The generated audio as a sequence of 16-bit linearly-encoded integers, `None` if no
+            audio chunk has been produced.
             """
+
             c_num_samples = c_int32()
             c_pcm = POINTER(c_int16)()
 
@@ -172,8 +187,14 @@ def synthesize(self, text: str) -> Optional[Sequence[int]]:
 
         def flush(self) -> Optional[Sequence[int]]:
             """
-            TODO
+            Generates audio for all the buffered text that was added to the OrcaStream object
+            via `synthesize()`.
+            The caller is responsible for deleting the generated audio with `pv_orca_pcm_delete()`.
+
+            :return: The generated audio as a sequence of 16-bit linearly-encoded integers, `None` if no
+            audio chunk has been produced.
             """
+
             c_num_samples = c_int32()
             c_pcm = POINTER(c_int16)()
 
@@ -194,8 +215,9 @@ def flush(self) -> Optional[Sequence[int]]:
 
         def close(self) -> None:
             """
-            TODO
+            Releases the resources acquired by the OrcaStream object.
             """
+
             self._orca._stream_close_func(self._handle)
 
     def __init__(self, access_key: str, model_path: str, library_path: str) -> None:
@@ -555,7 +577,7 @@ def synthesize_to_file(
 
     def open_stream(self, speech_rate: Optional[float] = None, random_state: Optional[int] = None) -> 'Orca.Stream':
         """
-        Opens a stream for streaming synthesis.
+        Opens a stream for streaming text synthesis.
 
         :param speech_rate: Rate of speech of the generated audio.
         :param random_state: Random seed for the synthesis process.

diff --git a/demo/python/demo_util.py b/demo/python/demo_util.py
@@ -89,25 +89,33 @@ class LLM:
     Keep the conversation flowing. 
     Ask relevant follow-up questions. 
     """
+    DEFAULT_USER_PROMPT = "Your prompt: "
+    DEFAULT_ASSISTANT_PROMPT = "Assistant: "
 
     def __init__(
             self,
             synthesize_text_callback: Optional[Callable[[str], None]],
+            user_prompt: Optional[str] = None,
+            assistant_prompt: Optional[str] = None,
     ) -> None:
         self._synthesize_text_callback = synthesize_text_callback
 
+        self._user_prompt = user_prompt if user_prompt is not None else self.DEFAULT_USER_PROMPT
+        self._assistant_prompt = assistant_prompt if assistant_prompt is not None else self.DEFAULT_ASSISTANT_PROMPT
+
     def chat(self, user_input: str) -> Generator[str, None, None]:
+        print(self._assistant_prompt, end="")
         for token in self._chat(user_input=user_input):
             if token is not None and self._synthesize_text_callback is not None:
-                    self._synthesize_text_callback(token)
+                self._synthesize_text_callback(token)
             yield token
 
     def _chat(self, user_input: str) -> Generator[str, None, None]:
         raise NotImplementedError(
             f"Method `chat_stream` must be implemented in a subclass of {self.__class__.__name__}")
 
-    def user_prompt(self, user_prompt: str) -> str:
-        return input(user_prompt)
+    def get_user_input(self) -> str:
+        return input(self._user_prompt)
 
     @classmethod
     def create(cls, llm_type: LLMs, **kwargs) -> 'LLM':
@@ -123,10 +131,11 @@ def create(cls, llm_type: LLMs, **kwargs) -> 'LLM':
 
 
 class DummyLLM(LLM):
-    USER_PROMPT = "Press ENTER to generate a demo LLM response"
+    USER_PROMPT = "Press ENTER to generate a demo LLM response\n"
+    ASSISTANT_PROMPT = ""
 
     def __init__(self, tokens_per_second: int = 8, **kwargs: Any) -> None:
-        super().__init__(user_prompt=self.USER_PROMPT, **kwargs)
+        super().__init__(user_prompt=self.USER_PROMPT, assistant_prompt=self.ASSISTANT_PROMPT, **kwargs)
 
         self._encoder = tiktoken.encoding_for_model("gpt-4")
         self._tokens_delay = 1 / tokens_per_second
@@ -153,6 +162,7 @@ def _chat(self, user_input: str) -> Generator[str, None, None]:
 
 class OpenAILLM(LLM):
     MODEL_NAME = "gpt-3.5-turbo"
+
     def __init__(
             self,
             access_key: str,

diff --git a/demo/python/streaming_orca_demo.py b/demo/python/streaming_orca_demo.py
@@ -14,9 +14,6 @@
 
 from demo_util import *
 
-USER_PROMPT = "Your prompt:\n"
-ASSISTANT_PROMPT = "Assistant:"
-
 
 def get_llm_init_kwargs(args: argparse.Namespace) -> dict:
     kwargs = dict()
@@ -76,32 +73,32 @@ def main(args: argparse.Namespace) -> None:
     llm_init_kwargs = get_llm_init_kwargs(args)
     llm = LLM.create(
         llm_type, 
-        synthesize_text_callback=synthesize_text_callback, 
+        synthesize_text_callback=synthesize_text_callback,
         **llm_init_kwargs)
 
     print("PICOVOICE ORCA STREAMING TTS DEMO")
     print("This demo let's you chat with an LLM. The response is read out loud by a TTS system. Press Ctrl+C to exit.\n")
 
     try:
         while True:
-            text = llm.user_prompt(user_prompt=USER_PROMPT)        
+            text = llm.get_user_input()
             generator = llm.chat(user_input=text)
 
             llm_message = ""
             num_tokens = 0
 
-            print(ASSISTANT_PROMPT)
             while True:
                 try:
                     if timestamps.time_llm_request < 0:
                         timestamps.time_llm_request = time.time()
                     token = next(generator)  # TODO: change to standard loop 
 
-                    if token is not None:
-                        print(token, end="", flush=True)
                     if timestamps.time_first_llm_token < 0:
                         timestamps.time_first_llm_token = time.time()
 
+                    if token is not None:
+                        print(token, end="", flush=True)
+
                     if token is not None:
                         llm_message += token
                 except StopIteration:

diff --git a/lib/android/arm64-v8a/libpv_orca.so b/lib/android/arm64-v8a/libpv_orca.so
diff --git a/lib/android/armeabi-v7a/libpv_orca.so b/lib/android/armeabi-v7a/libpv_orca.so
diff --git a/lib/android/x86/libpv_orca.so b/lib/android/x86/libpv_orca.so
diff --git a/lib/android/x86_64/libpv_orca.so b/lib/android/x86_64/libpv_orca.so
diff --git a/lib/ios/PvOrca.xcframework/ios-arm64/PvOrca.framework/PvOrca b/lib/ios/PvOrca.xcframework/ios-arm64/PvOrca.framework/PvOrca
diff --git a/lib/ios/PvOrca.xcframework/ios-arm64_x86_64-simulator/PvOrca.framework/PvOrca b/lib/ios/PvOrca.xcframework/ios-arm64_x86_64-simulator/PvOrca.framework/PvOrca
diff --git a/lib/java/jetson/cortex-a57-aarch64/libpv_orca_jni.so b/lib/java/jetson/cortex-a57-aarch64/libpv_orca_jni.so
diff --git a/lib/java/linux/x86_64/libpv_orca_jni.so b/lib/java/linux/x86_64/libpv_orca_jni.so
diff --git a/lib/java/mac/arm64/libpv_orca_jni.dylib b/lib/java/mac/arm64/libpv_orca_jni.dylib
diff --git a/lib/java/mac/x86_64/libpv_orca_jni.dylib b/lib/java/mac/x86_64/libpv_orca_jni.dylib
diff --git a/lib/java/raspberry-pi/cortex-a53-aarch64/libpv_orca_jni.so b/lib/java/raspberry-pi/cortex-a53-aarch64/libpv_orca_jni.so
diff --git a/lib/java/raspberry-pi/cortex-a53/libpv_orca_jni.so b/lib/java/raspberry-pi/cortex-a53/libpv_orca_jni.so
diff --git a/lib/java/raspberry-pi/cortex-a72-aarch64/libpv_orca_jni.so b/lib/java/raspberry-pi/cortex-a72-aarch64/libpv_orca_jni.so
diff --git a/lib/java/raspberry-pi/cortex-a72/libpv_orca_jni.so b/lib/java/raspberry-pi/cortex-a72/libpv_orca_jni.so
diff --git a/lib/java/raspberry-pi/cortex-a76-aarch64/libpv_orca_jni.so b/lib/java/raspberry-pi/cortex-a76-aarch64/libpv_orca_jni.so
diff --git a/lib/java/raspberry-pi/cortex-a76/libpv_orca_jni.so b/lib/java/raspberry-pi/cortex-a76/libpv_orca_jni.so
diff --git a/lib/java/windows/amd64/pv_orca_jni.dll b/lib/java/windows/amd64/pv_orca_jni.dll
diff --git a/lib/jetson/cortex-a57-aarch64/libpv_orca.so b/lib/jetson/cortex-a57-aarch64/libpv_orca.so
diff --git a/lib/linux/x86_64/libpv_orca.so b/lib/linux/x86_64/libpv_orca.so
diff --git a/lib/raspberry-pi/cortex-a53-aarch64/libpv_orca.so b/lib/raspberry-pi/cortex-a53-aarch64/libpv_orca.so
diff --git a/lib/raspberry-pi/cortex-a53/libpv_orca.so b/lib/raspberry-pi/cortex-a53/libpv_orca.so
diff --git a/lib/raspberry-pi/cortex-a72-aarch64/libpv_orca.so b/lib/raspberry-pi/cortex-a72-aarch64/libpv_orca.so
diff --git a/lib/raspberry-pi/cortex-a72/libpv_orca.so b/lib/raspberry-pi/cortex-a72/libpv_orca.so
diff --git a/lib/raspberry-pi/cortex-a76-aarch64/libpv_orca.so b/lib/raspberry-pi/cortex-a76-aarch64/libpv_orca.so
diff --git a/lib/raspberry-pi/cortex-a76/libpv_orca.so b/lib/raspberry-pi/cortex-a76/libpv_orca.so
diff --git a/lib/wasm/pv_orca.wasm b/lib/wasm/pv_orca.wasm
diff --git a/lib/wasm/pv_orca_simd.wasm b/lib/wasm/pv_orca_simd.wasm
diff --git a/lib/windows/amd64/libpv_orca.dll b/lib/windows/amd64/libpv_orca.dll