From 65237962b87064fa8d57bccae52139e1d8dbdde6 Mon Sep 17 00:00:00 2001
From: Guiners <rkoza@softserveinc.com>
Date: Mon, 28 Jul 2025 13:09:30 +0200
Subject: [PATCH 1/7] adding live_txt_with_audio with test

---
 genai/live/live_txt_with_audio.py | 70 +++++++++++++++++++++++++++++++
 genai/live/requirements.txt       |  3 +-
 genai/live/test_live_examples.py  |  6 +++
 3 files changed, 78 insertions(+), 1 deletion(-)
 create mode 100644 genai/live/live_txt_with_audio.py

diff --git a/genai/live/live_txt_with_audio.py b/genai/live/live_txt_with_audio.py
new file mode 100644
index 00000000000..11ca218854e
--- /dev/null
+++ b/genai/live/live_txt_with_audio.py
@@ -0,0 +1,70 @@
+# Copyright 2024 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+
+# Test file: https://storage.googleapis.com/generativeai-downloads/data/16000.wav
+# Install helpers for converting files: pip install librosa soundfile
+
+import asyncio
+
+
+async def generate_content() -> list[str]:
+    # [START googlegenaisdk_live_txt_with_audio]
+    import io
+    import requests
+    from google import genai
+    from google.genai.types import Modality, LiveConnectConfig, Blob
+    import soundfile as sf
+    import librosa
+
+    client = genai.Client()
+    model = "gemini-2.0-flash-live-preview-04-09"
+    config = LiveConnectConfig(response_modalities=[Modality.TEXT])
+
+    async with client.aio.live.connect(model=model, config=config) as session:
+        audio_url = "https://storage.googleapis.com/generativeai-downloads/data/16000.wav"
+        response = requests.get(audio_url)
+        response.raise_for_status()
+        buffer = io.BytesIO(response.content)
+        y, sr = librosa.load(buffer, sr=16000)
+        sf.write(buffer, y, sr, format="RAW", subtype="PCM_16")
+        buffer.seek(0)
+        audio_bytes = buffer.read()
+
+        # If you've pre-converted to sample.pcm using ffmpeg, use this instead:
+        # audio_bytes = Path("sample.pcm").read_bytes()
+
+        print("> Answer to this audio url", audio_url, "\n")
+
+        await session.send_realtime_input(
+            media=Blob(data=audio_bytes, mime_type="audio/pcm;rate=16000")
+        )
+
+        response = []
+
+        async for message in session.receive():
+            if message.text is not None:
+                response.append(message.text)
+
+        print("".join(response))
+    # Example output:
+    # > Answer to this audio url https://storage.googleapis.com/generativeai-downloads/data/16000.wav
+    # Yes, I can hear you. How can I help you today?
+    # [STOP googlegenaisdk_live_txt_with_audio]
+    return response
+
+
+
+if __name__ == "__main__":
+    asyncio.run(generate_content())
\ No newline at end of file
diff --git a/genai/live/requirements.txt b/genai/live/requirements.txt
index c12e6a7e2f7..8fa57b6175c 100644
--- a/genai/live/requirements.txt
+++ b/genai/live/requirements.txt
@@ -1,3 +1,4 @@
 google-genai==1.20.0
 scipy==1.15.3
-websockets==15.0.1
\ No newline at end of file
+websockets==15.0.1
+librosa==0.11.0
\ No newline at end of file
diff --git a/genai/live/test_live_examples.py b/genai/live/test_live_examples.py
index ce382539861..1ce0eeb5bb2 100644
--- a/genai/live/test_live_examples.py
+++ b/genai/live/test_live_examples.py
@@ -25,6 +25,7 @@
 import live_websocket_textgen_with_audio
 import live_websocket_textgen_with_txt
 import live_with_txt
+import live_txt_with_audio
 
 os.environ["GOOGLE_GENAI_USE_VERTEXAI"] = "True"
 os.environ["GOOGLE_CLOUD_LOCATION"] = "us-central1"
@@ -55,3 +56,8 @@ async def test_live_websocket_audiogen_with_txt() -> None:
 @pytest.mark.asyncio
 async def test_live_websocket_audiotranscript_with_txt() -> None:
     assert await live_websocket_audiotranscript_with_txt.generate_content()
+
+
+@pytest.mark.asyncio
+async def test_live_txt_with_audio() -> None:
+    assert await live_txt_with_audio.generate_content()

From 9b400a31e9741b6bd5eab1a36d7797ecd712caac Mon Sep 17 00:00:00 2001
From: Guiners <rkoza@softserveinc.com>
Date: Mon, 28 Jul 2025 14:38:57 +0200
Subject: [PATCH 2/7] adding live_audio_with_txt with test

---
 genai/live/live_audio_with_txt.py | 87 +++++++++++++++++++++++++++++++
 genai/live/requirements.txt       |  3 +-
 genai/live/test_live_examples.py  |  7 +++
 3 files changed, 96 insertions(+), 1 deletion(-)
 create mode 100644 genai/live/live_audio_with_txt.py

diff --git a/genai/live/live_audio_with_txt.py b/genai/live/live_audio_with_txt.py
new file mode 100644
index 00000000000..f12eaab447d
--- /dev/null
+++ b/genai/live/live_audio_with_txt.py
@@ -0,0 +1,87 @@
+# Copyright 2024 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+
+# Test file: https://storage.googleapis.com/generativeai-downloads/data/16000.wav
+# Install helpers for converting files: pip install librosa soundfile
+
+import asyncio
+
+
+async def generate_content() -> list[str]:
+    # [START googlegenaisdk_live_audio_with_txt]
+    import numpy as np
+    from IPython.display import Audio, Markdown, display
+    from google import genai
+    from google.genai.types import (
+        Content,
+        LiveConnectConfig,
+        Modality,
+        Part,
+        SpeechConfig,
+        VoiceConfig,
+        PrebuiltVoiceConfig,
+    )
+
+    client = genai.Client()
+    voice_name = "Aoede"
+
+    config = LiveConnectConfig(
+        response_modalities=[Modality.AUDIO],
+        speech_config=SpeechConfig(
+            voice_config=VoiceConfig(
+                prebuilt_voice_config=PrebuiltVoiceConfig(
+                    voice_name=voice_name,
+                )
+            ),
+        ),
+    )
+    model = "gemini-2.0-flash-live-preview-04-09"
+
+    async with client.aio.live.connect(
+            model=model,
+            config=config,
+    ) as session:
+        text_input = "Hello? Gemini are you there?"
+        print("> ", text_input, "\n")
+
+        await session.send_client_content(
+            turns=Content(role="user", parts=[Part(text=text_input)]))
+
+        audio_data = []
+        async for message in session.receive():
+            if (
+                    message.server_content.model_turn
+                    and message.server_content.model_turn.parts
+            ):
+                for part in message.server_content.model_turn.parts:
+                    if part.inline_data:
+                        audio_data.append(
+                            np.frombuffer(part.inline_data.data, dtype=np.int16)
+                        )
+
+        if audio_data:
+            print("Received audio answer:")
+            display(Audio(np.concatenate(audio_data), rate=24000, autoplay=True))
+
+    # Example output:
+    # >  Hello? Gemini are you there?
+    # Received audio answer:
+    # <IPython.lib.display.Audio object>
+    # [STOP googlegenaisdk_live_audio_with_txt]
+    return []
+
+
+if __name__ == "__main__":
+    asyncio.run(generate_content())
\ No newline at end of file
diff --git a/genai/live/requirements.txt b/genai/live/requirements.txt
index 8fa57b6175c..0c3280258af 100644
--- a/genai/live/requirements.txt
+++ b/genai/live/requirements.txt
@@ -1,4 +1,5 @@
 google-genai==1.20.0
 scipy==1.15.3
 websockets==15.0.1
-librosa==0.11.0
\ No newline at end of file
+librosa==0.11.0
+IPython==8.26.0
diff --git a/genai/live/test_live_examples.py b/genai/live/test_live_examples.py
index 1ce0eeb5bb2..372f84341d7 100644
--- a/genai/live/test_live_examples.py
+++ b/genai/live/test_live_examples.py
@@ -26,6 +26,7 @@
 import live_websocket_textgen_with_txt
 import live_with_txt
 import live_txt_with_audio
+import live_audio_with_txt
 
 os.environ["GOOGLE_GENAI_USE_VERTEXAI"] = "True"
 os.environ["GOOGLE_CLOUD_LOCATION"] = "us-central1"
@@ -61,3 +62,9 @@ async def test_live_websocket_audiotranscript_with_txt() -> None:
 @pytest.mark.asyncio
 async def test_live_txt_with_audio() -> None:
     assert await live_txt_with_audio.generate_content()
+
+
+@pytest.mark.asyncio
+async def test_live_audio_with_txt() -> None:
+    result = await live_audio_with_txt.generate_content()
+    assert result is not None

From 973f133bc6d48a03caa4601ad7bbf3141ac93b29 Mon Sep 17 00:00:00 2001
From: Guiners <rkoza@softserveinc.com>
Date: Mon, 28 Jul 2025 14:40:26 +0200
Subject: [PATCH 3/7] adding live_audio_with_txt with test

---
 genai/live/live_audio_with_txt.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/genai/live/live_audio_with_txt.py b/genai/live/live_audio_with_txt.py
index f12eaab447d..27e9a90ea6e 100644
--- a/genai/live/live_audio_with_txt.py
+++ b/genai/live/live_audio_with_txt.py
@@ -72,7 +72,7 @@ async def generate_content() -> list[str]:
                         )
 
         if audio_data:
-            print("Received audio answer:")
+            print("Received audio answer: ")
             display(Audio(np.concatenate(audio_data), rate=24000, autoplay=True))
 
     # Example output:

From 4858df193c231e882851bc1653b14399bda25dc0 Mon Sep 17 00:00:00 2001
From: Guiners <rkoza@softserveinc.com>
Date: Mon, 28 Jul 2025 15:06:03 +0200
Subject: [PATCH 4/7] adding live_transcribe_with_audio with test

---
 genai/live/live_audio_with_txt.py             | 15 +++--
 genai/live/live_transcribe_with_audio.py      | 66 +++++++++++++++++++
 genai/live/live_txt_with_audio.py             |  7 +-
 .../live/live_websocket_audiogen_with_txt.py  | 28 ++++----
 ...live_websocket_audiotranscript_with_txt.py | 24 ++++---
 .../live/live_websocket_textgen_with_audio.py | 24 ++++---
 genai/live/live_websocket_textgen_with_txt.py | 20 +++---
 genai/live/live_with_txt.py                   |  4 +-
 genai/live/test_live_examples.py              |  7 ++
 9 files changed, 144 insertions(+), 51 deletions(-)
 create mode 100644 genai/live/live_transcribe_with_audio.py

diff --git a/genai/live/live_audio_with_txt.py b/genai/live/live_audio_with_txt.py
index 27e9a90ea6e..f7b0954bec5 100644
--- a/genai/live/live_audio_with_txt.py
+++ b/genai/live/live_audio_with_txt.py
@@ -36,6 +36,7 @@ async def generate_content() -> list[str]:
 
     client = genai.Client()
     voice_name = "Aoede"
+    model = "gemini-2.0-flash-live-preview-04-09"
 
     config = LiveConnectConfig(
         response_modalities=[Modality.AUDIO],
@@ -47,23 +48,23 @@ async def generate_content() -> list[str]:
             ),
         ),
     )
-    model = "gemini-2.0-flash-live-preview-04-09"
 
     async with client.aio.live.connect(
-            model=model,
-            config=config,
+        model=model,
+        config=config,
     ) as session:
         text_input = "Hello? Gemini are you there?"
         print("> ", text_input, "\n")
 
         await session.send_client_content(
-            turns=Content(role="user", parts=[Part(text=text_input)]))
+            turns=Content(role="user", parts=[Part(text=text_input)])
+        )
 
         audio_data = []
         async for message in session.receive():
             if (
-                    message.server_content.model_turn
-                    and message.server_content.model_turn.parts
+                message.server_content.model_turn
+                and message.server_content.model_turn.parts
             ):
                 for part in message.server_content.model_turn.parts:
                     if part.inline_data:
@@ -84,4 +85,4 @@ async def generate_content() -> list[str]:
 
 
 if __name__ == "__main__":
-    asyncio.run(generate_content())
\ No newline at end of file
+    asyncio.run(generate_content())
diff --git a/genai/live/live_transcribe_with_audio.py b/genai/live/live_transcribe_with_audio.py
new file mode 100644
index 00000000000..201c8c4ba3f
--- /dev/null
+++ b/genai/live/live_transcribe_with_audio.py
@@ -0,0 +1,66 @@
+# Copyright 2024 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+
+# Test file: https://storage.googleapis.com/generativeai-downloads/data/16000.wav
+# Install helpers for converting files: pip install librosa soundfile
+
+import asyncio
+
+
+async def generate_content():
+    # [START googlegenaisdk_live_transcribe_with_audio]
+    from google import genai
+    from google.genai.types import (
+        LiveConnectConfig,
+        Modality,
+        AudioTranscriptionConfig,
+        Part,
+        Content,
+    )
+
+    client = genai.Client()
+    model = "gemini-2.0-flash-live-preview-04-09"
+    config = LiveConnectConfig(
+        response_modalities=[Modality.AUDIO],
+        input_audio_transcription=AudioTranscriptionConfig(),
+        output_audio_transcription=AudioTranscriptionConfig(),
+    )
+
+    async with client.aio.live.connect(model=model, config=config) as session:
+        input_txt = "Hello? Gemini are you there?"
+        print("> ", input_txt, "\n")
+
+        await session.send_client_content(
+            turns=Content(role="user", parts=[Part(text=input_txt)]), turn_complete=True
+        )
+
+        response = []
+
+        async for message in session.receive():
+            if message.server_content.output_transcription:
+                if message.server_content.output_transcription.text is not None:
+                    response.append(message.server_content.output_transcription.text)
+
+        print("".join(response))
+
+    # Example output:
+    # >  Hello? Gemini are you there?
+    # Yes, I'm here. What would you like to talk about?
+    # [STOP googlegenaisdk_live_transcribe_with_audio]
+    return response
+
+
+if __name__ == "__main__":
+    asyncio.run(generate_content())
diff --git a/genai/live/live_txt_with_audio.py b/genai/live/live_txt_with_audio.py
index 11ca218854e..d27fca65999 100644
--- a/genai/live/live_txt_with_audio.py
+++ b/genai/live/live_txt_with_audio.py
@@ -33,7 +33,9 @@ async def generate_content() -> list[str]:
     config = LiveConnectConfig(response_modalities=[Modality.TEXT])
 
     async with client.aio.live.connect(model=model, config=config) as session:
-        audio_url = "https://storage.googleapis.com/generativeai-downloads/data/16000.wav"
+        audio_url = (
+            "https://storage.googleapis.com/generativeai-downloads/data/16000.wav"
+        )
         response = requests.get(audio_url)
         response.raise_for_status()
         buffer = io.BytesIO(response.content)
@@ -65,6 +67,5 @@ async def generate_content() -> list[str]:
     return response
 
 
-
 if __name__ == "__main__":
-    asyncio.run(generate_content())
\ No newline at end of file
+    asyncio.run(generate_content())
diff --git a/genai/live/live_websocket_audiogen_with_txt.py b/genai/live/live_websocket_audiogen_with_txt.py
index f7b6f07e5f8..277d4d5f8ba 100644
--- a/genai/live/live_websocket_audiogen_with_txt.py
+++ b/genai/live/live_websocket_audiogen_with_txt.py
@@ -20,7 +20,9 @@ def get_bearer_token() -> str:
     import google.auth
     from google.auth.transport.requests import Request
 
-    creds, _ = google.auth.default(scopes=["https://www.googleapis.com/auth/cloud-platform"])
+    creds, _ = google.auth.default(
+        scopes=["https://www.googleapis.com/auth/cloud-platform"]
+    )
     auth_req = Request()
     creds.refresh(auth_req)
     bearer_token = creds.token
@@ -55,9 +57,7 @@ async def generate_content() -> str:
 
     # Websocket Configuration
     WEBSOCKET_HOST = "us-central1-aiplatform.googleapis.com"
-    WEBSOCKET_SERVICE_URL = (
-        f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
-    )
+    WEBSOCKET_SERVICE_URL = f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
 
     # Websocket Authentication
     headers = {
@@ -66,9 +66,7 @@ async def generate_content() -> str:
     }
 
     # Model Configuration
-    model_path = (
-        f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
-    )
+    model_path = f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
     model_generation_config = {
         "response_modalities": ["AUDIO"],
         "speech_config": {
@@ -77,7 +75,9 @@ async def generate_content() -> str:
         },
     }
 
-    async with connect(WEBSOCKET_SERVICE_URL, additional_headers=headers) as websocket_session:
+    async with connect(
+        WEBSOCKET_SERVICE_URL, additional_headers=headers
+    ) as websocket_session:
         # 1. Send setup configuration
         websocket_config = {
             "setup": {
@@ -120,7 +120,9 @@ async def generate_content() -> str:
             server_content = response_chunk.get("serverContent")
             if not server_content:
                 # This might indicate an error or an unexpected message format
-                print(f"Received non-serverContent message or empty content: {response_chunk}")
+                print(
+                    f"Received non-serverContent message or empty content: {response_chunk}"
+                )
                 break
 
             # Collect audio chunks
@@ -129,7 +131,9 @@ async def generate_content() -> str:
                 for part in model_turn["parts"]:
                     if part["inlineData"]["mimeType"] == "audio/pcm":
                         audio_chunk = base64.b64decode(part["inlineData"]["data"])
-                        aggregated_response_parts.append(np.frombuffer(audio_chunk, dtype=np.int16))
+                        aggregated_response_parts.append(
+                            np.frombuffer(audio_chunk, dtype=np.int16)
+                        )
 
             # End of response
             if server_content.get("turnComplete"):
@@ -137,7 +141,9 @@ async def generate_content() -> str:
 
         # Save audio to a file
         if aggregated_response_parts:
-            wavfile.write("output.wav", 24000, np.concatenate(aggregated_response_parts))
+            wavfile.write(
+                "output.wav", 24000, np.concatenate(aggregated_response_parts)
+            )
         # Example response:
         #     Setup Response: {'setupComplete': {}}
         #     Input: Hello? Gemini are you there?
diff --git a/genai/live/live_websocket_audiotranscript_with_txt.py b/genai/live/live_websocket_audiotranscript_with_txt.py
index 5192b81ef17..5304e1914bb 100644
--- a/genai/live/live_websocket_audiotranscript_with_txt.py
+++ b/genai/live/live_websocket_audiotranscript_with_txt.py
@@ -20,7 +20,9 @@ def get_bearer_token() -> str:
     import google.auth
     from google.auth.transport.requests import Request
 
-    creds, _ = google.auth.default(scopes=["https://www.googleapis.com/auth/cloud-platform"])
+    creds, _ = google.auth.default(
+        scopes=["https://www.googleapis.com/auth/cloud-platform"]
+    )
     auth_req = Request()
     creds.refresh(auth_req)
     bearer_token = creds.token
@@ -55,9 +57,7 @@ async def generate_content() -> str:
 
     # Websocket Configuration
     WEBSOCKET_HOST = "us-central1-aiplatform.googleapis.com"
-    WEBSOCKET_SERVICE_URL = (
-        f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
-    )
+    WEBSOCKET_SERVICE_URL = f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
 
     # Websocket Authentication
     headers = {
@@ -66,9 +66,7 @@ async def generate_content() -> str:
     }
 
     # Model Configuration
-    model_path = (
-        f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
-    )
+    model_path = f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
     model_generation_config = {
         "response_modalities": ["AUDIO"],
         "speech_config": {
@@ -77,7 +75,9 @@ async def generate_content() -> str:
         },
     }
 
-    async with connect(WEBSOCKET_SERVICE_URL, additional_headers=headers) as websocket_session:
+    async with connect(
+        WEBSOCKET_SERVICE_URL, additional_headers=headers
+    ) as websocket_session:
         # 1. Send setup configuration
         websocket_config = {
             "setup": {
@@ -125,7 +125,9 @@ async def generate_content() -> str:
             server_content = response_chunk.get("serverContent")
             if not server_content:
                 # This might indicate an error or an unexpected message format
-                print(f"Received non-serverContent message or empty content: {response_chunk}")
+                print(
+                    f"Received non-serverContent message or empty content: {response_chunk}"
+                )
                 break
 
             # Transcriptions
@@ -142,7 +144,9 @@ async def generate_content() -> str:
                 for part in model_turn["parts"]:
                     if part["inlineData"]["mimeType"] == "audio/pcm":
                         audio_chunk = base64.b64decode(part["inlineData"]["data"])
-                        aggregated_response_parts.append(np.frombuffer(audio_chunk, dtype=np.int16))
+                        aggregated_response_parts.append(
+                            np.frombuffer(audio_chunk, dtype=np.int16)
+                        )
 
             # End of response
             if server_content.get("turnComplete"):
diff --git a/genai/live/live_websocket_textgen_with_audio.py b/genai/live/live_websocket_textgen_with_audio.py
index de6fd9d55c3..f91cff35b57 100644
--- a/genai/live/live_websocket_textgen_with_audio.py
+++ b/genai/live/live_websocket_textgen_with_audio.py
@@ -20,7 +20,9 @@ def get_bearer_token() -> str:
     import google.auth
     from google.auth.transport.requests import Request
 
-    creds, _ = google.auth.default(scopes=["https://www.googleapis.com/auth/cloud-platform"])
+    creds, _ = google.auth.default(
+        scopes=["https://www.googleapis.com/auth/cloud-platform"]
+    )
     auth_req = Request()
     creds.refresh(auth_req)
     bearer_token = creds.token
@@ -65,9 +67,7 @@ def read_wavefile(filepath: str) -> tuple[str, str]:
 
     # Websocket Configuration
     WEBSOCKET_HOST = "us-central1-aiplatform.googleapis.com"
-    WEBSOCKET_SERVICE_URL = (
-        f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
-    )
+    WEBSOCKET_SERVICE_URL = f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
 
     # Websocket Authentication
     headers = {
@@ -76,12 +76,12 @@ def read_wavefile(filepath: str) -> tuple[str, str]:
     }
 
     # Model Configuration
-    model_path = (
-        f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
-    )
+    model_path = f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
     model_generation_config = {"response_modalities": ["TEXT"]}
 
-    async with connect(WEBSOCKET_SERVICE_URL, additional_headers=headers) as websocket_session:
+    async with connect(
+        WEBSOCKET_SERVICE_URL, additional_headers=headers
+    ) as websocket_session:
         # 1. Send setup configuration
         websocket_config = {
             "setup": {
@@ -105,7 +105,9 @@ def read_wavefile(filepath: str) -> tuple[str, str]:
             return "Error: WebSocket setup failed."
 
         # 3. Send audio message
-        encoded_audio_message, mime_type = read_wavefile("hello_gemini_are_you_there.wav")
+        encoded_audio_message, mime_type = read_wavefile(
+            "hello_gemini_are_you_there.wav"
+        )
         # Example audio message:  "Hello? Gemini are you there?"
 
         user_message = {
@@ -136,7 +138,9 @@ def read_wavefile(filepath: str) -> tuple[str, str]:
             server_content = response_chunk.get("serverContent")
             if not server_content:
                 # This might indicate an error or an unexpected message format
-                print(f"Received non-serverContent message or empty content: {response_chunk}")
+                print(
+                    f"Received non-serverContent message or empty content: {response_chunk}"
+                )
                 break
 
             # Collect text responses
diff --git a/genai/live/live_websocket_textgen_with_txt.py b/genai/live/live_websocket_textgen_with_txt.py
index b36487cc9a0..f8e88fa0521 100644
--- a/genai/live/live_websocket_textgen_with_txt.py
+++ b/genai/live/live_websocket_textgen_with_txt.py
@@ -20,7 +20,9 @@ def get_bearer_token() -> str:
     import google.auth
     from google.auth.transport.requests import Request
 
-    creds, _ = google.auth.default(scopes=["https://www.googleapis.com/auth/cloud-platform"])
+    creds, _ = google.auth.default(
+        scopes=["https://www.googleapis.com/auth/cloud-platform"]
+    )
     auth_req = Request()
     creds.refresh(auth_req)
     bearer_token = creds.token
@@ -51,9 +53,7 @@ async def generate_content() -> str:
 
     # Websocket Configuration
     WEBSOCKET_HOST = "us-central1-aiplatform.googleapis.com"
-    WEBSOCKET_SERVICE_URL = (
-        f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
-    )
+    WEBSOCKET_SERVICE_URL = f"wss://{WEBSOCKET_HOST}/ws/google.cloud.aiplatform.v1.LlmBidiService/BidiGenerateContent"
 
     # Websocket Authentication
     headers = {
@@ -62,12 +62,12 @@ async def generate_content() -> str:
     }
 
     # Model Configuration
-    model_path = (
-        f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
-    )
+    model_path = f"projects/{PROJECT_ID}/locations/{LOCATION}/publishers/google/models/{GEMINI_MODEL_NAME}"
     model_generation_config = {"response_modalities": ["TEXT"]}
 
-    async with connect(WEBSOCKET_SERVICE_URL, additional_headers=headers) as websocket_session:
+    async with connect(
+        WEBSOCKET_SERVICE_URL, additional_headers=headers
+    ) as websocket_session:
         # 1. Send setup configuration
         websocket_config = {
             "setup": {
@@ -110,7 +110,9 @@ async def generate_content() -> str:
             server_content = response_chunk.get("serverContent")
             if not server_content:
                 # This might indicate an error or an unexpected message format
-                print(f"Received non-serverContent message or empty content: {response_chunk}")
+                print(
+                    f"Received non-serverContent message or empty content: {response_chunk}"
+                )
                 break
 
             # Collect text responses
diff --git a/genai/live/live_with_txt.py b/genai/live/live_with_txt.py
index a3c75188439..fd412af7740 100644
--- a/genai/live/live_with_txt.py
+++ b/genai/live/live_with_txt.py
@@ -35,7 +35,9 @@ async def generate_content() -> list[str]:
     ) as session:
         text_input = "Hello? Gemini, are you there?"
         print("> ", text_input, "\n")
-        await session.send_client_content(turns=Content(role="user", parts=[Part(text=text_input)]))
+        await session.send_client_content(
+            turns=Content(role="user", parts=[Part(text=text_input)])
+        )
 
         response = []
 
diff --git a/genai/live/test_live_examples.py b/genai/live/test_live_examples.py
index 372f84341d7..4f05dc4299d 100644
--- a/genai/live/test_live_examples.py
+++ b/genai/live/test_live_examples.py
@@ -27,6 +27,7 @@
 import live_with_txt
 import live_txt_with_audio
 import live_audio_with_txt
+import live_transcribe_with_audio
 
 os.environ["GOOGLE_GENAI_USE_VERTEXAI"] = "True"
 os.environ["GOOGLE_CLOUD_LOCATION"] = "us-central1"
@@ -68,3 +69,9 @@ async def test_live_txt_with_audio() -> None:
 async def test_live_audio_with_txt() -> None:
     result = await live_audio_with_txt.generate_content()
     assert result is not None
+
+
+@pytest.mark.asyncio
+async def test_live_transcribe_with_audio() -> None:
+    result = await live_transcribe_with_audio.generate_content()
+    assert result is not None

From 359384bdbbd9e2d04829f0a3d1915bf82b8dc5db Mon Sep 17 00:00:00 2001
From: Robert Kozak <50328216+Guiners@users.noreply.github.com>
Date: Mon, 1 Sep 2025 14:24:40 +0200
Subject: [PATCH 5/7] Update genai/live/test_live_examples.py

Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
---
 genai/live/test_live_examples.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/genai/live/test_live_examples.py b/genai/live/test_live_examples.py
index 4f05dc4299d..a05e76f1a40 100644
--- a/genai/live/test_live_examples.py
+++ b/genai/live/test_live_examples.py
@@ -25,8 +25,8 @@
 import live_websocket_textgen_with_audio
 import live_websocket_textgen_with_txt
 import live_with_txt
-import live_txt_with_audio
 import live_audio_with_txt
+import live_txt_with_audio
 import live_transcribe_with_audio
 
 os.environ["GOOGLE_GENAI_USE_VERTEXAI"] = "True"

From 68ae455c6994ae3d879d8ebcb70c2d0393e1bc08 Mon Sep 17 00:00:00 2001
From: Guiners <rkoza@softserveinc.com>
Date: Mon, 1 Sep 2025 14:33:26 +0200
Subject: [PATCH 6/7] codereview fix

---
 genai/live/live_audio_with_txt.py | 2 +-
 genai/live/live_txt_with_audio.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/genai/live/live_audio_with_txt.py b/genai/live/live_audio_with_txt.py
index f7b0954bec5..40a78a64734 100644
--- a/genai/live/live_audio_with_txt.py
+++ b/genai/live/live_audio_with_txt.py
@@ -80,7 +80,7 @@ async def generate_content() -> list[str]:
     # >  Hello? Gemini are you there?
     # Received audio answer:
     # <IPython.lib.display.Audio object>
-    # [STOP googlegenaisdk_live_audio_with_txt]
+    # [END googlegenaisdk_live_audio_with_txt]
     return []
 
 
diff --git a/genai/live/live_txt_with_audio.py b/genai/live/live_txt_with_audio.py
index d27fca65999..e6a0e00e19d 100644
--- a/genai/live/live_txt_with_audio.py
+++ b/genai/live/live_txt_with_audio.py
@@ -63,7 +63,7 @@ async def generate_content() -> list[str]:
     # Example output:
     # > Answer to this audio url https://storage.googleapis.com/generativeai-downloads/data/16000.wav
     # Yes, I can hear you. How can I help you today?
-    # [STOP googlegenaisdk_live_txt_with_audio]
+    # [END googlegenaisdk_live_txt_with_audio]
     return response
 
 

From 2585661b4e5b0a112fbbbf579b3b2c0104eaa93b Mon Sep 17 00:00:00 2001
From: Guiners <rkoza@softserveinc.com>
Date: Fri, 5 Sep 2025 10:51:43 +0200
Subject: [PATCH 7/7] codereview fix

---
 genai/live/live_audiogen_with_txt.py          | 12 +++++++++---
 genai/live/live_code_exec_with_txt.py         | 10 ++++++++--
 genai/live/live_func_call_with_txt.py         | 12 +++++++++---
 genai/live/live_ground_googsearch_with_txt.py | 10 ++++++++--
 genai/live/live_structured_ouput_with_txt.py  |  6 ++++--
 genai/live/live_transcribe_with_audio.py      |  9 +++++++--
 genai/live/live_with_txt.py                   |  9 +++++++--
 genai/live/test_live_examples.py              | 10 +++++-----
 8 files changed, 57 insertions(+), 21 deletions(-)

diff --git a/genai/live/live_audiogen_with_txt.py b/genai/live/live_audiogen_with_txt.py
index cf7f24a6fc4..477d4f0d40d 100644
--- a/genai/live/live_audiogen_with_txt.py
+++ b/genai/live/live_audiogen_with_txt.py
@@ -24,9 +24,15 @@ async def generate_content() -> None:
     import numpy as np
     import scipy.io.wavfile as wavfile
     from google import genai
-    from google.genai.types import (Content, LiveConnectConfig, Modality, Part,
-                                    PrebuiltVoiceConfig, SpeechConfig,
-                                    VoiceConfig)
+    from google.genai.types import (
+        Content,
+        LiveConnectConfig,
+        Modality,
+        Part,
+        PrebuiltVoiceConfig,
+        SpeechConfig,
+        VoiceConfig,
+    )
 
     client = genai.Client()
     model = "gemini-2.0-flash-live-preview-04-09"
diff --git a/genai/live/live_code_exec_with_txt.py b/genai/live/live_code_exec_with_txt.py
index 70db7402ee7..6aa1cae7b6d 100644
--- a/genai/live/live_code_exec_with_txt.py
+++ b/genai/live/live_code_exec_with_txt.py
@@ -18,8 +18,14 @@
 async def generate_content() -> list[str]:
     # [START googlegenaisdk_live_code_exec_with_txt]
     from google import genai
-    from google.genai.types import (Content, LiveConnectConfig, Modality, Part,
-                                    Tool, ToolCodeExecution)
+    from google.genai.types import (
+        Content,
+        LiveConnectConfig,
+        Modality,
+        Part,
+        Tool,
+        ToolCodeExecution,
+    )
 
     client = genai.Client()
     model_id = "gemini-2.0-flash-live-preview-04-09"
diff --git a/genai/live/live_func_call_with_txt.py b/genai/live/live_func_call_with_txt.py
index 7761a49b7b6..b29dd96b78a 100644
--- a/genai/live/live_func_call_with_txt.py
+++ b/genai/live/live_func_call_with_txt.py
@@ -20,9 +20,15 @@
 async def generate_content() -> list[FunctionResponse]:
     # [START googlegenaisdk_live_func_call_with_txt]
     from google import genai
-    from google.genai.types import (Content, FunctionDeclaration,
-                                    FunctionResponse, LiveConnectConfig,
-                                    Modality, Part, Tool)
+    from google.genai.types import (
+        Content,
+        FunctionDeclaration,
+        FunctionResponse,
+        LiveConnectConfig,
+        Modality,
+        Part,
+        Tool,
+    )
 
     client = genai.Client()
     model_id = "gemini-2.0-flash-live-preview-04-09"
diff --git a/genai/live/live_ground_googsearch_with_txt.py b/genai/live/live_ground_googsearch_with_txt.py
index cfca4a87e1c..82f4281ae6a 100644
--- a/genai/live/live_ground_googsearch_with_txt.py
+++ b/genai/live/live_ground_googsearch_with_txt.py
@@ -19,8 +19,14 @@
 async def generate_content() -> list[str]:
     # [START googlegenaisdk_live_ground_googsearch_with_txt]
     from google import genai
-    from google.genai.types import (Content, GoogleSearch, LiveConnectConfig,
-                                    Modality, Part, Tool)
+    from google.genai.types import (
+        Content,
+        GoogleSearch,
+        LiveConnectConfig,
+        Modality,
+        Part,
+        Tool,
+    )
 
     client = genai.Client()
     model_id = "gemini-2.0-flash-live-preview-04-09"
diff --git a/genai/live/live_structured_ouput_with_txt.py b/genai/live/live_structured_ouput_with_txt.py
index f0b2466ff5f..38b7df52fcb 100644
--- a/genai/live/live_structured_ouput_with_txt.py
+++ b/genai/live/live_structured_ouput_with_txt.py
@@ -30,8 +30,10 @@ def generate_content() -> CalendarEvent:
     import google.auth.transport.requests
     import openai
     from google.auth import default
-    from openai.types.chat import (ChatCompletionSystemMessageParam,
-                                   ChatCompletionUserMessageParam)
+    from openai.types.chat import (
+        ChatCompletionSystemMessageParam,
+        ChatCompletionUserMessageParam,
+    )
 
     project_id = os.environ["GOOGLE_CLOUD_PROJECT"]
     location = "us-central1"
diff --git a/genai/live/live_transcribe_with_audio.py b/genai/live/live_transcribe_with_audio.py
index b702672bc76..644c486675f 100644
--- a/genai/live/live_transcribe_with_audio.py
+++ b/genai/live/live_transcribe_with_audio.py
@@ -22,8 +22,13 @@
 async def generate_content() -> list[str]:
     # [START googlegenaisdk_live_transcribe_with_audio]
     from google import genai
-    from google.genai.types import (AudioTranscriptionConfig, Content,
-                                    LiveConnectConfig, Modality, Part)
+    from google.genai.types import (
+        AudioTranscriptionConfig,
+        Content,
+        LiveConnectConfig,
+        Modality,
+        Part,
+    )
 
     client = genai.Client()
     model = "gemini-live-2.5-flash-preview-native-audio"
diff --git a/genai/live/live_with_txt.py b/genai/live/live_with_txt.py
index 8b8b0908127..76fab43398b 100644
--- a/genai/live/live_with_txt.py
+++ b/genai/live/live_with_txt.py
@@ -18,8 +18,13 @@
 async def generate_content() -> list[str]:
     # [START googlegenaisdk_live_with_txt]
     from google import genai
-    from google.genai.types import (Content, HttpOptions, LiveConnectConfig,
-                                    Modality, Part)
+    from google.genai.types import (
+        Content,
+        HttpOptions,
+        LiveConnectConfig,
+        Modality,
+        Part,
+    )
 
     client = genai.Client(http_options=HttpOptions(api_version="v1beta1"))
     model_id = "gemini-2.0-flash-live-preview-04-09"
diff --git a/genai/live/test_live_examples.py b/genai/live/test_live_examples.py
index adab0df412e..7959d1a91e2 100644
--- a/genai/live/test_live_examples.py
+++ b/genai/live/test_live_examples.py
@@ -105,16 +105,16 @@ async def test_live_structured_ouput_with_txt() -> None:
 
 @pytest.mark.asyncio
 async def test_live_txt_with_audio() -> None:
-   assert await live_txt_with_audio.generate_content()
+    assert await live_txt_with_audio.generate_content()
 
 
 @pytest.mark.asyncio
 async def test_live_audio_with_txt() -> None:
-   result = await live_audio_with_txt.generate_content()
-   assert result is not None
+    result = await live_audio_with_txt.generate_content()
+    assert result is not None
 
 
 @pytest.mark.asyncio
 async def test_live_transcribe_with_audio() -> None:
-   result = await live_transcribe_with_audio.generate_content()
-   assert result is not None
+    result = await live_transcribe_with_audio.generate_content()
+    assert result is not None