WMS ID 9001: Update sdk version, imports and listed additional steps in md file (#387)

chandra-c-chud-oracle · web-flow · commit ab9bd471fdd5 · 2025-03-28T13:44:06.000+02:00
Update the SDK version and imports, and list the additional installation steps in the md file.
diff --git a/oci-artificial-intelligence/ai-speech/transcribe-live-audio/files/realtime_example.py b/oci-artificial-intelligence/ai-speech/transcribe-live-audio/files/realtime_example.py
@@ -5,7 +5,7 @@
 from oci.config import from_file
 from oci.auth.signers.security_token_signer import SecurityTokenSigner
 
-from oci.ai_speech_realtime import (
+from oci_ai_speech_realtime import (
     RealtimeSpeechClient, 
     RealtimeSpeechClientListener
 )
@@ -109,6 +109,9 @@ def on_network_event(self, ackmessage):
 
     def on_error(self):
         return super().on_error()
+    
+    def on_close(self, error_code, error_message):
+        return super().on_close(error_code, error_message)
 
 
 if __name__ == "__main__":
@@ -123,7 +126,7 @@ def message_callback(message):
     )
     realtime_speech_parameters.partial_silence_threshold_in_ms = 0
     realtime_speech_parameters.final_silence_threshold_in_ms = 2000
-    # realtime_speech_parameters.encoding="audio/raw;rate=16000"
+    realtime_speech_parameters.encoding="audio/raw;rate=16000"
     realtime_speech_parameters.punctuation = (
         realtime_speech_parameters.PUNCTUATION_AUTO
     )
@@ -146,7 +149,7 @@ def message_callback(message):
     #     }
     # ]
 
-    realtime_speech_url = "wss://realtime.aiservice-preprod.ap-sydney-1.oci.oraclecloud.com"
+    realtime_speech_url = "wss://realtime.aiservice.uk-london-1.oci.oraclecloud.com"
     client =  RealtimeSpeechClient(
             realtime_speech_parameters=realtime_speech_parameters,
             config=config,
diff --git a/oci-artificial-intelligence/ai-speech/transcribe-live-audio/files/requirements.txt b/oci-artificial-intelligence/ai-speech/transcribe-live-audio/files/requirements.txt
@@ -0,0 +1,2 @@
+PyAudio>=0.2.14
+oci-ai-speech-realtime>=2.1.0
diff --git a/oci-artificial-intelligence/ai-speech/transcribe-live-audio/transcribe-live-audio.md b/oci-artificial-intelligence/ai-speech/transcribe-live-audio/transcribe-live-audio.md
@@ -82,6 +82,23 @@ First, refer to lab 4 (Access OCI speech with OCI SDKs (Optional)) for API signi
 
 Click [here](https://docs.oracle.com/en-us/iaas/Content/API/Concepts/sdks.htm) for documentation regarding AI Speech SDK
 
+Along with the OCI SDK, install the OCI AI Speech live transcription SDK:
+
+```
+pip install oci-ai-speech-realtime
+```
+
+To allow recording and streaming of audio, install the PyAudio package:
+
+```
+pip install "pyaudio>=0.2.14"
+```
+
+Alternatively, install both required packages at once using the `requirements.txt` file provided [here](./files/requirements.txt):
+```
+pip install -r requirements.txt
+```
+
 OCI AI Speech live transcription uses websockets to relay audio data and receive text transcriptions in real time. This means your client must implement some key listener functions:
 
 <strong>Python example:</strong>
@@ -178,7 +195,7 @@ class MyRealtimeListener(RealtimeClientListener):
 
 `model_domain` : <strong>"GENERIC"</strong>
 
-`partial_silence_threshold_in_ms` : <strong>500</strong>
+`partial_silence_threshold_in_ms` : <strong>0</strong>
 
 `final_silence_threshold_in_ms` : <strong>2000</strong>
 

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+PyAudio>=0.2.14`
	`2`	`+oci-ai-speech-realtime>=2.1.0`