document start_recognition_timeout error

JamesG-Speechmatics · JamesG-Speechmatics · commit 53f6200dcfe7 · 2025-11-18T10:09:59.000Z
diff --git a/docs/api-ref/realtime-transcription-websocket.mdx b/docs/api-ref/realtime-transcription-websocket.mdx
@@ -169,6 +169,7 @@ In the Realtime SaaS, an in-band error message can be followed by a WebSocket cl
 | 4005 | `quota_exceeded` |
 | 4006 | `timelimit_exceeded` |
 | 4013 | `job_error` |
+{/* | 4xxx | `start_recognition_timeout` | TODO */}
 
 {/* Manually generated TOC, since we're using JSX sections */}
 export const toc = [
diff --git a/docs/speech-to-text/features/audio-filtering.mdx b/docs/speech-to-text/features/audio-filtering.mdx
@@ -1,5 +1,5 @@
 ---
-description: "Learn how to utilize Audio Filtering to remove background speech" 
+description: "Learn how to utilize audio filtering to remove background speech"
 keywords: 
   [ 
     speechmatics, 
@@ -15,19 +15,19 @@ keywords:
 import Tabs from "@theme/Tabs"; 
 import TabItem from "@theme/TabItem"; 
 
-# Audio Filtering 
+# Audio filtering
 
-Audio Filtering pre-processes input audio to remove low-volume background speech which might otherwise be detected and transcribed.
+Audio filtering pre-processes input audio to remove low-volume background speech which might otherwise be detected and transcribed.
 
 :::info
-This can be useful, for example, in a call center to avoid transcribing other agents' speech from the background.
+This can be useful, for example, in a call center to avoid transcribing other agents' background speech.
 :::
 
-If you're new to Speechmatics, start by exploring our guides on [Transcribing a File](/speech-to-text/batch/quickstart) or [Transcribing in Real-Time](/speech-to-text/realtime/quickstart). 
+If you're new to Speechmatics, start by exploring our guides on [transcribing a file](/speech-to-text/batch/quickstart) or [transcribing in real-time](/speech-to-text/realtime/quickstart).
 
 ## Example
 
-To activate Audio Filtering, include the following configuration:  
+To activate audio filtering, include the following configuration:
 
 ```json
 {
@@ -41,13 +41,15 @@ To activate Audio Filtering, include the following configuration:
   }
 }
 ```
-This will avoid processing any audio which is below the `3.4` volume threshold. For technical details on how this threshold is used see [here](#technical-details)
+This will avoid processing any audio which is below the `3.4` volume threshold. For technical details on how this threshold is calculated and used, see [here](#technical-details).
 
 `volume_threshold` supports a range of `0 - 100` where `0` does not filter any audio and `100` removes all audio.
 
-## Volume Labelling
+In realtime mode, the threshold can be adjusted dynamically with the [SetRecognitionConfig](/api-ref/realtime-transcription-websocket#setrecognitionconfig) message.
 
-If Audio Filtering is configured, words will be labelled with their volume like this (range for `volume_threshold` is `0-100`):
+## Volume labelling
+
+If audio filtering is configured, words will be labelled with their volume like this (the range for `volume_threshold` is `0-100`):
 
 ```json
     {
@@ -69,7 +71,7 @@ These values can be used as a guide to setting the volume threshold, but we reco
 
 To obtain volume labelling without filtering any audio, supply an empty config object (`{}`) or set the `volume_threshold` to `0.0`.
 
-## Technical Details
+## Technical details
 
 Once the audio is in a raw format (16kHz 16bit mono), it is split into 0.01s chunks. For each chunk, the root mean square amplitude of the signal is calculated, and scaled to the range `0 - 100`. If the volume is less than the supplied cut-off, the chunk will be replaced with silence.
 
diff --git a/spec/flow-api.yaml b/spec/flow-api.yaml
@@ -234,6 +234,7 @@ components:
         - timelimit_exceeded
         - quota_exceeded
         - unknown_error
+        - start_recognition_timeout
 
     ToolTypeEnum:
       type: string
diff --git a/spec/realtime.yaml b/spec/realtime.yaml
@@ -1067,6 +1067,7 @@ components:
         | `data_error` | Unable to accept the data specified - usually because there is too much data being sent at once |
         | `buffer_error` | Unable to fit the data in a corresponding buffer. This can happen for clients sending the input data faster than real-time. |
         | `protocol_error` | Message received was syntactically correct, but could not be accepted due to protocol limitations. This is usually caused by messages sent in the wrong order. |
+        | `start_recognition_timeout` | The timeout for sending StartRecognition has been exceeded (SaaS only) |
         | `quota_exceeded` | Maximum number of concurrent connections allowed for the contract has been reached |
         | `timelimit_exceeded` | Usage quota for the contract has been reached |
         | `idle_timeout` | Idle duration limit was reached (no audio data sent within the last hour), a closing handshake with code 1008 follows this in-band error. |
@@ -1093,6 +1094,7 @@ components:
         - data_error
         - buffer_error
         - protocol_error
+        - start_recognition_timeout
         - quota_exceeded
         - timelimit_exceeded
         - idle_timeout