speechmatics · JamesG-Speechmatics · May 20, 2025 · Mar 28, 2025 · May 15, 2025 · May 16, 2025
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -5,6 +5,12 @@ All notable changes to this project will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [3.0.4] - 2025-05-19
+
+### Added
+
+- Support end-of-utterance messages (DEL-24982)
+
 ## [3.0.3] - 2025-03-03
 
 ### Added

diff --git a/VERSION b/VERSION
@@ -1 +1 @@
-3.0.3
+3.0.4
diff --git a/speechmatics/cli.py b/speechmatics/cli.py
@@ -284,6 +284,11 @@ def get_transcription_config(
     ]:
         config[option] = True if args.get(option) else config.get(option)
 
+    if args.get("end_of_utterance_silence_trigger") is not None:
+        config["conversation_config"] = {
+            "end_of_utterance_silence_trigger": args.get("end_of_utterance_silence_trigger")
+        }
+
     if args.get("volume_threshold") is not None:
         config["audio_filtering_config"] = {
             "volume_threshold": args.get("volume_threshold")
@@ -547,6 +552,13 @@ def audio_event_handler(message):
         sys.stdout.write(f"{escape_seq}[{event_name}]\n")
         transcripts.text += f"[{event_name}] "
 
+    def end_of_utterance_handler(message):
+        if print_json:
+            print(json.dumps(message))
+            return
+        sys.stdout.write("[EndOfUtterance]\n")
+        transcripts.text += "[EndOfUtterance]"
+
     def partial_translation_handler(message):
         if print_json:
             print(json.dumps(message))
@@ -581,6 +593,8 @@ def end_of_transcript_handler(_):
     # print transcription (if text was requested without translation)
 
     api.add_event_handler(ServerMessageType.AudioEventStarted, audio_event_handler)
+    api.add_event_handler(ServerMessageType.EndOfUtterance, end_of_utterance_handler)
+
     if print_json:
         if enable_partials or enable_translation_partials:
             api.add_event_handler(

diff --git a/speechmatics/cli_parser.py b/speechmatics/cli_parser.py
@@ -218,6 +218,14 @@ def get_arg_parser():
         default=None,
         help=("Filter out quiet audio which falls below this threshold (0.0-100.0)"),
     )
+    config_parser.add_argument(
+        "--end-of-utterance-silence-trigger",
+        dest="end_of_utterance_silence_trigger",
+        type=float,
+        default=None,
+        help=("Generate an EndOfUtterance message from the server after this many seconds of silence (0.0-2.0)"),
+
+    )
     config_parser.add_argument(
         "--remove-disfluencies",
         default=None,

diff --git a/speechmatics/models.py b/speechmatics/models.py
@@ -153,7 +153,13 @@ class TranslationConfig:
     def asdict(self):
         return asdict(self)
 
+@dataclass
+class ConversationConfig:
+    """Conversation config: end-of-utterance detection settings."""
 
+    end_of_utterance_silence_trigger: Optional[float] = None
+    """How much silence, in seconds, is required to trigger end-of-utterance detection."""
+
 @dataclass
 class RTTranslationConfig(TranslationConfig):
     """Real-time mode: Translation config."""
@@ -268,6 +274,9 @@ class TranscriptionConfig(_TranscriptionConfig):
     """Indicates if partial translation, where words are produced
     immediately, is enabled."""
 
+    conversation_config: Optional[ConversationConfig] = None
+    """Optional configuration for end-of-utterance detection."""
+
     translation_config: Optional[TranslationConfig] = None
     """Optional configuration for translation."""
 
@@ -531,6 +540,9 @@ class ServerMessageType(str, Enum):
     AddTranscript = "AddTranscript"
     """Indicates the final transcript of a part of the audio."""
 
+    EndOfUtterance = "EndOfUtterance"
+    """Indicates that an utterance has ended, based on silence."""
+
     AudioEventStarted = "AudioEventStarted"
     """Indicates the start of an audio event."""