Skip to content

Commit b2f57f3

Browse files
Google APIs, copybara-github
authored and committed
feat: adds endpointing sensitivity to streaming recognition features
PiperOrigin-RevId: 871987204
1 parent 45e46bd commit b2f57f3

File tree

3 files changed

+37
-3
lines changed

3 files changed

+37
-3
lines changed

google/cloud/speech/v2/cloud_speech.proto

Lines changed: 27 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
// Copyright 2025 Google LLC
1+
// Copyright 2026 Google LLC
22
//
33
// Licensed under the Apache License, Version 2.0 (the "License");
44
// you may not use this file except in compliance with the License.
@@ -1184,6 +1184,28 @@ message StreamingRecognitionFeatures {
11841184
google.protobuf.Duration speech_end_timeout = 2;
11851185
}
11861186

1187+
// Endpointing sensitivity is intended for applications that want to minimize
1188+
// result latency, possibly at the expense of quality. Some utterances may be
1189+
// broken up into multiple fragments.
1190+
enum EndpointingSensitivity {
1191+
// If no value is specified, the values for
1192+
// ENDPOINTING_SENSITIVITY_STANDARD will be used.
1193+
ENDPOINTING_SENSITIVITY_UNSPECIFIED = 0;
1194+
1195+
// Standard sensitivity, no optimization for latency.
1196+
ENDPOINTING_SENSITIVITY_STANDARD = 1;
1197+
1198+
// Super short sensitivity, optimized for super short utterances like single
1199+
// words ("Yes", "No", "Hello", etc.) or a single phrase, command or short
1200+
// query (e.g. "check balance", "five dollars", "call Mom").
1201+
ENDPOINTING_SENSITIVITY_SUPERSHORT = 2;
1202+
1203+
// Short sensitivity, optimized for short utterances like single sentences
1204+
// (e.g. "Remind me to call the dentist tomorrow morning at nine",
1205+
// "Navigate to the nearest coffee shop that is currently open").
1206+
ENDPOINTING_SENSITIVITY_SHORT = 3;
1207+
}
1208+
11871209
// If `true`, responses with voice activity speech events will be returned as
11881210
// they are detected.
11891211
bool enable_voice_activity_events = 1;
@@ -1197,6 +1219,10 @@ message StreamingRecognitionFeatures {
11971219
// duration has elapsed after the last VOICE_ACTIVITY speech event has been
11981220
// sent. The field `enable_voice_activity_events` must also be set to true.
11991221
VoiceActivityTimeout voice_activity_timeout = 3;
1222+
1223+
// Optional. Endpointing sensitivity for this stream.
1224+
EndpointingSensitivity endpointing_sensitivity = 8
1225+
[(google.api.field_behavior) = OPTIONAL];
12001226
}
12011227

12021228
// Provides configuration information for the StreamingRecognize request.

google/cloud/speech/v2/locations_metadata.proto

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
// Copyright 2025 Google LLC
1+
// Copyright 2026 Google LLC
22
//
33
// Licensed under the Apache License, Version 2.0 (the "License");
44
// you may not use this file except in compliance with the License.

google/cloud/speech/v2/speech_v2.yaml

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,15 @@ documentation:
3131
description: Gets information about a location.
3232

3333
- selector: google.cloud.location.Locations.ListLocations
34-
description: Lists information about the supported locations for this service.
34+
description: |-
35+
Lists information about the supported locations for this service.
36+
This method can be called in two ways:
37+
38+
* **List all public locations:** Use the path `GET /v1/locations`.
39+
* **List project-visible locations:** Use the path
40+
`GET /v1/projects/{project_id}/locations`. This may include public
41+
locations as well as private or other locations specifically visible
42+
to the project.
3543
3644
http:
3745
rules:

0 commit comments

Comments
 (0)