From 32e533f892fc00c497a3e2deaf76c251e4ee63a8 Mon Sep 17 00:00:00 2001
From: pabloFuente <pablofuenteperez@gmail.com>
Date: Wed, 18 Jun 2025 20:25:05 +0200
Subject: [PATCH] Added sarvam STT AI provider to agent-speech-processing.yaml

---
 community/agent-speech-processing.yaml | 10 +++++++++-
 pro/agent-speech-processing.yaml       | 10 +++++++++-
 2 files changed, 18 insertions(+), 2 deletions(-)

diff --git a/community/agent-speech-processing.yaml b/community/agent-speech-processing.yaml
index f22e621..b105214 100644
--- a/community/agent-speech-processing.yaml
+++ b/community/agent-speech-processing.yaml
@@ -10,7 +10,7 @@ live_captions:
   # - manual: the agent will connect to new Rooms only when your application dictates it by using the Agent Dispatch API.
   processing: automatic
 
-  # Which speech-to-text AI provider to use [aws, azure, google, opeanai, groq, deepgram, assemblyai, fal, clova, speechmatics, gladia]
+  # Which speech-to-text AI provider to use [aws, azure, google, openai, groq, deepgram, assemblyai, fal, clova, speechmatics, gladia, sarvam]
   # The custom configuration for the selected provider must be set below
   provider:
 
@@ -216,3 +216,11 @@ live_captions:
     languages:
     # Whether to allow switching between languages during recognition. Defaults to True
     code_switching:
+
+  sarvam:
+    # API key for Sarvam. See https://dashboard.sarvam.ai/key-management
+    api_key:
+    # BCP-47 language code for supported Indian languages. See https://docs.sarvam.ai/api-reference-docs/speech-to-text/transcribe#request.body.language_code.language_code
+    language:
+    # The Sarvam STT model to use. See https://docs.sarvam.ai/api-reference-docs/speech-to-text/transcribe#request.body.model.model
+    model:
diff --git a/pro/agent-speech-processing.yaml b/pro/agent-speech-processing.yaml
index f22e621..b105214 100644
--- a/pro/agent-speech-processing.yaml
+++ b/pro/agent-speech-processing.yaml
@@ -10,7 +10,7 @@ live_captions:
   # - manual: the agent will connect to new Rooms only when your application dictates it by using the Agent Dispatch API.
   processing: automatic
 
-  # Which speech-to-text AI provider to use [aws, azure, google, opeanai, groq, deepgram, assemblyai, fal, clova, speechmatics, gladia]
+  # Which speech-to-text AI provider to use [aws, azure, google, openai, groq, deepgram, assemblyai, fal, clova, speechmatics, gladia, sarvam]
   # The custom configuration for the selected provider must be set below
   provider:
 
@@ -216,3 +216,11 @@ live_captions:
     languages:
     # Whether to allow switching between languages during recognition. Defaults to True
     code_switching:
+
+  sarvam:
+    # API key for Sarvam. See https://dashboard.sarvam.ai/key-management
+    api_key:
+    # BCP-47 language code for supported Indian languages. See https://docs.sarvam.ai/api-reference-docs/speech-to-text/transcribe#request.body.language_code.language_code
+    language:
+    # The Sarvam STT model to use. See https://docs.sarvam.ai/api-reference-docs/speech-to-text/transcribe#request.body.model.model
+    model: