#
# This demo will join a Daily meeting and, given a text file with sentences
# (one per line), will convert the text into audio using Deepgram's
# Text-To-Speech API and send it into the meeting.
#
# The demo requires a Deepgram API key set in the DG_API_KEY environment
# variable.
#
# See https://developers.deepgram.com/docs/text-to-speech
#
# Usage: python3 deepgram_text_to_speech.py -m MEETING_URL -i FILE
#

import argparse
import os
import time

from daily import *
from deepgram import (
    DeepgramClient,
    SpeakOptions,
)

parser = argparse.ArgumentParser()
parser.add_argument("-m", "--meeting", required=True, help="Meeting URL")
parser.add_argument(
    "-i",
    "--input",
    required=True,
    help="File with sentences (one per line)")
args = parser.parse_args()

Daily.init()

# We create a virtual microphone device so we can send audio samples into the
# meeting.
microphone = Daily.create_microphone_device(
    "my-mic", sample_rate=16000, channels=1)
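# Note: the sample rate and channel count here must match the raw audio we
# request from Deepgram below (see SpeakOptions).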

client = CallClient()

print()
print(f"Joining {args.meeting} ...")

# Join and tell our call client that we will be using our new virtual
# microphone.
client.join(args.meeting, client_settings={
    "inputs": {
        "microphone": {
            "isEnabled": True,
            "settings": {
                "deviceId": "my-mic"
            }
        }
    }
})

# Make sure we are joined. It would be better to use join()'s completion
# callback (see the sketch below).
time.sleep(3)
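
# A more robust alternative (sketch): instead of sleeping, pass a completion
# callback to join() and block on an event. daily-python invokes the callback
# with (data, error) once the join attempt settles.
#
#   import threading
#
#   joined = threading.Event()
#
#   def on_joined(data, error):
#       if error:
#           print(f"Unable to join meeting: {error}")
#       joined.set()
#
#   client.join(args.meeting, client_settings={...}, completion=on_joined)
#   joined.wait()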

sentences_file = open(args.input, "r")

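# The demo requires a Deepgram API key (see header); fail early with a clear
# message instead of erroring inside the Deepgram client.
if os.getenv("DG_API_KEY") is None:
    raise SystemExit("Error: DG_API_KEY environment variable is not set")
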
deepgram = DeepgramClient(api_key=os.getenv("DG_API_KEY"))

speak_options = SpeakOptions(
    model="aura-asteria-en",
    encoding="linear16",
    sample_rate=16000,
    container="none"
)
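# With encoding "linear16" and container "none", Deepgram returns raw 16-bit
# PCM at 16 kHz with no container header, which matches the virtual
# microphone configured above (16000 Hz, 1 channel).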

print()

for sentence in sentences_file:
    print(f"Processing: {sentence.strip()}")
    print()

    speak_source = {
        "text": sentence.strip()
    }

    response = deepgram.speak.v("1").stream(speak_source, speak_options)

    # Send all the audio frames to the microphone.
    microphone.write_frames(response.stream.read())

sentences_file.close()

# Let everything finish.
time.sleep(2)

client.leave()
client.release()