Trying with channels

2022-02-11 13:46:14 +01:00 · 2022-02-11 13:46:14 +01:00 · f63fb5d01b
parent 46e602ba36
commit f63fb5d01b
3 changed files with 44 additions and 27 deletions
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -284,6 +284,7 @@ dependencies = [
 "tokio",
 "tokio-stream",
 "tonic",
 "tracing",
 "tracing-subscriber",
 ]
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -6,6 +6,7 @@ edition = "2021"
 [dependencies]
 eyre = "0.6.6"
 log = "0.4"
 tracing = "0.1"
 tracing-subscriber = { version = "0.3", features = ["env-filter"] }
 tokio = { version = "1.15", features = ["macros", "rt-multi-thread", "fs"] }
 google-authz = { version = "1.0.0-alpha.2", features = ["tonic"] }
@@ -18,4 +19,7 @@ prost-types = { version = "0.9" }
 google-api-proto = { version = "1.0.0-alpha", features = ["google-cloud-translation-v3", "google-cloud-speech-v1"] }
 tokio-stream = "0.1.8"
 futures-util = "0.3"
-async-stream = "*"
+async-stream = "*"
 #glib = "0.15.4"
 #gst = { package = "gstreamer", version = "0.18.3" }
 #gstreamer-base = "0.18.0"
--- a/src/main.rs
+++ b/src/main.rs
@@ -8,6 +8,7 @@ use google_authz::{Credentials, GoogleAuthz};
 use log::{debug, info};
 use tokio::io::AsyncReadExt;
 use tonic::transport::Channel;
 use tracing::Instrument;
 #[tokio::main]
 async fn main() -> eyre::Result<()> {
@@ -36,28 +37,31 @@ async fn main() -> eyre::Result<()> {
    let mut client = SpeechClient::new(channel);
-    let outbound = async_stream::stream! {
+
-        let request = StreamingRecognizeRequest {
+    let (sender, mut receiver) = tokio::sync::mpsc::unbounded_channel();
-            streaming_request: Some(StreamingRequest::StreamingConfig(
+
-                StreamingRecognitionConfig {
+    sender.send(StreamingRecognizeRequest {
-                    config: Some(RecognitionConfig {
+        streaming_request: Some(StreamingRequest::StreamingConfig(
-                        encoding: AudioEncoding::Flac.into(), // matching current example file
+            StreamingRecognitionConfig {
-                        sample_rate_hertz: 44_100,            // matching current example file
+                config: Some(RecognitionConfig {
-                        audio_channel_count: 2,
+                    encoding: AudioEncoding::Flac.into(), // matching current example file
-                        language_code: "en-US".to_string(),   // we only support en-US to start with
+                    sample_rate_hertz: 44_100,            // matching current example file
-                        model: "video".to_string(),           // dictate does not set this option
+                    audio_channel_count: 2,
-                        use_enhanced: true,                   // dictate does not set this option
+                    language_code: "en-US".to_string(),   // we only support en-US to start with
-                        profanity_filter: true,               // used by Dictate, so we also use it here
+                    model: "video".to_string(),           // dictate does not set this option
-                        enable_word_time_offsets: true, // important so we can get the spoken word time ranges
+                    use_enhanced: true,                   // dictate does not set this option
-                        max_alternatives: 1,            // make sure the default is used
+                    profanity_filter: true,               // used by Dictate, so we also use it here
-                        ..Default::default()
+                    enable_word_time_offsets: true, // important so we can get the spoken word time ranges
-                    }),
+                    max_alternatives: 1,            // make sure the default is used
-                    single_utterance: false,
+                    ..Default::default()
-                    interim_results: false,
+                }),
-                },
+                single_utterance: false,
-            )),
+                interim_results: false,
-        };
+            },
-        yield request;
+        )),
    })?;
    tokio::spawn(async move {
        let file = tokio::fs::File::open("some-audio.flac").await.unwrap();
        let mut audio_file = tokio::io::BufReader::new(file);
        // read file chunk
@@ -69,18 +73,26 @@ async fn main() -> eyre::Result<()> {
                    BytesMut::from(&buffer.as_slice()[..n]).freeze(),
                )),
            };
-            yield request;
+            sender.send(request).unwrap();
-            // debug!("added a buffer to the sender queue: {} bytes", n);
+            //debug!("added a buffer to the sender queue: {} bytes", n);
            tokio::time::sleep(std::time::Duration::from_millis(100)).await;
        }
    }).instrument(tracing::info_span!("audio-source")).await?;
    let message = async_stream::stream! {
        while let Some(message) = receiver.recv().await {
            debug!("drained message inside stream...");
            yield message;
        }
    };
    let response = client
-        .streaming_recognize(tonic::Request::new(outbound))
+        .streaming_recognize(tonic::Request::new(message))
        .await?;
    let mut inbound = response.into_inner();
-    while let Some(response) = inbound.message().await? {
+    while let Some(response) = inbound.message().instrument(tracing::info_span!("transcription-results")).await? {
        let mut num_results = 0;
        for res in &response.results {
            num_results = num_results + 1;