fixit: clean up transcribe/microphone (GoogleCloudPlatform#10104)

yil532 · web-flow · commit 53650ba9894e · 2023-05-29T09:18:35.000Z
## Description Fixes #<ISSUE-NUMBER> Note: Before submitting a pull request, please open an issue for discussion if you are not associated with Google. ## Checklist - [ ] I have followed [Sample Guidelines from AUTHORING_GUIDE.MD](https://togithub.com/GoogleCloudPlatform/python-docs-samples/blob/main/AUTHORING_GUIDE.md) - [ ] README is updated to include [all relevant information](https://togithub.com/GoogleCloudPlatform/python-docs-samples/blob/main/AUTHORING_GUIDE.md#readme-file) - [ ] **Tests** pass: `nox -s py-3.9` (see [Test Environment Setup](https://togithub.com/GoogleCloudPlatform/python-docs-samples/blob/main/AUTHORING_GUIDE.md#test-environment-setup)) - [ ] **Lint** pass: `nox -s lint` (see [Test Environment Setup](https://togithub.com/GoogleCloudPlatform/python-docs-samples/blob/main/AUTHORING_GUIDE.md#test-environment-setup)) - [ ] These samples need a new **API enabled** in testing projects to pass (let us know which ones) - [ ] These samples need a new/updated **env vars** in testing projects set to pass (let us know which ones) - [ ] This sample adds a new sample directory, and I updated the [CODEOWNERS file](https://togithub.com/GoogleCloudPlatform/python-docs-samples/blob/main/.github/CODEOWNERS) with the codeowners for this sample - [ ] This sample adds a new **Product API**, and I updated the [Blunderbuss issue/PR auto-assigner](https://togithub.com/GoogleCloudPlatform/python-docs-samples/blob/main/.github/blunderbuss.yml) with the codeowners for this sample - [ ] Please **merge** this PR for me once it is approved
diff --git a/speech/microphone/transcribe_streaming_infinite.py b/speech/microphone/transcribe_streaming_infinite.py
@@ -44,16 +44,33 @@
 YELLOW = "\033[0;33m"
 
 
-def get_current_time():
-    """Return Current Time in MS."""
+def get_current_time() -> int:
+    """Return Current Time in MS.
+
+    Returns:
+        int: Current Time in MS.
+    """
 
     return int(round(time.time() * 1000))
 
 
 class ResumableMicrophoneStream:
     """Opens a recording stream as a generator yielding the audio chunks."""
 
-    def __init__(self, rate, chunk_size):
+    def __init__(
+            self: object,
+            rate: int,
+            chunk_size: int,
+    ) -> None:
+        """Creates a resumable microphone stream.
+
+        Args:
+        self: The class instance.
+        rate: The audio stream's sampling rate.
+        chunk_size: The audio stream's chunk size.
+
+        returns: None
+        """
         self._rate = rate
         self.chunk_size = chunk_size
         self._num_channels = 1
@@ -82,13 +99,33 @@ def __init__(self, rate, chunk_size):
             stream_callback=self._fill_buffer,
         )
 
-    def __enter__(self):
+    def __enter__(self: object) -> object:
+        """Opens the stream.
 
+        Args:
+        self: The class instance.
+
+        returns: The stream instance itself (``self``).
+        """
         self.closed = False
         return self
 
-    def __exit__(self, type, value, traceback):
-
+    def __exit__(
+            self: object,
+            type: object,
+            value: object,
+            traceback: object,
+    ) -> object:
+        """Closes the stream and releases resources.
+
+        Args:
+        self: The class instance.
+        type: The exception type.
+        value: The exception value.
+        traceback: The exception traceback.
+
+        returns: None
+        """
         self._audio_stream.stop_stream()
         self._audio_stream.close()
         self.closed = True
@@ -97,15 +134,34 @@ def __exit__(self, type, value, traceback):
         self._buff.put(None)
         self._audio_interface.terminate()
 
-    def _fill_buffer(self, in_data, *args, **kwargs):
-        """Continuously collect data from the audio stream, into the buffer."""
-
+    def _fill_buffer(
+            self: object,
+            in_data: object,
+            *args: object,
+            **kwargs: object,
+    ) -> object:
+        """Continuously collect data from the audio stream, into the buffer.
+
+        Args:
+        self: The class instance.
+        in_data: The audio data as a bytes object.
+        args: Additional arguments.
+        kwargs: Additional arguments.
+
+        returns: The tuple ``(None, pyaudio.paContinue)``.
+        """
         self._buff.put(in_data)
         return None, pyaudio.paContinue
 
-    def generator(self):
-        """Stream Audio from microphone to API and to local buffer"""
+    def generator(self: object) -> object:
+        """Stream Audio from microphone to API and to local buffer
 
+        Args:
+            self: The class instance.
+
+        returns:
+            The data from the audio stream.
+        """
         while not self.closed:
             data = []
 
@@ -160,7 +216,10 @@ def generator(self):
             yield b"".join(data)
 
 
-def listen_print_loop(responses, stream):
+def listen_print_loop(
+        responses: object,
+        stream: object
+) -> object:
     """Iterates through server responses and prints them.
 
     The responses passed is a generator that will block until a response
@@ -174,8 +233,14 @@ def listen_print_loop(responses, stream):
     response is an interim one, print a line feed at the end of it, to allow
     the next result to overwrite it, until the response is a final one. For the
     final one, print a newline to preserve the finalized transcription.
-    """
 
+    Args:
+        responses: The responses returned from the API.
+        stream: The audio stream to be processed.
+
+    Returns:
+        The transcript of the result
+    """
     for response in responses:
 
         if get_current_time() - stream.start_time > STREAMING_LIMIT:
@@ -227,18 +292,18 @@ def listen_print_loop(responses, stream):
                 sys.stdout.write("Exiting...\n")
                 stream.closed = True
                 break
-
         else:
             sys.stdout.write(RED)
             sys.stdout.write("\033[K")
             sys.stdout.write(str(corrected_time) + ": " + transcript + "\r")
 
             stream.last_transcript_was_final = False
 
+        return transcript
 
-def main():
-    """start bidirectional streaming from microphone input to speech API"""
 
+def main() -> None:
+    """start bidirectional streaming from microphone input to speech API"""
     client = speech.SpeechClient()
     config = speech.RecognitionConfig(
         encoding=speech.RecognitionConfig.AudioEncoding.LINEAR16,
diff --git a/speech/microphone/transcribe_streaming_mic.py b/speech/microphone/transcribe_streaming_mic.py
@@ -41,15 +41,21 @@
 class MicrophoneStream:
     """Opens a recording stream as a generator yielding the audio chunks."""
 
-    def __init__(self, rate, chunk):
+    def __init__(
+            self: object,
+            rate: int = RATE,
+            chunk: int = CHUNK
+    ) -> None:
+        """The audio -- and generator -- is guaranteed to be on the main thread.
+        """
         self._rate = rate
         self._chunk = chunk
 
         # Create a thread-safe buffer of audio data
         self._buff = queue.Queue()
         self.closed = True
 
-    def __enter__(self):
+    def __enter__(self: object) -> object:
         self._audio_interface = pyaudio.PyAudio()
         self._audio_stream = self._audio_interface.open(
             format=pyaudio.paInt16,
@@ -69,7 +75,13 @@ def __enter__(self):
 
         return self
 
-    def __exit__(self, type, value, traceback):
+    def __exit__(
+            self: object,
+            type: object,
+            value: object,
+            traceback: object,
+    ) -> None:
+        """Closes the stream, regardless of whether the connection was lost or not."""
         self._audio_stream.stop_stream()
         self._audio_stream.close()
         self.closed = True
@@ -78,12 +90,36 @@ def __exit__(self, type, value, traceback):
         self._buff.put(None)
         self._audio_interface.terminate()
 
-    def _fill_buffer(self, in_data, frame_count, time_info, status_flags):
-        """Continuously collect data from the audio stream, into the buffer."""
+    def _fill_buffer(
+            self: object,
+            in_data: object,
+            frame_count: int,
+            time_info: object,
+            status_flags: object,
+    ) -> object:
+        """Continuously collect data from the audio stream, into the buffer.
+
+        Args:
+            in_data: The audio data as a bytes object
+            frame_count: The number of frames captured
+            time_info: The time information
+            status_flags: The status flags
+
+        Returns:
+            The tuple ``(None, pyaudio.paContinue)``.
+        """
         self._buff.put(in_data)
         return None, pyaudio.paContinue
 
-    def generator(self):
+    def generator(self: object) -> object:
+        """Generates audio chunks from the stream of audio data.
+
+        Args:
+            self: The MicrophoneStream object
+
+        Returns:
+            A generator that outputs audio chunks.
+        """
         while not self.closed:
             # Use a blocking get() to ensure there's at least one chunk of
             # data, and stop iteration if the chunk is None, indicating the
@@ -106,7 +142,7 @@ def generator(self):
             yield b"".join(data)
 
 
-def listen_print_loop(responses):
+def listen_print_loop(responses: object) -> str:
     """Iterates through server responses and prints them.
 
     The responses passed is a generator that will block until a response
@@ -120,6 +156,12 @@ def listen_print_loop(responses):
     response is an interim one, print a line feed at the end of it, to allow
     the next result to overwrite it, until the response is a final one. For the
     final one, print a newline to preserve the finalized transcription.
+
+    Args:
+        responses: Generator of server responses.
+
+    Returns:
+        The transcribed text.
     """
     num_chars_printed = 0
     for response in responses:
@@ -160,8 +202,11 @@ def listen_print_loop(responses):
 
             num_chars_printed = 0
 
+        return transcript
+
 
-def main():
+def main() -> None:
+    """Transcribe speech from microphone input."""
     # See http://g.co/cloud/speech/docs/languages
     # for a list of supported languages.
     language_code = "en-US"  # a BCP-47 language tag
diff --git a/speech/microphone/transcribe_streaming_mic_test.py b/speech/microphone/transcribe_streaming_mic_test.py
@@ -19,17 +19,31 @@
 
 from unittest import mock
 
+import pytest
+
 RESOURCES = os.path.join(os.path.dirname(__file__), "resources")
 
 
 class MockPyAudio:
-    def __init__(self, audio_filename):
+    def __init__(
+            self: object,
+            audio_filename: str
+    ) -> None:
         self.audio_filename = audio_filename
 
-    def __call__(self, *args):
+    def __call__(
+            self: object,
+            *args: object
+    ) -> object:
         return self
 
-    def open(self, stream_callback, rate, *args, **kwargs):
+    def open(
+            self: object,
+            stream_callback: object,
+            rate: int,
+            *args: object,
+            **kwargs: object
+    ) -> object:
         self.rate = rate
         self.closed = threading.Event()
         self.stream_thread = threading.Thread(
@@ -39,16 +53,22 @@ def open(self, stream_callback, rate, *args, **kwargs):
         self.stream_thread.start()
         return self
 
-    def close(self):
+    def close(self: object) -> None:
         self.closed.set()
 
-    def stop_stream(self):
+    def stop_stream(self: object) -> None:
         pass
 
-    def terminate(self):
+    def terminate(self: object) -> None:
         pass
 
-    def stream_audio(self, audio_filename, callback, closed, num_frames=512):
+    def stream_audio(
+            self: object,
+            audio_filename: str,
+            callback: object,
+            closed: object,
+            num_frames: int = 512,
+    ) -> None:
         with open(audio_filename, "rb") as audio_file:
             while not closed.is_set():
                 # Approximate realtime by sleeping for the appropriate time for
@@ -64,7 +84,7 @@ def stream_audio(self, audio_filename, callback, closed, num_frames=512):
     "sys.modules",
     pyaudio=mock.MagicMock(PyAudio=MockPyAudio(os.path.join(RESOURCES, "quit.raw"))),
 )
-def test_main(capsys):
+def test_main(capsys: pytest.CaptureFixture) -> None:
     import transcribe_streaming_mic
 
     transcribe_streaming_mic.main()