Skip to content

Commit 89ff561

Browse files
committed
Feedback updates.
1 parent 7acd247 commit 89ff561

9 files changed

Lines changed: 76 additions & 63 deletions

File tree

docs/speech-streaming.rst

Lines changed: 0 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -13,11 +13,3 @@ Streaming Speech Result
1313
:members:
1414
:undoc-members:
1515
:show-inheritance:
16-
17-
Streaming Endpointer Type
18-
=========================
19-
20-
.. automodule:: google.cloud.speech.endpointer_type
21-
:members:
22-
:undoc-members:
23-
:show-inheritance:

docs/speech-usage.rst

Lines changed: 20 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -155,41 +155,43 @@ data to possible text alternatives on the fly.
155155

156156
.. code-block:: python
157157
158-
>>> import io
159158
>>> from google.cloud import speech
160159
>>> client = speech.Client()
161-
>>> with io.open('./hello.wav', 'rb') as stream:
160+
>>> with open('./hello.wav', 'rb') as stream:
162161
... sample = client.sample(stream=stream, encoding=speech.Encoding.LINEAR16,
163162
... sample_rate=16000)
164163
... for response in client.stream_recognize(sample):
165164
... print(response.transcript)
166-
hello
167165
... print(response.is_final)
166+
hello
168167
True
169168
170169
171-
By setting ``interim_results`` to true, interim results (tentative hypotheses)
170+
By setting ``interim_results`` to :data:`True`, interim results (tentative hypotheses)
172171
may be returned as they become available (these interim results are indicated
173-
with the is_final=false flag). If false or omitted, only is_final=true
172+
with the ``is_final=false`` flag). If :data:`False` or omitted, only ``is_final=true``
174173
result(s) are returned.
175174

176175
.. code-block:: python
177176
178-
>>> import io
179177
>>> from google.cloud import speech
180178
>>> client = speech.Client()
181-
>>> with io.open('./hello.wav', 'rb') as stream:
182-
>>> sample = client.sample(stream=stream, encoding=speech.Encoding.LINEAR16,
179+
>>> with open('./hello.wav', 'rb') as stream:
180+
... sample = client.sample(stream=stream, encoding=speech.Encoding.LINEAR16,
183181
... sample_rate=16000)
184182
... for response in client.stream_recognize(sample,
185183
... interim_results=True):
184+
... print('====Response====')
186185
... print(response.transcript)
187-
hell
188186
... print(response.is_final)
187+
====Response====
188+
he
189189
False
190-
... print(response.transcript)
190+
====Response====
191+
hell
192+
False
193+
====Response====
191194
hello
192-
... print(response.is_final)
193195
True
194196
195197
@@ -204,13 +206,15 @@ See: `Single Utterance`_
204206

205207
.. code-block:: python
206208
207-
>>> with io.open('./hello_pause_goodbye.wav', 'rb') as stream:
208-
>>> sample = client.sample(stream=stream, encoding=speech.Encoding.LINEAR16,
209+
>>> with open('./hello_pause_goodbye.wav', 'rb') as stream:
210+
... sample = client.sample(stream=stream, encoding=speech.Encoding.LINEAR16,
209211
... sample_rate=16000)
210-
... stream_container = client.stream_recognize(sample,
211-
... single_utterance=True)
212-
>>> print(stream_container.get_full_text())
212+
... for response in client.stream_recognize(sample,
213+
... single_utterance=True):
214+
... print(response.transcript)
215+
... print(response.is_final)
213216
hello
217+
True
214218
215219
.. _Single Utterance: https://cloud.google.com/speech/reference/rpc/google.cloud.speech.v1beta1#streamingrecognitionconfig
216220
.. _sync_recognize: https://cloud.google.com/speech/reference/rest/v1beta1/speech/syncrecognize

speech/google/cloud/speech/client.py

Lines changed: 20 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -234,6 +234,9 @@ def stream_recognize(self, sample, language_code=None,
234234
235235
See: https://cloud.google.com/speech/limits#content
236236
237+
Yields :class:`~streaming_response.StreamingSpeechResponse` containing
238+
results and metadata from the streaming request.
239+
237240
:type sample: :class:`~google.cloud.speech.sample.Sample`
238241
:param sample: Instance of ``Sample`` containing audio information.
239242
@@ -264,8 +267,8 @@ def stream_recognize(self, sample, language_code=None,
264267
and phrases. This can also be used to add new
265268
words to the vocabulary of the recognizer.
266269
267-
:type single_utterance: boolean
268-
:param single_utterance: [Optional] If false or omitted, the recognizer
270+
:type single_utterance: bool
271+
:param single_utterance: (Optional) If false or omitted, the recognizer
269272
will perform continuous recognition
270273
(continuing to process audio even if the user
271274
pauses speaking) until the client closes the
@@ -282,13 +285,15 @@ def stream_recognize(self, sample, language_code=None,
282285
SpeechRecognitionResult with the is_final flag
283286
set to true.
284287
285-
:type interim_results: boolean
286-
:param interim_results: [Optional] If true, interim results (tentative
288+
:type interim_results: bool
289+
:param interim_results: (Optional) If true, interim results (tentative
287290
hypotheses) may be returned as they become
288291
available (these interim results are indicated
289292
with the is_final=false flag). If false or
290293
omitted, only is_final=true result(s) are
291294
returned.
295+
296+
:raises: :class:`EnvironmentError` if gRPC is not enabled.
292297
"""
293298
if not _USE_GAX:
294299
raise EnvironmentError('gRPC is required to use this API.')
@@ -301,7 +306,7 @@ def stream_recognize(self, sample, language_code=None,
301306
interim_results=interim_results)
302307

303308
for response in self.speech_api.streaming_recognize(requests):
304-
if hasattr(response, 'results') or interim_results:
309+
if getattr(response, 'results', None) or interim_results:
305310
yield StreamingSpeechResponse.from_pb(response)
306311

307312
@property
@@ -414,8 +419,8 @@ def _make_request_stream(sample, language_code=None, max_alternatives=None,
414419
and phrases. This can also be used to add new
415420
words to the vocabulary of the recognizer.
416421
417-
:type single_utterance: boolean
418-
:param single_utterance: [Optional] If false or omitted, the recognizer
422+
:type single_utterance: bool
423+
:param single_utterance: (Optional) If false or omitted, the recognizer
419424
will perform continuous recognition
420425
(continuing to process audio even if the user
421426
pauses speaking) until the client closes the
@@ -432,8 +437,8 @@ def _make_request_stream(sample, language_code=None, max_alternatives=None,
432437
SpeechRecognitionResult with the is_final flag
433438
set to true.
434439
435-
:type interim_results: boolean
436-
:param interim_results: [Optional] If true, interim results (tentative
440+
:type interim_results: bool
441+
:param interim_results: (Optional) If true, interim results (tentative
437442
hypotheses) may be returned as they become
438443
available (these interim results are indicated
439444
with the is_final=false flag). If false or
@@ -452,7 +457,6 @@ def _make_request_stream(sample, language_code=None, max_alternatives=None,
452457
data = sample.stream.read(sample.chunk_size)
453458
if not data:
454459
break
455-
# Optimize the request data size to around 100ms.
456460
yield StreamingRecognizeRequest(audio_content=data)
457461

458462

@@ -466,12 +470,12 @@ def _make_streaming_config(sample, language_code,
466470
:param sample: Instance of ``Sample`` containing audio information.
467471
468472
:type language_code: str
469-
:param language_code: (Optional) The language of the supplied audio as
473+
:param language_code: The language of the supplied audio as
470474
BCP-47 language tag. Example: ``'en-GB'``.
471475
If omitted, defaults to ``'en-US'``.
472476
473477
:type max_alternatives: int
474-
:param max_alternatives: (Optional) Maximum number of recognition
478+
:param max_alternatives: Maximum number of recognition
475479
hypotheses to be returned. The server may
476480
return fewer than maxAlternatives.
477481
Valid values are 0-30. A value of 0 or 1
@@ -492,8 +496,8 @@ def _make_streaming_config(sample, language_code,
492496
and phrases. This can also be used to add new
493497
words to the vocabulary of the recognizer.
494498
495-
:type single_utterance: boolean
496-
:param single_utterance: [Optional] If false or omitted, the recognizer
499+
:type single_utterance: bool
500+
:param single_utterance: If false or omitted, the recognizer
497501
will perform continuous recognition
498502
(continuing to process audio even if the user
499503
pauses speaking) until the client closes the
@@ -510,8 +514,8 @@ def _make_streaming_config(sample, language_code,
510514
SpeechRecognitionResult with the is_final flag
511515
set to true.
512516
513-
:type interim_results: boolean
514-
:param interim_results: [Optional] If true, interim results (tentative
517+
:type interim_results: bool
518+
:param interim_results: If true, interim results (tentative
515519
hypotheses) may be returned as they become
516520
available (these interim results are indicated
517521
with the is_final=false flag). If false or

speech/google/cloud/speech/endpointer_type.py

Whitespace-only changes.

speech/google/cloud/speech/sample.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -77,7 +77,7 @@ def chunk_size(self):
7777
:rtype: int
7878
:returns: Optimized chunk size.
7979
"""
80-
return int(self.sample_rate / 10)
80+
return int(self.sample_rate / 10.0)
8181

8282
@property
8383
def source_uri(self):

speech/google/cloud/speech/streaming_response.py

Lines changed: 19 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,7 @@
1515
"""Representation of a GAPIC Speech API response."""
1616

1717
from google.cloud.speech.streaming_result import StreamingSpeechResult
18+
from google.cloud.gapic.speech.v1beta1.enums import StreamingRecognizeResponse
1819

1920

2021
class StreamingSpeechResponse(object):
@@ -38,7 +39,7 @@ def __init__(self, error=None, endpointer_type=None, results=None,
3839
result_index=None):
3940
results = results or []
4041
self._error = error
41-
self._endpointer_type = EndpointerType.reverse_map.get(
42+
self._endpointer_type = EndpointerType.REVERSE_MAP.get(
4243
endpointer_type, None)
4344
self._result_index = result_index
4445
self._results = [StreamingSpeechResult.from_pb(result)
@@ -91,7 +92,7 @@ def is_final(self):
9192
:returns: True if the result has completed its processing.
9293
"""
9394
if self.results:
94-
return bool(self.results[0].is_final)
95+
return self.results[0].is_final
9596
else:
9697
return False
9798

@@ -123,26 +124,27 @@ def transcript(self):
123124
if self.results and self.results[0].alternatives:
124125
return self.results[0].alternatives[0].transcript
125126
else:
126-
return ''
127+
return None
127128

128129

129-
class EndpointerType(object):
130+
class EndpointerType(StreamingRecognizeResponse.EndpointerType):
130131
"""Endpointer type for tracking state of Speech API detection.
131132
133+
ENDPOINTER_EVENT_UNSPECIFIED (int): No endpointer event specified.
134+
START_OF_SPEECH (int): Speech has been detected in the audio stream.
135+
END_OF_SPEECH (int): Speech has ceased to be detected in the audio
136+
stream.
137+
END_OF_AUDIO (int): The end of the audio stream has been reached and
138+
it is being processed.
139+
END_OF_UTTERANCE (int): This event is only sent when
140+
``single_utterance`` is ``true``. It indicates that the server has
141+
detected the end of the user's speech utterance and expects no
142+
additional speech. Therefore, the server will not process additional
143+
audio. The client should stop sending additional audio data.
144+
132145
See:
133146
https://cloud.google.com/speech/reference/rpc/\
134147
google.cloud.speech.v1beta1#endpointertype
135148
"""
136-
ENDPOINTER_EVENT_UNSPECIFIED = 0
137-
START_OF_SPEECH = 1
138-
END_OF_SPEECH = 2
139-
END_OF_AUDIO = 3
140-
END_OF_UTTERANCE = 4
141-
142-
reverse_map = {
143-
0: 'ENDPOINTER_EVENT_UNSPECIFIED',
144-
1: 'START_OF_SPEECH',
145-
2: 'END_OF_SPEECH',
146-
3: 'END_OF_AUDIO',
147-
4: 'END_OF_UTTERANCE'
148-
}
149+
REVERSE_MAP = {v: k for k, v
150+
in vars(StreamingRecognizeResponse.EndpointerType).items()}

speech/google/cloud/speech/streaming_result.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -70,4 +70,4 @@ def is_final(self):
7070
:rtype: bool
7171
:returns: True if the result has completed its processing.
7272
"""
73-
return bool(self._is_final)
73+
return self._is_final

speech/unit_tests/test_client.py

Lines changed: 14 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -251,19 +251,30 @@ def test_stream_recognize(self):
251251
sample = client.sample(stream=stream,
252252
encoding=Encoding.LINEAR16,
253253
sample_rate=self.SAMPLE_RATE)
254-
results = client.stream_recognize(sample)
254+
responses = client.stream_recognize(sample)
255255

256-
self.assertIsInstance(next(results), StreamingSpeechResponse)
256+
self.assertIsInstance(next(responses), StreamingSpeechResponse)
257257
requests = []
258258
for req in client.speech_api._requests:
259259
requests.append(req)
260260
self.assertEqual(len(requests), 2)
261261

262262

263+
class _MockSpeechGAPICAlternative(object):
264+
transcript = 'hello there!'
265+
confidence = 0.9704365
266+
267+
268+
class _MockSpeechGAPICResult(object):
269+
alternatives = [_MockSpeechGAPICAlternative()]
270+
is_final = False
271+
stability = 0.0
272+
273+
263274
class _MockGAPICSpeechResponse(object):
264275
error = None
265276
endpointer_type = None
266-
results = []
277+
results = [_MockSpeechGAPICResult()]
267278
result_index = 0
268279

269280

speech/unit_tests/test_response.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,7 @@ def test_ctor(self):
3030
self.assertEqual(response.confidence, 0.0)
3131
self.assertEqual(response.endpointer_type, None)
3232
self.assertEqual(response.results, [])
33-
self.assertEqual(response.transcript, '')
33+
self.assertEqual(response.transcript, None)
3434
self.assertFalse(response.is_final)
3535

3636
def test_from_pb(self):

0 commit comments

Comments
 (0)