Add Sample factory to Client.

daspecster · daspecster · commit 04bf28dee7c0 · 2016-10-06T14:20:27.000-04:00
diff --git a/docs/speech-usage.rst b/docs/speech-usage.rst
@@ -45,11 +45,12 @@ See: `Speech Asynchronous Recognize`_
 .. code-block:: python
 
     >>> import time
-    >>> from google.cloud.speech.sample import Sample
+    >>> from google.cloud import speech
     >>> from google.cloud.speech.encoding import Encoding
-    >>> sample = Sample(source_uri='gs://my-bucket/recording.flac',
-    ...                 encoding=Encoding.FLAC,
-    ...                 sample_rate=44100)
+    >>> client = speech.Client()
+    >>> sample = client.sample(source_uri='gs://my-bucket/recording.flac',
+    ...                        encoding=Encoding.FLAC,
+    ...                        sample_rate=44100)
     >>> operation = client.async_recognize(sample, max_alternatives=2)
     >>> retry_count = 100
     >>> while retry_count > 0 and not operation.complete:
@@ -75,11 +76,12 @@ Great Britian.
 
 .. code-block:: python
 
-    >>> from google.cloud.speech.sample import Sample
+    >>> from google.cloud import speech
     >>> from google.cloud.speech.encoding import Encoding
-    >>> sample = Sample(source_uri='gs://my-bucket/recording.flac',
-    ...                 encoding=Encoding.FLAC,
-    ...                 sample_rate=44100)
+    >>> client = speech.Client()
+    >>> sample = client.sample(source_uri='gs://my-bucket/recording.flac',
+    ...                        encoding=Encoding.FLAC,
+    ...                        sample_rate=44100)
     >>> operation = client.async_recognize(sample, max_alternatives=2)
      >>> alternatives = client.sync_recognize(
      ...     'FLAC', 16000, source_uri='gs://my-bucket/recording.flac',
@@ -99,11 +101,12 @@ Example of using the profanity filter.
 
 .. code-block:: python
 
-    >>> from google.cloud.speech.sample import Sample
+    >>> from google.cloud import speech
     >>> from google.cloud.speech.encoding import Encoding
-    >>> sample = Sample(source_uri='gs://my-bucket/recording.flac',
-    ...                 encoding=Encoding.FLAC,
-    ...                 sample_rate=44100)
+    >>> client = speech.Client()
+    >>> sample = client.sample(source_uri='gs://my-bucket/recording.flac',
+    ...                        encoding=Encoding.FLAC,
+    ...                        sample_rate=44100)
     >>> alternatives = client.sync_recognize(sample, max_alternatives=1,
     ...                                      profanity_filter=True)
     >>> for alternative in alternatives:
@@ -120,11 +123,12 @@ words to the vocabulary of the recognizer.
 
 .. code-block:: python
 
-    >>> from google.cloud.speech.sample import Sample
+    >>> from google.cloud import speech
     >>> from google.cloud.speech.encoding import Encoding
-    >>> sample = Sample(source_uri='gs://my-bucket/recording.flac',
-    ...                 encoding=Encoding.FLAC,
-    ...                 sample_rate=44100)
+    >>> client = speech.Client()
+    >>> sample = client.sample(source_uri='gs://my-bucket/recording.flac',
+    ...                        encoding=Encoding.FLAC,
+    ...                        sample_rate=44100)
     >>> hints = ['hi', 'good afternoon']
     >>> alternatives = client.sync_recognize(sample, max_alternatives=2,
     ...                                      speech_context=hints)
diff --git a/speech/google/cloud/speech/client.py b/speech/google/cloud/speech/client.py
@@ -20,6 +20,7 @@
 from google.cloud import client as client_module
 from google.cloud.speech.connection import Connection
 from google.cloud.speech.operation import Operation
+from google.cloud.speech.sample import Sample
 
 
 class Client(client_module.Client):
@@ -97,6 +98,41 @@ def async_recognize(self, sample, language_code=None,
 
         return Operation.from_api_repr(self, api_response)
 
+    @staticmethod
+    def sample(content=None, source_uri=None, encoding=None,
+               sample_rate=None):
+        """Factory: construct Sample to use when making recognize requests.
+
+        :type content: bytes
+        :param content: (Optional) Byte stream of audio.
+
+        :type source_uri: str
+        :param source_uri: (Optional) URI that points to a file that contains
+                           audio data bytes as specified in RecognitionConfig.
+                           Currently, only Google Cloud Storage URIs are
+                           supported, which must be specified in the following
+                           format: ``gs://bucket_name/object_name``.
+
+        :type encoding: str
+        :param encoding: Encoding of audio data sent in all RecognitionAudio
+                         messages. Can be one of: :attr:`~.Encoding.LINEAR16`,
+                         :attr:`~.Encoding.FLAC`, :attr:`~.Encoding.MULAW`,
+                         :attr:`~.Encoding.AMR`, :attr:`~.Encoding.AMR_WB`.
+
+        :type sample_rate: int
+        :param sample_rate: Sample rate in Hertz of the audio data sent in all
+                            requests. Valid values are: 8000-48000. For best
+                            results, set the sampling rate of the audio source
+                            to 16000 Hz. If that's not possible, use the
+                            native sample rate of the audio source (instead of
+                            re-sampling).
+
+        :rtype: :class:`~google.cloud.speech.sample.Sample`
+        :returns: ``Sample`` built from the arguments, passed through as-is.
+        """
+        return Sample(content=content, source_uri=source_uri,
+                      encoding=encoding, sample_rate=sample_rate)
+
     def sync_recognize(self, sample, language_code=None,
                        max_alternatives=None, profanity_filter=None,
                        speech_context=None):
diff --git a/speech/unit_tests/test_client.py b/speech/unit_tests/test_client.py
@@ -19,6 +19,7 @@ class TestClient(unittest.TestCase):
     SAMPLE_RATE = 16000
     HINTS = ['hi']
     AUDIO_SOURCE_URI = 'gs://sample-bucket/sample-recording.flac'
+    AUDIO_CONTENT = '/9j/4QNURXhpZgAASUkq'
 
     def _getTargetClass(self):
         from google.cloud.speech.client import Client
@@ -37,15 +38,36 @@ def test_ctor(self):
         self.assertTrue(client.connection.credentials is creds)
         self.assertTrue(client.connection.http is http)
 
+    def test_create_sample_from_client(self):
+        from google.cloud.speech.encoding import Encoding
+        from google.cloud.speech.sample import Sample
+
+        credentials = _Credentials()
+        client = self._makeOne(credentials=credentials)
+        # Case 1: sample that references its audio through ``source_uri``.
+        sample = client.sample(source_uri=self.AUDIO_SOURCE_URI,
+                               encoding=Encoding.FLAC,
+                               sample_rate=self.SAMPLE_RATE)
+        self.assertIsInstance(sample, Sample)
+        self.assertEqual(sample.source_uri, self.AUDIO_SOURCE_URI)
+        self.assertEqual(sample.sample_rate, self.SAMPLE_RATE)
+        self.assertEqual(sample.encoding, Encoding.FLAC)
+        # Case 2: sample that carries inline ``content`` instead of a URI.
+        content_sample = client.sample(content=self.AUDIO_CONTENT,
+                                       encoding=Encoding.FLAC,
+                                       sample_rate=self.SAMPLE_RATE)
+        self.assertEqual(content_sample.content, self.AUDIO_CONTENT)
+        self.assertEqual(content_sample.sample_rate, self.SAMPLE_RATE)
+        self.assertEqual(content_sample.encoding, Encoding.FLAC)
+
     def test_sync_recognize_content_with_optional_parameters(self):
         import base64
         from google.cloud._helpers import _to_bytes
         from google.cloud.speech.encoding import Encoding
         from google.cloud.speech.sample import Sample
         from unit_tests._fixtures import SYNC_RECOGNIZE_RESPONSE
 
-        _AUDIO_CONTENT = _to_bytes('/9j/4QNURXhpZgAASUkq')
-        _B64_AUDIO_CONTENT = base64.b64encode(_AUDIO_CONTENT)
+        _B64_AUDIO_CONTENT = base64.b64encode(_to_bytes(self.AUDIO_CONTENT))
         RETURNED = SYNC_RECOGNIZE_RESPONSE
         REQUEST = {
             'config': {
@@ -70,7 +92,7 @@ def test_sync_recognize_content_with_optional_parameters(self):
 
         encoding = Encoding.FLAC
 
-        sample = Sample(content=_AUDIO_CONTENT, encoding=encoding,
+        sample = Sample(content=self.AUDIO_CONTENT, encoding=encoding,
                         sample_rate=self.SAMPLE_RATE)
         response = client.sync_recognize(sample,
                                          language_code='EN',