From e5184af54876abdc0499f1959c444e95933ec207 Mon Sep 17 00:00:00 2001
From: Thomas Schultz <daspecster@gmail.com>
Date: Mon, 26 Sep 2016 14:38:48 -0400
Subject: [PATCH 1/4] Add speech asynchronous recognize support.

---
 docs/index.rst                           |   2 +
 docs/speech-client.rst                   |   2 +-
 docs/speech-encoding.rst                 |   7 +
 docs/speech-operation.rst                |   7 +
 docs/speech-usage.rst                    |  38 +++-
 google/cloud/speech/encoding.py          |  39 ++++
 google/cloud/speech/operation.py         | 159 +++++++++++++++
 speech/google/cloud/speech/client.py     | 238 +++++++++++++++++------
 speech/google/cloud/speech/connection.py |   2 +-
 speech/unit_tests/_fixtures.py           |  42 ++++
 speech/unit_tests/test_client.py         |  42 +++-
 speech/unit_tests/test_connection.py     |   6 +-
 unit_tests/speech/test_operation.py      |  93 +++++++++
 13 files changed, 605 insertions(+), 72 deletions(-)
 create mode 100644 docs/speech-encoding.rst
 create mode 100644 docs/speech-operation.rst
 create mode 100644 google/cloud/speech/encoding.py
 create mode 100644 google/cloud/speech/operation.py
 create mode 100644 unit_tests/speech/test_operation.py
diff --git a/docs/index.rst b/docs/index.rst
index f258ba89c2d2..fee7e851ff21 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -173,6 +173,8 @@
 
   speech-usage
   Client <speech-client>
+  speech-encoding
+  speech-operation
 
 .. toctree::
   :maxdepth: 0
diff --git a/docs/speech-client.rst b/docs/speech-client.rst
index 1162e5454a97..1e14b24eeac5 100644
--- a/docs/speech-client.rst
+++ b/docs/speech-client.rst
@@ -1,5 +1,5 @@
 Speech Client
-================
+=============
 
 .. automodule:: google.cloud.speech.client
   :members:
diff --git a/docs/speech-encoding.rst b/docs/speech-encoding.rst
new file mode 100644
index 000000000000..affe80a4ebd2
--- /dev/null
+++ b/docs/speech-encoding.rst
@@ -0,0 +1,7 @@
+Speech Encoding
+===============
+
+.. automodule:: google.cloud.speech.encoding
+  :members:
+  :undoc-members:
+  :show-inheritance:
diff --git a/docs/speech-operation.rst b/docs/speech-operation.rst
new file mode 100644
index 000000000000..5c0ec3b92b12
--- /dev/null
+++ b/docs/speech-operation.rst
@@ -0,0 +1,7 @@
+Speech Operation
+================
+
+.. automodule:: google.cloud.speech.operation
+  :members:
+  :undoc-members:
+  :show-inheritance:
diff --git a/docs/speech-usage.rst b/docs/speech-usage.rst
index 57e274608b40..b7b55e4a49c4 100644
--- a/docs/speech-usage.rst
+++ b/docs/speech-usage.rst
@@ -2,7 +2,8 @@ Using the API
 =============
 
 The `Google Speech`_ API enables developers to convert audio to text.
-The API recognizes over 80 languages and variants, to support your global user base.
+The API recognizes over 80 languages and variants, to support your global user
+base.
 
 .. warning::
 
@@ -30,11 +31,41 @@ create an instance of :class:`~google.cloud.speech.client.Client`.
      >>> client = speech.Client()
 
 
+Asychronous Recognition
+-----------------------
+
+The :meth:`~google.cloud.speech.Client.async_recognize` sends audio data to the
+Speech API and initiates a Long Running Operation. Using this operation, you
+can periodically poll for recognition results. Use asynchronous requests for
+audio data of any duration up to 80 minutes.
+
+See: `Speech Asynchronous Recognize`_
+
+
+  .. code-block:: python
+
+      >>> import time
+      >>> operation = client.async_recognize(
+      ...     None, 'gs://my-bucket/recording.flac',
+      ...     'FLAC', 16000, max_alternatives=2)
+      >>> retry_count = 100
+      >>> while retry_count > 0 and not operation.complete:
+      ...     retry_count -= 1
+      ...     time.sleep(10)
+      ...     operation.poll()  # API call
+      >>> operation.complete
+      True
+      >>> operation.results[0]['alternatives'][0]['transcript']
+      "how old is the Brooklyn Bridge"
+      >>> operation.results[0]['alternatives'][0]['confidence']
+      0.98267895
+
+
 Synchronous Recognition
 -----------------------
 
-The :meth:`~google.cloud.speech.Client.sync_recognize` method converts speech data to text
-and returns alternative text transcriptons.
+The :meth:`~google.cloud.speech.Client.sync_recognize` method converts speech
+data to text and returns alternative text transcriptons.
 
   .. code-block:: python
 
@@ -53,3 +84,4 @@ and returns alternative text transcriptons.
      confidence: 0
 
 .. _sync_recognize: https://cloud.google.com/speech/reference/rest/v1beta1/speech/syncrecognize
+.. _Speech Asynchronous Recognize: https://cloud.google.com/speech/reference/rest/v1beta1/speech/asyncrecognize
diff --git a/google/cloud/speech/encoding.py b/google/cloud/speech/encoding.py
new file mode 100644
index 000000000000..4fdaa3367834
--- /dev/null
+++ b/google/cloud/speech/encoding.py
@@ -0,0 +1,39 @@
+# Copyright 2016 Google Inc. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Encodings used by the Google Cloud Speech API."""
+
+
+class Encoding(object):
+    """Audio encoding types.
+
+    See:
+    https://cloud.google.com/speech/reference/rest/v1beta1/\
+    RecognitionConfig#AudioEncoding
+    """
+
+    LINEAR16 = 'LINEAR16'
+    """LINEAR16 encoding type."""
+
+    FLAC = 'FLAC'
+    """FLAC encoding type."""
+
+    MULAW = 'MULAW'
+    """MULAW encoding type."""
+
+    AMR = 'AMR'
+    """AMR encoding type."""
+
+    AMR_WB = 'AMR_WB'
+    """AMR_WB encoding type."""
diff --git a/google/cloud/speech/operation.py b/google/cloud/speech/operation.py
new file mode 100644
index 000000000000..b623ba637c79
--- /dev/null
+++ b/google/cloud/speech/operation.py
@@ -0,0 +1,159 @@
+# Copyright 2016 Google Inc. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Long running operation representation for Google Speech API"""
+
+from google.cloud._helpers import _rfc3339_to_datetime
+
+
+class Operation(object):
+    """Representation of a Google API Long-Running Operation.
+
+    :type name: int
+    :param name: ID assigned to an operation.
+
+    :type complete: bool
+    :param complete: True if operation is complete, else False.
+
+    :type last_updated: datetime
+    :param last_updated: The last time the operation was updated.
+
+    :type progress_percent: int
+    :param progress_percent: Percentage of operation that has been completed.
+
+    :type results: dict
+    :param results: Dictionary with transcript and score of operation.
+
+    :type start_time: datetime
+    :param start_time: Datetime when operation was started.
+    """
+    def __init__(self, client, name, complete=False, last_updated=None,
+                 progress_percent=0, results=None, start_time=None):
+        self.client = client
+        self.name = name
+        self._complete = complete
+        self._last_updated = last_updated
+        self._progress_percent = progress_percent
+        self._results = results
+        self._start_time = start_time
+
+    @classmethod
+    def from_api_repr(cls, client, response):
+        """Factory:  construct an instance from Google Speech API.
+
+        :type response: dict
+        :param response: Dictionary response from Google Speech Operations API.
+
+        :rtype: :class:`Operation`
+        :returns: Instance of `~google.cloud.speech.operations.Operation`.
+        """
+        last_updated = None
+        progress_percent = 0
+        results = None
+        start_time = None
+
+        name = response['name']
+        metadata = response.get('metadata', None)
+
+        if metadata:
+            last_updated = _rfc3339_to_datetime(metadata.get('lastUpdateTime'))
+            start_time = _rfc3339_to_datetime(metadata.get('startTime'))
+            progress_percent = metadata.get('progressPercent')
+
+        if response.get('response'):
+            results = response.get('response').get('results')
+        complete = response.get('done', False)
+
+        return cls(client, name, complete, last_updated, progress_percent,
+                   results, start_time)
+
+    @property
+    def complete(self):
+        """Completion state of the `Operation`.
+
+        :rtype: bool
+        :returns: True if already completed, else false.
+        """
+        return self._complete
+
+    @property
+    def last_updated(self):
+        """Operation last updated time.
+
+        :rtype: datetime
+        :returns: RFC3339 last updated time of the operation.
+        """
+        return self._last_updated
+
+    @property
+    def progress_percent(self):
+        """Progress percentage of operation.
+
+        :rtype: int
+        :returns: Percentage of operation completed. [0-100]
+        """
+        return self._progress_percent
+
+    @property
+    def results(self):
+        """Results dictionary with transcript information.
+
+        :rtype: dict
+        :returns: Dictionary with transcript and confidence score.
+        """
+        return self._results
+
+    @property
+    def start_time(self):
+        """Operation start time.
+
+        :rtype: datetime
+        :returns: RFC3339 start time of the operation.
+        """
+        return self._start_time
+
+    def poll(self):
+        """Check if the operation has finished.
+
+        :rtype: bool
+        :returns: A boolean indicating if the current operation has completed.
+        :raises: :class:`ValueError <exceptions.ValueError>` if the operation
+                 has already completed.
+        """
+        if self.complete:
+            raise ValueError('The operation has completed.')
+
+        path = 'operations/%s' % (self.name,)
+        api_response = self.client.connection.api_request(method='GET',
+                                                          path=path)
+        self._update(api_response)
+        return self.complete
+
+    def _update(self, response):
+        """Update Operation instance with latest data from Speech API.
+
+        .. _speech_operations: https://cloud.google.com/speech/reference/\
+                               rest/v1beta1/operations
+
+        :type response: dict
+        :param response: Response from Speech API Operations endpoint.
+                         See: `speech_operations`_.
+        """
+        metadata = response['metadata']
+        results = response.get('response', {}).get('results')
+        self._last_updated = _rfc3339_to_datetime(metadata['lastUpdateTime'])
+        self._results = results
+        self._start_time = _rfc3339_to_datetime(metadata['startTime'])
+        self._complete = response.get('done', False)
+        self._progress_percent = metadata.get('progressPercent', 0)
diff --git a/speech/google/cloud/speech/client.py b/speech/google/cloud/speech/client.py
index 7f30b06c05ba..8226fd76c644 100644
--- a/speech/google/cloud/speech/client.py
+++ b/speech/google/cloud/speech/client.py
@@ -19,30 +19,8 @@
 from google.cloud._helpers import _to_bytes
 from google.cloud import client as client_module
 from google.cloud.speech.connection import Connection
-
-
-class Encoding(object):
-    """Audio encoding types.
-
-    See:
-    https://cloud.google.com/speech/reference/rest/v1beta1/\
-    RecognitionConfig#AudioEncoding
-    """
-
-    LINEAR16 = 'LINEAR16'
-    """LINEAR16 encoding type."""
-
-    FLAC = 'FLAC'
-    """FLAC encoding type."""
-
-    MULAW = 'MULAW'
-    """MULAW encoding type."""
-
-    AMR = 'AMR'
-    """AMR encoding type."""
-
-    AMR_WB = 'AMR_WB'
-    """AMR_WB encoding type."""
+from google.cloud.speech.encoding import Encoding
+from google.cloud.speech.operation import Operation
 
 
 class Client(client_module.Client):
@@ -68,6 +46,81 @@ class Client(client_module.Client):
 
     _connection_class = Connection
 
+    def async_recognize(self, content, source_uri, encoding, sample_rate,
+                        language_code=None, max_alternatives=None,
+                        profanity_filter=None, speech_context=None):
+        """Asychronous Recognize request to Google Speech API.
+
+        .. _async_recognize: https://cloud.google.com/speech/reference/\
+                             rest/v1beta1/speech/asyncrecognize
+
+        See `async_recognize`_.
+
+        :type content: bytes
+        :param content: Byte stream of audio.
+
+        :type source_uri: str
+        :param source_uri: URI that points to a file that contains audio
+                           data bytes as specified in RecognitionConfig.
+                           Currently, only Google Cloud Storage URIs are
+                           supported, which must be specified in the following
+                           format: ``gs://bucket_name/object_name``.
+
+        :type encoding: str
+        :param encoding: encoding of audio data sent in all RecognitionAudio
+                         messages, can be one of: :attr:`~.Encoding.LINEAR16`,
+                         :attr:`~.Encoding.FLAC`, :attr:`~.Encoding.MULAW`,
+                         :attr:`~.Encoding.AMR`, :attr:`~.Encoding.AMR_WB`
+
+        :type sample_rate: int
+        :param sample_rate: Sample rate in Hertz of the audio data sent in all
+                            requests. Valid values are: 8000-48000. For best
+                            results, set the sampling rate of the audio source
+                            to 16000 Hz. If that's not possible, use the
+                            native sample rate of the audio source (instead of
+                            re-sampling).
+
+        :type language_code: str
+        :param language_code: (Optional) The language of the supplied audio as
+                              BCP-47 language tag. Example: ``'en-GB'``.
+                              If omitted, defaults to ``'en-US'``.
+
+        :type max_alternatives: int
+        :param max_alternatives: (Optional) Maximum number of recognition
+                                 hypotheses to be returned. The server may
+                                 return fewer than maxAlternatives.
+                                 Valid values are 0-30. A value of 0 or 1
+                                 will return a maximum of 1. Defaults to 1
+
+        :type profanity_filter: bool
+        :param profanity_filter: If True, the server will attempt to filter
+                                 out profanities, replacing all but the
+                                 initial character in each filtered word with
+                                 asterisks, e.g. ``'f***'``. If False or
+                                 omitted, profanities won't be filtered out.
+
+        :type speech_context: list
+        :param speech_context: A list of strings (max 50) containing words and
+                               phrases "hints" so that the speech recognition
+                               is more likely to recognize them. This can be
+                               used to improve the accuracy for specific words
+                               and phrases. This can also be used to add new
+                               words to the vocabulary of the recognizer.
+
+        :rtype: `~google.cloud.speech.operation.Operation`
+        :returns: ``Operation`` for asynchronous request to Google Speech API.
+        """
+
+        data = _build_request_data(content, source_uri, encoding,
+                                   sample_rate, language_code,
+                                   max_alternatives, profanity_filter,
+                                   speech_context)
+
+        api_response = self.connection.api_request(
+            method='POST', path='speech:asyncrecognize', data=data)
+
+        return Operation.from_api_repr(self, api_response)
+
     def sync_recognize(self, content, source_uri, encoding, sample_rate,
                        language_code=None, max_alternatives=None,
                        profanity_filter=None, speech_context=None):
@@ -139,44 +192,115 @@ def sync_recognize(self, content, source_uri, encoding, sample_rate,
                     between 0 and 1.
         """
 
-        if content is None and source_uri is None:
-            raise ValueError('content and source_uri cannot be both '
-                             'equal to None')
-
-        if content is not None and source_uri is not None:
-            raise ValueError('content and source_uri cannot be both '
-                             'different from None')
+        data = _build_request_data(content, source_uri, encoding,
+                                   sample_rate, language_code,
+                                   max_alternatives, profanity_filter,
+                                   speech_context)
 
-        if encoding is None:
-            raise ValueError('encoding cannot be None')
-        if sample_rate is None:
-            raise ValueError('sample_rate cannot be None')
+        api_response = self.connection.api_request(
+            method='POST', path='speech:syncrecognize', data=data)
 
-        if content is not None:
-            audio = {'content': b64encode(_to_bytes(content))}
+        if len(api_response['results']) == 1:
+            return api_response['results'][0]['alternatives']
         else:
-            audio = {'uri': source_uri}
+            raise ValueError('result in api should have length 1')
 
-        config = {'encoding': encoding, 'sampleRate': sample_rate}
 
-        if language_code is not None:
-            config['languageCode'] = language_code
-        if max_alternatives is not None:
-            config['maxAlternatives'] = max_alternatives
-        if profanity_filter is not None:
-            config['profanityFilter'] = profanity_filter
-        if speech_context is not None:
-            config['speechContext'] = {'phrases': speech_context}
+def _build_request_data(content, source_uri, encoding, sample_rate,
+                        language_code=None, max_alternatives=None,
+                        profanity_filter=None, speech_context=None):
+    """Builds the request data before making API request.
+
+    :type content: bytes
+    :param content: Byte stream of audio.
+
+    :type source_uri: str
+    :param source_uri: URI that points to a file that contains audio
+                       data bytes as specified in RecognitionConfig.
+                       Currently, only Google Cloud Storage URIs are
+                       supported, which must be specified in the following
+                       format: ``gs://bucket_name/object_name``.
+
+    :type encoding: str
+    :param encoding: encoding of audio data sent in all RecognitionAudio
+                     messages, can be one of: :attr:`~.Encoding.LINEAR16`,
+                     :attr:`~.Encoding.FLAC`, :attr:`~.Encoding.MULAW`,
+                     :attr:`~.Encoding.AMR`, :attr:`~.Encoding.AMR_WB`
+
+    :type sample_rate: int
+    :param sample_rate: Sample rate in Hertz of the audio data sent in all
+                        requests. Valid values are: 8000-48000. For best
+                        results, set the sampling rate of the audio source
+                        to 16000 Hz. If that's not possible, use the
+                        native sample rate of the audio source (instead of
+                        re-sampling).
+
+    :type language_code: str
+    :param language_code: (Optional) The language of the supplied audio as
+                          BCP-47 language tag. Example: ``'en-GB'``.
+                          If omitted, defaults to ``'en-US'``.
+
+    :type max_alternatives: int
+    :param max_alternatives: (Optional) Maximum number of recognition
+                             hypotheses to be returned. The server may
+                             return fewer than maxAlternatives.
+                             Valid values are 0-30. A value of 0 or 1
+                             will return a maximum of 1. Defaults to 1
+
+    :type profanity_filter: bool
+    :param profanity_filter: If True, the server will attempt to filter
+                             out profanities, replacing all but the
+                             initial character in each filtered word with
+                             asterisks, e.g. ``'f***'``. If False or
+                             omitted, profanities won't be filtered out.
+
+    :type speech_context: list
+    :param speech_context: A list of strings (max 50) containing words and
+                           phrases "hints" so that the speech recognition
+                           is more likely to recognize them. This can be
+                           used to improve the accuracy for specific words
+                           and phrases. This can also be used to add new
+                           words to the vocabulary of the recognizer.
+
+    :rtype: dict
+    :returns: Dictionary with required data for Google Speech API.
+    """
+    if content is None and source_uri is None:
+        raise ValueError('content and source_uri cannot be both '
+                         'equal to None')
 
-        data = {
-            'audio': audio,
-            'config': config,
-        }
+    if content is not None and source_uri is not None:
+        raise ValueError('content and source_uri cannot be both '
+                         'different from None')
 
-        api_response = self.connection.api_request(
-            method='POST', path='syncrecognize', data=data)
+    if encoding is None:
+        raise ValueError('encoding cannot be None')
 
-        if len(api_response['results']) == 1:
-            return api_response['results'][0]['alternatives']
-        else:
-            raise ValueError('result in api should have length 1')
+    encoding_value = getattr(Encoding, encoding)
+
+    if sample_rate is None:
+        raise ValueError('sample_rate cannot be None')
+
+    if content is not None:
+        audio = {'content': b64encode(_to_bytes(content))}
+    else:
+        audio = {'uri': source_uri}
+
+    config = {'encoding': encoding_value,
+              'sampleRate': sample_rate}
+
+    if language_code is not None:
+        config['languageCode'] = language_code
+    if max_alternatives is not None:
+        config['maxAlternatives'] = max_alternatives
+    if profanity_filter is not None:
+        config['profanityFilter'] = profanity_filter
+    if speech_context is not None:
+        config['speechContext'] = {'phrases': speech_context}
+
+    data = {
+        'audio': audio,
+        'config': config,
+    }
+
+    return data
diff --git a/speech/google/cloud/speech/connection.py b/speech/google/cloud/speech/connection.py
index 3decf19290d8..d74d729344e8 100644
--- a/speech/google/cloud/speech/connection.py
+++ b/speech/google/cloud/speech/connection.py
@@ -26,7 +26,7 @@ class Connection(base_connection.JSONConnection):
     API_VERSION = 'v1beta1'
     """The version of the API, used in building the API call's URL."""
 
-    API_URL_TEMPLATE = '{api_base_url}/{api_version}/speech:{path}'
+    API_URL_TEMPLATE = '{api_base_url}/{api_version}/{path}'
     """A template for the URL of a particular API call."""
 
     SCOPE = ('https://www.googleapis.com/auth/cloud-platform',)
diff --git a/speech/unit_tests/_fixtures.py b/speech/unit_tests/_fixtures.py
index 9665fef535d8..41d7da711148 100644
--- a/speech/unit_tests/_fixtures.py
+++ b/speech/unit_tests/_fixtures.py
@@ -28,3 +28,45 @@
 SYNC_RECOGNIZE_EMPTY_RESPONSE = {
     'results': [],
 }
+
+ASYNC_RECOGNIZE_RESPONSE = {
+    'name': '123456789'
+}
+
+OPERATION_COMPLETE_RESPONSE = {
+    'name': '123456789',
+    'metadata': {
+        '@type': ('type.googleapis.com/'
+                  'google.cloud.speech.v1beta1.AsyncRecognizeMetadata'),
+        'progressPercent': 100,
+        'startTime': '2016-09-22T17:52:25.536964Z',
+        'lastUpdateTime': '2016-09-22T17:52:27.802902Z'
+    },
+    'done': True,
+    'response': {
+        '@type': ('type.googleapis.com/'
+                  'google.cloud.speech.v1beta1.AsyncRecognizeResponse'),
+        'results': [
+            {
+                'alternatives': [
+                    {
+                        'transcript': 'how old is the Brooklyn Bridge',
+                        'confidence': 0.98267895
+                    }
+                ]
+            }
+        ]
+    }
+}
+
+OPERATION_INCOMPLETE_RESPONSE = {
+    'name': '123456789',
+    'metadata': {
+        '@type': ('type.googleapis.com/'
+                  'google.cloud.speech.v1beta1.AsyncRecognizeMetadata'),
+        'progressPercent': 27,
+        'startTime': '2016-09-22T17:52:25.536964Z',
+        'lastUpdateTime': '2016-09-22T17:52:27.802902Z'
+    },
+    'done': False
+}
diff --git a/speech/unit_tests/test_client.py b/speech/unit_tests/test_client.py
index 53e1eb67b89e..b73ffece41da 100644
--- a/speech/unit_tests/test_client.py
+++ b/speech/unit_tests/test_client.py
@@ -40,8 +40,8 @@ def test_ctor(self):
     def test_sync_recognize_content_with_optional_parameters(self):
         import base64
         from google.cloud._helpers import _to_bytes
-        from google.cloud.speech.client import Encoding
-        from unit_tests._fixtures import SYNC_RECOGNIZE_RESPONSE
+        from google.cloud.speech.encoding import Encoding
+        from unit_tests.speech._fixtures import SYNC_RECOGNIZE_RESPONSE
 
         _AUDIO_CONTENT = _to_bytes('/9j/4QNURXhpZgAASUkq')
         _B64_AUDIO_CONTENT = base64.b64encode(_AUDIO_CONTENT)
@@ -82,14 +82,19 @@ def test_sync_recognize_content_with_optional_parameters(self):
         self.assertEqual(len(req), 3)
         self.assertEqual(req['data'], REQUEST)
         self.assertEqual(req['method'], 'POST')
-        self.assertEqual(req['path'], 'syncrecognize')
+        self.assertEqual(req['path'], 'speech:syncrecognize')
 
         expected = SYNC_RECOGNIZE_RESPONSE['results'][0]['alternatives']
         self.assertEqual(response, expected)
 
     def test_sync_recognize_source_uri_without_optional_parameters(self):
+<<<<<<< b7f004e00f1ee021b0cb7ac9261fcc6c021dfacb:speech/unit_tests/test_client.py
         from google.cloud.speech.client import Encoding
         from unit_tests._fixtures import SYNC_RECOGNIZE_RESPONSE
+=======
+        from google.cloud.speech.encoding import Encoding
+        from unit_tests.speech._fixtures import SYNC_RECOGNIZE_RESPONSE
+>>>>>>> Add speech asynchronous recognize support.:unit_tests/speech/test_client.py
 
         RETURNED = SYNC_RECOGNIZE_RESPONSE
         REQUEST = {
@@ -116,13 +121,13 @@ def test_sync_recognize_source_uri_without_optional_parameters(self):
         self.assertEqual(len(req), 3)
         self.assertEqual(req['data'], REQUEST)
         self.assertEqual(req['method'], 'POST')
-        self.assertEqual(req['path'], 'syncrecognize')
+        self.assertEqual(req['path'], 'speech:syncrecognize')
 
         expected = SYNC_RECOGNIZE_RESPONSE['results'][0]['alternatives']
         self.assertEqual(response, expected)
 
     def test_sync_recognize_without_content_or_source_uri(self):
-        from google.cloud.speech.client import Encoding
+        from google.cloud.speech.encoding import Encoding
 
         credentials = _Credentials()
         client = self._makeOne(credentials=credentials)
@@ -132,7 +137,7 @@ def test_sync_recognize_without_content_or_source_uri(self):
 
     def test_sync_recognize_with_content_and_source_uri(self):
         from google.cloud._helpers import _to_bytes
-        from google.cloud.speech.client import Encoding
+        from google.cloud.speech.encoding import Encoding
         _AUDIO_CONTENT = _to_bytes('/9j/4QNURXhpZgAASUkq')
 
         credentials = _Credentials()
@@ -151,7 +156,7 @@ def test_sync_recognize_without_encoding(self):
                                   self.SAMPLE_RATE)
 
     def test_sync_recognize_without_samplerate(self):
-        from google.cloud.speech.client import Encoding
+        from google.cloud.speech.encoding import Encoding
 
         credentials = _Credentials()
         client = self._makeOne(credentials=credentials)
@@ -161,8 +166,13 @@ def test_sync_recognize_without_samplerate(self):
                                   None)
 
     def test_sync_recognize_with_empty_results(self):
+<<<<<<< b7f004e00f1ee021b0cb7ac9261fcc6c021dfacb:speech/unit_tests/test_client.py
         from google.cloud.speech.client import Encoding
         from unit_tests._fixtures import SYNC_RECOGNIZE_EMPTY_RESPONSE
+=======
+        from google.cloud.speech.encoding import Encoding
+        from unit_tests.speech._fixtures import SYNC_RECOGNIZE_EMPTY_RESPONSE
+>>>>>>> Add speech asynchronous recognize support.:unit_tests/speech/test_client.py
 
         credentials = _Credentials()
         client = self._makeOne(credentials=credentials)
@@ -172,6 +182,24 @@ def test_sync_recognize_with_empty_results(self):
             client.sync_recognize(None, self.AUDIO_SOURCE_URI, Encoding.FLAC,
                                   self.SAMPLE_RATE)
 
+    def test_async_recognize(self):
+        from unit_tests.speech._fixtures import ASYNC_RECOGNIZE_RESPONSE
+        from google.cloud.speech.encoding import Encoding
+        from google.cloud.speech.operation import Operation
+        RETURNED = ASYNC_RECOGNIZE_RESPONSE
+
+        credentials = _Credentials()
+        client = self._makeOne(credentials=credentials)
+        client.connection = _Connection(RETURNED)
+
+        encoding = Encoding.FLAC
+
+        operation = client.async_recognize(None, self.AUDIO_SOURCE_URI,
+                                           encoding,
+                                           self.SAMPLE_RATE)
+        self.assertIsInstance(operation, Operation)
+        self.assertFalse(operation.complete)
+
 
 class _Credentials(object):
 
diff --git a/speech/unit_tests/test_connection.py b/speech/unit_tests/test_connection.py
index ea9471dc4937..0de94cb1d7c1 100644
--- a/speech/unit_tests/test_connection.py
+++ b/speech/unit_tests/test_connection.py
@@ -26,11 +26,11 @@ def _makeOne(self, *args, **kw):
 
     def test_build_api_url(self):
         conn = self._makeOne()
+        method = 'speech:syncrecognize'
         uri = '/'.join([
             conn.API_BASE_URL,
             conn.API_VERSION,
-            'speech',
+            method,
         ])
-        method = 'syncrecognize'
-        uri += ':' + method
+
         self.assertEqual(conn.build_api_url(method), uri)
diff --git a/unit_tests/speech/test_operation.py b/unit_tests/speech/test_operation.py
new file mode 100644
index 000000000000..a616064043af
--- /dev/null
+++ b/unit_tests/speech/test_operation.py
@@ -0,0 +1,93 @@
+import unittest
+
+
+class OperationTests(unittest.TestCase):
+
+    OPERATION_NAME = '123456789'
+
+    def _getTargetClass(self):
+        from google.cloud.speech.operation import Operation
+        return Operation
+
+    def _makeOne(self, *args, **kwargs):
+        return self._getTargetClass()(*args, **kwargs)
+
+    def test_ctor_defaults(self):
+        client = _Client()
+        operation = self._makeOne(client, self.OPERATION_NAME)
+        self.assertEqual('123456789', operation.name)
+        self.assertFalse(operation.complete)
+        self.assertIsNone(operation.last_updated)
+        self.assertEqual(0, operation.progress_percent)
+        self.assertIsNone(operation.results)
+        self.assertIsNone(operation.start_time)
+
+    def test_from_api_repr(self):
+        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        RESPONSE = OPERATION_COMPLETE_RESPONSE
+
+        client = _Client()
+        connection = _Connection(OPERATION_COMPLETE_RESPONSE)
+        client.connection = connection
+        operation = self._getTargetClass().from_api_repr(client, RESPONSE)
+
+        self.assertEqual('123456789', operation.name)
+        self.assertTrue(operation.complete)
+
+        alternatives = operation.results[0]['alternatives']
+
+        self.assertEqual('how old is the Brooklyn Bridge',
+                         alternatives[0]['transcript'])
+        self.assertEqual(0.98267895, alternatives[0]['confidence'])
+        self.assertTrue(operation.complete)
+
+    def test_update_response(self):
+        from unit_tests.speech._fixtures import ASYNC_RECOGNIZE_RESPONSE
+        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        RESPONSE = ASYNC_RECOGNIZE_RESPONSE
+
+        client = _Client()
+        connection = _Connection(OPERATION_COMPLETE_RESPONSE)
+        client.connection = connection
+        operation = self._getTargetClass().from_api_repr(client, RESPONSE)
+        self.assertEqual('123456789', operation.name)
+
+        operation._update(OPERATION_COMPLETE_RESPONSE)
+        self.assertTrue(operation.complete)
+
+    def test_poll(self):
+        from unit_tests.speech._fixtures import ASYNC_RECOGNIZE_RESPONSE
+        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        RESPONSE = ASYNC_RECOGNIZE_RESPONSE
+        client = _Client()
+        connection = _Connection(OPERATION_COMPLETE_RESPONSE)
+        client.connection = connection
+
+        operation = self._getTargetClass().from_api_repr(client, RESPONSE)
+        self.assertFalse(operation.complete)
+        operation.poll()
+        self.assertTrue(operation.complete)
+
+    def test_poll_complete(self):
+        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        RESPONSE = OPERATION_COMPLETE_RESPONSE
+        client = _Client()
+        connection = _Connection(OPERATION_COMPLETE_RESPONSE)
+        client.connection = connection
+
+        operation = self._getTargetClass().from_api_repr(client, RESPONSE)
+        self.assertTrue(operation.complete)
+        with self.assertRaises(ValueError):
+            operation.poll()
+
+
+class _Connection(object):
+    def __init__(self, response):
+        self.response = response
+
+    def api_request(self, method, path):
+        return self.response
+
+
+class _Client(object):
+    connection = None

From 92b2b89bb84eebd8b9b7ee1d91920286ad24bb41 Mon Sep 17 00:00:00 2001
From: Thomas Schultz <daspecster@gmail.com>
Date: Tue, 27 Sep 2016 10:16:29 -0400
Subject: [PATCH 2/4] Remove 'alternatives' key when accessing results.

---
 docs/speech-usage.rst               |  6 +--
 google/cloud/speech/operation.py    | 74 ++++++++++++++++++++---------
 speech/unit_tests/_fixtures.py      | 16 +++----
 unit_tests/speech/test_operation.py | 10 ++--
 4 files changed, 69 insertions(+), 37 deletions(-)

diff --git a/docs/speech-usage.rst b/docs/speech-usage.rst
index b7b55e4a49c4..509c59b1b579 100644
--- a/docs/speech-usage.rst
+++ b/docs/speech-usage.rst
@@ -55,9 +55,9 @@ See: `Speech Asynchronous Recognize`_
       ...     operation.poll()  # API call
       >>> operation.complete
       True
-      >>> operation.results[0]['alternatives'][0]['transcript']
-      "how old is the Brooklyn Bridge"
-      >>> operation.results[0]['alternatives'][0]['confidence']
+      >>> operation.results[0].transcript
+      'how old is the Brooklyn Bridge'
+      >>> operation.results[0].confidence
       0.98267895
 
 
diff --git a/google/cloud/speech/operation.py b/google/cloud/speech/operation.py
index b623ba637c79..56515d0102e0 100644
--- a/google/cloud/speech/operation.py
+++ b/google/cloud/speech/operation.py
@@ -15,11 +15,15 @@
 """Long running operation representation for Google Speech API"""
 
 from google.cloud._helpers import _rfc3339_to_datetime
+from google.cloud import operation
 
 
-class Operation(object):
+class Operation(operation.Operation):
     """Representation of a Google API Long-Running Operation.
 
+    :type client: :class:`~google.cloud.speech.client.Client`
+    :param client: Instance of speech client.
+
     :type name: int
     :param name: ID assigned to an operation.
 
@@ -52,31 +56,21 @@ def __init__(self, client, name, complete=False, last_updated=None,
     def from_api_repr(cls, client, response):
         """Factory:  construct an instance from Google Speech API.
 
+        :type client: :class:`~google.cloud.speech.client.Client`
+        :param client: Instance of speech client.
+
         :type response: dict
         :param response: Dictionary response from Google Speech Operations API.
 
         :rtype: :class:`Operation`
         :returns: Instance of `~google.cloud.speech.operations.Operation`.
         """
-        last_updated = None
-        progress_percent = 0
-        results = None
-        start_time = None
-
         name = response['name']
-        metadata = response.get('metadata', None)
-
-        if metadata:
-            last_updated = _rfc3339_to_datetime(metadata.get('lastUpdateTime'))
-            start_time = _rfc3339_to_datetime(metadata.get('startTime'))
-            progress_percent = metadata.get('progressPercent')
-
-        if response.get('response'):
-            results = response.get('response').get('results')
         complete = response.get('done', False)
 
-        return cls(client, name, complete, last_updated, progress_percent,
-                   results, start_time)
+        operation_instance = cls(client, name, complete)
+        operation_instance._update(response)
+        return operation_instance
 
     @property
     def complete(self):
@@ -150,10 +144,46 @@ def _update(self, response):
         :param response: Response from Speech API Operations endpoint.
                          See: `speech_operations`_.
         """
-        metadata = response['metadata']
-        results = response.get('response', {}).get('results')
-        self._last_updated = _rfc3339_to_datetime(metadata['lastUpdateTime'])
+        metadata = response.get('metadata', None)
+        raw_results = response.get('response', {}).get('results', None)
+        results = []
+        if raw_results:
+            for result in raw_results[0]['alternatives']:
+                results.append(Transcript(result))
+        if metadata:
+            self._last_updated = _rfc3339_to_datetime(
+                metadata['lastUpdateTime'])
+            self._start_time = _rfc3339_to_datetime(metadata['startTime'])
+            self._progress_percent = metadata.get('progressPercent', 0)
+
         self._results = results
-        self._start_time = _rfc3339_to_datetime(metadata['startTime'])
         self._complete = response.get('done', False)
-        self._progress_percent = metadata.get('progressPercent', 0)
+
+
+class Transcript(object):
+    """Representation of Speech Transcripts
+
+    :type result: dict
+    :param result: Dictionary of transcript and confidence of recognition.
+    """
+    def __init__(self, result):
+        self._transcript = result.get('transcript')
+        self._confidence = result.get('confidence')
+
+    @property
+    def transcript(self):
+        """Transcript text from audio.
+
+        :rtype: str
+        :returns: Text detected in audio.
+        """
+        return self._transcript
+
+    @property
+    def confidence(self):
+        """Confidence score for recognized speech.
+
+        :rtype: float
+        :returns: Confidence score of recognized speech [0-1].
+        """
+        return self._confidence
diff --git a/speech/unit_tests/_fixtures.py b/speech/unit_tests/_fixtures.py
index 41d7da711148..7980ed862038 100644
--- a/speech/unit_tests/_fixtures.py
+++ b/speech/unit_tests/_fixtures.py
@@ -40,7 +40,7 @@
                   'google.cloud.speech.v1beta1.AsyncRecognizeMetadata'),
         'progressPercent': 100,
         'startTime': '2016-09-22T17:52:25.536964Z',
-        'lastUpdateTime': '2016-09-22T17:52:27.802902Z'
+        'lastUpdateTime': '2016-09-22T17:52:27.802902Z',
     },
     'done': True,
     'response': {
@@ -52,11 +52,11 @@
                     {
                         'transcript': 'how old is the Brooklyn Bridge',
                         'confidence': 0.98267895
-                    }
-                ]
-            }
-        ]
-    }
+                    },
+                ],
+            },
+        ],
+    },
 }
 
 OPERATION_INCOMPLETE_RESPONSE = {
@@ -66,7 +66,7 @@
                   'google.cloud.speech.v1beta1.AsyncRecognizeMetadata'),
         'progressPercent': 27,
         'startTime': '2016-09-22T17:52:25.536964Z',
-        'lastUpdateTime': '2016-09-22T17:52:27.802902Z'
+        'lastUpdateTime': '2016-09-22T17:52:27.802902Z',
     },
-    'done': False
+    'done': False,
 }
diff --git a/unit_tests/speech/test_operation.py b/unit_tests/speech/test_operation.py
index a616064043af..e44a29084aab 100644
--- a/unit_tests/speech/test_operation.py
+++ b/unit_tests/speech/test_operation.py
@@ -24,6 +24,7 @@ def test_ctor_defaults(self):
 
     def test_from_api_repr(self):
         from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        from google.cloud.speech.operation import Transcript
         RESPONSE = OPERATION_COMPLETE_RESPONSE
 
         client = _Client()
@@ -34,11 +35,10 @@ def test_from_api_repr(self):
         self.assertEqual('123456789', operation.name)
         self.assertTrue(operation.complete)
 
-        alternatives = operation.results[0]['alternatives']
-
+        self.assertIsInstance(operation.results[0], Transcript)
         self.assertEqual('how old is the Brooklyn Bridge',
-                         alternatives[0]['transcript'])
-        self.assertEqual(0.98267895, alternatives[0]['confidence'])
+                         operation.results[0].transcript)
+        self.assertEqual(0.98267895, operation.results[0].confidence)
         self.assertTrue(operation.complete)
 
     def test_update_response(self):
@@ -84,8 +84,10 @@ def test_poll_complete(self):
 class _Connection(object):
     def __init__(self, response):
         self.response = response
+        self._requested = []
 
     def api_request(self, method, path):
+        self._requested.append({'method': method, 'path': path})
         return self.response
 
 

From ce01e9a38305029e239ab4c216d0257dd3ecf987 Mon Sep 17 00:00:00 2001
From: Thomas Schultz <daspecster@gmail.com>
Date: Tue, 27 Sep 2016 16:14:37 -0400
Subject: [PATCH 3/4] Add Transcript and Metadata classes.

---
 docs/index.rst                                |  2 +
 docs/speech-metadata.rst                      |  7 ++
 docs/speech-transcript.rst                    |  7 ++
 .../google}/cloud/speech/encoding.py          |  0
 speech/google/cloud/speech/metadata.py        | 78 +++++++++++++++++
 .../google}/cloud/speech/operation.py         | 83 +++----------------
 speech/google/cloud/speech/transcript.py      | 44 ++++++++++
 speech/unit_tests/test_client.py              | 15 +---
 speech/unit_tests/test_metadata.py            | 50 +++++++++++
 .../unit_tests}/test_operation.py             | 34 +++++---
 speech/unit_tests/test_transcript.py          | 32 +++++++
 11 files changed, 260 insertions(+), 92 deletions(-)
 create mode 100644 docs/speech-metadata.rst
 create mode 100644 docs/speech-transcript.rst
 rename {google => speech/google}/cloud/speech/encoding.py (100%)
 create mode 100644 speech/google/cloud/speech/metadata.py
 rename {google => speech/google}/cloud/speech/operation.py (63%)
 create mode 100644 speech/google/cloud/speech/transcript.py
 create mode 100644 speech/unit_tests/test_metadata.py
 rename {unit_tests/speech => speech/unit_tests}/test_operation.py (70%)
 create mode 100644 speech/unit_tests/test_transcript.py

diff --git a/docs/index.rst b/docs/index.rst
index fee7e851ff21..dc5a47e7fac4 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -174,7 +174,9 @@
   speech-usage
   Client <speech-client>
   speech-encoding
+  speech-metadata
   speech-operation
+  speech-transcript
 
 .. toctree::
   :maxdepth: 0
diff --git a/docs/speech-metadata.rst b/docs/speech-metadata.rst
new file mode 100644
index 000000000000..575094a2d0f2
--- /dev/null
+++ b/docs/speech-metadata.rst
@@ -0,0 +1,7 @@
+Speech Metadata
+===============
+
+.. automodule:: google.cloud.speech.metadata
+  :members:
+  :undoc-members:
+  :show-inheritance:
diff --git a/docs/speech-transcript.rst b/docs/speech-transcript.rst
new file mode 100644
index 000000000000..f71f72bd2645
--- /dev/null
+++ b/docs/speech-transcript.rst
@@ -0,0 +1,7 @@
+Speech Transcript
+=================
+
+.. automodule:: google.cloud.speech.transcript
+  :members:
+  :undoc-members:
+  :show-inheritance:
diff --git a/google/cloud/speech/encoding.py b/speech/google/cloud/speech/encoding.py
similarity index 100%
rename from google/cloud/speech/encoding.py
rename to speech/google/cloud/speech/encoding.py
diff --git a/speech/google/cloud/speech/metadata.py b/speech/google/cloud/speech/metadata.py
new file mode 100644
index 000000000000..89a8ff3369d9
--- /dev/null
+++ b/speech/google/cloud/speech/metadata.py
@@ -0,0 +1,78 @@
+# Copyright 2016 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Metadata representation from Google Speech API"""
+
+from google.cloud._helpers import _rfc3339_to_datetime
+
+
+class Metadata(object):
+    """Representation of metadata from a Google Speech API Operation.
+
+    :type last_update: datetime
+    :param last_update: When the Speech operation was last updated.
+
+    :type start_time: datetime
+    :param start_time: When the Speech operation was started.
+
+    :type progress_percent: int
+    :param progress_percent: Percentage of operation that has been completed.
+    """
+    def __init__(self, last_update, start_time, progress_percent):
+        self._last_update = last_update
+        self._start_time = start_time
+        self._progress_percent = progress_percent
+
+    @classmethod
+    def from_api_repr(cls, response):
+        """Factory: construct representation of operation metadata.
+
+        :type response: dict
+        :param response: Dictionary containing operation metadata.
+
+        :rtype: :class:`~google.cloud.speech.metadata.Metadata`
+        :returns: Instance of operation Metadata.
+        """
+        last_update = _rfc3339_to_datetime(response['lastUpdateTime'])
+        start_time = _rfc3339_to_datetime(response['startTime'])
+        progress_percent = response['progressPercent']
+
+        return cls(last_update, start_time, progress_percent)
+
+    @property
+    def last_update(self):
+        """Last time operation was updated.
+
+        :rtype: datetime
+        :returns: Datetime when operation was last updated.
+        """
+        return self._last_update
+
+    @property
+    def start_time(self):
+        """Start time of operation.
+
+        :rtype: datetime
+        :returns: Datetime when operation was started.
+        """
+        return self._start_time
+
+    @property
+    def progress_percent(self):
+        """Progress percentage completed of operation.
+
+        :rtype: int
+        :returns: Percentage of operation completed.
+        """
+        return self._progress_percent
diff --git a/google/cloud/speech/operation.py b/speech/google/cloud/speech/operation.py
similarity index 63%
rename from google/cloud/speech/operation.py
rename to speech/google/cloud/speech/operation.py
index 56515d0102e0..69614b16cb7f 100644
--- a/google/cloud/speech/operation.py
+++ b/speech/google/cloud/speech/operation.py
@@ -14,7 +14,8 @@
 
 """Long running operation representation for Google Speech API"""
 
-from google.cloud._helpers import _rfc3339_to_datetime
+from google.cloud.speech.metadata import Metadata
+from google.cloud.speech.transcript import Transcript
 from google.cloud import operation
 
 
@@ -30,27 +31,19 @@ class Operation(operation.Operation):
     :type complete: bool
     :param complete: True if operation is complete, else False.
 
-    :type last_updated: datetime
-    :param last_updated: The last time the operation was updated.
-
-    :type progress_percent: int
-    :param progress_percent: Percentage of operation that has been completed.
+    :type metadata: :class:`~google.cloud.speech.metadata.Metadata`
+    :param metadata: Instance of ``Metadata`` with operation information.
 
     :type results: dict
     :param results: Dictionary with transcript and score of operation.
-
-    :type start_time: datetime
-    :param start_time: Datetime when operation was started.
     """
-    def __init__(self, client, name, complete=False, last_updated=None,
-                 progress_percent=0, results=None, start_time=None):
+    def __init__(self, client, name, complete=False, metadata=None,
+                 results=None):
         self.client = client
         self.name = name
         self._complete = complete
-        self._last_updated = last_updated
-        self._progress_percent = progress_percent
+        self._metadata = metadata
         self._results = results
-        self._start_time = start_time
 
     @classmethod
     def from_api_repr(cls, client, response):
@@ -82,22 +75,13 @@ def complete(self):
         return self._complete
 
     @property
-    def last_updated(self):
-        """Operation last updated time.
-
-        :rtype: datetime
-        :returns: RFC3339 last updated time of the operation.
-        """
-        return self._last_updated
-
-    @property
-    def progress_percent(self):
-        """Progress percentage of operation.
+    def metadata(self):
+        """Metadata of operation.
 
-        :rtype: int
-        :returns: Percentage of operation completed. [0-100]
+        :rtype: :class:`~google.cloud.speech.metadata.Metadata`
+        :returns: Instance of ``Metadata``.
         """
-        return self._progress_percent
+        return self._metadata
 
     @property
     def results(self):
@@ -108,15 +92,6 @@ def results(self):
         """
         return self._results
 
-    @property
-    def start_time(self):
-        """Operation start time.
-
-        :rtype: datetime
-        :returns: RFC3339 start time of the operation.
-        """
-        return self._start_time
-
     def poll(self):
         """Check if the operation has finished.
 
@@ -151,39 +126,7 @@ def _update(self, response):
             for result in raw_results[0]['alternatives']:
                 results.append(Transcript(result))
         if metadata:
-            self._last_updated = _rfc3339_to_datetime(
-                metadata['lastUpdateTime'])
-            self._start_time = _rfc3339_to_datetime(metadata['startTime'])
-            self._progress_percent = metadata.get('progressPercent', 0)
+            self._metadata = Metadata.from_api_repr(metadata)
 
         self._results = results
         self._complete = response.get('done', False)
-
-
-class Transcript(object):
-    """Representation of Speech Transcripts
-
-    :type result: dict
-    :param result: Dictionary of transcript and confidence of recognition.
-    """
-    def __init__(self, result):
-        self._transcript = result.get('transcript')
-        self._confidence = result.get('confidence')
-
-    @property
-    def transcript(self):
-        """Transcript text from audio.
-
-        :rtype: str
-        :returns: Text detected in audio.
-        """
-        return self._transcript
-
-    @property
-    def confidence(self):
-        """Confidence score for recognized speech.
-
-        :rtype: float
-        :returns: Confidence score of recognized speech [0-1].
-        """
-        return self._confidence
diff --git a/speech/google/cloud/speech/transcript.py b/speech/google/cloud/speech/transcript.py
new file mode 100644
index 000000000000..bbe915396c5c
--- /dev/null
+++ b/speech/google/cloud/speech/transcript.py
@@ -0,0 +1,44 @@
+# Copyright 2016 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Transcript representation for Google Speech API"""
+
+
+class Transcript(object):
+    """Representation of Speech Transcripts
+
+    :type result: dict
+    :param result: Dictionary of transcript and confidence of recognition.
+    """
+    def __init__(self, result):
+        self._transcript = result.get('transcript')
+        self._confidence = result.get('confidence')
+
+    @property
+    def transcript(self):
+        """Transcript text from audio.
+
+        :rtype: str
+        :returns: Text detected in audio.
+        """
+        return self._transcript
+
+    @property
+    def confidence(self):
+        """Confidence score for recognized speech.
+
+        :rtype: float
+        :returns: Confidence score of recognized speech [0-1].
+        """
+        return self._confidence
diff --git a/speech/unit_tests/test_client.py b/speech/unit_tests/test_client.py
index b73ffece41da..200562ea2661 100644
--- a/speech/unit_tests/test_client.py
+++ b/speech/unit_tests/test_client.py
@@ -41,7 +41,7 @@ def test_sync_recognize_content_with_optional_parameters(self):
         import base64
         from google.cloud._helpers import _to_bytes
         from google.cloud.speech.encoding import Encoding
-        from unit_tests.speech._fixtures import SYNC_RECOGNIZE_RESPONSE
+        from unit_tests._fixtures import SYNC_RECOGNIZE_RESPONSE
 
         _AUDIO_CONTENT = _to_bytes('/9j/4QNURXhpZgAASUkq')
         _B64_AUDIO_CONTENT = base64.b64encode(_AUDIO_CONTENT)
@@ -88,13 +88,8 @@ def test_sync_recognize_content_with_optional_parameters(self):
         self.assertEqual(response, expected)
 
     def test_sync_recognize_source_uri_without_optional_parameters(self):
-<<<<<<< b7f004e00f1ee021b0cb7ac9261fcc6c021dfacb:speech/unit_tests/test_client.py
         from google.cloud.speech.client import Encoding
         from unit_tests._fixtures import SYNC_RECOGNIZE_RESPONSE
-=======
-        from google.cloud.speech.encoding import Encoding
-        from unit_tests.speech._fixtures import SYNC_RECOGNIZE_RESPONSE
->>>>>>> Add speech asynchronous recognize support.:unit_tests/speech/test_client.py
 
         RETURNED = SYNC_RECOGNIZE_RESPONSE
         REQUEST = {
@@ -166,13 +161,8 @@ def test_sync_recognize_without_samplerate(self):
                                   None)
 
     def test_sync_recognize_with_empty_results(self):
-<<<<<<< b7f004e00f1ee021b0cb7ac9261fcc6c021dfacb:speech/unit_tests/test_client.py
         from google.cloud.speech.client import Encoding
         from unit_tests._fixtures import SYNC_RECOGNIZE_EMPTY_RESPONSE
-=======
-        from google.cloud.speech.encoding import Encoding
-        from unit_tests.speech._fixtures import SYNC_RECOGNIZE_EMPTY_RESPONSE
->>>>>>> Add speech asynchronous recognize support.:unit_tests/speech/test_client.py
 
         credentials = _Credentials()
         client = self._makeOne(credentials=credentials)
@@ -183,7 +173,7 @@ def test_sync_recognize_with_empty_results(self):
                                   self.SAMPLE_RATE)
 
     def test_async_recognize(self):
-        from unit_tests.speech._fixtures import ASYNC_RECOGNIZE_RESPONSE
+        from unit_tests._fixtures import ASYNC_RECOGNIZE_RESPONSE
         from google.cloud.speech.encoding import Encoding
         from google.cloud.speech.operation import Operation
         RETURNED = ASYNC_RECOGNIZE_RESPONSE
@@ -199,6 +189,7 @@ def test_async_recognize(self):
                                            self.SAMPLE_RATE)
         self.assertIsInstance(operation, Operation)
         self.assertFalse(operation.complete)
+        self.assertIsNone(operation.metadata)
 
 
 class _Credentials(object):
diff --git a/speech/unit_tests/test_metadata.py b/speech/unit_tests/test_metadata.py
new file mode 100644
index 000000000000..8e1dcd03e733
--- /dev/null
+++ b/speech/unit_tests/test_metadata.py
@@ -0,0 +1,50 @@
+# Copyright 2016 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import unittest
+
+
+class TestMetadata(unittest.TestCase):
+    OPERATION_ID = 123456789
+
+    def _getTargetClass(self):
+        from google.cloud.speech.metadata import Metadata
+        return Metadata
+
+    def _makeOne(self, *args, **kwargs):
+        return self._getTargetClass()(*args, **kwargs)
+
+    def test_ctor(self):
+        last_update = 'last_update'
+        start_time = 'start_time'
+        progress_percent = 23
+        metadata = self._makeOne(last_update, start_time, progress_percent)
+        self.assertEqual('last_update', metadata.last_update)
+        self.assertEqual('start_time', metadata.start_time)
+        self.assertEqual(23, metadata.progress_percent)
+
+    def test_from_api_repr(self):
+        import datetime
+        from google.cloud._helpers import _rfc3339_to_datetime
+        from unit_tests._fixtures import OPERATION_INCOMPLETE_RESPONSE as DATA
+        METADATA = DATA['metadata']
+
+        start_time = _rfc3339_to_datetime(METADATA['startTime'])
+        last_update = _rfc3339_to_datetime(METADATA['lastUpdateTime'])
+        metadata = self._getTargetClass().from_api_repr(METADATA)
+        self.assertIsInstance(metadata.last_update, datetime.datetime)
+        self.assertEqual(last_update, metadata.last_update)
+        self.assertIsInstance(metadata.start_time, datetime.datetime)
+        self.assertEqual(start_time, metadata.start_time)
+        self.assertEqual(27, metadata.progress_percent)
diff --git a/unit_tests/speech/test_operation.py b/speech/unit_tests/test_operation.py
similarity index 70%
rename from unit_tests/speech/test_operation.py
rename to speech/unit_tests/test_operation.py
index e44a29084aab..a1e063ae1432 100644
--- a/unit_tests/speech/test_operation.py
+++ b/speech/unit_tests/test_operation.py
@@ -1,3 +1,17 @@
+# Copyright 2016 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
 import unittest
 
 
@@ -17,13 +31,11 @@ def test_ctor_defaults(self):
         operation = self._makeOne(client, self.OPERATION_NAME)
         self.assertEqual('123456789', operation.name)
         self.assertFalse(operation.complete)
-        self.assertIsNone(operation.last_updated)
-        self.assertEqual(0, operation.progress_percent)
+        self.assertIsNone(operation.metadata)
         self.assertIsNone(operation.results)
-        self.assertIsNone(operation.start_time)
 
     def test_from_api_repr(self):
-        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        from unit_tests._fixtures import OPERATION_COMPLETE_RESPONSE
         from google.cloud.speech.operation import Transcript
         RESPONSE = OPERATION_COMPLETE_RESPONSE
 
@@ -42,8 +54,8 @@ def test_from_api_repr(self):
         self.assertTrue(operation.complete)
 
     def test_update_response(self):
-        from unit_tests.speech._fixtures import ASYNC_RECOGNIZE_RESPONSE
-        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        from unit_tests._fixtures import ASYNC_RECOGNIZE_RESPONSE
+        from unit_tests._fixtures import OPERATION_COMPLETE_RESPONSE
         RESPONSE = ASYNC_RECOGNIZE_RESPONSE
 
         client = _Client()
@@ -51,13 +63,13 @@ def test_update_response(self):
         client.connection = connection
         operation = self._getTargetClass().from_api_repr(client, RESPONSE)
         self.assertEqual('123456789', operation.name)
-
         operation._update(OPERATION_COMPLETE_RESPONSE)
         self.assertTrue(operation.complete)
 
     def test_poll(self):
-        from unit_tests.speech._fixtures import ASYNC_RECOGNIZE_RESPONSE
-        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        from google.cloud.speech.operation import Metadata
+        from unit_tests._fixtures import ASYNC_RECOGNIZE_RESPONSE
+        from unit_tests._fixtures import OPERATION_COMPLETE_RESPONSE
         RESPONSE = ASYNC_RECOGNIZE_RESPONSE
         client = _Client()
         connection = _Connection(OPERATION_COMPLETE_RESPONSE)
@@ -67,9 +79,11 @@ def test_poll(self):
         self.assertFalse(operation.complete)
         operation.poll()
         self.assertTrue(operation.complete)
+        self.assertIsInstance(operation.metadata, Metadata)
+        self.assertEqual(100, operation.metadata.progress_percent)
 
     def test_poll_complete(self):
-        from unit_tests.speech._fixtures import OPERATION_COMPLETE_RESPONSE
+        from unit_tests._fixtures import OPERATION_COMPLETE_RESPONSE
         RESPONSE = OPERATION_COMPLETE_RESPONSE
         client = _Client()
         connection = _Connection(OPERATION_COMPLETE_RESPONSE)
diff --git a/speech/unit_tests/test_transcript.py b/speech/unit_tests/test_transcript.py
new file mode 100644
index 000000000000..b585d6e7429c
--- /dev/null
+++ b/speech/unit_tests/test_transcript.py
@@ -0,0 +1,32 @@
+# Copyright 2016 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import unittest
+
+
+class TestTranscript(unittest.TestCase):
+    def _getTargetClass(self):
+        from google.cloud.speech.transcript import Transcript
+        return Transcript
+
+    def _makeOne(self, *args, **kwargs):
+        return self._getTargetClass()(*args, **kwargs)
+
+    def test_ctor(self):
+        from unit_tests._fixtures import OPERATION_COMPLETE_RESPONSE as DATA
+        TRANSCRIPT_DATA = DATA['response']['results'][0]['alternatives'][0]
+        transcript = self._makeOne(TRANSCRIPT_DATA)
+        self.assertEqual('how old is the Brooklyn Bridge',
+                         transcript.transcript)
+        self.assertEqual(0.98267895, transcript.confidence)

From 08e9e03d10518d7e78d04294790738dbb9d4890e Mon Sep 17 00:00:00 2001
From: Thomas Schultz <daspecster@gmail.com>
Date: Wed, 28 Sep 2016 05:56:14 -0400
Subject: [PATCH 4/4] Add missing request assertions for operation.poll.

---
 speech/unit_tests/test_operation.py | 39 ++++++++++++++++++-----------
 1 file changed, 25 insertions(+), 14 deletions(-)

diff --git a/speech/unit_tests/test_operation.py b/speech/unit_tests/test_operation.py
index a1e063ae1432..2ebce2c75ce1 100644
--- a/speech/unit_tests/test_operation.py
+++ b/speech/unit_tests/test_operation.py
@@ -29,7 +29,7 @@ def _makeOne(self, *args, **kwargs):
     def test_ctor_defaults(self):
         client = _Client()
         operation = self._makeOne(client, self.OPERATION_NAME)
-        self.assertEqual('123456789', operation.name)
+        self.assertEqual(operation.name, '123456789')
         self.assertFalse(operation.complete)
         self.assertIsNone(operation.metadata)
         self.assertIsNone(operation.results)
@@ -37,21 +37,22 @@ def test_ctor_defaults(self):
     def test_from_api_repr(self):
         from unit_tests._fixtures import OPERATION_COMPLETE_RESPONSE
         from google.cloud.speech.operation import Transcript
+        from google.cloud.speech.metadata import Metadata
         RESPONSE = OPERATION_COMPLETE_RESPONSE
 
         client = _Client()
-        connection = _Connection(OPERATION_COMPLETE_RESPONSE)
-        client.connection = connection
         operation = self._getTargetClass().from_api_repr(client, RESPONSE)
 
         self.assertEqual('123456789', operation.name)
         self.assertTrue(operation.complete)
 
         self.assertIsInstance(operation.results[0], Transcript)
-        self.assertEqual('how old is the Brooklyn Bridge',
-                         operation.results[0].transcript)
-        self.assertEqual(0.98267895, operation.results[0].confidence)
+        self.assertEqual(operation.results[0].transcript,
+                         'how old is the Brooklyn Bridge')
+        self.assertEqual(operation.results[0].confidence, 0.98267895)
         self.assertTrue(operation.complete)
+        self.assertIsInstance(operation.metadata, Metadata)
+        self.assertEqual(operation.metadata.progress_percent, 100)
 
     def test_update_response(self):
         from unit_tests._fixtures import ASYNC_RECOGNIZE_RESPONSE
@@ -59,10 +60,8 @@ def test_update_response(self):
         RESPONSE = ASYNC_RECOGNIZE_RESPONSE
 
         client = _Client()
-        connection = _Connection(OPERATION_COMPLETE_RESPONSE)
-        client.connection = connection
         operation = self._getTargetClass().from_api_repr(client, RESPONSE)
-        self.assertEqual('123456789', operation.name)
+        self.assertEqual(operation.name, '123456789')
         operation._update(OPERATION_COMPLETE_RESPONSE)
         self.assertTrue(operation.complete)
 
@@ -80,23 +79,35 @@ def test_poll(self):
         operation.poll()
         self.assertTrue(operation.complete)
         self.assertIsInstance(operation.metadata, Metadata)
-        self.assertEqual(100, operation.metadata.progress_percent)
+        self.assertEqual(operation.metadata.progress_percent, 100)
+        requested = client.connection._requested
+        self.assertEqual(requested[0]['method'], 'GET')
+        self.assertEqual(requested[0]['path'],
+                         'operations/%s' % (operation.name,))
 
     def test_poll_complete(self):
         from unit_tests._fixtures import OPERATION_COMPLETE_RESPONSE
-        RESPONSE = OPERATION_COMPLETE_RESPONSE
+        from unit_tests._fixtures import OPERATION_INCOMPLETE_RESPONSE
+        RESPONSE = OPERATION_INCOMPLETE_RESPONSE
+
         client = _Client()
         connection = _Connection(OPERATION_COMPLETE_RESPONSE)
         client.connection = connection
-
         operation = self._getTargetClass().from_api_repr(client, RESPONSE)
-        self.assertTrue(operation.complete)
+
+        self.assertFalse(operation.complete)
+        operation.poll()  # Update the operation with complete data.
+
         with self.assertRaises(ValueError):
             operation.poll()
+        requested = client.connection._requested
+        self.assertEqual(requested[0]['method'], 'GET')
+        self.assertEqual(requested[0]['path'],
+                         'operations/%s' % (operation.name,))
 
 
 class _Connection(object):
-    def __init__(self, response):
+    def __init__(self, response=None):
         self.response = response
         self._requested = []