You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
103 lines
4.5 KiB
103 lines
4.5 KiB
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
|
"""This module contains a Google Cloud Speech Hook.""" |
|
from typing import Dict, Optional, Sequence, Union |
|
|
|
from airflow.providers.google.common.hooks.base_google import GoogleBaseHook |
|
from google.api_core.retry import Retry |
|
from google.cloud.speech_v1 import SpeechClient |
|
from google.cloud.speech_v1.types import RecognitionAudio, RecognitionConfig |
|
|
|
|
|
class CloudSpeechToTextHook(GoogleBaseHook):
    """
    Hook giving access to the Google Cloud Speech-to-Text API.

    The underlying ``SpeechClient`` is built on the first call to
    :meth:`get_conn` and reused for every later call on the same hook.

    :param gcp_conn_id: ID of the connection used to fetch connection info.
    :type gcp_conn_id: str
    :param delegate_to: Account to impersonate through domain-wide delegation
        of authority, if any. The service account making the request must have
        domain-wide delegation enabled for this to work.
    :type delegate_to: str
    :param impersonation_chain: Optional service account to impersonate using
        short-term credentials, or a chained list of accounts required to obtain
        the access_token of the last account in the list, which is the one
        impersonated in the request.
        When given as a string, that account must grant the originating account
        the Service Account Token Creator IAM role.
        When given as a sequence, each identity must grant the Service Account
        Token Creator IAM role to the identity directly preceding it, and the
        first account in the list must grant it to the originating account.
    :type impersonation_chain: Union[str, Sequence[str]]
    """

    def __init__(
        self,
        gcp_conn_id: str = "google_cloud_default",
        delegate_to: Optional[str] = None,
        impersonation_chain: Optional[Union[str, Sequence[str]]] = None,
    ) -> None:
        super().__init__(
            gcp_conn_id=gcp_conn_id,
            delegate_to=delegate_to,
            impersonation_chain=impersonation_chain,
        )
        # No client yet; get_conn() creates it on demand and stores it here.
        self._client = None

    def get_conn(self) -> SpeechClient:
        """
        Return the Cloud Speech client, creating it on first use.

        :return: Google Cloud Speech client object.
        :rtype: google.cloud.speech_v1.SpeechClient
        """
        # Reuse the client from an earlier call when one is already stored.
        if self._client:
            return self._client

        credentials = self._get_credentials()
        self._client = SpeechClient(credentials=credentials, client_info=self.client_info)
        return self._client

    @GoogleBaseHook.quota_retry()
    def recognize_speech(
        self,
        config: Union[Dict, RecognitionConfig],
        audio: Union[Dict, RecognitionAudio],
        retry: Optional[Retry] = None,
        timeout: Optional[float] = None,
    ):
        """
        Send audio to the Speech API for recognition and return the response.

        The response is also written to the hook's log at INFO level.

        :param config: Tells the recognizer how the request should be processed.
            https://googleapis.github.io/google-cloud-python/latest/speech/gapic/v1/types.html#google.cloud.speech_v1.types.RecognitionConfig
        :type config: dict or google.cloud.speech_v1.types.RecognitionConfig
        :param audio: The audio data to recognize.
            https://googleapis.github.io/google-cloud-python/latest/speech/gapic/v1/types.html#google.cloud.speech_v1.types.RecognitionAudio
        :type audio: dict or google.cloud.speech_v1.types.RecognitionAudio
        :param retry: (Optional) Retry object used to retry requests. When None,
            requests are not retried.
        :type retry: google.api_core.retry.Retry
        :param timeout: (Optional) Seconds to wait for the request to complete.
            When ``retry`` is given, the timeout applies to each individual attempt.
        :type timeout: float
        :return: The response object returned by ``SpeechClient.recognize``.
        """
        speech_client = self.get_conn()
        result = speech_client.recognize(
            config=config,
            audio=audio,
            retry=retry,
            timeout=timeout,
        )
        self.log.info("Recognised speech: %s", result)
        return result
|
|
|