You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
329 lines
15 KiB
329 lines
15 KiB
# |
|
# Licensed to the Apache Software Foundation (ASF) under one |
|
# or more contributor license agreements. See the NOTICE file |
|
# distributed with this work for additional information |
|
# regarding copyright ownership. The ASF licenses this file |
|
# to you under the Apache License, Version 2.0 (the |
|
# "License"); you may not use this file except in compliance |
|
# with the License. You may obtain a copy of the License at |
|
# |
|
# http://www.apache.org/licenses/LICENSE-2.0 |
|
# |
|
# Unless required by applicable law or agreed to in writing, |
|
# software distributed under the License is distributed on an |
|
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
|
# KIND, either express or implied. See the License for the |
|
# specific language governing permissions and limitations |
|
# under the License. |
|
"""This module contains Google Cloud Vision operators.""" |
|
from typing import Dict, Optional, Sequence, Union |
|
|
|
from airflow.models import BaseOperator |
|
from airflow.providers.google.cloud.hooks.video_intelligence import ( |
|
CloudVideoIntelligenceHook, |
|
) |
|
from airflow.utils.decorators import apply_defaults |
|
from google.api_core.retry import Retry |
|
from google.cloud.videointelligence_v1 import enums |
|
from google.cloud.videointelligence_v1.types import VideoContext |
|
from google.protobuf.json_format import MessageToDict |
|
|
|
|
|
class CloudVideoIntelligenceDetectVideoLabelsOperator(BaseOperator): |
|
""" |
|
Performs video annotation, annotating video labels. |
|
|
|
.. seealso:: |
|
For more information on how to use this operator, take a look at the guide: |
|
:ref:`howto/operator:CloudVideoIntelligenceDetectVideoLabelsOperator`. |
|
|
|
:param input_uri: Input video location. Currently, only Google Cloud Storage URIs are supported, |
|
which must be specified in the following format: ``gs://bucket-id/object-id``. |
|
:type input_uri: str |
|
:param input_content: The video data bytes. |
|
If unset, the input video(s) should be specified via ``input_uri``. |
|
If set, ``input_uri`` should be unset. |
|
:type input_content: bytes |
|
:param output_uri: Optional, location where the output (in JSON format) should be stored. Currently, only |
|
Google Cloud Storage URIs are supported, which must be specified in the following format: |
|
``gs://bucket-id/object-id``. |
|
:type output_uri: str |
|
:param video_context: Optional, Additional video context and/or feature-specific parameters. |
|
:type video_context: dict or google.cloud.videointelligence_v1.types.VideoContext |
|
:param location: Optional, cloud region where annotation should take place. Supported cloud regions: |
|
us-east1, us-west1, europe-west1, asia-east1. If no region is specified, a region will be determined |
|
based on video file location. |
|
:type location: str |
|
:param retry: Retry object used to determine when/if to retry requests. |
|
If None is specified, requests will not be retried. |
|
:type retry: google.api_core.retry.Retry |
|
:param timeout: Optional, The amount of time, in seconds, to wait for the request to complete. |
|
Note that if retry is specified, the timeout applies to each individual attempt. |
|
:type timeout: float |
|
:param gcp_conn_id: Optional, The connection ID used to connect to Google Cloud. |
|
Defaults to ``google_cloud_default``. |
|
:type gcp_conn_id: str |
|
:param impersonation_chain: Optional service account to impersonate using short-term |
|
credentials, or chained list of accounts required to get the access_token |
|
of the last account in the list, which will be impersonated in the request. |
|
If set as a string, the account must grant the originating account |
|
the Service Account Token Creator IAM role. |
|
If set as a sequence, the identities from the list must grant |
|
Service Account Token Creator IAM role to the directly preceding identity, with first |
|
account from the list granting this role to the originating account (templated). |
|
:type impersonation_chain: Union[str, Sequence[str]] |
|
""" |
|
|
|
# [START gcp_video_intelligence_detect_labels_template_fields] |
|
template_fields = ( |
|
"input_uri", |
|
"output_uri", |
|
"gcp_conn_id", |
|
"impersonation_chain", |
|
) |
|
# [END gcp_video_intelligence_detect_labels_template_fields] |
|
|
|
@apply_defaults |
|
def __init__( |
|
self, |
|
*, |
|
input_uri: str, |
|
input_content: Optional[bytes] = None, |
|
output_uri: Optional[str] = None, |
|
video_context: Union[Dict, VideoContext] = None, |
|
location: Optional[str] = None, |
|
retry: Optional[Retry] = None, |
|
timeout: Optional[float] = None, |
|
gcp_conn_id: str = "google_cloud_default", |
|
impersonation_chain: Optional[Union[str, Sequence[str]]] = None, |
|
**kwargs, |
|
) -> None: |
|
super().__init__(**kwargs) |
|
self.input_uri = input_uri |
|
self.input_content = input_content |
|
self.output_uri = output_uri |
|
self.video_context = video_context |
|
self.location = location |
|
self.retry = retry |
|
self.gcp_conn_id = gcp_conn_id |
|
self.timeout = timeout |
|
self.impersonation_chain = impersonation_chain |
|
|
|
def execute(self, context): |
|
hook = CloudVideoIntelligenceHook( |
|
gcp_conn_id=self.gcp_conn_id, |
|
impersonation_chain=self.impersonation_chain, |
|
) |
|
operation = hook.annotate_video( |
|
input_uri=self.input_uri, |
|
input_content=self.input_content, |
|
video_context=self.video_context, |
|
location=self.location, |
|
retry=self.retry, |
|
features=[enums.Feature.LABEL_DETECTION], |
|
timeout=self.timeout, |
|
) |
|
self.log.info("Processing video for label annotations") |
|
result = MessageToDict(operation.result()) |
|
self.log.info("Finished processing.") |
|
return result |
|
|
|
|
|
class CloudVideoIntelligenceDetectVideoExplicitContentOperator(BaseOperator): |
|
""" |
|
Performs video annotation, annotating explicit content. |
|
|
|
.. seealso:: |
|
For more information on how to use this operator, take a look at the guide: |
|
:ref:`howto/operator:CloudVideoIntelligenceDetectVideoExplicitContentOperator` |
|
|
|
:param input_uri: Input video location. Currently, only Google Cloud Storage URIs are supported, |
|
which must be specified in the following format: ``gs://bucket-id/object-id``. |
|
:type input_uri: str |
|
:param input_content: The video data bytes. |
|
If unset, the input video(s) should be specified via ``input_uri``. |
|
If set, ``input_uri`` should be unset. |
|
:type input_content: bytes |
|
:param output_uri: Optional, location where the output (in JSON format) should be stored. Currently, only |
|
Google Cloud Storage URIs are supported, which must be specified in the following format: |
|
``gs://bucket-id/object-id``. |
|
:type output_uri: str |
|
:param video_context: Optional, Additional video context and/or feature-specific parameters. |
|
:type video_context: dict or google.cloud.videointelligence_v1.types.VideoContext |
|
:param location: Optional, cloud region where annotation should take place. Supported cloud regions: |
|
us-east1, us-west1, europe-west1, asia-east1. If no region is specified, a region will be determined |
|
based on video file location. |
|
:type location: str |
|
:param retry: Retry object used to determine when/if to retry requests. |
|
If None is specified, requests will not be retried. |
|
:type retry: google.api_core.retry.Retry |
|
:param timeout: Optional, The amount of time, in seconds, to wait for the request to complete. |
|
Note that if retry is specified, the timeout applies to each individual attempt. |
|
:type timeout: float |
|
:param gcp_conn_id: Optional, The connection ID used to connect to Google Cloud |
|
Defaults to ``google_cloud_default``. |
|
:type gcp_conn_id: str |
|
:param impersonation_chain: Optional service account to impersonate using short-term |
|
credentials, or chained list of accounts required to get the access_token |
|
of the last account in the list, which will be impersonated in the request. |
|
If set as a string, the account must grant the originating account |
|
the Service Account Token Creator IAM role. |
|
If set as a sequence, the identities from the list must grant |
|
Service Account Token Creator IAM role to the directly preceding identity, with first |
|
account from the list granting this role to the originating account (templated). |
|
:type impersonation_chain: Union[str, Sequence[str]] |
|
""" |
|
|
|
# [START gcp_video_intelligence_detect_explicit_content_template_fields] |
|
template_fields = ( |
|
"input_uri", |
|
"output_uri", |
|
"gcp_conn_id", |
|
"impersonation_chain", |
|
) |
|
# [END gcp_video_intelligence_detect_explicit_content_template_fields] |
|
|
|
@apply_defaults |
|
def __init__( |
|
self, |
|
*, |
|
input_uri: str, |
|
output_uri: Optional[str] = None, |
|
input_content: Optional[bytes] = None, |
|
video_context: Union[Dict, VideoContext] = None, |
|
location: Optional[str] = None, |
|
retry: Optional[Retry] = None, |
|
timeout: Optional[float] = None, |
|
gcp_conn_id: str = "google_cloud_default", |
|
impersonation_chain: Optional[Union[str, Sequence[str]]] = None, |
|
**kwargs, |
|
) -> None: |
|
super().__init__(**kwargs) |
|
self.input_uri = input_uri |
|
self.output_uri = output_uri |
|
self.input_content = input_content |
|
self.video_context = video_context |
|
self.location = location |
|
self.retry = retry |
|
self.gcp_conn_id = gcp_conn_id |
|
self.timeout = timeout |
|
self.impersonation_chain = impersonation_chain |
|
|
|
def execute(self, context): |
|
hook = CloudVideoIntelligenceHook( |
|
gcp_conn_id=self.gcp_conn_id, |
|
impersonation_chain=self.impersonation_chain, |
|
) |
|
operation = hook.annotate_video( |
|
input_uri=self.input_uri, |
|
input_content=self.input_content, |
|
video_context=self.video_context, |
|
location=self.location, |
|
retry=self.retry, |
|
features=[enums.Feature.EXPLICIT_CONTENT_DETECTION], |
|
timeout=self.timeout, |
|
) |
|
self.log.info("Processing video for explicit content annotations") |
|
result = MessageToDict(operation.result()) |
|
self.log.info("Finished processing.") |
|
return result |
|
|
|
|
|
class CloudVideoIntelligenceDetectVideoShotsOperator(BaseOperator): |
|
""" |
|
Performs video annotation, annotating video shots. |
|
|
|
.. seealso:: |
|
For more information on how to use this operator, take a look at the guide: |
|
:ref:`howto/operator:CloudVideoIntelligenceDetectVideoShotsOperator` |
|
|
|
:param input_uri: Input video location. Currently, only Google Cloud Storage URIs are supported, |
|
which must be specified in the following format: ``gs://bucket-id/object-id``. |
|
:type input_uri: str |
|
:param input_content: The video data bytes. |
|
If unset, the input video(s) should be specified via ``input_uri``. |
|
If set, ``input_uri`` should be unset. |
|
:type input_content: bytes |
|
:param output_uri: Optional, location where the output (in JSON format) should be stored. Currently, only |
|
Google Cloud Storage URIs are supported, which must be specified in the following format: |
|
``gs://bucket-id/object-id``. |
|
:type output_uri: str |
|
:param video_context: Optional, Additional video context and/or feature-specific parameters. |
|
:type video_context: dict or google.cloud.videointelligence_v1.types.VideoContext |
|
:param location: Optional, cloud region where annotation should take place. Supported cloud regions: |
|
us-east1, us-west1, europe-west1, asia-east1. If no region is specified, a region will be determined |
|
based on video file location. |
|
:type location: str |
|
:param retry: Retry object used to determine when/if to retry requests. |
|
If None is specified, requests will not be retried. |
|
:type retry: google.api_core.retry.Retry |
|
:param timeout: Optional, The amount of time, in seconds, to wait for the request to complete. |
|
Note that if retry is specified, the timeout applies to each individual attempt. |
|
:type timeout: float |
|
:param gcp_conn_id: Optional, The connection ID used to connect to Google Cloud. |
|
Defaults to ``google_cloud_default``. |
|
:type gcp_conn_id: str |
|
:param impersonation_chain: Optional service account to impersonate using short-term |
|
credentials, or chained list of accounts required to get the access_token |
|
of the last account in the list, which will be impersonated in the request. |
|
If set as a string, the account must grant the originating account |
|
the Service Account Token Creator IAM role. |
|
If set as a sequence, the identities from the list must grant |
|
Service Account Token Creator IAM role to the directly preceding identity, with first |
|
account from the list granting this role to the originating account (templated). |
|
:type impersonation_chain: Union[str, Sequence[str]] |
|
""" |
|
|
|
# [START gcp_video_intelligence_detect_video_shots_template_fields] |
|
template_fields = ( |
|
"input_uri", |
|
"output_uri", |
|
"gcp_conn_id", |
|
"impersonation_chain", |
|
) |
|
# [END gcp_video_intelligence_detect_video_shots_template_fields] |
|
|
|
@apply_defaults |
|
def __init__( |
|
self, |
|
*, |
|
input_uri: str, |
|
output_uri: Optional[str] = None, |
|
input_content: Optional[bytes] = None, |
|
video_context: Union[Dict, VideoContext] = None, |
|
location: Optional[str] = None, |
|
retry: Optional[Retry] = None, |
|
timeout: Optional[float] = None, |
|
gcp_conn_id: str = "google_cloud_default", |
|
impersonation_chain: Optional[Union[str, Sequence[str]]] = None, |
|
**kwargs, |
|
) -> None: |
|
super().__init__(**kwargs) |
|
self.input_uri = input_uri |
|
self.output_uri = output_uri |
|
self.input_content = input_content |
|
self.video_context = video_context |
|
self.location = location |
|
self.retry = retry |
|
self.gcp_conn_id = gcp_conn_id |
|
self.timeout = timeout |
|
self.impersonation_chain = impersonation_chain |
|
|
|
def execute(self, context): |
|
hook = CloudVideoIntelligenceHook( |
|
gcp_conn_id=self.gcp_conn_id, |
|
impersonation_chain=self.impersonation_chain, |
|
) |
|
operation = hook.annotate_video( |
|
input_uri=self.input_uri, |
|
input_content=self.input_content, |
|
video_context=self.video_context, |
|
location=self.location, |
|
retry=self.retry, |
|
features=[enums.Feature.SHOT_CHANGE_DETECTION], |
|
timeout=self.timeout, |
|
) |
|
self.log.info("Processing video for video shots annotations") |
|
result = MessageToDict(operation.result()) |
|
self.log.info("Finished processing.") |
|
return result
|
|
|