openapi-directory

Version:

Building & bundling https://github.com/APIs-guru/openapi-directory for easy use from JS

github.com/httptoolkit/openapi-directory-js

1 lines • 72 kB

JSON

{"openapi":"3.0.0","info":{"contact":{"name":"Google","url":"https://google.com"},"description":"Detects objects, explicit content, and scene changes in videos. It also specifies the region for annotation and transcribes speech to text.","title":"Cloud Video Intelligence","version":"v1","x-apiClientRegistration":{"url":"https://console.developers.google.com"},"x-apisguru-categories":["media"],"x-logo":{"url":"https://www.google.com/images/branding/googlelogo/2x/googlelogo_color_272x92dp.png"},"x-origin":[{"converter":{"url":"https://github.com/lucybot/api-spec-converter","version":"2.7.18"},"format":"google","url":"https://videointelligence.googleapis.com/$discovery/rest?version=v1","version":"v1"}],"x-preferred":true,"x-providerName":"googleapis.com","x-serviceName":"videointelligence"},"externalDocs":{"url":"https://cloud.google.com/video-intelligence/docs/"},"tags":[{"name":"operations"},{"name":"videos"}],"paths":{"/v1/operations":{"get":{"description":"Lists operations that match the specified filter in the request. If the\nserver doesn't support this method, it returns `UNIMPLEMENTED`.\n\nNOTE: the `name` binding allows API services to override the binding\nto use different resource name schemes, such as `users/*/operations`. 
To\noverride the binding, API services can add a binding such as\n`\"/v1/{name=users/*}/operations\"` to their service configuration.\nFor backwards compatibility, the default name includes the operations\ncollection id, however overriding users must ensure the name binding\nis the parent resource, without the operations collection id.","operationId":"videointelligence.operations.list","parameters":[{"description":"The standard list filter.","in":"query","name":"filter","schema":{"type":"string"}},{"description":"The name of the operation's parent resource.","in":"query","name":"name","schema":{"type":"string"}},{"description":"The standard list page size.","in":"query","name":"pageSize","schema":{"type":"integer"}},{"description":"The standard list page token.","in":"query","name":"pageToken","schema":{"type":"string"}}],"responses":{"200":{"description":"Successful response","content":{"*/*":{"schema":{"$ref":"#/components/schemas/GoogleLongrunning_ListOperationsResponse"}}}}},"security":[{"Oauth2":["https://www.googleapis.com/auth/cloud-platform"]}],"tags":["operations"]},"parameters":[{"$ref":"#/components/parameters/_.xgafv"},{"$ref":"#/components/parameters/access_token"},{"$ref":"#/components/parameters/alt"},{"$ref":"#/components/parameters/callback"},{"$ref":"#/components/parameters/fields"},{"$ref":"#/components/parameters/key"},{"$ref":"#/components/parameters/oauth_token"},{"$ref":"#/components/parameters/prettyPrint"},{"$ref":"#/components/parameters/quotaUser"},{"$ref":"#/components/parameters/uploadType"},{"$ref":"#/components/parameters/upload_protocol"}]},"/v1/operations/{name}":{"delete":{"description":"Deletes a long-running operation. This method indicates that the client is\nno longer interested in the operation result. It does not cancel the\noperation. 
If the server doesn't support this method, it returns\n`google.rpc.Code.UNIMPLEMENTED`.","operationId":"videointelligence.operations.delete","parameters":[{"description":"The name of the operation resource to be deleted.","in":"path","name":"name","required":true,"x-reservedExpansion":true,"schema":{"type":"string"}}],"responses":{"200":{"description":"Successful response","content":{"*/*":{"schema":{"$ref":"#/components/schemas/GoogleProtobuf_Empty"}}}}},"security":[{"Oauth2":["https://www.googleapis.com/auth/cloud-platform"]}],"tags":["operations"]},"get":{"description":"Gets the latest state of a long-running operation. Clients can use this\nmethod to poll the operation result at intervals as recommended by the API\nservice.","operationId":"videointelligence.operations.get","parameters":[{"description":"The name of the operation resource.","in":"path","name":"name","required":true,"x-reservedExpansion":true,"schema":{"type":"string"}}],"responses":{"200":{"description":"Successful response","content":{"*/*":{"schema":{"$ref":"#/components/schemas/GoogleLongrunning_Operation"}}}}},"security":[{"Oauth2":["https://www.googleapis.com/auth/cloud-platform"]}],"tags":["operations"]},"parameters":[{"$ref":"#/components/parameters/_.xgafv"},{"$ref":"#/components/parameters/access_token"},{"$ref":"#/components/parameters/alt"},{"$ref":"#/components/parameters/callback"},{"$ref":"#/components/parameters/fields"},{"$ref":"#/components/parameters/key"},{"$ref":"#/components/parameters/oauth_token"},{"$ref":"#/components/parameters/prettyPrint"},{"$ref":"#/components/parameters/quotaUser"},{"$ref":"#/components/parameters/uploadType"},{"$ref":"#/components/parameters/upload_protocol"}]},"/v1/operations/{name}:cancel":{"parameters":[{"$ref":"#/components/parameters/_.xgafv"},{"$ref":"#/components/parameters/access_token"},{"$ref":"#/components/parameters/alt"},{"$ref":"#/components/parameters/callback"},{"$ref":"#/components/parameters/fields"},{"$ref":"#/components/parameters/
key"},{"$ref":"#/components/parameters/oauth_token"},{"$ref":"#/components/parameters/prettyPrint"},{"$ref":"#/components/parameters/quotaUser"},{"$ref":"#/components/parameters/uploadType"},{"$ref":"#/components/parameters/upload_protocol"}],"post":{"description":"Starts asynchronous cancellation on a long-running operation. The server\nmakes a best effort to cancel the operation, but success is not\nguaranteed. If the server doesn't support this method, it returns\n`google.rpc.Code.UNIMPLEMENTED`. Clients can use\nOperations.GetOperation or\nother methods to check whether the cancellation succeeded or whether the\noperation completed despite cancellation. On successful cancellation,\nthe operation is not deleted; instead, it becomes an operation with\nan Operation.error value with a google.rpc.Status.code of 1,\ncorresponding to `Code.CANCELLED`.","operationId":"videointelligence.operations.cancel","parameters":[{"description":"The name of the operation resource to be cancelled.","in":"path","name":"name","required":true,"x-reservedExpansion":true,"schema":{"type":"string"}}],"requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/GoogleLongrunning_CancelOperationRequest"}}}},"responses":{"200":{"description":"Successful 
response","content":{"*/*":{"schema":{"$ref":"#/components/schemas/GoogleProtobuf_Empty"}}}}},"security":[{"Oauth2":["https://www.googleapis.com/auth/cloud-platform"]}],"tags":["operations"]}},"/v1/videos:annotate":{"parameters":[{"$ref":"#/components/parameters/_.xgafv"},{"$ref":"#/components/parameters/access_token"},{"$ref":"#/components/parameters/alt"},{"$ref":"#/components/parameters/callback"},{"$ref":"#/components/parameters/fields"},{"$ref":"#/components/parameters/key"},{"$ref":"#/components/parameters/oauth_token"},{"$ref":"#/components/parameters/prettyPrint"},{"$ref":"#/components/parameters/quotaUser"},{"$ref":"#/components/parameters/uploadType"},{"$ref":"#/components/parameters/upload_protocol"}],"post":{"description":"Performs asynchronous video annotation. Progress and results can be\nretrieved through the `google.longrunning.Operations` interface.\n`Operation.metadata` contains `AnnotateVideoProgress` (progress).\n`Operation.response` contains `AnnotateVideoResponse` (results).","operationId":"videointelligence.videos.annotate","requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_AnnotateVideoRequest"}}}},"responses":{"200":{"description":"Successful response","content":{"*/*":{"schema":{"$ref":"#/components/schemas/GoogleLongrunning_Operation"}}}}},"security":[{"Oauth2":["https://www.googleapis.com/auth/cloud-platform"]}],"tags":["videos"]}}},"servers":[{"url":"https://videointelligence.googleapis.com/"}],"components":{"parameters":{"access_token":{"description":"OAuth access token.","in":"query","name":"access_token","schema":{"type":"string"}},"alt":{"description":"Data format for response.","in":"query","name":"alt","schema":{"type":"string","enum":["json","media","proto"],"default":"json"}},"callback":{"description":"JSONP","in":"query","name":"callback","schema":{"type":"string"}},"fields":{"description":"Selector specifying which fields to include in a partial 
response.","in":"query","name":"fields","schema":{"type":"string"}},"key":{"description":"API key. Your API key identifies your project and provides you with API access, quota, and reports. Required unless you provide an OAuth 2.0 token.","in":"query","name":"key","schema":{"type":"string"}},"oauth_token":{"description":"OAuth 2.0 token for the current user.","in":"query","name":"oauth_token","schema":{"type":"string"}},"prettyPrint":{"description":"Returns response with indentations and line breaks.","in":"query","name":"prettyPrint","schema":{"type":"boolean","default":true}},"quotaUser":{"description":"Available to use for quota purposes for server-side applications. Can be any arbitrary string assigned to a user, but should not exceed 40 characters.","in":"query","name":"quotaUser","schema":{"type":"string"}},"uploadType":{"description":"Legacy upload protocol for media (e.g. \"media\", \"multipart\").","in":"query","name":"uploadType","schema":{"type":"string"}},"upload_protocol":{"description":"Upload protocol for media (e.g. \"raw\", \"multipart\").","in":"query","name":"upload_protocol","schema":{"type":"string"}},"_.xgafv":{"description":"V1 error format.","in":"query","name":"$.xgafv","schema":{"type":"string","enum":["1","2"]}}},"securitySchemes":{"Oauth2":{"description":"Oauth 2.0 authentication","type":"oauth2","flows":{"implicit":{"authorizationUrl":"https://accounts.google.com/o/oauth2/auth","scopes":{"https://www.googleapis.com/auth/cloud-platform":"View and manage your data across Google Cloud Platform services"}}}}},"schemas":{"GoogleCloudVideointelligenceV1_AnnotateVideoProgress":{"description":"Video annotation progress. 
Included in the `metadata`\nfield of the `Operation` returned by the `GetOperation`\ncall of the `google::longrunning::Operations` service.","properties":{"annotationProgress":{"description":"Progress metadata for all videos specified in `AnnotateVideoRequest`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_VideoAnnotationProgress"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_AnnotateVideoRequest":{"description":"Video annotation request.","properties":{"features":{"description":"Requested video annotation features.","items":{"enum":["FEATURE_UNSPECIFIED","LABEL_DETECTION","SHOT_CHANGE_DETECTION","EXPLICIT_CONTENT_DETECTION","SPEECH_TRANSCRIPTION"],"type":"string"},"type":"array"},"inputContent":{"description":"The video data bytes.\nIf unset, the input video(s) should be specified via `input_uri`.\nIf set, `input_uri` should be unset.","format":"byte","type":"string"},"inputUri":{"description":"Input video location. Currently, only\n[Google Cloud Storage](https://cloud.google.com/storage/) URIs are\nsupported, which must be specified in the following format:\n`gs://bucket-id/object-id` (other URI formats return\ngoogle.rpc.Code.INVALID_ARGUMENT). For more information, see\n[Request URIs](/storage/docs/reference-uris).\nA video URI may include wildcards in `object-id`, and thus identify\nmultiple videos. Supported wildcards: '*' to match 0 or more characters;\n'?' to match 1 character. If unset, the input video should be embedded\nin the request as `input_content`. If set, `input_content` should be unset.","type":"string"},"locationId":{"description":"Optional cloud region where annotation should take place. Supported cloud\nregions: `us-east1`, `us-west1`, `europe-west1`, `asia-east1`. 
If no region\nis specified, a region will be determined based on video file location.","type":"string"},"outputUri":{"description":"Optional location where the output (in JSON format) should be stored.\nCurrently, only [Google Cloud Storage](https://cloud.google.com/storage/)\nURIs are supported, which must be specified in the following format:\n`gs://bucket-id/object-id` (other URI formats return\ngoogle.rpc.Code.INVALID_ARGUMENT). For more information, see\n[Request URIs](/storage/docs/reference-uris).","type":"string"},"videoContext":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_VideoContext"}},"type":"object"},"GoogleCloudVideointelligenceV1_AnnotateVideoResponse":{"description":"Video annotation response. Included in the `response`\nfield of the `Operation` returned by the `GetOperation`\ncall of the `google::longrunning::Operations` service.","properties":{"annotationResults":{"description":"Annotation results for all videos specified in `AnnotateVideoRequest`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_VideoAnnotationResults"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_Entity":{"description":"Detected entity from video analysis.","properties":{"description":{"description":"Textual description, e.g. `Fixed-gear bicycle`.","type":"string"},"entityId":{"description":"Opaque entity ID. 
Some IDs may be available in\n[Google Knowledge Graph Search\nAPI](https://developers.google.com/knowledge-graph/).","type":"string"},"languageCode":{"description":"Language code for `description` in BCP-47 format.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_ExplicitContentAnnotation":{"description":"Explicit content annotation (based on per-frame visual signals only).\nIf no explicit content has been detected in a frame, no annotations are\npresent for that frame.","properties":{"frames":{"description":"All video frames where explicit content was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_ExplicitContentFrame"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_ExplicitContentDetectionConfig":{"description":"Config for EXPLICIT_CONTENT_DETECTION.","properties":{"model":{"description":"Model to use for explicit content detection.\nSupported values: \"builtin/stable\" (the default if unset) and\n\"builtin/latest\".","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_ExplicitContentFrame":{"description":"Video frame level annotation results for explicit content.","properties":{"pornographyLikelihood":{"description":"Likelihood of the pornography content..","enum":["LIKELIHOOD_UNSPECIFIED","VERY_UNLIKELY","UNLIKELY","POSSIBLE","LIKELY","VERY_LIKELY"],"type":"string"},"timeOffset":{"description":"Time-offset, relative to the beginning of the video, corresponding to the\nvideo frame for this location.","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_LabelAnnotation":{"description":"Label annotation.","properties":{"categoryEntities":{"description":"Common categories for the detected entity.\nE.g. when the label is `Terrier` the category is likely `dog`. And in some\ncases there might be more than one categories e.g. 
`Terrier` could also be\na `pet`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_Entity"},"type":"array"},"entity":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_Entity"},"frames":{"description":"All video frames where a label was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_LabelFrame"},"type":"array"},"segments":{"description":"All video segments where a label was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_LabelSegment"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_LabelDetectionConfig":{"description":"Config for LABEL_DETECTION.","properties":{"labelDetectionMode":{"description":"What labels should be detected with LABEL_DETECTION, in addition to\nvideo-level labels or segment-level labels.\nIf unspecified, defaults to `SHOT_MODE`.","enum":["LABEL_DETECTION_MODE_UNSPECIFIED","SHOT_MODE","FRAME_MODE","SHOT_AND_FRAME_MODE"],"type":"string"},"model":{"description":"Model to use for label detection.\nSupported values: \"builtin/stable\" (the default if unset) and\n\"builtin/latest\".","type":"string"},"stationaryCamera":{"description":"Whether the video has been shot from a stationary (i.e. non-moving) camera.\nWhen set to true, might improve detection accuracy for moving objects.\nShould be used with `SHOT_AND_FRAME_MODE` enabled.","type":"boolean"}},"type":"object"},"GoogleCloudVideointelligenceV1_LabelFrame":{"description":"Video frame level annotation results for label detection.","properties":{"confidence":{"description":"Confidence that the label is accurate. 
Range: [0, 1].","format":"float","type":"number"},"timeOffset":{"description":"Time-offset, relative to the beginning of the video, corresponding to the\nvideo frame for this location.","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_LabelSegment":{"description":"Video segment level annotation results for label detection.","properties":{"confidence":{"description":"Confidence that the label is accurate. Range: [0, 1].","format":"float","type":"number"},"segment":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_VideoSegment"}},"type":"object"},"GoogleCloudVideointelligenceV1_ShotChangeDetectionConfig":{"description":"Config for SHOT_CHANGE_DETECTION.","properties":{"model":{"description":"Model to use for shot change detection.\nSupported values: \"builtin/stable\" (the default if unset) and\n\"builtin/latest\".","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_SpeechContext":{"description":"Provides \"hints\" to the speech recognizer to favor specific words and phrases\nin the results.","properties":{"phrases":{"description":"*Optional* A list of strings containing words and phrases \"hints\" so that\nthe speech recognition is more likely to recognize them. This can be used\nto improve the accuracy for specific words and phrases, for example, if\nspecific commands are typically spoken by the user. This can also be used\nto add additional words to the vocabulary of the recognizer. See\n[usage limits](https://cloud.google.com/speech/limits#content).","items":{"type":"string"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_SpeechRecognitionAlternative":{"description":"Alternative hypotheses (a.k.a. n-best list).","properties":{"confidence":{"description":"The confidence estimate between 0.0 and 1.0. A higher number\nindicates an estimated greater likelihood that the recognized words are\ncorrect. 
This field is typically provided only for the top hypothesis, and\nonly for `is_final=true` results. Clients should not rely on the\n`confidence` field as it is not guaranteed to be accurate or consistent.\nThe default of 0.0 is a sentinel value indicating `confidence` was not set.","format":"float","type":"number"},"transcript":{"description":"Transcript text representing the words that the user spoke.","type":"string"},"words":{"description":"A list of word-specific information for each recognized word.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_WordInfo"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_SpeechTranscription":{"description":"A speech recognition result corresponding to a portion of the audio.","properties":{"alternatives":{"description":"May contain one or more recognition hypotheses (up to the maximum specified\nin `max_alternatives`). These alternatives are ordered in terms of\naccuracy, with the top (first) alternative being the most probable, as\nranked by the recognizer.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_SpeechRecognitionAlternative"},"type":"array"},"languageCode":{"description":"Output only. The\n[BCP-47](https://www.rfc-editor.org/rfc/bcp/bcp47.txt) language tag of the\nlanguage in this result. This language code was detected to have the most\nlikelihood of being spoken in the audio.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_SpeechTranscriptionConfig":{"description":"Config for SPEECH_TRANSCRIPTION.","properties":{"audioTracks":{"description":"*Optional* For file formats, such as MXF or MKV, supporting multiple audio\ntracks, specify up to two tracks. 
Default: track 0.","items":{"format":"int32","type":"integer"},"type":"array"},"diarizationSpeakerCount":{"description":"*Optional*\nIf set, specifies the estimated number of speakers in the conversation.\nIf not set, defaults to '2'.\nIgnored unless enable_speaker_diarization is set to true.","format":"int32","type":"integer"},"enableAutomaticPunctuation":{"description":"*Optional* If 'true', adds punctuation to recognition result hypotheses.\nThis feature is only available in select languages. Setting this for\nrequests in other languages has no effect at all. The default 'false' value\ndoes not add punctuation to result hypotheses. NOTE: \"This is currently\noffered as an experimental service, complimentary to all users. In the\nfuture this may be exclusively available as a premium feature.\"","type":"boolean"},"enableSpeakerDiarization":{"description":"*Optional* If 'true', enables speaker detection for each recognized word in\nthe top alternative of the recognition result using a speaker_tag provided\nin the WordInfo.\nNote: When this is true, we send all the words from the beginning of the\naudio for the top alternative in every consecutive responses.\nThis is done in order to improve our speaker tags as our models learn to\nidentify the speakers in the conversation over time.","type":"boolean"},"enableWordConfidence":{"description":"*Optional* If `true`, the top result includes a list of words and the\nconfidence for those words. If `false`, no word-level confidence\ninformation is returned. The default is `false`.","type":"boolean"},"filterProfanity":{"description":"*Optional* If set to `true`, the server will attempt to filter out\nprofanities, replacing all but the initial character in each filtered word\nwith asterisks, e.g. \"f***\". 
If set to `false` or omitted, profanities\nwon't be filtered out.","type":"boolean"},"languageCode":{"description":"*Required* The language of the supplied audio as a\n[BCP-47](https://www.rfc-editor.org/rfc/bcp/bcp47.txt) language tag.\nExample: \"en-US\".\nSee [Language Support](https://cloud.google.com/speech/docs/languages)\nfor a list of the currently supported language codes.","type":"string"},"maxAlternatives":{"description":"*Optional* Maximum number of recognition hypotheses to be returned.\nSpecifically, the maximum number of `SpeechRecognitionAlternative` messages\nwithin each `SpeechTranscription`. The server may return fewer than\n`max_alternatives`. Valid values are `0`-`30`. A value of `0` or `1` will\nreturn a maximum of one. If omitted, will return a maximum of one.","format":"int32","type":"integer"},"speechContexts":{"description":"*Optional* A means to provide context to assist the speech recognition.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_SpeechContext"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_VideoAnnotationProgress":{"description":"Annotation progress for a single video.","properties":{"inputUri":{"description":"Video file location in\n[Google Cloud Storage](https://cloud.google.com/storage/).","type":"string"},"progressPercent":{"description":"Approximate percentage processed thus far. 
Guaranteed to be\n100 when fully processed.","format":"int32","type":"integer"},"startTime":{"description":"Time when the request was received.","format":"google-datetime","type":"string"},"updateTime":{"description":"Time of the most recent update.","format":"google-datetime","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_VideoAnnotationResults":{"description":"Annotation results for a single video.","properties":{"error":{"$ref":"#/components/schemas/GoogleRpc_Status"},"explicitAnnotation":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_ExplicitContentAnnotation"},"frameLabelAnnotations":{"description":"Label annotations on frame level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_LabelAnnotation"},"type":"array"},"inputUri":{"description":"Video file location in\n[Google Cloud Storage](https://cloud.google.com/storage/).","type":"string"},"segmentLabelAnnotations":{"description":"Label annotations on video level or user specified segment level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_LabelAnnotation"},"type":"array"},"shotAnnotations":{"description":"Shot annotations. 
Each shot is represented as a video segment.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_VideoSegment"},"type":"array"},"shotLabelAnnotations":{"description":"Label annotations on shot level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_LabelAnnotation"},"type":"array"},"speechTranscriptions":{"description":"Speech transcription.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_SpeechTranscription"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1_VideoContext":{"description":"Video context and/or feature-specific parameters.","properties":{"explicitContentDetectionConfig":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_ExplicitContentDetectionConfig"},"labelDetectionConfig":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_LabelDetectionConfig"},"segments":{"description":"Video segments to annotate. The segments may overlap and are not required\nto be contiguous or span the whole video. 
If unspecified, each video is\ntreated as a single segment.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_VideoSegment"},"type":"array"},"shotChangeDetectionConfig":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_ShotChangeDetectionConfig"},"speechTranscriptionConfig":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1_SpeechTranscriptionConfig"}},"type":"object"},"GoogleCloudVideointelligenceV1_VideoSegment":{"description":"Video segment.","properties":{"endTimeOffset":{"description":"Time-offset, relative to the beginning of the video,\ncorresponding to the end of the segment (inclusive).","format":"google-duration","type":"string"},"startTimeOffset":{"description":"Time-offset, relative to the beginning of the video,\ncorresponding to the start of the segment (inclusive).","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1_WordInfo":{"description":"Word-specific information for recognized words. Word information is only\nincluded in the response when certain request parameters are set, such\nas `enable_word_time_offsets`.","properties":{"confidence":{"description":"Output only. The confidence estimate between 0.0 and 1.0. A higher number\nindicates an estimated greater likelihood that the recognized words are\ncorrect. This field is set only for the top alternative.\nThis field is not guaranteed to be accurate and users should not rely on it\nto be always provided.\nThe default of 0.0 is a sentinel value indicating `confidence` was not set.","format":"float","type":"number"},"endTime":{"description":"Time offset relative to the beginning of the audio, and\ncorresponding to the end of the spoken word. This field is only set if\n`enable_word_time_offsets=true` and only in the top hypothesis. This is an\nexperimental feature and the accuracy of the time offset can vary.","format":"google-duration","type":"string"},"speakerTag":{"description":"Output only. 
A distinct integer value is assigned for every speaker within\nthe audio. This field specifies which one of those speakers was detected to\nhave spoken this word. Value ranges from 1 up to diarization_speaker_count,\nand is only set if speaker diarization is enabled.","format":"int32","type":"integer"},"startTime":{"description":"Time offset relative to the beginning of the audio, and\ncorresponding to the start of the spoken word. This field is only set if\n`enable_word_time_offsets=true` and only in the top hypothesis. This is an\nexperimental feature and the accuracy of the time offset can vary.","format":"google-duration","type":"string"},"word":{"description":"The word corresponding to this set of information.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_AnnotateVideoProgress":{"description":"Video annotation progress. Included in the `metadata`\nfield of the `Operation` returned by the `GetOperation`\ncall of the `google::longrunning::Operations` service.","properties":{"annotationProgress":{"description":"Progress metadata for all videos specified in `AnnotateVideoRequest`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_VideoAnnotationProgress"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_AnnotateVideoResponse":{"description":"Video annotation response. Included in the `response`\nfield of the `Operation` returned by the `GetOperation`\ncall of the `google::longrunning::Operations` service.","properties":{"annotationResults":{"description":"Annotation results for all videos specified in `AnnotateVideoRequest`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_VideoAnnotationResults"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_Entity":{"description":"Detected entity from video analysis.","properties":{"description":{"description":"Textual description, e.g. 
`Fixed-gear bicycle`.","type":"string"},"entityId":{"description":"Opaque entity ID. Some IDs may be available in\n[Google Knowledge Graph Search\nAPI](https://developers.google.com/knowledge-graph/).","type":"string"},"languageCode":{"description":"Language code for `description` in BCP-47 format.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_ExplicitContentAnnotation":{"description":"Explicit content annotation (based on per-frame visual signals only).\nIf no explicit content has been detected in a frame, no annotations are\npresent for that frame.","properties":{"frames":{"description":"All video frames where explicit content was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_ExplicitContentFrame"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_ExplicitContentFrame":{"description":"Video frame level annotation results for explicit content.","properties":{"pornographyLikelihood":{"description":"Likelihood of the pornography content..","enum":["LIKELIHOOD_UNSPECIFIED","VERY_UNLIKELY","UNLIKELY","POSSIBLE","LIKELY","VERY_LIKELY"],"type":"string"},"timeOffset":{"description":"Time-offset, relative to the beginning of the video, corresponding to the\nvideo frame for this location.","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_LabelAnnotation":{"description":"Label annotation.","properties":{"categoryEntities":{"description":"Common categories for the detected entity.\nE.g. when the label is `Terrier` the category is likely `dog`. And in some\ncases there might be more than one categories e.g. 
`Terrier` could also be\na `pet`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_Entity"},"type":"array"},"entity":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_Entity"},"frames":{"description":"All video frames where a label was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_LabelFrame"},"type":"array"},"segments":{"description":"All video segments where a label was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_LabelSegment"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_LabelFrame":{"description":"Video frame level annotation results for label detection.","properties":{"confidence":{"description":"Confidence that the label is accurate. Range: [0, 1].","format":"float","type":"number"},"timeOffset":{"description":"Time-offset, relative to the beginning of the video, corresponding to the\nvideo frame for this location.","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_LabelSegment":{"description":"Video segment level annotation results for label detection.","properties":{"confidence":{"description":"Confidence that the label is accurate. Range: [0, 1].","format":"float","type":"number"},"segment":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_VideoSegment"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_SpeechRecognitionAlternative":{"description":"Alternative hypotheses (a.k.a. n-best list).","properties":{"confidence":{"description":"The confidence estimate between 0.0 and 1.0. A higher number\nindicates an estimated greater likelihood that the recognized words are\ncorrect. This field is typically provided only for the top hypothesis, and\nonly for `is_final=true` results. 
Clients should not rely on the\n`confidence` field as it is not guaranteed to be accurate or consistent.\nThe default of 0.0 is a sentinel value indicating `confidence` was not set.","format":"float","type":"number"},"transcript":{"description":"Transcript text representing the words that the user spoke.","type":"string"},"words":{"description":"A list of word-specific information for each recognized word.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_WordInfo"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_SpeechTranscription":{"description":"A speech recognition result corresponding to a portion of the audio.","properties":{"alternatives":{"description":"May contain one or more recognition hypotheses (up to the maximum specified\nin `max_alternatives`). These alternatives are ordered in terms of\naccuracy, with the top (first) alternative being the most probable, as\nranked by the recognizer.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_SpeechRecognitionAlternative"},"type":"array"},"languageCode":{"description":"Output only. The\n[BCP-47](https://www.rfc-editor.org/rfc/bcp/bcp47.txt) language tag of the\nlanguage in this result. This language code was detected to have the most\nlikelihood of being spoken in the audio.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_VideoAnnotationProgress":{"description":"Annotation progress for a single video.","properties":{"inputUri":{"description":"Video file location in\n[Google Cloud Storage](https://cloud.google.com/storage/).","type":"string"},"progressPercent":{"description":"Approximate percentage processed thus far. 
Guaranteed to be\n100 when fully processed.","format":"int32","type":"integer"},"startTime":{"description":"Time when the request was received.","format":"google-datetime","type":"string"},"updateTime":{"description":"Time of the most recent update.","format":"google-datetime","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_VideoAnnotationResults":{"description":"Annotation results for a single video.","properties":{"error":{"$ref":"#/components/schemas/GoogleRpc_Status"},"explicitAnnotation":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_ExplicitContentAnnotation"},"frameLabelAnnotations":{"description":"Label annotations on frame level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_LabelAnnotation"},"type":"array"},"inputUri":{"description":"Video file location in\n[Google Cloud Storage](https://cloud.google.com/storage/).","type":"string"},"segmentLabelAnnotations":{"description":"Label annotations on video level or user specified segment level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_LabelAnnotation"},"type":"array"},"shotAnnotations":{"description":"Shot annotations. 
Each shot is represented as a video segment.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_VideoSegment"},"type":"array"},"shotLabelAnnotations":{"description":"Label annotations on shot level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_LabelAnnotation"},"type":"array"},"speechTranscriptions":{"description":"Speech transcription.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1beta2_SpeechTranscription"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_VideoSegment":{"description":"Video segment.","properties":{"endTimeOffset":{"description":"Time-offset, relative to the beginning of the video,\ncorresponding to the end of the segment (inclusive).","format":"google-duration","type":"string"},"startTimeOffset":{"description":"Time-offset, relative to the beginning of the video,\ncorresponding to the start of the segment (inclusive).","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1beta2_WordInfo":{"description":"Word-specific information for recognized words. Word information is only\nincluded in the response when certain request parameters are set, such\nas `enable_word_time_offsets`.","properties":{"confidence":{"description":"Output only. The confidence estimate between 0.0 and 1.0. A higher number\nindicates an estimated greater likelihood that the recognized words are\ncorrect. This field is set only for the top alternative.\nThis field is not guaranteed to be accurate and users should not rely on it\nto be always provided.\nThe default of 0.0 is a sentinel value indicating `confidence` was not set.","format":"float","type":"number"},"endTime":{"description":"Time offset relative to the beginning of the audio, and\ncorresponding to the end of the spoken word. This field is only set if\n`enable_word_time_offsets=true` and only in the top hypothesis. 
This is an\nexperimental feature and the accuracy of the time offset can vary.","format":"google-duration","type":"string"},"speakerTag":{"description":"Output only. A distinct integer value is assigned for every speaker within\nthe audio. This field specifies which one of those speakers was detected to\nhave spoken this word. Value ranges from 1 up to diarization_speaker_count,\nand is only set if speaker diarization is enabled.","format":"int32","type":"integer"},"startTime":{"description":"Time offset relative to the beginning of the audio, and\ncorresponding to the start of the spoken word. This field is only set if\n`enable_word_time_offsets=true` and only in the top hypothesis. This is an\nexperimental feature and the accuracy of the time offset can vary.","format":"google-duration","type":"string"},"word":{"description":"The word corresponding to this set of information.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_AnnotateVideoProgress":{"description":"Video annotation progress. Included in the `metadata`\nfield of the `Operation` returned by the `GetOperation`\ncall of the `google::longrunning::Operations` service.","properties":{"annotationProgress":{"description":"Progress metadata for all videos specified in `AnnotateVideoRequest`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_VideoAnnotationProgress"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_AnnotateVideoResponse":{"description":"Video annotation response. 
Included in the `response`\nfield of the `Operation` returned by the `GetOperation`\ncall of the `google::longrunning::Operations` service.","properties":{"annotationResults":{"description":"Annotation results for all videos specified in `AnnotateVideoRequest`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_VideoAnnotationResults"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_Entity":{"description":"Detected entity from video analysis.","properties":{"description":{"description":"Textual description, e.g. `Fixed-gear bicycle`.","type":"string"},"entityId":{"description":"Opaque entity ID. Some IDs may be available in\n[Google Knowledge Graph Search\nAPI](https://developers.google.com/knowledge-graph/).","type":"string"},"languageCode":{"description":"Language code for `description` in BCP-47 format.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_ExplicitContentAnnotation":{"description":"Explicit content annotation (based on per-frame visual signals only).\nIf no explicit content has been detected in a frame, no annotations are\npresent for that frame.","properties":{"frames":{"description":"All video frames where explicit content was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_ExplicitContentFrame"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_ExplicitContentFrame":{"description":"Video frame level annotation results for explicit content.","properties":{"pornographyLikelihood":{"description":"Likelihood of the pornography content.","enum":["LIKELIHOOD_UNSPECIFIED","VERY_UNLIKELY","UNLIKELY","POSSIBLE","LIKELY","VERY_LIKELY"],"type":"string"},"timeOffset":{"description":"Time-offset, relative to the beginning of the video, corresponding to the\nvideo frame for this 
location.","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_LabelAnnotation":{"description":"Label annotation.","properties":{"categoryEntities":{"description":"Common categories for the detected entity.\nE.g. when the label is `Terrier` the category is likely `dog`. And in some\ncases there might be more than one category, e.g. `Terrier` could also be\na `pet`.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_Entity"},"type":"array"},"entity":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_Entity"},"frames":{"description":"All video frames where a label was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_LabelFrame"},"type":"array"},"segments":{"description":"All video segments where a label was detected.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_LabelSegment"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_LabelFrame":{"description":"Video frame level annotation results for label detection.","properties":{"confidence":{"description":"Confidence that the label is accurate. Range: [0, 1].","format":"float","type":"number"},"timeOffset":{"description":"Time-offset, relative to the beginning of the video, corresponding to the\nvideo frame for this location.","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_LabelSegment":{"description":"Video segment level annotation results for label detection.","properties":{"confidence":{"description":"Confidence that the label is accurate. Range: [0, 1].","format":"float","type":"number"},"segment":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_VideoSegment"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_SpeechRecognitionAlternative":{"description":"Alternative hypotheses (a.k.a. 
n-best list).","properties":{"confidence":{"description":"The confidence estimate between 0.0 and 1.0. A higher number\nindicates an estimated greater likelihood that the recognized words are\ncorrect. This field is typically provided only for the top hypothesis, and\nonly for `is_final=true` results. Clients should not rely on the\n`confidence` field as it is not guaranteed to be accurate or consistent.\nThe default of 0.0 is a sentinel value indicating `confidence` was not set.","format":"float","type":"number"},"transcript":{"description":"Transcript text representing the words that the user spoke.","type":"string"},"words":{"description":"A list of word-specific information for each recognized word.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_WordInfo"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_SpeechTranscription":{"description":"A speech recognition result corresponding to a portion of the audio.","properties":{"alternatives":{"description":"May contain one or more recognition hypotheses (up to the maximum specified\nin `max_alternatives`). These alternatives are ordered in terms of\naccuracy, with the top (first) alternative being the most probable, as\nranked by the recognizer.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_SpeechRecognitionAlternative"},"type":"array"},"languageCode":{"description":"Output only. The\n[BCP-47](https://www.rfc-editor.org/rfc/bcp/bcp47.txt) language tag of the\nlanguage in this result. 
This language code was detected to have the most\nlikelihood of being spoken in the audio.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_VideoAnnotationProgress":{"description":"Annotation progress for a single video.","properties":{"inputUri":{"description":"Video file location in\n[Google Cloud Storage](https://cloud.google.com/storage/).","type":"string"},"progressPercent":{"description":"Approximate percentage processed thus far. Guaranteed to be\n100 when fully processed.","format":"int32","type":"integer"},"startTime":{"description":"Time when the request was received.","format":"google-datetime","type":"string"},"updateTime":{"description":"Time of the most recent update.","format":"google-datetime","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_VideoAnnotationResults":{"description":"Annotation results for a single video.","properties":{"error":{"$ref":"#/components/schemas/GoogleRpc_Status"},"explicitAnnotation":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_ExplicitContentAnnotation"},"frameLabelAnnotations":{"description":"Label annotations on frame level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_LabelAnnotation"},"type":"array"},"inputUri":{"description":"Video file location in\n[Google Cloud Storage](https://cloud.google.com/storage/).","type":"string"},"segmentLabelAnnotations":{"description":"Label annotations on video level or user specified segment level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_LabelAnnotation"},"type":"array"},"shotAnnotations":{"description":"Shot annotations. 
Each shot is represented as a video segment.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_VideoSegment"},"type":"array"},"shotLabelAnnotations":{"description":"Label annotations on shot level.\nThere is exactly one element for each unique label.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_LabelAnnotation"},"type":"array"},"speechTranscriptions":{"description":"Speech transcription.","items":{"$ref":"#/components/schemas/GoogleCloudVideointelligenceV1p1beta1_SpeechTranscription"},"type":"array"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_VideoSegment":{"description":"Video segment.","properties":{"endTimeOffset":{"description":"Time-offset, relative to the beginning of the video,\ncorresponding to the end of the segment (inclusive).","format":"google-duration","type":"string"},"startTimeOffset":{"description":"Time-offset, relative to the beginning of the video,\ncorresponding to the start of the segment (inclusive).","format":"google-duration","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p1beta1_WordInfo":{"description":"Word-specific information for recognized words. Word information is only\nincluded in the response when certain request parameters are set, such\nas `enable_word_time_offsets`.","properties":{"confidence":{"description":"Output only. The confidence estimate between 0.0 and 1.0. A higher number\nindicates an estimated greater likelihood that the recognized words are\ncorrect. This field is set only for the top alternative.\nThis field is not guaranteed to be accurate and users should not rely on it\nto be always provided.\nThe default of 0.0 is a sentinel value indicating `confidence` was not set.","format":"float","type":"number"},"endTime":{"description":"Time offset relative to the beginning of the audio, and\ncorresponding to the end of the spoken word. This field is only set if\n`enable_word_time_offsets=true` and only in the top hypothesis. 
This is an\nexperimental feature and the accuracy of the time offset can vary.","format":"google-duration","type":"string"},"speakerTag":{"description":"Output only. A distinct integer value is assigned for every speaker within\nthe audio. This field specifies which one of those speakers was detected to\nhave spoken this word. Value ranges from 1 up to diarization_speaker_count,\nand is only set if speaker diarization is enabled.","format":"int32","type":"integer"},"startTime":{"description":"Time offset relative to the beginning of the audio, and\ncorresponding to the start of the spoken word. This field is only set if\n`enable_word_time_offsets=true` and only in the top hypothesis. This is an\nexperimental feature and the accuracy of the time offset can vary.","format":"google-duration","type":"string"},"word":{"description":"The word corresponding to this set of information.","type":"string"}},"type":"object"},"GoogleCloudVideointelligenceV1p2beta1_AnnotateVideoProgress":{"description":"Video annotation progress. Included in the `metadata`\nfield of the `Operation` returned by the `GetOperation`\ncall of the `google::longrunning::Operations` service.","properties":{"annotationProgress":{"description":"