UNPKG

@pulumi/gcp

Version:

A Pulumi package for creating and managing Google Cloud Platform resources.

pulumi/pulumi-gcp

340 lines • 12.8 kB

JavaScript

"use strict"; // *** WARNING: this file was generated by pulumi-language-nodejs. *** // *** Do not edit by hand unless you're certain you know what you are doing! *** var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) { if (k2 === undefined) k2 = k; var desc = Object.getOwnPropertyDescriptor(m, k); if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) { desc = { enumerable: true, get: function() { return m[k]; } }; } Object.defineProperty(o, k2, desc); }) : (function(o, m, k, k2) { if (k2 === undefined) k2 = k; o[k2] = m[k]; })); var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) { Object.defineProperty(o, "default", { enumerable: true, value: v }); }) : function(o, v) { o["default"] = v; }); var __importStar = (this && this.__importStar) || function (mod) { if (mod && mod.__esModule) return mod; var result = {}; if (mod != null) for (var k in mod) if (k !== "default" && Object.prototype.hasOwnProperty.call(mod, k)) __createBinding(result, mod, k); __setModuleDefault(result, mod); return result; }; Object.defineProperty(exports, "__esModule", { value: true }); exports.AiEndpointWithModelGardenDeployment = void 0; const pulumi = __importStar(require("@pulumi/pulumi")); const utilities = __importStar(require("../utilities")); /** * Create an Endpoint and deploy a Model Garden model to it. * * To get more information about EndpointWithModelGardenDeployment, see: * * * [API documentation](https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations/deploy) * * How-to Guides * * [Overview of Model Garden](https://cloud.google.com/vertex-ai/generative-ai/docs/model-garden/explore-models) * * [Overview of self-deployed models](https://cloud.google.com/vertex-ai/generative-ai/docs/model-garden/self-deployed-models) * * [Use models in Model Garden](https://cloud.google.com/vertex-ai/generative-ai/docs/model-garden/use-models) * * ## Example Usage * * ### Vertex Ai Deploy Basic * * ```typescript * import * as pulumi from "@pulumi/pulumi"; * import * as gcp from "@pulumi/gcp"; * * const deploy = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy", { * publisherModelName: "publishers/google/models/paligemma@paligemma-224-float32", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * }); * ``` * ### Vertex Ai Deploy Huggingface Model * * ```typescript * import * as pulumi from "@pulumi/pulumi"; * import * as gcp from "@pulumi/gcp"; * * const deploy = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy", { * huggingFaceModelId: "Qwen/Qwen3-0.6B", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * }); * ``` * ### Vertex Ai Deploy With Configs * * ```typescript * import * as pulumi from "@pulumi/pulumi"; * import * as gcp from "@pulumi/gcp"; * * const deploy = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy", { * publisherModelName: "publishers/google/models/paligemma@paligemma-224-float32", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * deployConfig: { * dedicatedResources: { * machineSpec: { * machineType: "g2-standard-16", * acceleratorType: "NVIDIA_L4", * acceleratorCount: 1, * }, * minReplicaCount: 1, * }, * }, * }); * ``` * ### Vertex Ai Deploy Multiple Models In Parallel * * ```typescript * import * as pulumi from "@pulumi/pulumi"; * import * as gcp from "@pulumi/gcp"; * * const deploy_gemma_11_2b_it = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy-gemma-1_1-2b-it", { * publisherModelName: "publishers/google/models/gemma@gemma-1.1-2b-it", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * deployConfig: { * dedicatedResources: { * machineSpec: { * machineType: "g2-standard-12", * acceleratorType: "us-central1", * acceleratorCount: 1, * }, * minReplicaCount: 1, * }, * }, * }); * const deploy_qwen3_06b = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy-qwen3-0_6b", { * huggingFaceModelId: "Qwen/Qwen3-0.6B", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * deployConfig: { * dedicatedResources: { * machineSpec: { * machineType: "g2-standard-12", * acceleratorType: "NVIDIA_L4", * acceleratorCount: 1, * }, * minReplicaCount: 1, * }, * }, * }); * const deploy_llama_32_1b = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy-llama-3_2-1b", { * publisherModelName: "publishers/meta/models/llama3-2@llama-3.2-1b", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * deployConfig: { * dedicatedResources: { * machineSpec: { * machineType: "g2-standard-12", * acceleratorType: "NVIDIA_L4", * acceleratorCount: 1, * }, * minReplicaCount: 1, * }, * }, * }); * ``` * ### Vertex Ai Deploy Multiple Models In Sequence * * ```typescript * import * as pulumi from "@pulumi/pulumi"; * import * as gcp from "@pulumi/gcp"; * * const deploy_gemma_11_2b_it = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy-gemma-1_1-2b-it", { * publisherModelName: "publishers/google/models/gemma@gemma-1.1-2b-it", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * deployConfig: { * dedicatedResources: { * machineSpec: { * machineType: "g2-standard-12", * acceleratorType: "NVIDIA_L4", * acceleratorCount: 1, * }, * minReplicaCount: 1, * }, * }, * }); * const deploy_qwen3_06b = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy-qwen3-0_6b", { * huggingFaceModelId: "Qwen/Qwen3-0.6B", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * deployConfig: { * dedicatedResources: { * machineSpec: { * machineType: "g2-standard-12", * acceleratorType: "NVIDIA_L4", * acceleratorCount: 1, * }, * minReplicaCount: 1, * }, * }, * }, { * dependsOn: [deploy_gemma_11_2b_it], * }); * const deploy_llama_32_1b = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy-llama-3_2-1b", { * publisherModelName: "publishers/meta/models/llama3-2@llama-3.2-1b", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * deployConfig: { * dedicatedResources: { * machineSpec: { * machineType: "g2-standard-12", * acceleratorType: "NVIDIA_L4", * acceleratorCount: 1, * }, * minReplicaCount: 1, * }, * }, * }, { * dependsOn: [deploy_qwen3_06b], * }); * ``` * ### Vertex Ai Deploy Psc Endpoint * * ```typescript * import * as pulumi from "@pulumi/pulumi"; * import * as gcp from "@pulumi/gcp"; * * const deploy = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy", { * publisherModelName: "publishers/google/models/paligemma@paligemma-224-float32", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * endpointConfig: { * privateServiceConnectConfig: { * enablePrivateServiceConnect: true, * projectAllowlists: ["my-project-id"], * }, * }, * }); * ``` * ### Vertex Ai Deploy Psc Endpoint Automated * * ```typescript * import * as pulumi from "@pulumi/pulumi"; * import * as gcp from "@pulumi/gcp"; * * const network = new gcp.compute.Network("network", { * name: "network", * autoCreateSubnetworks: false, * }); * const project = gcp.organizations.getProject({}); * const deploy = new gcp.vertex.AiEndpointWithModelGardenDeployment("deploy", { * publisherModelName: "publishers/google/models/paligemma@paligemma-224-float32", * location: "us-central1", * modelConfig: { * acceptEula: true, * }, * endpointConfig: { * privateServiceConnectConfig: { * enablePrivateServiceConnect: true, * projectAllowlists: [project.then(project => project.id)], * pscAutomationConfigs: { * projectId: project.then(project => project.id), * network: network.id, * }, * }, * }, * }); * const subnetwork = new gcp.compute.Subnetwork("subnetwork", { * name: "subnetwork", * ipCidrRange: "192.168.0.0/24", * region: "us-central1", * network: network.id, * }); * ``` * * ## Import * * This resource does not support import. */ class AiEndpointWithModelGardenDeployment extends pulumi.CustomResource { /** * Get an existing AiEndpointWithModelGardenDeployment resource's state with the given name, ID, and optional extra * properties used to qualify the lookup. * * @param name The _unique_ name of the resulting resource. * @param id The _unique_ provider ID of the resource to lookup. * @param state Any extra arguments used during the lookup. * @param opts Optional settings to control the behavior of the CustomResource. */ static get(name, id, state, opts) { return new AiEndpointWithModelGardenDeployment(name, state, { ...opts, id: id }); } /** @internal */ static __pulumiType = 'gcp:vertex/aiEndpointWithModelGardenDeployment:AiEndpointWithModelGardenDeployment'; /** * Returns true if the given object is an instance of AiEndpointWithModelGardenDeployment. This is designed to work even * when multiple copies of the Pulumi SDK have been loaded into the same process. */ static isInstance(obj) { if (obj === undefined || obj === null) { return false; } return obj['__pulumiType'] === AiEndpointWithModelGardenDeployment.__pulumiType; } constructor(name, argsOrState, opts) { let resourceInputs = {}; opts = opts || {}; if (opts.id) { const state = argsOrState; resourceInputs["deletionPolicy"] = state?.deletionPolicy; resourceInputs["deployConfig"] = state?.deployConfig; resourceInputs["deployedModelDisplayName"] = state?.deployedModelDisplayName; resourceInputs["deployedModelId"] = state?.deployedModelId; resourceInputs["endpoint"] = state?.endpoint; resourceInputs["endpointConfig"] = state?.endpointConfig; resourceInputs["huggingFaceModelId"] = state?.huggingFaceModelId; resourceInputs["location"] = state?.location; resourceInputs["modelConfig"] = state?.modelConfig; resourceInputs["project"] = state?.project; resourceInputs["publisherModelName"] = state?.publisherModelName; } else { const args = argsOrState; if (args?.location === undefined && !opts.urn) { throw new Error("Missing required property 'location'"); } resourceInputs["deletionPolicy"] = args?.deletionPolicy; resourceInputs["deployConfig"] = args?.deployConfig; resourceInputs["endpointConfig"] = args?.endpointConfig; resourceInputs["huggingFaceModelId"] = args?.huggingFaceModelId; resourceInputs["location"] = args?.location; resourceInputs["modelConfig"] = args?.modelConfig; resourceInputs["project"] = args?.project; resourceInputs["publisherModelName"] = args?.publisherModelName; resourceInputs["deployedModelDisplayName"] = undefined /*out*/; resourceInputs["deployedModelId"] = undefined /*out*/; resourceInputs["endpoint"] = undefined /*out*/; } opts = pulumi.mergeOptions(utilities.resourceOptsDefaults(), opts); super(AiEndpointWithModelGardenDeployment.__pulumiType, name, resourceInputs, opts); } } exports.AiEndpointWithModelGardenDeployment = AiEndpointWithModelGardenDeployment; //# sourceMappingURL=aiEndpointWithModelGardenDeployment.js.map