ai-platform/snippets/deploy-model.js

/* * Copyright 2020 Google LLC * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * https://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ 'use strict'; async function main( modelId, deployedModelDisplayName, endpointId, project, location = 'us-central1' ) { // [START aiplatform_deploy_model_sample] /** * TODO(developer): Uncomment these variables before running the sample.\ * (Not necessary if passing values as arguments) */ // const modelId = "YOUR_MODEL_ID"; // const endpointId = 'YOUR_ENDPOINT_ID'; // const deployedModelDisplayName = 'YOUR_DEPLOYED_MODEL_DISPLAY_NAME'; // const project = 'YOUR_PROJECT_ID'; // const location = 'YOUR_PROJECT_LOCATION'; const modelName = `projects/${project}/locations/${location}/models/${modelId}`; const endpoint = `projects/${project}/locations/${location}/endpoints/${endpointId}`; // Imports the Google Cloud Endpoint Service Client library const {EndpointServiceClient} = require('@google-cloud/aiplatform'); // Specifies the location of the api endpoint: const clientOptions = { apiEndpoint: 'us-central1-aiplatform.googleapis.com', }; // Instantiates a client const endpointServiceClient = new EndpointServiceClient(clientOptions); async function deployModel() { // Configure the parent resource // key '0' assigns traffic for the newly deployed model // Traffic percentage values must add up to 100 // Leave dictionary empty if endpoint should not accept any traffic const trafficSplit = {0: 100}; const deployedModel = { // format: 'projects/{project}/locations/{location}/models/{model}' model: modelName, displayName: deployedModelDisplayName, automaticResources: {minReplicaCount: 1, maxReplicaCount: 1}, }; const request = { endpoint, deployedModel, trafficSplit, }; // Get and print out a list of all the endpoints for this resource const [response] = await endpointServiceClient.deployModel(request); console.log(`Long running operation : ${response.name}`); // Wait for operation to complete await response.promise(); const result = response.result; console.log('Deploy model response'); const modelDeployed = result.deployedModel; console.log('\tDeployed model'); if (!modelDeployed) { console.log('\t\tId : {}'); console.log('\t\tModel : {}'); console.log('\t\tDisplay name : {}'); console.log('\t\tCreate time : {}'); console.log('\t\tDedicated resources'); console.log('\t\t\tMin replica count : {}'); console.log('\t\t\tMachine spec {}'); console.log('\t\t\t\tMachine type : {}'); console.log('\t\t\t\tAccelerator type : {}'); console.log('\t\t\t\tAccelerator count : {}'); console.log('\t\tAutomatic resources'); console.log('\t\t\tMin replica count : {}'); console.log('\t\t\tMax replica count : {}'); } else { console.log(`\t\tId : ${modelDeployed.id}`); console.log(`\t\tModel : ${modelDeployed.model}`); console.log(`\t\tDisplay name : ${modelDeployed.displayName}`); console.log(`\t\tCreate time : ${modelDeployed.createTime}`); const dedicatedResources = modelDeployed.dedicatedResources; console.log('\t\tDedicated resources'); if (!dedicatedResources) { console.log('\t\t\tMin replica count : {}'); console.log('\t\t\tMachine spec {}'); console.log('\t\t\t\tMachine type : {}'); console.log('\t\t\t\tAccelerator type : {}'); console.log('\t\t\t\tAccelerator count : {}'); } else { console.log( `\t\t\tMin replica count : \ ${dedicatedResources.minReplicaCount}` ); const machineSpec = dedicatedResources.machineSpec; console.log('\t\t\tMachine spec'); console.log(`\t\t\t\tMachine type : ${machineSpec.machineType}`); console.log( `\t\t\t\tAccelerator type : ${machineSpec.acceleratorType}` ); console.log( `\t\t\t\tAccelerator count : ${machineSpec.acceleratorCount}` ); } const automaticResources = modelDeployed.automaticResources; console.log('\t\tAutomatic resources'); if (!automaticResources) { console.log('\t\t\tMin replica count : {}'); console.log('\t\t\tMax replica count : {}'); } else { console.log( `\t\t\tMin replica count : \ ${automaticResources.minReplicaCount}` ); console.log( `\t\t\tMax replica count : \ ${automaticResources.maxReplicaCount}` ); } } } deployModel(); // [END aiplatform_deploy_model_sample] } process.on('unhandledRejection', err => { console.error(err.message); process.exitCode = 1; }); main(...process.argv.slice(2));

ai-platform/snippets/deploy-model.js (100 lines of code) (raw):