aiplatform/api/AIPlatform.Samples/MultimodalMultiImage.cs (61 lines of code) (raw):
/*
* Copyright 2024 Google LLC
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* https://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
// [START generativeaionvertexai_gemini_single_turn_multi_image]
using Google.Api.Gax.Grpc;
using Google.Cloud.AIPlatform.V1;
using Google.Protobuf;
using System.Net.Http;
using System.Text;
using System.Threading.Tasks;
public class MultimodalMultiImage
{
public async Task<string> GenerateContent(
string projectId = "your-project-id",
string location = "us-central1",
string publisher = "google",
string model = "gemini-2.0-flash-001"
)
{
var predictionServiceClient = new PredictionServiceClientBuilder
{
Endpoint = $"{location}-aiplatform.googleapis.com"
}.Build();
ByteString colosseum = await ReadImageFileAsync(
"https://storage.googleapis.com/cloud-samples-data/vertex-ai/llm/prompts/landmark1.png");
ByteString forbiddenCity = await ReadImageFileAsync(
"https://storage.googleapis.com/cloud-samples-data/vertex-ai/llm/prompts/landmark2.png");
ByteString christRedeemer = await ReadImageFileAsync(
"https://storage.googleapis.com/cloud-samples-data/vertex-ai/llm/prompts/landmark3.png");
var generateContentRequest = new GenerateContentRequest
{
Model = $"projects/{projectId}/locations/{location}/publishers/{publisher}/models/{model}",
Contents =
{
new Content
{
Role = "USER",
Parts =
{
new Part { InlineData = new() { MimeType = "image/png", Data = colosseum }},
new Part { Text = "city: Rome, Landmark: the Colosseum" },
new Part { InlineData = new() { MimeType = "image/png", Data = forbiddenCity }},
new Part { Text = "city: Beijing, Landmark: Forbidden City"},
new Part { InlineData = new() { MimeType = "image/png", Data = christRedeemer }}
}
}
}
};
using PredictionServiceClient.StreamGenerateContentStream response = predictionServiceClient.StreamGenerateContent(generateContentRequest);
StringBuilder fullText = new();
AsyncResponseStream<GenerateContentResponse> responseStream = response.GetResponseStream();
await foreach (GenerateContentResponse responseItem in responseStream)
{
fullText.Append(responseItem.Candidates[0].Content.Parts[0].Text);
}
return fullText.ToString();
}
private static async Task<ByteString> ReadImageFileAsync(string url)
{
using HttpClient client = new();
using var response = await client.GetAsync(url);
byte[] imageBytes = await response.Content.ReadAsByteArrayAsync();
return ByteString.CopyFrom(imageBytes);
}
}
// [END generativeaionvertexai_gemini_single_turn_multi_image]