# python-batch/cuda_pubsub/nvidia-python.yaml
# Copyright 2023 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Job configuration for a GPU container job.
# Values such as "project_id", "<my_bucket>" and "<my_project>" are
# placeholders and must be replaced before use.
project_id: "project_id"
region: "us-central1"

# Bucket mounted at gcs_path; the container script below writes its output
# under this mount point.
volumes:
  - bucket_name: "<my_bucket>"
    gcs_path: "/mnt/disks/work"

job_prefix: 'nvidia-python-'

task_count: 12  # optional
parallelism: 4  # optional
task_count_per_node: 4  # optional

machine_type: "n1-standard-4"
accelerator:
  type: "nvidia-tesla-t4"
  count: 2
# Canonical boolean: a bare `y` is a bool for some YAML 1.1 loaders and the
# string "y" for others, so spell it out.
# NOTE(review): placed at top level (sibling of `accelerator`) -- confirm
# against the consumer of this file.
install_gpu_drivers: true

cpu_milli: 1000  # optional
# NOTE(review): 102400 MiB looks larger than the memory of the machine_type
# above -- confirm this value is intended.
memory_mib: 102400  # optional

container:
  image_uri: "us-central1-docker.pkg.dev/<my_project>/cuda/pybatch:latest"
  entry_point: "/bin/bash"
  commands:
    - "-c"
    # Script passed to `bash -c`:
    #   1. reads the active project from gcloud into PID;
    #   2. calls /tmp/pull_fifo_id.py to obtain FIFO_ID (TOPIC_ID is not set
    #      in this file -- presumably injected by the launcher; verify);
    #   3. exits with status 0 when no FIFO_ID was returned;
    #   4. otherwise runs /tmp/simpleCUFFT_2d_MGPU and appends its stdout to
    #      a per-job directory on the mounted volume.
    - |-
      export PID=$(gcloud config get-value project);
      echo python3 /tmp/pull_fifo_id.py --project_id=$PID --job_id=$TOPIC_ID;
      export FIFO_ID=$(python3 /tmp/pull_fifo_id.py --project_id=$PID --job_id=$TOPIC_ID);
      echo Obtained FIFO_ID: --- $FIFO_ID ---;
      if [ -z "$FIFO_ID" ]; then echo FIFO NOT DEFINED -- exiting; exit 0; fi;
      echo Running FIFO_ID: $FIFO_ID;
      mkdir -p /mnt/disks/work/dir_${BATCH_JOB_ID};
      /tmp/simpleCUFFT_2d_MGPU >> /mnt/disks/work/dir_${BATCH_JOB_ID}/out_${FIFO_ID}.txt

labels:
  env: "container"
  type: "nvidia"