components/otelopscol/receiver/nvmlreceiver/metadata.yaml (52 lines of code) (raw):

# Copyright 2025 Google LLC # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. type: nvml status: class: receiver stability: beta: [metrics] attributes: uuid: type: string description: GPU universally unique identifier gpu_number: type: string description: GPU index starting at 0. model: type: string description: GPU model memory_state: type: string description: GPU memory used or free. enum: [used, free] pid: type: int description: Process ID. process: type: string description: Process name. command: type: string description: Process command. command_line: type: string description: Process command line, 1024 characters maximum. owner: type: string description: Process owner. metrics: nvml.gpu.utilization: enabled: true description: Fraction of time GPU was not idle since the last sample. unit: "1" gauge: value_type: double attributes: [model, gpu_number, uuid] nvml.gpu.memory.bytes_used: enabled: true description: Current number of GPU memory bytes used by state. Summing the values of all states yields the total GPU memory space. unit: By gauge: value_type: int attributes: [model, gpu_number, uuid, memory_state] nvml.gpu.processes.utilization: enabled: true description: Fraction of time over the process's life thus far during which one or more kernels was executing on the GPU. unit: "1" gauge: value_type: double attributes: [model, gpu_number, uuid, pid, process, command, command_line, owner] nvml.gpu.processes.max_bytes_used: enabled: true description: Maximum total GPU memory in bytes that was ever allocated by the process. unit: By gauge: value_type: int attributes: [model, gpu_number, uuid, pid, process, command, command_line, owner]