internal/processmetrics/computeresources/hana_computeresources.go (108 lines of code) (raw):

/* Copyright 2022 Google LLC Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at https://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ package computeresources import ( "context" mrpb "google.golang.org/genproto/googleapis/monitoring/v3" "github.com/cenkalti/backoff/v4" "github.com/shirou/gopsutil/v3/process" "github.com/GoogleCloudPlatform/sapagent/internal/processmetrics/sapcontrol" cnfpb "github.com/GoogleCloudPlatform/sapagent/protos/configuration" sapb "github.com/GoogleCloudPlatform/sapagent/protos/sapapp" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/cloudmonitoring" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/commandlineexecutor" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/log" ) const ( hanaCPUPath = "/sap/hana/cpu/utilization" hanaMemoryPath = "/sap/hana/memory/utilization" hanaIOPSReadsPath = "/sap/hana/iops/reads" hanaIOPSWritesPath = "/sap/hana/iops/writes" ) type ( // HANAInstanceProperties have the required context for collecting metrics for cpu // memory per process for HANA, Netweaver and SAP Control. // It also implements the InstanceProperiesInterface for abstraction as defined in the // computreresources.go file. HANAInstanceProperties struct { Config *cnfpb.Configuration Client cloudmonitoring.TimeSeriesCreator Executor commandlineexecutor.Execute SAPInstance *sapb.SAPInstance LastValue map[string]*process.IOCountersStat NewProcHelper NewProcessWithContextHelper SAPControlClient sapcontrol.ClientInterface SkippedMetrics map[string]bool PMBackoffPolicy backoff.BackOffContext } ) // Collect SAP additional metrics like per process CPU and per process memory // utilization of SAP HANA Processes. // Collect method keeps on collecting all the metrics it can, logs errors if it encounters // any and returns the collected metrics with the last error encountered while collecting metrics. func (p *HANAInstanceProperties) Collect(ctx context.Context) ([]*mrpb.TimeSeries, error) { params := Parameters{ executor: p.Executor, client: p.Client, Config: p.Config, memoryMetricPath: hanaMemoryPath, cpuMetricPath: hanaCPUPath, iopsReadsMetricPath: hanaIOPSReadsPath, iopsWritesMetricPath: hanaIOPSWritesPath, LastValue: p.LastValue, SAPInstance: p.SAPInstance, NewProc: p.NewProcHelper, SAPControlClient: p.SAPControlClient, } var metricsCollectionErr error processes := CollectProcessesForInstance(ctx, params) if len(processes) == 0 { log.CtxLogger(ctx).Debug("Cannot collect CPU and memory per process for hana, empty process list.") return nil, nil } res := make([]*mrpb.TimeSeries, 0) if _, ok := p.SkippedMetrics[hanaCPUPath]; !ok { cpuMetrics, err := collectTimeSeriesMetrics(ctx, params, processes, collectCPUMetric) if err != nil { metricsCollectionErr = err } if cpuMetrics != nil { res = append(res, cpuMetrics...) } } if _, ok := p.SkippedMetrics[hanaMemoryPath]; !ok { memoryMetrics, err := collectTimeSeriesMetrics(ctx, params, processes, collectMemoryMetric) if err != nil { metricsCollectionErr = err } if memoryMetrics != nil { res = append(res, memoryMetrics...) } } skipIOPS := p.SkippedMetrics[hanaIOPSReadsPath] || p.SkippedMetrics[hanaIOPSWritesPath] if !skipIOPS { iopsMetrics, err := collectTimeSeriesMetrics(ctx, params, processes, collectDiskIOPSMetric) if err != nil { metricsCollectionErr = err } if iopsMetrics != nil { res = append(res, iopsMetrics...) } } return res, metricsCollectionErr } // CollectWithRetry decorates the Collect method with retry mechanism. func (p *HANAInstanceProperties) CollectWithRetry(ctx context.Context) ([]*mrpb.TimeSeries, error) { var ( attempt = 1 res []*mrpb.TimeSeries ) err := backoff.Retry(func() error { var err error select { case <-ctx.Done(): log.CtxLogger(ctx).Debugw("Context cancelled, exiting CollectWithRetry", "InstanceId", p.SAPInstance.GetInstanceId()) return nil default: res, err = p.Collect(ctx) if err != nil { log.CtxLogger(ctx).Debugw("Error in Collection", "attempt", attempt, "error", err) attempt++ } return err } }, p.PMBackoffPolicy) if err != nil { log.CtxLogger(ctx).Debugw("Retry limit exceeded", "InstanceId", p.SAPInstance.GetInstanceId()) } return res, err }