internal/processmetrics/computeresources/hana_computeresources.go (108 lines of code) (raw):
/*
Copyright 2022 Google LLC
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package computeresources
import (
"context"
mrpb "google.golang.org/genproto/googleapis/monitoring/v3"
"github.com/cenkalti/backoff/v4"
"github.com/shirou/gopsutil/v3/process"
"github.com/GoogleCloudPlatform/sapagent/internal/processmetrics/sapcontrol"
cnfpb "github.com/GoogleCloudPlatform/sapagent/protos/configuration"
sapb "github.com/GoogleCloudPlatform/sapagent/protos/sapapp"
"github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/cloudmonitoring"
"github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/commandlineexecutor"
"github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/log"
)
const (
hanaCPUPath = "/sap/hana/cpu/utilization"
hanaMemoryPath = "/sap/hana/memory/utilization"
hanaIOPSReadsPath = "/sap/hana/iops/reads"
hanaIOPSWritesPath = "/sap/hana/iops/writes"
)
type (
// HANAInstanceProperties have the required context for collecting metrics for cpu
// memory per process for HANA, Netweaver and SAP Control.
// It also implements the InstanceProperiesInterface for abstraction as defined in the
// computreresources.go file.
HANAInstanceProperties struct {
Config *cnfpb.Configuration
Client cloudmonitoring.TimeSeriesCreator
Executor commandlineexecutor.Execute
SAPInstance *sapb.SAPInstance
LastValue map[string]*process.IOCountersStat
NewProcHelper NewProcessWithContextHelper
SAPControlClient sapcontrol.ClientInterface
SkippedMetrics map[string]bool
PMBackoffPolicy backoff.BackOffContext
}
)
// Collect SAP additional metrics like per process CPU and per process memory
// utilization of SAP HANA Processes.
// Collect method keeps on collecting all the metrics it can, logs errors if it encounters
// any and returns the collected metrics with the last error encountered while collecting metrics.
func (p *HANAInstanceProperties) Collect(ctx context.Context) ([]*mrpb.TimeSeries, error) {
params := Parameters{
executor: p.Executor,
client: p.Client,
Config: p.Config,
memoryMetricPath: hanaMemoryPath,
cpuMetricPath: hanaCPUPath,
iopsReadsMetricPath: hanaIOPSReadsPath,
iopsWritesMetricPath: hanaIOPSWritesPath,
LastValue: p.LastValue,
SAPInstance: p.SAPInstance,
NewProc: p.NewProcHelper,
SAPControlClient: p.SAPControlClient,
}
var metricsCollectionErr error
processes := CollectProcessesForInstance(ctx, params)
if len(processes) == 0 {
log.CtxLogger(ctx).Debug("Cannot collect CPU and memory per process for hana, empty process list.")
return nil, nil
}
res := make([]*mrpb.TimeSeries, 0)
if _, ok := p.SkippedMetrics[hanaCPUPath]; !ok {
cpuMetrics, err := collectTimeSeriesMetrics(ctx, params, processes, collectCPUMetric)
if err != nil {
metricsCollectionErr = err
}
if cpuMetrics != nil {
res = append(res, cpuMetrics...)
}
}
if _, ok := p.SkippedMetrics[hanaMemoryPath]; !ok {
memoryMetrics, err := collectTimeSeriesMetrics(ctx, params, processes, collectMemoryMetric)
if err != nil {
metricsCollectionErr = err
}
if memoryMetrics != nil {
res = append(res, memoryMetrics...)
}
}
skipIOPS := p.SkippedMetrics[hanaIOPSReadsPath] || p.SkippedMetrics[hanaIOPSWritesPath]
if !skipIOPS {
iopsMetrics, err := collectTimeSeriesMetrics(ctx, params, processes, collectDiskIOPSMetric)
if err != nil {
metricsCollectionErr = err
}
if iopsMetrics != nil {
res = append(res, iopsMetrics...)
}
}
return res, metricsCollectionErr
}
// CollectWithRetry decorates the Collect method with retry mechanism.
func (p *HANAInstanceProperties) CollectWithRetry(ctx context.Context) ([]*mrpb.TimeSeries, error) {
var (
attempt = 1
res []*mrpb.TimeSeries
)
err := backoff.Retry(func() error {
var err error
select {
case <-ctx.Done():
log.CtxLogger(ctx).Debugw("Context cancelled, exiting CollectWithRetry", "InstanceId", p.SAPInstance.GetInstanceId())
return nil
default:
res, err = p.Collect(ctx)
if err != nil {
log.CtxLogger(ctx).Debugw("Error in Collection", "attempt", attempt, "error", err)
attempt++
}
return err
}
}, p.PMBackoffPolicy)
if err != nil {
log.CtxLogger(ctx).Debugw("Retry limit exceeded", "InstanceId", p.SAPInstance.GetInstanceId())
}
return res, err
}