internal/processmetrics/netweaver/netweaver.go

/* Copyright 2022 Google LLC Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at https://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ // Package netweaver contains functions that gather SAP NetWeaver system metrics for the SAP agent. package netweaver import ( "bufio" "context" "fmt" "io" "net/http" "regexp" "strconv" "strings" "time" "github.com/cenkalti/backoff/v4" "github.com/GoogleCloudPlatform/sapagent/internal/processmetrics/sapcontrol" "github.com/GoogleCloudPlatform/sapagent/internal/sapcontrolclient" "github.com/GoogleCloudPlatform/sapagent/internal/utils/protostruct" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/cloudmonitoring" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/commandlineexecutor" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/log" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/metricevents" "github.com/GoogleCloudPlatform/workloadagentplatform/sharedlibraries/timeseries" mrpb "google.golang.org/genproto/googleapis/monitoring/v3" tspb "google.golang.org/protobuf/types/known/timestamppb" cnfpb "github.com/GoogleCloudPlatform/sapagent/protos/configuration" sapb "github.com/GoogleCloudPlatform/sapagent/protos/sapapp" ) type ( // InstanceProperties struct has necessary context for Metrics collection. InstanceProperties struct { SAPInstance *sapb.SAPInstance Config *cnfpb.Configuration Client cloudmonitoring.TimeSeriesCreator SkippedMetrics map[string]bool PMBackoffPolicy backoff.BackOffContext } ) // Netweaver system availability. const ( systemAtLeastOneProcessNotGreen = 0 systemAllProcessesGreen = 1 ) const ( metricURL = "workload.googleapis.com" nwServicePath = "/sap/nw/service" nwICMRCodePath = "/sap/nw/icm/rcode" nwICMRTimePath = "/sap/nw/icm/rtime" nwMSResponseCodePath = "/sap/nw/ms/rcode" nwMSResponseTimePath = "/sap/nw/ms/rtime" nwMSWorkProcessesPath = "/sap/nw/ms/wp" nwABAPProcBusyPath = "/sap/nw/abap/proc/busy" nwABAPProcCountPath = "/sap/nw/abap/proc/count" nwABAPProcUtilPath = "/sap/nw/abap/proc/utilization" nwABAPProcQueueCurrentPath = "/sap/nw/abap/queue/current" nwABAPProcQueuePeakPath = "/sap/nw/abap/queue/peak" nwABAPSessionsPath = "/sap/nw/abap/sessions" nwABAPRFCPath = "/sap/nw/abap/rfc" nwEnqLocksPath = "/sap/nw/enq/locks/usercountowner" nwInstanceRolePath = "/sap/nw/instance/role" ) var ( msWorkProcess = regexp.MustCompile(`LB=([0-9]+)`) // regex for finding application processes // Matching groups: // 1. Process name // 2. SID // 3. Instance type // 4. Instance number // 5. Profile path root // 6. SID // 7. SID // 8. Instance type // 9. Instance number // 10. Instance name appProcessRegex = regexp.MustCompile(`(dw|enq|en|enqr|er|jc|ms)\.sap([A-Za-z][A-Za-z0-9]{2})_(D|ASCS|ERS|SCS|J)([0-9]{2}) pf=/(usr/sap|sapmnt)/([A-Za-z][A-Za-z0-9]{2})/SYS/profile/([A-Za-z][A-Za-z0-9]{2})_(D|ASCS|SCS|ERS|J)([0-9]{2})_(.*)`) ) // Collect is Netweaver implementation of Collector interface from processmetrics.go. // Returns a list of NetWeaver related metrics. // Collect method keeps on collecting all the metrics it can, logs errors if it encounters // any and returns the collected metrics with the last error encountered while collecting metrics. func (p *InstanceProperties) Collect(ctx context.Context) ([]*mrpb.TimeSeries, error) { scc := sapcontrolclient.New(p.SAPInstance.GetInstanceNumber()) var metricsCollectionError error metrics, err := collectNetWeaverMetrics(ctx, p, scc) if err != nil { metricsCollectionError = err } httpMetrics, err := collectHTTPMetrics(ctx, p) if err != nil { metricsCollectionError = err } if httpMetrics != nil { metrics = append(metrics, httpMetrics...) } abapProcessStatusMetrics, err := collectABAPProcessStatus(ctx, p, scc) if err != nil { metricsCollectionError = err } if abapProcessStatusMetrics != nil { metrics = append(metrics, abapProcessStatusMetrics...) } abapQueueStats, err := collectABAPQueueStats(ctx, p, scc) if err != nil { metricsCollectionError = err } if abapQueueStats != nil { metrics = append(metrics, abapQueueStats...) } dpmonPath := `/usr/sap/` + p.SAPInstance.GetSapsid() + `/SYS/exe/run/dpmon` command := `-c 'echo q | %s pf=%s v'` abapSessionParams := commandlineexecutor.Params{ User: p.SAPInstance.GetUser(), Executable: "bash", ArgsToSplit: fmt.Sprintf(command, dpmonPath, p.SAPInstance.GetProfilePath()), Env: []string{ "PATH=$PATH:" + p.SAPInstance.GetLdLibraryPath(), "LD_LIBRARY_PATH=" + p.SAPInstance.GetLdLibraryPath(), }, } abapSessionStats, err := collectABAPSessionStats(ctx, p, commandlineexecutor.ExecuteCommand, abapSessionParams) if err != nil { metricsCollectionError = err } if abapSessionStats != nil { metrics = append(metrics, abapSessionStats...) } command = `-c 'echo q | %s pf=%s c'` abapRFCParams := commandlineexecutor.Params{ User: p.SAPInstance.GetUser(), Executable: "bash", ArgsToSplit: fmt.Sprintf(command, dpmonPath, p.SAPInstance.GetProfilePath()), Env: []string{ "PATH=$PATH:" + p.SAPInstance.GetLdLibraryPath(), "LD_LIBRARY_PATH=" + p.SAPInstance.GetLdLibraryPath(), }, } rffcConnectionsMetric, err := collectRFCConnections(ctx, p, commandlineexecutor.ExecuteCommand, abapRFCParams) if err != nil { metricsCollectionError = err } if rffcConnectionsMetric != nil { metrics = append(metrics, rffcConnectionsMetric...) } enqLockParams := commandlineexecutor.Params{ User: p.SAPInstance.GetUser(), Executable: p.SAPInstance.GetSapcontrolPath(), ArgsToSplit: fmt.Sprintf("-nr %s -function EnqGetLockTable", p.SAPInstance.GetInstanceNumber()), Env: []string{"LD_LIBRARY_PATH=" + p.SAPInstance.GetLdLibraryPath()}, } enqLockMetrics, err := collectEnqLockMetrics(ctx, p, commandlineexecutor.ExecuteCommand, enqLockParams, scc) if err != nil { metricsCollectionError = err } if enqLockMetrics != nil { metrics = append(metrics, enqLockMetrics...) } roleMetrics, err := collectRoleMetrics(ctx, p, commandlineexecutor.ExecuteCommand) if err != nil { log.CtxLogger(ctx).Debugw("Error in collecting role metrics", "error", err) metricsCollectionError = err } if roleMetrics != nil { metrics = append(metrics, roleMetrics) } return metrics, metricsCollectionError } // CollectWithRetry decorates the Collect method with retry mechanism. func (p *InstanceProperties) CollectWithRetry(ctx context.Context) ([]*mrpb.TimeSeries, error) { var ( attempt = 1 res []*mrpb.TimeSeries ) err := backoff.Retry(func() error { select { case <-ctx.Done(): log.CtxLogger(ctx).Info("Process metrics context cancelled, exiting collectAndSend.") return nil default: log.CtxLogger(ctx).Debugw("Attempting collector retry", "attempt", attempt) var err error res, err = p.Collect(ctx) if err != nil { log.CtxLogger(ctx).Debugw("Error in Collection", "attempt", attempt, "error", err) attempt++ } return err } }, p.PMBackoffPolicy) if err != nil { log.CtxLogger(ctx).Debugw("Retry limit exceeded", "InstanceId", p.SAPInstance.GetInstanceId(), "error", err) } log.CtxLogger(ctx).Debugw("Collected netweaver metrics", "metrics", res) return res, err } // collectNetWeaverMetrics builds a slice of SAP metrics containing all relevant NetWeaver metrics func collectNetWeaverMetrics(ctx context.Context, p *InstanceProperties, scc sapcontrol.ClientInterface) ([]*mrpb.TimeSeries, error) { if _, ok := p.SkippedMetrics[nwServicePath]; ok { return nil, nil } now := tspb.Now() sc := &sapcontrol.Properties{Instance: p.SAPInstance} var ( err error procs map[int]*sapcontrol.ProcessStatus ) procs, err = sc.GetProcessList(ctx, scc) if err != nil { log.CtxLogger(ctx).Debugw("Error performing GetProcessList web method", log.Error(err)) labels := map[string]string{"instance_type": p.SAPInstance.GetKind().String()} metric := createMetrics(p, nwServicePath, labels, now, systemAtLeastOneProcessNotGreen) log.CtxLogger(ctx).Debugw("Sending default /nw/service metric", "metric", metric) return []*mrpb.TimeSeries{metric}, err } metrics := collectServiceMetrics(ctx, p, procs, now) return metrics, nil } // collectServiceMetrics collects NetWeaver "service" metrics describing Netweaver service // processes as managed by the sapcontrol program. func collectServiceMetrics(ctx context.Context, p *InstanceProperties, procs map[int]*sapcontrol.ProcessStatus, now *tspb.Timestamp) (metrics []*mrpb.TimeSeries) { start := tspb.Now() for _, proc := range procs { instanceType := p.SAPInstance.GetKind().String() switch proc.Name { case "gwrd", "sapwebdisp": // For gwrd or web dispatcher process running on another instance, categorize it as "APP" instanceType = sapb.InstanceKind_APP.String() } extraLabels := map[string]string{ "service_name": proc.Name, "instance_type": instanceType, } value := boolToInt64(proc.IsGreen) log.CtxLogger(ctx).Debugw("Creating metrics for process", "metric", nwServicePath, "process", proc.Name, "instanceid", p.SAPInstance.GetInstanceId(), "value", value) metricevents.AddEvent(ctx, metricevents.Parameters{ Path: metricURL + nwServicePath, Message: fmt.Sprintf("NetWeaver service process status for process %s", proc.Name), Value: strconv.FormatInt(value, 10), Labels: metricLabels(p, extraLabels), Identifier: proc.Name, }) metrics = append(metrics, createMetrics(p, nwServicePath, extraLabels, now, value)) } log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectServiceMetrics()", "time", time.Since(start.AsTime())) return metrics } // collectHTTPMetrics collects the HTTP health check metrics for different types of // Netweaver instances based on their types. func collectHTTPMetrics(ctx context.Context, p *InstanceProperties) ([]*mrpb.TimeSeries, error) { url := p.SAPInstance.GetNetweaverHealthCheckUrl() if url == "" { log.CtxLogger(ctx).Debugw("SAP Instance HTTP health check URL is empty", "instanceid", p.SAPInstance.GetInstanceId(), "url", url) return nil, fmt.Errorf("SAP Instance HTTP health check URL is empty %s", p.SAPInstance.GetInstanceId()) } log.CtxLogger(ctx).Debugw("SAP Instance HTTP health check", "instanceid", p.SAPInstance.GetInstanceId(), "url", url) switch strings.ToUpper(p.SAPInstance.GetServiceName()) { case "SAP-ICM-ABAP", "SAP-ICM-JAVA": return collectICMMetrics(ctx, p, url) case "SAP-CS": return collectMessageServerMetrics(ctx, p, url) default: log.CtxLogger(ctx).Debugw("unsupported service name", "serviceName", p.SAPInstance.GetServiceName()) return nil, fmt.Errorf("unsupported service name: %s", p.SAPInstance.GetServiceName()) } } // collectICMMetrics makes HTTP GET request on given URL. // Returns metrics built using: // - HTTP response code. // - Total time taken by the request. func collectICMMetrics(ctx context.Context, p *InstanceProperties, url string) ([]*mrpb.TimeSeries, error) { // Since these metrics are derived from the same operation, even if one of the metric is skipped the whole group will be skipped from collection. if _, ok := p.SkippedMetrics[nwICMRCodePath]; ok { return nil, nil } now := tspb.Now() response, err := http.Get(url) timeTaken := time.Since(now.AsTime()) if err != nil { log.CtxLogger(ctx).Debugw("HTTP GET failed", "instanceid", p.SAPInstance.GetInstanceId(), "url", url, "error", err) return nil, err } defer response.Body.Close() extraLabels := map[string]string{"service_name": p.SAPInstance.GetServiceName()} log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectICMMetrics", "time", time.Since(now.AsTime())) return []*mrpb.TimeSeries{ createMetrics(p, nwICMRCodePath, extraLabels, now, int64(response.StatusCode)), createMetrics(p, nwICMRTimePath, extraLabels, now, timeTaken.Milliseconds()), }, nil } // collectMessageServerMetrics uses HTTP GET on given URL to collect message server metrics. // Returns // - Two metrics - HTTP response code and response time for all HTTP status codes. // - Additional work process count as reported by the message server info page on StatusOK(200). // - A nil in case of errors in HTTP GET request failures. func collectMessageServerMetrics(ctx context.Context, p *InstanceProperties, url string) ([]*mrpb.TimeSeries, error) { // Since these metrics are derived from the same operation, even if one of the metric is skipped the whole group will be skipped from collection. if _, ok := p.SkippedMetrics[nwMSResponseCodePath]; ok { return nil, nil } now := tspb.Now() response, err := http.Get(url) timeTaken := time.Since(now.AsTime()) if err != nil { log.CtxLogger(ctx).Debugw("HTTP GET failed", "instanceid", p.SAPInstance.GetInstanceId(), "url", url, "error", err) return nil, err } defer response.Body.Close() extraLabels := map[string]string{"service_name": p.SAPInstance.GetServiceName()} metrics := []*mrpb.TimeSeries{ createMetrics(p, nwMSResponseCodePath, extraLabels, now, int64(response.StatusCode)), createMetrics(p, nwMSResponseTimePath, extraLabels, now, timeTaken.Milliseconds()), } if response.StatusCode != http.StatusOK { log.CtxLogger(ctx).Debugw("HTTP GET failed", "statuscode", response.StatusCode, "response", response) log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectMessageServerMetrics()", "time", time.Since(now.AsTime())) return nil, fmt.Errorf("HTTP GET failed code: %d", response.StatusCode) } workProcessCount, err := parseWorkProcessCount(response.Body) if err != nil { log.CtxLogger(ctx).Debugw("Reading work process count from message server info page failed", "error", err) return nil, err } log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectMessageServerMetrics()", "time", time.Since(now.AsTime())) return append(metrics, createMetrics(p, nwMSWorkProcessesPath, extraLabels, now, int64(workProcessCount))), nil } // parseWorkProcessCount processes the HTTP text/plain response body one line at a time // to find the message server work process count. // Returns the work process count on success, an error on failures. func parseWorkProcessCount(r io.ReadCloser) (count int, err error) { scanner := bufio.NewScanner(r) // NOMUTANTS--cannot test if text is or is not read one line at a time. scanner.Split(bufio.ScanLines) for scanner.Scan() { if match := msWorkProcess.FindStringSubmatch(scanner.Text()); len(match) == 2 { if count, err = strconv.Atoi(match[1]); err != nil { return 0, err } return count, nil } } return 0, fmt.Errorf("work process count not found") } // collectABAPProcessStatus collects the ABAP worker process status metrics. func collectABAPProcessStatus(ctx context.Context, p *InstanceProperties, scc sapcontrol.ClientInterface) ([]*mrpb.TimeSeries, error) { now := tspb.Now() // Since these metrics are derived from the same operation, even if one of the metric is skipped the whole group will be skipped from collection. skipABAPProcessStatus := p.SkippedMetrics[nwABAPProcCountPath] || p.SkippedMetrics[nwABAPProcBusyPath] || p.SkippedMetrics[nwABAPProcUtilPath] if skipABAPProcessStatus { return nil, nil } sc := &sapcontrol.Properties{Instance: p.SAPInstance} var ( err error processCount map[string]int busyProcessCount map[string]int busyPercentage map[string]int ) wpDetails, err := sc.ABAPGetWPTable(ctx, scc) if err != nil { log.CtxLogger(ctx).Debugw("Sapcontrol web method failed", "error", err) return nil, err } processCount = wpDetails.Processes busyProcessCount = wpDetails.BusyProcesses busyPercentage = wpDetails.BusyProcessPercentage var metrics []*mrpb.TimeSeries for k, v := range processCount { extraLabels := map[string]string{"abap_process": k} log.CtxLogger(ctx).Debugw("Creating metric for abap_process", "metric", nwABAPProcCountPath, "abapprocess", k, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", v) metrics = append(metrics, createMetrics(p, nwABAPProcCountPath, extraLabels, now, int64(v))) } for k, v := range busyProcessCount { extraLabels := map[string]string{"abap_process": k} log.CtxLogger(ctx).Debugw("Creating metric for abap_process", "metric", nwABAPProcBusyPath, "abapprocess", k, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", v) metrics = append(metrics, createMetrics(p, nwABAPProcBusyPath, extraLabels, now, int64(v))) } for k, v := range busyPercentage { extraLabels := map[string]string{"abap_process": k} log.CtxLogger(ctx).Debugw("Creating metric for abap_process", "metric", nwABAPProcUtilPath, "abapprocess", k, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", v) metrics = append(metrics, createMetrics(p, nwABAPProcUtilPath, extraLabels, now, int64(v))) } log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectABAPProcessStatus()", "time", time.Since(now.AsTime())) return metrics, nil } // collectABAPQueueStats collects ABAP Queue utilization metrics using dpmon tool. func collectABAPQueueStats(ctx context.Context, p *InstanceProperties, scc sapcontrol.ClientInterface) ([]*mrpb.TimeSeries, error) { now := tspb.Now() // Since these metrics are derived from the same operation, even if one of the metric is skipped the whole group will be skipped from collection. skipABAPQueue := p.SkippedMetrics[nwABAPProcQueueCurrentPath] || p.SkippedMetrics[nwABAPProcQueuePeakPath] if skipABAPQueue { return nil, nil } sc := &sapcontrol.Properties{Instance: p.SAPInstance} var ( err error currentQueueUsage map[string]int64 peakQueueUsage map[string]int64 ) currentQueueUsage, peakQueueUsage, err = sc.GetQueueStatistic(ctx, scc) if err != nil { log.CtxLogger(ctx).Debugw("Sapcontrol web method failed", "error", err) return nil, err } var metrics []*mrpb.TimeSeries for k, v := range currentQueueUsage { extraLabels := map[string]string{"abap_queue": k} log.CtxLogger(ctx).Debugw("Creating metric with labels", "metric", nwABAPProcQueueCurrentPath, "labels", extraLabels, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", v) metrics = append(metrics, createMetrics(p, nwABAPProcQueueCurrentPath, extraLabels, now, int64(v))) } for k, v := range peakQueueUsage { extraLabels := map[string]string{"abap_queue_peak": k} log.CtxLogger(ctx).Debugw("Creating metric with labels", "metric", nwABAPProcQueueCurrentPath, "labels", extraLabels, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", v) metrics = append(metrics, createMetrics(p, nwABAPProcQueuePeakPath, extraLabels, now, int64(v))) } log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectABAPQueueStats()", "time", time.Since(now.AsTime())) return metrics, nil } // collectABAPSessionStats collects ABAP session related metrics using dpmon tool. func collectABAPSessionStats(ctx context.Context, p *InstanceProperties, exec commandlineexecutor.Execute, params commandlineexecutor.Params) ([]*mrpb.TimeSeries, error) { now := tspb.Now() if _, ok := p.SkippedMetrics[nwABAPSessionsPath]; ok { return nil, nil } results := exec(ctx, params) log.CtxLogger(ctx).Debugw("DPMON for sessionStat output", "stdout", results.StdOut, "stderr", results.StdErr, "exitcode", results.ExitCode, "error", results.Error) if results.Error != nil { log.CtxLogger(ctx).Debugw("DPMON failed", log.Error(results.Error)) return nil, results.Error } var metrics []*mrpb.TimeSeries sessionCounts, totalCount, err := parseABAPSessionStats(results.StdOut) if err != nil { log.CtxLogger(ctx).Debugw("DPMON ran successfully, but no ABAP session currently active", log.Error(err)) return nil, err } for k, v := range sessionCounts { extraLabels := map[string]string{"abap_session_type": k} log.CtxLogger(ctx).Debugw("Creating metric with labels", "metric", nwABAPSessionsPath, "labels", extraLabels, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", v) metrics = append(metrics, createMetrics(p, nwABAPSessionsPath, extraLabels, now, int64(v))) } extraLabels := map[string]string{"abap_session_type": "total_count"} log.CtxLogger(ctx).Debugw("Creating metric with labels", "metric", nwABAPSessionsPath, "labels", extraLabels, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", totalCount) metrics = append(metrics, createMetrics(p, nwABAPSessionsPath, extraLabels, now, int64(totalCount))) log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectABAPSessionStats()", "time", time.Since(now.AsTime())) return metrics, nil } // collectRFCConnections collects the ABAP RFC connection metrics using dpmon tool. func collectRFCConnections(ctx context.Context, p *InstanceProperties, exec commandlineexecutor.Execute, params commandlineexecutor.Params) ([]*mrpb.TimeSeries, error) { now := tspb.Now() if _, ok := p.SkippedMetrics[nwABAPRFCPath]; ok { return nil, nil } result := exec(ctx, params) log.CtxLogger(ctx).Debugw("DPMON for RFC output", "stdout", result.StdOut, "stderr", result.StdErr, "exitcode", result.ExitCode, "error", result.Error) if result.Error != nil { log.CtxLogger(ctx).Debugw("DPMON for RFC failed", log.Error(result.Error)) return nil, result.Error } var metrics []*mrpb.TimeSeries rfcStateCount := parseRFCStats(result.StdOut) for k, v := range rfcStateCount { extraLabels := map[string]string{"abap_rfc_conn": k} log.CtxLogger(ctx).Debugw("Creating metric with labels", "metric", nwABAPRFCPath, "labels", extraLabels, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", v) metrics = append(metrics, createMetrics(p, nwABAPRFCPath, extraLabels, now, int64(v))) } log.CtxLogger(ctx).Debugw("Time taken to collect metrics in collectRFCConnections()", "time", time.Since(now.AsTime())) return metrics, nil } // collectEnqLockMetrics builds Enq Locks for SAP Netweaver ASCS instances. func collectEnqLockMetrics(ctx context.Context, p *InstanceProperties, exec commandlineexecutor.Execute, params commandlineexecutor.Params, scc sapcontrol.ClientInterface) ([]*mrpb.TimeSeries, error) { if _, ok := p.SkippedMetrics[nwEnqLocksPath]; ok { return nil, nil } instance := p.SAPInstance.GetInstanceId() if !strings.HasPrefix(instance, "ASCS") && !strings.HasPrefix(instance, "ERS") { log.CtxLogger(ctx).Debugw("The Enq Lock metric is only applicable for application type: ASCS.", "InstanceID", p.SAPInstance.InstanceId) return nil, nil } now := tspb.Now() sc := &sapcontrol.Properties{Instance: p.SAPInstance} var enqLocks []*sapcontrol.EnqLock var err error enqLocks, err = sc.EnqGetLockTable(ctx, scc) if err != nil { return nil, err } var metrics []*mrpb.TimeSeries for _, lock := range enqLocks { extraLabels := map[string]string{ "lock_name": lock.LockName, "lock_arg": lock.LockArg, "lock_mode": lock.LockMode, "owner": lock.Owner, "owner_vb": lock.OwnerVB, "user_count_owner": fmt.Sprintf("%d", lock.UserCountOwner), "user_count_owner_vb": fmt.Sprintf("%d", lock.UserCountOwnerVB), "client": lock.Client, "user": lock.User, "transaction": lock.Transaction, "object": lock.Object, "backup": lock.Backup, } log.CtxLogger(ctx).Debugw("Creating metric with labels", "metric", nwEnqLocksPath, "labels", extraLabels, "instancenumber", p.SAPInstance.GetInstanceNumber(), "value", lock.UserCountOwner) metrics = append(metrics, createMetrics(p, nwEnqLocksPath, extraLabels, now, lock.UserCountOwner)) } return metrics, nil } func collectRoleMetrics(ctx context.Context, p *InstanceProperties, exec commandlineexecutor.Execute) (*mrpb.TimeSeries, error) { params := commandlineexecutor.Params{ Executable: "ps", Args: []string{"-ef"}, } result := exec(ctx, params) if result.Error != nil { return nil, result.Error } roles := map[string]string{ "ascs": "false", "ers": "false", "app": "false", } hasRole := false hasEnq := false hasMS := false lines := strings.Split(result.StdOut, "\n") for _, line := range lines { matches := appProcessRegex.FindStringSubmatch(line) log.CtxLogger(ctx).Debugw("Line", "line", line, "matches", matches) if len(matches) < 3 { continue } bin := matches[1] sid := strings.ToUpper(matches[2]) if sid != p.SAPInstance.GetSapsid() { continue } switch bin { case "enqr", "er": log.CtxLogger(ctx).Debugw("Found enqr or er", "bin", bin) roles["ers"] = "true" hasRole = true case "ms": log.CtxLogger(ctx).Debugw("Found ms", "bin", bin) hasMS = true hasRole = true case "enq", "en": log.CtxLogger(ctx).Debugw("Found enq or en", "bin", bin) hasEnq = true hasRole = true case "dw", "jc": log.CtxLogger(ctx).Debugw("Found dw or jc", "bin", bin) roles["app"] = "true" hasRole = true } } if hasMS && hasEnq { log.CtxLogger(ctx).Debugw("Found both ms and enq.", "hasMS", hasMS, "hasEnq", hasEnq) roles["ascs"] = "true" hasRole = true } if !hasRole { return nil, nil } return createMetrics(p, nwInstanceRolePath, roles, tspb.Now(), 1), nil } // createMetrics - create mrpb.TimeSeries object for the given metric. func createMetrics(p *InstanceProperties, mPath string, extraLabels map[string]string, now *tspb.Timestamp, val int64) *mrpb.TimeSeries { params := timeseries.Params{ CloudProp: protostruct.ConvertCloudPropertiesToStruct(p.Config.CloudProperties), MetricType: metricURL + mPath, MetricLabels: metricLabels(p, extraLabels), Timestamp: now, Int64Value: val, BareMetal: p.Config.BareMetal, } return timeseries.BuildInt(params) } // metricLabels appends the default SAP Instance labels and extra labels // to return a consolidated map of metric labels. func metricLabels(p *InstanceProperties, extraLabels map[string]string) map[string]string { defaultLabels := map[string]string{ "sid": p.SAPInstance.GetSapsid(), "instance_nr": p.SAPInstance.GetInstanceNumber(), "instance_name": p.Config.CloudProperties.InstanceName, } for k, v := range extraLabels { defaultLabels[k] = v } return defaultLabels } // contains checks if a string slice contains a given string. func contains(list []string, s string) bool { for _, t := range list { if s == t { return true } } return false } // boolToInt64 converts bool to int64. func boolToInt64(b bool) int64 { if b { return 1 } return 0 }

internal/processmetrics/netweaver/netweaver.go (561 lines of code) (raw):