dlp/snippets/inspect/inspect_string_excluding_substring.go (83 lines of code) (raw):

// Copyright 2023 Google LLC // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // https://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package inspect // [START dlp_inspect_string_custom_excluding_substring] import ( "context" "fmt" "io" dlp "cloud.google.com/go/dlp/apiv2" "cloud.google.com/go/dlp/apiv2/dlppb" ) // inspectStringCustomExcludingSubstring inspects a string for sensitive data, excluding a custom substring func inspectStringCustomExcludingSubstring(w io.Writer, projectID, textToInspect, customDetectorPattern string, excludedSubstringList []string) error { // projectId := "your-project-id" // textToInspect := "Name: Doe, John. Name: Example, Jimmy" // customDetectorPattern := "[A-Z][a-z]{1,15}, [A-Z][a-z]{1,15}" // excludedSubstringList := []string{"Jimmy"} ctx := context.Background() // Initialize a client once and reuse it to send multiple requests. Clients // are safe to use across goroutines. When the client is no longer needed, // call the Close method to cleanup its resources. client, err := dlp.NewClient(ctx) if err != nil { return err } // Closing the client safely cleans up background resources. defer client.Close() // Specify the type and content to be inspected. contentItem := &dlppb.ContentItem{ DataItem: &dlppb.ContentItem_ByteItem{ ByteItem: &dlppb.ByteContentItem{ Type: dlppb.ByteContentItem_TEXT_UTF8, Data: []byte(textToInspect), }, }, } // Specify the type of info the inspection will look for. infoType := &dlppb.InfoType{ Name: "CUSTOM_NAME_DETECTOR", } customInfotype := &dlppb.CustomInfoType{ InfoType: infoType, Type: &dlppb.CustomInfoType_Regex_{ Regex: &dlppb.CustomInfoType_Regex{ Pattern: customDetectorPattern, }, }, } // Exclude partial matches from the specified excludedSubstringList. exclusionRule := &dlppb.ExclusionRule{ Type: &dlppb.ExclusionRule_Dictionary{ Dictionary: &dlppb.CustomInfoType_Dictionary{ Source: &dlppb.CustomInfoType_Dictionary_WordList_{ WordList: &dlppb.CustomInfoType_Dictionary_WordList{ Words: excludedSubstringList, }, }, }, }, MatchingType: dlppb.MatchingType_MATCHING_TYPE_PARTIAL_MATCH, } // Construct a ruleset that applies the exclusion rule to the EMAIL_ADDRESSES infoType. ruleSet := &dlppb.InspectionRuleSet{ InfoTypes: []*dlppb.InfoType{ infoType, }, Rules: []*dlppb.InspectionRule{ { Type: &dlppb.InspectionRule_ExclusionRule{ ExclusionRule: exclusionRule, }, }, }, } // Construct the Inspect request to be sent by the client. req := &dlppb.InspectContentRequest{ Parent: fmt.Sprintf("projects/%s/locations/global", projectID), Item: contentItem, InspectConfig: &dlppb.InspectConfig{ CustomInfoTypes: []*dlppb.CustomInfoType{ customInfotype, }, IncludeQuote: true, RuleSet: []*dlppb.InspectionRuleSet{ ruleSet, }, }, } // Send the request. resp, err := client.InspectContent(ctx, req) if err != nil { return err } // Process the results. fmt.Fprintf(w, "Findings: %v\n", len(resp.Result.Findings)) for _, v := range resp.GetResult().Findings { fmt.Fprintf(w, "Quote: %v\n", v.GetQuote()) fmt.Fprintf(w, "Infotype Name: %v\n", v.GetInfoType().GetName()) fmt.Fprintf(w, "Likelihood: %v\n", v.GetLikelihood()) } return nil } // [END dlp_inspect_string_custom_excluding_substring]