forked from GoogleCloudPlatform/python-docs-samples
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdlp_inspect_text_file.py
More file actions
60 lines (51 loc) · 1.92 KB
/
dlp_inspect_text_file.py
File metadata and controls
60 lines (51 loc) · 1.92 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
# Copyright 2018 Google Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import sys
# [START dlp_inspect_text_file]
# Import the Google Cloud Data Loss Prevention library
import google.cloud.dlp
def inspect_text_file(
        project_id='YOUR_PROJECT_ID',
        file_path='path/to/file.txt'):
    """Scan a local file with the DLP client and print what it finds.

    The file is read as raw bytes and submitted as a ``TEXT_UTF8`` byte
    item. The request asks for phone numbers, email addresses and credit
    card numbers, and asks for the matching text to be returned with each
    finding.

    Args:
        project_id: Project identifier handed to ``project_path`` to build
            the request parent.
        file_path: Path of the file whose contents are inspected.

    Returns:
        None. For every finding the quote, info type name and likelihood
        are printed; when there are no findings, 'No findings.' is
        printed instead.
    """
    # Instantiate a client
    client = google.cloud.dlp.DlpServiceClient()

    # Get the bytes of the file (binary mode: no text decoding is done here)
    with open(file_path, mode='rb') as source:
        payload = source.read()

    # Construct request
    parent = client.project_path(project_id)
    byte_item = {'type': 'TEXT_UTF8', 'data': payload}
    # The infoTypes of information to match
    info_types = [
        {'name': type_name}
        for type_name in (
            'PHONE_NUMBER',
            'EMAIL_ADDRESS',
            'CREDIT_CARD_NUMBER',
        )
    ]
    inspect_config = {
        'info_types': info_types,
        # Whether to include the matching string
        'include_quote': True,
    }

    # Run request
    response = client.inspect_content(
        parent, inspect_config, {'byte_item': byte_item})

    # Print the results
    findings = response.result.findings
    if not findings:
        print('No findings.')
        return

    for match in findings:
        print('Quote: {}'.format(match.quote))
        print('Info type: {}'.format(match.info_type.name))
        print('Likelihood: {}'.format(match.likelihood))
# [END dlp_inspect_text_file]
if __name__ == '__main__':
    # Usage: python dlp_inspect_text_file.py <project_id> <file_path>
    # Both positional arguments are required; extra arguments are ignored.
    cli_project_id = sys.argv[1]
    cli_file_path = sys.argv[2]
    inspect_text_file(project_id=cli_project_id, file_path=cli_file_path)