@@ -75,6 +75,8 @@ class FileType(proto.Enum):
75
75
AVRO = 7
76
76
CSV = 8
77
77
TSV = 9
78
+ POWERPOINT = 11
79
+ EXCEL = 12
78
80
79
81
80
82
class InfoType (proto .Message ):
@@ -188,23 +190,20 @@ class Dictionary(proto.Message):
188
190
Plane <https://en.wikipedia.org/wiki/Plane_%28Unicode%29#Basic_Multilingual_Plane>`__
189
191
will be replaced with whitespace when scanning for matches, so the
190
192
dictionary phrase "Sam Johnson" will match all three phrases "sam
191
- johnson",
192
- Plane](https://en.wikipedia.org/wiki/Plane_%28Unicode%29#Basic_Multilingual_Plane)
193
- surrounding any match must be of a different type than the adjacent
194
- characters within the word, so letters must be next to non-letters
195
- and digits next to non-digits. For example, the dictionary word
196
- "jen" will match the first three letters of the text "jen123" but
197
- will return no matches for "jennifer".
193
+ johnson", "Sam, Johnson", and "Sam (Johnson)". Additionally, the
194
+ characters surrounding any match must be of a different type than
195
+ the adjacent characters within the word, so letters must be next to
196
+ non-letters and digits next to non-digits. For example, the
197
+ dictionary word "jen" will match the first three letters of the text
198
+ "jen123" but will return no matches for "jennifer".
198
199
199
200
Dictionary words containing a large number of characters that are
200
201
not letters or digits may result in unexpected findings because such
201
202
characters are treated as whitespace. The
202
203
`limits <https://cloud.google.com/dlp/limits>`__ page contains
203
204
details about the size limits of dictionaries. For dictionaries that
204
205
do not fit within these constraints, consider using
205
- ``LargeCustomDictionaryConfig`` in the
206
- `limits <https://cloud.google.com/dlp/limits>`__ page contains
207
- details about
206
+ ``LargeCustomDictionaryConfig`` in the ``StoredInfoType`` API.
208
207
209
208
This message has `oneof`_ fields (mutually exclusive fields).
210
209
For each oneof, at most one member field can be set at the same time.
@@ -260,11 +259,9 @@ class Regex(proto.Message):
260
259
be found under the google/re2 repository on
261
260
GitHub.
262
261
group_indexes (Sequence[int]):
263
- (https://github.com/google/re2/wiki/Syntax)
264
- can be found under the The index of the submatch
265
- to extract as findings. When not specified, the
266
- entire match is returned. No more than 3 may be
267
- included.
262
+ The index of the submatch to extract as
263
+ findings. When not specified, the entire match
264
+ is returned. No more than 3 may be included.
268
265
"""
269
266
270
267
pattern = proto .Field (proto .STRING , number = 1 ,)
@@ -275,10 +272,10 @@ class SurrogateType(proto.Message):
275
272
such as
276
273
`CryptoReplaceFfxFpeConfig <https://cloud.google.com/dlp/docs/reference/rest/v2/organizations.deidentifyTemplates#cryptoreplaceffxfpeconfig>`__.
277
274
These types of transformations are those that perform
278
- pseudonymization, thereby producing a "surrogate" as
279
- ```CryptoReplaceFfxFpeConfig`` <https://cloud.google.com/dlp/docs/reference/rest/v2/organizations.deidentifyTemplates#cryptoreplaceffxfpeconfig>`__.
280
- transformation such as ``surrogate_info_type``. This CustomInfoType
281
- does not support the use of ``detection_rules``.
275
+ pseudonymization, thereby producing a "surrogate" as output. This
276
+ should be used in conjunction with a field on the transformation
277
+ such as ``surrogate_info_type``. This CustomInfoType does not
278
+ support the use of ``detection_rules``.
282
279
283
280
"""
284
281
@@ -527,11 +524,9 @@ class CloudStorageRegexFileSet(proto.Message):
527
524
guide can be found under the google/re2 repository on
528
525
GitHub.
529
526
exclude_regex (Sequence[str]):
530
- `syntax <https://github.com/google/re2/wiki/Syntax>`__; a
531
- guide can be found A list of regular expressions matching
532
- file paths to exclude. All files in the bucket that match at
533
- least one of these regular expressions will be excluded from
534
- the scan.
527
+ A list of regular expressions matching file paths to
528
+ exclude. All files in the bucket that match at least one of
529
+ these regular expressions will be excluded from the scan.
535
530
536
531
Regular expressions use RE2
537
532
`syntax <https://github.com/google/re2/wiki/Syntax>`__; a
0 commit comments