Skip to content

Commit 64f7880

Browse files
Google APIs and copybara-github
authored and committed
docs: Regenerated REST and RPC Document AI documentation to include missing changes from September 2024 to November 2025
docs: Fixed language issues in multiple message field descriptions
PiperOrigin-RevId: 859310712
1 parent 3a1589f commit 64f7880

File tree

3 files changed

+48
-44
lines changed

3 files changed

+48
-44
lines changed

google/cloud/documentai/v1/document.proto

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1195,10 +1195,10 @@ message Document {
11951195
// entity extraction results at different stages of the processing.
11961196
repeated EntitiesRevision entities_revisions = 22;
11971197

1198-
// The entity revision id that `document.entities` field is based on.
1198+
// The entity revision ID that `document.entities` field is based on.
11991199
// If this field is set and `entities_revisions` is not empty, the entities in
12001200
// `document.entities` field are the entities in the entity revision with this
1201-
// id and `document.entity_validation_output` field is the
1201+
// ID and `document.entity_validation_output` field is the
12021202
// `entity_validation_output` field in this entity revision.
12031203
string entities_revision_id = 23;
12041204
}

google/cloud/documentai/v1beta3/document.proto

Lines changed: 42 additions & 40 deletions
Original file line numberDiff line numberDiff line change
@@ -180,9 +180,9 @@ message Document {
180180

181181
// Confidence of the current
182182
// [Layout][google.cloud.documentai.v1beta3.Document.Page.Layout] within
183-
// context of the object this layout is for. e.g. confidence can be for a
184-
// single token, a table, a visual element, etc. depending on context.
185-
// Range `[0, 1]`.
183+
// context of the object this layout is for. For example, confidence can
184+
// be for a single token, a table, a visual element, etc. depending on
185+
// context. Range `[0, 1]`.
186186
float confidence = 2;
187187

188188
// The bounding polygon for the
@@ -340,8 +340,8 @@ message Document {
340340
repeated DetectedLanguage detected_languages = 2;
341341
}
342342

343-
// Detected non-text visual elements e.g. checkbox, signature etc. on the
344-
// page.
343+
// Detected non-text visual elements, for example, checkbox, signature, etc.
344+
// on the page.
345345
message VisualElement {
346346
// [Layout][google.cloud.documentai.v1beta3.Document.Page.Layout] for
347347
// [VisualElement][google.cloud.documentai.v1beta3.Document.Page.VisualElement].
@@ -400,7 +400,8 @@ message Document {
400400
message FormField {
401401
// [Layout][google.cloud.documentai.v1beta3.Document.Page.Layout] for the
402402
// [FormField][google.cloud.documentai.v1beta3.Document.Page.FormField]
403-
// name. e.g. `Address`, `Email`, `Grand total`, `Phone number`, etc.
403+
// name. For example, `Address`, `Email`, `Grand total`, `Phone number`,
404+
// etc.
404405
Layout field_name = 1;
405406

406407
// [Layout][google.cloud.documentai.v1beta3.Document.Page.Layout] for the
@@ -529,7 +530,7 @@ message Document {
529530
// A list of visually detected tokens on the page.
530531
repeated Token tokens = 8;
531532

532-
// A list of detected non-text visual elements e.g. checkbox,
533+
// A list of detected non-text visual elements, for example, checkbox,
533534
// signature, etc. on the page.
534535
repeated VisualElement visual_elements = 9;
535536

@@ -627,10 +628,10 @@ message Document {
627628
// [Document.text][google.cloud.documentai.v1beta3.Document.text].
628629
TextAnchor text_anchor = 1 [(google.api.field_behavior) = OPTIONAL];
629630

630-
// Required. Entity type from a schema e.g. `Address`.
631+
// Required. Entity type from a schema, for example, `Address`.
631632
string type = 2 [(google.api.field_behavior) = REQUIRED];
632633

633-
// Optional. Text value of the entity e.g. `1600 Amphitheatre Pkwy`.
634+
// Optional. Text value of the entity, for example, `1600 Amphitheatre Pkwy`.
634635
string mention_text = 3 [(google.api.field_behavior) = OPTIONAL];
635636

636637
// Optional. Deprecated. Use `id` field instead.
@@ -643,14 +644,14 @@ message Document {
643644
// the page where it was found.
644645
PageAnchor page_anchor = 6 [(google.api.field_behavior) = OPTIONAL];
645646

646-
// Optional. Canonical id. This will be a unique value in the entity list
647+
// Optional. Canonical ID. This will be a unique value in the entity list
647648
// for this document.
648649
string id = 7 [(google.api.field_behavior) = OPTIONAL];
649650

650651
// Optional. Normalized entity value. Absent if the extracted value could
651-
// not be converted or the type (e.g. address) is not supported for certain
652-
// parsers. This field is also only populated for certain supported document
653-
// types.
652+
// not be converted or the type (for example, address) is not supported for
653+
// certain parsers. This field is also only populated for certain supported
654+
// document types.
654655
NormalizedValue normalized_value = 9
655656
[(google.api.field_behavior) = OPTIONAL];
656657

@@ -672,10 +673,10 @@ message Document {
672673
// Relationship between
673674
// [Entities][google.cloud.documentai.v1beta3.Document.Entity].
674675
message EntityRelation {
675-
// Subject entity id.
676+
// Subject entity ID.
676677
string subject_id = 1;
677678

678-
// Object entity id.
679+
// Object entity ID.
679680
string object_id = 2;
680681

681682
// Relationship description.
@@ -805,7 +806,7 @@ message Document {
805806
// of entities, properties within entities, etc.) in the parent revision.
806807
int32 index = 3;
807808

808-
// The id of the parent provenance.
809+
// The ID of the parent provenance.
809810
int32 id = 2 [deprecated = true];
810811
}
811812

@@ -845,7 +846,7 @@ message Document {
845846
// The index of the revision that produced this element.
846847
int32 revision = 1 [deprecated = true];
847848

848-
// The Id of this operation. Needs to be unique within the scope of the
849+
// The ID of this operation. Needs to be unique within the scope of the
849850
// revision.
850851
int32 id = 2 [deprecated = true];
851852

@@ -860,7 +861,7 @@ message Document {
860861
message Revision {
861862
// Human Review information of the document.
862863
message HumanReview {
863-
// Human review state. e.g. `requested`, `succeeded`, `rejected`.
864+
// Human review state. For example, `requested`, `succeeded`, `rejected`.
864865
string state = 1;
865866

866867
// A message providing more details about the current state of processing.
@@ -870,7 +871,7 @@ message Document {
870871

871872
// Who/what made the change
872873
oneof source {
873-
// If the change was made by a person specify the name or id of that
874+
// If the change was made by a person, specify the name or ID of that
874875
// person.
875876
string agent = 4;
876877

@@ -879,7 +880,7 @@ message Document {
879880
string processor = 5;
880881
}
881882

882-
// Id of the revision, internally generated by doc proto storage.
883+
// ID of the revision, internally generated by doc proto storage.
883884
// Unique within the context of the document.
884885
string id = 1;
885886

@@ -888,7 +889,7 @@ message Document {
888889
// index into the `revisions` field.
889890
repeated int32 parent = 2 [deprecated = true];
890891

891-
// The revisions that this revision is based on. Must include all the ids
892+
// The revisions that this revision is based on. Must include all the IDs
892893
// that have anything to do with this revision - for example, there are
893894
// `provenance.parent.revision` fields that index into this field.
894895
repeated string parent_ids = 7;
@@ -1012,18 +1013,18 @@ message Document {
10121013
message LayoutImageBlock {
10131014
// Source of the image.
10141015
oneof image_source {
1015-
// Optional. Asset id of the inline image. If set, find the image
1016+
// Optional. Asset ID of the inline image. If set, find the image
10161017
// content in the blob_assets field.
10171018
string blob_asset_id = 4 [(google.api.field_behavior) = OPTIONAL];
10181019

1019-
// Optional. Google Cloud Storage uri of the image.
1020+
// Optional. Google Cloud Storage URI of the image.
10201021
string gcs_uri = 5 [(google.api.field_behavior) = OPTIONAL];
10211022

1022-
// Optional. Data uri of the image.
1023+
// Optional. Data URI of the image.
10231024
// It is composed of four parts: a prefix (data:), a MIME type
10241025
// indicating the type of data, an optional base64 token if
10251026
// non-textual, and the data itself:
1026-
// data:[<mediatype>][;base64],<data>
1027+
// `data:[<mediatype>][;base64],<data>`.
10271028
string data_uri = 6 [(google.api.field_behavior) = OPTIONAL];
10281029
}
10291030

@@ -1102,18 +1103,18 @@ message Document {
11021103
message ImageChunkField {
11031104
// Source of the image.
11041105
oneof image_source {
1105-
// Optional. Asset id of the inline image. If set, find the image
1106+
// Optional. Asset ID of the inline image. If set, find the image
11061107
// content in the blob_assets field.
11071108
string blob_asset_id = 1 [(google.api.field_behavior) = OPTIONAL];
11081109

1109-
// Optional. Google Cloud Storage uri of the image.
1110+
// Optional. Google Cloud Storage URI of the image.
11101111
string gcs_uri = 2 [(google.api.field_behavior) = OPTIONAL];
11111112

1112-
// Optional. Data uri of the image.
1113+
// Optional. Data URI of the image.
11131114
// It is composed of four parts: a prefix (data:), a MIME type
11141115
// indicating the type of data, an optional base64 token if
11151116
// non-textual, and the data itself:
1116-
// data:[<mediatype>][;base64],<data>
1117+
// `data:[<mediatype>][;base64],<data>`.
11171118
string data_uri = 3 [(google.api.field_behavior) = OPTIONAL];
11181119
}
11191120

@@ -1128,7 +1129,7 @@ message Document {
11281129
}
11291130

11301131
// The chunk field in the chunk. A chunk field could be one of the various
1131-
// types (e.g. image, table) supported.
1132+
// types (for example, image, table) supported.
11321133
message ChunkField {
11331134
// The type of the chunk field.
11341135
oneof field_type {
@@ -1167,13 +1168,13 @@ message Document {
11671168
}
11681169

11691170
// Represents a blob asset. It's used to store the content of the inline blob
1170-
// in this document, e.g. image bytes, such that it can be referenced by
1171-
// other fields in the document via asset id.
1171+
// in this document, for example, image bytes, such that it can be referenced
1172+
// by other fields in the document via asset ID.
11721173
message BlobAsset {
1173-
// Optional. The id of the blob asset.
1174+
// Optional. The ID of the blob asset.
11741175
string asset_id = 1 [(google.api.field_behavior) = OPTIONAL];
11751176

1176-
// Optional. The content of the blob asset, e.g. image bytes.
1177+
// Optional. The content of the blob asset, for example, image bytes.
11771178
bytes content = 2 [(google.api.field_behavior) = OPTIONAL];
11781179

11791180
// The MIME type of the blob asset.
@@ -1228,7 +1229,7 @@ message Document {
12281229

12291230
// Entity revision.
12301231
message EntitiesRevision {
1231-
// The revision id.
1232+
// The revision ID.
12321233
string revision_id = 1;
12331234

12341235
// The entities in this revision.
@@ -1302,8 +1303,9 @@ message Document {
13021303
ChunkedDocument chunked_document = 18;
13031304

13041305
// Optional. The blob assets in this document. This is used to store the
1305-
// content of the inline blobs in this document, e.g. image bytes, such that
1306-
// it can be referenced by other fields in the document via asset id.
1306+
// content of the inline blobs in this document, for example, image bytes,
1307+
// such that it can be referenced by other fields in the document via asset
1308+
// ID.
13071309
repeated BlobAsset blob_assets = 19 [(google.api.field_behavior) = OPTIONAL];
13081310

13091311
// The entity validation output for the document. This is the validation
@@ -1315,10 +1317,10 @@ message Document {
13151317
// entity extraction results at different stages of the processing.
13161318
repeated EntitiesRevision entities_revisions = 22;
13171319

1318-
// The entity revision id that `document.entities` field is based on.
1320+
// The entity revision ID that `document.entities` field is based on.
13191321
// If this field is set and `entities_revisions` is not empty, the entities in
13201322
// `document.entities` field are the entities in the entity revision with this
1321-
// id and `document.entity_validation_output` field is the
1323+
// ID and `document.entity_validation_output` field is the
13221324
// `entity_validation_output` field in this entity revision.
13231325
string entities_revision_id = 23;
13241326
}
@@ -1345,7 +1347,7 @@ message RevisionRef {
13451347
// Reads the revision by the predefined case.
13461348
RevisionCase revision_case = 1;
13471349

1348-
// Reads the revision given by the id.
1350+
// Reads the revision given by the ID.
13491351
string revision_id = 2;
13501352

13511353
// Reads the revision generated by the processor version.

google/cloud/documentai/v1beta3/document_processor_service.proto

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -359,13 +359,15 @@ message ProcessOptions {
359359
[(google.api.field_behavior) = OPTIONAL];
360360

361361
// Optional. The number of tokens to group together when evaluating
362-
// semantic similarity. THIS FIELD IS NOT YET USED.
362+
// semantic similarity.
363+
// **Note:** This field is not yet used.
363364
bool semantic_chunking_group_size = 3
364365
[(google.api.field_behavior) = OPTIONAL];
365366

366367
// Optional. The percentile of cosine dissimilarity that must be exceeded
367368
// between a group of tokens and the next. The smaller this number is, the
368-
// more chunks will be generated. THIS FIELD IS NOT YET USED.
369+
// more chunks will be generated.
370+
// **Note:** This field is not yet used.
369371
int32 breakpoint_percentile_threshold = 4
370372
[(google.api.field_behavior) = OPTIONAL];
371373
}

0 commit comments

Comments
 (0)