@@ -131,11 +131,11 @@ message ReadSession {
131131 }
132132
133133 // Optional. Specifies a table sampling percentage. Specifically, the query
134- // planner will use TABLESAMPLE SYSTEM (sample_percentage PERCENT). This
135- // samples at the file-level. It will randomly choose for each file whether
136- // to include that file in the sample returned. Note, that if the table only
137- // has one file, then TABLESAMPLE SYSTEM will select that file and return
138- // all returnable rows contained within.
134+ // planner will use TABLESAMPLE SYSTEM (sample_percentage PERCENT). The
135+ // sampling percentage is applied at the data block granularity. It will
136+ // randomly choose for each data block whether to read the rows in that data
137+ // block. For more details, see
138+ // https://cloud.google.com/bigquery/docs/table-sampling
139139 optional double sample_percentage = 5
140140 [(google.api.field_behavior ) = OPTIONAL ];
141141 }
@@ -194,6 +194,14 @@ message ReadSession {
194194 int64 estimated_total_bytes_scanned = 12
195195 [(google.api.field_behavior ) = OUTPUT_ONLY ];
196196
197+ // Output only. A pre-projected estimate of the total physical size (in bytes)
198+ // of files this session will scan when all streams are completely consumed.
199+ // This estimate does not depend on the selected columns and can be based on
200+ // metadata from the table which might be incomplete or stale. Only set for
201+ // BigLake tables.
202+ int64 estimated_total_physical_file_size = 15
203+ [(google.api.field_behavior ) = OUTPUT_ONLY ];
204+
197205 // Output only. An estimate on the number of rows present in this session's
198206 // streams. This estimate is based on metadata from the table which might be
199207 // incomplete or stale.
0 commit comments