Coverage for /pythoncovmergedfiles/medio/medio/usr/local/lib/python3.11/site-packages/google/cloud/bigquery/job/load.py: 57%

3# Licensed under the Apache License, Version 2.0 (the "License");

4# you may not use this file except in compliance with the License.

5# You may obtain a copy of the License at

7# http://www.apache.org/licenses/LICENSE-2.0

9# Unless required by applicable law or agreed to in writing, software

10# distributed under the License is distributed on an "AS IS" BASIS,

11# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

12# See the License for the specific language governing permissions and

13# limitations under the License.

15"""Classes for load jobs."""

17import typing

18from typing import FrozenSet, List, Iterable, Optional, Union

20from google.cloud.bigquery.encryption_configuration import EncryptionConfiguration

21from google.cloud.bigquery.enums import SourceColumnMatch

22from google.cloud.bigquery.external_config import HivePartitioningOptions

23from google.cloud.bigquery.format_options import ParquetOptions

24from google.cloud.bigquery import _helpers

25from google.cloud.bigquery.schema import SchemaField

26from google.cloud.bigquery.schema import _to_schema_fields

27from google.cloud.bigquery.table import RangePartitioning

28from google.cloud.bigquery.table import TableReference

29from google.cloud.bigquery.table import TimePartitioning

30from google.cloud.bigquery.job.base import _AsyncJob

31from google.cloud.bigquery.job.base import _JobConfig

32from google.cloud.bigquery.job.base import _JobReference

33from google.cloud.bigquery.query import ConnectionProperty

36class ColumnNameCharacterMap:

37 """Indicates the character map used for column names.

39 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#columnnamecharactermap

40 """

42 COLUMN_NAME_CHARACTER_MAP_UNSPECIFIED = "COLUMN_NAME_CHARACTER_MAP_UNSPECIFIED"

43 """Unspecified column name character map."""

45 STRICT = "STRICT"

46 """Support flexible column name and reject invalid column names."""

48 V1 = "V1"

49 """ Support alphanumeric + underscore characters and names must start with

50 a letter or underscore. Invalid column names will be normalized."""

52 V2 = "V2"

53 """Support flexible column name. Invalid column names will be normalized."""

56class LoadJobConfig(_JobConfig):

57 """Configuration options for load jobs.

59 Set properties on the constructed configuration by using the property name

60 as the name of a keyword argument. Values which are unset or :data:`None`

61 use the BigQuery REST API default values. See the `BigQuery REST API

62 reference documentation

63 <https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad>`_

64 for a list of default values.

66 Required options differ based on the

67 :attr:`~google.cloud.bigquery.job.LoadJobConfig.source_format` value.

68 For example, the BigQuery API's default value for

69 :attr:`~google.cloud.bigquery.job.LoadJobConfig.source_format` is ``"CSV"``.

70 When loading a CSV file, either

71 :attr:`~google.cloud.bigquery.job.LoadJobConfig.schema` must be set or

72 :attr:`~google.cloud.bigquery.job.LoadJobConfig.autodetect` must be set to

73 :data:`True`.

74 """

76 def __init__(self, **kwargs) -> None:

77 super(LoadJobConfig, self).__init__("load", **kwargs)

79 @property

80 def allow_jagged_rows(self):

81 """Optional[bool]: Allow missing trailing optional columns (CSV only).

83 See:

84 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.allow_jagged_rows

85 """

86 return self._get_sub_prop("allowJaggedRows")

88 @allow_jagged_rows.setter

89 def allow_jagged_rows(self, value):

90 self._set_sub_prop("allowJaggedRows", value)

92 @property

93 def allow_quoted_newlines(self):

94 """Optional[bool]: Allow quoted data containing newline characters (CSV only).

96 See:

97 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.allow_quoted_newlines

98 """

99 return self._get_sub_prop("allowQuotedNewlines")

100

101 @allow_quoted_newlines.setter

102 def allow_quoted_newlines(self, value):

103 self._set_sub_prop("allowQuotedNewlines", value)

104

105 @property

106 def autodetect(self):

107 """Optional[bool]: Automatically infer the schema from a sample of the data.

108

109 See:

110 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.autodetect

111 """

112 return self._get_sub_prop("autodetect")

113

114 @autodetect.setter

115 def autodetect(self, value):

116 self._set_sub_prop("autodetect", value)

117

118 @property

119 def clustering_fields(self):

120 """Optional[List[str]]: Fields defining clustering for the table

121

122 (Defaults to :data:`None`).

123

124 Clustering fields are immutable after table creation.

125

126 .. note::

127

128 BigQuery supports clustering for both partitioned and

129 non-partitioned tables.

130 """

131 prop = self._get_sub_prop("clustering")

132 if prop is not None:

133 return list(prop.get("fields", ()))

134

135 @clustering_fields.setter

136 def clustering_fields(self, value):

137 """Optional[List[str]]: Fields defining clustering for the table

138

139 (Defaults to :data:`None`).

140 """

141 if value is not None:

142 self._set_sub_prop("clustering", {"fields": value})

143 else:

144 self._del_sub_prop("clustering")

145

146 @property

147 def connection_properties(self) -> List[ConnectionProperty]:

148 """Connection properties.

149

150 See

151 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.connection_properties

152

153 .. versionadded:: 3.7.0

154 """

155 resource = self._get_sub_prop("connectionProperties", [])

156 return [ConnectionProperty.from_api_repr(prop) for prop in resource]

157

158 @connection_properties.setter

159 def connection_properties(self, value: Iterable[ConnectionProperty]):

160 self._set_sub_prop(

161 "connectionProperties",

162 [prop.to_api_repr() for prop in value],

163 )

164

165 @property

166 def create_disposition(self):

167 """Optional[google.cloud.bigquery.job.CreateDisposition]: Specifies behavior

168 for creating tables.

169

170 See:

171 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.create_disposition

172 """

173 return self._get_sub_prop("createDisposition")

174

175 @create_disposition.setter

176 def create_disposition(self, value):

177 self._set_sub_prop("createDisposition", value)

178

179 @property

180 def create_session(self) -> Optional[bool]:

181 """[Preview] If :data:`True`, creates a new session, where

182 :attr:`~google.cloud.bigquery.job.LoadJob.session_info` will contain a

183 random server generated session id.

184

185 If :data:`False`, runs load job with an existing ``session_id`` passed in

186 :attr:`~google.cloud.bigquery.job.LoadJobConfig.connection_properties`,

187 otherwise runs load job in non-session mode.

188

189 See

190 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.create_session

191

192 .. versionadded:: 3.7.0

193 """

194 return self._get_sub_prop("createSession")

195

196 @create_session.setter

197 def create_session(self, value: Optional[bool]):

198 self._set_sub_prop("createSession", value)

199

200 @property

201 def decimal_target_types(self) -> Optional[FrozenSet[str]]:

202 """Possible SQL data types to which the source decimal values are converted.

203

204 See:

205 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.decimal_target_types

206

207 .. versionadded:: 2.21.0

208 """

209 prop = self._get_sub_prop("decimalTargetTypes")

210 if prop is not None:

211 prop = frozenset(prop)

212 return prop

213

214 @decimal_target_types.setter

215 def decimal_target_types(self, value: Optional[Iterable[str]]):

216 if value is not None:

217 self._set_sub_prop("decimalTargetTypes", list(value))

218 else:

219 self._del_sub_prop("decimalTargetTypes")

220

221 @property

222 def destination_encryption_configuration(self):

223 """Optional[google.cloud.bigquery.encryption_configuration.EncryptionConfiguration]: Custom

224 encryption configuration for the destination table.

225

226 Custom encryption configuration (e.g., Cloud KMS keys) or :data:`None`

227 if using default encryption.

228

229 See:

230 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.destination_encryption_configuration

231 """

232 prop = self._get_sub_prop("destinationEncryptionConfiguration")

233 if prop is not None:

234 prop = EncryptionConfiguration.from_api_repr(prop)

235 return prop

236

237 @destination_encryption_configuration.setter

238 def destination_encryption_configuration(self, value):

239 api_repr = value

240 if value is not None:

241 api_repr = value.to_api_repr()

242 self._set_sub_prop("destinationEncryptionConfiguration", api_repr)

243 else:

244 self._del_sub_prop("destinationEncryptionConfiguration")

245

246 @property

247 def destination_table_description(self):

248 """Optional[str]: Description of the destination table.

249

250 See:

251 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#DestinationTableProperties.FIELDS.description

252 """

253 prop = self._get_sub_prop("destinationTableProperties")

254 if prop is not None:

255 return prop["description"]

256

257 @destination_table_description.setter

258 def destination_table_description(self, value):

259 keys = [self._job_type, "destinationTableProperties", "description"]

260 if value is not None:

261 _helpers._set_sub_prop(self._properties, keys, value)

262 else:

263 _helpers._del_sub_prop(self._properties, keys)

264

265 @property

266 def destination_table_friendly_name(self):

267 """Optional[str]: Name given to destination table.

268

269 See:

270 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#DestinationTableProperties.FIELDS.friendly_name

271 """

272 prop = self._get_sub_prop("destinationTableProperties")

273 if prop is not None:

274 return prop["friendlyName"]

275

276 @destination_table_friendly_name.setter

277 def destination_table_friendly_name(self, value):

278 keys = [self._job_type, "destinationTableProperties", "friendlyName"]

279 if value is not None:

280 _helpers._set_sub_prop(self._properties, keys, value)

281 else:

282 _helpers._del_sub_prop(self._properties, keys)

283

284 @property

285 def encoding(self):

286 """Optional[google.cloud.bigquery.job.Encoding]: The character encoding of the

287 data.

288

289 See:

290 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.encoding

291 """

292 return self._get_sub_prop("encoding")

293

294 @encoding.setter

295 def encoding(self, value):

296 self._set_sub_prop("encoding", value)

297

298 @property

299 def field_delimiter(self):

300 """Optional[str]: The separator for fields in a CSV file.

301

302 See:

303 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.field_delimiter

304 """

305 return self._get_sub_prop("fieldDelimiter")

306

307 @field_delimiter.setter

308 def field_delimiter(self, value):

309 self._set_sub_prop("fieldDelimiter", value)

310

311 @property

312 def hive_partitioning(self):

313 """Optional[:class:`~.external_config.HivePartitioningOptions`]: [Beta] When set, \

314 it configures hive partitioning support.

315

316 .. note::

317 **Experimental**. This feature is experimental and might change or

318 have limited support.

319

320 See:

321 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.hive_partitioning_options

322 """

323 prop = self._get_sub_prop("hivePartitioningOptions")

324 if prop is None:

325 return None

326 return HivePartitioningOptions.from_api_repr(prop)

327

328 @hive_partitioning.setter

329 def hive_partitioning(self, value):

330 if value is not None:

331 if isinstance(value, HivePartitioningOptions):

332 value = value.to_api_repr()

333 else:

334 raise TypeError("Expected a HivePartitioningOptions instance or None.")

335

336 self._set_sub_prop("hivePartitioningOptions", value)

337

338 @property

339 def ignore_unknown_values(self):

340 """Optional[bool]: Ignore extra values not represented in the table schema.

341

342 See:

343 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.ignore_unknown_values

344 """

345 return self._get_sub_prop("ignoreUnknownValues")

346

347 @ignore_unknown_values.setter

348 def ignore_unknown_values(self, value):

349 self._set_sub_prop("ignoreUnknownValues", value)

350

351 @property

352 def json_extension(self):

353 """Optional[str]: The extension to use for writing JSON data to BigQuery. Only supports GeoJSON currently.

354

355 See: https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.json_extension

356

357 """

358 return self._get_sub_prop("jsonExtension")

359

360 @json_extension.setter

361 def json_extension(self, value):

362 self._set_sub_prop("jsonExtension", value)

363

364 @property

365 def max_bad_records(self):

366 """Optional[int]: Number of invalid rows to ignore.

367

368 See:

369 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.max_bad_records

370 """

371 return _helpers._int_or_none(self._get_sub_prop("maxBadRecords"))

372

373 @max_bad_records.setter

374 def max_bad_records(self, value):

375 self._set_sub_prop("maxBadRecords", value)

376

377 @property

378 def null_marker(self):

379 """Optional[str]: Represents a null value (CSV only).

380

381 See:

382 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.null_marker

383 """

384 return self._get_sub_prop("nullMarker")

385

386 @null_marker.setter

387 def null_marker(self, value):

388 self._set_sub_prop("nullMarker", value)

389

390 @property

391 def null_markers(self) -> Optional[List[str]]:

392 """Optional[List[str]]: A list of strings represented as SQL NULL values in a CSV file.

393

394 .. note::

395 null_marker and null_markers can't be set at the same time.

396 If null_marker is set, null_markers has to be not set.

397 If null_markers is set, null_marker has to be not set.

398 If both null_marker and null_markers are set at the same time, a user error would be thrown.

399 Any strings listed in null_markers, including empty string would be interpreted as SQL NULL.

400 This applies to all column types.

401

402 See:

403 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.null_markers

404 """

405 return self._get_sub_prop("nullMarkers")

406

407 @null_markers.setter

408 def null_markers(self, value: Optional[List[str]]):

409 self._set_sub_prop("nullMarkers", value)

410

411 @property

412 def preserve_ascii_control_characters(self):

413 """Optional[bool]: Preserves the embedded ASCII control characters when sourceFormat is set to CSV.

414

415 See:

416 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.preserve_ascii_control_characters

417 """

418 return self._get_sub_prop("preserveAsciiControlCharacters")

419

420 @preserve_ascii_control_characters.setter

421 def preserve_ascii_control_characters(self, value):

422 self._set_sub_prop("preserveAsciiControlCharacters", bool(value))

423

424 @property

425 def projection_fields(self) -> Optional[List[str]]:

426 """Optional[List[str]]: If

427 :attr:`google.cloud.bigquery.job.LoadJobConfig.source_format` is set to

428 "DATASTORE_BACKUP", indicates which entity properties to load into

429 BigQuery from a Cloud Datastore backup.

430

431 Property names are case sensitive and must be top-level properties. If

432 no properties are specified, BigQuery loads all properties. If any

433 named property isn't found in the Cloud Datastore backup, an invalid

434 error is returned in the job result.

435

436 See:

437 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.projection_fields

438 """

439 return self._get_sub_prop("projectionFields")

440

441 @projection_fields.setter

442 def projection_fields(self, value: Optional[List[str]]):

443 self._set_sub_prop("projectionFields", value)

444

445 @property

446 def quote_character(self):

447 """Optional[str]: Character used to quote data sections (CSV only).

448

449 See:

450 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.quote

451 """

452 return self._get_sub_prop("quote")

453

454 @quote_character.setter

455 def quote_character(self, value):

456 self._set_sub_prop("quote", value)

457

458 @property

459 def range_partitioning(self):

460 """Optional[google.cloud.bigquery.table.RangePartitioning]:

461 Configures range-based partitioning for destination table.

462

463 .. note::

464 **Beta**. The integer range partitioning feature is in a

465 pre-release state and might change or have limited support.

466

467 Only specify at most one of

468 :attr:`~google.cloud.bigquery.job.LoadJobConfig.time_partitioning` or

469 :attr:`~google.cloud.bigquery.job.LoadJobConfig.range_partitioning`.

470

471 Raises:

472 ValueError:

473 If the value is not

474 :class:`~google.cloud.bigquery.table.RangePartitioning` or

475 :data:`None`.

476 """

477 resource = self._get_sub_prop("rangePartitioning")

478 if resource is not None:

479 return RangePartitioning(_properties=resource)

480

481 @range_partitioning.setter

482 def range_partitioning(self, value):

483 resource = value

484 if isinstance(value, RangePartitioning):

485 resource = value._properties

486 elif value is not None:

487 raise ValueError(

488 "Expected value to be RangePartitioning or None, got {}.".format(value)

489 )

490 self._set_sub_prop("rangePartitioning", resource)

491

492 @property

493 def reference_file_schema_uri(self):

494 """Optional[str]:

495 When creating an external table, the user can provide a reference file with the

496 table schema. This is enabled for the following formats:

497

498 AVRO, PARQUET, ORC

499 """

500 return self._get_sub_prop("referenceFileSchemaUri")

501

502 @reference_file_schema_uri.setter

503 def reference_file_schema_uri(self, value):

504 return self._set_sub_prop("referenceFileSchemaUri", value)

505

506 @property

507 def schema(self):

508 """Optional[Sequence[Union[ \

509 :class:`~google.cloud.bigquery.schema.SchemaField`, \

510 Mapping[str, Any] \

511 ]]]: Schema of the destination table.

512

513 See:

514 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.schema

515 """

516 schema = _helpers._get_sub_prop(self._properties, ["load", "schema", "fields"])

517 if schema is None:

518 return

519 return [SchemaField.from_api_repr(field) for field in schema]

520

521 @schema.setter

522 def schema(self, value):

523 if value is None:

524 self._del_sub_prop("schema")

525 return

526

527 value = _to_schema_fields(value)

528

529 _helpers._set_sub_prop(

530 self._properties,

531 ["load", "schema", "fields"],

532 [field.to_api_repr() for field in value],

533 )

534

535 @property

536 def schema_update_options(self):

537 """Optional[List[google.cloud.bigquery.job.SchemaUpdateOption]]: Specifies

538 updates to the destination table schema to allow as a side effect of

539 the load job.

540 """

541 return self._get_sub_prop("schemaUpdateOptions")

542

543 @schema_update_options.setter

544 def schema_update_options(self, values):

545 self._set_sub_prop("schemaUpdateOptions", values)

546

547 @property

548 def skip_leading_rows(self):

549 """Optional[int]: Number of rows to skip when reading data (CSV only).

550

551 See:

552 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.skip_leading_rows

553 """

554 return _helpers._int_or_none(self._get_sub_prop("skipLeadingRows"))

555

556 @skip_leading_rows.setter

557 def skip_leading_rows(self, value):

558 self._set_sub_prop("skipLeadingRows", str(value))

559

560 @property

561 def source_format(self):

562 """Optional[google.cloud.bigquery.job.SourceFormat]: File format of the data.

563

564 See:

565 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.source_format

566 """

567 return self._get_sub_prop("sourceFormat")

568

569 @source_format.setter

570 def source_format(self, value):

571 self._set_sub_prop("sourceFormat", value)

572

573 @property

574 def source_column_match(self) -> Optional[SourceColumnMatch]:

575 """Optional[google.cloud.bigquery.enums.SourceColumnMatch]: Controls the

576 strategy used to match loaded columns to the schema. If not set, a sensible

577 default is chosen based on how the schema is provided. If autodetect is

578 used, then columns are matched by name. Otherwise, columns are matched by

579 position. This is done to keep the behavior backward-compatible.

580

581 Acceptable values are:

582

583 SOURCE_COLUMN_MATCH_UNSPECIFIED: Unspecified column name match option.

584 POSITION: matches by position. This assumes that the columns are ordered

585 the same way as the schema.

586 NAME: matches by name. This reads the header row as column names and

587 reorders columns to match the field names in the schema.

588

589 See:

590

591 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.source_column_match

592 """

593 value = self._get_sub_prop("sourceColumnMatch")

594 return SourceColumnMatch(value) if value is not None else None

595

596 @source_column_match.setter

597 def source_column_match(self, value: Union[SourceColumnMatch, str, None]):

598 if value is not None and not isinstance(value, (SourceColumnMatch, str)):

599 raise TypeError(

600 "value must be a google.cloud.bigquery.enums.SourceColumnMatch, str, or None"

601 )

602 if isinstance(value, SourceColumnMatch):

603 value = value.value

604 self._set_sub_prop("sourceColumnMatch", value if value else None)

605

606 @property

607 def date_format(self) -> Optional[str]:

608 """Optional[str]: Date format used for parsing DATE values.

609

610 See:

611 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.date_format

612 """

613 return self._get_sub_prop("dateFormat")

614

615 @date_format.setter

616 def date_format(self, value: Optional[str]):

617 self._set_sub_prop("dateFormat", value)

618

619 @property

620 def datetime_format(self) -> Optional[str]:

621 """Optional[str]: Date format used for parsing DATETIME values.

622

623 See:

624 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.datetime_format

625 """

626 return self._get_sub_prop("datetimeFormat")

627

628 @datetime_format.setter

629 def datetime_format(self, value: Optional[str]):

630 self._set_sub_prop("datetimeFormat", value)

631

632 @property

633 def time_zone(self) -> Optional[str]:

634 """Optional[str]: Default time zone that will apply when parsing timestamp

635 values that have no specific time zone.

636

637 See:

638 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.time_zone

639 """

640 return self._get_sub_prop("timeZone")

641

642 @time_zone.setter

643 def time_zone(self, value: Optional[str]):

644 self._set_sub_prop("timeZone", value)

645

646 @property

647 def time_format(self) -> Optional[str]:

648 """Optional[str]: Date format used for parsing TIME values.

649

650 See:

651 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.time_format

652 """

653 return self._get_sub_prop("timeFormat")

654

655 @time_format.setter

656 def time_format(self, value: Optional[str]):

657 self._set_sub_prop("timeFormat", value)

658

659 @property

660 def timestamp_format(self) -> Optional[str]:

661 """Optional[str]: Date format used for parsing TIMESTAMP values.

662

663 See:

664 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.timestamp_format

665 """

666 return self._get_sub_prop("timestampFormat")

667

668 @timestamp_format.setter

669 def timestamp_format(self, value: Optional[str]):

670 self._set_sub_prop("timestampFormat", value)

671

672 @property

673 def time_partitioning(self):

674 """Optional[google.cloud.bigquery.table.TimePartitioning]: Specifies time-based

675 partitioning for the destination table.

676

677 Only specify at most one of

678 :attr:`~google.cloud.bigquery.job.LoadJobConfig.time_partitioning` or

679 :attr:`~google.cloud.bigquery.job.LoadJobConfig.range_partitioning`.

680 """

681 prop = self._get_sub_prop("timePartitioning")

682 if prop is not None:

683 prop = TimePartitioning.from_api_repr(prop)

684 return prop

685

686 @time_partitioning.setter

687 def time_partitioning(self, value):

688 api_repr = value

689 if value is not None:

690 api_repr = value.to_api_repr()

691 self._set_sub_prop("timePartitioning", api_repr)

692 else:

693 self._del_sub_prop("timePartitioning")

694

695 @property

696 def use_avro_logical_types(self):

697 """Optional[bool]: For loads of Avro data, governs whether Avro logical types are

698 converted to their corresponding BigQuery types (e.g. TIMESTAMP) rather than

699 raw types (e.g. INTEGER).

700 """

701 return self._get_sub_prop("useAvroLogicalTypes")

702

703 @use_avro_logical_types.setter

704 def use_avro_logical_types(self, value):

705 self._set_sub_prop("useAvroLogicalTypes", bool(value))

706

707 @property

708 def write_disposition(self):

709 """Optional[google.cloud.bigquery.job.WriteDisposition]: Action that occurs if

710 the destination table already exists.

711

712 See:

713 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.write_disposition

714 """

715 return self._get_sub_prop("writeDisposition")

716

717 @write_disposition.setter

718 def write_disposition(self, value):

719 self._set_sub_prop("writeDisposition", value)

720

721 @property

722 def parquet_options(self):

723 """Optional[google.cloud.bigquery.format_options.ParquetOptions]: Additional

724 properties to set if ``sourceFormat`` is set to PARQUET.

725

726 See:

727 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.parquet_options

728 """

729 prop = self._get_sub_prop("parquetOptions")

730 if prop is not None:

731 prop = ParquetOptions.from_api_repr(prop)

732 return prop

733

734 @parquet_options.setter

735 def parquet_options(self, value):

736 if value is not None:

737 self._set_sub_prop("parquetOptions", value.to_api_repr())

738 else:

739 self._del_sub_prop("parquetOptions")

740

741 @property

742 def column_name_character_map(self) -> str:

743 """Optional[google.cloud.bigquery.job.ColumnNameCharacterMap]:

744 Character map supported for column names in CSV/Parquet loads. Defaults

745 to STRICT and can be overridden by Project Config Service. Using this

746 option with unsupported load formats will result in an error.

747

748 See

749 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.column_name_character_map

750 """

751 return self._get_sub_prop(

752 "columnNameCharacterMap",

753 ColumnNameCharacterMap.COLUMN_NAME_CHARACTER_MAP_UNSPECIFIED,

754 )

755

756 @column_name_character_map.setter

757 def column_name_character_map(self, value: Optional[str]):

758 if value is None:

759 value = ColumnNameCharacterMap.COLUMN_NAME_CHARACTER_MAP_UNSPECIFIED

760 self._set_sub_prop("columnNameCharacterMap", value)

761

762

763class LoadJob(_AsyncJob):

764 """Asynchronous job for loading data into a table.

765

766 Can load from Google Cloud Storage URIs or from a file.

767

768 Args:

769 job_id (str): the job's ID

770

771 source_uris (Optional[Sequence[str]]):

772 URIs of one or more data files to be loaded. See

773 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.source_uris

774 for supported URI formats. Pass None for jobs that load from a file.

775

776 destination (google.cloud.bigquery.table.TableReference): reference to table into which data is to be loaded.

777

778 client (google.cloud.bigquery.client.Client):

779 A client which holds credentials and project configuration

780 for the dataset (which requires a project).

781 """

782

783 _JOB_TYPE = "load"

784 _CONFIG_CLASS = LoadJobConfig

785

786 def __init__(self, job_id, source_uris, destination, client, job_config=None):

787 super(LoadJob, self).__init__(job_id, client)

788

789 if job_config is not None:

790 self._properties["configuration"] = job_config._properties

791

792 if source_uris is not None:

793 _helpers._set_sub_prop(

794 self._properties, ["configuration", "load", "sourceUris"], source_uris

795 )

796

797 if destination is not None:

798 _helpers._set_sub_prop(

799 self._properties,

800 ["configuration", "load", "destinationTable"],

801 destination.to_api_repr(),

802 )

803

804 @property

805 def configuration(self) -> LoadJobConfig:

806 """The configuration for this load job."""

807 return typing.cast(LoadJobConfig, super().configuration)

808

809 @property

810 def destination(self):

811 """google.cloud.bigquery.table.TableReference: table where loaded rows are written

812

813 See:

814 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.destination_table

815 """

816 dest_config = _helpers._get_sub_prop(

817 self._properties, ["configuration", "load", "destinationTable"]

818 )

819 return TableReference.from_api_repr(dest_config)

820

821 @property

822 def source_uris(self):

823 """Optional[Sequence[str]]: URIs of data files to be loaded. See

824 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad.FIELDS.source_uris

825 for supported URI formats. None for jobs that load from a file.

826 """

827 return _helpers._get_sub_prop(

828 self._properties, ["configuration", "load", "sourceUris"]

829 )

830

831 @property

832 def allow_jagged_rows(self):

833 """See

834 :attr:`google.cloud.bigquery.job.LoadJobConfig.allow_jagged_rows`.

835 """

836 return self.configuration.allow_jagged_rows

837

838 @property

839 def allow_quoted_newlines(self):

840 """See

841 :attr:`google.cloud.bigquery.job.LoadJobConfig.allow_quoted_newlines`.

842 """

843 return self.configuration.allow_quoted_newlines

844

845 @property

846 def autodetect(self):

847 """See

848 :attr:`google.cloud.bigquery.job.LoadJobConfig.autodetect`.

849 """

850 return self.configuration.autodetect

851

852 @property

853 def connection_properties(self) -> List[ConnectionProperty]:

854 """See

855 :attr:`google.cloud.bigquery.job.LoadJobConfig.connection_properties`.

856

857 .. versionadded:: 3.7.0

858 """

859 return self.configuration.connection_properties

860

861 @property

862 def create_disposition(self):

863 """See

864 :attr:`google.cloud.bigquery.job.LoadJobConfig.create_disposition`.

865 """

866 return self.configuration.create_disposition

867

868 @property

869 def create_session(self) -> Optional[bool]:

870 """See

871 :attr:`google.cloud.bigquery.job.LoadJobConfig.create_session`.

872

873 .. versionadded:: 3.7.0

874 """

875 return self.configuration.create_session

876

877 @property

878 def encoding(self):

879 """See

880 :attr:`google.cloud.bigquery.job.LoadJobConfig.encoding`.

881 """

882 return self.configuration.encoding

883

884 @property

885 def field_delimiter(self):

886 """See

887 :attr:`google.cloud.bigquery.job.LoadJobConfig.field_delimiter`.

888 """

889 return self.configuration.field_delimiter

890

891 @property

892 def ignore_unknown_values(self):

893 """See

894 :attr:`google.cloud.bigquery.job.LoadJobConfig.ignore_unknown_values`.

895 """

896 return self.configuration.ignore_unknown_values

897

898 @property

899 def max_bad_records(self):

900 """See

901 :attr:`google.cloud.bigquery.job.LoadJobConfig.max_bad_records`.

902 """

903 return self.configuration.max_bad_records

904

905 @property

906 def null_marker(self):

907 """See

908 :attr:`google.cloud.bigquery.job.LoadJobConfig.null_marker`.

909 """

910 return self.configuration.null_marker

911

912 @property

913 def null_markers(self):

914 """See

915 :attr:`google.cloud.bigquery.job.LoadJobConfig.null_markers`.

916 """

917 return self.configuration.null_markers

918

919 @property

920 def quote_character(self):

921 """See

922 :attr:`google.cloud.bigquery.job.LoadJobConfig.quote_character`.

923 """

924 return self.configuration.quote_character

925

926 @property

927 def reference_file_schema_uri(self):

928 """See:

929 attr:`google.cloud.bigquery.job.LoadJobConfig.reference_file_schema_uri`.

930 """

931 return self.configuration.reference_file_schema_uri

932

933 @property

934 def skip_leading_rows(self):

935 """See

936 :attr:`google.cloud.bigquery.job.LoadJobConfig.skip_leading_rows`.

937 """

938 return self.configuration.skip_leading_rows

939

940 @property

941 def source_format(self):

942 """See

943 :attr:`google.cloud.bigquery.job.LoadJobConfig.source_format`.

944 """

945 return self.configuration.source_format

946

947 @property

948 def write_disposition(self):

949 """See

950 :attr:`google.cloud.bigquery.job.LoadJobConfig.write_disposition`.

951 """

952 return self.configuration.write_disposition

953

954 @property

955 def schema(self):

956 """See

957 :attr:`google.cloud.bigquery.job.LoadJobConfig.schema`.

958 """

959 return self.configuration.schema

960

961 @property

962 def destination_encryption_configuration(self):

963 """google.cloud.bigquery.encryption_configuration.EncryptionConfiguration: Custom

964 encryption configuration for the destination table.

965

966 Custom encryption configuration (e.g., Cloud KMS keys)

967 or :data:`None` if using default encryption.

968

969 See

970 :attr:`google.cloud.bigquery.job.LoadJobConfig.destination_encryption_configuration`.

971 """

972 return self.configuration.destination_encryption_configuration

973

974 @property

975 def destination_table_description(self):

976 """Optional[str] name given to destination table.

977

978 See:

979 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#DestinationTableProperties.FIELDS.description

980 """

981 return self.configuration.destination_table_description

982

983 @property

984 def destination_table_friendly_name(self):

985 """Optional[str] name given to destination table.

986

987 See:

988 https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#DestinationTableProperties.FIELDS.friendly_name

989 """

990 return self.configuration.destination_table_friendly_name

991

992 @property

993 def range_partitioning(self):

994 """See

995 :attr:`google.cloud.bigquery.job.LoadJobConfig.range_partitioning`.

996 """

997 return self.configuration.range_partitioning

998

999 @property

1000 def time_partitioning(self):

1001 """See

1002 :attr:`google.cloud.bigquery.job.LoadJobConfig.time_partitioning`.

1003 """

1004 return self.configuration.time_partitioning

1005

1006 @property

1007 def use_avro_logical_types(self):

1008 """See

1009 :attr:`google.cloud.bigquery.job.LoadJobConfig.use_avro_logical_types`.

1010 """

1011 return self.configuration.use_avro_logical_types

1012

1013 @property

1014 def clustering_fields(self):

1015 """See

1016 :attr:`google.cloud.bigquery.job.LoadJobConfig.clustering_fields`.

1017 """

1018 return self.configuration.clustering_fields

1019

1020 @property

1021 def source_column_match(self) -> Optional[SourceColumnMatch]:

1022 """See

1023 :attr:`google.cloud.bigquery.job.LoadJobConfig.source_column_match`.

1024 """

1025 return self.configuration.source_column_match

1026

1027 @property

1028 def date_format(self):

1029 """See

1030 :attr:`google.cloud.bigquery.job.LoadJobConfig.date_format`.

1031 """

1032 return self.configuration.date_format

1033

1034 @property

1035 def datetime_format(self):

1036 """See

1037 :attr:`google.cloud.bigquery.job.LoadJobConfig.datetime_format`.

1038 """

1039 return self.configuration.datetime_format

1040

1041 @property

1042 def time_zone(self):

1043 """See

1044 :attr:`google.cloud.bigquery.job.LoadJobConfig.time_zone`.

1045 """

1046 return self.configuration.time_zone

1047

1048 @property

1049 def time_format(self):

1050 """See

1051 :attr:`google.cloud.bigquery.job.LoadJobConfig.time_format`.

1052 """

1053 return self.configuration.time_format

1054

1055 @property

1056 def timestamp_format(self):

1057 """See

1058 :attr:`google.cloud.bigquery.job.LoadJobConfig.timestamp_format`.

1059 """

1060 return self.configuration.timestamp_format

1061

1062 @property

1063 def schema_update_options(self):

1064 """See

1065 :attr:`google.cloud.bigquery.job.LoadJobConfig.schema_update_options`.

1066 """

1067 return self.configuration.schema_update_options

1068

1069 @property

1070 def input_file_bytes(self):

1071 """Count of bytes loaded from source files.

1072

1073 Returns:

1074 Optional[int]: the count (None until set from the server).

1075

1076 Raises:

1077 ValueError: for invalid value types.

1078 """

1079 return _helpers._int_or_none(

1080 _helpers._get_sub_prop(

1081 self._properties, ["statistics", "load", "inputFileBytes"]

1082 )

1083 )

1084

1085 @property

1086 def input_files(self):

1087 """Count of source files.

1088

1089 Returns:

1090 Optional[int]: the count (None until set from the server).

1091 """

1092 return _helpers._int_or_none(

1093 _helpers._get_sub_prop(

1094 self._properties, ["statistics", "load", "inputFiles"]

1095 )

1096 )

1097

1098 @property

1099 def output_bytes(self):

1100 """Count of bytes saved to destination table.

1101

1102 Returns:

1103 Optional[int]: the count (None until set from the server).

1104 """

1105 return _helpers._int_or_none(

1106 _helpers._get_sub_prop(

1107 self._properties, ["statistics", "load", "outputBytes"]

1108 )

1109 )

1110

1111 @property

1112 def output_rows(self):

1113 """Count of rows saved to destination table.

1114

1115 Returns:

1116 Optional[int]: the count (None until set from the server).

1117 """

1118 return _helpers._int_or_none(

1119 _helpers._get_sub_prop(

1120 self._properties, ["statistics", "load", "outputRows"]

1121 )

1122 )

1123

1124 def to_api_repr(self):

1125 """Generate a resource for :meth:`_begin`."""

1126 # Exclude statistics, if set.

1127 return {

1128 "jobReference": self._properties["jobReference"],

1129 "configuration": self._properties["configuration"],

1130 }

1131

1132 @classmethod

1133 def from_api_repr(cls, resource: dict, client) -> "LoadJob":

1134 """Factory: construct a job given its API representation

1135

1136 .. note::

1137

1138 This method assumes that the project found in the resource matches

1139 the client's project.

1140

1141 Args:

1142 resource (Dict): dataset job representation returned from the API

1143

1144 client (google.cloud.bigquery.client.Client):

1145 Client which holds credentials and project

1146 configuration for the dataset.

1147

1148 Returns:

1149 google.cloud.bigquery.job.LoadJob: Job parsed from ``resource``.

1150 """

1151 cls._check_resource_config(resource)

1152 job_ref = _JobReference._from_api_repr(resource["jobReference"])

1153 job = cls(job_ref, None, None, client)

1154 job._set_properties(resource)

1155 return job