Skip to content

Commit fc9f2be

Browse files
author
Tom McCormick
committed
cleanup tests
1 parent 4175559 commit fc9f2be

File tree

3 files changed

+90
-270
lines changed

3 files changed

+90
-270
lines changed

pyiceberg/io/pyarrow.py

Lines changed: 9 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -692,7 +692,7 @@ def schema_to_pyarrow(
692692
schema: Union[Schema, IcebergType],
693693
metadata: Dict[bytes, bytes] = EMPTY_DICT,
694694
include_field_ids: bool = True,
695-
file_format: Optional[FileFormat] = None,
695+
file_format: FileFormat = FileFormat.PARQUET,
696696
) -> pa.schema:
697697
return visit(schema, _ConvertToArrowSchema(metadata, include_field_ids, file_format))
698698

@@ -1253,18 +1253,14 @@ def primitive(self, primitive: pa.DataType) -> T:
12531253

12541254
def _get_field_id(field: pa.Field) -> Optional[int]:
12551255
"""Return the Iceberg field ID from Parquet or ORC metadata if available."""
1256-
if not field.metadata:
1257-
return None
1258-
1259-
# Try Parquet field ID first
1260-
field_id_bytes = field.metadata.get(PYARROW_PARQUET_FIELD_ID_KEY)
1261-
if field_id_bytes:
1262-
return int(field_id_bytes.decode())
1263-
1264-
# Fallback: try ORC field ID
1265-
field_id_bytes = field.metadata.get(ORC_FIELD_ID_KEY)
1266-
if field_id_bytes:
1267-
return int(field_id_bytes.decode())
1256+
if field.metadata:
1257+
# Try Parquet field ID first
1258+
if field_id_bytes := field.metadata.get(PYARROW_PARQUET_FIELD_ID_KEY):
1259+
return int(field_id_bytes.decode())
1260+
1261+
# Fallback: try ORC field ID
1262+
if field_id_bytes := field.metadata.get(ORC_FIELD_ID_KEY):
1263+
return int(field_id_bytes.decode())
12681264

12691265
return None
12701266

0 commit comments

Comments
 (0)