Skip to content

Commit 2c0ffd3

Browse files
Update python/ray/data/datasource/parquet_meta_provider.py
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
Signed-off-by: Howie Tien <sword865@163.com>
1 parent b1c9309 commit 2c0ffd3

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

python/ray/data/datasource/parquet_meta_provider.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -269,7 +269,8 @@ def _dedupe_fragment_metadata(
269 | 269 |   | """
270 | 270 |   | schema_to_id = {} # schema_ser -> schema_id
271 | 271 |   | id_to_schema = {} # schema_id -> schema_ser
272 |     | - | stripped_metadatas = []
    | 272 | + | schema_to_id = {} # schema_ser -> schema_id
    | 273 | + | id_to_schema = {} # schema_id -> schema_ser
273 | 274 |   |
274 | 275 |   | for metadata in metadatas:
275 | 276 |   | # Get the current schema serialization
@@ -287,6 +288,6 @@ def _dedupe_fragment_metadata(
287 | 288 |   | existing_schema_ser = id_to_schema[schema_id]
288 | 289 |   | metadata.set_schema_pickled(existing_schema_ser)
289 | 290 |   |
290 |     | - | stripped_metadatas.append(metadata)
    | 291 | + | return metadatas
291 | 292 |   |
292 | 293 |   | return stripped_metadatas

0 commit comments

Comments
 (0)