Skip to content

Commit

Permalink
remove duplicative all-at-once concatenate w/ join (#168)
Browse files Browse the repository at this point in the history
  • Loading branch information
d33bs authored Mar 16, 2024
1 parent d88ede7 commit 4f4b6da
Showing 1 changed file with 0 additions and 14 deletions.
14 changes: 0 additions & 14 deletions cytotable/convert.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,6 @@
CytoTable: convert - transforming data for use with pycytominer.
"""


import itertools
import logging
import uuid
Expand Down Expand Up @@ -841,19 +840,6 @@ def _concat_join_sources(
if pathlib.Path(dest_path).is_dir():
shutil.rmtree(path=dest_path)

# write the concatted result as a parquet file
_write_parquet_table_with_metadata(
table=pa.concat_tables(
tables=[
parquet.read_table(
table_path, memory_map=CYTOTABLE_ARROW_USE_MEMORY_MAPPING
)
for table_path in join_sources
]
),
where=dest_path,
)

# build a parquet file writer which will be used to append files
# as a single concatenated parquet file, referencing the first file's schema
# (all must be the same schema)
Expand Down

0 comments on commit 4f4b6da

Please sign in to comment.