Matthew Powers
# 06/13/2023, 1:15 PM
def read_delta(
    table_uri,
    version=None,
    storage_options=None,
    without_files=False,
    columns=None,
    filters=None,
):
    """Read the data files of a Delta table via ``dd.read_parquet``.

    The table is opened with ``DeltaTable``, its PyArrow dataset is asked
    for the fragments matching ``filters``, and the resulting file paths
    are handed to ``dd.read_parquet``.

    Args:
        table_uri: Location of the Delta table. Also used as the prefix
            for every data-file path that is read.
        version: Passed positionally to ``DeltaTable`` as its second
            argument.
        storage_options: Passed positionally to ``DeltaTable`` as its
            third argument.
        without_files: Passed positionally to ``DeltaTable`` as its
            fourth argument.
        columns: Forwarded to ``dd.read_parquet(columns=...)``.
        filters: Forwarded to ``get_fragments(filter=...)``. It only
            selects which fragments (files) are read; no row-level
            filtering is applied by this function.

    Returns:
        Whatever ``dd.read_parquet`` returns for the selected files
        (presumably a Dask DataFrame -- confirm ``dd`` is
        ``dask.dataframe``).
    """
    dt = DeltaTable(table_uri, version, storage_options, without_files)
    fragments = dt.to_pyarrow_dataset().get_fragments(filter=filters)

    # Strip trailing slashes so a URI such as "s3://bucket/table/" does not
    # yield "s3://bucket/table//part-0.parquet"; on object stores a doubled
    # slash names a different key than the one the fragment refers to.
    root = str(table_uri).rstrip("/")
    filenames = [f"{root}/{fragment.path}" for fragment in fragments]

    # NOTE(review): storage_options is given to DeltaTable only and is not
    # forwarded to dd.read_parquet. For remote tables that need credentials
    # the parquet read may therefore fail -- confirm whether the two APIs
    # accept the same option keys before forwarding them.
    return dd.read_parquet(filenames, engine="pyarrow", columns=columns)