Commit 4a539a7b authored by Jeremie Hallal
Browse files

Do not retrieve stat if not needed

parent 6e82f31d
Pipeline #71540 passed with stages
in 58 minutes and 16 seconds
......@@ -151,10 +151,13 @@ async def get_data_version(
raise BulkNotFound(record_id=record_id, bulk_id=None)
if prefix == BULK_URN_PREFIX_VERSION:
columns = None
stat = dask_blob_storage.read_stat(record_id, bulk_id)
if data_param.curves:
stat = dask_blob_storage.read_stat(record_id, bulk_id)
existing_col = set(stat['schema'])
columns = DataFrameRender.get_matching_column(data_param.get_curves_list(), existing_col)
elif data_param.describe:
stat = dask_blob_storage.read_stat(record_id, bulk_id)
# loading the dataframe with filter on columns is faster than filtering columns on df
df = await dask_blob_storage.load_bulk(record_id, bulk_id, columns=columns)
elif prefix is None:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment