Skip to content

Commit 4c3231d

Browse files
committed
Make sure to pass features into the embed storage branch as well.
1 parent e74b3a0 commit 4c3231d

1 file changed

Lines changed: 1 addition & 0 deletions

File tree

src/datasets/iterable_dataset.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4450,6 +4450,7 @@ def _push_parquet_shards_to_hub_single(
4450 4450
partial(embed_table_storage, token_per_repo_id=self._token_per_repo_id),
4451 4451
batched=True,
4452 4452
batch_size=get_arrow_writer_batch_size_from_features(shard.features),
4453 +
features=shard.features,
4453 4454
)
4454 4455
shard_path_in_repo = f"{data_dir}/{split}-{index:05d}-of-{num_shards:05d}.parquet"
4455 4456
tmp_file = tempfile.NamedTemporaryFile(suffix=".parquet", delete=False)

0 commit comments

Comments
 (0)