Skip to content

Commit 50fcf69

Browse files
Avoid multiple default config names (#7585)
* Avoid creating duplicated default config names
* Fix style
* Revert "Fix style"

This reverts commit d19a5bc.
1 parent 8add786 commit 50fcf69

File tree

2 files changed: +14 additions, -10 deletions (lines changed)

src/datasets/arrow_dataset.py

Lines changed: 7 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -5752,16 +5752,18 @@ def push_to_hub(
57525752
}
57535753
else:
57545754
metadata_config_to_dump = {"data_files": [{"split": split, "path": f"{data_dir}/{split}-*"}]}
5755+
configs_to_dump = {config_name: metadata_config_to_dump}
57555756
if set_default and config_name != "default":
57565757
if metadata_configs:
5757-
default_config_name = metadata_configs.get_default_config_name()
5758-
if default_config_name == "default":
5758+
current_default_config_name = metadata_configs.get_default_config_name()
5759+
if current_default_config_name == "default":
57595760
raise ValueError(
57605761
"There exists a configuration named 'default'. To set a different configuration as default, "
57615762
"rename the 'default' one first."
57625763
)
5763-
else:
5764-
_ = metadata_configs[default_config_name].pop("default")
5764+
if current_default_config_name:
5765+
_ = metadata_configs[current_default_config_name].pop("default")
5766+
configs_to_dump[current_default_config_name] = metadata_configs[current_default_config_name]
57655767
metadata_config_to_dump["default"] = True
57665768
# push to the deprecated dataset_infos.json
57675769
if repo_with_dataset_infos:
@@ -5779,7 +5781,7 @@ def push_to_hub(
57795781
)
57805782
# push to README
57815783
DatasetInfosDict({config_name: info_to_dump}).to_dataset_card_data(dataset_card_data)
5782-
MetadataConfigs({config_name: metadata_config_to_dump}).to_dataset_card_data(dataset_card_data)
5784+
MetadataConfigs(configs_to_dump).to_dataset_card_data(dataset_card_data)
57835785
dataset_card = DatasetCard(f"---\n{dataset_card_data}\n---\n") if dataset_card is None else dataset_card
57845786
additions.append(
57855787
CommitOperationAdd(path_in_repo=config.REPOCARD_FILENAME, path_or_fileobj=str(dataset_card).encode())

src/datasets/dataset_dict.py

Lines changed: 7 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1830,16 +1830,18 @@ def push_to_hub(
18301830
metadata_config_to_dump = {
18311831
"data_files": [{"split": split, "path": f"{data_dir}/{split}-*"} for split in self.keys()],
18321832
}
1833+
configs_to_dump = {config_name: metadata_config_to_dump}
18331834
if set_default and config_name != "default":
18341835
if metadata_configs:
1835-
default_config_name = metadata_configs.get_default_config_name()
1836-
if default_config_name == "default":
1836+
current_default_config_name = metadata_configs.get_default_config_name()
1837+
if current_default_config_name == "default":
18371838
raise ValueError(
18381839
"There exists a configuration named 'default'. To set a different configuration as default, "
18391840
"rename the 'default' one first."
18401841
)
1841-
else:
1842-
_ = metadata_configs[default_config_name].pop("default")
1842+
if current_default_config_name:
1843+
_ = metadata_configs[current_default_config_name].pop("default")
1844+
configs_to_dump[current_default_config_name] = metadata_configs[current_default_config_name]
18431845
metadata_config_to_dump["default"] = True
18441846
# push to the deprecated dataset_infos.json
18451847
if repo_with_dataset_infos:
@@ -1860,7 +1862,7 @@ def push_to_hub(
18601862
)
18611863
# push to README
18621864
DatasetInfosDict({config_name: info_to_dump}).to_dataset_card_data(dataset_card_data)
1863-
MetadataConfigs({config_name: metadata_config_to_dump}).to_dataset_card_data(dataset_card_data)
1865+
MetadataConfigs(configs_to_dump).to_dataset_card_data(dataset_card_data)
18641866
dataset_card = DatasetCard(f"---\n{dataset_card_data}\n---\n") if dataset_card is None else dataset_card
18651867
additions.append(
18661868
CommitOperationAdd(

0 commit comments

Comments
 (0)