Skip to content

Commit 0605a39

Browse files
committed
add --merge-pull-request option for convert_to_parquet
1 parent b1bfe15 commit 0605a39

File tree

1 file changed

+24
-2
lines changed

1 file changed

+24
-2
lines changed

src/datasets/commands/convert_to_parquet.py

Lines changed: 24 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,9 @@
11
from argparse import ArgumentParser
22
from typing import Optional
33

4+
from huggingface_hub import HfApi
5+
6+
import datasets.config
47
from datasets.commands import BaseDatasetsCLICommand
58
from datasets.hub import convert_to_parquet
69

@@ -26,6 +29,11 @@ def register_subcommand(parser):
2629
parser.add_argument(
2730
"--trust_remote_code", action="store_true", help="whether to trust the code execution of the load script"
2831
)
32+
parser.add_argument(
33+
"--merge-pull-request",
34+
action="store_true",
35+
help="whether to automatically merge the pull request(s) after conversion",
36+
)
2937
parser.set_defaults(func=_command_factory)
3038

3139
def __init__(
@@ -39,8 +47,22 @@ def __init__(
3947
self._token = token
4048
self._revision = revision
4149
self._trust_remote_code = trust_remote_code
50+
self._merge_pull_request = False
4251

4352
def run(self) -> None:
    """Convert the dataset to Parquet and optionally merge the resulting pull request.

    Calls ``convert_to_parquet`` with the dataset id, revision, token,
    ``trust_remote_code`` and ``merge_pull_request`` settings stored on this
    command. When ``self._merge_pull_request`` is true, the pull request
    referenced by the returned commit info is then merged through
    ``HfApi.merge_pull_request``.

    Raises:
        ValueError: If merging was requested but the returned commit info
            carries no pull request number.
    """
    commit_info = convert_to_parquet(
        self._dataset_id,
        revision=self._revision,
        token=self._token,
        trust_remote_code=self._trust_remote_code,
        merge_pull_request=self._merge_pull_request,
    )

    if not self._merge_pull_request:
        return

    # `pr_num` is optional on the commit info; fail with a clear message
    # instead of the opaque TypeError that `int(None)` would raise.
    pr_num = commit_info.pr_num
    if pr_num is None:
        raise ValueError(
            f"Cannot merge pull request for '{self._dataset_id}': "
            "the conversion did not return a pull request number."
        )

    # NOTE(review): `merge_pull_request` is also forwarded to
    # `convert_to_parquet` above -- confirm that function does not merge the
    # pull request itself, otherwise this second merge would target an
    # already-merged pull request.
    api = HfApi(endpoint=datasets.config.HF_ENDPOINT, token=self._token)
    api.merge_pull_request(
        repo_id=self._dataset_id,
        discussion_num=int(pr_num),
        token=self._token,
        repo_type="dataset",
    )

0 commit comments

Comments
 (0)