import warnings
from typing import Optional
import click
from .base import CONTEXT_SETTINGS, command_wrap, ClickErrorException
from ..operate import upload_file_to_file, upload_directory_as_archive, upload_directory_as_directory
from ..operate.base import REPO_TYPES, RepoTypeTyping, get_hf_client
class NoRemotePathAssignedWithUpload(ClickErrorException):
    """
    Custom exception class for indicating that no remote path in the repository is assigned.

    Raised by the ``upload`` subcommand when none of the ``-f``, ``-a`` or ``-d``
    options is given, i.e. there is no destination inside the repository.
    """
    # Exit code attached to this error type (0x21 == 33).
    exit_code = 0x21
def _add_upload_subcommand(cli: click.Group) -> click.Group:
    """
    Add the 'upload' subcommand to the CLI.

    :param cli: The Click CLI application.
    :type cli: click.Group
    :return: The modified Click CLI application.
    :rtype: click.Group
    """

    @cli.command('upload', help='Upload data to HuggingFace.\n\n'
                                'Set environment $HF_TOKEN to use your own access token.',
                 context_settings=CONTEXT_SETTINGS)
    @click.option('-r', '--repository', 'repo_id', type=str, required=True,
                  help='Repository to upload to.')
    @click.option('-t', '--type', 'repo_type', type=click.Choice(REPO_TYPES), default='dataset',
                  help='Type of the HuggingFace repository.', show_default=True)
    @click.option('-f', '--filename', 'file_in_repo', type=str, default=None,
                  help='File in repository to upload.')
    @click.option('-a', '--archive', 'archive_in_repo', type=str, default=None,
                  help='Archive file in repository to upload the packed input directory as.')
    @click.option('-d', '--directory', 'dir_in_repo', type=str, default=None,
                  help='Directory in repository to upload the full directory tree.')
    @click.option('-i', '--input', 'input_path', type=str, required=True,
                  help='Input path for upload.')
    @click.option('-R', '--revision', 'revision', type=str, default='main',
                  help='Revision of repository.', show_default=True)
    @click.option('-c', '--clear', 'clear', is_flag=True, type=bool, default=False,
                  help='Clear the remote directory before uploading.\n'
                       'Only applied when -d is used.', show_default=True)
    @click.option('-p', '--private', 'private', is_flag=True, type=bool, default=False,
                  help='Use private repository when created.', show_default=True)
    @command_wrap()
    def upload(repo_id: str, repo_type: RepoTypeTyping,
               file_in_repo: Optional[str], archive_in_repo: Optional[str], dir_in_repo: Optional[str],
               input_path: str, revision: str, clear: bool, private: bool):
        """
        Upload data to HuggingFace repositories.

        Exactly one upload mode is used, chosen by priority ``-f`` > ``-a`` > ``-d``;
        lower-priority options that are also given are ignored with a warning.

        :param repo_id: Repository to upload to.
        :type repo_id: str
        :param repo_type: Type of the HuggingFace repository.
        :type repo_type: RepoTypeTyping
        :param file_in_repo: File in repository to upload.
        :type file_in_repo: Optional[str]
        :param archive_in_repo: Archive file in repository to upload the packed input directory as.
        :type archive_in_repo: Optional[str]
        :param dir_in_repo: Directory in repository to upload the full directory tree.
        :type dir_in_repo: Optional[str]
        :param input_path: Input path for upload.
        :type input_path: str
        :param revision: Revision of repository.
        :type revision: str
        :param clear: Clear the remote directory before uploading.
            Only applied when -d is used.
        :type clear: bool
        :param private: Use private repository when created. When given for an
            already existing public repository, the repository is switched to private.
        :type private: bool
        :raises NoRemotePathAssignedWithUpload: If none of -f, -a or -d is given.
        """
        # Validate arguments before touching the network.
        if not file_in_repo and not archive_in_repo and not dir_in_repo:
            raise NoRemotePathAssignedWithUpload('No remote path in repository assigned.\n'
                                                 'One of the -f, -a, or -d option is required.')

        hf_client = get_hf_client()
        if not hf_client.repo_exists(repo_id, repo_type=repo_type):
            hf_client.create_repo(repo_id, repo_type=repo_type, exist_ok=True, private=private)

        # Only ever tighten visibility. '-p' is a flag defaulting to False, so a
        # missing '-p' cannot be told apart from an explicit "make it public";
        # treating it as the latter would silently expose an existing private
        # repository on every plain upload.
        if private and not hf_client.repo_info(repo_id, repo_type=repo_type).private:
            hf_client.update_repo_visibility(repo_id, repo_type=repo_type, private=True)

        if file_in_repo:
            # Single-file mode wins over archive and directory modes.
            if archive_in_repo:
                warnings.warn('File in repository assigned, value of -a option will be ignored.')
            if dir_in_repo:
                warnings.warn('File in repository assigned, value of -d option will be ignored.')

            upload_file_to_file(
                local_file=input_path,
                repo_id=repo_id,
                file_in_repo=file_in_repo,
                repo_type=repo_type,
                revision=revision,
            )

        elif archive_in_repo:
            # Archive mode wins over directory mode.
            if dir_in_repo:
                warnings.warn('Archive in repository assigned, value of -d option will be ignored.')

            upload_directory_as_archive(
                local_directory=input_path,
                repo_id=repo_id,
                archive_in_repo=archive_in_repo,
                repo_type=repo_type,
                revision=revision,
                silent=False,
            )

        elif dir_in_repo:
            upload_directory_as_directory(
                local_directory=input_path,
                repo_id=repo_id,
                path_in_repo=dir_in_repo,
                repo_type=repo_type,
                revision=revision,
                clear=clear,
            )

        else:
            # Unreachable because of the validation above. Raised explicitly
            # (rather than via ``assert``) so the guard survives ``python -O``.
            raise AssertionError('Should not reach this line, it must be a bug!')  # pragma: no cover

    return cli