2023-05-10 18:17:35 +09:00
|
|
|
import os
|
2023-07-19 21:47:47 +09:00
|
|
|
from argparse import Namespace
|
2023-05-10 18:17:35 +09:00
|
|
|
from concurrent.futures import ThreadPoolExecutor
|
2023-07-19 21:47:47 +09:00
|
|
|
from typing import Any
|
2023-05-10 18:17:35 +09:00
|
|
|
|
|
|
|
from pydantic.dataclasses import dataclass
|
|
|
|
|
2023-12-12 20:05:46 +09:00
|
|
|
from mdrsclient.api import FilesApi, FoldersApi
|
2023-05-10 18:17:35 +09:00
|
|
|
from mdrsclient.commands.base import BaseCommand
|
|
|
|
from mdrsclient.connection import MDRSConnection
|
2024-07-08 20:35:48 +09:00
|
|
|
from mdrsclient.exceptions import IllegalArgumentException, UnexpectedException
|
2024-07-22 14:35:34 +09:00
|
|
|
from mdrsclient.models import File, Folder, Laboratory
|
2023-05-10 18:17:35 +09:00
|
|
|
from mdrsclient.settings import CONCURRENT
|
|
|
|
|
|
|
|
|
|
|
|
@dataclass(frozen=True)
class DownloadFileInfo:
    """Immutable pairing of one remote file with the local path it is written to.

    Instances are built positionally as ``DownloadFileInfo(file, path)``, so the
    field order below is part of the interface.
    """

    # Remote file entry; handed to ``FilesApi.download`` as the source.
    file: File
    # Local filesystem path; handed to ``FilesApi.download`` as the destination.
    path: str
|
|
|
|
|
|
|
|
|
2024-07-08 20:35:48 +09:00
|
|
|
@dataclass
class DownloadContext:
    """Mutable state shared by one batch of downloads.

    Instances are built positionally as
    ``DownloadContext(hasError, isSkipIfExists, files)``, so the field order
    below is part of the interface.
    """

    # Set to True by the batch runner when at least one worker reports failure.
    hasError: bool
    # Mirrors the ``--skip-if-exists`` option; forwarded to every worker.
    isSkipIfExists: bool
    # Files queued for this batch.
    files: list[DownloadFileInfo]
|
|
|
|
|
|
|
|
|
2023-05-10 18:17:35 +09:00
|
|
|
class DownloadCommand(BaseCommand):
    """``download`` sub-command: copy a remote file, or a folder tree, into a local directory."""

    @classmethod
    def register(cls, parsers: Any) -> None:
        """Register the ``download`` sub-parser and its arguments.

        Args:
            parsers: Object exposing ``add_parser`` (an argparse sub-parsers action).
        """
        download_parser = parsers.add_parser("download", help="download the file or folder")
        download_parser.add_argument(
            "-r", "--recursive", help="download folders and their contents recursive", action="store_true"
        )
        download_parser.add_argument(
            "-s",
            "--skip-if-exists",
            help="skip the download if file is already downloaded and file size is the same",
            action="store_true",
        )
        download_parser.add_argument(
            "-e", "--exclude", help="exclude to download path matched file or folders", action="append"
        )
        download_parser.add_argument("-p", "--password", help="password to use when open locked folder")
        download_parser.add_argument("remote_path", help="remote file path (remote:/lab/path/file)")
        download_parser.add_argument("local_path", help="local folder path (/foo/bar/)")
        download_parser.set_defaults(func=cls.func)

    @classmethod
    def func(cls, args: Namespace) -> None:
        """Normalise the parsed command-line arguments and run :meth:`download`.

        Args:
            args: Namespace produced by the parser configured in :meth:`register`.
        """
        remote_path = str(args.remote_path)
        local_path = str(args.local_path)
        is_recursive = bool(args.recursive)
        is_skip_if_exists = bool(args.skip_if_exists)
        password = str(args.password) if args.password else None
        # Exclude patterns are compared case-insensitively and without a
        # trailing slash; __check_excludes normalises candidates the same way.
        excludes = [str(item).rstrip("/").lower() for item in args.exclude] if args.exclude is not None else []
        cls.download(remote_path, local_path, is_recursive, is_skip_if_exists, password, excludes)

    @classmethod
    def download(
        cls,
        remote_path: str,
        local_path: str,
        is_recursive: bool,
        is_skip_if_exists: bool,
        password: str | None,
        excludes: list[str],
    ) -> None:
        """Download the remote file or folder at ``remote_path`` into ``local_path``.

        Args:
            remote_path: Remote location, e.g. ``remote:/lab/path/file``.
            local_path: Existing local directory that receives the download.
            is_recursive: Must be true to download a folder.
            is_skip_if_exists: Skip files already present locally with the same size.
            password: Password forwarded to the folder lookup, or ``None``.
            excludes: Normalised (lower-case, no trailing slash) paths to leave out.

        Raises:
            IllegalArgumentException: ``local_path`` is not a directory, the
                remote path does not exist, or it is a folder and
                ``is_recursive`` is false.
            UnexpectedException: At least one file failed to download.
        """
        # The _parse/_create/_find helpers are not defined in this class;
        # presumably they are inherited from BaseCommand.
        (remote, laboratory_name, r_path) = cls._parse_remote_host_with_path(remote_path)
        r_path = r_path.rstrip("/")
        r_dirname = os.path.dirname(r_path)
        r_basename = os.path.basename(r_path)
        connection = cls._create_connection(remote)
        l_dirname = os.path.realpath(local_path)
        if not os.path.isdir(l_dirname):
            raise IllegalArgumentException(f"Local directory `{local_path}` not found.")
        laboratory = cls._find_laboratory(connection, laboratory_name)
        r_parent_folder = cls._find_folder(connection, laboratory, r_dirname, password)

        file = r_parent_folder.find_file(r_basename)
        if file is not None:
            # Single-file download.
            if cls.__check_excludes(excludes, laboratory, r_parent_folder, file):
                return
            context = DownloadContext(False, is_skip_if_exists, [])
            context.files.append(DownloadFileInfo(file, os.path.join(l_dirname, r_basename)))
            cls.__multiple_download(connection, context)
            # Report failures the same way the recursive path does instead of
            # finishing silently when the only requested file could not be fetched.
            if context.hasError:
                raise UnexpectedException("Some files failed to download.")
            return

        # Not a file: it has to be a sub folder, and only with --recursive.
        folder = r_parent_folder.find_sub_folder(r_basename)
        if folder is None:
            raise IllegalArgumentException(f"File or folder `{r_path}` not found.")
        if not is_recursive:
            raise IllegalArgumentException(f"Cannot download `{r_path}`: Is a folder.")
        folder_api = FoldersApi(connection)
        cls.__multiple_download_pickup_recursive_files(
            connection, folder_api, laboratory, folder.id, l_dirname, excludes, is_skip_if_exists
        )

    @classmethod
    def __multiple_download_pickup_recursive_files(
        cls,
        connection: MDRSConnection,
        folder_api: FoldersApi,
        laboratory: Laboratory,
        folder_id: str,
        basedir: str,
        excludes: list[str],
        is_skip_if_exists: bool,
    ) -> None:
        """Download one remote folder into ``basedir`` and recurse into its sub folders.

        Args:
            connection: Connection used to build the file API.
            folder_api: API used to retrieve folder details by id.
            laboratory: Laboratory owning the folder (used for exclude matching).
            folder_id: Id of the remote folder to download.
            basedir: Local directory in which the folder is recreated.
            excludes: Normalised paths to leave out.
            is_skip_if_exists: Skip files already present locally with the same size.

        Raises:
            UnexpectedException: At least one file in this folder failed to download.
        """
        context = DownloadContext(False, is_skip_if_exists, [])
        folder = folder_api.retrieve(folder_id)
        dirname = os.path.join(basedir, folder.name)
        # An excluded folder is skipped together with everything below it.
        if cls.__check_excludes(excludes, laboratory, folder, None):
            return
        if not os.path.exists(dirname):
            os.makedirs(dirname)
        print(dirname)

        context.files.extend(
            DownloadFileInfo(file, os.path.join(dirname, file.name))
            for file in folder.files
            if not cls.__check_excludes(excludes, laboratory, folder, file)
        )
        cls.__multiple_download(connection, context)
        if context.hasError:
            raise UnexpectedException("Some files failed to download.")

        for sub_folder in folder.sub_folders:
            cls.__multiple_download_pickup_recursive_files(
                connection, folder_api, laboratory, sub_folder.id, dirname, excludes, is_skip_if_exists
            )

    @classmethod
    def __multiple_download(cls, connection: MDRSConnection, context: DownloadContext) -> None:
        """Download every file queued in ``context`` using a thread pool.

        Sets ``context.hasError`` to ``True`` when any worker reports failure;
        the flag is never reset here.
        """
        file_api = FilesApi(connection)
        with ThreadPoolExecutor(max_workers=CONCURRENT) as pool:
            outcomes = list(
                pool.map(
                    lambda info: cls.__multiple_download_worker(file_api, info, context.isSkipIfExists),
                    context.files,
                )
            )
        if any(outcome is False for outcome in outcomes):
            context.hasError = True

    @classmethod
    def __multiple_download_worker(cls, file_api: FilesApi, info: DownloadFileInfo, is_skip_if_exists: bool) -> bool:
        """Download a single file unless it can be skipped.

        With ``is_skip_if_exists`` the transfer is skipped only when the local
        file already exists and its size equals the remote size. The local path
        is printed for both downloaded and skipped files.

        Returns:
            ``True`` when the file was downloaded or skipped, ``False`` when
            the download raised.
        """
        # `and` binds tighter than `or`, so the previous form
        # `not skip or exists and size_differs` also skipped files that were
        # missing locally. A missing file must always be downloaded.
        needs_download = (
            not is_skip_if_exists
            or not os.path.exists(info.path)
            or info.file.size != os.path.getsize(info.path)
        )
        if needs_download:
            try:
                file_api.download(info.file, info.path)
            except Exception:
                # Failure is reported through the return value so the caller
                # can collect the outcome of every queued file.
                return False
        print(info.path)
        return True

    @classmethod
    def __check_excludes(cls, excludes: list[str], laboratory: Laboratory, folder: Folder, file: File | None) -> bool:
        """Return whether the folder (``file is None``) or the file inside it is excluded.

        The candidate is ``/<laboratory name><folder path><file name>``,
        stripped of trailing slashes and lower-cased, and must equal one of
        ``excludes`` exactly.
        """
        file_name = file.name if file is not None else ""
        path = f"/{laboratory.name}{folder.path}{file_name}".rstrip("/").lower()
        return path in excludes
|