| |
| |
| |
| |
| |
| |
| import math |
| import requests |
| from tqdm import tqdm |
|
|
| from .misc import sizeof_fmt |
|
|
|
|
| def download_file_from_google_drive(file_id, save_path): |
| """Download files from google drive. |
| |
| Ref: |
| https://stackoverflow.com/questions/25010369/wget-curl-large-file-from-google-drive # noqa E501 |
| |
| Args: |
| file_id (str): File id. |
| save_path (str): Save path. |
| """ |
|
|
| session = requests.Session() |
| URL = 'https://docs.google.com/uc?export=download' |
| params = {'id': file_id} |
|
|
| response = session.get(URL, params=params, stream=True) |
| token = get_confirm_token(response) |
| if token: |
| params['confirm'] = token |
| response = session.get(URL, params=params, stream=True) |
|
|
| |
| response_file_size = session.get( |
| URL, params=params, stream=True, headers={'Range': 'bytes=0-2'}) |
| if 'Content-Range' in response_file_size.headers: |
| file_size = int( |
| response_file_size.headers['Content-Range'].split('/')[1]) |
| else: |
| file_size = None |
|
|
| save_response_content(response, save_path, file_size) |
|
|
|
|
| def get_confirm_token(response): |
| for key, value in response.cookies.items(): |
| if key.startswith('download_warning'): |
| return value |
| return None |
|
|
|
|
| def save_response_content(response, |
| destination, |
| file_size=None, |
| chunk_size=32768): |
| if file_size is not None: |
| pbar = tqdm(total=math.ceil(file_size / chunk_size), unit='chunk') |
|
|
| readable_file_size = sizeof_fmt(file_size) |
| else: |
| pbar = None |
|
|
| with open(destination, 'wb') as f: |
| downloaded_size = 0 |
| for chunk in response.iter_content(chunk_size): |
| downloaded_size += chunk_size |
| if pbar is not None: |
| pbar.update(1) |
| pbar.set_description(f'Download {sizeof_fmt(downloaded_size)} ' |
| f'/ {readable_file_size}') |
| if chunk: |
| f.write(chunk) |
| if pbar is not None: |
| pbar.close() |
|
|