This repository has been archived by the owner on Nov 17, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 6.8k
Make Gluon download function to be atomic #12572
Merged
Merged
Changes from 26 commits
Commits
Show all changes
38 commits
Select commit
Hold shift + click to select a range
b7fc61d
use rename trick to achieve atomic write but didn't support python2 a…
stu1130 657a921
add test for multiprocess download
stu1130 353221a
implement atomic_replace referred by https://github.com/untitaker/pyt…
stu1130 32ff8cd
change the number of testing process to 10
stu1130 7ded536
add docstring and disable linter
stu1130 b4c6b1f
half way to address some issue reviewer have
stu1130 901ed34
use warning instead of raise UserWarn
stu1130 a9d40c4
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 91f9ca9
check for sha1
stu1130 9ab6341
Trigger CI
stu1130 1985726
fix the logic of checking hash
stu1130 429684a
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 df2a9ef
refine the error message
stu1130 602b7d0
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 3bed37c
add more comments and expose the error message to the user
stu1130 f0b8c5d
delete trailing whitespace
stu1130 47f65c2
rename _path_to_encode to _str_to_unicode
stu1130 85f9408
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 5a01234
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 8f58746
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 b4235f0
fix the error message bug and add remove when the movefile fail on wi…
stu1130 f0776b9
add remove temp file for non-windows os
stu1130 c7756df
handle the OSError caused by os.remove
stu1130 971ecf9
Trigger CI
stu1130 1531594
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 4dec67c
Merge branch 'master' into fix_race_condion_download
stu1130 3e799de
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 af5b8ec
use finally to raise failure of atomic replace
stu1130 25e21b6
Merge commit '5314cf4742767319ce356bd5154c6885380e0d5c' into fix_race…
stu1130 f690c69
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 0212e5a
Merge branch 'master' into fix_race_condion_download
stu1130 6af8945
add missing try except block for os.remove
stu1130 a091a97
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 6765862
add retries value to error message
stu1130 f1359be
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 a7b7b12
Merge branch 'master' into fix_race_condion_download
stu1130 e360853
Merge branch 'master' of https://github.com/apache/incubator-mxnet
stu1130 3662d38
Merge branch 'master' into fix_race_condion_download
stu1130 File filter
Filter by extension
Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -22,7 +22,9 @@ | |
'check_sha1', 'download'] | ||
|
||
import os | ||
import sys | ||
import hashlib | ||
import uuid | ||
import warnings | ||
import collections | ||
import weakref | ||
|
@@ -195,6 +197,59 @@ def check_sha1(filename, sha1_hash): | |
return sha1.hexdigest() == sha1_hash | ||
|
||
|
||
if not sys.platform.startswith('win32'): | ||
# refer to https://github.com/untitaker/python-atomicwrites | ||
def _replace_atomic(src, dst): | ||
"""Implement atomic os.replace with linux and OSX. Internal use only""" | ||
try: | ||
os.rename(src, dst) | ||
except OSError: | ||
try: | ||
os.remove(src) | ||
except OSError: | ||
pass | ||
raise OSError( | ||
'Moving downloaded temp file - {}, to {} failed. Please retry the download.'.format(src, dst)) | ||
else: | ||
import ctypes | ||
|
||
_MOVEFILE_REPLACE_EXISTING = 0x1 | ||
# Setting this value guarantees that a move performed as a copy | ||
# and delete operation is flushed to disk before the function returns. | ||
# The flush occurs at the end of the copy operation. | ||
_MOVEFILE_WRITE_THROUGH = 0x8 | ||
_windows_default_flags = _MOVEFILE_WRITE_THROUGH | ||
|
||
text_type = unicode if sys.version_info[0] == 2 else str # noqa | ||
|
||
def _str_to_unicode(x): | ||
"""Handle text decoding. Internal use only""" | ||
if not isinstance(x, text_type): | ||
return x.decode(sys.getfilesystemencoding()) | ||
return x | ||
|
||
def _handle_errors(rv, src): | ||
"""Handle WinError. Internal use only""" | ||
if not rv: | ||
msg = ctypes.FormatError(ctypes.GetLastError()) | ||
# if the MoveFileExW fail, remove the tempfile | ||
try: | ||
os.remove(src) | ||
except OSError: | ||
pass | ||
raise OSError(msg) | ||
|
||
def _replace_atomic(src, dst): | ||
"""Implement atomic os.replace with windows. | ||
refer to https://docs.microsoft.com/en-us/windows/desktop/api/winbase/nf-winbase-movefileexw | ||
The function fails when one of the process(copy, flush, delete) fails. | ||
Internal use only""" | ||
_handle_errors(ctypes.windll.kernel32.MoveFileExW( | ||
_str_to_unicode(src), _str_to_unicode(dst), | ||
_windows_default_flags | _MOVEFILE_REPLACE_EXISTING | ||
), src) | ||
|
||
|
||
def download(url, path=None, overwrite=False, sha1_hash=None, retries=5, verify_ssl=True): | ||
"""Download an given URL | ||
|
||
|
@@ -231,7 +286,7 @@ def download(url, path=None, overwrite=False, sha1_hash=None, retries=5, verify_ | |
fname = os.path.join(path, url.split('/')[-1]) | ||
else: | ||
fname = path | ||
assert retries >= 0, "Number of retries should be at least 0" | ||
assert retries >= 0, 'Number of retries should be at least 0' | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. include the value of retries in the error message. |
||
|
||
if not verify_ssl: | ||
warnings.warn( | ||
|
@@ -242,31 +297,44 @@ def download(url, path=None, overwrite=False, sha1_hash=None, retries=5, verify_ | |
dirname = os.path.dirname(os.path.abspath(os.path.expanduser(fname))) | ||
if not os.path.exists(dirname): | ||
os.makedirs(dirname) | ||
while retries+1 > 0: | ||
while retries + 1 > 0: | ||
# Disable pyling too broad Exception | ||
# pylint: disable=W0703 | ||
try: | ||
print('Downloading %s from %s...'%(fname, url)) | ||
print('Downloading {} from {}...'.format(fname, url)) | ||
r = requests.get(url, stream=True, verify=verify_ssl) | ||
if r.status_code != 200: | ||
raise RuntimeError("Failed downloading url %s"%url) | ||
with open(fname, 'wb') as f: | ||
raise RuntimeError('Failed downloading url {}'.format(url)) | ||
# create uuid for temporary files | ||
random_uuid = str(uuid.uuid4()) | ||
with open('{}.{}'.format(fname, random_uuid), 'wb') as f: | ||
for chunk in r.iter_content(chunk_size=1024): | ||
if chunk: # filter out keep-alive new chunks | ||
f.write(chunk) | ||
# if the target file exists(created by other processes) | ||
# and have the same hash with target file | ||
# delete the temporary file | ||
if not os.path.exists(fname) or (sha1_hash and not check_sha1(fname, sha1_hash)): | ||
# atmoic operation in the same file system | ||
_replace_atomic('{}.{}'.format(fname, random_uuid), fname) | ||
else: | ||
os.remove('{}.{}'.format(fname, random_uuid)) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. should this be protected within try..except? |
||
warnings.warn( | ||
'File {} exists in file system so the downloaded file is deleted'.format(fname)) | ||
if sha1_hash and not check_sha1(fname, sha1_hash): | ||
raise UserWarning('File {} is downloaded but the content hash does not match.'\ | ||
' The repo may be outdated or download may be incomplete. '\ | ||
'If the "repo_url" is overridden, consider switching to '\ | ||
'the default repo.'.format(fname)) | ||
raise UserWarning( | ||
'File {} is downloaded but the content hash does not match.' | ||
' The repo may be outdated or download may be incomplete. ' | ||
'If the "repo_url" is overridden, consider switching to ' | ||
'the default repo.'.format(fname)) | ||
break | ||
except Exception as e: | ||
retries -= 1 | ||
if retries <= 0: | ||
raise e | ||
else: | ||
print("download failed, retrying, {} attempt{} left" | ||
.format(retries, 's' if retries > 1 else '')) | ||
print('download failed due to {}, retrying, {} attempt{} left' | ||
.format(repr(e), retries, 's' if retries > 1 else '')) | ||
|
||
return fname | ||
|
||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
include this part in a finally block