Skip to content
This repository has been archived by the owner on Nov 17, 2023. It is now read-only.

Commit

Permalink
Don't use namespace for pow() function, since it is built into cuda m…
Browse files Browse the repository at this point in the history
…ath library, and cast the second argument so it will find an acceptable form. (#19532)

Remove thrust library override and use default from cuda 11.0.

Fix lint.

Co-authored-by: Joe Evans <[email protected]>
  • Loading branch information
josephevans and Joe Evans authored Nov 14, 2020
1 parent 6ca77dd commit 1f15d98
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 20 deletions.
17 changes: 1 addition & 16 deletions ci/build_windows.py
Original file line number Diff line number Diff line change
Expand Up @@ -157,20 +157,6 @@ def windows_build(args):
mxnet_root = get_mxnet_root()
logging.info("Found MXNet root: {}".format(mxnet_root))

if 'GPU' in args.flavour:
# Get Thrust version to be shipped in Cuda 11, due to flakyness of
# older Thrust versions with MSVC 19 compiler
with remember_cwd():
tmpdirname = tempfile.mkdtemp()
os.chdir(tmpdirname)
r = requests.get('https://github.com/thrust/thrust/archive/1.9.8.zip', allow_redirects=True)
with open('thrust.zip', 'wb') as f:
f.write(r.content)
with zipfile.ZipFile('thrust.zip', 'r') as zip_ref:
zip_ref.extractall('.')
thrust_path = os.path.join(tmpdirname, "thrust-1.9.8")


# cuda thrust / CUB + VS 2019 is flaky: try multiple times if fail
MAXIMUM_TRY = 5
build_try = 0
Expand All @@ -184,8 +170,7 @@ def windows_build(args):
os.chdir(path)
env = os.environ.copy()
if 'GPU' in args.flavour:
env["CXXFLAGS"] = '/FS /MD /O2 /Ob2 /I {}'.format(thrust_path)
env["CUDAFLAGS"] = '-I {}'.format(thrust_path)
env["CXXFLAGS"] = '/FS /MD /O2 /Ob2'
cmd = "\"{}\" && cmake -GNinja {} {}".format(args.vcvars,
CMAKE_FLAGS[args.flavour],
mxnet_root)
Expand Down
8 changes: 4 additions & 4 deletions src/operator/contrib/multi_lamb.cu
Original file line number Diff line number Diff line change
Expand Up @@ -50,10 +50,10 @@ __global__ void KernelStep1(const MultiLAMBKernelParam<DType, MPDType> kernel_pa

MPDType biascorrection1, biascorrection2;
if (bias_correction) {
biascorrection1 = 1.0 -
static_cast<MPDType>(std::pow(beta1, kernel_params.step_count[tensor_id]));
biascorrection2 = 1.0 -
static_cast<MPDType>(std::pow(beta2, kernel_params.step_count[tensor_id]));
biascorrection1 = 1.0 - static_cast<MPDType>(
pow(beta1, static_cast<float>(kernel_params.step_count[tensor_id])));
biascorrection2 = 1.0 - static_cast<MPDType>(
pow(beta2, static_cast<float>(kernel_params.step_count[tensor_id])));
} else {
biascorrection1 = static_cast<MPDType>(1.0);
biascorrection2 = static_cast<MPDType>(1.0);
Expand Down

0 comments on commit 1f15d98

Please sign in to comment.