You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@mxnet.apache.org by ap...@apache.org on 2019/09/30 21:15:44 UTC
[incubator-mxnet] branch master updated (66f1656 -> 810e67c)
This is an automated email from the ASF dual-hosted git repository.
apeforest pushed a change to branch master
in repository https://gitbox.apache.org/repos/asf/incubator-mxnet.git.
from 66f1656 [MXNET-978] Higher Order Gradient Support `arcsinh`, `arccosh`. (#15530)
add 810e67c Add fast implementation of LARS (#16122)
No new revisions were added by this update.
Summary of changes:
python/mxnet/optimizer/optimizer.py | 271 ++++++++++++++++-
src/operator/contrib/multi_lars-inl.h | 100 +++++++
src/operator/contrib/multi_lars.cc | 56 ++++
src/operator/{numpy/np_broadcast_reduce_op_index.cu => contrib/multi_lars.cu} | 12 +-
src/operator/contrib/multi_sum_sq-inl.h | 100 +++++++
src/operator/contrib/multi_sum_sq.cc | 84 ++++++
src/operator/contrib/multi_sum_sq.cu | 173 +++++++++++
src/operator/contrib/preloaded_multi_sgd-inl.h | 332 +++++++++++++++++++++
src/operator/contrib/preloaded_multi_sgd.cc | 245 +++++++++++++++
src/operator/contrib/{amp_graph_pass.cc => preloaded_multi_sgd.cu} | 44 +--
tests/{python/tensorrt/lenet5_train.py => nightly/test_optimizer.py} | 67 +++--
tests/python/gpu/test_operator_gpu.py | 153 ++++++++++
12 files changed, 1567 insertions(+), 70 deletions(-)
create mode 100644 src/operator/contrib/multi_lars-inl.h
create mode 100644 src/operator/contrib/multi_lars.cc
copy src/operator/{numpy/np_broadcast_reduce_op_index.cu => contrib/multi_lars.cu} (77%)
create mode 100644 src/operator/contrib/multi_sum_sq-inl.h
create mode 100644 src/operator/contrib/multi_sum_sq.cc
create mode 100644 src/operator/contrib/multi_sum_sq.cu
create mode 100644 src/operator/contrib/preloaded_multi_sgd-inl.h
create mode 100755 src/operator/contrib/preloaded_multi_sgd.cc
copy src/operator/contrib/{amp_graph_pass.cc => preloaded_multi_sgd.cu} (55%)
copy tests/{python/tensorrt/lenet5_train.py => nightly/test_optimizer.py} (58%)