This is an automated email from the ASF dual-hosted git repository.

nswamy pushed a change to branch fit-api
in repository https://gitbox.apache.org/repos/asf/incubator-mxnet.git.


    from c2e2f80  [MXNET-1344, 1346][FIT API] Retrieve Batch size and Logging 
verbose support for Gluon fit() API (#14587)
     new c35a82c  Fix shape inference pass (#14153)
     new 7dc7db0  Relaxing type requirements for reshape_like op (#14325)
     new 778e495  Updated news.md with the latest mkldnn submodule version 
(#14298)
     new d014ff3  Enhance gpu quantization (#14094)
     new ae2dda2  Bypass ThreadedEngine in test_operator_gpu.py:test_convolution_multiple_streams. (#14338)
     new ae4703b  Limit workspace for cudnnGet results (#14326)
     new 8287656  [MXNET-1331] Removal of non-MXNET classes from JAR (#14303)
     new f0cd148  fix render issue in NDArray linalg docs (#14258)
     new e64cfaa  Add more support for mxnet_to_coreml (#14222)
     new f6dc492   Add default parameters for Scala NDArray.arange (#13816)
     new b5e0890  Register fake grad to subgraph and quantized operators 
(#14275)
     new d58764c  corrected a spellign (#14247)
     new 0f96e66  [MXNET-1324] Add NaiveRunGraph to imperative utils (#14192)
     new e14e8be  Updates build_lib.sh to copy the cub library license (#14347)
     new 7e14eb4  Add MKLDNN headers to pip package (#14339)
     new 1b4e080  compatibility with opencv4 (#14313)
     new 43d87b0  [MXNET-1291] solve pylint errors in examples with issue 
no.12205 (#13848)
     new 9a6cd58  #14199: catch subprocess.CalledProcessError in get_gpus() 
(#14212)
     new 2447f80  print error message for mxnet::cpp::Operator::Invoke when 
failed (#14318)
     new 6b2b44a  Bulked op segments to allow Variable nodes (#14200)
     new 8658a1b  Fixes #14181, validate model output shape for ObjectDetector. 
(#14215)
     new c9d57bf  Optimizer MXKVStoreUpdater bug fix in serializeState method 
(#14337)
     new 0b3a965  Installs qemu pip requirements from qemu requirements file 
(#14355)
     new d503bb4  Optimize NMS part 2 (#14352)
     new 1bb78eb  add exception (#14362)
     new f8eeab7  MKLDNN based Quantized FullyConnected Operator and its fusion 
(#14128)
     new a26b3fc  add pos_weight for SigmoidBinaryCrossEntropyLoss (#13612)
     new 0c51c69  Julia: split symbolic-node.jl into several snippets (#14024)
     new 16eb81a  Fix NaN value comparisons in relu, max and min ops (#14262)
     new 897bf59  [clojure-package][wip] add `->nd-vec` function in 
`ndarray.clj` (#14308)
     new 43b03ab  support leading dimension of -1 in ravel/unravel (#14356)
     new d5bf85b  fix engine crash in shutdown phase (#14382)
     new c152c39  Flaky test https://github.com/apache/incubator-mxnet/issues/14189 (#14190)
     new 25560b3  Julia: rename `mx.clip` to `clamp` for `NDArray` (#14027)
     new d0a2f8d  add backgroud class in box_nms (#14058)
     new 19f05b0  CI Changes for Codified Windows AMIs (#14336)
     new f981f4e  [Clojure] Helper function for n-dim vector to ndarray (#14305)
     new 3e94618  [DOC] fix sym.arange doc (#14237)
     new 95baafb  Julia: add binding for runtime feature detection (#13992)
     new c45e9ac  [MXNET-1093] Add python3 Docker images for each MXNet release 
(#12791)
     new 438aa6e  Enable bulking test on windows (#14392)
     new 38d3151  [MXNET-1327] Allow RNN Layers to be initialized to fp16 
(#14219)
     new 86601d7  Disables flaky test_operator.test_sgld test (#14410)
     new dc1238b  Fix relative difference scala (#14417)
     new 4f1e22b  Cudnn conv dgrad algo filtering (#14310)
     new 692f8fb  [MXNET-1226] add Docs update for MXNet Java (#14395)
     new 361acc9  fix Makefile (#14424)
     new 36d84c8  [MXNET-1291] solve pylint errors in examples with issue 
no.12205 (#13938)
     new 6599756  Disables flaky TestStochasticTiming_2D test (#14412)
     new 2b315c1  Add dtype visualization to plot_network (#14066)
     new 207c6c1  Support multi-threading for Custom Operator (#14363)
     new 506bc77  Fix entropy for uint8 (#14150)
     new c73a3c4  what's new - add 1.4.0 release (#14435)
     new 5809c2d  moveaxis operator now accepts negative indices and sequence 
of ints as well. (#14321)
     new 314a41a  Add repr for SymbolBlock (#14423)
     new c47d8c8  temporarily disable integ tests with a dependency on origami 
repo (#14448)
     new 09a4d64  fix OOM error during resource allocation (#14444)
     new 711b8b5  Correct update count with Gluon trainer and 
update_on_kvstore=False (#14377)
     new a0c4177  Update MKL-DNN to v0.18 release (was: fix the Dense layer 
issue) (#13668)
     new 48131ed  Speedup _contrib_index_copy (#14359)
     new 7ffa150  Fix crashes on visualization (#14425)
     new f1103ad  add contributors from intel (#14455)
     new ffc0708  begin=end not a valid input (#14403)
     new dbc86a7  Fix memory leak for size-zero ndarray (#14365)
     new 56c0d8f  [Doc] Start the tutorials for MKL-DNN backend (#14202)
     new 73b9890  Enforce determinism for backwards compatibility checker 
(#14463)
     new adc0ce7  [MKL-DNN] Enable s8 support for inner product and 3d input 
with flatten=false (#14466)
     new 73fe286  Fixes the test_sgld (#14473)
     new 708931a  Revert "Fix memory leak for size-zero ndarray (#14365)" 
(#14477)
     new 4b256aa  fix custom operation in fork (#14451)
     new d0aab5e  Change Straight Dope to Dive into Deep Learning (#14465)
     new 2e218fc  Added link to landing page for Java examples (#14481)
     new 199c3bb  Fixes test_operator_gpu.test_multinomial_generator (#14475)
     new 07901c3  [MXNET-949] Module API to Gluon API tutorial (#12542)
     new a211550  Fixed tutorial warnings (#14472)
     new 308c4e6  Add examples of running MXNet with Horovod (#14286)
     new ce5bc19  Fixes for CI downloads (#14504)
     new 0ab1da2  Enhance PartitionGraph (#14277)
     new f1354b4  [MXNET-1285] Draw bounding box with Scala/Java Image API 
(#14474)
     new dee351b  reenable the test (#14483)
     new a350661  Fix script retrieval (#14519)
     new 890b186  add filter to warnings (#14532)
     new a41a643  Adds context parameter to check_rnn_layer_forward calls in 
test_lstmp (#14529)
     new c4b8d30  Performance improving for MKL-DNN Quantized FullyConnected 
(#14528)
     new db55051  speedup SequenceMask on GPU (#14445)
     new a310b44  Tidy up storage allocation and deallocation (#14480)
     new 0c3d11d  Memory fixes. Resolves #10867, and resolves #14080 (#14372)
     new a3c11da  Remove unnecessary "also" in README.md (#14543)
     new 0f0b2dd  [clojure]: add comp-metric based on CompositeEvalMetric 
(#14553)
     new c95afee  Chouffe/clojure fix tests (#14531)
     new e761e2f  [clojure][image] add draw-bounding-box interop (#14533)
     new b4583cb  fix tests (#14565)
     new 25cdb1c  Enhance subgraph API (#14113)
     new ee341b8  Do not touch GPU 0 during ReleaseAll (#14550)
     new ea4f571  Change CUB submodule to track Nvidia CUB project. (#13322)
     new e444341  Fixes static build script for cub directory rename (#14578)
     new e5aadca  example/ssd/evaluate/eval_metric.py (#14561)
     new a4b85a5  Support SyncBatchNorm5D (#14542)
     new 984d70f  Disable Flaky Test test_poisson_generator (#14540)
     new b6a767d  [MXNET-1357] Fix the cpp-examples to add exception handling 
(#14441)
     new 821502a  Updates gpu tests to use CUDNN_VERSION supplied by the 
environment but default to 7.0.3 if not set (#14595)
     new 04979b4  fix build cpp examples option (#14562)
     new deeba00  Fix flaky test poisson generator & 
test_negative_binomial_generator (#14571)
     new 3a5dc6e  Fixing unintentional variable overloading (#14438)
     new 8ddede0  [MXNET-1379] update reshape operator (#14600)
     new 3414b06  Updated documentation about nightly tests (#14493)
     new d843a85  set _scale in Trainer using optimizer rescale_grad (#14593)
     new 49c1ccc  Add Gluon Transformer Crop (#14259)
     new 996d2b1  fix quantize graph pass (#14605)
     new 943b734  GELU (#14449)
     new 736be66  added note about cuda9.2 requirement (#14140)
     new 6b800e4  Add BERT QA Scala/Java example (#14592)

The 9463 revisions listed above as "new" are entirely new to this
repository and will be described in separate emails.  The revisions
listed as "add" were already present in the repository and have only
been added to this reference.


Summary of changes:
 .gitmodules                                        |   6 +-
 3rdparty/cub                                       |   1 -
 3rdparty/mkldnn                                    |   2 +-
 3rdparty/nvidia_cub                                |   1 +
 CMakeLists.txt                                     |   5 +-
 CONTRIBUTORS.md                                    |  23 +-
 LICENSE                                            |   4 +-
 MKLDNN_README.md                                   | 314 +------
 Makefile                                           |  32 +-
 NEWS.md                                            |   4 +-
 R-package/tests/testthat/get_data.R                |  11 +-
 R-package/vignettes/CatsDogsFinetune.Rmd           |   4 +-
 .../classifyRealImageWithPretrainedModel.Rmd       |   2 +-
 README.md                                          |   7 +-
 benchmark/python/control_flow/rnn.py               |   7 +-
 ci/build_windows.py                                |   6 +-
 ci/docker/install/ubuntu_mklml.sh                  |   2 +-
 ci/docker/qemu/runtime_functions.py                |   4 +-
 ci/docker/qemu/vmcontrol.py                        |   1 +
 ci/docker/runtime_functions.sh                     |  12 +-
 ci/jenkins/Jenkins_steps.groovy                    |  32 +-
 ci/jenkins/Jenkinsfile_windows_cpu                 |  10 +-
 ci/jenkins/Jenkinsfile_windows_gpu                 |  10 +-
 ci/qemu/README.md                                  |   4 +
 ci/qemu/test_requirements.txt                      |   3 +
 ci/windows/test_py2_cpu.ps1                        |   6 +-
 ci/windows/test_py2_gpu.ps1                        |  10 +-
 ci/windows/test_py3_cpu.ps1                        |   6 +-
 ci/windows/test_py3_gpu.ps1                        |  10 +-
 cmake/DownloadMKLML.cmake                          |  14 +-
 contrib/clojure-package/integration-tests.sh       |   2 +-
 .../src/org/apache/clojure_mxnet/eval_metric.clj   |  18 +-
 .../src/org/apache/clojure_mxnet/image.clj         |  66 ++
 .../src/org/apache/clojure_mxnet/ndarray.clj       |  79 +-
 .../src/org/apache/clojure_mxnet/util.clj          |  37 +-
 .../clojure-package/test/dev/generator_test.clj    |  87 +-
 .../org/apache/clojure_mxnet/eval_metric_test.clj  |   9 +
 .../org/apache/clojure_mxnet/executor_test.clj     |   8 +-
 .../clojure_mxnet/infer/imageclassifier_test.clj   |  12 +-
 .../test/org/apache/clojure_mxnet/module_test.clj  |  38 +-
 .../test/org/apache/clojure_mxnet/ndarray_test.clj |  36 +-
 .../org/apache/clojure_mxnet/operator_test.clj     |  12 +-
 .../test/org/apache/clojure_mxnet/symbol_test.clj  |  10 +-
 .../test/org/apache/clojure_mxnet/util_test.clj    |  31 +-
 cpp-package/CMakeLists.txt                         |   2 +-
 cpp-package/example/alexnet.cpp                    |  77 +-
 cpp-package/example/charRNN.cpp                    |   3 +
 cpp-package/example/feature_extract/run.sh         |   7 +-
 cpp-package/example/get_data.sh                    |  61 +-
 cpp-package/example/googlenet.cpp                  |   2 +
 cpp-package/example/inception_bn.cpp               |  37 +-
 .../inference/unit_test_inception_inference.sh     |   4 +-
 cpp-package/example/lenet.cpp                      |   3 +
 cpp-package/example/lenet_with_mxdataiter.cpp      |  34 +-
 cpp-package/example/mlp.cpp                        |   3 +
 cpp-package/example/mlp_cpu.cpp                    |   2 +
 cpp-package/example/mlp_csv.cpp                    |   2 +
 cpp-package/example/mlp_gpu.cpp                    |   2 +
 cpp-package/example/resnet.cpp                     |  57 +-
 cpp-package/example/test_score.cpp                 |   4 +-
 cpp-package/example/utils.h                        |   9 +
 cpp-package/include/mxnet-cpp/operator.hpp         |   8 +-
 docker/docker-python/Dockerfile.mxnet.python.cpu   |  11 +-
 .../docker-python/Dockerfile.mxnet.python.cpu.mkl  |  11 +-
 .../docker-python/Dockerfile.mxnet.python.gpu.cu80 |  11 +-
 .../Dockerfile.mxnet.python.gpu.cu80.mkl           |  11 +-
 .../docker-python/Dockerfile.mxnet.python.gpu.cu90 |  11 +-
 .../Dockerfile.mxnet.python.gpu.cu90.mkl           |  11 +-
 .../docker-python/Dockerfile.mxnet.python.gpu.cu92 |  11 +-
 .../Dockerfile.mxnet.python.gpu.cu92.mkl           |  11 +-
 ...net.python.cpu => Dockerfile.mxnet.python3.cpu} |  11 +-
 ...on.cpu.mkl => Dockerfile.mxnet.python3.cpu.mkl} |  11 +-
 ....gpu.cu80 => Dockerfile.mxnet.python3.gpu.cu80} |  11 +-
 ...0.mkl => Dockerfile.mxnet.python3.gpu.cu80.mkl} |  11 +-
 ....gpu.cu90 => Dockerfile.mxnet.python3.gpu.cu90} |  11 +-
 ...0.mkl => Dockerfile.mxnet.python3.gpu.cu90.mkl} |  11 +-
 ....gpu.cu92 => Dockerfile.mxnet.python3.gpu.cu92} |  11 +-
 ...2.mkl => Dockerfile.mxnet.python3.gpu.cu92.mkl} |  11 +-
 docker/docker-python/README.md                     |  58 +-
 docker/docker-python/build_python_dockerfile.sh    | 178 +++-
 docs/_static/mxnet-theme/navbar.html               |   4 +-
 docs/api/perl/index.md                             |   2 +-
 docs/community/ecosystem.md                        |   2 +-
 docs/faq/env_var.md                                |  11 +-
 docs/faq/perf.md                                   |   2 +-
 docs/gluon/index.md                                |  14 +-
 docs/install/index.md                              |   6 +-
 docs/install/java_setup.md                         |  32 +-
 docs/install/ubuntu_setup.md                       |   2 +-
 docs/install/windows_setup.md                      |   4 +-
 docs/tutorials/c++/subgraphAPI.md                  |  40 +-
 docs/tutorials/gluon/customop.md                   |  20 +
 .../gluon/gluon_from_experiment_to_deployment.md   |   4 +-
 docs/tutorials/gluon/hybrid.md                     |   8 +-
 docs/tutorials/gluon/save_load_params.md           |   5 +-
 docs/tutorials/index.md                            |   9 +-
 docs/tutorials/java/mxnet_java_on_intellij.md      |  27 +-
 .../tutorials/mkldnn/MKLDNN_README.md              |  14 +-
 docs/tutorials/{vision => mkldnn}/index.md         |   0
 docs/tutorials/onnx/fine_tuning_gluon.md           |   5 +-
 docs/tutorials/onnx/inference_on_onnx_model.md     |   6 +-
 docs/tutorials/python/matrix_factorization.md      | 289 ------
 docs/tutorials/python/module_to_gluon.md           | 365 ++++++++
 example/README.md                                  |   1 +
 example/bayesian-methods/bdk_demo.py               |   3 +-
 example/caffe/caffe_net.py                         |   4 +-
 example/caffe/train_model.py                       |   4 +-
 example/capsnet/capsulenet.py                      |   7 +-
 .../data_helpers.py                                |   3 +-
 .../cnn_chinese_text_classification/text_cnn.py    |   9 +-
 example/cnn_text_classification/data_helpers.py    |   8 +-
 example/cnn_text_classification/text_cnn.py        | 162 +++-
 example/ctc/captcha_generator.py                   |  45 +-
 example/ctc/ctc_metrics.py                         |  20 +-
 example/ctc/hyperparams.py                         |   6 +-
 example/ctc/lstm_ocr_infer.py                      |   7 +-
 example/ctc/lstm_ocr_train.py                      |   4 +-
 example/ctc/multiproc_data.py                      |  35 +-
 example/ctc/ocr_iter.py                            |  17 +-
 example/ctc/ocr_predict.py                         |  22 +-
 example/deep-embedded-clustering/autoencoder.py    |  29 +-
 example/deep-embedded-clustering/data.py           |   8 +-
 example/deep-embedded-clustering/dec.py            |  31 +-
 example/deep-embedded-clustering/model.py          |   3 +-
 example/distributed_training-horovod/README.md     | 201 +++++
 .../distributed_training-horovod/gluon_mnist.py    | 186 ++++
 .../distributed_training-horovod/module_mnist.py   | 162 ++++
 .../resnet50_imagenet.py                           | 453 ++++++++++
 example/distributed_training/cifar10_dist.py       |  78 +-
 example/gluon/dc_gan/dcgan.py                      |  67 +-
 example/gluon/lstm_crf/lstm_crf.py                 |  62 +-
 example/image-classification/README.md             |   2 +-
 example/image-classification/common/util.py        |   8 +-
 example/quantization/imagenet_gen_qsym_mkldnn.py   |   7 +-
 example/recommenders/matrix_fact.py                |   8 +-
 example/ssd/evaluate/eval_metric.py                |   2 +-
 include/mxnet/c_api_test.h                         |   2 +-
 include/mxnet/imperative.h                         |  23 +-
 include/mxnet/ndarray.h                            |   8 +-
 julia/NEWS.md                                      |   7 +-
 julia/deps/build.jl                                |   7 +-
 julia/models/Inception/get.sh                      |   2 +-
 julia/src/MXNet.jl                                 |   3 +-
 julia/src/base.jl                                  |   7 +-
 julia/src/deprecated.jl                            |   8 +-
 julia/src/ndarray/arithmetic.jl                    |  52 +-
 julia/src/ndarray/remap.jl                         |  12 +
 julia/src/optimizer.jl                             |   2 +-
 julia/src/runtime.jl                               |  76 ++
 julia/src/symbolic-node.jl                         | 987 +--------------------
 julia/src/symbolic-node/arithmetic.jl              | 127 +++
 julia/src/symbolic-node/array.jl                   | 122 +++
 julia/src/symbolic-node/autodiff.jl                | 178 ++++
 julia/src/symbolic-node/io.jl                      |  58 ++
 julia/src/symbolic-node/op.jl                      | 444 +++++++++
 julia/src/symbolic-node/show.jl                    |  62 ++
 julia/src/symbolic-node/type.jl                    | 123 +++
 julia/test/unittest/ndarray.jl                     |  12 +-
 make/config.mk                                     |   4 +
 make/crosscompile.jetson.mk                        |   4 +
 make/maven/maven_darwin_mkl.mk                     |   4 +
 make/maven/maven_linux_cu90mkl.mk                  |   4 +
 make/maven/maven_linux_cu92mkl.mk                  |   4 +
 make/maven/maven_linux_mkl.mk                      |   4 +
 make/osx.mk                                        |   4 +
 make/pip/pip_darwin_cpu.mk                         |   4 +
 make/pip/pip_darwin_mkl.mk                         |   4 +
 make/pip/pip_linux_cpu.mk                          |   4 +
 make/pip/pip_linux_cu100.mk                        |   4 +
 make/pip/pip_linux_cu100mkl.mk                     |   4 +
 make/pip/pip_linux_cu75.mk                         |   4 +
 make/pip/pip_linux_cu75mkl.mk                      |   4 +
 make/pip/pip_linux_cu80.mk                         |   4 +
 make/pip/pip_linux_cu80mkl.mk                      |   4 +
 make/pip/pip_linux_cu90.mk                         |   4 +
 make/pip/pip_linux_cu90mkl.mk                      |   4 +
 make/pip/pip_linux_cu91.mk                         |   4 +
 make/pip/pip_linux_cu91mkl.mk                      |   4 +
 make/pip/pip_linux_cu92.mk                         |   4 +
 make/pip/pip_linux_cu92mkl.mk                      |   4 +
 make/pip/pip_linux_mkl.mk                          |   4 +
 make/readthedocs.mk                                |   4 +
 matlab/get_inception_model.sh                      |   2 +-
 mkldnn.mk                                          |   5 +
 perl-package/AI-MXNet/lib/AI/MXNet.pm              |  12 +-
 python/mxnet/contrib/quantization.py               |  12 +-
 python/mxnet/gluon/block.py                        |   8 +
 python/mxnet/gluon/data/vision/transforms.py       |  61 ++
 python/mxnet/gluon/loss.py                         |  85 +-
 python/mxnet/gluon/nn/activations.py               |  21 +-
 python/mxnet/gluon/rnn/rnn_layer.py                |  59 +-
 python/mxnet/gluon/trainer.py                      |   8 +-
 python/mxnet/image/image.py                        |   2 +-
 python/mxnet/initializer.py                        |  13 +
 python/mxnet/ndarray/ndarray.py                    |  40 +-
 python/mxnet/optimizer/optimizer.py                |  17 +-
 python/mxnet/symbol/symbol.py                      |  10 +-
 python/mxnet/test_utils.py                         |  13 +-
 python/mxnet/util.py                               |  16 +
 python/mxnet/visualization.py                      |  71 +-
 scala-package/.gitignore                           |   1 +
 .../assembly/src/main/assembly/assembly.xml        |   2 +
 .../src/main/scala/org/apache/mxnet/Executor.scala |  47 +-
 .../src/main/scala/org/apache/mxnet/Image.scala    |  54 ++
 .../src/main/scala/org/apache/mxnet/LibInfo.scala  |   5 +-
 .../src/main/scala/org/apache/mxnet/NDArray.scala  |  21 +-
 .../main/scala/org/apache/mxnet/Optimizer.scala    |  36 +-
 .../scala/org/apache/mxnet/ResourceScope.scala     |  21 +-
 .../src/main/scala/org/apache/mxnet/Symbol.scala   |  21 +-
 .../scala/org/apache/mxnet/javaapi/Image.scala     |  46 +-
 .../org/apache/mxnet/{ => javaapi}/Layout.scala    |  13 +-
 .../mxnet/module/DataParallelExecutorGroup.scala   |  11 +-
 .../scala/org/apache/mxnet/optimizer/Adam.scala    | 101 +--
 .../java/org/apache/mxnet/javaapi/ImageTest.java   |  20 +-
 .../test/scala/org/apache/mxnet/CheckUtils.scala   |   4 +-
 .../test/scala/org/apache/mxnet/ImageSuite.scala   |  21 +
 .../test/scala/org/apache/mxnet/NDArraySuite.scala |  35 +-
 .../org/apache/mxnet/ResourceScopeSuite.scala      |  33 +
 scala-package/deploy/src/main/deploy/deploy.xml    |  10 +
 scala-package/examples/pom.xml                     |   5 +
 .../get_resnet_data.sh => bert/get_bert_data.sh}   |  18 +-
 .../bert/run_bert_qa_example.sh}                   |   6 +-
 .../javaapi/infer/bert/BertDataParser.java         | 126 +++
 .../mxnetexamples/javaapi/infer/bert/BertQA.java   | 148 +++
 .../mxnetexamples/javaapi/infer/bert/README.md     | 103 +++
 .../javaapi/infer/objectdetector/README.md         |   2 +-
 .../infer/objectdetector/SSDClassifierExample.java |  41 +-
 .../javaapi/infer/predictor/BertExampleTest.java   |  71 ++
 .../org/apache/mxnet/infer/ImageClassifier.scala   |   2 +
 .../org/apache/mxnet/infer/ObjectDetector.scala    |  27 +-
 .../scala/org/apache/mxnet/infer/Predictor.scala   |   7 +
 .../mxnet/infer/javaapi/ObjectDetectorOutput.scala |   4 +-
 .../infer/javaapi/ObjectDetectorOutputTest.java    |   4 +-
 scala-package/mxnet-demo/java-demo/README.md       |   2 +
 .../main/native/org_apache_mxnet_native_c_api.cc   |  13 +-
 .../main/native/org_apache_mxnet_native_c_api.h    |   8 +-
 src/c_api/c_api.cc                                 |   1 +
 src/c_api/c_api_symbolic.cc                        |  17 +-
 src/c_api/c_api_test.cc                            |  21 +-
 src/engine/threaded_engine.h                       |   9 +
 src/executor/graph_executor.cc                     | 433 +++++----
 src/executor/graph_executor.h                      |   6 +-
 src/executor/infer_graph_attr_pass.cc              |  76 +-
 src/imperative/cached_op.cc                        | 115 ++-
 src/imperative/cached_op.h                         |  11 +-
 src/imperative/imperative.cc                       |   3 +-
 src/imperative/imperative_utils.cc                 | 235 +++--
 src/imperative/imperative_utils.h                  |  15 +-
 src/initialize.cc                                  |   5 +
 src/io/image_aug_default.cc                        |   1 +
 src/io/image_det_aug_default.cc                    |   1 +
 src/io/image_io.cc                                 |   1 +
 src/io/opencv_compatibility.h                      |  59 ++
 src/ndarray/ndarray.cc                             |   8 +-
 src/operator/contrib/bounding_box-common.h         |  30 +
 src/operator/contrib/bounding_box-inl.cuh          |  70 +-
 src/operator/contrib/bounding_box-inl.h            |  76 +-
 src/operator/contrib/bounding_box.cc               |   8 +-
 src/operator/contrib/index_copy-inl.h              |  93 +-
 src/operator/contrib/index_copy.cc                 | 120 +++
 src/operator/contrib/index_copy.cu                 | 110 ++-
 src/operator/contrib/sync_batch_norm-inl.h         |  31 +-
 src/operator/custom/custom-inl.h                   |  72 +-
 src/operator/custom/custom.cc                      |   5 -
 src/operator/image/crop-inl.h                      | 190 ++++
 src/operator/image/{resize.cc => crop.cc}          |  76 +-
 src/operator/leaky_relu-inl.h                      |  21 +-
 src/operator/mshadow_op.h                          |  63 +-
 src/operator/nn/batch_norm.cu                      |   4 +-
 src/operator/nn/cudnn/cudnn_batch_norm-inl.h       |  14 +-
 src/operator/nn/cudnn/cudnn_convolution-inl.h      |  31 +-
 src/operator/nn/cudnn/cudnn_deconvolution-inl.h    |  24 +-
 src/operator/nn/fully_connected-inl.h              |   6 +
 src/operator/nn/fully_connected.cc                 |  10 +-
 src/operator/nn/mkldnn/mkldnn_base.cc              |   2 +
 .../nn/mkldnn/mkldnn_fully_connected-inl.h         | 133 +++
 src/operator/nn/mkldnn/mkldnn_fully_connected.cc   | 343 ++++---
 src/operator/operator_tune.cc                      |   2 +
 src/operator/quantization/dequantize.cc            |   3 +
 .../mkldnn/mkldnn_quantized_fully_connected.cc     | 118 +++
 ...tized_pooling.cc => mkldnn_quantized_ops-inl.h} |  35 +-
 src/operator/quantization/quantize-inl.h           |   4 +
 src/operator/quantization/quantize.cc              |   3 +
 src/operator/quantization/quantize_graph_pass.cc   |  12 +-
 src/operator/quantization/quantize_v2-inl.h        |   4 +
 src/operator/quantization/quantize_v2.cc           |   3 +
 src/operator/quantization/quantized_concat.cc      |   3 +
 src/operator/quantization/quantized_conv.cc        |   3 +
 src/operator/quantization/quantized_flatten.cc     |   3 +
 .../quantization/quantized_fully_connected.cc      | 144 ++-
 .../quantization/quantized_fully_connected.cu      |   5 +
 src/operator/quantization/quantized_pooling.cc     |   3 +
 src/operator/quantization/requantize.cc            |   3 +
 src/operator/sequence_mask-inl.h                   |  79 +-
 src/operator/sequence_mask.cc                      |  64 ++
 src/operator/sequence_mask.cu                      |  59 ++
 .../{partition_graph.cc => build_subgraph.cc}      | 387 ++++----
 ...property.cc => default_subgraph_property_v2.cc} |  25 +-
 src/operator/subgraph/mkldnn/mkldnn_conv.cc        |   3 +
 ...rty.cc => mkldnn_conv_post_quantize_property.h} |  37 +-
 ...dnn_conv_property.cc => mkldnn_conv_property.h} |  25 +-
 src/operator/subgraph/mkldnn/mkldnn_fc.cc          | 448 ++++++++++
 .../mkldnn/mkldnn_fc_post_quantize_property.h      | 215 +++++
 src/operator/subgraph/mkldnn/mkldnn_fc_property.h  | 190 ++++
 .../mkldnn_post_quantize_align_scale_property.h    | 164 ++++
 ...ldnn_conv-inl.h => mkldnn_subgraph_property.cc} |  25 +-
 src/operator/subgraph/subgraph_property.h          | 223 ++++-
 src/operator/tensor/elemwise_unary_op_basic.cc     |  11 +-
 src/operator/tensor/init_op.h                      |   5 +
 src/operator/tensor/la_op.cc                       |  16 +-
 src/operator/tensor/matrix_op-inl.h                |  65 +-
 src/operator/tensor/ravel.cc                       |   6 +-
 src/operator/tensor/ravel.h                        |   3 +-
 src/resource.cc                                    |  30 +-
 src/storage/cpu_device_storage.h                   |  25 +-
 src/storage/cpu_shared_storage_manager.h           |   7 +-
 src/storage/gpu_device_storage.h                   |  19 +-
 src/storage/naive_storage_manager.h                |   2 +-
 src/storage/pinned_memory_storage.h                |  21 +-
 src/storage/pooled_storage_manager.h               |  36 +-
 src/storage/storage.cc                             |  12 +-
 src/storage/storage_manager.h                      |  11 +-
 tests/cpp/include/test_util.h                      |   8 +-
 tests/cpp/operator/batchnorm_test.cc               |   4 +-
 tests/cpp/operator/mkldnn_test.cc                  |   2 +-
 tests/cpp/storage/storage_test.cc                  |  15 +
 tests/nightly/README.md                            |  10 +-
 .../model_backward_compat_checker.sh               |   3 +-
 .../train_mxnet_legacy_models.sh                   |   1 +
 tests/python/gpu/test_gluon_gpu.py                 | 279 +++---
 tests/python/gpu/test_kvstore_gpu.py               |   6 +-
 tests/python/gpu/test_operator_gpu.py              | 112 ++-
 tests/python/mkl/test_subgraph.py                  | 298 ++++++-
 tests/python/quantization/test_quantization.py     | 197 +++-
 tests/python/unittest/common.py                    |  50 ++
 tests/python/unittest/test_contrib_operator.py     |  41 +-
 tests/python/unittest/test_dynamic_shape.py        |  54 ++
 tests/python/unittest/test_gluon.py                | 143 ++-
 tests/python/unittest/test_gluon_data_vision.py    |  75 +-
 tests/python/unittest/test_gluon_rnn.py            |  98 +-
 tests/python/unittest/test_gluon_trainer.py        |  21 +-
 tests/python/unittest/test_loss.py                 |  35 +-
 tests/python/unittest/test_ndarray.py              | 101 ++-
 tests/python/unittest/test_operator.py             | 226 ++++-
 tests/python/unittest/test_optimizer.py            |   4 +-
 tests/python/unittest/test_random.py               |  10 +-
 tests/python/unittest/test_subgraph_op.py          |  89 +-
 tests/python/unittest/test_symbol.py               |  13 +
 tests/python/unittest/test_viz.py                  |   2 +
 tests/requirements.txt                             |   3 +
 tests/tutorials/test_sanity_tutorials.py           |   2 +
 tests/tutorials/test_tutorials.py                  |   7 +-
 tools/bandwidth/test_measure.py                    |  10 +-
 tools/coreml/converter/_layers.py                  |  46 +-
 tools/coreml/converter/_mxnet_converter.py         |   3 +
 tools/coreml/test/test_mxnet_converter.py          |  67 ++
 tools/dependencies/README.md                       |   2 +-
 tools/dependencies/curl.sh                         |   4 +-
 tools/dependencies/eigen.sh                        |   4 +-
 tools/dependencies/libpng.sh                       |   4 +-
 tools/dependencies/libtiff.sh                      |   4 +-
 tools/dependencies/libturbojpeg.sh                 |   4 +-
 tools/dependencies/libz.sh                         |   4 +-
 tools/dependencies/lz4.sh                          |   4 +-
 tools/dependencies/make_shared_dependencies.sh     |  28 +-
 tools/dependencies/openblas.sh                     |   4 +-
 tools/dependencies/opencv.sh                       |   4 +-
 tools/dependencies/openssl.sh                      |   4 +-
 tools/dependencies/protobuf.sh                     |   4 +-
 tools/dependencies/zmq.sh                          |   4 +-
 tools/im2rec.cc                                    |   1 +
 tools/pip/MANIFEST.in                              |   1 +
 tools/pip/setup.py                                 |   2 +
 tools/staticbuild/build_lib.sh                     |   4 +
 374 files changed, 11163 insertions(+), 4292 deletions(-)
 delete mode 160000 3rdparty/cub
 create mode 160000 3rdparty/nvidia_cub
 create mode 100644 ci/qemu/test_requirements.txt
 copy docker/docker-python/{Dockerfile.mxnet.python.cpu => Dockerfile.mxnet.python3.cpu} (81%)
 copy docker/docker-python/{Dockerfile.mxnet.python.cpu.mkl => Dockerfile.mxnet.python3.cpu.mkl} (81%)
 copy docker/docker-python/{Dockerfile.mxnet.python.gpu.cu80 => Dockerfile.mxnet.python3.gpu.cu80} (81%)
 copy docker/docker-python/{Dockerfile.mxnet.python.gpu.cu80.mkl => Dockerfile.mxnet.python3.gpu.cu80.mkl} (81%)
 copy docker/docker-python/{Dockerfile.mxnet.python.gpu.cu90 => Dockerfile.mxnet.python3.gpu.cu90} (81%)
 copy docker/docker-python/{Dockerfile.mxnet.python.gpu.cu90.mkl => Dockerfile.mxnet.python3.gpu.cu90.mkl} (81%)
 copy docker/docker-python/{Dockerfile.mxnet.python.gpu.cu92 => Dockerfile.mxnet.python3.gpu.cu92} (81%)
 copy docker/docker-python/{Dockerfile.mxnet.python.gpu.cu92.mkl => Dockerfile.mxnet.python3.gpu.cu92.mkl} (81%)
 copy MKLDNN_README.md => docs/tutorials/mkldnn/MKLDNN_README.md (92%)
 copy docs/tutorials/{vision => mkldnn}/index.md (100%)
 delete mode 100644 docs/tutorials/python/matrix_factorization.md
 create mode 100644 docs/tutorials/python/module_to_gluon.md
 create mode 100644 example/distributed_training-horovod/README.md
 create mode 100644 example/distributed_training-horovod/gluon_mnist.py
 create mode 100644 example/distributed_training-horovod/module_mnist.py
 create mode 100644 example/distributed_training-horovod/resnet50_imagenet.py
 create mode 100644 julia/src/runtime.jl
 create mode 100644 julia/src/symbolic-node/arithmetic.jl
 create mode 100644 julia/src/symbolic-node/array.jl
 create mode 100644 julia/src/symbolic-node/autodiff.jl
 create mode 100644 julia/src/symbolic-node/io.jl
 create mode 100644 julia/src/symbolic-node/op.jl
 create mode 100644 julia/src/symbolic-node/show.jl
 create mode 100644 julia/src/symbolic-node/type.jl
 copy scala-package/core/src/main/scala/org/apache/mxnet/{ => javaapi}/Layout.scala (77%)
 copy scala-package/examples/scripts/infer/{imageclassifier/get_resnet_data.sh => bert/get_bert_data.sh} (67%)
 copy scala-package/examples/scripts/{benchmark/run_java_inference_bm.sh => infer/bert/run_bert_qa_example.sh} (90%)
 mode change 100644 => 100755
 create mode 100644 scala-package/examples/src/main/java/org/apache/mxnetexamples/javaapi/infer/bert/BertDataParser.java
 create mode 100644 scala-package/examples/src/main/java/org/apache/mxnetexamples/javaapi/infer/bert/BertQA.java
 create mode 100644 scala-package/examples/src/main/java/org/apache/mxnetexamples/javaapi/infer/bert/README.md
 create mode 100644 scala-package/examples/src/test/java/org/apache/mxnetexamples/javaapi/infer/predictor/BertExampleTest.java
 create mode 100644 src/io/opencv_compatibility.h
 create mode 100644 src/operator/image/crop-inl.h
 copy src/operator/image/{resize.cc => crop.cc} (51%)
 create mode 100644 src/operator/nn/mkldnn/mkldnn_fully_connected-inl.h
 create mode 100644 src/operator/quantization/mkldnn/mkldnn_quantized_fully_connected.cc
 copy src/operator/quantization/mkldnn/{mkldnn_quantized_pooling.cc => mkldnn_quantized_ops-inl.h} (55%)
 rename src/operator/subgraph/{partition_graph.cc => build_subgraph.cc} (69%)
 copy src/operator/subgraph/{default_subgraph_property.cc => default_subgraph_property_v2.cc} (73%)
 rename src/operator/subgraph/mkldnn/{mkldnn_conv_post_quantize_property.cc => mkldnn_conv_post_quantize_property.h} (84%)
 rename src/operator/subgraph/mkldnn/{mkldnn_conv_property.cc => mkldnn_conv_property.h} (91%)
 create mode 100644 src/operator/subgraph/mkldnn/mkldnn_fc.cc
 create mode 100644 src/operator/subgraph/mkldnn/mkldnn_fc_post_quantize_property.h
 create mode 100644 src/operator/subgraph/mkldnn/mkldnn_fc_property.h
 create mode 100644 src/operator/subgraph/mkldnn/mkldnn_post_quantize_align_scale_property.h
 copy src/operator/subgraph/mkldnn/{mkldnn_conv-inl.h => mkldnn_subgraph_property.cc} (60%)
 create mode 100644 tests/python/unittest/test_dynamic_shape.py

Reply via email to