gitextract_zlms863u/

├── .asf.yaml
├── .clang-format
├── .clang-tidy
├── .cmakelintrc
├── .codecov.yml
├── .git-blame-ignore-revs
├── .gitattributes
├── .github/
│   ├── ISSUE_TEMPLATE/
│   │   ├── bug_report.md
│   │   ├── config.yml
│   │   ├── feature_request.md
│   │   ├── flaky_test.md
│   │   └── rfc.md
│   ├── PULL_REQUEST_TEMPLATE.md
│   └── workflows/
│       ├── greetings.yml
│       ├── license_check.yml
│       ├── link_check.yml
│       ├── os_x_mklbuild.yml
│       └── os_x_staticbuild.yml
├── .gitignore
├── .gitmodules
├── .licenserc.yaml
├── .mxnet_root
├── 3rdparty/
│   ├── ctc_include/
│   │   ├── LICENSE
│   │   ├── contrib/
│   │   │   └── moderngpu/
│   │   │       ├── LICENSE
│   │   │       └── include/
│   │   │           ├── device/
│   │   │           │   ├── ctaloadbalance.cuh
│   │   │           │   ├── ctamerge.cuh
│   │   │           │   ├── ctascan.cuh
│   │   │           │   ├── ctasearch.cuh
│   │   │           │   ├── ctasegreduce.cuh
│   │   │           │   ├── ctasegscan.cuh
│   │   │           │   ├── ctasegsort.cuh
│   │   │           │   ├── ctasortedsearch.cuh
│   │   │           │   ├── devicetypes.cuh
│   │   │           │   ├── deviceutil.cuh
│   │   │           │   ├── intrinsics.cuh
│   │   │           │   ├── loadstore.cuh
│   │   │           │   ├── serialsets.cuh
│   │   │           │   └── sortnetwork.cuh
│   │   │           ├── mgpudevice.cuh
│   │   │           ├── mgpuenums.h
│   │   │           └── util/
│   │   │               └── static.h
│   │   └── detail/
│   │       ├── cpu_ctc.h
│   │       ├── ctc_helper.h
│   │       ├── gpu_ctc.h
│   │       ├── gpu_ctc_kernels.h
│   │       └── hostdevice.h
│   ├── miniz/
│   │   ├── miniz.c
│   │   └── miniz.h
│   └── mshadow/
│       ├── .gitignore
│       ├── .travis.yml
│       ├── CHANGES.md
│       ├── CMakeLists.txt
│       ├── LICENSE
│       ├── README.md
│       ├── cmake/
│       │   └── AutoDetectF16C.cmake
│       ├── doc/
│       │   ├── Doxyfile
│       │   ├── README.md
│       │   └── mkdoc.sh
│       ├── guide/
│       │   ├── .gitignore
│       │   ├── Makefile
│       │   ├── README.md
│       │   ├── basic.cpp
│       │   ├── basic_stream.cu
│       │   ├── defop.cpp
│       │   ├── exp-template/
│       │   │   ├── .gitignore
│       │   │   ├── Makefile
│       │   │   └── README.md
│       │   ├── mshadow-ps/
│       │   │   ├── .gitignore
│       │   │   ├── Makefile
│       │   │   ├── README.md
│       │   │   ├── dbstr.h
│       │   │   ├── dist_async_sum-inl.h
│       │   │   ├── dist_async_sum.cpp
│       │   │   ├── local.sh
│       │   │   ├── local_sum-inl.h
│       │   │   ├── local_sum.cpp
│       │   │   └── local_sum.cu
│       │   └── neuralnet/
│       │       ├── Makefile
│       │       ├── README.md
│       │       ├── convnet.cu
│       │       ├── nnet.cu
│       │       ├── nnet_ps.cu
│       │       └── util.h
│       ├── make/
│       │   ├── README.md
│       │   └── mshadow.mk
│       ├── mshadow/
│       │   ├── README.md
│       │   ├── base.h
│       │   ├── bfloat.h
│       │   ├── cuda/
│       │   │   ├── reduce.cuh
│       │   │   └── tensor_gpu-inl.cuh
│       │   ├── dot_engine-inl.h
│       │   ├── expr_engine-inl.h
│       │   ├── expr_scalar-inl.h
│       │   ├── expression.h
│       │   ├── extension/
│       │   │   ├── broadcast.h
│       │   │   ├── broadcast_with_axis.h
│       │   │   ├── channel_pool.h
│       │   │   ├── channel_unpool.h
│       │   │   ├── choose.h
│       │   │   ├── complex.h
│       │   │   ├── concat.h
│       │   │   ├── crop.h
│       │   │   ├── fill.h
│       │   │   ├── flip.h
│       │   │   ├── implicit_gemm.h
│       │   │   ├── mask.h
│       │   │   ├── mirror.h
│       │   │   ├── one_hot.h
│       │   │   ├── pack_col2patch.h
│       │   │   ├── pad.h
│       │   │   ├── range.h
│       │   │   ├── reduce_with_axis.h
│       │   │   ├── reduceto1d.h
│       │   │   ├── reshape.h
│       │   │   ├── slice.h
│       │   │   ├── slice_ex.h
│       │   │   ├── spatial_pool.h
│       │   │   ├── spatial_unpool.h
│       │   │   ├── spatial_upsampling_nearest.h
│       │   │   ├── swapaxis.h
│       │   │   ├── take.h
│       │   │   ├── take_grad.h
│       │   │   ├── transpose.h
│       │   │   └── unpack_patch2col.h
│       │   ├── extension.h
│       │   ├── half.h
│       │   ├── io.h
│       │   ├── packet/
│       │   │   ├── plain-inl.h
│       │   │   └── sse-inl.h
│       │   ├── packet-inl.h
│       │   ├── random.h
│       │   ├── stream_gpu-inl.h
│       │   ├── tensor.h
│       │   ├── tensor_container.h
│       │   ├── tensor_cpu-inl.h
│       │   └── tensor_gpu-inl.h
│       ├── mshadow-ps/
│       │   ├── .gitignore
│       │   ├── README.md
│       │   ├── mshadow_ps.h
│       │   ├── ps_dist-inl.h
│       │   ├── ps_local-inl.h
│       │   ├── ps_rabit-inl.h
│       │   ├── thread.h
│       │   └── thread_util.h
│       ├── scripts/
│       │   └── travis_script.sh
│       └── test/
│           ├── Makefile
│           ├── pairtest.cu
│           ├── pool.cu
│           ├── reshape.cu
│           ├── test.cu
│           ├── test.h
│           └── unpack.cu
├── CMakeLists.txt
├── CODEOWNERS
├── CODE_OF_CONDUCT.md
├── CONTRIBUTORS.md
├── DNNL_README.md
├── LICENSE
├── NEWS.md
├── NOTICE
├── README.md
├── SECURITY.md
├── benchmark/
│   ├── __init__.py
│   ├── opperf/
│   │   ├── README.md
│   │   ├── __init__.py
│   │   ├── custom_operations/
│   │   │   ├── __init__.py
│   │   │   └── custom_operations.py
│   │   ├── nd_operations/
│   │   │   ├── README.md
│   │   │   ├── __init__.py
│   │   │   ├── array_manipulation_operators.py
│   │   │   ├── array_rearrange.py
│   │   │   ├── binary_operators.py
│   │   │   ├── gemm_operators.py
│   │   │   ├── indexing_routines.py
│   │   │   ├── linalg_operators.py
│   │   │   ├── misc_operators.py
│   │   │   ├── nn_activation_operators.py
│   │   │   ├── nn_basic_operators.py
│   │   │   ├── nn_conv_operators.py
│   │   │   ├── nn_loss_operators.py
│   │   │   ├── nn_optimizer_operators.py
│   │   │   ├── random_sampling_operators.py
│   │   │   ├── reduction_operators.py
│   │   │   ├── sorting_searching_operators.py
│   │   │   └── unary_operators.py
│   │   ├── opperf.py
│   │   ├── results/
│   │   │   ├── mxnet_operator_benchmark_results_cpu.md
│   │   │   └── mxnet_operator_benchmark_results_gpu.md
│   │   ├── rules/
│   │   │   ├── __init__.py
│   │   │   └── default_params.py
│   │   └── utils/
│   │       ├── __init__.py
│   │       ├── benchmark_operators_pytest.py
│   │       ├── benchmark_utils.py
│   │       ├── common_utils.py
│   │       ├── ndarray_utils.py
│   │       ├── op_registry_utils.py
│   │       └── profiler_utils.py
│   └── python/
│       ├── control_flow/
│       │   └── rnn.py
│       ├── dnnl/
│       │   ├── fc_add.py
│       │   ├── run.sh
│       │   └── run_per_thread.sh
│       ├── einsum/
│       │   └── benchmark_einsum.py
│       ├── ffi/
│       │   └── benchmark_ffi.py
│       ├── metric/
│       │   └── benchmark_metric.py
│       ├── quantization/
│       │   └── benchmark_op.py
│       ├── sparse/
│       │   ├── cast_storage.py
│       │   ├── dot.py
│       │   ├── memory_benchmark.py
│       │   ├── sparse_op.py
│       │   ├── updater.py
│       │   └── util.py
│       └── tvmop/
│           └── benchmark_tvmop.py
├── cd/
│   ├── Jenkinsfile_cd_pipeline
│   ├── Jenkinsfile_release_job
│   ├── Jenkinsfile_utils.groovy
│   ├── README.md
│   ├── mxnet_lib/
│   │   ├── Jenkins_pipeline.groovy
│   │   └── mxnet_lib_pipeline.groovy
│   ├── python/
│   │   ├── docker/
│   │   │   ├── Dockerfile
│   │   │   ├── Dockerfile.test
│   │   │   ├── Jenkins_pipeline.groovy
│   │   │   ├── python_images.sh
│   │   │   └── test_python_image.sh
│   │   └── pypi/
│   │       ├── Jenkins_pipeline.groovy
│   │       ├── README.md
│   │       ├── pypi_package.sh
│   │       └── pypi_publish.py
│   └── utils/
│       ├── artifact_repository.md
│       ├── artifact_repository.py
│       ├── docker_tag.sh
│       ├── mxnet_base_image.sh
│       └── test_artifact_repository.py
├── ci/
│   ├── Jenkinsfile_docker_cache
│   ├── Jenkinsfile_utils.groovy
│   ├── README.md
│   ├── __init__.py
│   ├── build.py
│   ├── build_windows.py
│   ├── dev_menu.py
│   ├── docker/
│   │   ├── Dockerfile.build.android
│   │   ├── Dockerfile.build.arm
│   │   ├── Dockerfile.build.centos7
│   │   ├── Dockerfile.build.jetson
│   │   ├── Dockerfile.build.ubuntu
│   │   ├── Dockerfile.build.ubuntu_cpu_jekyll
│   │   ├── Dockerfile.publish.test.centos7
│   │   ├── Dockerfile.test.arm
│   │   ├── docker-compose.yml
│   │   ├── install/
│   │   │   ├── deb_ubuntu_ccache.sh
│   │   │   ├── docker_filepermissions.sh
│   │   │   ├── requirements
│   │   │   └── ubuntu_adduser.sh
│   │   ├── runtime_functions.sh
│   │   └── toolchains/
│   │       ├── aarch64-linux-gnu-toolchain.cmake
│   │       └── arm-linux-gnueabihf-toolchain.cmake
│   ├── docker_login.py
│   ├── jenkins/
│   │   ├── Jenkins_steps.groovy
│   │   ├── Jenkinsfile_centos_cpu
│   │   ├── Jenkinsfile_centos_gpu
│   │   ├── Jenkinsfile_clang
│   │   ├── Jenkinsfile_edge
│   │   ├── Jenkinsfile_full
│   │   ├── Jenkinsfile_miscellaneous
│   │   ├── Jenkinsfile_sanity
│   │   ├── Jenkinsfile_tools
│   │   ├── Jenkinsfile_unix_cpu
│   │   ├── Jenkinsfile_unix_gpu
│   │   ├── Jenkinsfile_website_beta
│   │   ├── Jenkinsfile_website_full
│   │   ├── Jenkinsfile_website_full_pr
│   │   ├── Jenkinsfile_website_jekyll_docs
│   │   ├── Jenkinsfile_website_mxnet_build
│   │   ├── Jenkinsfile_website_nightly
│   │   ├── Jenkinsfile_website_python_docs
│   │   ├── Jenkinsfile_website_version_artifacts
│   │   ├── Jenkinsfile_windows_cpu
│   │   └── Jenkinsfile_windows_gpu
│   ├── logging.conf
│   ├── other/
│   │   └── ci_deploy_doc.sh
│   ├── publish/
│   │   ├── Jenkinsfile
│   │   ├── README.md
│   │   ├── python/
│   │   │   └── build.sh
│   │   ├── scala/
│   │   │   ├── build.sh
│   │   │   ├── buildkey.py
│   │   │   ├── deploy.sh
│   │   │   ├── fullDeploy.sh
│   │   │   └── test.sh
│   │   └── website/
│   │       ├── README.md
│   │       ├── beta-deploy.sh
│   │       ├── deploy.sh
│   │       └── publish_artifacts.sh
│   ├── test_docker_login.py
│   ├── util.py
│   └── windows/
│       ├── test_py3_cpu.ps1
│       └── test_py3_gpu.ps1
├── cmake/
│   ├── BuildCythonModules.cmake
│   ├── BuildTVM.cmake
│   ├── ChooseBlas.cmake
│   ├── Modules/
│   │   ├── FindAccelerate.cmake
│   │   ├── FindAtlas.cmake
│   │   ├── FindCUDNN.cmake
│   │   ├── FindCUTENSOR.cmake
│   │   ├── FindGperftools.cmake
│   │   ├── FindJeMalloc.cmake
│   │   ├── FindNCCL.cmake
│   │   ├── FindNVML.cmake
│   │   ├── FindNVTX.cmake
│   │   └── FindOpenBLAS.cmake
│   ├── Utils.cmake
│   ├── libmxnet.sym
│   └── upstream/
│       ├── FindBLAS.cmake
│       ├── FindCUDAToolkit.cmake
│       └── select_compute_arch.cmake
├── config/
│   ├── darwin.cmake
│   ├── distribution/
│   │   ├── darwin_cpu.cmake
│   │   ├── darwin_cpu_mkl.cmake
│   │   ├── darwin_native.cmake
│   │   ├── linux_cpu.cmake
│   │   ├── linux_cpu_mkl.cmake
│   │   ├── linux_cu100.cmake
│   │   ├── linux_cu101.cmake
│   │   ├── linux_cu102.cmake
│   │   ├── linux_cu110.cmake
│   │   ├── linux_cu112.cmake
│   │   ├── linux_cu92.cmake
│   │   └── linux_native.cmake
│   ├── linux.cmake
│   └── linux_gpu.cmake
├── conftest.py
├── contrib/
│   └── tvmop/
│       ├── __init__.py
│       ├── basic/
│       │   ├── __init__.py
│       │   └── ufunc.py
│       ├── compile.py
│       ├── core/
│       │   ├── __init__.py
│       │   ├── fromnumeric.py
│       │   ├── multiarray.py
│       │   └── umath.py
│       ├── opdef.py
│       ├── space.py
│       └── utils.py
├── cpp-package/
│   ├── CMakeLists.txt
│   ├── README.md
│   ├── example/
│   │   ├── CMakeLists.txt
│   │   ├── README.md
│   │   ├── alexnet.cpp
│   │   ├── charRNN.cpp
│   │   ├── feature_extract/
│   │   │   ├── README.md
│   │   │   ├── feature_extract.cpp
│   │   │   ├── prepare_data_with_opencv.cpp
│   │   │   └── run.sh
│   │   ├── get_data.sh
│   │   ├── googlenet.cpp
│   │   ├── inception_bn.cpp
│   │   ├── inference/
│   │   │   ├── CMakeLists.txt
│   │   │   ├── README.md
│   │   │   ├── imagenet_inference.cpp
│   │   │   ├── multi_threaded_inference/
│   │   │   │   ├── get_model.py
│   │   │   │   ├── multi_threaded_inference.cc
│   │   │   │   └── unit_test_multi_threaded_inference.sh
│   │   │   ├── sentiment_analysis_rnn.cpp
│   │   │   ├── unit_test_imagenet_inference.sh
│   │   │   └── unit_test_sentiment_analysis_rnn.sh
│   │   ├── lenet.cpp
│   │   ├── lenet_with_mxdataiter.cpp
│   │   ├── mlp.cpp
│   │   ├── mlp_cpu.cpp
│   │   ├── mlp_csv.cpp
│   │   ├── mlp_gpu.cpp
│   │   ├── mnist_to_csv.py
│   │   ├── resnet.cpp
│   │   ├── run_lenet_with_mxdataiter.sh
│   │   ├── test_kvstore.cpp
│   │   ├── test_ndarray_copy.cpp
│   │   ├── test_optimizer.cpp
│   │   ├── test_regress_label.cpp
│   │   ├── test_score.cpp
│   │   ├── unittests/
│   │   │   └── unit_test_mlp_csv.sh
│   │   └── utils.h
│   ├── include/
│   │   └── mxnet-cpp/
│   │       ├── .gitignore
│   │       ├── CPPLINT.cfg
│   │       ├── MxNetCpp.h
│   │       ├── base.h
│   │       ├── contrib.h
│   │       ├── executor.h
│   │       ├── executor.hpp
│   │       ├── initializer.h
│   │       ├── io.h
│   │       ├── io.hpp
│   │       ├── kvstore.h
│   │       ├── kvstore.hpp
│   │       ├── lr_scheduler.h
│   │       ├── metric.h
│   │       ├── model.h
│   │       ├── ndarray.h
│   │       ├── ndarray.hpp
│   │       ├── op_map.h
│   │       ├── op_suppl.h
│   │       ├── op_util.h
│   │       ├── operator.h
│   │       ├── operator.hpp
│   │       ├── optimizer.h
│   │       ├── optimizer.hpp
│   │       ├── shape.h
│   │       ├── symbol.h
│   │       └── symbol.hpp
│   ├── scripts/
│   │   ├── OpWrapperGenerator.py
│   │   └── lint.py
│   └── tests/
│       └── ci_test.sh
├── doap.rdf
├── docker/
│   ├── .gitignore
│   ├── Dockerfiles/
│   │   ├── Dockerfile.in.julia
│   │   ├── Dockerfile.in.lib.cpu
│   │   ├── Dockerfile.in.lib.gpu
│   │   ├── Dockerfile.in.perl
│   │   ├── Dockerfile.in.python
│   │   ├── Dockerfile.in.r-lang
│   │   └── Dockerfile.in.scala
│   ├── README.md
│   ├── docker-python/
│   │   ├── README.md
│   │   ├── build_python_dockerfile.sh
│   │   └── test_mxnet.py
│   ├── install/
│   │   ├── cpp.sh
│   │   ├── julia.sh
│   │   ├── perl.sh
│   │   ├── python.sh
│   │   ├── r.sh
│   │   └── scala.sh
│   ├── run.sh
│   └── tool.sh
├── docs/
│   ├── .dockerignore
│   ├── .gitignore
│   ├── README.md
│   ├── cpp_docs/
│   │   ├── Doxyfile
│   │   └── Makefile
│   ├── python_docs/
│   │   ├── README.md
│   │   ├── _static/
│   │   │   ├── autodoc.js
│   │   │   ├── feedback.css
│   │   │   ├── matomo_analytics.js
│   │   │   └── mxnet.css
│   │   ├── python/
│   │   │   ├── .gitignore
│   │   │   ├── Makefile
│   │   │   ├── Makefile_sphinx
│   │   │   ├── api/
│   │   │   │   ├── autograd/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── contrib/
│   │   │   │   │   ├── index.rst
│   │   │   │   │   ├── io/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── ndarray/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── onnx/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── quantization/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── symbol/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── tensorboard/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── tensorrt/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   └── text/
│   │   │   │   │       └── index.rst
│   │   │   │   ├── device/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── engine/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── executor/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── gluon/
│   │   │   │   │   ├── block.rst
│   │   │   │   │   ├── constant.rst
│   │   │   │   │   ├── contrib/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── hybrid_block.rst
│   │   │   │   │   ├── index.rst
│   │   │   │   │   ├── loss/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── metric/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── model_zoo/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── nn/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── parameter.rst
│   │   │   │   │   ├── rnn/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── symbol_block.rst
│   │   │   │   │   ├── trainer.rst
│   │   │   │   │   └── utils/
│   │   │   │   │       └── index.rst
│   │   │   │   ├── index.rst
│   │   │   │   ├── initializer/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── kvstore/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── kvstore_server/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── legacy/
│   │   │   │   │   ├── callback/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── image/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── index.rst
│   │   │   │   │   ├── io/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── ndarray/
│   │   │   │   │   │   ├── contrib/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── image/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── index.rst
│   │   │   │   │   │   ├── linalg/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── ndarray.rst
│   │   │   │   │   │   ├── op/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── random/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── register/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── sparse/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   └── utils/
│   │   │   │   │   │       └── index.rst
│   │   │   │   │   ├── recordio/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── symbol/
│   │   │   │   │   │   ├── contrib/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── image/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── index.rst
│   │   │   │   │   │   ├── linalg/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── op/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── random/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── register/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   ├── sparse/
│   │   │   │   │   │   │   └── index.rst
│   │   │   │   │   │   └── symbol.rst
│   │   │   │   │   └── visualization/
│   │   │   │   │       └── index.rst
│   │   │   │   ├── lr_scheduler/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── np/
│   │   │   │   │   ├── arrays.indexing.rst
│   │   │   │   │   ├── arrays.ndarray.rst
│   │   │   │   │   ├── arrays.rst
│   │   │   │   │   ├── index.rst
│   │   │   │   │   ├── random/
│   │   │   │   │   │   └── index.rst
│   │   │   │   │   ├── routines.array-creation.rst
│   │   │   │   │   ├── routines.array-manipulation.rst
│   │   │   │   │   ├── routines.io.rst
│   │   │   │   │   ├── routines.linalg.rst
│   │   │   │   │   ├── routines.math.rst
│   │   │   │   │   ├── routines.rst
│   │   │   │   │   ├── routines.sort.rst
│   │   │   │   │   └── routines.statistics.rst
│   │   │   │   ├── npx/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── optimizer/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── profiler/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── rtc/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── runtime/
│   │   │   │   │   └── index.rst
│   │   │   │   ├── test_utils/
│   │   │   │   │   └── index.rst
│   │   │   │   └── util/
│   │   │   │       └── index.rst
│   │   │   ├── index.rst
│   │   │   ├── scripts/
│   │   │   │   ├── conf.py
│   │   │   │   ├── md2ipynb.py
│   │   │   │   └── process_rst.py
│   │   │   └── tutorials/
│   │   │       ├── deploy/
│   │   │       │   ├── export/
│   │   │       │   │   ├── index.rst
│   │   │       │   │   └── onnx.md
│   │   │       │   ├── index.rst
│   │   │       │   ├── inference/
│   │   │       │   │   ├── cpp.rst
│   │   │       │   │   ├── image_classification_jetson.md
│   │   │       │   │   └── index.rst
│   │   │       │   └── run-on-aws/
│   │   │       │       ├── cloud.md
│   │   │       │       ├── index.rst
│   │   │       │       ├── use_ec2.rst
│   │   │       │       └── use_sagemaker.rst
│   │   │       ├── extend/
│   │   │       │   ├── customop.md
│   │   │       │   └── index.rst
│   │   │       ├── getting-started/
│   │   │       │   ├── crash-course/
│   │   │       │   │   ├── 0-introduction.md
│   │   │       │   │   ├── 1-nparray.md
│   │   │       │   │   ├── 2-create-nn.md
│   │   │       │   │   ├── 3-autograd.md
│   │   │       │   │   ├── 4-components.md
│   │   │       │   │   ├── 5-datasets.md
│   │   │       │   │   ├── 6-train-nn.md
│   │   │       │   │   ├── 7-use-gpus.md
│   │   │       │   │   ├── index.rst
│   │   │       │   │   └── prepare_dataset.py
│   │   │       │   ├── gluon_from_experiment_to_deployment.md
│   │   │       │   ├── gluon_migration_guide.md
│   │   │       │   ├── index.rst
│   │   │       │   ├── logistic_regression_explained.md
│   │   │       │   └── to-mxnet/
│   │   │       │       ├── index.rst
│   │   │       │       └── pytorch.md
│   │   │       ├── index.rst
│   │   │       ├── packages/
│   │   │       │   ├── autograd/
│   │   │       │   │   └── index.md
│   │   │       │   ├── gluon/
│   │   │       │   │   ├── blocks/
│   │   │       │   │   │   ├── activations/
│   │   │       │   │   │   │   └── activations.md
│   │   │       │   │   │   ├── custom-layer.md
│   │   │       │   │   │   ├── hybridize.md
│   │   │       │   │   │   ├── index.rst
│   │   │       │   │   │   ├── init.md
│   │   │       │   │   │   ├── naming.md
│   │   │       │   │   │   ├── nn.md
│   │   │       │   │   │   ├── parameters.md
│   │   │       │   │   │   └── save_load_params.md
│   │   │       │   │   ├── image/
│   │   │       │   │   │   ├── index.rst
│   │   │       │   │   │   ├── info_gan.md
│   │   │       │   │   │   └── mnist.md
│   │   │       │   │   ├── index.rst
│   │   │       │   │   ├── loss/
│   │   │       │   │   │   ├── custom-loss.md
│   │   │       │   │   │   ├── index.rst
│   │   │       │   │   │   ├── kl_divergence.md
│   │   │       │   │   │   └── loss.md
│   │   │       │   │   ├── text/
│   │   │       │   │   │   ├── gnmt.rst
│   │   │       │   │   │   ├── index.rst
│   │   │       │   │   │   └── transformer.rst
│   │   │       │   │   └── training/
│   │   │       │   │       ├── fit_api_tutorial.md
│   │   │       │   │       ├── index.rst
│   │   │       │   │       ├── learning_rates/
│   │   │       │   │       │   ├── index.rst
│   │   │       │   │       │   ├── learning_rate_finder.md
│   │   │       │   │       │   ├── learning_rate_schedules.md
│   │   │       │   │       │   └── learning_rate_schedules_advanced.md
│   │   │       │   │       ├── normalization/
│   │   │       │   │       │   └── index.md
│   │   │       │   │       └── trainer.md
│   │   │       │   ├── index.rst
│   │   │       │   ├── kvstore/
│   │   │       │   │   ├── index.rst
│   │   │       │   │   └── kvstore.md
│   │   │       │   ├── legacy/
│   │   │       │   │   ├── index.rst
│   │   │       │   │   └── ndarray/
│   │   │       │   │       ├── 01-ndarray-intro.md
│   │   │       │   │       ├── 02-ndarray-operations.md
│   │   │       │   │       ├── 03-ndarray-contexts.md
│   │   │       │   │       ├── gotchas_numpy_in_mxnet.md
│   │   │       │   │       ├── index.rst
│   │   │       │   │       └── sparse/
│   │   │       │   │           ├── csr.md
│   │   │       │   │           ├── index.rst
│   │   │       │   │           └── row_sparse.md
│   │   │       │   ├── np/
│   │   │       │   │   ├── cheat-sheet.md
│   │   │       │   │   ├── index.rst
│   │   │       │   │   └── np-vs-numpy.md
│   │   │       │   ├── onnx/
│   │   │       │   │   ├── fine_tuning_gluon.md
│   │   │       │   │   ├── index.rst
│   │   │       │   │   └── inference_on_onnx_model.md
│   │   │       │   ├── optimizer/
│   │   │       │   │   └── index.md
│   │   │       │   └── viz/
│   │   │       │       └── index.rst
│   │   │       └── performance/
│   │   │           ├── backend/
│   │   │           │   ├── amp.md
│   │   │           │   ├── dnnl/
│   │   │           │   │   ├── dnnl_quantization.md
│   │   │           │   │   ├── dnnl_quantization_inc.md
│   │   │           │   │   ├── dnnl_readme.md
│   │   │           │   │   └── index.rst
│   │   │           │   ├── index.rst
│   │   │           │   ├── profiler.md
│   │   │           │   └── tvm.rst
│   │   │           ├── compression/
│   │   │           │   ├── index.rst
│   │   │           │   └── int8.rst
│   │   │           └── index.rst
│   │   ├── requirements
│   │   └── themes/
│   │       ├── .babelrc
│   │       ├── .circleci/
│   │       │   └── config.yml
│   │       ├── .gitignore
│   │       ├── .sassrc
│   │       └── mx-theme/
│   │           ├── LICENSE
│   │           ├── MANIFEST.in
│   │           ├── README.md
│   │           ├── mxtheme/
│   │           │   ├── __init__.py
│   │           │   ├── card.py
│   │           │   ├── drawer.html
│   │           │   ├── feedback.html
│   │           │   ├── footer.html
│   │           │   ├── header.html
│   │           │   ├── header_search.html
│   │           │   ├── header_sourcelink.html
│   │           │   ├── header_top.html
│   │           │   ├── layout.html
│   │           │   ├── localtoc.html
│   │           │   ├── relations.html
│   │           │   ├── search.html
│   │           │   ├── static/
│   │           │   │   ├── fontawesome/
│   │           │   │   │   └── all.css
│   │           │   │   ├── fonts.css
│   │           │   │   ├── sphinx_materialdesign_theme.css
│   │           │   │   └── sphinx_materialdesign_theme.js
│   │           │   └── theme.conf
│   │           ├── setup.py
│   │           └── src/
│   │               ├── js/
│   │               │   ├── adjust-height.js
│   │               │   ├── feedback.js
│   │               │   ├── scrollspy.js
│   │               │   └── sphinx_materialdesign_theme.js
│   │               └── scss/
│   │                   ├── _root.scss
│   │                   ├── _variables.scss
│   │                   ├── admonitions/
│   │                   │   └── _admonitions.scss
│   │                   ├── blockquote/
│   │                   │   └── _blockquote.scss
│   │                   ├── card/
│   │                   │   └── _card.scss
│   │                   ├── code/
│   │                   │   └── _code.scss
│   │                   ├── downloadlink/
│   │                   │   └── _downloadlink.scss
│   │                   ├── drawer/
│   │                   │   └── _drawer.scss
│   │                   ├── fonts/
│   │                   │   └── _material-icons.scss
│   │                   ├── footer/
│   │                   │   └── _footer.scss
│   │                   ├── grid/
│   │                   │   └── _simplegrid.scss
│   │                   ├── header/
│   │                   │   └── _header.scss
│   │                   ├── headerings/
│   │                   │   └── _headerings.scss
│   │                   ├── layout/
│   │                   │   └── _layout.scss
│   │                   ├── lists/
│   │                   │   └── _lists.scss
│   │                   ├── search/
│   │                   │   └── _search.scss
│   │                   ├── sphinx_materialdesign_theme.scss
│   │                   ├── tables/
│   │                   │   └── _tables.scss
│   │                   └── toc/
│   │                       ├── _globaltoc.scss
│   │                       ├── _localtoc.scss
│   │                       └── _toctree.scss
│   ├── static_site/
│   │   ├── .gitignore
│   │   ├── .nojekyll
│   │   ├── Makefile
│   │   ├── README.md
│   │   └── src/
│   │       ├── .asf.yaml
│   │       ├── .gitignore
│   │       ├── .htaccess
│   │       ├── .nojekyll
│   │       ├── 404.html
│   │       ├── Gemfile
│   │       ├── _config.yml
│   │       ├── _config_beta.yml
│   │       ├── _config_prod.yml
│   │       ├── _includes/
│   │       │   ├── callout.html
│   │       │   ├── disqus_comments.html
│   │       │   ├── feedback.html
│   │       │   ├── footer.html
│   │       │   ├── get_started/
│   │       │   │   ├── cloud/
│   │       │   │   │   ├── cpu.md
│   │       │   │   │   └── gpu.md
│   │       │   │   ├── devices/
│   │       │   │   │   ├── nvidia-jetson.md
│   │       │   │   │   └── raspberry_pi.md
│   │       │   │   ├── get_started.html
│   │       │   │   ├── gpu_snippet.md
│   │       │   │   ├── linux/
│   │       │   │   │   ├── clojure/
│   │       │   │   │   │   └── build-from-source.md
│   │       │   │   │   ├── cpp/
│   │       │   │   │   │   └── build-from-source.md
│   │       │   │   │   ├── java/
│   │       │   │   │   │   └── build-from-source.md
│   │       │   │   │   ├── julia/
│   │       │   │   │   │   └── build-from-source.md
│   │       │   │   │   ├── perl/
│   │       │   │   │   │   └── build-from-source.md
│   │       │   │   │   ├── python/
│   │       │   │   │   │   ├── cpu/
│   │       │   │   │   │   │   ├── build-from-source.md
│   │       │   │   │   │   │   ├── docker.md
│   │       │   │   │   │   │   └── pip.md
│   │       │   │   │   │   └── gpu/
│   │       │   │   │   │       ├── build-from-source.md
│   │       │   │   │   │       ├── docker.md
│   │       │   │   │   │       └── pip.md
│   │       │   │   │   ├── r/
│   │       │   │   │   │   └── build-from-source.md
│   │       │   │   │   └── scala/
│   │       │   │   │       └── build-from-source.md
│   │       │   │   └── pip_snippet.md
│   │       │   ├── head.html
│   │       │   ├── header.html
│   │       │   ├── icon-github.html
│   │       │   ├── icon-twitter.html
│   │       │   ├── important.html
│   │       │   ├── matomo-analytics.html
│   │       │   ├── note.html
│   │       │   ├── social.html
│   │       │   ├── tip.html
│   │       │   └── warning.html
│   │       ├── _layouts/
│   │       │   ├── default.html
│   │       │   ├── home.html
│   │       │   ├── page.html
│   │       │   ├── page_api.html
│   │       │   ├── page_category.html
│   │       │   ├── page_landing_tutorials.html
│   │       │   └── post.html
│   │       ├── _plugins/
│   │       │   └── markdowner.rb
│   │       ├── _sass/
│   │       │   ├── feedback.scss
│   │       │   ├── generalVersionDropdown.scss
│   │       │   ├── globalSearch.scss
│   │       │   ├── minima/
│   │       │   │   ├── _base.scss
│   │       │   │   ├── _blog.scss
│   │       │   │   ├── _docs.scss
│   │       │   │   ├── _ecosystem.scss
│   │       │   │   ├── _features.scss
│   │       │   │   ├── _getting_started.scss
│   │       │   │   ├── _home.scss
│   │       │   │   ├── _layout.scss
│   │       │   │   ├── _syntax-highlighting.scss
│   │       │   │   ├── colorful.scss
│   │       │   │   └── simple-grid.scss
│   │       │   └── minima.scss
│   │       ├── assets/
│   │       │   ├── js/
│   │       │   │   ├── clipboard.js
│   │       │   │   ├── copycode.js
│   │       │   │   ├── feedback.js
│   │       │   │   ├── globalSearch.js
│   │       │   │   └── options.js
│   │       │   └── main.scss
│   │       ├── index.html
│   │       └── pages/
│   │           ├── api/
│   │           │   ├── api.html
│   │           │   ├── architecture/
│   │           │   │   ├── exception_handling.md
│   │           │   │   ├── note_data_loading.md
│   │           │   │   ├── note_engine.md
│   │           │   │   ├── note_memory.md
│   │           │   │   ├── overview.md
│   │           │   │   └── program_model.md
│   │           │   ├── clojure/
│   │           │   │   ├── docs/
│   │           │   │   │   └── tutorials/
│   │           │   │   │       ├── index.md
│   │           │   │   │       ├── kvstore.md
│   │           │   │   │       ├── module.md
│   │           │   │   │       ├── ndarray.md
│   │           │   │   │       ├── symbol.md
│   │           │   │   │       └── symbol_in_pictures.md
│   │           │   │   └── index.md
│   │           │   ├── cpp/
│   │           │   │   ├── docs/
│   │           │   │   │   └── tutorials/
│   │           │   │   │       ├── basics.md
│   │           │   │   │       ├── index.md
│   │           │   │   │       ├── multi_threaded_inference.md
│   │           │   │   │       ├── mxnet_cpp_inference_tutorial.md
│   │           │   │   │       └── subgraphAPI.md
│   │           │   │   └── index.md
│   │           │   ├── developer_guide/
│   │           │   │   ├── 1_github_contribution_and_PR_verification_tips.md
│   │           │   │   ├── debugging_and_performance_optimization_tips.md
│   │           │   │   ├── examine_forward_results_with_hooks.md
│   │           │   │   ├── exception_handing_and_custom_error_types.md
│   │           │   │   └── profiling.md
│   │           │   ├── faq/
│   │           │   │   ├── add_op_in_backend.md
│   │           │   │   ├── cloud.md
│   │           │   │   ├── distributed_training.md
│   │           │   │   ├── env_var.md
│   │           │   │   ├── float16.md
│   │           │   │   ├── gradient_compression.md
│   │           │   │   ├── large_tensor_support.md
│   │           │   │   ├── model_parallel_lstm.md
│   │           │   │   ├── new_op.md
│   │           │   │   ├── perf.md
│   │           │   │   ├── recordio.md
│   │           │   │   ├── s3_integration.md
│   │           │   │   ├── security.md
│   │           │   │   ├── tensor_inspector_tutorial.md
│   │           │   │   ├── using_rtc.md
│   │           │   │   └── why_mxnet.md
│   │           │   ├── java/
│   │           │   │   ├── docs/
│   │           │   │   │   └── tutorials/
│   │           │   │   │       ├── index.md
│   │           │   │   │       └── ssd_inference.md
│   │           │   │   └── index.md
│   │           │   ├── julia/
│   │           │   │   └── index.md
│   │           │   ├── perl/
│   │           │   │   ├── docs/
│   │           │   │   │   └── tutorials/
│   │           │   │   │       ├── index.md
│   │           │   │   │       ├── io.md
│   │           │   │   │       ├── kvstore.md
│   │           │   │   │       ├── ndarray.md
│   │           │   │   │       └── symbol.md
│   │           │   │   └── index.md
│   │           │   ├── python/
│   │           │   │   └── index.md
│   │           │   ├── r/
│   │           │   │   ├── docs/
│   │           │   │   │   └── tutorials/
│   │           │   │   │       ├── char_rnn_model.md
│   │           │   │   │       ├── classify_real_image_with_pretrained_model.md
│   │           │   │   │       ├── custom_iterator.md
│   │           │   │   │       ├── index.md
│   │           │   │   │       ├── multi_dim_lstm.md
│   │           │   │   │       ├── ndarray.md
│   │           │   │   │       └── symbol.md
│   │           │   │   └── index.md
│   │           │   └── scala/
│   │           │       ├── docs/
│   │           │       │   └── tutorials/
│   │           │       │       ├── index.md
│   │           │       │       ├── infer.md
│   │           │       │       ├── io.md
│   │           │       │       ├── kvstore.md
│   │           │       │       ├── ndarray.md
│   │           │       │       ├── symbol.md
│   │           │       │       └── symbol_in_pictures.md
│   │           │       └── index.md
│   │           ├── community/
│   │           │   ├── clang_format_guide.md
│   │           │   ├── code_guide.md
│   │           │   ├── code_review.md
│   │           │   ├── committer_guide.md
│   │           │   ├── community.md
│   │           │   ├── document.md
│   │           │   ├── error_handling.md
│   │           │   ├── git_howto.md
│   │           │   ├── index.md
│   │           │   └── pull_request.md
│   │           ├── ecosystem.html
│   │           ├── features.html
│   │           ├── get_started/
│   │           │   ├── build_from_source.md
│   │           │   ├── download.md
│   │           │   ├── index.html
│   │           │   ├── jetson_setup.md
│   │           │   └── validate_mxnet.md
│   │           └── trusted_by.html
│   └── tutorial_utils/
│       └── vision/
│           └── cnn_visualization/
│               └── gradcam.py
├── example/
│   ├── MXNetTutorialTemplate.ipynb
│   ├── README.md
│   ├── adversary/
│   │   ├── README.md
│   │   └── adversary_generation.ipynb
│   ├── bi-lstm-sort/
│   │   ├── README.md
│   │   └── bi-lstm-sort.ipynb
│   ├── distributed_training/
│   │   ├── README.md
│   │   ├── cifar10_dist.py
│   │   └── cifar10_kvstore_hvd.py
│   ├── distributed_training-horovod/
│   │   ├── README.md
│   │   ├── gluon_mnist.py
│   │   └── resnet50_imagenet.py
│   ├── extensions/
│   │   ├── lib_api/
│   │   │   ├── Makefile
│   │   │   ├── init_lib.cc
│   │   │   ├── libtest.cc
│   │   │   └── test_loading.py
│   │   ├── lib_custom_op/
│   │   │   ├── Makefile
│   │   │   ├── README.md
│   │   │   ├── gemm_lib.cc
│   │   │   ├── relu_lib.cc
│   │   │   ├── relu_lib.cu
│   │   │   ├── relu_lib.h
│   │   │   ├── test_gemm.py
│   │   │   ├── test_relu.py
│   │   │   ├── test_transposecsr.py
│   │   │   ├── test_transposerowsp.py
│   │   │   ├── transposecsr_lib.cc
│   │   │   └── transposerowsp_lib.cc
│   │   ├── lib_external_ops/
│   │   │   ├── CMakeLists.txt
│   │   │   ├── README.md
│   │   │   ├── init_lib.cc
│   │   │   ├── min_ex-inl.h
│   │   │   ├── min_ex.cc
│   │   │   ├── min_ex.cu
│   │   │   └── test_loading.py
│   │   ├── lib_pass/
│   │   │   ├── Makefile
│   │   │   ├── README.md
│   │   │   ├── pass_lib.cc
│   │   │   └── test_pass.py
│   │   └── lib_subgraph/
│   │       ├── Makefile
│   │       ├── README.md
│   │       ├── subgraph_lib.cc
│   │       └── test_subgraph.py
│   ├── gluon/
│   │   ├── actor_critic/
│   │   │   ├── README.md
│   │   │   └── actor_critic.py
│   │   ├── data.py
│   │   ├── house_prices/
│   │   │   ├── README.md
│   │   │   └── kaggle_k_fold_cross_validation.py
│   │   ├── image_classification.py
│   │   ├── mnist/
│   │   │   ├── README.md
│   │   │   └── mnist.py
│   │   └── super_resolution/
│   │       ├── README.md
│   │       └── super_resolution.py
│   ├── multi-task/
│   │   ├── README.md
│   │   └── multi-task-learning.ipynb
│   ├── probability/
│   │   └── VAE/
│   │       └── VAE.md
│   ├── profiler/
│   │   ├── README.md
│   │   ├── profiler_imageiter.py
│   │   ├── profiler_matmul.py
│   │   └── profiler_ndarray.py
│   ├── quantization/
│   │   ├── README.md
│   │   ├── imagenet_gen_qsym_onednn.py
│   │   ├── imagenet_inference.py
│   │   └── launch_inference_onednn.sh
│   ├── quantization_inc/
│   │   ├── custom_strategy.py
│   │   ├── resnet50v2_mse.yaml
│   │   ├── resnet_measurement.py
│   │   ├── resnet_mse.py
│   │   └── resnet_tuning.py
│   └── recommenders/
│       ├── .gitignore
│       ├── README.md
│       ├── demo1-MF.ipynb
│       ├── demo2-dssm.ipynb
│       ├── matrix_fact.py
│       └── movielens_data.py
├── include/
│   └── mxnet/
│       ├── api_registry.h
│       ├── base.h
│       ├── c_api.h
│       ├── c_api_error.h
│       ├── c_api_test.h
│       ├── engine.h
│       ├── executor.h
│       ├── expr_operator.h
│       ├── graph_attr_types.h
│       ├── imperative.h
│       ├── io.h
│       ├── ir/
│       │   └── expr.h
│       ├── kvstore.h
│       ├── lib_api.h
│       ├── libinfo.h
│       ├── ndarray.h
│       ├── node/
│       │   ├── container.h
│       │   └── node.h
│       ├── op_attr_types.h
│       ├── operator.h
│       ├── operator_util.h
│       ├── random_generator.h
│       ├── resource.h
│       ├── rtc.h
│       ├── runtime/
│       │   ├── c_runtime_api.h
│       │   ├── container.h
│       │   ├── container_ext.h
│       │   ├── data_type.h
│       │   ├── ffi_helper.h
│       │   ├── memory.h
│       │   ├── ndarray.h
│       │   ├── ndarray_handle.h
│       │   ├── object.h
│       │   ├── packed_func.h
│       │   ├── py_arg.h
│       │   └── registry.h
│       ├── storage.h
│       ├── tensor_blob.h
│       └── tuple.h
├── licenses/
│   ├── BOOST1_0
│   ├── BSD2
│   ├── BSD3-cmake
│   ├── MIT
│   └── OFL1_1
├── plugin/
│   ├── opencv/
│   │   ├── __init__.py
│   │   ├── cv_api.cc
│   │   ├── cv_api.h
│   │   ├── opencv.mk
│   │   └── opencv.py
│   ├── sframe/
│   │   ├── iter_sframe.cc
│   │   └── plugin.mk
│   ├── torch/
│   │   ├── torch.mk
│   │   ├── torch_base.cc
│   │   ├── torch_base.h
│   │   ├── torch_criterion-inl.h
│   │   ├── torch_criterion.cc
│   │   ├── torch_criterion.cu
│   │   ├── torch_function.cc
│   │   ├── torch_function.h
│   │   ├── torch_module-inl.h
│   │   ├── torch_module.cc
│   │   └── torch_module.cu
│   └── warpctc/
│       ├── warpctc-inl.h
│       ├── warpctc.cc
│       ├── warpctc.cu
│       └── warpctc.mk
├── prospector.yaml
├── pytest.ini
├── python/
│   ├── .gitignore
│   ├── README.md
│   ├── mxnet/
│   │   ├── __init__.py
│   │   ├── _api_internal.py
│   │   ├── _ctypes/
│   │   │   ├── __init__.py
│   │   │   ├── _api_internal.py
│   │   │   ├── cached_op.py
│   │   │   ├── ndarray.py
│   │   │   ├── space.py
│   │   │   └── symbol.py
│   │   ├── _cy3/
│   │   │   ├── README.md
│   │   │   └── __init__.py
│   │   ├── _deferred_compute.py
│   │   ├── _ffi/
│   │   │   ├── __init__.py
│   │   │   ├── _ctypes/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── function.py
│   │   │   │   ├── object.py
│   │   │   │   └── types.py
│   │   │   ├── _cy3/
│   │   │   │   └── __init__.py
│   │   │   ├── _cython/
│   │   │   │   ├── base.pxi
│   │   │   │   ├── core.pyx
│   │   │   │   ├── function.pxi
│   │   │   │   ├── ndarray.pxi
│   │   │   │   └── object.pxi
│   │   │   ├── base.py
│   │   │   ├── function.py
│   │   │   ├── node_generic.py
│   │   │   ├── object.py
│   │   │   └── runtime_ctypes.py
│   │   ├── _global_var.py
│   │   ├── _numpy_op_doc.py
│   │   ├── amp/
│   │   │   ├── __init__.py
│   │   │   ├── amp.py
│   │   │   ├── lists/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── symbol_bf16.py
│   │   │   │   └── symbol_fp16.py
│   │   │   └── loss_scaler.py
│   │   ├── api.py
│   │   ├── attribute.py
│   │   ├── autograd.py
│   │   ├── base.py
│   │   ├── callback.py
│   │   ├── container.py
│   │   ├── context.py
│   │   ├── contrib/
│   │   │   ├── __init__.py
│   │   │   ├── io.py
│   │   │   ├── ndarray.py
│   │   │   ├── onnx/
│   │   │   │   └── __init__.py
│   │   │   ├── quantization.py
│   │   │   ├── symbol.py
│   │   │   ├── tensorboard.py
│   │   │   ├── tensorrt.py
│   │   │   └── text/
│   │   │       ├── __init__.py
│   │   │       ├── _constants.py
│   │   │       ├── embedding.py
│   │   │       ├── utils.py
│   │   │       └── vocab.py
│   │   ├── cuda/
│   │   │   ├── __init__.py
│   │   │   └── nvtx.py
│   │   ├── cython/
│   │   │   ├── __init__.py
│   │   │   ├── base.pyi
│   │   │   ├── ndarray.pyx
│   │   │   └── symbol.pyx
│   │   ├── device.py
│   │   ├── dlpack.py
│   │   ├── engine.py
│   │   ├── error.py
│   │   ├── executor.py
│   │   ├── gluon/
│   │   │   ├── .gitignore
│   │   │   ├── __init__.py
│   │   │   ├── block.py
│   │   │   ├── contrib/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── data/
│   │   │   │   │   ├── __init__.py
│   │   │   │   │   ├── _constants.py
│   │   │   │   │   └── vision/
│   │   │   │   │       ├── __init__.py
│   │   │   │   │       ├── dataloader.py
│   │   │   │   │       └── transforms/
│   │   │   │   │           ├── __init__.py
│   │   │   │   │           └── bbox/
│   │   │   │   │               ├── __init__.py
│   │   │   │   │               ├── bbox.py
│   │   │   │   │               └── utils.py
│   │   │   │   └── estimator/
│   │   │   │       ├── __init__.py
│   │   │   │       ├── batch_processor.py
│   │   │   │       ├── estimator.py
│   │   │   │       ├── event_handler.py
│   │   │   │       └── utils.py
│   │   │   ├── data/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── _internal.py
│   │   │   │   ├── batchify.py
│   │   │   │   ├── dataloader.py
│   │   │   │   ├── dataset.py
│   │   │   │   ├── sampler.py
│   │   │   │   └── vision/
│   │   │   │       ├── __init__.py
│   │   │   │       ├── datasets.py
│   │   │   │       └── transforms/
│   │   │   │           ├── __init__.py
│   │   │   │           └── image.py
│   │   │   ├── loss.py
│   │   │   ├── metric.py
│   │   │   ├── model_zoo/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── model_store.py
│   │   │   │   └── vision/
│   │   │   │       ├── __init__.py
│   │   │   │       ├── alexnet.py
│   │   │   │       ├── densenet.py
│   │   │   │       ├── inception.py
│   │   │   │       ├── mobilenet.py
│   │   │   │       ├── resnet.py
│   │   │   │       ├── squeezenet.py
│   │   │   │       └── vgg.py
│   │   │   ├── nn/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── activations.py
│   │   │   │   ├── basic_layers.py
│   │   │   │   └── conv_layers.py
│   │   │   ├── parameter.py
│   │   │   ├── probability/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── block/
│   │   │   │   │   ├── __init__.py
│   │   │   │   │   └── stochastic_block.py
│   │   │   │   ├── distributions/
│   │   │   │   │   ├── __init__.py
│   │   │   │   │   ├── bernoulli.py
│   │   │   │   │   ├── beta.py
│   │   │   │   │   ├── binomial.py
│   │   │   │   │   ├── categorical.py
│   │   │   │   │   ├── cauchy.py
│   │   │   │   │   ├── chi2.py
│   │   │   │   │   ├── constraint.py
│   │   │   │   │   ├── dirichlet.py
│   │   │   │   │   ├── distribution.py
│   │   │   │   │   ├── divergence.py
│   │   │   │   │   ├── exp_family.py
│   │   │   │   │   ├── exponential.py
│   │   │   │   │   ├── fishersnedecor.py
│   │   │   │   │   ├── gamma.py
│   │   │   │   │   ├── geometric.py
│   │   │   │   │   ├── gumbel.py
│   │   │   │   │   ├── half_cauchy.py
│   │   │   │   │   ├── half_normal.py
│   │   │   │   │   ├── independent.py
│   │   │   │   │   ├── laplace.py
│   │   │   │   │   ├── multinomial.py
│   │   │   │   │   ├── multivariate_normal.py
│   │   │   │   │   ├── negative_binomial.py
│   │   │   │   │   ├── normal.py
│   │   │   │   │   ├── one_hot_categorical.py
│   │   │   │   │   ├── pareto.py
│   │   │   │   │   ├── poisson.py
│   │   │   │   │   ├── relaxed_bernoulli.py
│   │   │   │   │   ├── relaxed_one_hot_categorical.py
│   │   │   │   │   ├── studentT.py
│   │   │   │   │   ├── transformed_distribution.py
│   │   │   │   │   ├── uniform.py
│   │   │   │   │   ├── utils.py
│   │   │   │   │   └── weibull.py
│   │   │   │   └── transformation/
│   │   │   │       ├── __init__.py
│   │   │   │       ├── domain_map.py
│   │   │   │       └── transformation.py
│   │   │   ├── rnn/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── conv_rnn_cell.py
│   │   │   │   ├── rnn_cell.py
│   │   │   │   └── rnn_layer.py
│   │   │   ├── trainer.py
│   │   │   └── utils.py
│   │   ├── image/
│   │   │   ├── __init__.py
│   │   │   ├── detection.py
│   │   │   └── image.py
│   │   ├── initializer.py
│   │   ├── io/
│   │   │   ├── __init__.py
│   │   │   ├── io.py
│   │   │   └── utils.py
│   │   ├── kvstore/
│   │   │   ├── __init__.py
│   │   │   ├── base.py
│   │   │   ├── byteps.py
│   │   │   ├── horovod.py
│   │   │   ├── kvstore.py
│   │   │   └── kvstore_server.py
│   │   ├── libinfo.py
│   │   ├── library.py
│   │   ├── log.py
│   │   ├── lr_scheduler.py
│   │   ├── misc.py
│   │   ├── model.py
│   │   ├── name.py
│   │   ├── ndarray/
│   │   │   ├── __init__.py
│   │   │   ├── _internal.py
│   │   │   ├── contrib.py
│   │   │   ├── image.py
│   │   │   ├── linalg.py
│   │   │   ├── ndarray.py
│   │   │   ├── numpy/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── _api_internal.py
│   │   │   │   ├── _internal.py
│   │   │   │   ├── _op.py
│   │   │   │   ├── _register.py
│   │   │   │   ├── linalg.py
│   │   │   │   └── random.py
│   │   │   ├── numpy_extension/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── _api_internal.py
│   │   │   │   ├── _op.py
│   │   │   │   ├── _register.py
│   │   │   │   ├── control_flow.py
│   │   │   │   ├── image.py
│   │   │   │   └── random.py
│   │   │   ├── op.py
│   │   │   ├── random.py
│   │   │   ├── register.py
│   │   │   ├── sparse.py
│   │   │   └── utils.py
│   │   ├── ndarray_doc.py
│   │   ├── notebook/
│   │   │   ├── __init__.py
│   │   │   └── callback.py
│   │   ├── numpy/
│   │   │   ├── __init__.py
│   │   │   ├── _op.py
│   │   │   ├── _register.py
│   │   │   ├── arrayprint.py
│   │   │   ├── fallback.py
│   │   │   ├── fallback_linalg.py
│   │   │   ├── function_base.py
│   │   │   ├── io.py
│   │   │   ├── linalg.py
│   │   │   ├── multiarray.py
│   │   │   ├── random.py
│   │   │   ├── set_functions.py
│   │   │   ├── stride_tricks.py
│   │   │   ├── type_functions.py
│   │   │   └── utils.py
│   │   ├── numpy_dispatch_protocol.py
│   │   ├── numpy_extension/
│   │   │   ├── __init__.py
│   │   │   ├── _op.py
│   │   │   ├── _register.py
│   │   │   ├── control_flow.py
│   │   │   ├── image.py
│   │   │   ├── random.py
│   │   │   └── utils.py
│   │   ├── numpy_op_fallback.py
│   │   ├── numpy_op_signature.py
│   │   ├── onnx/
│   │   │   ├── README.md
│   │   │   ├── __init__.py
│   │   │   ├── mx2onnx/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── _export_helper.py
│   │   │   │   ├── _export_model.py
│   │   │   │   ├── _export_onnx.py
│   │   │   │   └── _op_translations/
│   │   │   │       ├── __init__.py
│   │   │   │       ├── _op_translations_opset12.py
│   │   │   │       └── _op_translations_opset13.py
│   │   │   └── setup.py
│   │   ├── operator.py
│   │   ├── optimizer/
│   │   │   ├── __init__.py
│   │   │   ├── adabelief.py
│   │   │   ├── adadelta.py
│   │   │   ├── adagrad.py
│   │   │   ├── adam.py
│   │   │   ├── adamW.py
│   │   │   ├── adamax.py
│   │   │   ├── contrib.py
│   │   │   ├── dcasgd.py
│   │   │   ├── ftml.py
│   │   │   ├── ftrl.py
│   │   │   ├── lamb.py
│   │   │   ├── lans.py
│   │   │   ├── lars.py
│   │   │   ├── nadam.py
│   │   │   ├── nag.py
│   │   │   ├── optimizer.py
│   │   │   ├── rmsprop.py
│   │   │   ├── sgd.py
│   │   │   ├── sgld.py
│   │   │   ├── signum.py
│   │   │   ├── updater.py
│   │   │   └── utils.py
│   │   ├── profiler.py
│   │   ├── random.py
│   │   ├── recordio.py
│   │   ├── registry.py
│   │   ├── rtc.py
│   │   ├── runtime.py
│   │   ├── symbol/
│   │   │   ├── __init__.py
│   │   │   ├── _internal.py
│   │   │   ├── contrib.py
│   │   │   ├── image.py
│   │   │   ├── linalg.py
│   │   │   ├── numpy/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── _internal.py
│   │   │   │   ├── _op.py
│   │   │   │   ├── _register.py
│   │   │   │   ├── _symbol.py
│   │   │   │   ├── linalg.py
│   │   │   │   └── random.py
│   │   │   ├── numpy_extension/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── _op.py
│   │   │   │   ├── _register.py
│   │   │   │   ├── image.py
│   │   │   │   └── random.py
│   │   │   ├── op.py
│   │   │   ├── random.py
│   │   │   ├── register.py
│   │   │   ├── sparse.py
│   │   │   └── symbol.py
│   │   ├── symbol_doc.py
│   │   ├── test_utils.py
│   │   ├── tvmop.py
│   │   ├── util.py
│   │   └── visualization.py
│   └── setup.py
├── rat-excludes
├── readthedocs.yml
├── snap.python
├── src/
│   ├── api/
│   │   ├── _api_internal/
│   │   │   └── _api_internal.cc
│   │   ├── cached_op_api.cc
│   │   └── operator/
│   │       ├── numpy/
│   │       │   ├── linalg/
│   │       │   │   ├── np_det.cc
│   │       │   │   ├── np_eig.cc
│   │       │   │   ├── np_eigvals.cc
│   │       │   │   ├── np_gesvd.cc
│   │       │   │   ├── np_inv.cc
│   │       │   │   ├── np_lstsq.cc
│   │       │   │   ├── np_matrix_rank.cc
│   │       │   │   ├── np_norm.cc
│   │       │   │   ├── np_pinv.cc
│   │       │   │   ├── np_potrf.cc
│   │       │   │   ├── np_qr.cc
│   │       │   │   ├── np_slogdet.cc
│   │       │   │   ├── np_solve.cc
│   │       │   │   ├── np_tensorinv.cc
│   │       │   │   └── np_tensorsolve.cc
│   │       │   ├── np_bincount_op.cc
│   │       │   ├── np_broadcast_reduce_op_boolean.cc
│   │       │   ├── np_broadcast_reduce_op_index.cc
│   │       │   ├── np_broadcast_reduce_op_value.cc
│   │       │   ├── np_cross.cc
│   │       │   ├── np_cumsum.cc
│   │       │   ├── np_delete_op.cc
│   │       │   ├── np_diff_op.cc
│   │       │   ├── np_dot_op.cc
│   │       │   ├── np_ediff1d_op.cc
│   │       │   ├── np_einsum_op.cc
│   │       │   ├── np_elemwise_broadcast_logic_op.cc
│   │       │   ├── np_elemwise_broadcast_op.cc
│   │       │   ├── np_elemwise_broadcast_op_extended_sec.cc
│   │       │   ├── np_elemwise_unary_op_basic.cc
│   │       │   ├── np_fill_diagonal_op.cc
│   │       │   ├── np_histogram_op.cc
│   │       │   ├── np_init_op.cc
│   │       │   ├── np_insert_op.cc
│   │       │   ├── np_interp_op.cc
│   │       │   ├── np_kron.cc
│   │       │   ├── np_matmul_op.cc
│   │       │   ├── np_matrix_op.cc
│   │       │   ├── np_memory_op.cc
│   │       │   ├── np_moments_op.cc
│   │       │   ├── np_nan_to_num_op.cc
│   │       │   ├── np_nonzero_op.cc
│   │       │   ├── np_ordering_op.cc
│   │       │   ├── np_pad_op.cc
│   │       │   ├── np_percentile_op.cc
│   │       │   ├── np_polynomial_op.cc
│   │       │   ├── np_repeat_op.cc
│   │       │   ├── np_tensordot_op.cc
│   │       │   ├── np_trace_op.cc
│   │       │   ├── np_tri_op.cc
│   │       │   ├── np_tril_op.cc
│   │       │   ├── np_triu_op.cc
│   │       │   ├── np_unique_op.cc
│   │       │   ├── np_where_op.cc
│   │       │   ├── np_window_op.cc
│   │       │   └── random/
│   │       │       ├── np_choice_op.cc
│   │       │       ├── np_exponential_op.cc
│   │       │       ├── np_laplace_op.cc
│   │       │       ├── np_location_scale_op.cc
│   │       │       ├── np_multinomial_op.cc
│   │       │       ├── np_pareto_op.cc
│   │       │       ├── np_power_op.cc
│   │       │       ├── np_rayleigh_op.cc
│   │       │       └── np_weibull_op.cc
│   │       ├── numpy_extension/
│   │       │   ├── npx_activation_op.cc
│   │       │   ├── npx_arange_like_op.cc
│   │       │   ├── npx_batch_dot_op.cc
│   │       │   ├── npx_batch_norm_op.cc
│   │       │   ├── npx_broadcast_like_op.cc
│   │       │   ├── npx_control_flow_op.cc
│   │       │   ├── npx_convolution_op.cc
│   │       │   ├── npx_deconvolution_op.cc
│   │       │   ├── npx_dropout_op.cc
│   │       │   ├── npx_embedding_op.cc
│   │       │   ├── npx_fully_connected_op.cc
│   │       │   ├── npx_group_norm_op.cc
│   │       │   ├── npx_layer_norm_op.cc
│   │       │   ├── npx_leaky_relu_op.cc
│   │       │   ├── npx_one_hot_op.cc
│   │       │   ├── npx_pick_op.cc
│   │       │   ├── npx_pooling_op.cc
│   │       │   ├── npx_rnn_op.cc
│   │       │   ├── npx_softmax_op.cc
│   │       │   └── npx_topk_op.cc
│   │       ├── op_utils.cc
│   │       ├── op_utils.h
│   │       ├── random/
│   │       │   ├── np_gamma_op.cc
│   │       │   ├── np_normal_op.cc
│   │       │   ├── np_randint_op.cc
│   │       │   ├── np_uniform_op.cc
│   │       │   └── shuffle_op.cc
│   │       ├── tensor/
│   │       │   ├── elemwise_binary_broadcast_op_extended.cc
│   │       │   ├── indexing_op.cc
│   │       │   ├── matrix_op.cc
│   │       │   └── unravel.cc
│   │       ├── ufunc_helper.cc
│   │       ├── ufunc_helper.h
│   │       ├── utils.cc
│   │       └── utils.h
│   ├── base.cc
│   ├── c_api/
│   │   ├── .clang-tidy
│   │   ├── c_api.cc
│   │   ├── c_api_common.h
│   │   ├── c_api_function.cc
│   │   ├── c_api_ndarray.cc
│   │   ├── c_api_profile.cc
│   │   ├── c_api_symbolic.cc
│   │   └── c_api_test.cc
│   ├── common/
│   │   ├── alm.cc
│   │   ├── alm.h
│   │   ├── cuda/
│   │   │   ├── cudnn_cxx.cc
│   │   │   ├── cudnn_cxx.h
│   │   │   ├── nvtx.h
│   │   │   ├── rtc/
│   │   │   │   ├── backward_functions-inl.h
│   │   │   │   ├── forward_functions-inl.h
│   │   │   │   ├── half-inl.h
│   │   │   │   ├── reducer-inl.h
│   │   │   │   ├── special_functions-inl.h
│   │   │   │   ├── util-inl.h
│   │   │   │   └── vectorization-inl.h
│   │   │   ├── rtc.cc
│   │   │   ├── rtc.h
│   │   │   ├── utils.cc
│   │   │   └── utils.h
│   │   ├── exec_utils.cc
│   │   ├── exec_utils.h
│   │   ├── lazy_alloc_array.h
│   │   ├── object_pool.h
│   │   ├── random_generator.cu
│   │   ├── rtc.cc
│   │   ├── static_array.h
│   │   ├── tensor_inspector.h
│   │   ├── utils.cc
│   │   ├── utils.cu
│   │   └── utils.h
│   ├── engine/
│   │   ├── engine.cc
│   │   ├── engine_impl.h
│   │   ├── naive_engine.cc
│   │   ├── openmp.cc
│   │   ├── openmp.h
│   │   ├── stream_manager.h
│   │   ├── thread_pool.h
│   │   ├── threaded_engine.cc
│   │   ├── threaded_engine.h
│   │   ├── threaded_engine_perdevice.cc
│   │   └── threaded_engine_pooled.cc
│   ├── imperative/
│   │   ├── attach_op_execs_pass.cc
│   │   ├── attach_op_resource_pass.cc
│   │   ├── cached_op.cc
│   │   ├── cached_op.h
│   │   ├── cached_op_threadsafe.cc
│   │   ├── cached_op_threadsafe.h
│   │   ├── cuda_graphs.h
│   │   ├── eliminate_common_expr_pass.cc
│   │   ├── exec_pass.h
│   │   ├── imperative.cc
│   │   ├── imperative_utils.cc
│   │   ├── imperative_utils.h
│   │   ├── infer_graph_attr_pass.cc
│   │   ├── inplace_addto_detect_pass.cc
│   │   ├── naive_cached_op.cc
│   │   ├── naive_cached_op.h
│   │   ├── pointwise_fusion_pass.cc
│   │   ├── simple_partition_pass.cc
│   │   └── simple_partition_pass.h
│   ├── initialize.cc
│   ├── initialize.h
│   ├── io/
│   │   ├── batchify.cc
│   │   ├── dataloader.cc
│   │   ├── dataset.cc
│   │   ├── image_aug_default.cc
│   │   ├── image_augmenter.h
│   │   ├── image_det_aug_default.cc
│   │   ├── image_io.cc
│   │   ├── image_iter_common.h
│   │   ├── image_recordio.h
│   │   ├── inst_vector.h
│   │   ├── io.cc
│   │   ├── iter_batchloader.h
│   │   ├── iter_csv.cc
│   │   ├── iter_image_det_recordio.cc
│   │   ├── iter_image_recordio.cc
│   │   ├── iter_image_recordio_2.cc
│   │   ├── iter_libsvm.cc
│   │   ├── iter_mnist.cc
│   │   ├── iter_normalize.h
│   │   ├── iter_prefetcher.h
│   │   ├── iter_sampler.cc
│   │   ├── iter_sparse.h
│   │   ├── iter_sparse_batchloader.h
│   │   ├── iter_sparse_prefetcher.h
│   │   └── opencv_compatibility.h
│   ├── ir/
│   │   └── expr.cc
│   ├── kvstore/
│   │   ├── comm.h
│   │   ├── comm_tree.h
│   │   ├── gpu_topology.h
│   │   ├── gradient_compression-inl.h
│   │   ├── gradient_compression.cc
│   │   ├── gradient_compression.cu
│   │   ├── gradient_compression.h
│   │   ├── kvstore.cc
│   │   ├── kvstore_dist.h
│   │   ├── kvstore_dist_server.h
│   │   ├── kvstore_local.h
│   │   ├── kvstore_nccl.h
│   │   ├── kvstore_utils.cc
│   │   ├── kvstore_utils.cu
│   │   ├── kvstore_utils.h
│   │   └── p3store_dist.h
│   ├── lang/
│   │   ├── expr.cc
│   │   └── ir.cc
│   ├── lib_api.cc
│   ├── libinfo.cc
│   ├── ndarray/
│   │   ├── ndarray.cc
│   │   ├── ndarray_function-inl.cuh
│   │   ├── ndarray_function-inl.h
│   │   ├── ndarray_function.cc
│   │   ├── ndarray_function.cu
│   │   └── ndarray_function.h
│   ├── nnvm/
│   │   ├── error.h
│   │   ├── gradient.cc
│   │   ├── graph_algorithm.h
│   │   ├── graph_editor.cc
│   │   ├── legacy_json_util.cc
│   │   ├── legacy_op_util.cc
│   │   ├── low_precision_pass.cc
│   │   ├── node_op_util.h
│   │   ├── plan_memory.cc
│   │   └── tvm_bridge.cc
│   ├── operator/
│   │   ├── all_finite-inl.h
│   │   ├── all_finite.cc
│   │   ├── all_finite.cu
│   │   ├── amp_graph_pass.cc
│   │   ├── bilinear_sampler-inl.h
│   │   ├── bilinear_sampler.cc
│   │   ├── bilinear_sampler.cu
│   │   ├── c_lapack_api.cc
│   │   ├── c_lapack_api.h
│   │   ├── channel_op_common.h
│   │   ├── contrib/
│   │   │   ├── adabelief-inl.h
│   │   │   ├── adabelief.cc
│   │   │   ├── adabelief.cu
│   │   │   ├── adamw-inl.h
│   │   │   ├── adamw.cc
│   │   │   ├── adamw.cu
│   │   │   ├── adaptive_avg_pooling-inl.h
│   │   │   ├── adaptive_avg_pooling.cc
│   │   │   ├── adaptive_avg_pooling.cu
│   │   │   ├── allclose_op-inl.h
│   │   │   ├── allclose_op.cc
│   │   │   ├── allclose_op.cu
│   │   │   ├── bilinear_resize-inl.cuh
│   │   │   ├── bilinear_resize-inl.h
│   │   │   ├── bilinear_resize.cc
│   │   │   ├── bilinear_resize.cu
│   │   │   ├── boolean_mask-inl.h
│   │   │   ├── boolean_mask.cc
│   │   │   ├── boolean_mask.cu
│   │   │   ├── bounding_box-common.h
│   │   │   ├── bounding_box-inl.cuh
│   │   │   ├── bounding_box-inl.h
│   │   │   ├── bounding_box.cc
│   │   │   ├── bounding_box.cu
│   │   │   ├── count_sketch-inl.h
│   │   │   ├── count_sketch.cc
│   │   │   ├── count_sketch.cu
│   │   │   ├── deformable_psroi_pooling-inl.h
│   │   │   ├── deformable_psroi_pooling.cc
│   │   │   ├── deformable_psroi_pooling.cu
│   │   │   ├── dgl_graph-inl.h
│   │   │   ├── dgl_graph.cc
│   │   │   ├── dgl_graph.cu
│   │   │   ├── dynamic_shape_ops-inl.h
│   │   │   ├── dynamic_shape_ops.cc
│   │   │   ├── erfinv-inl.h
│   │   │   ├── fft-inl.h
│   │   │   ├── fft.cc
│   │   │   ├── fft.cu
│   │   │   ├── gradient_multiplier_op.cc
│   │   │   ├── gradient_multiplier_op.cu
│   │   │   ├── hawkes_ll-inl.h
│   │   │   ├── hawkes_ll.cc
│   │   │   ├── hawkes_ll.cu
│   │   │   ├── index_array-inl.h
│   │   │   ├── index_array.cc
│   │   │   ├── index_array.cu
│   │   │   ├── index_copy-inl.h
│   │   │   ├── index_copy.cc
│   │   │   ├── index_copy.cu
│   │   │   ├── intgemm/
│   │   │   │   ├── intgemm_fully_connected_op.cc
│   │   │   │   ├── max_absolute_op.cc
│   │   │   │   ├── prepare_data_op.cc
│   │   │   │   ├── prepare_weight_op.cc
│   │   │   │   └── take_weight_op.cc
│   │   │   ├── krprod.cc
│   │   │   ├── krprod.h
│   │   │   ├── mrcnn_mask_target-inl.h
│   │   │   ├── mrcnn_mask_target.cu
│   │   │   ├── multi_lamb-inl.h
│   │   │   ├── multi_lamb.cc
│   │   │   ├── multi_lamb.cu
│   │   │   ├── multi_lans-inl.h
│   │   │   ├── multi_lans.cc
│   │   │   ├── multi_lans.cu
│   │   │   ├── multi_lars-inl.h
│   │   │   ├── multi_lars.cc
│   │   │   ├── multi_lars.cu
│   │   │   ├── multi_proposal-inl.h
│   │   │   ├── multi_proposal.cc
│   │   │   ├── multi_proposal.cu
│   │   │   ├── multi_sum_sq-inl.h
│   │   │   ├── multi_sum_sq.cc
│   │   │   ├── multi_sum_sq.cu
│   │   │   ├── multibox_detection-inl.h
│   │   │   ├── multibox_detection.cc
│   │   │   ├── multibox_detection.cu
│   │   │   ├── multibox_prior-inl.h
│   │   │   ├── multibox_prior.cc
│   │   │   ├── multibox_prior.cu
│   │   │   ├── multibox_target-inl.h
│   │   │   ├── multibox_target.cc
│   │   │   ├── multibox_target.cu
│   │   │   ├── nn/
│   │   │   │   ├── deformable_im2col.cuh
│   │   │   │   ├── deformable_im2col.h
│   │   │   │   ├── modulated_deformable_im2col.cuh
│   │   │   │   └── modulated_deformable_im2col.h
│   │   │   ├── nnz.cc
│   │   │   ├── optimizer_op-inl.h
│   │   │   ├── optimizer_op.cc
│   │   │   ├── optimizer_op.cu
│   │   │   ├── preloaded_multi_sgd-inl.h
│   │   │   ├── preloaded_multi_sgd.cc
│   │   │   ├── preloaded_multi_sgd.cu
│   │   │   ├── proposal-inl.h
│   │   │   ├── proposal.cc
│   │   │   ├── proposal.cu
│   │   │   ├── psroi_pooling-inl.h
│   │   │   ├── psroi_pooling.cc
│   │   │   ├── psroi_pooling.cu
│   │   │   ├── quadratic_op-inl.h
│   │   │   ├── quadratic_op.cc
│   │   │   ├── quadratic_op.cu
│   │   │   ├── reset_arrays-inl.h
│   │   │   ├── reset_arrays.cc
│   │   │   ├── reset_arrays.cu
│   │   │   ├── roi_align-inl.h
│   │   │   ├── roi_align.cc
│   │   │   ├── roi_align.cu
│   │   │   ├── rroi_align-inl.h
│   │   │   ├── rroi_align.cc
│   │   │   ├── stes_op.cc
│   │   │   ├── stes_op.cu
│   │   │   ├── stes_op.h
│   │   │   ├── sync_batch_norm-inl.h
│   │   │   ├── sync_batch_norm.cc
│   │   │   ├── sync_batch_norm.cu
│   │   │   ├── transformer-inl.h
│   │   │   ├── transformer.cc
│   │   │   ├── transformer.cu
│   │   │   └── tvmop/
│   │   │       ├── dot.cc
│   │   │       └── ufunc.cc
│   │   ├── control_flow.cc
│   │   ├── correlation-inl.h
│   │   ├── correlation.cc
│   │   ├── correlation.cu
│   │   ├── crop-inl.h
│   │   ├── crop.cc
│   │   ├── crop.cu
│   │   ├── cross_device_copy.cc
│   │   ├── cudnn_bilinear_sampler-inl.h
│   │   ├── cudnn_lrn-inl.h
│   │   ├── cudnn_ops.cc
│   │   ├── cudnn_ops.h
│   │   ├── cudnn_spatial_transformer-inl.h
│   │   ├── custom/
│   │   │   ├── custom-inl.h
│   │   │   ├── custom.cc
│   │   │   ├── native_op-inl.h
│   │   │   ├── native_op.cc
│   │   │   ├── native_op.cu
│   │   │   ├── ndarray_op-inl.h
│   │   │   └── ndarray_op.cc
│   │   ├── deformable_convolution-inl.h
│   │   ├── deformable_convolution.cc
│   │   ├── deformable_convolution.cu
│   │   ├── elemwise_op_common.h
│   │   ├── fusion/
│   │   │   ├── fused_op-inl.h
│   │   │   ├── fused_op.cc
│   │   │   ├── fused_op.cu
│   │   │   └── fused_op.h
│   │   ├── grid_generator-inl.h
│   │   ├── grid_generator.cc
│   │   ├── grid_generator.cu
│   │   ├── identity_attach_KL_sparse_reg-inl.h
│   │   ├── identity_attach_KL_sparse_reg.cc
│   │   ├── identity_attach_KL_sparse_reg.cu
│   │   ├── image/
│   │   │   ├── crop-inl.h
│   │   │   ├── crop.cc
│   │   │   ├── crop.cu
│   │   │   ├── image_random-inl.h
│   │   │   ├── image_random.cc
│   │   │   ├── image_random.cu
│   │   │   ├── image_utils.h
│   │   │   ├── resize-inl.h
│   │   │   ├── resize.cc
│   │   │   └── resize.cu
│   │   ├── instance_norm-inl.h
│   │   ├── instance_norm.cc
│   │   ├── instance_norm.cu
│   │   ├── l2_normalization-inl.h
│   │   ├── l2_normalization.cc
│   │   ├── l2_normalization.cu
│   │   ├── leaky_relu-inl.h
│   │   ├── leaky_relu.cc
│   │   ├── leaky_relu.cu
│   │   ├── linalg.h
│   │   ├── linalg_impl.h
│   │   ├── loss_binary_op-inl.h
│   │   ├── loss_binary_op.cc
│   │   ├── loss_binary_op.cu
│   │   ├── make_loss-inl.h
│   │   ├── make_loss.cc
│   │   ├── make_loss.cu
│   │   ├── math_functions-inl.h
│   │   ├── mkl_functions-inl.h
│   │   ├── modulated_deformable_convolution-inl.h
│   │   ├── modulated_deformable_convolution.cc
│   │   ├── modulated_deformable_convolution.cu
│   │   ├── mshadow_op.h
│   │   ├── mxnet_op.h
│   │   ├── nn/
│   │   │   ├── activation-inl.h
│   │   │   ├── activation.cc
│   │   │   ├── activation.cu
│   │   │   ├── batch_norm-inl.h
│   │   │   ├── batch_norm.cc
│   │   │   ├── batch_norm.cu
│   │   │   ├── concat-inl.h
│   │   │   ├── concat.cc
│   │   │   ├── concat.cu
│   │   │   ├── convolution-inl.h
│   │   │   ├── convolution.cc
│   │   │   ├── convolution.cu
│   │   │   ├── ctc_loss-inl.h
│   │   │   ├── ctc_loss.cc
│   │   │   ├── ctc_loss.cu
│   │   │   ├── cudnn/
│   │   │   │   ├── cudnn_activation-inl.h
│   │   │   │   ├── cudnn_algoreg-inl.h
│   │   │   │   ├── cudnn_algoreg.cc
│   │   │   │   ├── cudnn_batch_norm.cu
│   │   │   │   ├── cudnn_batch_norm.h
│   │   │   │   ├── cudnn_convolution-inl.h
│   │   │   │   ├── cudnn_deconvolution-inl.h
│   │   │   │   ├── cudnn_pooling-inl.h
│   │   │   │   └── cudnn_softmax_activation-inl.h
│   │   │   ├── deconvolution-inl.h
│   │   │   ├── deconvolution.cc
│   │   │   ├── deconvolution.cu
│   │   │   ├── depthwise_convolution-inl.h
│   │   │   ├── depthwise_convolution_tf.cuh
│   │   │   ├── dnnl/
│   │   │   │   ├── dnnl_act-inl.h
│   │   │   │   ├── dnnl_act.cc
│   │   │   │   ├── dnnl_base-inl.h
│   │   │   │   ├── dnnl_base.cc
│   │   │   │   ├── dnnl_batch_dot-inl.h
│   │   │   │   ├── dnnl_batch_dot.cc
│   │   │   │   ├── dnnl_batch_norm-inl.h
│   │   │   │   ├── dnnl_batch_norm.cc
│   │   │   │   ├── dnnl_binary-inl.h
│   │   │   │   ├── dnnl_binary.cc
│   │   │   │   ├── dnnl_concat-inl.h
│   │   │   │   ├── dnnl_concat.cc
│   │   │   │   ├── dnnl_convolution-inl.h
│   │   │   │   ├── dnnl_convolution.cc
│   │   │   │   ├── dnnl_copy-inl.h
│   │   │   │   ├── dnnl_copy.cc
│   │   │   │   ├── dnnl_deconvolution-inl.h
│   │   │   │   ├── dnnl_deconvolution.cc
│   │   │   │   ├── dnnl_dot-inl.h
│   │   │   │   ├── dnnl_dot.cc
│   │   │   │   ├── dnnl_eltwise-inl.h
│   │   │   │   ├── dnnl_eltwise.cc
│   │   │   │   ├── dnnl_fully_connected-inl.h
│   │   │   │   ├── dnnl_fully_connected.cc
│   │   │   │   ├── dnnl_layer_norm-inl.h
│   │   │   │   ├── dnnl_layer_norm.cc
│   │   │   │   ├── dnnl_log_softmax.cc
│   │   │   │   ├── dnnl_lrn-inl.h
│   │   │   │   ├── dnnl_masked_softmax-inl.h
│   │   │   │   ├── dnnl_masked_softmax.cc
│   │   │   │   ├── dnnl_pooling-inl.h
│   │   │   │   ├── dnnl_pooling.cc
│   │   │   │   ├── dnnl_pow_mul_scalar-inl.h
│   │   │   │   ├── dnnl_pow_mul_scalar.cc
│   │   │   │   ├── dnnl_reduce-inl.h
│   │   │   │   ├── dnnl_reduce.cc
│   │   │   │   ├── dnnl_reshape-inl.h
│   │   │   │   ├── dnnl_reshape.cc
│   │   │   │   ├── dnnl_rnn-inl.h
│   │   │   │   ├── dnnl_rnn.cc
│   │   │   │   ├── dnnl_softmax-inl.h
│   │   │   │   ├── dnnl_softmax.cc
│   │   │   │   ├── dnnl_softmax_output-inl.h
│   │   │   │   ├── dnnl_softmax_output.cc
│   │   │   │   ├── dnnl_split-inl.h
│   │   │   │   ├── dnnl_split.cc
│   │   │   │   ├── dnnl_stack-inl.h
│   │   │   │   ├── dnnl_stack.cc
│   │   │   │   ├── dnnl_sum-inl.h
│   │   │   │   ├── dnnl_sum.cc
│   │   │   │   ├── dnnl_transpose-inl.h
│   │   │   │   ├── dnnl_transpose.cc
│   │   │   │   ├── dnnl_where-inl.h
│   │   │   │   └── dnnl_where.cc
│   │   │   ├── dropout-inl.h
│   │   │   ├── dropout.cc
│   │   │   ├── dropout.cu
│   │   │   ├── fully_connected-inl.h
│   │   │   ├── fully_connected.cc
│   │   │   ├── fully_connected.cu
│   │   │   ├── group_norm-inl.h
│   │   │   ├── group_norm.cc
│   │   │   ├── group_norm.cu
│   │   │   ├── im2col-inl.h
│   │   │   ├── im2col.cc
│   │   │   ├── im2col.cu
│   │   │   ├── im2col.cuh
│   │   │   ├── im2col.h
│   │   │   ├── layer_norm-inl.h
│   │   │   ├── layer_norm.cc
│   │   │   ├── layer_norm.cu
│   │   │   ├── layer_norm_cpu.h
│   │   │   ├── log_softmax.cc
│   │   │   ├── log_softmax.cu
│   │   │   ├── lrn-inl.h
│   │   │   ├── lrn.cc
│   │   │   ├── lrn.cu
│   │   │   ├── masked_softmax.cc
│   │   │   ├── moments-inl.h
│   │   │   ├── moments.cc
│   │   │   ├── moments.cu
│   │   │   ├── pool.cuh
│   │   │   ├── pool.h
│   │   │   ├── pool_utils.h
│   │   │   ├── pooling-inl.h
│   │   │   ├── pooling.cc
│   │   │   ├── pooling.cu
│   │   │   ├── sequence_mask-inl.h
│   │   │   ├── softmax-inl.h
│   │   │   ├── softmax.cc
│   │   │   ├── softmax.cu
│   │   │   ├── softmax_activation-inl.h
│   │   │   ├── softmax_activation.cc
│   │   │   ├── softmax_activation.cu
│   │   │   ├── softmin.cc
│   │   │   ├── softmin.cu
│   │   │   ├── upsampling-inl.h
│   │   │   ├── upsampling.cc
│   │   │   └── upsampling.cu
│   │   ├── npx_control_flow.cc
│   │   ├── npx_control_flow.h
│   │   ├── numpy/
│   │   │   ├── linalg/
│   │   │   │   ├── broadcast_reduce_customized-inl.h
│   │   │   │   ├── broadcast_reduce_op_customized.h
│   │   │   │   ├── np_eig-inl.h
│   │   │   │   ├── np_eig.cc
│   │   │   │   ├── np_eig.cu
│   │   │   │   ├── np_eigvals-inl.h
│   │   │   │   ├── np_eigvals.cc
│   │   │   │   ├── np_eigvals.cu
│   │   │   │   ├── np_gesvd-inl.h
│   │   │   │   ├── np_gesvd.cc
│   │   │   │   ├── np_gesvd.cu
│   │   │   │   ├── np_lstsq-inl.h
│   │   │   │   ├── np_lstsq.cc
│   │   │   │   ├── np_lstsq.cu
│   │   │   │   ├── np_matrix_rank-inl.h
│   │   │   │   ├── np_matrix_rank.cc
│   │   │   │   ├── np_matrix_rank.cu
│   │   │   │   ├── np_norm-inl.h
│   │   │   │   ├── np_norm.cc
│   │   │   │   ├── np_norm_backward.cc
│   │   │   │   ├── np_norm_backward.cu
│   │   │   │   ├── np_norm_forward.cc
│   │   │   │   ├── np_norm_forward.cu
│   │   │   │   ├── np_pinv-inl.h
│   │   │   │   ├── np_pinv.cc
│   │   │   │   ├── np_pinv.cu
│   │   │   │   ├── np_potrf-inl.h
│   │   │   │   ├── np_potrf.cc
│   │   │   │   ├── np_potrf.cu
│   │   │   │   ├── np_qr-inl.h
│   │   │   │   ├── np_qr.cc
│   │   │   │   ├── np_qr.cu
│   │   │   │   ├── np_solve-inl.h
│   │   │   │   ├── np_solve.cc
│   │   │   │   ├── np_solve.cu
│   │   │   │   ├── np_tensorinv-inl.h
│   │   │   │   ├── np_tensorinv.cc
│   │   │   │   ├── np_tensorinv.cu
│   │   │   │   ├── np_tensorsolve-inl.h
│   │   │   │   ├── np_tensorsolve.cc
│   │   │   │   └── np_tensorsolve.cu
│   │   │   ├── np_bincount_op-inl.h
│   │   │   ├── np_bincount_op.cc
│   │   │   ├── np_bincount_op.cu
│   │   │   ├── np_boolean_mask_assign.cc
│   │   │   ├── np_boolean_mask_assign.cu
│   │   │   ├── np_broadcast_reduce_op.cc
│   │   │   ├── np_broadcast_reduce_op.h
│   │   │   ├── np_broadcast_reduce_op_boolean.cc
│   │   │   ├── np_broadcast_reduce_op_boolean.cu
│   │   │   ├── np_broadcast_reduce_op_index.cc
│   │   │   ├── np_broadcast_reduce_op_index.cu
│   │   │   ├── np_broadcast_reduce_op_value.h
│   │   │   ├── np_broadcast_reduce_op_value_broadcast_to.cc
│   │   │   ├── np_broadcast_reduce_op_value_broadcast_to.cu
│   │   │   ├── np_broadcast_reduce_op_value_max.cc
│   │   │   ├── np_broadcast_reduce_op_value_max.cu
│   │   │   ├── np_broadcast_reduce_op_value_mean.cc
│   │   │   ├── np_broadcast_reduce_op_value_mean.cu
│   │   │   ├── np_broadcast_reduce_op_value_min.cc
│   │   │   ├── np_broadcast_reduce_op_value_min.cu
│   │   │   ├── np_broadcast_reduce_op_value_prod.cc
│   │   │   ├── np_broadcast_reduce_op_value_prod.cu
│   │   │   ├── np_broadcast_reduce_op_value_sum.cc
│   │   │   ├── np_broadcast_reduce_op_value_sum.cu
│   │   │   ├── np_constraint_check.cc
│   │   │   ├── np_constraint_check.cu
│   │   │   ├── np_constraint_check.h
│   │   │   ├── np_cross-inl.h
│   │   │   ├── np_cross.cc
│   │   │   ├── np_cross.cu
│   │   │   ├── np_cumsum-inl.h
│   │   │   ├── np_cumsum.cc
│   │   │   ├── np_cumsum.cu
│   │   │   ├── np_delete_op-inl.h
│   │   │   ├── np_delete_op.cc
│   │   │   ├── np_delete_op.cu
│   │   │   ├── np_diff-inl.h
│   │   │   ├── np_diff.cc
│   │   │   ├── np_diff.cu
│   │   │   ├── np_dot-inl.h
│   │   │   ├── np_dot_backward.cc
│   │   │   ├── np_dot_backward.cu
│   │   │   ├── np_dot_forward.cc
│   │   │   ├── np_dot_forward.cu
│   │   │   ├── np_ediff1d_op-inl.h
│   │   │   ├── np_ediff1d_op.cc
│   │   │   ├── np_ediff1d_op.cu
│   │   │   ├── np_einsum_op-inl.h
│   │   │   ├── np_einsum_op.cc
│   │   │   ├── np_einsum_op.cu
│   │   │   ├── np_einsum_path_op-inl.h
│   │   │   ├── np_elemwise_broadcast_logic_op.h
│   │   │   ├── np_elemwise_broadcast_logic_op_and.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_and.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_equal.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_equal.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_greater.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_greater.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_greater_equal.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_greater_equal.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_less.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_less.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_less_equal.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_less_equal.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_not_equal.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_not_equal.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_or.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_or.cu
│   │   │   ├── np_elemwise_broadcast_logic_op_xor.cc
│   │   │   ├── np_elemwise_broadcast_logic_op_xor.cu
│   │   │   ├── np_elemwise_broadcast_op.h
│   │   │   ├── np_elemwise_broadcast_op_add.cc
│   │   │   ├── np_elemwise_broadcast_op_add.cu
│   │   │   ├── np_elemwise_broadcast_op_extended.cc
│   │   │   ├── np_elemwise_broadcast_op_extended.cu
│   │   │   ├── np_elemwise_broadcast_op_extended_sec.cc
│   │   │   ├── np_elemwise_broadcast_op_extended_sec.cu
│   │   │   ├── np_elemwise_broadcast_op_extended_thi.cc
│   │   │   ├── np_elemwise_broadcast_op_extended_thi.cu
│   │   │   ├── np_elemwise_broadcast_op_lae.cc
│   │   │   ├── np_elemwise_broadcast_op_lae.cu
│   │   │   ├── np_elemwise_broadcast_op_mod.cc
│   │   │   ├── np_elemwise_broadcast_op_mod.cu
│   │   │   ├── np_elemwise_broadcast_op_mul.cc
│   │   │   ├── np_elemwise_broadcast_op_mul.cu
│   │   │   ├── np_elemwise_broadcast_op_pow.cc
│   │   │   ├── np_elemwise_broadcast_op_pow.cu
│   │   │   ├── np_elemwise_broadcast_op_scalar.cc
│   │   │   ├── np_elemwise_broadcast_op_scalar.cu
│   │   │   ├── np_elemwise_broadcast_op_sub.cc
│   │   │   ├── np_elemwise_broadcast_op_sub.cu
│   │   │   ├── np_elemwise_unary_op_basic.cc
│   │   │   ├── np_elemwise_unary_op_basic.cu
│   │   │   ├── np_fill_diagonal_op-inl.h
│   │   │   ├── np_fill_diagonal_op.cc
│   │   │   ├── np_fill_diagonal_op.cu
│   │   │   ├── np_floor_divide.cc
│   │   │   ├── np_floor_divide.cu
│   │   │   ├── np_indexing_op.cc
│   │   │   ├── np_indexing_op.cu
│   │   │   ├── np_indexing_op.h
│   │   │   ├── np_init_op.cc
│   │   │   ├── np_init_op.cu
│   │   │   ├── np_init_op.h
│   │   │   ├── np_insert_op-inl.h
│   │   │   ├── np_insert_op_scalar-inl.h
│   │   │   ├── np_insert_op_scalar.cc
│   │   │   ├── np_insert_op_scalar.cu
│   │   │   ├── np_insert_op_slice-inl.h
│   │   │   ├── np_insert_op_slice.cc
│   │   │   ├── np_insert_op_slice.cu
│   │   │   ├── np_insert_op_tensor-inl.h
│   │   │   ├── np_insert_op_tensor.cc
│   │   │   ├── np_insert_op_tensor.cu
│   │   │   ├── np_interp_op-inl.h
│   │   │   ├── np_interp_op.cc
│   │   │   ├── np_interp_op.cu
│   │   │   ├── np_kron-inl.h
│   │   │   ├── np_kron_backward.cc
│   │   │   ├── np_kron_backward.cu
│   │   │   ├── np_kron_forward.cc
│   │   │   ├── np_kron_forward.cu
│   │   │   ├── np_matmul_op-inl.h
│   │   │   ├── np_matmul_op.cc
│   │   │   ├── np_matmul_op.cu
│   │   │   ├── np_matrix_op-inl.h
│   │   │   ├── np_matrix_op.cc
│   │   │   ├── np_matrix_op.cu
│   │   │   ├── np_memory_op.cc
│   │   │   ├── np_memory_op.cu
│   │   │   ├── np_memory_op.h
│   │   │   ├── np_moments_op.cc
│   │   │   ├── np_moments_op.cu
│   │   │   ├── np_nonzero_op-inl.h
│   │   │   ├── np_nonzero_op.cc
│   │   │   ├── np_nonzero_op.cu
│   │   │   ├── np_pad_op-inl.h
│   │   │   ├── np_pad_op.cc
│   │   │   ├── np_pad_op.cu
│   │   │   ├── np_percentile_op-inl.h
│   │   │   ├── np_percentile_op.cc
│   │   │   ├── np_percentile_op.cu
│   │   │   ├── np_polynomial_op-inl.h
│   │   │   ├── np_polynomial_op.cc
│   │   │   ├── np_polynomial_op.cu
│   │   │   ├── np_repeat_op-inl.h
│   │   │   ├── np_repeat_op.cc
│   │   │   ├── np_repeat_op.cu
│   │   │   ├── np_tensordot_op-inl.h
│   │   │   ├── np_tensordot_op.cc
│   │   │   ├── np_tensordot_op.cu
│   │   │   ├── np_trace_op-inl.h
│   │   │   ├── np_trace_op.cc
│   │   │   ├── np_trace_op.cu
│   │   │   ├── np_tri_op-inl.h
│   │   │   ├── np_tri_op.cc
│   │   │   ├── np_tri_op.cu
│   │   │   ├── np_tril_op-inl.h
│   │   │   ├── np_tril_op.cc
│   │   │   ├── np_tril_op.cu
│   │   │   ├── np_triu_op-inl.h
│   │   │   ├── np_triu_op.cc
│   │   │   ├── np_triu_op.cu
│   │   │   ├── np_true_divide-inl.h
│   │   │   ├── np_true_divide.cc
│   │   │   ├── np_true_divide.cu
│   │   │   ├── np_unique_op.cc
│   │   │   ├── np_unique_op.cu
│   │   │   ├── np_unique_op.h
│   │   │   ├── np_where_backward_op.cc
│   │   │   ├── np_where_backward_op.cu
│   │   │   ├── np_where_forward_op.cc
│   │   │   ├── np_where_forward_op.cu
│   │   │   ├── np_where_op-inl.h
│   │   │   ├── np_window_op.cc
│   │   │   ├── np_window_op.cu
│   │   │   ├── np_window_op.h
│   │   │   └── random/
│   │   │       ├── dist_common.cc
│   │   │       ├── dist_common.cu
│   │   │       ├── dist_common.h
│   │   │       ├── np_bernoulli_op.cc
│   │   │       ├── np_bernoulli_op.cu
│   │   │       ├── np_bernoulli_op.h
│   │   │       ├── np_choice_op.cc
│   │   │       ├── np_choice_op.cu
│   │   │       ├── np_choice_op.h
│   │   │       ├── np_exponential_op.cc
│   │   │       ├── np_exponential_op.cu
│   │   │       ├── np_exponential_op.h
│   │   │       ├── np_gamma_op.cc
│   │   │       ├── np_gamma_op.cu
│   │   │       ├── np_gamma_op.h
│   │   │       ├── np_laplace_op.cc
│   │   │       ├── np_laplace_op.cu
│   │   │       ├── np_laplace_op.h
│   │   │       ├── np_location_scale_op.cc
│   │   │       ├── np_location_scale_op.cu
│   │   │       ├── np_location_scale_op.h
│   │   │       ├── np_multinomial_op.cc
│   │   │       ├── np_multinomial_op.cu
│   │   │       ├── np_multinomial_op.h
│   │   │       ├── np_normal_op.cc
│   │   │       ├── np_normal_op.cu
│   │   │       ├── np_normal_op.h
│   │   │       ├── np_pareto_op.cc
│   │   │       ├── np_pareto_op.cu
│   │   │       ├── np_pareto_op.h
│   │   │       ├── np_power_op.cc
│   │   │       ├── np_power_op.cu
│   │   │       ├── np_power_op.h
│   │   │       ├── np_rayleigh_op.cc
│   │   │       ├── np_rayleigh_op.cu
│   │   │       ├── np_rayleigh_op.h
│   │   │       ├── np_uniform_op.cc
│   │   │       ├── np_uniform_op.cu
│   │   │       ├── np_uniform_op.h
│   │   │       ├── np_weibull_op.cc
│   │   │       ├── np_weibull_op.cu
│   │   │       └── np_weibull_op.h
│   │   ├── operator.cc
│   │   ├── operator_common.h
│   │   ├── operator_tune-inl.h
│   │   ├── operator_tune.cc
│   │   ├── operator_tune.h
│   │   ├── operator_util.cc
│   │   ├── optimizer_op-inl.h
│   │   ├── optimizer_op.cc
│   │   ├── optimizer_op.cu
│   │   ├── pad-inl.h
│   │   ├── pad.cc
│   │   ├── pad.cu
│   │   ├── quantization/
│   │   │   ├── calibrate-inl.h
│   │   │   ├── calibrate.cc
│   │   │   ├── dequantize-inl.h
│   │   │   ├── dequantize.cc
│   │   │   ├── dequantize.cu
│   │   │   ├── dnnl/
│   │   │   │   ├── dnnl_dequantize-inl.h
│   │   │   │   ├── dnnl_quantize-inl.h
│   │   │   │   ├── dnnl_quantize_asym-inl.h
│   │   │   │   ├── dnnl_quantize_v2-inl.h
│   │   │   │   ├── dnnl_quantized_act.cc
│   │   │   │   ├── dnnl_quantized_batch_norm.cc
│   │   │   │   ├── dnnl_quantized_concat.cc
│   │   │   │   ├── dnnl_quantized_conv.cc
│   │   │   │   ├── dnnl_quantized_elemwise_add.cc
│   │   │   │   ├── dnnl_quantized_flatten.cc
│   │   │   │   ├── dnnl_quantized_fully_connected.cc
│   │   │   │   ├── dnnl_quantized_ops-inl.h
│   │   │   │   ├── dnnl_quantized_pooling.cc
│   │   │   │   ├── dnnl_quantized_reshape.cc
│   │   │   │   ├── dnnl_quantized_rnn-inl.h
│   │   │   │   ├── dnnl_quantized_rnn.cc
│   │   │   │   ├── dnnl_quantized_transpose.cc
│   │   │   │   └── dnnl_requantize-inl.h
│   │   │   ├── quantization_utils.h
│   │   │   ├── quantize-inl.h
│   │   │   ├── quantize.cc
│   │   │   ├── quantize.cu
│   │   │   ├── quantize_asym-inl.h
│   │   │   ├── quantize_asym.cc
│   │   │   ├── quantize_graph_pass.cc
│   │   │   ├── quantize_v2-inl.h
│   │   │   ├── quantize_v2.cc
│   │   │   ├── quantize_v2.cu
│   │   │   ├── quantized_activation.cc
│   │   │   ├── quantized_batch_norm.cc
│   │   │   ├── quantized_batch_norm_relu.cc
│   │   │   ├── quantized_concat.cc
│   │   │   ├── quantized_conv.cc
│   │   │   ├── quantized_conv.cu
│   │   │   ├── quantized_elemwise_add-inl.h
│   │   │   ├── quantized_elemwise_add.cc
│   │   │   ├── quantized_elemwise_mul-inl.h
│   │   │   ├── quantized_elemwise_mul.cc
│   │   │   ├── quantized_flatten-inl.h
│   │   │   ├── quantized_flatten.cc
│   │   │   ├── quantized_flatten.cu
│   │   │   ├── quantized_fully_connected.cc
│   │   │   ├── quantized_fully_connected.cu
│   │   │   ├── quantized_indexing_op.cc
│   │   │   ├── quantized_pooling.cc
│   │   │   ├── quantized_pooling.cu
│   │   │   ├── quantized_reshape-inl.h
│   │   │   ├── quantized_reshape.cc
│   │   │   ├── quantized_rnn-inl.h
│   │   │   ├── quantized_rnn.cc
│   │   │   ├── quantized_transpose.cc
│   │   │   ├── requantize-inl.h
│   │   │   ├── requantize.cc
│   │   │   └── requantize.cu
│   │   ├── random/
│   │   │   ├── multisample_op.cc
│   │   │   ├── multisample_op.cu
│   │   │   ├── multisample_op.h
│   │   │   ├── pdf_op.cc
│   │   │   ├── pdf_op.cu
│   │   │   ├── pdf_op.h
│   │   │   ├── sample_multinomial_op.cc
│   │   │   ├── sample_multinomial_op.cu
│   │   │   ├── sample_multinomial_op.h
│   │   │   ├── sample_op.cc
│   │   │   ├── sample_op.cu
│   │   │   ├── sample_op.h
│   │   │   ├── sampler.h
│   │   │   ├── shuffle_op.cc
│   │   │   ├── shuffle_op.cu
│   │   │   ├── unique_sample_op.cc
│   │   │   └── unique_sample_op.h
│   │   ├── regression_output-inl.h
│   │   ├── regression_output.cc
│   │   ├── regression_output.cu
│   │   ├── rnn-inl.h
│   │   ├── rnn.cc
│   │   ├── rnn.cu
│   │   ├── rnn_impl.h
│   │   ├── roi_pooling-inl.h
│   │   ├── roi_pooling.cc
│   │   ├── roi_pooling.cu
│   │   ├── sequence_last-inl.h
│   │   ├── sequence_last.cc
│   │   ├── sequence_last.cu
│   │   ├── sequence_mask-inl.h
│   │   ├── sequence_mask.cc
│   │   ├── sequence_mask.cu
│   │   ├── sequence_op_common.h
│   │   ├── sequence_reverse-inl.h
│   │   ├── sequence_reverse.cc
│   │   ├── sequence_reverse.cu
│   │   ├── slice_channel-inl.h
│   │   ├── slice_channel.cc
│   │   ├── slice_channel.cu
│   │   ├── softmax_output-inl.h
│   │   ├── softmax_output.cc
│   │   ├── softmax_output.cu
│   │   ├── spatial_transformer-inl.h
│   │   ├── spatial_transformer.cc
│   │   ├── spatial_transformer.cu
│   │   ├── special_functions-inl.h
│   │   ├── subgraph/
│   │   │   ├── build_subgraph.cc
│   │   │   ├── common.h
│   │   │   ├── default_subgraph_property.cc
│   │   │   ├── default_subgraph_property_v2.cc
│   │   │   ├── dnnl/
│   │   │   │   ├── dnnl_batch_dot.cc
│   │   │   │   ├── dnnl_batch_dot_property.h
│   │   │   │   ├── dnnl_bn_relu.cc
│   │   │   │   ├── dnnl_bn_relu_property.h
│   │   │   │   ├── dnnl_common.h
│   │   │   │   ├── dnnl_conv-inl.h
│   │   │   │   ├── dnnl_conv.cc
│   │   │   │   ├── dnnl_conv_property.h
│   │   │   │   ├── dnnl_fc-inl.h
│   │   │   │   ├── dnnl_fc.cc
│   │   │   │   ├── dnnl_fc_property.h
│   │   │   │   ├── dnnl_fc_sum_fuse_property.h
│   │   │   │   ├── dnnl_identity_property.h
│   │   │   │   ├── dnnl_post_amp_property.h
│   │   │   │   ├── dnnl_post_quantize_align_scale_property.h
│   │   │   │   ├── dnnl_post_quantize_property.h
│   │   │   │   ├── dnnl_pow_mul_scalar.cc
│   │   │   │   ├── dnnl_pow_mul_scalar_property.h
│   │   │   │   ├── dnnl_remove_casts_property.h
│   │   │   │   ├── dnnl_subgraph_base-inl.h
│   │   │   │   ├── dnnl_subgraph_property.cc
│   │   │   │   ├── dnnl_transformer-inl.h
│   │   │   │   ├── dnnl_transformer.cc
│   │   │   │   ├── dnnl_transformer_qk_common.h
│   │   │   │   ├── dnnl_transformer_qk_property.h
│   │   │   │   └── dnnl_transformer_valatt_property.h
│   │   │   ├── eliminate_common_nodes_pass.cc
│   │   │   ├── partitioner/
│   │   │   │   └── custom_subgraph_property.h
│   │   │   ├── static_shape_subgraph_property.cc
│   │   │   ├── subgraph_property.h
│   │   │   └── tensorrt/
│   │   │       ├── nnvm_to_onnx-inl.h
│   │   │       ├── nnvm_to_onnx.cc
│   │   │       ├── onnx_to_tensorrt.cc
│   │   │       ├── onnx_to_tensorrt.h
│   │   │       ├── tensorrt-inl.h
│   │   │       ├── tensorrt.cc
│   │   │       └── tensorrt.cu
│   │   ├── subgraph_op_common.cc
│   │   ├── subgraph_op_common.h
│   │   ├── svm_output-inl.h
│   │   ├── svm_output.cc
│   │   ├── svm_output.cu
│   │   ├── swapaxis-inl.h
│   │   ├── swapaxis.cc
│   │   ├── swapaxis.cu
│   │   ├── tensor/
│   │   │   ├── amp_cast.cc
│   │   │   ├── amp_cast.cu
│   │   │   ├── amp_cast.h
│   │   │   ├── broadcast_reduce-inl.h
│   │   │   ├── broadcast_reduce_minmax_value.cc
│   │   │   ├── broadcast_reduce_minmax_value.cu
│   │   │   ├── broadcast_reduce_norm_value.cc
│   │   │   ├── broadcast_reduce_norm_value.cu
│   │   │   ├── broadcast_reduce_op.cc
│   │   │   ├── broadcast_reduce_op.h
│   │   │   ├── broadcast_reduce_op_index.cc
│   │   │   ├── broadcast_reduce_op_index.cu
│   │   │   ├── broadcast_reduce_op_value.cc
│   │   │   ├── broadcast_reduce_op_value.cu
│   │   │   ├── broadcast_reduce_prod_value.cc
│   │   │   ├── broadcast_reduce_prod_value.cu
│   │   │   ├── broadcast_reduce_sum_value.cc
│   │   │   ├── broadcast_reduce_sum_value.cu
│   │   │   ├── cast_storage-inl.cuh
│   │   │   ├── cast_storage-inl.h
│   │   │   ├── cast_storage.cc
│   │   │   ├── cast_storage.cu
│   │   │   ├── control_flow_op.cc
│   │   │   ├── control_flow_op.cu
│   │   │   ├── control_flow_op.h
│   │   │   ├── diag_op-inl.h
│   │   │   ├── diag_op.cc
│   │   │   ├── diag_op.cu
│   │   │   ├── dot-inl.cuh
│   │   │   ├── dot-inl.h
│   │   │   ├── dot.cc
│   │   │   ├── dot.cu
│   │   │   ├── elemwise_binary_broadcast_op.cc
│   │   │   ├── elemwise_binary_broadcast_op.h
│   │   │   ├── elemwise_binary_broadcast_op_basic.cc
│   │   │   ├── elemwise_binary_broadcast_op_basic.cu
│   │   │   ├── elemwise_binary_broadcast_op_extended.cc
│   │   │   ├── elemwise_binary_broadcast_op_extended.cu
│   │   │   ├── elemwise_binary_broadcast_op_logic.cc
│   │   │   ├── elemwise_binary_broadcast_op_logic.cu
│   │   │   ├── elemwise_binary_op-inl.h
│   │   │   ├── elemwise_binary_op.cc
│   │   │   ├── elemwise_binary_op.h
│   │   │   ├── elemwise_binary_op_basic.cc
│   │   │   ├── elemwise_binary_op_basic.cu
│   │   │   ├── elemwise_binary_op_extended.cc
│   │   │   ├── elemwise_binary_op_extended.cu
│   │   │   ├── elemwise_binary_op_logic.cc
│   │   │   ├── elemwise_binary_op_logic.cu
│   │   │   ├── elemwise_binary_scalar_op.cc
│   │   │   ├── elemwise_binary_scalar_op.h
│   │   │   ├── elemwise_binary_scalar_op_basic.cc
│   │   │   ├── elemwise_binary_scalar_op_basic.cu
│   │   │   ├── elemwise_binary_scalar_op_extended.cc
│   │   │   ├── elemwise_binary_scalar_op_extended.cu
│   │   │   ├── elemwise_binary_scalar_op_logic.cc
│   │   │   ├── elemwise_binary_scalar_op_logic.cu
│   │   │   ├── elemwise_sum.cc
│   │   │   ├── elemwise_sum.cu
│   │   │   ├── elemwise_sum.h
│   │   │   ├── elemwise_unary_op.cc
│   │   │   ├── elemwise_unary_op.h
│   │   │   ├── elemwise_unary_op_basic.cc
│   │   │   ├── elemwise_unary_op_basic.cu
│   │   │   ├── elemwise_unary_op_logexp.cc
│   │   │   ├── elemwise_unary_op_logexp.cu
│   │   │   ├── elemwise_unary_op_pow.cc
│   │   │   ├── elemwise_unary_op_pow.cu
│   │   │   ├── elemwise_unary_op_trig.cc
│   │   │   ├── elemwise_unary_op_trig.cu
│   │   │   ├── histogram-inl.h
│   │   │   ├── histogram.cc
│   │   │   ├── histogram.cu
│   │   │   ├── index_add-inl.h
│   │   │   ├── index_add_backward.cc
│   │   │   ├── index_add_backward.cu
│   │   │   ├── index_add_forward.cc
│   │   │   ├── index_add_forward.cu
│   │   │   ├── index_update-inl.h
│   │   │   ├── index_update.cc
│   │   │   ├── index_update.cu
│   │   │   ├── indexing_op-inl.cuh
│   │   │   ├── indexing_op.cc
│   │   │   ├── indexing_op.cu
│   │   │   ├── indexing_op.h
│   │   │   ├── init_op.cc
│   │   │   ├── init_op.cu
│   │   │   ├── init_op.h
│   │   │   ├── la_op-inl.h
│   │   │   ├── la_op.cc
│   │   │   ├── la_op.cu
│   │   │   ├── la_op.h
│   │   │   ├── matrix_op-inl.h
│   │   │   ├── matrix_op.cc
│   │   │   ├── matrix_op.cu
│   │   │   ├── ordering_op-inl.h
│   │   │   ├── ordering_op.cc
│   │   │   ├── ordering_op.cu
│   │   │   ├── pseudo2DTranspose_op-inl.cuh
│   │   │   ├── ravel.cc
│   │   │   ├── ravel.cu
│   │   │   ├── ravel.h
│   │   │   ├── reduce_rtc.cc
│   │   │   ├── slice-inl.h
│   │   │   ├── sort_op-inl.cuh
│   │   │   ├── sort_op.h
│   │   │   ├── sparse_retain-inl.h
│   │   │   ├── sparse_retain.cc
│   │   │   ├── sparse_retain.cu
│   │   │   ├── square_sum-inl.h
│   │   │   ├── square_sum.cc
│   │   │   ├── square_sum.cu
│   │   │   └── util/
│   │   │       ├── tensor_util-inl.cuh
│   │   │       └── tensor_util-inl.h
│   │   └── tvmop/
│   │       ├── op_module.cc
│   │       └── op_module.h
│   ├── optimizer/
│   │   └── sgd-inl.h
│   ├── profiler/
│   │   ├── aggregate_stats.cc
│   │   ├── aggregate_stats.h
│   │   ├── custom_op_profiler.h
│   │   ├── profiler.cc
│   │   ├── profiler.h
│   │   ├── storage_profiler.cc
│   │   ├── storage_profiler.h
│   │   ├── vtune.cc
│   │   └── vtune.h
│   ├── resource.cc
│   ├── runtime/
│   │   ├── c_runtime_api.cc
│   │   ├── container.cc
│   │   ├── ndarray_handle.cc
│   │   ├── object.cc
│   │   ├── object_internal.h
│   │   └── registry.cc
│   ├── serialization/
│   │   ├── cnpy.cc
│   │   └── cnpy.h
│   └── storage/
│       ├── cpu_device_storage.h
│       ├── cpu_shared_storage_manager.h
│       ├── gpu_device_storage.h
│       ├── naive_storage_manager.h
│       ├── pinned_memory_storage.h
│       ├── pooled_storage_manager.h
│       ├── storage.cc
│       ├── storage_manager.h
│       └── storage_manager_helpers.h
├── tests/
│   ├── .gitignore
│   ├── CMakeLists.txt
│   ├── README.md
│   ├── cpp/
│   │   ├── .gitignore
│   │   ├── engine/
│   │   │   ├── engine_shutdown_test.cc
│   │   │   ├── omp_test.cc
│   │   │   ├── thread_local_test.cc
│   │   │   └── threaded_engine_test.cc
│   │   ├── include/
│   │   │   ├── test_core_op.h
│   │   │   ├── test_dnnl.h
│   │   │   ├── test_legacy_op.h
│   │   │   ├── test_ndarray_utils.h
│   │   │   ├── test_op.h
│   │   │   ├── test_op_runner.h
│   │   │   ├── test_perf.h
│   │   │   ├── test_tune.h
│   │   │   └── test_util.h
│   │   ├── kvstore/
│   │   │   └── gpu_topology_test.cc
│   │   ├── misc/
│   │   │   ├── base.cc
│   │   │   └── libinfo_test.cc
│   │   ├── operator/
│   │   │   ├── activation_perf.cc
│   │   │   ├── batchnorm_test.cc
│   │   │   ├── coreop_perf.cc
│   │   │   ├── dnnl_operator_test.cc
│   │   │   ├── dnnl_test.cc
│   │   │   ├── dropout_perf.cc
│   │   │   ├── fully_conn_perf.cc
│   │   │   ├── krprod_test.cc
│   │   │   ├── runner/
│   │   │   │   └── core_op_runner_test.cc
│   │   │   ├── slice_channel_perf.cc
│   │   │   └── tune/
│   │   │       └── operator_tune_test.cc
│   │   ├── storage/
│   │   │   └── storage_test.cc
│   │   └── test_main.cc
│   ├── nightly/
│   │   ├── .gitignore
│   │   ├── Jenkinsfile
│   │   ├── JenkinsfileForBinaries
│   │   ├── README.md
│   │   ├── TestDoc/
│   │   │   ├── doc_spell_checker.py
│   │   │   └── doc_spell_grammar.sh
│   │   ├── common.py
│   │   ├── dist_async_kvstore.py
│   │   ├── dist_device_sync_kvstore.py
│   │   ├── dist_device_sync_kvstore_byteps.py
│   │   ├── dist_device_sync_kvstore_custom.py
│   │   ├── dist_device_sync_kvstore_horovod.py
│   │   ├── dist_sync_kvstore.py
│   │   ├── estimator/
│   │   │   ├── test_estimator_cnn.py
│   │   │   └── test_sentiment_rnn.py
│   │   ├── model_backwards_compatibility_check/
│   │   │   ├── JenkinsfileForMBCC
│   │   │   ├── README.md
│   │   │   ├── __init__.py
│   │   │   ├── common.py
│   │   │   ├── model_backward_compat_checker.sh
│   │   │   ├── model_backwards_compat_inference.py
│   │   │   ├── model_backwards_compat_train.py
│   │   │   ├── train_mxnet_legacy_models.sh
│   │   │   └── upload_models_to_s3.sh
│   │   ├── test_distributed_training-gpu.sh
│   │   ├── test_kvstore.py
│   │   ├── test_large_array.py
│   │   ├── test_large_vector.py
│   │   ├── test_np_large_array.py
│   │   ├── test_np_random.py
│   │   └── test_server_profiling.py
│   ├── python/
│   │   ├── README.md
│   │   ├── amp/
│   │   │   └── common.py
│   │   ├── array-api/
│   │   │   └── test_data_interchange.py
│   │   ├── common/
│   │   │   └── models.py
│   │   ├── conftest.py
│   │   ├── dnnl/
│   │   │   ├── op_cfg.py
│   │   │   ├── subgraphs/
│   │   │   │   ├── subgraph_common.py
│   │   │   │   ├── test_amp_subgraph.py
│   │   │   │   ├── test_conv_subgraph.py
│   │   │   │   ├── test_fc_subgraph.py
│   │   │   │   ├── test_matmul_subgraph.py
│   │   │   │   └── test_pow_mul_subgraph.py
│   │   │   ├── test_amp.py
│   │   │   ├── test_bf16_operator.py
│   │   │   ├── test_dnnl.py
│   │   │   └── test_quantization_dnnl.py
│   │   ├── doctest/
│   │   │   └── test_docstring.py
│   │   ├── gpu/
│   │   │   ├── test_amp.py
│   │   │   ├── test_amp_init.py
│   │   │   ├── test_deferred_compute_gpu.py
│   │   │   ├── test_device.py
│   │   │   ├── test_extensions_gpu.py
│   │   │   ├── test_fusion.py
│   │   │   ├── test_gluon_gpu.py
│   │   │   ├── test_gluon_model_zoo_gpu.py
│   │   │   ├── test_gluon_transforms.py
│   │   │   ├── test_kvstore_gpu.py
│   │   │   ├── test_nccl.py
│   │   │   ├── test_numpy_einsum.py
│   │   │   ├── test_numpy_fallback.py
│   │   │   ├── test_operator_gpu.py
│   │   │   ├── test_profiler_gpu.py
│   │   │   ├── test_rtc.py
│   │   │   ├── test_tvm_bridge.py
│   │   │   └── test_tvm_op_gpu.py
│   │   ├── onnx/
│   │   │   ├── test_models.py
│   │   │   └── test_operators.py
│   │   ├── profiling/
│   │   │   ├── simple_forward.py
│   │   │   └── test_nvtx.py
│   │   ├── quantization/
│   │   │   └── test_quantization.py
│   │   ├── test_quantization_gpu.py
│   │   ├── train/
│   │   │   ├── common.py
│   │   │   └── test_autograd.py
│   │   └── unittest/
│   │       ├── common.py
│   │       ├── legacy_ndarray.v0
│   │       ├── test_attr.py
│   │       ├── test_autograd.py
│   │       ├── test_base.py
│   │       ├── test_contrib_control_flow.py
│   │       ├── test_contrib_gluon_data_vision.py
│   │       ├── test_contrib_hawkesll.py
│   │       ├── test_contrib_intgemm.py
│   │       ├── test_contrib_io.py
│   │       ├── test_contrib_krprod.py
│   │       ├── test_contrib_operator.py
│   │       ├── test_contrib_optimizer.py
│   │       ├── test_contrib_stes_op.py
│   │       ├── test_deferred_compute.py
│   │       ├── test_dgl_graph.py
│   │       ├── test_dynamic_shape.py
│   │       ├── test_engine.py
│   │       ├── test_engine_import.py
│   │       ├── test_exc_handling.py
│   │       ├── test_executor.py
│   │       ├── test_extensions.py
│   │       ├── test_ffi_container.py
│   │       ├── test_gluon.py
│   │       ├── test_gluon_batch_processor.py
│   │       ├── test_gluon_control_flow.py
│   │       ├── test_gluon_data.py
│   │       ├── test_gluon_estimator.py
│   │       ├── test_gluon_event_handler.py
│   │       ├── test_gluon_indexing.py
│   │       ├── test_gluon_model_zoo.py
│   │       ├── test_gluon_probability_v2.py
│   │       ├── test_gluon_rnn.py
│   │       ├── test_gluon_save.py
│   │       ├── test_gluon_trainer.py
│   │       ├── test_gluon_utils.py
│   │       ├── test_higher_order_grad.py
│   │       ├── test_image.py
│   │       ├── test_infer_shape.py
│   │       ├── test_infer_type.py
│   │       ├── test_io.py
│   │       ├── test_kvstore.py
│   │       ├── test_kvstore_custom.py
│   │       ├── test_loss.py
│   │       ├── test_memory_opt.py
│   │       ├── test_metric.py
│   │       ├── test_ndarray.py
│   │       ├── test_numpy_contrib_gluon_data_vision.py
│   │       ├── test_numpy_default_dtype.py
│   │       ├── test_numpy_gluon.py
│   │       ├── test_numpy_gluon_data_vision.py
│   │       ├── test_numpy_interoperability.py
│   │       ├── test_numpy_loss.py
│   │       ├── test_numpy_ndarray.py
│   │       ├── test_numpy_op.py
│   │       ├── test_operator.py
│   │       ├── test_optimizer.py
│   │       ├── test_profiler.py
│   │       ├── test_random.py
│   │       ├── test_recordio.py
│   │       ├── test_runtime.py
│   │       ├── test_smoke.py
│   │       ├── test_sparse_ndarray.py
│   │       ├── test_sparse_operator.py
│   │       ├── test_subgraph.py
│   │       ├── test_subgraph_op.py
│   │       ├── test_symbol.py
│   │       ├── test_test_utils.py
│   │       ├── test_thread_local.py
│   │       ├── test_tvm_op.py
│   │       └── test_viz.py
│   ├── tutorials/
│   │   ├── test_sanity_tutorials.py
│   │   └── test_tutorials.py
│   └── utils/
│       └── notebook_test/
│           └── __init__.py
└── tools/
    ├── bandwidth/
    │   ├── .gitignore
    │   ├── README.md
    │   ├── measure.py
    │   └── test_measure.py
    ├── cfn/
    │   └── Readme.md
    ├── create_source_archive.sh
    ├── dependencies/
    │   ├── LICENSE.binary.dependencies
    │   ├── README.md
    │   ├── cityhash.sh
    │   ├── curl.sh
    │   ├── eigen.sh
    │   ├── libpng.sh
    │   ├── libtiff.sh
    │   ├── libturbojpeg.sh
    │   ├── libz.sh
    │   ├── lz4.sh
    │   ├── make_shared_dependencies.sh
    │   ├── mkl.sh
    │   ├── numpy_mkl.sh
    │   ├── openblas.sh
    │   ├── opencv.sh
    │   ├── openssl.sh
    │   ├── patch/
    │   │   └── opencv_lapack.h
    │   ├── protobuf.sh
    │   └── zmq.sh
    ├── diagnose.py
    ├── flakiness_checker.py
    ├── git-pre-commit
    ├── im2rec.cc
    ├── im2rec.py
    ├── ipynb2md.py
    ├── kill-mxnet.py
    ├── launch.py
    ├── license_header.py
    ├── lint/
    │   ├── clang_format_ci.sh
    │   └── git-clang-format-13
    ├── parse_log.py
    ├── pip/
    │   ├── MANIFEST.in
    │   ├── doc/
    │   │   ├── CPU_ADDITIONAL.md
    │   │   ├── CU101_ADDITIONAL.md
    │   │   ├── CU102_ADDITIONAL.md
    │   │   ├── CU110_ADDITIONAL.md
    │   │   ├── CU112_ADDITIONAL.md
    │   │   ├── NATIVE_ADDITIONAL.md
    │   │   └── PYPI_README.md
    │   ├── sanity_test.py
    │   └── setup.py
    ├── profile/
    │   └── tune_python.sh
    ├── rec2idx.py
    ├── staticbuild/
    │   ├── README.md
    │   ├── build.sh
    │   ├── build_lib.sh
    │   └── build_wheel.sh
    └── windowsbuild/
        ├── README.md
        ├── gen_warp.cpp
        └── warp_dll.cpp