gitextract_ycct44t1/

├── .gitignore
├── README.md
├── akaitsuki-slow/
│   ├── config.py
│   ├── feed_dict.pbtxt
│   ├── feed_dict.py
│   └── main.py
├── autotune/
│   ├── README.md
│   ├── autograd_lib.py
│   ├── autograd_lib_test.py
│   ├── autograd_test.py
│   ├── ciresan_bench.py
│   ├── curvature_test.py
│   ├── eval_conv2d_approx.py
│   ├── factored_test.py
│   ├── globals.py
│   ├── hessian_test.py
│   ├── linalg_bench.py
│   ├── linesearch_test_disabled.py
│   ├── lyapunov_test.py
│   ├── mnist_end2end_test.py
│   ├── plotting_test.py
│   ├── pytorch_benchmark.py
│   ├── scipy_benchmark.py
│   ├── svd_benchmark.py
│   ├── test/
│   │   ├── bad_sigmas.pt
│   │   ├── factored.pt
│   │   └── gesvd_crash.txt
│   ├── train_ciresan.py
│   ├── train_ciresan_cca.py
│   ├── train_ciresan_factored.py
│   ├── train_ciresan_new.py
│   ├── train_medium.py
│   ├── train_small.py
│   ├── train_small_xent.py
│   ├── train_small_xent_factored.py
│   ├── train_tiny.py
│   ├── train_tiny_xent.py
│   ├── util.py
│   └── util_test.py
├── aws-recipes.ipynb
├── aws-scratch.ipynb
├── benchmark_huggingface_predict.py
├── bin/
│   └── tfversion
├── clipping-profile.ipynb
├── cluster/
│   ├── .gitignore
│   ├── README.md
│   ├── async_adder.py
│   ├── aws.py
│   ├── benchmark_grpc_recv.py
│   ├── benchmarks/
│   │   ├── .gitignore
│   │   ├── LICENSE
│   │   ├── README.md
│   │   ├── bower_components/
│   │   │   ├── d3/
│   │   │   │   ├── .bower.json
│   │   │   │   ├── .gitattributes
│   │   │   │   ├── CONTRIBUTING.md
│   │   │   │   ├── LICENSE
│   │   │   │   ├── README.md
│   │   │   │   ├── bower.json
│   │   │   │   ├── d3.js
│   │   │   │   └── package.js
│   │   │   └── plottable/
│   │   │       ├── .bower.json
│   │   │       ├── bower.json
│   │   │       ├── plottable.css
│   │   │       ├── plottable.d.ts
│   │   │       └── plottable.js
│   │   ├── dashboard_app/
│   │   │   ├── app.yaml
│   │   │   ├── main.py
│   │   │   ├── main_test.py
│   │   │   ├── requirements.txt
│   │   │   ├── static/
│   │   │   │   ├── css/
│   │   │   │   │   └── style.css
│   │   │   │   └── js/
│   │   │   │       └── benchmark_latency_chart.js
│   │   │   └── templates/
│   │   │       ├── index.html
│   │   │       └── test.html
│   │   ├── index.html
│   │   ├── js/
│   │   │   ├── csv_benchmark_chart.js
│   │   │   └── latency_chart.js
│   │   ├── scripts/
│   │   │   ├── Dockerfile.tf_cnn_benchmarks
│   │   │   ├── benchmark_configs.yml
│   │   │   ├── tf_cnn_benchmarks/
│   │   │   │   ├── README.md
│   │   │   │   ├── benchmark_cnn.py
│   │   │   │   ├── benchmark_storage.py
│   │   │   │   ├── cbuild_benchmark_storage.py
│   │   │   │   ├── cnn_util.py
│   │   │   │   ├── convnet_builder.py
│   │   │   │   ├── datasets.py
│   │   │   │   ├── models/
│   │   │   │   │   ├── __init__.py
│   │   │   │   │   ├── alexnet_model.py
│   │   │   │   │   ├── densenet_model.py
│   │   │   │   │   ├── googlenet_model.py
│   │   │   │   │   ├── inception_model.py
│   │   │   │   │   ├── lenet_model.py
│   │   │   │   │   ├── model.py
│   │   │   │   │   ├── model_config.py
│   │   │   │   │   ├── overfeat_model.py
│   │   │   │   │   ├── resnet_model.py
│   │   │   │   │   ├── trivial_model.py
│   │   │   │   │   └── vgg_model.py
│   │   │   │   ├── preprocessing.py
│   │   │   │   ├── tf_cnn_benchmarks.py
│   │   │   │   └── variable_mgr.py
│   │   │   └── util/
│   │   │       ├── __init__.py
│   │   │       ├── benchmark_util.py
│   │   │       ├── benchmark_util_test.py
│   │   │       ├── convert_csv_to_json.py
│   │   │       └── convert_csv_to_json_test.py
│   │   ├── soumith_benchmarks.html
│   │   └── tools/
│   │       ├── k8s_tensorflow_lib.py
│   │       ├── k8s_tensorflow_test.py
│   │       ├── kubectl_util.py
│   │       ├── kubectl_util_test.py
│   │       └── run_distributed_benchmarks.py
│   ├── client_transfer_benchmark.py
│   ├── cloud-formation-example/
│   │   ├── README.md
│   │   ├── iam.yaml
│   │   ├── tensorflow.yaml
│   │   └── zone.sh
│   ├── connect.py
│   ├── delete_placement_groups.py
│   ├── fill_efs.py
│   ├── imagenet64/
│   │   ├── README.md
│   │   ├── aws.py
│   │   ├── launch.py
│   │   ├── requirements.txt
│   │   └── variable_mgr.py
│   ├── instance_info.py
│   ├── launch_async_adder.py
│   ├── launch_micro.py
│   ├── launch_ray.py
│   ├── launch_simple_tf.py
│   ├── local_distributed_benchmark.py
│   ├── myutil.py
│   ├── ray_add.py
│   ├── simple_distributed.py
│   ├── terminate_instances.py
│   ├── test_aws.py
│   ├── tf-tools/
│   │   ├── .gitignore
│   │   ├── benchmark/
│   │   │   ├── multi_gpu/
│   │   │   │   ├── advanced_tweaks_compare.sh
│   │   │   │   ├── image_classification_bench_tests.sh
│   │   │   │   ├── stats_monitor.sh
│   │   │   │   ├── test_runner.sh
│   │   │   │   └── unit_test_stats_monitor.sh
│   │   │   └── runner/
│   │   │       ├── cluster_aws.py
│   │   │       ├── command_builder.py
│   │   │       ├── configs/
│   │   │       │   └── aws/
│   │   │       │       ├── multi_server.yaml
│   │   │       │       └── yaroslav.yaml
│   │   │       ├── instance_info.py
│   │   │       ├── launch_experiment.py
│   │   │       ├── test_cluster_aws.py
│   │   │       ├── test_command_builder.py
│   │   │       └── util.py
│   │   └── install/
│   │       ├── aws_amzlinux.md
│   │       └── aws_ubuntu16_04.md
│   ├── tmux.py
│   └── upload_test.txt
├── conditional_backprop.py
├── configure_tf.sh
├── configure_tf_cpu.sh
├── danjar_peek.py
├── distributed/
│   ├── README.md
│   ├── benchmark_grpc_recv.py
│   └── client_transfer_benchmark.py
├── double_memory_bug.py
├── dynamic_stitch_gpu.py
├── dynamic_stitch_gpu_profile.pbtxt
├── eager_lbfgs/
│   ├── .ipynb_checkpoints/
│   │   └── performance-checkpoint.ipynb
│   ├── common_gd.py
│   ├── data/
│   │   ├── short_batch.csv
│   │   ├── short_eager_batch.csv
│   │   ├── short_eager_loss.csv
│   │   ├── short_eager_time.csv
│   │   ├── short_pytorch_loss.csv
│   │   └── short_pytorch_time.csv
│   ├── eager_lbfgs.py
│   ├── performance.ipynb
│   ├── pytorch_lbfgs.py
│   ├── run_experiment.py
│   ├── torch_lbfgs.lua
│   └── util.py
├── enqueue_many_test.py
├── enqueue_many_test_singlerun.py
├── ericyue-slowreader/
│   ├── benchmark-batch-noqueuerunners-timeline.json
│   ├── benchmark-batch-noqueuerunners.profile
│   ├── benchmark-batch-noqueuerunners.py
│   ├── benchmark-batch.py
│   ├── benchmark-reader.py
│   ├── benchmark-synthetic-batch.py
│   ├── benchmark-synthetic.py
│   ├── benchmark.py
│   ├── data.zlib
│   └── profile-batch.py
├── free_gpus.py
├── github_pyfunc_slowness.py
├── gpu-memory-transfer.ipynb
├── gpu_oom.py
├── graph_template.py
├── imagenet15-scratch.ipynb
├── input_benchmarks/
│   ├── convert_to_records.py
│   ├── fully_connected_feed.py
│   ├── fully_connected_preloaded_var.py
│   ├── fully_connected_reader.py
│   ├── timeline.feed.json
│   ├── timeline.reader.json
│   └── timeline.var.json
├── inverse_segfault.py
├── keras_autoencoder/
│   ├── keras_large.py
│   ├── util.py
│   └── weightnorm.py
├── khatri_rao_benchmark.py
├── lazy_dog.py
├── linalg-benchmark/
│   ├── README.md
│   ├── bad_matrix.py
│   ├── benchmark.py
│   ├── environment.yml
│   ├── get_cores_per_socket.py
│   ├── launch.py
│   ├── launch_tensorflow_svd_crash.py
│   ├── requirements.txt
│   ├── results.txt
│   └── tensorflow_svd_crash.py
├── line_search_example/
│   ├── data/
│   │   └── step_lengths_ada.csv
│   ├── line_search_example.py
│   └── util.py
├── linearize/
│   ├── linearize.py
│   ├── linearize_test.py
│   └── memory_util.py
├── matmul_benchmark.py
├── matmul_benchmark_seq.py
├── matmul_times/
│   ├── 1080-float16.csv
│   ├── 1080-float32.csv
│   ├── g3-float16.csv
│   ├── g3-float32.csv
│   ├── nvidia-p3-float16.csv
│   ├── nvidia-p3-float32.csv
│   ├── p2-float16.csv
│   └── p2-float32.csv
├── mavelin/
│   ├── machine1.py
│   └── machine3.py
├── memory tracking.ipynb
├── memory-probe-examples.ipynb
├── memory-release-check.ipynb
├── natural_gradient_multilayer.py
├── node-merge.ipynb
├── notebook_util.py
├── numpy_initializers/
│   ├── kfac_cifar.py
│   └── util.py
├── parallel_dequeue_test.py
├── phantomjs-tryout.ipynb
├── phantomjs-tryout.js
├── pytorch-hessian.ipynb
├── queue_mismatch.py
├── queues_talk/
│   └── queues.ipynb
├── resnet_8_simple.pbtxt
├── resnet_leak_report.py
├── resnet_leak_report2.py
├── resource_variable_test.py
├── rotations_comparison.py
├── saving memory by using functions.ipynb
├── simple_rewiring.ipynb
├── simple_train.py
├── svd_benchmark.py
├── svd_noconverge.py
├── svd_test.py
├── tf_initializer_bug_report.py
├── tiny_runs/
│   ├── qr_test.py
│   └── tiny_tf.py
└── whitening_util.py