This is an automated email from the ASF dual-hosted git repository.
lmzheng pushed a change to branch master
in repository https://gitbox.apache.org/repos/asf/incubator-tvm.git.
from c4c61cb [Fix] Fix get_valid_count flaky test for cuda (#4901)
add 623dd20 [Relay][AutoTVM] Relay op strategy (#4644)
No new revisions were added by this update.
Summary of changes:
include/tvm/relay/op_attr_types.h | 31 +-
include/tvm/relay/op_strategy.h | 164 +++++
include/tvm/te/schedule.h | 49 ++
python/tvm/autotvm/__init__.py | 4 +-
python/tvm/autotvm/database.py | 5 +-
python/tvm/autotvm/feature.py | 5 +-
python/tvm/autotvm/graph_tuner/base_graph_tuner.py | 44 +-
.../autotvm/graph_tuner/utils/traverse_graph.py | 41 +-
python/tvm/autotvm/graph_tuner/utils/utils.py | 13 +-
python/tvm/autotvm/record.py | 76 +-
python/tvm/autotvm/task/__init__.py | 7 +-
python/tvm/autotvm/task/dispatcher.py | 90 +--
python/tvm/autotvm/task/relay_integration.py | 65 +-
python/tvm/autotvm/task/space.py | 30 +-
python/tvm/autotvm/task/task.py | 331 +++++----
python/tvm/autotvm/task/topi_integration.py | 497 +++----------
python/tvm/autotvm/tophub.py | 25 +-
python/tvm/autotvm/tuner/xgboost_cost_model.py | 3 +-
python/tvm/relay/backend/compile_engine.py | 203 +++++-
python/tvm/relay/expr_functor.py | 20 +-
python/tvm/relay/frontend/tensorflow.py | 4 +-
python/tvm/relay/frontend/tflite.py | 2 +-
python/tvm/relay/memory_alloc.py | 4 +-
python/tvm/relay/op/__init__.py | 5 +-
python/tvm/relay/op/_algorithm.py | 48 +-
python/tvm/relay/op/_reduce.py | 32 +-
python/tvm/relay/op/_tensor.py | 119 ++--
python/tvm/relay/op/_transform.py | 121 ++--
python/tvm/relay/op/annotation/annotation.py | 4 +-
python/tvm/relay/op/contrib/_contrib.py | 20 +-
python/tvm/relay/op/image/_image.py | 13 +-
python/tvm/relay/op/nn/_nn.py | 784 +++------------------
python/tvm/relay/op/nn/nn.py | 137 ----
python/tvm/relay/op/op.py | 212 +++++-
{topi/python/topi/vision => python/tvm/relay/op/strategy}/__init__.py | 16 +-
python/tvm/relay/op/strategy/arm_cpu.py | 231 ++++++
python/tvm/relay/op/strategy/bifrost.py | 104 +++
python/tvm/relay/op/strategy/cuda.py | 398 +++++++++++
python/tvm/relay/op/strategy/generic.py | 749 ++++++++++++++++++++
python/tvm/relay/op/strategy/hls.py | 158 +++++
python/tvm/relay/op/strategy/intel_graphics.py | 74 ++
python/tvm/relay/op/strategy/mali.py | 106 +++
python/tvm/relay/op/strategy/opengl.py | 73 ++
python/tvm/relay/op/strategy/rocm.py | 136 ++++
python/tvm/relay/op/strategy/x86.py | 302 ++++++++
python/tvm/relay/op/vision/_rcnn.py | 56 +-
python/tvm/relay/op/vision/_vision.py | 91 +--
python/tvm/relay/op/vision/_yolo.py | 6 +-
python/tvm/relay/quantize/_annotate.py | 7 +-
python/tvm/relay/testing/mobilenet.py | 30 +-
python/tvm/target/generic_func.py | 2 +
python/tvm/te/__init__.py | 4 +-
python/tvm/te/schedule.py | 35 +
python/tvm/tir/expr.py | 8 +
src/relay/backend/compile_engine.cc | 78 +-
src/relay/backend/compile_engine.h | 26 +
src/relay/ir/op_strategy.cc | 114 +++
src/relay/op/annotation/annotation.cc | 14 +-
src/relay/op/debug.cc | 5 +-
src/relay/op/memory/memory.cc | 10 +-
src/relay/op/nn/convolution.cc | 101 ---
src/relay/op/nn/convolution.h | 14 +-
src/relay/op/nn/nn.cc | 23 +-
src/relay/op/nn/pad.cc | 5 +-
src/relay/op/nn/pooling.cc | 30 +-
src/relay/op/tensor/binary.cc | 5 +-
src/relay/op/tensor/reduce.cc | 71 +-
src/relay/op/tensor/transform.cc | 135 ++--
src/relay/op/tensor/unary.cc | 15 +-
src/relay/op/vision/yolo.cc | 3 +-
src/relay/pass/alter_op_layout.cc | 5 +-
src/te/schedule/schedule_lang.cc | 75 +-
tests/cpp/relay_build_module_test.cc | 57 +-
tests/python/frontend/mxnet/test_forward.py | 15 +-
tests/python/integration/test_tuning.py | 4 +-
tests/python/relay/test_any.py | 3 +
tests/python/relay/test_autotvm_task_extraction.py | 70 +-
tests/python/relay/test_backend_compile_engine.py | 129 +++-
tests/python/relay/test_op_level2.py | 65 +-
tests/python/relay/test_op_qnn_conv2d.py | 25 +-
tests/python/relay/test_pass_alter_op_layout.py | 51 +-
tests/python/relay/test_pass_auto_quantize.py | 5 +-
tests/python/relay/test_pass_fold_scale_axis.py | 9 +-
tests/python/unittest/test_autotvm_common.py | 6 +-
.../unittest/test_autotvm_dispatch_context.py | 34 +-
tests/python/unittest/test_autotvm_measure.py | 2 +-
tests/python/unittest/test_codegen_blob.py | 2 +-
tests/python/unittest/test_codegen_cuda.py | 2 +-
tests/python/unittest/test_graph_tuner_core.py | 416 +++++------
tests/python/unittest/test_graph_tuner_utils.py | 33 +-
.../unittest/test_lang_tensor_overload_op.py | 10 +-
topi/include/topi/cuda/normalization.h | 5 +-
topi/include/topi/rocm/normalization.h | 7 +-
topi/python/topi/__init__.py | 1 +
topi/python/topi/argwhere.py | 2 -
topi/python/topi/arm_cpu/__init__.py | 17 +-
topi/python/topi/arm_cpu/bitserial_conv2d.py | 11 +-
topi/python/topi/arm_cpu/bitserial_dense.py | 10 +-
topi/python/topi/arm_cpu/conv2d.py | 456 ++----------
topi/python/topi/arm_cpu/conv2d_alter_op.py | 171 +++++
topi/python/topi/arm_cpu/conv2d_int8.py | 20 +-
topi/python/topi/arm_cpu/conv2d_spatial_pack.py | 6 +-
topi/python/topi/arm_cpu/conv2d_transpose.py | 11 +-
topi/python/topi/arm_cpu/depthwise_conv2d.py | 71 +-
topi/python/topi/arm_cpu/injective.py | 4 -
topi/python/topi/bifrost/conv2d.py | 146 ++--
topi/python/topi/bifrost/dense.py | 37 +-
topi/python/topi/bifrost/depthwise_conv2d.py | 2 -
topi/python/topi/cuda/__init__.py | 28 +-
topi/python/topi/cuda/batch_matmul.py | 49 +-
topi/python/topi/cuda/conv1d.py | 81 +--
topi/python/topi/cuda/conv1d_transpose_ncw.py | 11 +-
topi/python/topi/cuda/conv2d.py | 234 ++----
topi/python/topi/cuda/conv2d_alter_op.py | 136 ++++
topi/python/topi/cuda/conv2d_direct.py | 2 +-
topi/python/topi/cuda/conv2d_hwcn.py | 12 +-
topi/python/topi/cuda/conv2d_int8.py | 18 +-
topi/python/topi/cuda/conv2d_transpose_nchw.py | 11 +-
topi/python/topi/cuda/conv2d_winograd.py | 178 +----
topi/python/topi/cuda/conv3d.py | 207 ++++--
topi/python/topi/cuda/conv3d_direct.py | 11 +-
topi/python/topi/cuda/deformable_conv2d.py | 20 +-
topi/python/topi/cuda/dense.py | 163 ++---
topi/python/topi/cuda/depthwise_conv2d.py | 17 +-
topi/python/topi/cuda/group_conv2d_nchw.py | 358 +++++-----
topi/python/topi/cuda/injective.py | 7 +-
topi/python/topi/cuda/nms.py | 13 +-
topi/python/topi/cuda/nn.py | 7 +-
topi/python/topi/cuda/pooling.py | 7 +-
topi/python/topi/cuda/rcnn/__init__.py | 2 +-
topi/python/topi/cuda/rcnn/proposal.py | 7 +-
topi/python/topi/cuda/reduction.py | 2 -
topi/python/topi/cuda/softmax.py | 3 +-
topi/python/topi/cuda/sort.py | 14 +-
topi/python/topi/cuda/ssd/multibox.py | 18 +-
topi/python/topi/cuda/vision.py | 12 +-
topi/python/topi/generic/conv2d.py | 82 ++-
topi/python/topi/generic/extern.py | 1 -
topi/python/topi/generic/injective.py | 21 +-
topi/python/topi/generic/nn.py | 75 +-
topi/python/topi/generic/search.py | 2 -
topi/python/topi/generic/sort.py | 3 -
topi/python/topi/generic/vision.py | 9 -
topi/python/topi/hls/injective.py | 3 -
topi/python/topi/hls/nn.py | 14 -
topi/python/topi/intel_graphics/__init__.py | 2 +
topi/python/topi/intel_graphics/conv2d.py | 380 ++++------
topi/python/topi/intel_graphics/conv2d_alter_op.py | 102 +++
.../python/topi/intel_graphics/depthwise_conv2d.py | 21 +-
topi/python/topi/mali/conv2d.py | 152 ++--
topi/python/topi/mali/dense.py | 40 +-
topi/python/topi/mali/depthwise_conv2d.py | 15 +-
topi/python/topi/nn/batch_matmul.py | 22 +-
topi/python/topi/nn/bitserial_conv2d.py | 221 +-----
topi/python/topi/nn/bitserial_dense.py | 79 +--
topi/python/topi/nn/conv1d.py | 15 +-
topi/python/topi/nn/conv1d_transpose.py | 1 -
topi/python/topi/nn/conv2d.py | 203 ++----
topi/python/topi/nn/conv2d_transpose.py | 1 -
topi/python/topi/nn/conv3d.py | 48 +-
topi/python/topi/nn/deformable_conv2d.py | 1 -
topi/python/topi/nn/dense.py | 28 +-
topi/python/topi/nn/depthwise_conv2d.py | 3 -
topi/python/topi/nn/local_response_norm.py | 2 -
topi/python/topi/nn/sparse.py | 8 +-
topi/python/topi/nn/util.py | 2 +-
topi/python/topi/opengl/conv2d_nchw.py | 2 -
topi/python/topi/opengl/dense.py | 2 -
topi/python/topi/opengl/injective.py | 3 -
topi/python/topi/opengl/pooling.py | 3 -
topi/python/topi/opengl/softmax.py | 2 -
topi/python/topi/rocm/conv2d.py | 77 +-
topi/python/topi/rocm/dense.py | 101 ++-
topi/python/topi/rocm/nn.py | 7 +-
topi/python/topi/sort.py | 2 -
topi/python/topi/testing/__init__.py | 2 +
topi/python/topi/testing/common.py | 74 ++
topi/python/topi/vision/nms.py | 3 +-
topi/python/topi/vision/rcnn/proposal.py | 2 +-
topi/python/topi/vision/rcnn/roi_align.py | 1 -
topi/python/topi/vision/rcnn/roi_pool.py | 1 -
topi/python/topi/vision/reorg.py | 2 -
topi/python/topi/vision/ssd/multibox.py | 3 -
topi/python/topi/x86/__init__.py | 18 +-
topi/python/topi/x86/batch_matmul.py | 53 +-
topi/python/topi/x86/binarize_pack.py | 2 -
topi/python/topi/x86/binary_dense.py | 2 -
topi/python/topi/x86/bitserial_conv2d.py | 235 +++++-
topi/python/topi/x86/bitserial_dense.py | 80 ++-
topi/python/topi/x86/conv1d.py | 4 +-
topi/python/topi/x86/conv2d.py | 443 ++++--------
topi/python/topi/x86/conv2d_alter_op.py | 223 +++---
topi/python/topi/x86/conv2d_avx_1x1.py | 150 ++--
topi/python/topi/x86/conv2d_avx_common.py | 147 ++--
topi/python/topi/x86/conv2d_int8.py | 223 +++---
topi/python/topi/x86/conv2d_transpose.py | 49 +-
topi/python/topi/x86/conv3d.py | 27 +-
topi/python/topi/x86/dense.py | 243 +++----
topi/python/topi/x86/depthwise_conv2d.py | 203 +++---
topi/python/topi/x86/injective.py | 4 -
topi/python/topi/x86/nn.py | 2 -
topi/python/topi/x86/pooling.py | 3 -
topi/python/topi/x86/reduction.py | 5 +-
topi/python/topi/x86/roi_align.py | 4 +-
topi/python/topi/x86/sparse.py | 5 +-
topi/src/topi.cc | 4 +-
topi/tests/python/common.py | 5 +-
topi/tests/python/test_fifo_buffer.py | 24 +-
topi/tests/python/test_topi_batch_matmul.py | 11 +-
topi/tests/python/test_topi_bitserial_conv2d.py | 12 +-
.../python/test_topi_bitserial_conv2d_rasp.py | 6 +-
topi/tests/python/test_topi_bitserial_dense.py | 52 +-
topi/tests/python/test_topi_bnn.py | 6 +-
topi/tests/python/test_topi_broadcast.py | 13 +-
topi/tests/python/test_topi_clip.py | 3 +-
topi/tests/python/test_topi_conv1d.py | 23 +-
.../tests/python/test_topi_conv1d_transpose_ncw.py | 12 +-
topi/tests/python/test_topi_conv2d_NCHWc.py | 12 +-
topi/tests/python/test_topi_conv2d_hwcn.py | 15 +-
topi/tests/python/test_topi_conv2d_int8.py | 6 +-
topi/tests/python/test_topi_conv2d_nchw.py | 15 +-
topi/tests/python/test_topi_conv2d_nhwc.py | 13 +-
.../python/test_topi_conv2d_nhwc_pack_int8.py | 25 +-
.../python/test_topi_conv2d_transpose_nchw.py | 21 +-
topi/tests/python/test_topi_conv2d_winograd.py | 104 ++-
topi/tests/python/test_topi_conv3d_ncdhw.py | 12 +-
topi/tests/python/test_topi_conv3d_ndhwc.py | 17 +-
topi/tests/python/test_topi_deformable_conv2d.py | 12 +-
topi/tests/python/test_topi_dense.py | 40 +-
topi/tests/python/test_topi_depth_to_space.py | 2 +-
topi/tests/python/test_topi_depthwise_conv2d.py | 176 +++--
topi/tests/python/test_topi_group_conv2d.py | 15 +-
.../python/test_topi_group_conv2d_NCHWc_int8.py | 12 +-
topi/tests/python/test_topi_image.py | 6 +-
topi/tests/python/test_topi_lrn.py | 16 +-
topi/tests/python/test_topi_math.py | 30 +-
topi/tests/python/test_topi_pooling.py | 37 +-
topi/tests/python/test_topi_reduce.py | 3 +-
topi/tests/python/test_topi_relu.py | 4 +-
topi/tests/python/test_topi_reorg.py | 11 +-
topi/tests/python/test_topi_softmax.py | 17 +-
topi/tests/python/test_topi_sort.py | 19 +-
topi/tests/python/test_topi_space_to_depth.py | 2 +-
topi/tests/python/test_topi_tensor.py | 3 +-
topi/tests/python/test_topi_transform.py | 64 +-
topi/tests/python/test_topi_upsampling.py | 4 +-
topi/tests/python/test_topi_vision.py | 98 ++-
tutorials/autotvm/tune_conv2d_cuda.py | 4 +-
tutorials/autotvm/tune_relay_arm.py | 27 +-
tutorials/autotvm/tune_relay_cuda.py | 17 +-
tutorials/autotvm/tune_relay_mobile_gpu.py | 15 +-
tutorials/autotvm/tune_relay_x86.py | 21 +-
tutorials/autotvm/tune_simple_template.py | 6 +-
tutorials/dev/relay_pass_infra.py | 6 +-
tutorials/optimize/opt_matmul_auto_tensorcore.py | 5 +-
tutorials/topi/intro_topi.py | 8 +-
vta/python/vta/ir_pass.py | 8 +-
vta/python/vta/top/__init__.py | 8 +-
vta/python/vta/top/bitpack.py | 5 +-
vta/python/vta/top/op.py | 217 +++---
vta/python/vta/top/vta_conv2d.py | 16 +-
vta/python/vta/top/vta_conv2d_transpose.py | 15 +-
vta/python/vta/top/vta_dense.py | 12 +-
vta/python/vta/top/vta_group_conv2d.py | 8 +-
vta/scripts/tune_resnet.py | 2 +-
.../integration/test_benchmark_topi_conv2d.py | 23 +-
.../test_benchmark_topi_conv2d_transpose.py | 20 +-
.../integration/test_benchmark_topi_dense.py | 10 +-
.../test_benchmark_topi_group_conv2d.py | 17 +-
vta/tutorials/autotvm/tune_relay_vta.py | 14 +-
270 files changed, 8445 insertions(+), 7055 deletions(-)
create mode 100644 include/tvm/relay/op_strategy.h
copy {topi/python/topi/vision => python/tvm/relay/op/strategy}/__init__.py (78%)
create mode 100644 python/tvm/relay/op/strategy/arm_cpu.py
create mode 100644 python/tvm/relay/op/strategy/bifrost.py
create mode 100644 python/tvm/relay/op/strategy/cuda.py
create mode 100644 python/tvm/relay/op/strategy/generic.py
create mode 100644 python/tvm/relay/op/strategy/hls.py
create mode 100644 python/tvm/relay/op/strategy/intel_graphics.py
create mode 100644 python/tvm/relay/op/strategy/mali.py
create mode 100644 python/tvm/relay/op/strategy/opengl.py
create mode 100644 python/tvm/relay/op/strategy/rocm.py
create mode 100644 python/tvm/relay/op/strategy/x86.py
create mode 100644 src/relay/ir/op_strategy.cc
create mode 100644 topi/python/topi/arm_cpu/conv2d_alter_op.py
create mode 100644 topi/python/topi/cuda/conv2d_alter_op.py
create mode 100644 topi/python/topi/intel_graphics/conv2d_alter_op.py
create mode 100644 topi/python/topi/testing/common.py