This is an automated email from the ASF dual-hosted git repository.

tqchen pushed a change to branch master in repository https://gitbox.apache.org/repos/asf/incubator-tvm.git.
from df02e73 reduce input size to fix oom (#4653)
add f4c5f93 [REFACTOR][IR] Add Node suffix to low-level IR nodes (#4649)

No new revisions were added by this update.

Summary of changes:
include/tvm/arithmetic.h | 12 +- include/tvm/attrs.h | 12 +- include/tvm/expr.h | 22 +- include/tvm/expr_operator.h | 40 +-- include/tvm/ir.h | 160 ++++----- include/tvm/ir_functor_ext.h | 360 ++++++++++----------- include/tvm/ir_pass.h | 6 +- include/tvm/operation.h | 14 +- include/tvm/relay/type.h | 2 +- src/api/api_ir.cc | 27 +- src/api/api_lang.cc | 4 +- src/arithmetic/analyzer.cc | 8 +- src/arithmetic/bound_deducer.cc | 40 +-- src/arithmetic/canonical_simplify.cc | 84 ++--- src/arithmetic/compute_expr.h | 14 +- src/arithmetic/const_fold.h | 132 ++++---- src/arithmetic/const_int_bound.cc | 42 +-- src/arithmetic/detect_linear_equation.cc | 30 +- src/arithmetic/domain_touched.cc | 16 +- src/arithmetic/int_operator.h | 32 +- src/arithmetic/int_set.cc | 144 ++++----- src/arithmetic/ir_mutator_with_analyzer.cc | 32 +- src/arithmetic/ir_mutator_with_analyzer.h | 18 +- src/arithmetic/ir_visitor_with_analyzer.h | 6 +- src/arithmetic/modular_set.cc | 30 +- src/arithmetic/pattern_match.h | 120 +++---- src/arithmetic/rewrite_simplify.cc | 132 ++++---- src/arithmetic/rewrite_simplify.h | 46 +-- src/arithmetic/stmt_simplify.cc | 12 +- src/autotvm/feature_visitor.cc | 12 +- src/autotvm/feature_visitor.h | 8 +- src/autotvm/touch_extractor.cc | 41 +-- src/autotvm/touch_extractor.h | 10 +- src/codegen/build_module.cc | 44 +-- src/codegen/codegen_c.cc | 138 ++++---- src/codegen/codegen_c.h | 94 +++--- src/codegen/codegen_c_host.cc | 22 +- src/codegen/codegen_c_host.h | 10 +- src/codegen/codegen_cuda.cc | 42 +-- src/codegen/codegen_cuda.h | 30 +- src/codegen/codegen_metal.cc | 10 +- src/codegen/codegen_metal.h | 10 +- src/codegen/codegen_opencl.cc | 18 +- src/codegen/codegen_opencl.h | 20 +- src/codegen/codegen_opengl.cc | 22 +- src/codegen/codegen_opengl.h | 26 +- 
src/codegen/codegen_source_base.cc | 4 +- src/codegen/codegen_source_base.h | 10 +- src/codegen/codegen_vhls.cc | 4 +- src/codegen/codegen_vhls.h | 8 +- src/codegen/intrin_rule.cc | 8 +- src/codegen/intrin_rule.h | 6 +- src/codegen/llvm/codegen_amdgpu.cc | 8 +- src/codegen/llvm/codegen_arm.cc | 48 +-- src/codegen/llvm/codegen_cpu.cc | 56 ++-- src/codegen/llvm/codegen_cpu.h | 18 +- src/codegen/llvm/codegen_llvm.cc | 134 ++++---- src/codegen/llvm/codegen_llvm.h | 98 +++--- src/codegen/llvm/codegen_nvptx.cc | 6 +- src/codegen/llvm/codegen_x86_64.cc | 23 +- src/codegen/llvm/intrin_rule_llvm.cc | 12 +- src/codegen/llvm/intrin_rule_llvm.h | 20 +- src/codegen/llvm/intrin_rule_nvptx.cc | 6 +- src/codegen/llvm/intrin_rule_rocm.cc | 6 +- src/codegen/spirv/codegen_spirv.cc | 114 +++---- src/codegen/spirv/codegen_spirv.h | 80 ++--- src/codegen/spirv/intrin_rule_spirv.cc | 8 +- src/codegen/stackvm/codegen_stackvm.cc | 108 +++---- src/codegen/stackvm/codegen_stackvm.h | 80 ++--- src/contrib/hybrid/codegen_hybrid.cc | 106 +++--- src/contrib/hybrid/codegen_hybrid.h | 86 ++--- src/lang/attr_functor.h | 204 ++++++------ src/lang/attrs.cc | 128 ++++---- src/lang/buffer.cc | 38 +-- src/lang/data_layout.cc | 16 +- src/lang/expr.cc | 20 +- src/lang/expr_operator.cc | 289 +++++++++-------- src/lang/ir.cc | 412 ++++++++++++------------ src/lang/tensor.cc | 6 +- src/op/compute_op.cc | 48 +-- src/op/cross_thread_reduction.cc | 20 +- src/op/extern_op.cc | 10 +- src/op/hybrid_op.cc | 70 ++-- src/op/op_util.cc | 36 +-- src/op/placeholder_op.cc | 2 +- src/op/scan_op.cc | 14 +- src/op/tensor_compute_op.cc | 18 +- src/op/tensorize.cc | 44 +-- src/pass/arg_binder.cc | 58 ++-- src/pass/arg_binder.h | 8 +- src/pass/bound_checker.cc | 52 +-- src/pass/combine_context_call.cc | 10 +- src/pass/coproc_sync.cc | 64 ++-- src/pass/detect_device.cc | 2 +- src/pass/hoist_if_then_else.cc | 66 ++-- src/pass/infer_fragment.cc | 54 ++-- src/pass/inject_copy_intrin.cc | 32 +- src/pass/inject_double_buffer.cc | 76 
++--- src/pass/inject_prefetch.cc | 10 +- src/pass/inject_virtual_thread.cc | 112 +++---- src/pass/inline.cc | 8 +- src/pass/ir_deep_compare.cc | 148 ++++----- src/pass/ir_functor.cc | 208 ++++++------ src/pass/ir_util.cc | 24 +- src/pass/ir_util.h | 22 +- src/pass/lift_attr_scope.cc | 32 +- src/pass/loop_partition.cc | 92 +++--- src/pass/lower_custom_datatypes.cc | 50 +-- src/pass/lower_intrin.cc | 52 +-- src/pass/lower_thread_allreduce.cc | 80 ++--- src/pass/lower_tvm_builtin.cc | 114 +++---- src/pass/lower_warp_memory.cc | 54 ++-- src/pass/make_api.cc | 72 ++--- src/pass/remap_thread_axis.cc | 12 +- src/pass/remove_no_op.cc | 46 +-- src/pass/rewrite_unsafe_select.cc | 72 ++--- src/pass/simple_passes.cc | 36 +-- src/pass/skip_assert.cc | 4 +- src/pass/split_host_device.cc | 42 +-- src/pass/ssa.cc | 72 ++--- src/pass/storage_access.cc | 60 ++-- src/pass/storage_access.h | 24 +- src/pass/storage_flatten.cc | 92 +++--- src/pass/storage_rewrite.cc | 204 ++++++------ src/pass/storage_sync.cc | 66 ++-- src/pass/tensor_core.cc | 234 +++++++------- src/pass/unroll_loop.cc | 24 +- src/pass/vectorize_loop.cc | 152 ++++----- src/pass/verify_compact_buffer.cc | 2 +- src/pass/verify_gpu_code.cc | 20 +- src/pass/verify_memory.cc | 26 +- src/relay/backend/build_module.cc | 4 +- src/relay/backend/compile_engine.cc | 18 +- src/relay/backend/contrib/codegen_c/codegen_c.h | 5 +- src/relay/backend/contrib/dnnl/codegen.cc | 8 +- src/relay/backend/graph_runtime_codegen.cc | 4 +- src/relay/backend/vm/lambda_lift.cc | 2 +- src/relay/backend/vm/removed_unused_funcs.cc | 2 +- src/relay/ir/alpha_equal.cc | 2 +- src/relay/ir/expr.cc | 6 +- src/relay/ir/hash.cc | 4 +- src/relay/ir/pretty_printer.cc | 10 +- src/relay/op/memory/memory.cc | 2 +- src/relay/op/nn/convolution.cc | 4 +- src/relay/op/nn/convolution.h | 10 +- src/relay/op/nn/nn.cc | 2 +- src/relay/op/nn/pad.cc | 4 +- src/relay/op/nn/pooling.cc | 6 +- src/relay/op/nn/upsampling.cc | 10 +- src/relay/op/tensor/reduce.cc | 2 +- 
src/relay/op/tensor/transform.cc | 26 +- src/relay/pass/alter_op_layout.cc | 2 +- src/relay/pass/canonicalize_cast.cc | 2 +- src/relay/pass/canonicalize_ops.cc | 2 +- src/relay/pass/combine_parallel_conv2d.cc | 2 +- src/relay/pass/combine_parallel_dense.cc | 2 +- src/relay/pass/combine_parallel_op_batch.cc | 2 +- src/relay/pass/convert_layout.cc | 4 +- src/relay/pass/device_annotation.cc | 2 +- src/relay/pass/eliminate_common_subexpr.cc | 2 +- src/relay/pass/fold_constant.cc | 4 +- src/relay/pass/fold_scale_axis.cc | 4 +- src/relay/pass/fuse_ops.cc | 2 +- src/relay/pass/infer_layout_util.h | 6 +- src/relay/pass/legalize.cc | 2 +- src/relay/pass/mac_count.cc | 26 +- src/relay/pass/pass_manager.cc | 8 +- src/relay/pass/pattern_util.h | 2 +- src/relay/pass/simplify_inference.cc | 2 +- src/relay/pass/type_solver.cc | 12 +- src/schedule/auto_inline_elem_wise.cc | 2 +- src/schedule/bound.cc | 4 +- src/schedule/graph.cc | 8 +- src/schedule/message_passing.cc | 2 +- src/schedule/schedule_dataflow_rewrite.cc | 76 ++--- src/schedule/schedule_lang.cc | 2 +- src/schedule/schedule_ops.cc | 54 ++-- tests/cpp/attrs_test.cc | 2 +- tests/cpp/container_test.cc | 4 +- tests/cpp/expr_test.cc | 2 +- tests/cpp/ir_functor_test.cc | 76 ++--- tests/cpp/ir_simplify_test.cc | 2 +- tests/cpp/ir_ssa_test.cc | 6 +- tests/cpp/packed_func_test.cc | 2 +- tests/cpp/pattern_match_test.cc | 26 +- topi/include/topi/detail/broadcast.h | 4 +- topi/include/topi/detail/constant_utils.h | 12 +- topi/include/topi/detail/extern.h | 18 +- topi/include/topi/detail/tensor_utils.h | 2 +- topi/include/topi/elemwise.h | 10 +- topi/include/topi/nn.h | 8 +- topi/include/topi/nn/pooling.h | 46 +-- topi/include/topi/reduction.h | 11 +- topi/include/topi/transform.h | 8 +- 194 files changed, 3961 insertions(+), 3919 deletions(-)