You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tvm.apache.org by tq...@apache.org on 2020/01/08 17:01:08 UTC
[incubator-tvm] branch master updated (df02e73 -> f4c5f93)
This is an automated email from the ASF dual-hosted git repository.
tqchen pushed a change to branch master
in repository https://gitbox.apache.org/repos/asf/incubator-tvm.git.
from df02e73 reduce input size to fix oom (#4653)
add f4c5f93 [REFACTOR][IR] Add Node suffix to low-level IR nodes (#4649)
No new revisions were added by this update.
Summary of changes:
include/tvm/arithmetic.h | 12 +-
include/tvm/attrs.h | 12 +-
include/tvm/expr.h | 22 +-
include/tvm/expr_operator.h | 40 +--
include/tvm/ir.h | 160 ++++-----
include/tvm/ir_functor_ext.h | 360 ++++++++++-----------
include/tvm/ir_pass.h | 6 +-
include/tvm/operation.h | 14 +-
include/tvm/relay/type.h | 2 +-
src/api/api_ir.cc | 27 +-
src/api/api_lang.cc | 4 +-
src/arithmetic/analyzer.cc | 8 +-
src/arithmetic/bound_deducer.cc | 40 +--
src/arithmetic/canonical_simplify.cc | 84 ++---
src/arithmetic/compute_expr.h | 14 +-
src/arithmetic/const_fold.h | 132 ++++----
src/arithmetic/const_int_bound.cc | 42 +--
src/arithmetic/detect_linear_equation.cc | 30 +-
src/arithmetic/domain_touched.cc | 16 +-
src/arithmetic/int_operator.h | 32 +-
src/arithmetic/int_set.cc | 144 ++++-----
src/arithmetic/ir_mutator_with_analyzer.cc | 32 +-
src/arithmetic/ir_mutator_with_analyzer.h | 18 +-
src/arithmetic/ir_visitor_with_analyzer.h | 6 +-
src/arithmetic/modular_set.cc | 30 +-
src/arithmetic/pattern_match.h | 120 +++----
src/arithmetic/rewrite_simplify.cc | 132 ++++----
src/arithmetic/rewrite_simplify.h | 46 +--
src/arithmetic/stmt_simplify.cc | 12 +-
src/autotvm/feature_visitor.cc | 12 +-
src/autotvm/feature_visitor.h | 8 +-
src/autotvm/touch_extractor.cc | 41 +--
src/autotvm/touch_extractor.h | 10 +-
src/codegen/build_module.cc | 44 +--
src/codegen/codegen_c.cc | 138 ++++----
src/codegen/codegen_c.h | 94 +++---
src/codegen/codegen_c_host.cc | 22 +-
src/codegen/codegen_c_host.h | 10 +-
src/codegen/codegen_cuda.cc | 42 +--
src/codegen/codegen_cuda.h | 30 +-
src/codegen/codegen_metal.cc | 10 +-
src/codegen/codegen_metal.h | 10 +-
src/codegen/codegen_opencl.cc | 18 +-
src/codegen/codegen_opencl.h | 20 +-
src/codegen/codegen_opengl.cc | 22 +-
src/codegen/codegen_opengl.h | 26 +-
src/codegen/codegen_source_base.cc | 4 +-
src/codegen/codegen_source_base.h | 10 +-
src/codegen/codegen_vhls.cc | 4 +-
src/codegen/codegen_vhls.h | 8 +-
src/codegen/intrin_rule.cc | 8 +-
src/codegen/intrin_rule.h | 6 +-
src/codegen/llvm/codegen_amdgpu.cc | 8 +-
src/codegen/llvm/codegen_arm.cc | 48 +--
src/codegen/llvm/codegen_cpu.cc | 56 ++--
src/codegen/llvm/codegen_cpu.h | 18 +-
src/codegen/llvm/codegen_llvm.cc | 134 ++++----
src/codegen/llvm/codegen_llvm.h | 98 +++---
src/codegen/llvm/codegen_nvptx.cc | 6 +-
src/codegen/llvm/codegen_x86_64.cc | 23 +-
src/codegen/llvm/intrin_rule_llvm.cc | 12 +-
src/codegen/llvm/intrin_rule_llvm.h | 20 +-
src/codegen/llvm/intrin_rule_nvptx.cc | 6 +-
src/codegen/llvm/intrin_rule_rocm.cc | 6 +-
src/codegen/spirv/codegen_spirv.cc | 114 +++----
src/codegen/spirv/codegen_spirv.h | 80 ++---
src/codegen/spirv/intrin_rule_spirv.cc | 8 +-
src/codegen/stackvm/codegen_stackvm.cc | 108 +++----
src/codegen/stackvm/codegen_stackvm.h | 80 ++---
src/contrib/hybrid/codegen_hybrid.cc | 106 +++---
src/contrib/hybrid/codegen_hybrid.h | 86 ++---
src/lang/attr_functor.h | 204 ++++++------
src/lang/attrs.cc | 128 ++++----
src/lang/buffer.cc | 38 +--
src/lang/data_layout.cc | 16 +-
src/lang/expr.cc | 20 +-
src/lang/expr_operator.cc | 289 +++++++++--------
src/lang/ir.cc | 412 ++++++++++++------------
src/lang/tensor.cc | 6 +-
src/op/compute_op.cc | 48 +--
src/op/cross_thread_reduction.cc | 20 +-
src/op/extern_op.cc | 10 +-
src/op/hybrid_op.cc | 70 ++--
src/op/op_util.cc | 36 +--
src/op/placeholder_op.cc | 2 +-
src/op/scan_op.cc | 14 +-
src/op/tensor_compute_op.cc | 18 +-
src/op/tensorize.cc | 44 +--
src/pass/arg_binder.cc | 58 ++--
src/pass/arg_binder.h | 8 +-
src/pass/bound_checker.cc | 52 +--
src/pass/combine_context_call.cc | 10 +-
src/pass/coproc_sync.cc | 64 ++--
src/pass/detect_device.cc | 2 +-
src/pass/hoist_if_then_else.cc | 66 ++--
src/pass/infer_fragment.cc | 54 ++--
src/pass/inject_copy_intrin.cc | 32 +-
src/pass/inject_double_buffer.cc | 76 ++---
src/pass/inject_prefetch.cc | 10 +-
src/pass/inject_virtual_thread.cc | 112 +++----
src/pass/inline.cc | 8 +-
src/pass/ir_deep_compare.cc | 148 ++++-----
src/pass/ir_functor.cc | 208 ++++++------
src/pass/ir_util.cc | 24 +-
src/pass/ir_util.h | 22 +-
src/pass/lift_attr_scope.cc | 32 +-
src/pass/loop_partition.cc | 92 +++---
src/pass/lower_custom_datatypes.cc | 50 +--
src/pass/lower_intrin.cc | 52 +--
src/pass/lower_thread_allreduce.cc | 80 ++---
src/pass/lower_tvm_builtin.cc | 114 +++----
src/pass/lower_warp_memory.cc | 54 ++--
src/pass/make_api.cc | 72 ++---
src/pass/remap_thread_axis.cc | 12 +-
src/pass/remove_no_op.cc | 46 +--
src/pass/rewrite_unsafe_select.cc | 72 ++---
src/pass/simple_passes.cc | 36 +--
src/pass/skip_assert.cc | 4 +-
src/pass/split_host_device.cc | 42 +--
src/pass/ssa.cc | 72 ++---
src/pass/storage_access.cc | 60 ++--
src/pass/storage_access.h | 24 +-
src/pass/storage_flatten.cc | 92 +++---
src/pass/storage_rewrite.cc | 204 ++++++------
src/pass/storage_sync.cc | 66 ++--
src/pass/tensor_core.cc | 234 +++++++-------
src/pass/unroll_loop.cc | 24 +-
src/pass/vectorize_loop.cc | 152 ++++-----
src/pass/verify_compact_buffer.cc | 2 +-
src/pass/verify_gpu_code.cc | 20 +-
src/pass/verify_memory.cc | 26 +-
src/relay/backend/build_module.cc | 4 +-
src/relay/backend/compile_engine.cc | 18 +-
src/relay/backend/contrib/codegen_c/codegen_c.h | 5 +-
src/relay/backend/contrib/dnnl/codegen.cc | 8 +-
src/relay/backend/graph_runtime_codegen.cc | 4 +-
src/relay/backend/vm/lambda_lift.cc | 2 +-
src/relay/backend/vm/removed_unused_funcs.cc | 2 +-
src/relay/ir/alpha_equal.cc | 2 +-
src/relay/ir/expr.cc | 6 +-
src/relay/ir/hash.cc | 4 +-
src/relay/ir/pretty_printer.cc | 10 +-
src/relay/op/memory/memory.cc | 2 +-
src/relay/op/nn/convolution.cc | 4 +-
src/relay/op/nn/convolution.h | 10 +-
src/relay/op/nn/nn.cc | 2 +-
src/relay/op/nn/pad.cc | 4 +-
src/relay/op/nn/pooling.cc | 6 +-
src/relay/op/nn/upsampling.cc | 10 +-
src/relay/op/tensor/reduce.cc | 2 +-
src/relay/op/tensor/transform.cc | 26 +-
src/relay/pass/alter_op_layout.cc | 2 +-
src/relay/pass/canonicalize_cast.cc | 2 +-
src/relay/pass/canonicalize_ops.cc | 2 +-
src/relay/pass/combine_parallel_conv2d.cc | 2 +-
src/relay/pass/combine_parallel_dense.cc | 2 +-
src/relay/pass/combine_parallel_op_batch.cc | 2 +-
src/relay/pass/convert_layout.cc | 4 +-
src/relay/pass/device_annotation.cc | 2 +-
src/relay/pass/eliminate_common_subexpr.cc | 2 +-
src/relay/pass/fold_constant.cc | 4 +-
src/relay/pass/fold_scale_axis.cc | 4 +-
src/relay/pass/fuse_ops.cc | 2 +-
src/relay/pass/infer_layout_util.h | 6 +-
src/relay/pass/legalize.cc | 2 +-
src/relay/pass/mac_count.cc | 26 +-
src/relay/pass/pass_manager.cc | 8 +-
src/relay/pass/pattern_util.h | 2 +-
src/relay/pass/simplify_inference.cc | 2 +-
src/relay/pass/type_solver.cc | 12 +-
src/schedule/auto_inline_elem_wise.cc | 2 +-
src/schedule/bound.cc | 4 +-
src/schedule/graph.cc | 8 +-
src/schedule/message_passing.cc | 2 +-
src/schedule/schedule_dataflow_rewrite.cc | 76 ++---
src/schedule/schedule_lang.cc | 2 +-
src/schedule/schedule_ops.cc | 54 ++--
tests/cpp/attrs_test.cc | 2 +-
tests/cpp/container_test.cc | 4 +-
tests/cpp/expr_test.cc | 2 +-
tests/cpp/ir_functor_test.cc | 76 ++---
tests/cpp/ir_simplify_test.cc | 2 +-
tests/cpp/ir_ssa_test.cc | 6 +-
tests/cpp/packed_func_test.cc | 2 +-
tests/cpp/pattern_match_test.cc | 26 +-
topi/include/topi/detail/broadcast.h | 4 +-
topi/include/topi/detail/constant_utils.h | 12 +-
topi/include/topi/detail/extern.h | 18 +-
topi/include/topi/detail/tensor_utils.h | 2 +-
topi/include/topi/elemwise.h | 10 +-
topi/include/topi/nn.h | 8 +-
topi/include/topi/nn/pooling.h | 46 +--
topi/include/topi/reduction.h | 11 +-
topi/include/topi/transform.h | 8 +-
194 files changed, 3961 insertions(+), 3919 deletions(-)