tree: 44ec355ea9c54c9c9635ed025698f5a71c7e101a [path history] [tgz]
  1. annotate_device_regions.cc
  2. annotate_irregular_loop.cc
  3. arg_binder.cc
  4. arg_binder.h
  5. bind_params.cc
  6. bind_target.cc
  7. bound_checker.cc
  8. combine_context_call.cc
  9. common_subexpr_elim.cc
  10. common_subexpr_elim.h
  11. common_subexpr_elim_tools.cc
  12. common_subexpr_elim_tools.h
  13. compact_buffer_region.cc
  14. convert_blocks_to_opaque.cc
  15. convert_for_loops_serial.cc
  16. decorate_device_scope.cc
  17. default_gpu_schedule.cc
  18. dtype_conversion.cc
  19. dtype_conversion.h
  20. extract_constants.cc
  21. flatten_buffer.cc
  22. force_narrow_index_to_i32.cc
  23. hoist_expression.cc
  24. inject_double_buffer.cc
  25. inject_permuted_layout.cc
  26. inject_ptx_async_copy.cc
  27. inject_ptx_ldg32.cc
  28. inject_rolling_buffer.cc
  29. inject_software_pipeline.cc
  30. inject_virtual_thread.cc
  31. inline_private_functions.cc
  32. ir_utils.cc
  33. ir_utils.h
  34. lift_thread_binding.cc
  35. loop_partition.cc
  36. lower_async_dma.cc
  37. lower_cross_thread_reduction.cc
  38. lower_custom_datatypes.cc
  39. lower_device_kernel_launch.cc
  40. lower_device_storage_access_info.cc
  41. lower_init_block.cc
  42. lower_intrin.cc
  43. lower_match_buffer.cc
  44. lower_opaque_block.cc
  45. lower_thread_allreduce.cc
  46. lower_tvm_builtin.cc
  47. lower_vtcm_alloc.cc
  48. lower_warp_memory.cc
  49. make_packed_api.cc
  50. make_unpacked_api.cc
  51. manifest_shared_memory_local_stage.cc
  52. memhammer_coalesce.cc
  53. memhammer_intermediate_stage.cc
  54. memhammer_lower_auto_copy.cc
  55. memhammer_rewrite_rule.h
  56. memhammer_tensorcore_rewrite.cc
  57. merge_shared_memory_allocations.cc
  58. narrow_datatype.cc
  59. plan_update_buffer_allocation_location.cc
  60. primfunc_utils.cc
  61. profile_instrumentation.cc
  62. reduce_branching_through_overcompute.cc
  63. remap_thread_axis.cc
  64. remove_assume.cc
  65. remove_no_op.cc
  66. remove_no_op.h
  67. remove_store_undef.cc
  68. remove_weight_layout_rewrite_block.cc
  69. renew_defs.cc
  70. renormalize_split_pattern.cc
  71. replace_global_vars.cc
  72. replace_selected_expr.cc
  73. replace_selected_expr.h
  74. rewrite_unsafe_select.cc
  75. simplify.cc
  76. simplify.h
  77. skip_assert.cc
  78. split_host_device.cc
  79. storage_access.cc
  80. storage_access.h
  81. storage_rewrite.cc
  82. tensorcore_infer_fragment.cc
  83. thread_storage_sync.cc
  84. transform_mma_buffer_layout.cc
  85. unify_thread_binding.cc
  86. unroll_loop.cc
  87. unsupported_dtype_legalize.cc
  88. update_pointer_storage_scope.cc
  89. update_pointer_storage_scope.h
  90. using_assume_to_reduce_branches.cc
  91. vectorize_loop.cc