tree: a9d7b84b5e0efba73615164ff1a9a48be4fe761b [path history] [tgz]
  1. collectives/
  2. add_tracking_suffix_to_instruction_names.cc
  3. add_tracking_suffix_to_instruction_names.h
  4. add_tracking_suffix_to_instruction_names_test.cc
  5. algebraic_simplifier.cc
  6. algebraic_simplifier.h
  7. algebraic_simplifier_test.cc
  8. algorithm_checker.cc
  9. algorithm_checker.h
  10. alias_passthrough_params.cc
  11. alias_passthrough_params.h
  12. alias_passthrough_params_test.cc
  13. async_wrapper.cc
  14. async_wrapper.h
  15. async_wrapper_test.cc
  16. block_scaling_rewriter.cc
  17. block_scaling_rewriter.h
  18. block_scaling_rewriter_cudnn_test.cc
  19. block_scaling_rewriter_test.cc
  20. BUILD
  21. command_buffer_scheduling.cc
  22. command_buffer_scheduling.h
  23. command_buffer_scheduling_test.cc
  24. composite_rewriter.cc
  25. composite_rewriter.h
  26. composite_rewriter_test.cc
  27. conv_padding_legalization.cc
  28. conv_padding_legalization.h
  29. conv_padding_legalization_test.cc
  30. conv_rewriter.cc
  31. conv_rewriter.h
  32. conv_rewriter_test.cc
  33. copy_fusion.cc
  34. copy_fusion.h
  35. copy_fusion_test.cc
  36. cublas_gemm_rewriter_test.cc
  37. cublas_pad_for_gemms.cc
  38. cublas_pad_for_gemms.h
  39. cublas_pad_for_gemms_test.cc
  40. cudnn_custom_call_compiler.cc
  41. cudnn_custom_call_compiler.h
  42. cudnn_custom_call_converter.cc
  43. cudnn_custom_call_converter.h
  44. cudnn_custom_call_converter_test.cc
  45. cudnn_fused_conv_rewriter.cc
  46. cudnn_fused_conv_rewriter.h
  47. cudnn_fused_conv_rewriter_test.cc
  48. cudnn_fusion_compiler.cc
  49. cudnn_fusion_compiler.h
  50. cudnn_norm_rewriter.cc
  51. cudnn_norm_rewriter.h
  52. cudnn_norm_rewriter_test.cc
  53. cudnn_pad_for_convolutions.cc
  54. cudnn_pad_for_convolutions.h
  55. cudnn_pad_for_convolutions_test.cc
  56. cudnn_simplify_padding.cc
  57. cudnn_simplify_padding.h
  58. cudnn_simplify_padding_test.cc
  59. custom_kernel_fusion_rewriter.cc
  60. custom_kernel_fusion_rewriter.h
  61. custom_kernel_fusion_rewriter_test.cc
  62. dot_algorithm_rewriter.cc
  63. dot_algorithm_rewriter.h
  64. dot_dimension_sorter.cc
  65. dot_dimension_sorter.h
  66. dot_dimension_sorter_test.cc
  67. dot_normalizer.cc
  68. dot_normalizer.h
  69. dot_normalizer_test.cc
  70. dot_operand_converter.cc
  71. dot_operand_converter.h
  72. dot_operand_converter_test.cc
  73. dot_strength_reduction.cc
  74. dot_strength_reduction.h
  75. dot_strength_reduction_test.cc
  76. double_buffer_loop_unrolling.cc
  77. double_buffer_loop_unrolling.h
  78. double_buffer_loop_unrolling_test.cc
  79. dynamic_slice_fusion_rewriter.cc
  80. dynamic_slice_fusion_rewriter.h
  81. dynamic_slice_fusion_rewriter_test.cc
  82. explicit_collectives_group_async_wrapper.cc
  83. explicit_collectives_group_async_wrapper.h
  84. explicit_collectives_group_async_wrapper_test.cc
  85. explicit_stream_annotation_async_wrapper.cc
  86. explicit_stream_annotation_async_wrapper.h
  87. explicit_stream_annotation_async_wrapper_test.cc
  88. fusion_block_level_rewriter.cc
  89. fusion_block_level_rewriter.h
  90. fusion_block_level_rewriter_test.cc
  91. fusion_dynamic_memcpy_rewriter.cc
  92. fusion_dynamic_memcpy_rewriter.h
  93. fusion_dynamic_memcpy_rewriter_test.cc
  94. fusion_wrapper.cc
  95. fusion_wrapper.h
  96. fusion_wrapper_test.cc
  97. gemm_broadcast_folding_rewriter.cc
  98. gemm_broadcast_folding_rewriter.h
  99. gemm_broadcast_folding_rewriter_test.cc
  100. gemm_fusion.cc
  101. gemm_fusion.h
  102. gemm_fusion_swap_operands.cc
  103. gemm_fusion_swap_operands.h
  104. gemm_fusion_swap_operands_test.cc
  105. gemm_fusion_test.cc
  106. gemm_rewriter.cc
  107. gemm_rewriter.h
  108. gemm_rewriter_fp8_test.cc
  109. gemm_rewriter_test.cc
  110. gemm_rewriter_test_lib.cc
  111. gemm_rewriter_test_lib.h
  112. gemv_rewriter.cc
  113. gemv_rewriter.h
  114. gemv_rewriter_test.cc
  115. gpusolver_rewriter.cc
  116. gpusolver_rewriter.h
  117. gpusolver_rewriter_test.cc
  118. layout_assignment.cc
  119. layout_assignment.h
  120. layout_assignment_a100.hlo
  121. layout_assignment_h100.hlo
  122. layout_assignment_test.cc
  123. layout_assignment_v100.hlo
  124. move_copy_to_users.cc
  125. move_copy_to_users.h
  126. move_copy_to_users_test.cc
  127. multi_output_fusion.cc
  128. multi_output_fusion.h
  129. multi_output_fusion_test.cc
  130. nest_gemm_fusion.cc
  131. nest_gemm_fusion.h
  132. nest_gemm_fusion_test.cc
  133. pgle_accuracy_checker.cc
  134. pgle_accuracy_checker.h
  135. pgle_accuracy_checker_test.cc
  136. priority_fusion.cc
  137. priority_fusion.h
  138. priority_fusion_test.cc
  139. ragged_all_to_all_canonicalizer.cc
  140. ragged_all_to_all_canonicalizer.h
  141. ragged_all_to_all_canonicalizer_test.cc
  142. ragged_all_to_all_decomposer.cc
  143. ragged_all_to_all_decomposer.h
  144. ragged_all_to_all_decomposer_test.cc
  145. ragged_all_to_all_multi_host_decomposer.cc
  146. ragged_all_to_all_multi_host_decomposer.h
  147. ragged_all_to_all_multi_host_decomposer_test.cc
  148. README.md
  149. reduce_scatter_creator.cc
  150. reduce_scatter_creator.h
  151. reduce_scatter_creator_test.cc
  152. reduction_degenerate_dim_remover.cc
  153. reduction_degenerate_dim_remover.h
  154. reduction_degenerate_dim_remover_test.cc
  155. reduction_dimension_grouper.cc
  156. reduction_dimension_grouper.h
  157. reduction_dimension_grouper_test.cc
  158. reduction_layout_normalizer.cc
  159. reduction_layout_normalizer.h
  160. reduction_layout_normalizer_test.cc
  161. reduction_splitter.cc
  162. reduction_splitter.h
  163. reduction_splitter_test.cc
  164. rename_fusions.cc
  165. rename_fusions.h
  166. rename_fusions_test.cc
  167. sanitize_constant_names.cc
  168. sanitize_constant_names.h
  169. sanitize_constant_names_test.cc
  170. scalar_constant_sinker.cc
  171. scalar_constant_sinker.h
  172. scalar_constant_sinker_test.cc
  173. scaled_dot_rewriter.cc
  174. scaled_dot_rewriter.h
  175. scaled_dot_rewriter_test.cc
  176. scatter_expander.cc
  177. scatter_expander.h
  178. scatter_slice_simplifier.cc
  179. scatter_slice_simplifier.h
  180. scatter_slice_simplifier_test.cc
  181. scheduling_instruction_annotator.cc
  182. scheduling_instruction_annotator.h
  183. scheduling_instruction_annotator_test.cc
  184. softmax_rewriter_triton.cc
  185. softmax_rewriter_triton.h
  186. softmax_rewriter_triton_test.cc
  187. sort_rewriter.cc
  188. sort_rewriter.h
  189. sort_rewriter_test.cc
  190. splitk_rewriter.cc
  191. splitk_rewriter.h
  192. splitk_rewriter_test.cc
  193. stream_attribute_annotator.cc
  194. stream_attribute_annotator.h
  195. stream_attribute_annotator_test.cc
  196. stream_attribute_async_wrapper.cc
  197. stream_attribute_async_wrapper.h
  198. stream_attribute_async_wrapper_test.cc
  199. topk_specializer.cc
  200. topk_specializer.h
  201. topk_specializer_test.cc
  202. topk_splitter.cc
  203. topk_splitter.h
  204. topk_splitter_test.cc
  205. transpose_dimension_grouper.cc
  206. transpose_dimension_grouper.h
  207. transpose_dimension_grouper_test.cc
  208. tree_reduction_rewriter.cc
  209. tree_reduction_rewriter.h
  210. tree_reduction_rewriter_test.cc
  211. triangular_solve_rewriter.cc
  212. triangular_solve_rewriter.h
  213. triangular_solve_rewriter_test.cc
  214. triton_fusion_numerics_verifier.cc
  215. triton_fusion_numerics_verifier.h
  216. triton_fusion_numerics_verifier_test.cc
  217. variadic_op_splitter.cc
  218. variadic_op_splitter.h
  219. variadic_op_splitter_test.cc
  220. windowed_einsum_handler.cc
  221. windowed_einsum_handler.h
  222. windowed_einsum_handler_test.cc
third_party/xla/xla/service/gpu/transforms/README.md

This folder consolidates GPU-specific HLO transformation passes.