tree: 9609ee5258f147b851ee9cb3d40041279f731ef3 [path history] [tgz]
  1. llvm_gpu_backend/
  2. tests/
  3. backend_configs.proto
  4. buffer_allocations.cc
  5. buffer_allocations.h
  6. buffer_comparator.cc
  7. buffer_comparator.h
  8. buffer_comparator_test.cc
  9. BUILD
  10. conditional_thunk.cc
  11. conditional_thunk.h
  12. convolution_thunk.cc
  13. convolution_thunk.h
  14. copy_thunk.cc
  15. copy_thunk.h
  16. cudnn_batchnorm_rewriter.cc
  17. cudnn_batchnorm_rewriter.h
  18. cudnn_batchnorm_thunk.cc
  19. cudnn_batchnorm_thunk.h
  20. cudnn_conv_algorithm_picker.cc
  21. cudnn_conv_algorithm_picker.h
  22. cudnn_conv_pad_for_tensor_cores.cc
  23. cudnn_conv_pad_for_tensor_cores.h
  24. cudnn_conv_pad_for_tensor_cores_test.cc
  25. cudnn_conv_padding_legalization.cc
  26. cudnn_conv_padding_legalization.h
  27. cudnn_conv_rewriter.cc
  28. cudnn_conv_rewriter.h
  29. cudnn_conv_rewriter_test.cc
  30. cudnn_conv_runner.cc
  31. cudnn_conv_runner.h
  32. cudnn_fused_conv_rewriter.cc
  33. cudnn_fused_conv_rewriter.h
  34. elemental_ir_emitter.cc
  35. elemental_ir_emitter.h
  36. fft_thunk.cc
  37. fft_thunk.h
  38. for_thunk.cc
  39. for_thunk.h
  40. fusion_merger.cc
  41. fusion_merger.h
  42. fusion_merger_test.cc
  43. gemm_thunk.cc
  44. gemm_thunk.h
  45. gpu_constants.cc
  46. gpu_constants.h
  47. gpu_copy_insertion.cc
  48. gpu_copy_insertion.h
  49. gpu_executable.cc
  50. gpu_executable.h
  51. gpu_fusible.cc
  52. gpu_fusible.h
  53. gpu_fusible_test.cc
  54. gpu_hlo_schedule.cc
  55. gpu_hlo_schedule.h
  56. gpu_hlo_schedule_test.cc
  57. gpu_hlo_support_checker.cc
  58. gpu_hlo_support_checker.h
  59. gpu_hlo_support_checker_test.cc
  60. gpu_layout_assignment.cc
  61. gpu_layout_assignment.h
  62. gpu_layout_assignment_test.cc
  63. gpu_transfer_manager.cc
  64. gpu_transfer_manager.h
  65. hlo_execution_profiler.cc
  66. hlo_execution_profiler.h
  67. hlo_to_ir_bindings.cc
  68. hlo_to_ir_bindings.h
  69. infeed_manager.cc
  70. infeed_manager.h
  71. infeed_thunk.cc
  72. infeed_thunk.h
  73. instruction_fusion.cc
  74. instruction_fusion.h
  75. instruction_fusion_test.cc
  76. ir_emission_utils.cc
  77. ir_emission_utils.h
  78. ir_emitter.cc
  79. ir_emitter.h
  80. ir_emitter_context.h
  81. ir_emitter_nested.cc
  82. ir_emitter_nested.h
  83. ir_emitter_unnested.cc
  84. ir_emitter_unnested.h
  85. kernel_thunk.cc
  86. kernel_thunk.h
  87. memset_thunk.cc
  88. memset_thunk.h
  89. multi_output_fusion.cc
  90. multi_output_fusion.h
  91. multi_output_fusion_test.cc
  92. nvptx_compiler.cc
  93. nvptx_compiler.h
  94. outfeed_manager.cc
  95. outfeed_manager.h
  96. outfeed_thunk.cc
  97. outfeed_thunk.h
  98. parallel_loop_emitter.cc
  99. parallel_loop_emitter.h
  100. partition_assignment.cc
  101. partition_assignment.h
  102. sequential_thunk.cc
  103. sequential_thunk.h
  104. stream_assignment.cc
  105. stream_assignment.h
  106. stream_assignment_test.cc
  107. stream_executor_util.cc
  108. stream_executor_util.h
  109. thunk.cc
  110. thunk.h
  111. thunk_schedule.cc
  112. thunk_schedule.h
  113. tuple_thunk.cc
  114. tuple_thunk.h
  115. while_thunk.cc
  116. while_thunk.h
  117. while_transformer_test.cc
  118. xfeed_queue.h