Sign in
chromium
/
external
/
github.com
/
tensorflow
/
tensorflow
/
200f3a9b907427172cfad2d969aa9c69884c8dfd
/
.
/
tensorflow
/
compiler
/
xla
/
service
/
gpu
tree: 9a1fc294d07f82a44553c5dc2abbbabb1a350f87 [
path history
]
[
tgz
]
data/
llvm_gpu_backend/
runtime/
tests/
alias_passthrough_params.cc
alias_passthrough_params.h
alias_passthrough_params_test.cc
all_reduce_blueconnect.cc
all_reduce_blueconnect.h
all_reduce_blueconnect_test.cc
amdgpu_compiler.cc
amdgpu_compiler.h
amdgpu_compiler_registration.cc
backend_configs.proto
buffer_allocations.cc
buffer_allocations.h
buffer_comparator.cc
buffer_comparator.h
buffer_comparator_test.cc
BUILD
cholesky_thunk.cc
cholesky_thunk.h
conditional_thunk.cc
conditional_thunk.h
conv_layout_normalization.cc
conv_layout_normalization.h
conv_layout_normalization_test.cc
convolution_thunk.cc
convolution_thunk.h
copy_thunk.cc
copy_thunk.h
cublas_cudnn.cc
cublas_cudnn.h
cublas_lt_matmul_thunk.cc
cublas_lt_matmul_thunk.h
cublas_pad_for_gemms.cc
cublas_pad_for_gemms.h
cublas_pad_for_gemms_test.cc
cudnn_fused_conv_rewriter.cc
cudnn_fused_conv_rewriter.h
cudnn_fused_conv_rewriter_test.cc
cudnn_pad_for_convolutions.cc
cudnn_pad_for_convolutions.h
cudnn_pad_for_convolutions_test.cc
cudnn_simplify_padding.cc
cudnn_simplify_padding.h
cudnn_simplify_padding_test.cc
cudnn_support_utils.cc
cudnn_support_utils.h
cudnn_support_utils_test.cc
cudnn_vectorize_convolutions.cc
cudnn_vectorize_convolutions.h
cudnn_vectorize_convolutions_test.cc
cusolver_context.cc
cusolver_context.h
cusolver_rewriter.cc
cusolver_rewriter.h
custom_call_test.cc
custom_call_thunk.cc
custom_call_thunk.h
elemental_ir_emitter.cc
elemental_ir_emitter.h
executable.proto
fft_thunk.cc
fft_thunk.h
for_thunk.cc
for_thunk.h
fusion_merger.cc
fusion_merger.h
fusion_merger_test.cc
gemm_algorithm_picker.cc
gemm_algorithm_picker.h
gemm_broadcast_folding_rewriter.cc
gemm_broadcast_folding_rewriter.h
gemm_rewriter.cc
gemm_rewriter.h
gemm_thunk.cc
gemm_thunk.h
gpu_aot_compilation_test.cc
gpu_asm_opts_util.cc
gpu_asm_opts_util.h
gpu_autotuning.proto
gpu_compiler.cc
gpu_compiler.h
gpu_compiler_test.cc
gpu_constants.h
gpu_conv_algorithm_picker.cc
gpu_conv_algorithm_picker.h
gpu_conv_padding_legalization.cc
gpu_conv_padding_legalization.h
gpu_conv_padding_legalization_test.cc
gpu_conv_rewriter.cc
gpu_conv_rewriter.h
gpu_conv_rewriter_test.cc
gpu_conv_runner.cc
gpu_conv_runner.h
gpu_device_info.cc
gpu_device_info.h
gpu_executable.cc
gpu_executable.h
gpu_executable_run_options.cc
gpu_executable_run_options.h
gpu_fusible.cc
gpu_fusible.h
gpu_fusible_test.cc
gpu_hlo_cost_analysis.cc
gpu_hlo_cost_analysis.h
gpu_hlo_cost_analysis_test.cc
gpu_hlo_schedule.cc
gpu_hlo_schedule.h
gpu_hlo_schedule_test.cc
gpu_layout_assignment.cc
gpu_layout_assignment.h
gpu_layout_assignment_test.cc
gpu_performance_model.cc
gpu_performance_model.h
gpu_performance_model_test.cc
gpu_reduce_scatter_creator.cc
gpu_reduce_scatter_creator.h
gpu_sanitize_constant_names.cc
gpu_sanitize_constant_names.h
gpu_sanitize_constant_names_test.cc
gpu_scatter_expander.cc
gpu_scatter_expander.h
gpu_shape_verifier.cc
gpu_shape_verifier.h
gpu_transfer_manager.cc
gpu_transfer_manager.h
gpu_types.h
hlo_algorithm_denylist.cc
hlo_algorithm_denylist.h
hlo_algorithm_denylist_test.cc
hlo_fusion_stats.cc
hlo_fusion_stats.h
hlo_fusion_stats_test.cc
hlo_to_ir_bindings.cc
hlo_to_ir_bindings.h
horizontal_input_fusion.cc
horizontal_input_fusion.h
horizontal_input_fusion_test.cc
horizontal_loop_fusion.cc
horizontal_loop_fusion.h
horizontal_loop_fusion_test.cc
infeed_manager.cc
infeed_manager.h
infeed_thunk.cc
infeed_thunk.h
instruction_fusion.cc
instruction_fusion.h
instruction_fusion_test.cc
ir_emission_utils.cc
ir_emission_utils.h
ir_emission_utils_test.cc
ir_emitter.cc
ir_emitter.h
ir_emitter_context.cc
ir_emitter_context.h
ir_emitter_nested.cc
ir_emitter_nested.h
ir_emitter_unnested.cc
ir_emitter_unnested.h
jitrt_custom_calls.cc
jitrt_custom_calls.h
kernel_mapping_scheme.h
kernel_thunk.cc
kernel_thunk.h
launch_dimensions.cc
launch_dimensions.h
matmul_utils.cc
matmul_utils.h
matmul_utils_test.cc
memset_thunk.cc
memset_thunk.h
metrics.cc
metrics.h
move_copy_to_users.cc
move_copy_to_users.h
move_copy_to_users_test.cc
multi_output_fusion.cc
multi_output_fusion.h
multi_output_fusion_test.cc
nccl_all_gather_thunk.cc
nccl_all_gather_thunk.h
nccl_all_reduce_thunk.cc
nccl_all_reduce_thunk.h
nccl_all_to_all_thunk.cc
nccl_all_to_all_thunk.h
nccl_collective_permute_thunk.cc
nccl_collective_permute_thunk.h
nccl_collective_thunk.cc
nccl_collective_thunk.h
nccl_utils.cc
nccl_utils.h
nvptx_compiler.cc
nvptx_compiler.h
nvptx_compiler_registration.cc
nvptx_compiler_test.cc
nvptx_helper.cc
nvptx_helper.h
outfeed_manager.cc
outfeed_manager.h
outfeed_thunk.cc
outfeed_thunk.h
parallel_loop_emitter.cc
parallel_loop_emitter.h
precompiled_kernels.cc
precompiled_kernels.h
reduction_degenerate_dim_remover.cc
reduction_degenerate_dim_remover.h
reduction_dimension_grouper.cc
reduction_dimension_grouper.h
reduction_layout_normalizer.cc
reduction_layout_normalizer.h
reduction_splitter.cc
reduction_splitter.h
reduction_splitter_test.cc
replica_id_thunk.cc
replica_id_thunk.h
runtime_intrinsics.cc
runtime_intrinsics.h
scatter_slice_simplifier.cc
scatter_slice_simplifier.h
scatter_slice_simplifier_test.cc
sequential_thunk.cc
sequential_thunk.h
softmax_fusion.cc
softmax_fusion.h
softmax_fusion_test.cc
stream_executor_util.cc
stream_executor_util.h
target_constants.h
target_util.cc
target_util.h
target_util_test.cc
thunk.cc
thunk.h
tree_reduction_rewriter.cc
tree_reduction_rewriter.h
triangular_solve_rewriter.cc
triangular_solve_rewriter.h
triangular_solve_thunk.cc
triangular_solve_thunk.h
variadic_op_splitter.cc
variadic_op_splitter.h
variadic_op_splitter_test.cc
while_thunk.cc
while_thunk.h
while_transformer_test.cc
xfeed_queue.h
xla_executor_state.h