tree: 3e504bacdef014f8ad834918d6f859e11bc1e6ef [path history] [tgz]
  1. data/
  2. ir/
  3. llvm_gpu_backend/
  4. tests/
  5. alias_passthrough_params.cc
  6. alias_passthrough_params.h
  7. alias_passthrough_params_test.cc
  8. amdgpu_compiler.cc
  9. amdgpu_compiler.h
  10. amdgpu_compiler_registration.cc
  11. backend_configs.proto
  12. buffer_allocations.cc
  13. buffer_allocations.h
  14. buffer_comparator.cc
  15. buffer_comparator.h
  16. buffer_comparator_test.cc
  17. BUILD
  18. cholesky_thunk.cc
  19. cholesky_thunk.h
  20. collective_permute_thunk.cc
  21. collective_permute_thunk.h
  22. conditional_thunk.cc
  23. conditional_thunk.h
  24. convolution_thunk.cc
  25. convolution_thunk.h
  26. copy_thunk.cc
  27. copy_thunk.h
  28. cublas_gemm_pad_for_tensor_cores.cc
  29. cublas_gemm_pad_for_tensor_cores.h
  30. cublas_gemm_pad_for_tensor_cores_test.cc
  31. cudnn_batchnorm_rewriter.cc
  32. cudnn_batchnorm_rewriter.h
  33. cudnn_batchnorm_runner.cc
  34. cudnn_batchnorm_runner.h
  35. cudnn_batchnorm_thunk.cc
  36. cudnn_batchnorm_thunk.h
  37. cudnn_fused_conv_rewriter.cc
  38. cudnn_fused_conv_rewriter.h
  39. cudnn_fused_conv_rewriter_test.cc
  40. cudnn_pad_for_convolutions.cc
  41. cudnn_pad_for_convolutions.h
  42. cudnn_pad_for_convolutions_test.cc
  43. cusolver_context.cc
  44. cusolver_context.h
  45. cusolver_rewriter.cc
  46. cusolver_rewriter.h
  47. custom_call_test.cc
  48. custom_call_thunk.cc
  49. custom_call_thunk.h
  50. dummy_all_reduce_thunk.cc
  51. elemental_ir_emitter.cc
  52. elemental_ir_emitter.h
  53. fft_thunk.cc
  54. fft_thunk.h
  55. for_thunk.cc
  56. for_thunk.h
  57. fusion_merger.cc
  58. fusion_merger.h
  59. fusion_merger_test.cc
  60. gemm_algorithm_picker.cc
  61. gemm_algorithm_picker.h
  62. gemm_rewriter.cc
  63. gemm_rewriter.h
  64. gemm_thunk.cc
  65. gemm_thunk.h
  66. gpu_autotuning.proto
  67. gpu_compiler.cc
  68. gpu_compiler.h
  69. gpu_constants.cc
  70. gpu_constants.h
  71. gpu_conv_algorithm_picker.cc
  72. gpu_conv_algorithm_picker.h
  73. gpu_conv_padding_legalization.cc
  74. gpu_conv_padding_legalization.h
  75. gpu_conv_rewriter.cc
  76. gpu_conv_rewriter.h
  77. gpu_conv_rewriter_test.cc
  78. gpu_conv_runner.cc
  79. gpu_conv_runner.h
  80. gpu_copy_insertion.cc
  81. gpu_copy_insertion.h
  82. gpu_debug_info_manager.cc
  83. gpu_debug_info_manager.h
  84. gpu_debug_info_manager_test.cc
  85. gpu_device_info.h
  86. gpu_executable.cc
  87. gpu_executable.h
  88. gpu_executable_run_options.cc
  89. gpu_executable_run_options.h
  90. gpu_fusible.cc
  91. gpu_fusible.h
  92. gpu_fusible_test.cc
  93. gpu_hlo_schedule.cc
  94. gpu_hlo_schedule.h
  95. gpu_hlo_schedule_test.cc
  96. gpu_layout_assignment.cc
  97. gpu_layout_assignment.h
  98. gpu_layout_assignment_test.cc
  99. gpu_sanitize_constant_names.cc
  100. gpu_sanitize_constant_names.h
  101. gpu_sanitize_constant_names_test.cc
  102. gpu_scatter_expander.cc
  103. gpu_scatter_expander.h
  104. gpu_transfer_manager.cc
  105. gpu_transfer_manager.h
  106. gpu_types.h
  107. hlo_algorithm_denylist.cc
  108. hlo_algorithm_denylist.h
  109. hlo_algorithm_denylist_test.cc
  110. hlo_execution_profiler.cc
  111. hlo_execution_profiler.h
  112. hlo_to_ir_bindings.cc
  113. hlo_to_ir_bindings.h
  114. horizontal_fusion.cc
  115. horizontal_fusion.h
  116. horizontal_fusion_test.cc
  117. infeed_manager.cc
  118. infeed_manager.h
  119. infeed_thunk.cc
  120. infeed_thunk.h
  121. instruction_fusion.cc
  122. instruction_fusion.h
  123. instruction_fusion_test.cc
  124. ir_emission_utils.cc
  125. ir_emission_utils.h
  126. ir_emitter.cc
  127. ir_emitter.h
  128. ir_emitter_context.h
  129. ir_emitter_nested.cc
  130. ir_emitter_nested.h
  131. ir_emitter_unnested.cc
  132. ir_emitter_unnested.h
  133. kernel_mapping_scheme.h
  134. kernel_thunk.cc
  135. kernel_thunk.h
  136. launch_dimensions.cc
  137. launch_dimensions.h
  138. memset_thunk.cc
  139. memset_thunk.h
  140. multi_output_fusion.cc
  141. multi_output_fusion.h
  142. multi_output_fusion_test.cc
  143. nccl_all_reduce_thunk.cc
  144. nccl_all_reduce_thunk.h
  145. nvptx_compiler.cc
  146. nvptx_compiler.h
  147. nvptx_compiler_registration.cc
  148. outfeed_manager.cc
  149. outfeed_manager.h
  150. outfeed_thunk.cc
  151. outfeed_thunk.h
  152. parallel_loop_emitter.cc
  153. parallel_loop_emitter.h
  154. reduction_degenerate_dim_remover.cc
  155. reduction_degenerate_dim_remover.h
  156. reduction_dimension_grouper.cc
  157. reduction_dimension_grouper.h
  158. reduction_layout_normalizer.cc
  159. reduction_layout_normalizer.h
  160. reduction_splitter.cc
  161. reduction_splitter.h
  162. reduction_splitter_test.cc
  163. replica_id_thunk.cc
  164. replica_id_thunk.h
  165. sequential_thunk.cc
  166. sequential_thunk.h
  167. stream_assignment.cc
  168. stream_assignment.h
  169. stream_assignment_test.cc
  170. stream_executor_util.cc
  171. stream_executor_util.h
  172. target_constants.h
  173. target_util.cc
  174. target_util.h
  175. thunk.cc
  176. thunk.h
  177. thunk_emitter.cc
  178. thunk_emitter.h
  179. thunk_schedule.cc
  180. thunk_schedule.h
  181. tree_reduction_rewriter.cc
  182. tree_reduction_rewriter.h
  183. triangular_solve_thunk.cc
  184. triangular_solve_thunk.h
  185. tuple_thunk.cc
  186. tuple_thunk.h
  187. variadic_op_splitter.cc
  188. variadic_op_splitter.h
  189. variadic_op_splitter_test.cc
  190. while_thunk.cc
  191. while_thunk.h
  192. while_transformer_test.cc
  193. xfeed_queue.h