Name | Last modified | Size | Description | |
---|---|---|---|---|
Parent Directory | - | |||
address_computation_..> | 2024-10-20 16:17 | 3.2K | ||
algorithm_checker.h | 2024-10-20 16:17 | 1.8K | ||
alias_passthrough_pa..> | 2024-10-20 16:17 | 1.7K | ||
all_reduce_blueconne..> | 2024-10-20 16:17 | 1.9K | ||
autotuner_compile_ut..> | 2024-10-20 16:17 | 6.8K | ||
autotuner_util.h | 2024-10-20 16:17 | 11K | ||
backend_configs.pb.h | 2024-10-20 16:17 | 243K | ||
buffer_allocations.h | 2024-10-20 16:17 | 3.6K | ||
buffer_comparator.h | 2024-10-20 16:17 | 2.2K | ||
buffer_sharing.h | 2024-10-20 16:17 | 1.3K | ||
collective_permute_c..> | 2024-10-20 16:17 | 2.8K | ||
command_buffer_sched..> | 2024-10-20 16:17 | 5.4K | ||
compile_module_to_ll..> | 2024-10-20 16:17 | 2.8K | ||
conv_algorithm_picker.h | 2024-10-20 16:17 | 5.9K | ||
conv_layout_normaliz..> | 2024-10-20 16:17 | 1.1K | ||
copy_fusion.h | 2024-10-20 16:17 | 1.6K | ||
cub_sort_kernel.h | 2024-10-20 16:17 | 2.4K | ||
cublas_cudnn.h | 2024-10-20 16:17 | 8.6K | ||
cublas_pad_for_gemms.h | 2024-10-20 16:17 | 2.1K | ||
cublas_padding_requi..> | 2024-10-20 16:17 | 1.8K | ||
cudnn_fused_conv_rew..> | 2024-10-20 16:17 | 4.5K | ||
cudnn_fused_mha_rewr..> | 2024-10-20 16:17 | 2.1K | ||
cudnn_fused_mha_tran..> | 2024-10-20 16:17 | 1.5K | ||
cudnn_fusion_compiler.h | 2024-10-20 16:17 | 2.2K | ||
cudnn_norm_rewriter.h | 2024-10-20 16:17 | 1.7K | ||
cudnn_pad_for_convol..> | 2024-10-20 16:17 | 1.9K | ||
cudnn_simplify_paddi..> | 2024-10-20 16:17 | 2.7K | ||
cudnn_support_utils.h | 2024-10-20 16:17 | 3.2K | ||
cudnn_vectorize_conv..> | 2024-10-20 16:17 | 2.4K | ||
cudnn_workspace_rewr..> | 2024-10-20 16:17 | 1.9K | ||
cusolver_context.h | 2024-10-20 16:17 | 5.3K | ||
cusolver_rewriter.h | 2024-10-20 16:17 | 1.5K | ||
custom_kernel_fusion..> | 2024-10-20 16:17 | 3.1K | ||
dot_dimension_sorter.h | 2024-10-20 16:17 | 1.9K | ||
dot_operand_converter.h | 2024-10-20 16:17 | 1.5K | ||
dot_sparsity_rewriter.h | 2024-10-20 16:17 | 1.4K | ||
double_buffer_loop_u..> | 2024-10-20 16:17 | 2.8K | ||
elemental_ir_emitter.h | 2024-10-20 16:17 | 5.4K | ||
executable.pb.h | 2024-10-20 16:17 | 28K | ||
execution_stream_ass..> | 2024-10-20 16:17 | 3.5K | ||
fusion_merger.h | 2024-10-20 16:17 | 3.4K | ||
fusion_pipeline.h | 2024-10-20 16:17 | 1.5K | ||
fusion_process_dump...> | 2024-10-20 16:17 | 75K | ||
fusion_wrapper.h | 2024-10-20 16:17 | 1.5K | ||
fusions/ | 2024-10-20 16:17 | - | ||
gemm_algorithm_picker.h | 2024-10-20 16:17 | 2.3K | ||
gemm_broadcast_foldi..> | 2024-10-20 16:17 | 1.9K | ||
gemm_fusion.h | 2024-10-20 16:17 | 2.0K | ||
gemm_fusion_autotuner.h | 2024-10-20 16:17 | 5.0K | ||
gemm_rewriter.h | 2024-10-20 16:17 | 2.5K | ||
gemv_rewriter.h | 2024-10-20 16:17 | 1.5K | ||
gpu_algebraic_simpli..> | 2024-10-20 16:17 | 2.7K | ||
gpu_all_gather_optim..> | 2024-10-20 16:17 | 1.5K | ||
gpu_asm_opts_util.h | 2024-10-20 16:17 | 1.0K | ||
gpu_async_collective..> | 2024-10-20 16:17 | 1.7K | ||
gpu_autotuning.pb.h | 2024-10-20 16:17 | 56K | ||
gpu_compiler.h | 2024-10-20 16:17 | 10K | ||
gpu_constants.h | 2024-10-20 16:17 | 1.9K | ||
gpu_conv_padding_leg..> | 2024-10-20 16:17 | 2.0K | ||
gpu_conv_rewriter.h | 2024-10-20 16:17 | 2.0K | ||
gpu_conv_runner.h | 2024-10-20 16:17 | 9.7K | ||
gpu_convert_async_co..> | 2024-10-20 16:17 | 1.6K | ||
gpu_executable.h | 2024-10-20 16:17 | 12K | ||
gpu_executable_run_o..> | 2024-10-20 16:17 | 3.2K | ||
gpu_float_support.h | 2024-10-20 16:17 | 1.9K | ||
gpu_fused_mha_runner.h | 2024-10-20 16:17 | 16K | ||
gpu_fusible.h | 2024-10-20 16:17 | 10K | ||
gpu_hlo_schedule.h | 2024-10-20 16:17 | 1.6K | ||
gpu_layout_assignment.h | 2024-10-20 16:17 | 3.0K | ||
gpu_memory_space_ass..> | 2024-10-20 16:17 | 2.7K | ||
gpu_norm_runner.h | 2024-10-20 16:17 | 7.4K | ||
gpu_p2p_pipeliner.h | 2024-10-20 16:17 | 1.0K | ||
gpu_prim.h | 2024-10-20 16:17 | 4.1K | ||
gpu_reduce_scatter_c..> | 2024-10-20 16:17 | 1.5K | ||
gpu_sanitize_constan..> | 2024-10-20 16:17 | 1.5K | ||
gpu_scatter_expander.h | 2024-10-20 16:17 | 1.4K | ||
gpu_schedule_postpro..> | 2024-10-20 16:17 | 1.9K | ||
gpu_sort_rewriter.h | 2024-10-20 16:17 | 1.9K | ||
gpu_transfer_manager.h | 2024-10-20 16:17 | 6.7K | ||
gpu_windowed_einsum_..> | 2024-10-20 16:17 | 2.3K | ||
hlo_algorithm_denyli..> | 2024-10-20 16:17 | 1.1K | ||
hlo_fusion_analysis.h | 2024-10-20 16:17 | 5.0K | ||
hlo_fusion_stats.h | 2024-10-20 16:17 | 1.8K | ||
hlo_to_ir_bindings.h | 2024-10-20 16:17 | 3.3K | ||
hlo_traversal.h | 2024-10-20 16:17 | 7.8K | ||
horizontal_input_fus..> | 2024-10-20 16:17 | 2.4K | ||
horizontal_loop_fusi..> | 2024-10-20 16:17 | 5.7K | ||
infeed_manager.h | 2024-10-20 16:17 | 2.4K | ||
instruction_fusion.h | 2024-10-20 16:17 | 2.9K | ||
ir_emission_utils.h | 2024-10-20 16:17 | 10K | ||
ir_emitter.h | 2024-10-20 16:17 | 6.6K | ||
ir_emitter_context.h | 2024-10-20 16:17 | 6.0K | ||
ir_emitter_nested.h | 2024-10-20 16:17 | 3.5K | ||
ir_emitter_triton.h | 2024-10-20 16:17 | 7.4K | ||
ir_emitter_unnested.h | 2024-10-20 16:17 | 15K | ||
kernel_arguments.h | 2024-10-20 16:17 | 2.8K | ||
kernel_reuse_cache.h | 2024-10-20 16:17 | 3.1K | ||
kernels/ | 2024-10-20 16:17 | - | ||
launch_dimensions.h | 2024-10-20 16:17 | 4.6K | ||
llvm_gpu_backend/ | 2024-10-20 16:17 | - | ||
make_batch_pointers.h | 2024-10-20 16:17 | 2.3K | ||
matmul_utils.h | 2024-10-20 16:17 | 9.1K | ||
metrics.h | 2024-10-20 16:17 | 1.8K | ||
model/ | 2024-10-20 16:17 | - | ||
move_copy_to_users.h | 2024-10-20 16:17 | 1.4K | ||
multi_output_fusion.h | 2024-10-20 16:17 | 5.8K | ||
nvptx_compiler.h | 2024-10-20 16:17 | 7.3K | ||
outfeed_manager.h | 2024-10-20 16:17 | 2.6K | ||
parallel_loop_emitter.h | 2024-10-20 16:17 | 3.8K | ||
pipelined_p2p_rewrit..> | 2024-10-20 16:17 | 3.2K | ||
prepare_hlo_for_ir_e..> | 2024-10-20 16:17 | 1.3K | ||
priority_fusion.h | 2024-10-20 16:17 | 3.4K | ||
reduction_degenerate..> | 2024-10-20 16:17 | 1.8K | ||
reduction_dimension_..> | 2024-10-20 16:17 | 1.8K | ||
reduction_layout_nor..> | 2024-10-20 16:17 | 1.8K | ||
reduction_splitter.h | 2024-10-20 16:17 | 2.1K | ||
reduction_utils.h | 2024-10-20 16:17 | 4.0K | ||
rename_fusions.h | 2024-10-20 16:17 | 1.7K | ||
runtime/ | 2024-10-20 16:17 | - | ||
runtime_intrinsics.h | 2024-10-20 16:17 | 954 | ||
scatter_slice_simpli..> | 2024-10-20 16:17 | 2.3K | ||
softmax_rewriter_tri..> | 2024-10-20 16:17 | 3.3K | ||
split_k_gemm_rewriter.h | 2024-10-20 16:17 | 1.6K | ||
stream_attribute_ann..> | 2024-10-20 16:17 | 2.2K | ||
stream_attribute_asy..> | 2024-10-20 16:17 | 1.7K | ||
stream_executor_util.h | 2024-10-20 16:17 | 6.5K | ||
target_constants.h | 2024-10-20 16:17 | 2.4K | ||
target_util.h | 2024-10-20 16:17 | 3.1K | ||
topk_specializer.h | 2024-10-20 16:17 | 1.4K | ||
topk_splitter.h | 2024-10-20 16:17 | 1.7K | ||
tree_reduction_rewri..> | 2024-10-20 16:17 | 3.2K | ||
triangular_solve_rew..> | 2024-10-20 16:17 | 2.2K | ||
triton_call.h | 2024-10-20 16:17 | 1.3K | ||
triton_fusion_analys..> | 2024-10-20 16:17 | 5.9K | ||
triton_fusion_numeri..> | 2024-10-20 16:17 | 2.9K | ||
triton_support.h | 2024-10-20 16:17 | 2.7K | ||
triton_tiling_propag..> | 2024-10-20 16:17 | 11K | ||
variadic_op_splitter.h | 2024-10-20 16:17 | 1.5K | ||
variant_visitor.h | 2024-10-20 16:17 | 1.2K | ||
xfeed_queue.h | 2024-10-20 16:17 | 5.0K | ||
xla_executor_state.h | 2024-10-20 16:17 | 2.1K | ||