| Name | Last modified | Size | Description | |
|---|---|---|---|---|
| Parent Directory | - | |||
| __pycache__/ | 2025-09-24 17:10 | - | ||
| aoti_runtime/ | 2025-09-24 17:10 | - | ||
| cuda/ | 2025-09-24 17:10 | - | ||
| rocm/ | 2025-09-24 17:10 | - | ||
| xpu/ | 2025-09-24 17:10 | - | ||
| __init__.py | 2025-09-24 17:10 | 0 | ||
| mps_device_op_overri..> | 2025-09-24 17:10 | 483 | ||
| cpu_device_op_overri..> | 2025-09-24 17:10 | 659 | ||
| aoti_hipify_utils.py | 2025-09-24 17:10 | 1.3K | ||
| cpp_template.py | 2025-09-24 17:10 | 4.9K | ||
| cuda_combined_schedu..> | 2025-09-24 17:10 | 4.9K | ||
| block_analysis.py | 2025-09-24 17:10 | 6.7K | ||
| triton_split_scan.py | 2025-09-24 17:10 | 7.3K | ||
| triton_utils.py | 2025-09-24 17:10 | 7.4K | ||
| cpp_bmm_template.py | 2025-09-24 17:10 | 9.4K | ||
| debug_utils.py | 2025-09-24 17:10 | 11K | ||
| multi_kernel.py | 2025-09-24 17:10 | 16K | ||
| cpp_grouped_gemm_tem..> | 2025-09-24 17:10 | 20K | ||
| cpp_wrapper_gpu.py | 2025-09-24 17:10 | 22K | ||
| simd_kernel_features.py | 2025-09-24 17:10 | 24K | ||
| cpp_template_kernel.py | 2025-09-24 17:10 | 24K | ||
| memory_planning.py | 2025-09-24 17:10 | 25K | ||
| mps.py | 2025-09-24 17:10 | 27K | ||
| cpp_utils.py | 2025-09-24 17:10 | 30K | ||
| cpp_prefix.h | 2025-09-24 17:10 | 33K | ||
| cpp_wrapper_cpu_arra..> | 2025-09-24 17:10 | 39K | ||
| cpp_flex_attention_t..> | 2025-09-24 17:10 | 40K | ||
| triton_combo_kernel.py | 2025-09-24 17:10 | 41K | ||
| cpp_micro_gemm.py | 2025-09-24 17:10 | 58K | ||
| halide.py | 2025-09-24 17:10 | 62K | ||
| cpp_gemm_template.py | 2025-09-24 17:10 | 66K | ||
| simd.py | 2025-09-24 17:10 | 83K | ||
| common.py | 2025-09-24 17:10 | 93K | ||
| cpp_wrapper_cpu.py | 2025-09-24 17:10 | 107K | ||
| wrapper.py | 2025-09-24 17:10 | 115K | ||
| triton.py | 2025-09-24 17:10 | 173K | ||
| cpp.py | 2025-09-24 17:10 | 219K | ||