|
.gitignore
|
updates from the chonker branch
|
2022-11-07 21:12:08 -08:00 |
|
amx.py
|
fixes (#1893)
|
2023-09-22 07:20:27 +08:00 |
|
cuda_matmul.py
|
fix cuda matmul (#2725)
|
2023-12-12 07:59:31 -08:00 |
|
gemm.c
|
only 62 gflops (#2629)
|
2023-12-05 13:28:24 -08:00 |
|
gemm.py
|
only 62 gflops (#2629)
|
2023-12-05 13:28:24 -08:00 |
|
hip_matmul.py
|
move dtypes to dtype.py (#2964)
|
2024-01-01 14:58:48 -08:00 |
|
jax_pmatmul.py
|
jax parallel matmul example
|
2023-11-28 13:48:11 -08:00 |
|
metal_conv.py
|
move device to device.py (#2466)
|
2023-11-27 11:34:37 -08:00 |
|
metal_matmul.py
|
move dtypes to dtype.py (#2964)
|
2024-01-01 14:58:48 -08:00 |
|
metal_matvec.py
|
move dtypes to dtype.py (#2964)
|
2024-01-01 14:58:48 -08:00 |
|
mlx_matmul.py
|
mlx benchmark, a lil slower than tg
|
2023-12-05 19:00:43 -08:00 |
|
simple_matmul.py
|
move dtypes to dtype.py (#2964)
|
2024-01-01 14:58:48 -08:00 |
|
tf_gemm.py
|
Add tensorflow GEMM benchmark script (#1000)
|
2023-06-18 10:57:45 -07:00 |
|
torch_gemm.py
|
faster RDNA assembly backend (#990)
|
2023-06-16 12:06:38 -07:00 |
|
tvm_gemm.py
|
fix tvm gemm example
|
2023-10-08 05:57:41 -07:00 |