mirror of
https://github.com/tinygrad/tinygrad.git
synced 2026-06-24 02:14:17 +00:00
enable float16 and unaligned vector load/store
This commit is contained in:
parent
6b7d75683f
commit
dacfa01c0d
1 changed files with 2 additions and 2 deletions
|
|
@ -157,8 +157,8 @@ def split_load_store(ctx:Renderer|None, ls:UOp, idx:UOp):
|
|||
elif isinstance(buf.dtype, ImageDType):
|
||||
lengths = [4]
|
||||
elif ctx is not None and CPU_X86:
|
||||
lengths = [4,2] if buf.dtype.base == dtypes.float32 else []
|
||||
#must_divide = False
|
||||
lengths = [8,4,2] if buf.dtype.base == dtypes.half else [4,2]
|
||||
must_divide = False
|
||||
elif ctx is not None and ctx.supports_float4:
|
||||
# TODO: a better way to get this than ctx
|
||||
lengths = [8,4,2] if buf.dtype.base == dtypes.half and getenv("ALLOW_HALF8") else ([16,8,4,2] if AMX else [4,2])
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue