mirror of
https://github.com/tinygrad/tinygrad.git
synced 2026-06-24 02:14:17 +00:00
Fix double SDMA_OP_FENCE (#9705)
Introduced in #9585, probably when I incorrectly resolved a merge conflict while rebasing an old, MI300X-only branch. This seems to be the source of the multi-GPU beam llama hangs.
This commit is contained in:
parent
a6fec2f5ae
commit
5bd485c027
1 changed file with 0 additions and 1 deletion
|
|
@@ -339,7 +339,6 @@ class AMDCopyQueue(HWQueue):
|
|||
def signal(self, signal:AMDSignal, value:sint=0):
|
||||
fence_flags = self.sdma.SDMA_PKT_FENCE_HEADER_MTYPE(3) if self.dev.gfxver >= 10 else 0
|
||||
self.q(self.sdma.SDMA_OP_FENCE | fence_flags, *data64_le(signal.value_addr), value)
|
||||
- self.q(self.sdma.SDMA_OP_FENCE, *data64_le(signal.value_addr), value)
|
||||
|
||||
if not AMDDevice.driverless and (dev:=signal.timeline_for_device) is not None:
|
||||
self.q(self.sdma.SDMA_OP_FENCE | fence_flags, *data64_le(dev.queue_event_mailbox_ptr), dev.queue_event.event_id)
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue