mirror of
https://github.com/matrix-construct/construct
synced 2024-11-15 22:41:12 +01:00
ircd::gpt::gpu: Add global fence between attn and ffnn accumulations (gfx1011).
This commit is contained in:
parent
c4cceb425c
commit
33afa8a4fc
1 changed file with 3 additions and 1 deletion
|
@@ -528,7 +528,9 @@ ircd_gpt_coil(__global struct ircd_gpt_ctrl *const ctrl,
|
|||
accum[wi].elem[li] = result;
|
||||
}
|
||||
|
||||
// Backend mlp; layer-norm acquires any pending writes, no fence required.
|
||||
barrier(CLK_GLOBAL_MEM_FENCE);
|
||||
|
||||
// Backend mlp
|
||||
ircd_gpt_ffnn
|
||||
(
|
||||
ctrl,
|
||||
|
|
Loading…
Reference in a new issue