0
0
Fork 0
mirror of https://github.com/matrix-construct/construct synced 2024-09-27 19:28:52 +02:00

ircd::gpt::gpu: Add global fence between attn and ffnn accumulations (gfx1011).

This commit is contained in:
Jason Volk 2022-10-05 17:33:44 +00:00
parent c4cceb425c
commit 33afa8a4fc

View file

@@ -528,7 +528,9 @@ ircd_gpt_coil(__global struct ircd_gpt_ctrl *const ctrl,
accum[wi].elem[li] = result;
}
-// Backend mlp; layer-norm acquires any pending writes, no fence required.
+barrier(CLK_GLOBAL_MEM_FENCE);
+// Backend mlp
ircd_gpt_ffnn
(
ctrl,