Commit 3a2e4799 authored by novelailab

k

parent 3b246976
......@@ -260,7 +260,6 @@ class GPTLayer(nn.Module):
x = attn_out + ff_out + residual
#x = residual + attn_out + ff_out -> doesn't match.
if hypernetwork and layer_id % every_n == 0:
#if hypernetwork and layer_id % 5 == 0:
x = x + hyper_out
return x
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment