novelai-storage / Basedformer · Commits

Commit 44751bc6, authored May 09, 2022 by novelailab
parent 42870e7b

    config almost done

Showing 1 changed file with 4 additions and 8 deletions: basedformer/gptj.py (+4 −8)
--- a/basedformer/gptj.py
+++ b/basedformer/gptj.py
-from typing import KeysView
+from typing import Callable, KeysView
 from regex import D
 import torch
 import torch.nn as nn
 ...
@@ -148,7 +148,7 @@ class FeedForward(nn.Module):
 class GPTJLayer(nn.Module):
     def __init__(self, attn, ff, config):
         nn.Module.__init__(self)
-        self.ln_preattn = nn.LayerNorm(config.hidden_dim, eps=config.eps, device=config.device, dtype=config.type)
+        self.ln_preattn = nn.LayerNorm(config.hidden_dim, eps=config.eps, device=config.device, dtype=config.dtype)
         self.ff = ff(config)
         self.attn = attn(config)
         self.tick = True
 ...
@@ -253,12 +253,8 @@ class GPTJConfig:
     eps: float = 1e-5
     device: torch.device = torch.device('cuda')
     dtype: torch.dtype = torch.float16
-    Layer = GPTJLayer
+    Layer: nn.Module = GPTJLayer
-    activation = gelu_new
+    activation: Callable = gelu_new
-    def from_dict(self, config_dict):
-        for k, v in config_dict.items():
-            setattr(self, k, v)
 def load_gpt_j(path="models/6b", state_dict=None):
     config = {
 ...