Abdullah-Nazhat/Lite_Tensor_Mapper

Model card · Files and versions

Abdullah-Nazhat committed on Feb 24

Commit

208ef89

·

verified ·

1 Parent(s): a8c7584

Update litetensormapper.py

Files changed (1) hide show

litetensormapper.py +35 -12

litetensormapper.py CHANGED Viewed

@@ -2,8 +2,6 @@ import torch
 from torch import nn, Tensor
 class VecDyT(nn.Module):
     def __init__(self, input_shape):
@@ -24,14 +22,34 @@ class VecDyGeluSine(nn.Module):
         self.alpha = nn.Parameter(torch.randn(input_shape))
         self.beta = nn.Parameter(torch.randn(input_shape))
         self.gamma = nn.Parameter(torch.randn(1))
-        self.eta = nn.Parameter(torch.randn(1))
         self.gelu = nn.GELU()
     def forward(self, x):
-        x = self.gamma * self.gelu(self.alpha * x) + self.eta * torch.sin(self.beta * x)
         return x
 class TTT(nn.Module):
@@ -65,12 +83,12 @@ class TTT(nn.Module):
         return out
-class FFUnit(nn.Module):
     def __init__(self,dim):
         super().__init__()
-        self.proj =  nn.Linear(dim,dim,bias=False)
         self.modulate = VecDyGeluSine(dim)
@@ -91,24 +109,28 @@ class LiteTensorMapperBlock(nn.Module):
         self.norm_1 =  VecDyT(dim)
         self.norm_2 =  VecDyT(dim)
-        self.memory = TTT(dim)
         self.feedforward = FFUnit(dim)
     def forward(self, x):
-        memorypath, FeedForwardpath = x, x
         memorypath = self.norm_1(memorypath)
         memorypath = self.memory(memorypath)
-        FeedForwardpath = self.norm_2(FeedForwardpath)
-        FeedForwardpath = self.feedforward(FeedForwardpath)
-        x = memorypath + FeedForwardpath
         return x
@@ -123,4 +145,5 @@ class LiteTensorMapper(nn.Module):
     def forward(self, x):
-        return self.model(x)

 from torch import nn, Tensor
 class VecDyT(nn.Module):
     def __init__(self, input_shape):
         self.alpha = nn.Parameter(torch.randn(input_shape))
         self.beta = nn.Parameter(torch.randn(input_shape))
         self.gamma = nn.Parameter(torch.randn(1))
+        self.etta = nn.Parameter(torch.randn(1))
         self.gelu = nn.GELU()
     def forward(self, x):
+        x = self.gamma * self.gelu(self.alpha * x) + self.etta * torch.sin(self.beta * x)
         return x
+class FFUnit(nn.Module):
+    def __init__(self,dim):
+        super().__init__()
+        self.proj =  nn.Linear(dim,dim,bias=False)
+        self.modulate = VecDyGeluSine(dim)
+    def forward(self, x):
+        u, v = x, x
+        u = self.modulate(u)
+        v = self.proj(v)
+        g = u * v
+        return g
 class TTT(nn.Module):
         return out
+class FFUnit_TTT(nn.Module):
     def __init__(self,dim):
         super().__init__()
+        self.proj = TTT(dim)
         self.modulate = VecDyGeluSine(dim)
         self.norm_1 =  VecDyT(dim)
         self.norm_2 =  VecDyT(dim)
+        self.memory = FFUnit_TTT(dim)
         self.feedforward = FFUnit(dim)
     def forward(self, x):
+        memorypath,residual = x, x
         memorypath = self.norm_1(memorypath)
         memorypath = self.memory(memorypath)
+        x = memorypath + residual
+        FFpath, residual = x, x
+        FFpath = self.norm_2(FFpath)
+        FFpath = self.feedforward(FFpath)
+        x = FFpath + residual
         return x
     def forward(self, x):
+        return self.model(x)