Yuchan
committed on
Update Model.py
Browse files
Model.py
CHANGED
|
@@ -191,10 +191,12 @@ class Lo(layers.Layer):
|
|
| 191 |
super().__init__()
|
| 192 |
self.d = layers.Dense(256, activation='silu')
|
| 193 |
self.w = layers.Dense(d_model)
|
|
|
|
|
|
|
| 194 |
def call(self, x):
|
| 195 |
p = self.d(x)
|
| 196 |
p = self.w(p)
|
| 197 |
-
return p + x
|
| 198 |
|
| 199 |
class Block(layers.Layer):
|
| 200 |
def __init__(self, d_model):
|
|
@@ -256,7 +258,7 @@ model = ReLM(
|
|
| 256 |
vocab_size=vocab_size,
|
| 257 |
max_seq_len=max_len,
|
| 258 |
d_model=700,
|
| 259 |
-
n_layers=
|
| 260 |
)
|
| 261 |
|
| 262 |
# 옵티마이저 설정
|
|
|
|
| 191 |
super().__init__()
|
| 192 |
self.d = layers.Dense(256, activation='silu')
|
| 193 |
self.w = layers.Dense(d_model)
|
| 194 |
+
self.norm = layers.LayerNormalization(epsilon=1e-5, dtype='float32')
|
| 195 |
+
|
| 196 |
def call(self, x):
|
| 197 |
p = self.d(x)
|
| 198 |
p = self.w(p)
|
| 199 |
+
return self.norm(p) + x
|
| 200 |
|
| 201 |
class Block(layers.Layer):
|
| 202 |
def __init__(self, d_model):
|
|
|
|
| 258 |
vocab_size=vocab_size,
|
| 259 |
max_seq_len=max_len,
|
| 260 |
d_model=700,
|
| 261 |
+
n_layers=16
|
| 262 |
)
|
| 263 |
|
| 264 |
# 옵티마이저 설정
|