Upload model
Browse files
- model.safetensors +1 -1
- modeling_IQtransformer.py +1 -1
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 79108
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7daa464c1cd2b8e003a3f0909c0531e2b1ec8c317d3f52402a1debd1a3e46260
|
3 |
size 79108
|
modeling_IQtransformer.py
CHANGED
@@ -228,7 +228,7 @@ class transformerModel(PreTrainedModel):
|
|
228 |
# 因为位置编码值在-1和1之间,
|
229 |
# 因此嵌入值乘以嵌入维度的平方根进行缩放,
|
230 |
# 然后再与位置编码相加。
|
231 |
-
X = self.ln(self.Linear(X))
|
232 |
self.attention_weights = [None] * len(self.blks)
|
233 |
for i, blk in enumerate(self.blks):
|
234 |
X = blk(X, valid_lens)
|
|
|
228 |
# 因为位置编码值在-1和1之间,
|
229 |
# 因此嵌入值乘以嵌入维度的平方根进行缩放,
|
230 |
# 然后再与位置编码相加。
|
231 |
+
X = self.ln(self.Linear(X).to(torch.float32))
|
232 |
self.attention_weights = [None] * len(self.blks)
|
233 |
for i, blk in enumerate(self.blks):
|
234 |
X = blk(X, valid_lens)
|