bu1 committed on
Commit
eb6e10c
·
verified ·
1 Parent(s): 3be7fe8

Upload model

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. modeling_IQtransformer.py +1 -1
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0086aa0b6c4b67c2d818b2038c0232b0c8d86445867f1d73489eb2e5f4bf41d
3
  size 79108
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7daa464c1cd2b8e003a3f0909c0531e2b1ec8c317d3f52402a1debd1a3e46260
3
  size 79108
modeling_IQtransformer.py CHANGED
@@ -228,7 +228,7 @@ class transformerModel(PreTrainedModel):
228
  # 因为位置编码值在-1和1之间,
229
  # 因此嵌入值乘以嵌入维度的平方根进行缩放,
230
  # 然后再与位置编码相加。
231
- X = self.ln(self.Linear(X))
232
  self.attention_weights = [None] * len(self.blks)
233
  for i, blk in enumerate(self.blks):
234
  X = blk(X, valid_lens)
 
228
  # 因为位置编码值在-1和1之间,
229
  # 因此嵌入值乘以嵌入维度的平方根进行缩放,
230
  # 然后再与位置编码相加。
231
+ X = self.ln(self.Linear(X).to(torch.float32))
232
  self.attention_weights = [None] * len(self.blks)
233
  for i, blk in enumerate(self.blks):
234
  X = blk(X, valid_lens)