Upload model
Browse files
- README.md +5 -5
- config.json +1 -1
- generation_config.json +1 -1
- tf_model.h5 +1 -1
README.md
CHANGED
@@ -32,8 +32,8 @@ More information needed
|
|
32 |
### Training hyperparameters
|
33 |
|
34 |
The following hyperparameters were used during training:
|
35 |
-
- optimizer: {'name': 'AdamWeightDecay', 'learning_rate': {'class_name': 'WarmUp', 'config': {'initial_learning_rate': 5e-05, 'decay_schedule_fn': {'class_name': 'PolynomialDecay', 'config': {'initial_learning_rate': 5e-05, 'decay_steps':
|
36 |
-
- training_precision:
|
37 |
|
38 |
### Training results
|
39 |
|
@@ -41,7 +41,7 @@ The following hyperparameters were used during training:
|
|
41 |
|
42 |
### Framework versions
|
43 |
|
44 |
-
- Transformers 4.
|
45 |
-
- TensorFlow 2.
|
46 |
-
- Datasets 2.1
|
47 |
- Tokenizers 0.13.3
|
|
|
32 |
### Training hyperparameters
|
33 |
|
34 |
The following hyperparameters were used during training:
|
35 |
+
- optimizer: {'name': 'AdamWeightDecay', 'learning_rate': {'class_name': 'WarmUp', 'config': {'initial_learning_rate': 5e-05, 'decay_schedule_fn': {'class_name': 'PolynomialDecay', 'config': {'initial_learning_rate': 5e-05, 'decay_steps': 7623, 'end_learning_rate': 0.0, 'power': 1.0, 'cycle': False, 'name': None}, '__passive_serialization__': True}, 'warmup_steps': 1000, 'power': 1.0, 'name': None}}, 'decay': 0.0, 'beta_1': 0.9, 'beta_2': 0.999, 'epsilon': 1e-08, 'amsgrad': False, 'weight_decay_rate': 0.01}
|
36 |
+
- training_precision: float32
|
37 |
|
38 |
### Training results
|
39 |
|
|
|
41 |
|
42 |
### Framework versions
|
43 |
|
44 |
+
- Transformers 4.31.0
|
45 |
+
- TensorFlow 2.12.0
|
46 |
+
- Datasets 2.13.1
|
47 |
- Tokenizers 0.13.3
|
config.json
CHANGED
@@ -44,7 +44,7 @@
|
|
44 |
"max_length": 50
|
45 |
}
|
46 |
},
|
47 |
-
"transformers_version": "4.
|
48 |
"use_cache": true,
|
49 |
"vocab_size": 50003
|
50 |
}
|
|
|
44 |
"max_length": 50
|
45 |
}
|
46 |
},
|
47 |
+
"transformers_version": "4.31.0",
|
48 |
"use_cache": true,
|
49 |
"vocab_size": 50003
|
50 |
}
|
generation_config.json
CHANGED
@@ -3,5 +3,5 @@
|
|
3 |
"bos_token_id": 1,
|
4 |
"eos_token_id": 2,
|
5 |
"pad_token_id": 3,
|
6 |
-
"transformers_version": "4.
|
7 |
}
|
|
|
3 |
"bos_token_id": 1,
|
4 |
"eos_token_id": 2,
|
5 |
"pad_token_id": 3,
|
6 |
+
"transformers_version": "4.31.0"
|
7 |
}
|
tf_model.h5
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 326965184
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9faeaaa945c5f711617c85af1c061d07631d8c1e33ca18435c8ec0a0320de85d
|
3 |
size 326965184
|