Add SetFit model
Browse files- README.md +5 -4
- model_head.pkl +1 -1
README.md
CHANGED
@@ -88,11 +88,11 @@ preds = model("I loved the spiderman movie!")
|
|
88 |
## Training Details
|
89 |
|
90 |
### Training Hyperparameters
|
91 |
-
- batch_size: (
|
92 |
- num_epochs: (3, 3)
|
93 |
- max_steps: -1
|
94 |
- sampling_strategy: oversampling
|
95 |
-
- body_learning_rate: (
|
96 |
- head_learning_rate: 0.01
|
97 |
- loss: CosineSimilarityLoss
|
98 |
- distance_metric: cosine_distance
|
@@ -101,14 +101,15 @@ preds = model("I loved the spiderman movie!")
|
|
101 |
- use_amp: False
|
102 |
- warmup_proportion: 0.1
|
103 |
- l2_weight: 0.01
|
104 |
-
- seed:
|
105 |
- eval_max_steps: -1
|
106 |
- load_best_model_at_end: False
|
107 |
|
108 |
### Training Results
|
109 |
| Epoch | Step | Training Loss | Validation Loss |
|
110 |
|:------:|:----:|:-------------:|:---------------:|
|
111 |
-
| 0.
|
|
|
112 |
|
113 |
### Framework Versions
|
114 |
- Python: 3.11.4
|
|
|
88 |
## Training Details
|
89 |
|
90 |
### Training Hyperparameters
|
91 |
+
- batch_size: (8, 8)
|
92 |
- num_epochs: (3, 3)
|
93 |
- max_steps: -1
|
94 |
- sampling_strategy: oversampling
|
95 |
+
- body_learning_rate: (4.843982450599576e-05, 4.843982450599576e-05)
|
96 |
- head_learning_rate: 0.01
|
97 |
- loss: CosineSimilarityLoss
|
98 |
- distance_metric: cosine_distance
|
|
|
101 |
- use_amp: False
|
102 |
- warmup_proportion: 0.1
|
103 |
- l2_weight: 0.01
|
104 |
+
- seed: 36
|
105 |
- eval_max_steps: -1
|
106 |
- load_best_model_at_end: False
|
107 |
|
108 |
### Training Results
|
109 |
| Epoch | Step | Training Loss | Validation Loss |
|
110 |
|:------:|:----:|:-------------:|:---------------:|
|
111 |
+
| 0.0556 | 1 | 0.157 | - |
|
112 |
+
| 2.7778 | 50 | 0.2482 | - |
|
113 |
|
114 |
### Framework Versions
|
115 |
- Python: 3.11.4
|
model_head.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7067
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22113a402d7576b498ad3d18eaffbacce87ec50e34f9c366ebd5d7f887218fc8
|
3 |
size 7067
|