.../acceptance_evaluator_agent

Files changed (5) hide show

README.md CHANGED Viewed

@@ -5,7 +5,7 @@ tags:
 - trl
 - sft
 - generated_from_trainer
-base_model: Hugofernandez/Mistral-7B-v0.1-colab-sharded
 model-index:
 - name: results
   results: []
@@ -16,7 +16,9 @@ should probably proofread and complete it, then remove this comment. -->
 # results
-This model is a fine-tuned version of [Hugofernandez/Mistral-7B-v0.1-colab-sharded](https://huggingface.co/Hugofernandez/Mistral-7B-v0.1-colab-sharded) on an unknown dataset.
 ## Model description
@@ -44,6 +46,13 @@ The following hyperparameters were used during training:
 - lr_scheduler_warmup_steps: 100
 - num_epochs: 1
 ### Framework versions
 - PEFT 0.10.0

 - trl
 - sft
 - generated_from_trainer
+base_model: cemuluoglakci/Mistral-7B-v0.1_optimized
 model-index:
 - name: results
   results: []
 # results
+This model is a fine-tuned version of [cemuluoglakci/Mistral-7B-v0.1_optimized](https://huggingface.co/cemuluoglakci/Mistral-7B-v0.1_optimized) on an unknown dataset.
+It achieves the following results on the evaluation set:
+- Loss: 0.5001
 ## Model description
 - lr_scheduler_warmup_steps: 100
 - num_epochs: 1
+### Training results
+| Training Loss | Epoch | Step | Validation Loss |
+|:-------------:|:-----:|:----:|:---------------:|
+| 0.5221        | 1.0   | 75   | 0.5001          |
 ### Framework versions
 - PEFT 0.10.0

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "Hugofernandez/Mistral-7B-v0.1-colab-sharded",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -21,13 +21,13 @@
   "revision": null,
   "target_modules": [
     "q_proj",
-    "up_proj",
-    "down_proj",
-    "lm_head",
-    "gate_proj",
     "o_proj",
     "k_proj",
-    "v_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "cemuluoglakci/Mistral-7B-v0.1_optimized",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "revision": null,
   "target_modules": [
     "q_proj",
+    "v_proj",
     "o_proj",
+    "gate_proj",
     "k_proj",
+    "down_proj",
+    "lm_head",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:452d34be20aacd08345ba03b4acaa0d3053543f60787992246a5bb05e06a0811
 size 694431312

 version https://git-lfs.github.com/spec/v1
+oid sha256:c3fc5cc4fcba88c5887b8348d73c0567571132ddc59185784c7e35a635fa1010
 size 694431312

runs/Apr03_21-08-35_d77cb52e792b/events.out.tfevents.1712178606.d77cb52e792b.228.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c9406e217610bc4f41ec6bc56caeba8539416b24c4a84ef33500ba1064fa67bb
+size 6256

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7bff757043b101123b802ad6b509aa3c8404d4296859b8d5ef951ea7ecfd425a
 size 4856

 version https://git-lfs.github.com/spec/v1
+oid sha256:ad8b96b5b70ca432529d6ed2699d3f72aca75d25fd761bd088215e4f61da91eb
 size 4856