karths committed on
Commit
5adfca4
·
verified ·
1 Parent(s): 083c005

Upload folder using huggingface_hub

Browse files
checkpoint-1840/config.json CHANGED
@@ -21,7 +21,7 @@
21
  "position_embedding_type": "absolute",
22
  "problem_type": "single_label_classification",
23
  "torch_dtype": "float32",
24
- "transformers_version": "4.35.0",
25
  "type_vocab_size": 1,
26
  "use_cache": true,
27
  "vocab_size": 50265
 
21
  "position_embedding_type": "absolute",
22
  "problem_type": "single_label_classification",
23
  "torch_dtype": "float32",
24
+ "transformers_version": "4.41.2",
25
  "type_vocab_size": 1,
26
  "use_cache": true,
27
  "vocab_size": 50265
checkpoint-1840/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65991d02e936acfa38384baa6366ba8a943dce353cb716b29a18650cfc29a590
3
  size 328492280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8488d3812cc2775f9fa8917117f100dfb69714e6a94cbb7a1eebc4b92e9e252
3
  size 328492280
checkpoint-1840/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b3b333c16839fa82647f5686e93d13f32b010d46765bab63ed8166643d38154
3
  size 657047610
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52788f424eefb5cb5b4b5e8c5e34d7fe1965f0084f3d39f164305cfd00fba1fa
3
  size 657047610
checkpoint-1840/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d167b935a74aa253d1aa8950b2f24089232dac154efb8ac3f4c8a615e8446dd
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:659caa9ad8524c5ba45bf7e5788de849dcce22cf5df8d2a6f7b9a59ecd318d58
3
  size 14244
checkpoint-1840/trainer_state.json CHANGED
@@ -9,29 +9,46 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.36,
 
13
  "learning_rate": 4.9800000000000004e-05,
14
- "loss": 0.0281,
15
  "step": 500
16
  },
17
  {
18
- "epoch": 2.71,
 
19
  "learning_rate": 3.4810224965023004e-05,
20
- "loss": 0.0472,
21
  "step": 1000
22
  },
23
  {
24
- "epoch": 4.07,
 
25
  "learning_rate": 7.614811590589446e-06,
26
- "loss": 0.0231,
27
  "step": 1500
28
  }
29
  ],
30
  "logging_steps": 500,
31
  "max_steps": 1840,
 
32
  "num_train_epochs": 5,
33
  "save_steps": 500,
 
 
 
 
 
 
 
 
 
 
 
 
34
  "total_flos": 1.5591942691405824e+16,
 
35
  "trial_name": null,
36
  "trial_params": null
37
  }
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 1.3568521031207599,
13
+ "grad_norm": 1.447092056274414,
14
  "learning_rate": 4.9800000000000004e-05,
15
+ "loss": 0.0263,
16
  "step": 500
17
  },
18
  {
19
+ "epoch": 2.7137042062415198,
20
+ "grad_norm": 18.664369583129883,
21
  "learning_rate": 3.4810224965023004e-05,
22
+ "loss": 0.0457,
23
  "step": 1000
24
  },
25
  {
26
+ "epoch": 4.07055630936228,
27
+ "grad_norm": 0.045205749571323395,
28
  "learning_rate": 7.614811590589446e-06,
29
+ "loss": 0.0204,
30
  "step": 1500
31
  }
32
  ],
33
  "logging_steps": 500,
34
  "max_steps": 1840,
35
+ "num_input_tokens_seen": 0,
36
  "num_train_epochs": 5,
37
  "save_steps": 500,
38
+ "stateful_callbacks": {
39
+ "TrainerControl": {
40
+ "args": {
41
+ "should_epoch_stop": false,
42
+ "should_evaluate": false,
43
+ "should_log": false,
44
+ "should_save": true,
45
+ "should_training_stop": true
46
+ },
47
+ "attributes": {}
48
+ }
49
+ },
50
  "total_flos": 1.5591942691405824e+16,
51
+ "train_batch_size": 32,
52
  "trial_name": null,
53
  "trial_params": null
54
  }
checkpoint-1840/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8482030ab2426c1370f4f8a5abc57fb9e3570c2d3f610e3261bf2a9bfa841aa0
3
- size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2f49eaa4bc8e46aafa72cc70e2c03820d95ffde8da5b6d004aa8848152170c2
3
+ size 5176
classification_report.json CHANGED
@@ -1 +1 @@
1
- {"0": {"precision": 0.9986559139784946, "recall": 0.9983204568357407, "f1-score": 0.9984881572316479, "support": 2977}, "1": {"precision": 0.9982853223593965, "recall": 0.9986277873070326, "f1-score": 0.9984565254673299, "support": 2915}, "accuracy": 0.9984725050916496, "macro avg": {"precision": 0.9984706181689456, "recall": 0.9984741220713866, "f1-score": 0.9984723413494889, "support": 5892}, "weighted avg": {"precision": 0.9984725679890731, "recall": 0.9984725050916496, "f1-score": 0.9984725077759473, "support": 5892}}
 
1
+ {"0": {"precision": 0.9996636394214599, "recall": 0.9983204568357407, "f1-score": 0.9989915966386554, "support": 2977}, "1": {"precision": 0.9982870846180198, "recall": 0.9996569468267581, "f1-score": 0.9989715461090161, "support": 2915}, "accuracy": 0.9989816700610998, "macro avg": {"precision": 0.9989753620197399, "recall": 0.9989887018312493, "f1-score": 0.9989815713738357, "support": 5892}, "weighted avg": {"precision": 0.9989826045857457, "recall": 0.9989816700610998, "f1-score": 0.998981676867118, "support": 5892}}
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "_name_or_path": "binary_classification_train_comp",
3
  "architectures": [
4
- "RobertaModel"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
@@ -21,7 +21,7 @@
21
  "position_embedding_type": "absolute",
22
  "problem_type": "single_label_classification",
23
  "torch_dtype": "float32",
24
- "transformers_version": "4.35.0",
25
  "type_vocab_size": 1,
26
  "use_cache": true,
27
  "vocab_size": 50265
 
1
  {
2
+ "_name_or_path": "distilroberta-base",
3
  "architectures": [
4
+ "RobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
 
21
  "position_embedding_type": "absolute",
22
  "problem_type": "single_label_classification",
23
  "torch_dtype": "float32",
24
+ "transformers_version": "4.41.2",
25
  "type_vocab_size": 1,
26
  "use_cache": true,
27
  "vocab_size": 50265
confusion_matrix.png CHANGED
detailed_confusion_matrix.png CHANGED
fold_results.json CHANGED
@@ -1,67 +1,67 @@
1
  {
2
  "0": {
3
- "eval_loss": 0.49251872301101685,
4
- "eval_precision": 0.8383937316356513,
5
- "eval_recall": 0.8806584362139918,
6
- "eval_acc": 0.8569489224503648,
7
- "eval_mcc": 0.7149044085568931,
8
- "eval_f1": 0.8590065228299046,
9
- "eval_auc": 0.9368403646060125,
10
- "eval_runtime": 43.2643,
11
- "eval_samples_per_second": 136.209,
12
- "eval_steps_per_second": 2.15,
13
- "epoch": 4.99
14
  },
15
  "1": {
16
- "eval_loss": 0.1094377413392067,
17
- "eval_precision": 0.9633649932157394,
18
- "eval_recall": 0.9742710120068611,
19
- "eval_acc": 0.96894620736467,
20
- "eval_mcc": 0.9379515794159662,
21
- "eval_f1": 0.9687873102507248,
22
- "eval_auc": 0.9945646576898399,
23
- "eval_runtime": 44.6925,
24
- "eval_samples_per_second": 131.857,
25
- "eval_steps_per_second": 2.081,
26
- "epoch": 4.99
27
  },
28
  "2": {
29
- "eval_loss": 0.03799332678318024,
30
- "eval_precision": 0.9870616275110657,
31
- "eval_recall": 0.9945111492281303,
32
- "eval_acc": 0.9908350305498982,
33
- "eval_mcc": 0.9816968472799382,
34
- "eval_f1": 0.9907723855092277,
35
- "eval_auc": 0.9989923317187055,
36
- "eval_runtime": 43.1075,
37
- "eval_samples_per_second": 136.682,
38
- "eval_steps_per_second": 2.157,
39
- "epoch": 4.99
40
  },
41
  "3": {
42
- "eval_loss": 0.01312282308936119,
43
- "eval_precision": 0.9958918178705922,
44
  "eval_recall": 0.9979416809605489,
45
- "eval_acc": 0.9969450101832994,
46
- "eval_mcc": 0.9938915364089936,
47
- "eval_f1": 0.9969156956819739,
48
- "eval_auc": 0.9997945368465266,
49
- "eval_runtime": 45.5654,
50
- "eval_samples_per_second": 129.309,
51
- "eval_steps_per_second": 2.041,
52
- "epoch": 4.99
53
  },
54
  "4": {
55
- "eval_loss": 0.005135194398462772,
56
- "eval_precision": 0.9982853223593965,
57
- "eval_recall": 0.9986277873070326,
58
- "eval_acc": 0.9984725050916496,
59
- "eval_mcc": 0.9969447402341746,
60
- "eval_f1": 0.9984565254673299,
61
- "eval_auc": 0.9999125369974838,
62
- "eval_runtime": 49.4472,
63
- "eval_samples_per_second": 119.157,
64
- "eval_steps_per_second": 1.881,
65
- "epoch": 4.99
66
  }
67
  }
 
1
  {
2
  "0": {
3
+ "eval_loss": 0.5038772225379944,
4
+ "eval_precision": 0.8480212836714334,
5
+ "eval_recall": 0.8744855967078189,
6
+ "eval_acc": 0.8603427795689802,
7
+ "eval_mcc": 0.7210887452562239,
8
+ "eval_f1": 0.8610501435083573,
9
+ "eval_auc": 0.9368668018595239,
10
+ "eval_runtime": 21.4451,
11
+ "eval_samples_per_second": 274.795,
12
+ "eval_steps_per_second": 4.337,
13
+ "epoch": 4.993215739484397
14
  },
15
  "1": {
16
+ "eval_loss": 0.1229735016822815,
17
+ "eval_precision": 0.9655525238744884,
18
+ "eval_recall": 0.9711835334476844,
19
+ "eval_acc": 0.9686068216528084,
20
+ "eval_mcc": 0.9372259408227088,
21
+ "eval_f1": 0.9683598426543527,
22
+ "eval_auc": 0.9929632053008512,
23
+ "eval_runtime": 20.9383,
24
+ "eval_samples_per_second": 281.446,
25
+ "eval_steps_per_second": 4.442,
26
+ "epoch": 4.993215739484397
27
  },
28
  "2": {
29
+ "eval_loss": 0.04947742819786072,
30
+ "eval_precision": 0.9823069071112623,
31
+ "eval_recall": 0.9903945111492282,
32
+ "eval_acc": 0.9864222674813307,
33
+ "eval_mcc": 0.9728761419175846,
34
+ "eval_f1": 0.9863341305090536,
35
+ "eval_auc": 0.999065851344009,
36
+ "eval_runtime": 21.3434,
37
+ "eval_samples_per_second": 276.057,
38
+ "eval_steps_per_second": 4.357,
39
+ "epoch": 4.993215739484397
40
  },
41
  "3": {
42
+ "eval_loss": 0.010631650686264038,
43
+ "eval_precision": 0.9955509924709104,
44
  "eval_recall": 0.9979416809605489,
45
+ "eval_acc": 0.9967752885268161,
46
+ "eval_mcc": 0.9935528293476538,
47
+ "eval_f1": 0.9967449032037006,
48
+ "eval_auc": 0.9999366786299306,
49
+ "eval_runtime": 22.1376,
50
+ "eval_samples_per_second": 266.153,
51
+ "eval_steps_per_second": 4.201,
52
+ "epoch": 4.993215739484397
53
  },
54
  "4": {
55
+ "eval_loss": 0.007078895810991526,
56
+ "eval_precision": 0.9982870846180198,
57
+ "eval_recall": 0.9996569468267581,
58
+ "eval_acc": 0.9989816700610998,
59
+ "eval_mcc": 0.9979640637618323,
60
+ "eval_f1": 0.9989715461090161,
61
+ "eval_auc": 0.999933221594258,
62
+ "eval_runtime": 22.6852,
63
+ "eval_samples_per_second": 259.728,
64
+ "eval_steps_per_second": 4.1,
65
+ "epoch": 4.993215739484397
66
  }
67
  }
metrics.json CHANGED
@@ -1 +1 @@
1
- {"precision": 0.9982853223593965, "recall": 0.9986277873070326, "acc": 0.9984725050916496, "mcc": 0.9969447402341746, "f1": 0.9984565254673299, "auc": 0.9999125369974838}
 
1
+ {"precision": 0.9982870846180198, "recall": 0.9996569468267581, "acc": 0.9989816700610998, "mcc": 0.9979640637618323, "f1": 0.9989715461090161, "auc": 0.999933221594258}
metrics_all_fold.json CHANGED
@@ -1,44 +1,44 @@
1
  {
2
  "precision": [
3
- 0.8383937316356513,
4
- 0.9633649932157394,
5
- 0.9870616275110657,
6
- 0.9958918178705922,
7
- 0.9982853223593965
8
  ],
9
  "recall": [
10
- 0.8806584362139918,
11
- 0.9742710120068611,
12
- 0.9945111492281303,
13
  0.9979416809605489,
14
- 0.9986277873070326
15
  ],
16
  "f1": [
17
- 0.8590065228299046,
18
- 0.9687873102507248,
19
- 0.9907723855092277,
20
- 0.9969156956819739,
21
- 0.9984565254673299
22
  ],
23
  "auc": [
24
- 0.9368403646060125,
25
- 0.9945646576898399,
26
- 0.9989923317187055,
27
- 0.9997945368465266,
28
- 0.9999125369974838
29
  ],
30
  "acc": [
31
- 0.8569489224503648,
32
- 0.96894620736467,
33
- 0.9908350305498982,
34
- 0.9969450101832994,
35
- 0.9984725050916496
36
  ],
37
  "mcc": [
38
- 0.7149044085568931,
39
- 0.9379515794159662,
40
- 0.9816968472799382,
41
- 0.9938915364089936,
42
- 0.9969447402341746
43
  ]
44
  }
 
1
  {
2
  "precision": [
3
+ 0.8480212836714334,
4
+ 0.9655525238744884,
5
+ 0.9823069071112623,
6
+ 0.9955509924709104,
7
+ 0.9982870846180198
8
  ],
9
  "recall": [
10
+ 0.8744855967078189,
11
+ 0.9711835334476844,
12
+ 0.9903945111492282,
13
  0.9979416809605489,
14
+ 0.9996569468267581
15
  ],
16
  "f1": [
17
+ 0.8610501435083573,
18
+ 0.9683598426543527,
19
+ 0.9863341305090536,
20
+ 0.9967449032037006,
21
+ 0.9989715461090161
22
  ],
23
  "auc": [
24
+ 0.9368668018595239,
25
+ 0.9929632053008512,
26
+ 0.999065851344009,
27
+ 0.9999366786299306,
28
+ 0.999933221594258
29
  ],
30
  "acc": [
31
+ 0.8603427795689802,
32
+ 0.9686068216528084,
33
+ 0.9864222674813307,
34
+ 0.9967752885268161,
35
+ 0.9989816700610998
36
  ],
37
  "mcc": [
38
+ 0.7210887452562239,
39
+ 0.9372259408227088,
40
+ 0.9728761419175846,
41
+ 0.9935528293476538,
42
+ 0.9979640637618323
43
  ]
44
  }
metrics_ci_bounds.json CHANGED
@@ -1,26 +1,26 @@
1
  {
2
  "precision": {
3
- "ci_lower": 0.872780485843686,
4
- "ci_upper": 1.0404185111932922
5
  },
6
  "recall": {
7
- "ci_lower": 0.9065070275143534,
8
- "ci_upper": 1.0318969987722724
9
  },
10
  "f1": {
11
- "ci_lower": 0.8892599568883727,
12
- "ci_upper": 1.0363154190072918
13
  },
14
  "auc": {
15
- "ci_lower": 0.9517755451801476,
16
- "ci_upper": 1.0202662259632802
17
  },
18
  "acc": {
19
- "ci_lower": 0.8877593873405121,
20
- "ci_upper": 1.0370996829154409
21
  },
22
  "mcc": {
23
- "ci_lower": 0.7762794118041381,
24
- "ci_upper": 1.0738762329542482
25
  }
26
  }
 
1
  {
2
  "precision": {
3
+ "ci_lower": 0.879964948964814,
4
+ "ci_upper": 1.035922567733632
5
  },
6
  "recall": {
7
+ "ci_lower": 0.9011847484720348,
8
+ "ci_upper": 1.0322801591647803
9
  },
10
  "f1": {
11
+ "ci_lower": 0.8904332620940503,
12
+ "ci_upper": 1.0341509642997417
13
  },
14
  "auc": {
15
+ "ci_lower": 0.9516280838265948,
16
+ "ci_upper": 1.0198782196648344
17
  },
18
  "acc": {
19
+ "ci_lower": 0.8899554874350446,
20
+ "ci_upper": 1.0344960434813693
21
  },
22
  "mcc": {
23
+ "ci_lower": 0.7802150047216826,
24
+ "ci_upper": 1.068868083720719
25
  }
26
  }
metrics_mean.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "precision": 0.956599498518489,
3
- "recall": 0.9692020131433129,
4
- "f1": 0.9627876879478322,
5
- "auc": 0.9860208855717139,
6
- "acc": 0.9624295351279765,
7
- "mcc": 0.9250778223791931
8
  }
 
1
  {
2
+ "precision": 0.957943758349223,
3
+ "recall": 0.9667324538184076,
4
+ "f1": 0.962292113196896,
5
+ "auc": 0.9857531517457145,
6
+ "acc": 0.9622257654582069,
7
+ "mcc": 0.9245415442212007
8
  }
metrics_std.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "precision": 0.06750539018289854,
3
- "recall": 0.050492714389445276,
4
- "f1": 0.05921709187495754,
5
- "auc": 0.027580199185211717,
6
- "acc": 0.060137161015769824,
7
- "mcc": 0.11983790364407107
8
  }
 
1
  {
2
+ "precision": 0.062801860646049,
3
+ "recall": 0.05279021171685444,
4
+ "f1": 0.05787302459183737,
5
+ "auc": 0.027483335240843117,
6
+ "acc": 0.058204375843795855,
7
+ "mcc": 0.11623638899759181
8
  }
metrics_visualisation.png CHANGED
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba78e30ea5990c11835a6c6a7b03ba0c39607b0f8c9d6e8cc10948f6eac8f978
3
- size 328485128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8488d3812cc2775f9fa8917117f100dfb69714e6a94cbb7a1eebc4b92e9e252
3
+ size 328492280
precision_recall_curve.png CHANGED
roc_curve.png CHANGED
test_top_repo_data.csv CHANGED
The diff for this file is too large to render. See raw diff
 
top_repo_data.csv CHANGED
The diff for this file is too large to render. See raw diff
 
tracker_carbon_statistics.json CHANGED
@@ -4,30 +4,30 @@
4
  "codecarbon_version": "2.3.4",
5
  "country_iso_code": "NOR",
6
  "country_name": "Norway",
7
- "cpu_count": 192,
8
- "cpu_energy": 0.13407618624252984,
9
- "cpu_model": "AMD EPYC 7642 48-Core Processor",
10
- "cpu_power": 115.58872123619882,
11
- "duration": 4398.068885803223,
12
- "emissions": 0.04812536324960169,
13
- "emissions_rate": 1.0942385055620274e-05,
14
- "energy_consumed": 1.7468371415463408,
15
- "gpu_count": 4,
16
- "gpu_energy": 1.1546827076343176,
17
- "gpu_model": "4 x NVIDIA GeForce RTX 3090",
18
- "gpu_power": 930.33821452628,
19
  "latitude": 59.9016,
20
  "longitude": 10.7343,
21
  "on_cloud": "N",
22
- "os": "Linux-4.18.0-513.18.1.el8_9.x86_64-x86_64-with-glibc2.28",
23
  "project_name": "codecarbon",
24
  "pue": 1.0,
25
  "python_version": "3.10.8",
26
- "ram_energy": 0.4580782476694937,
27
- "ram_power": 377.6938190460205,
28
- "ram_total_size": 1007.1835174560547,
29
  "region": "oslo county",
30
- "run_id": "e316b659-b759-4762-8600-b944027dd60d",
31
- "timestamp": "2024-04-05T15:17:11",
32
  "tracking_mode": "machine"
33
  }
 
4
  "codecarbon_version": "2.3.4",
5
  "country_iso_code": "NOR",
6
  "country_name": "Norway",
7
+ "cpu_count": 64,
8
+ "cpu_energy": 0.15794805491750952,
9
+ "cpu_model": "AMD EPYC 7282 16-Core Processor",
10
+ "cpu_power": 111.57651490678498,
11
+ "duration": 5100.969531536102,
12
+ "emissions": 0.036391987394340346,
13
+ "emissions_rate": 7.134327537020455e-06,
14
+ "energy_consumed": 1.320943281101283,
15
+ "gpu_count": 8,
16
+ "gpu_energy": 1.029562893927391,
17
+ "gpu_model": "8 x NVIDIA GeForce RTX 2080 Ti",
18
+ "gpu_power": 724.4046913237145,
19
  "latitude": 59.9016,
20
  "longitude": 10.7343,
21
  "on_cloud": "N",
22
+ "os": "Linux-4.18.0-513.11.1.el8_9.x86_64-x86_64-with-glibc2.28",
23
  "project_name": "codecarbon",
24
  "pue": 1.0,
25
  "python_version": "3.10.8",
26
+ "ram_energy": 0.1334323322563821,
27
+ "ram_power": 94.20606851577759,
28
+ "ram_total_size": 251.21618270874023,
29
  "region": "oslo county",
30
+ "run_id": "1db31b74-a004-4552-b529-cdbe2bc98c29",
31
+ "timestamp": "2024-10-18T12:07:48",
32
  "tracking_mode": "machine"
33
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8482030ab2426c1370f4f8a5abc57fb9e3570c2d3f610e3261bf2a9bfa841aa0
3
- size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2f49eaa4bc8e46aafa72cc70e2c03820d95ffde8da5b6d004aa8848152170c2
3
+ size 5176