seanfarrell committed on
Commit
5f0c21c
·
verified ·
1 Parent(s): de18e88

Upload folder using huggingface_hub

Browse files
Files changed (7) hide show
  1. config.json +8 -12
  2. model.safetensors +2 -2
  3. optimizer.pt +2 -2
  4. rng_state.pth +2 -2
  5. scheduler.pt +2 -2
  6. trainer_state.json +49 -38
  7. training_args.bin +2 -2
config.json CHANGED
@@ -4,6 +4,7 @@
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
 
7
  "gradient_checkpointing": false,
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
@@ -11,21 +12,17 @@
11
  "id2label": {
12
  "0": "O",
13
  "1": "B-DISEASE",
14
- "2": "B-ETIOLOGY",
15
- "3": "B-SYMPTOM",
16
- "4": "I-DISEASE",
17
- "5": "I-ETIOLOGY",
18
- "6": "I-SYMPTOM"
19
  },
20
  "initializer_range": 0.02,
21
  "intermediate_size": 3072,
22
  "label2id": {
23
  "B-DISEASE": 1,
24
- "B-ETIOLOGY": 2,
25
- "B-SYMPTOM": 3,
26
- "I-DISEASE": 4,
27
- "I-ETIOLOGY": 5,
28
- "I-SYMPTOM": 6,
29
  "O": 0
30
  },
31
  "layer_norm_eps": 1e-12,
@@ -35,8 +32,7 @@
35
  "num_hidden_layers": 12,
36
  "pad_token_id": 0,
37
  "position_embedding_type": "absolute",
38
- "torch_dtype": "float32",
39
- "transformers_version": "4.55.0",
40
  "type_vocab_size": 2,
41
  "use_cache": true,
42
  "vocab_size": 28996
 
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
7
+ "dtype": "float32",
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
 
12
  "id2label": {
13
  "0": "O",
14
  "1": "B-DISEASE",
15
+ "2": "B-SYMPTOMS",
16
+ "3": "I-DISEASE",
17
+ "4": "I-SYMPTOMS"
 
 
18
  },
19
  "initializer_range": 0.02,
20
  "intermediate_size": 3072,
21
  "label2id": {
22
  "B-DISEASE": 1,
23
+ "B-SYMPTOMS": 2,
24
+ "I-DISEASE": 3,
25
+ "I-SYMPTOMS": 4,
 
 
26
  "O": 0
27
  },
28
  "layer_norm_eps": 1e-12,
 
32
  "num_hidden_layers": 12,
33
  "pad_token_id": 0,
34
  "position_embedding_type": "absolute",
35
+ "transformers_version": "4.57.1",
 
36
  "type_vocab_size": 2,
37
  "use_cache": true,
38
  "vocab_size": 28996
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a116629a4282b83bbbc6ae5c0c78022c367c952f9b5770c0b4520893160417b0
3
- size 430923588
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:877c23e0bc64c21e732ba2494d57dae6b22eff75d32ebb79159819c0db88d1d4
3
+ size 430917436
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83814b56092b8cdda9bc091166b623666d463f1dbcd550dc0e134f3869075c12
3
- size 861970123
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29bd932a0a275eb9417464ef20427542b74c4034ae0c9880c44075cf5117848d
3
+ size 861954618
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea246aba954a9bf876500e5102a90bebac5164933d3a04b50d122d18b3a18191
3
- size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8330b00877817a60d41771d75796a9679cc8e49595b5165569b741d43c6c7e82
3
+ size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9dd985d9cb19185d3edca03f39c6fceda1b539da63f4d331013a5e66d0ebb15d
3
- size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:800e8b30f036bc34fdd1b14175c550852a73bd5d39d2a0dcaca1fcab37c037a6
3
+ size 1064
trainer_state.json CHANGED
@@ -1,61 +1,72 @@
1
  {
2
- "best_global_step": 63,
3
- "best_metric": 0.2536899447441101,
4
- "best_model_checkpoint": "projects/PetBERT_disease/model/checkpoint-63",
5
  "epoch": 4.0,
6
  "eval_steps": 500,
7
- "global_step": 252,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
12
  {
13
  "epoch": 1.0,
14
- "eval_f1": 0.5469600521701229,
15
- "eval_loss": 0.2536899447441101,
16
- "eval_precision": 0.6240827679507994,
17
- "eval_recall": 0.5707008372952973,
18
- "eval_runtime": 18.8855,
19
- "eval_samples_per_second": 72.437,
20
- "eval_steps_per_second": 2.277,
21
- "step": 63
22
  },
23
  {
24
  "epoch": 2.0,
25
- "eval_f1": 0.6530841773386488,
26
- "eval_loss": 0.2897721529006958,
27
- "eval_precision": 0.6121946789552213,
28
- "eval_recall": 0.7268689387271124,
29
- "eval_runtime": 18.8901,
30
- "eval_samples_per_second": 72.419,
31
- "eval_steps_per_second": 2.276,
32
- "step": 126
33
  },
34
  {
35
  "epoch": 3.0,
36
- "eval_f1": 0.6474491673607571,
37
- "eval_loss": 0.28480294346809387,
38
- "eval_precision": 0.613922648135192,
39
- "eval_recall": 0.7047525364262208,
40
- "eval_runtime": 18.8954,
41
- "eval_samples_per_second": 72.398,
42
- "eval_steps_per_second": 2.276,
43
- "step": 189
44
  },
45
  {
46
  "epoch": 4.0,
47
- "eval_f1": 0.6666160547465906,
48
- "eval_loss": 0.3676050901412964,
49
- "eval_precision": 0.643380757727672,
50
- "eval_recall": 0.7153767840809319,
51
- "eval_runtime": 18.886,
52
- "eval_samples_per_second": 72.435,
53
- "eval_steps_per_second": 2.277,
54
- "step": 252
55
  }
56
  ],
57
  "logging_steps": 500,
58
- "max_steps": 63000,
59
  "num_input_tokens_seen": 0,
60
  "num_train_epochs": 1000,
61
  "save_steps": 500,
@@ -80,7 +91,7 @@
80
  "attributes": {}
81
  }
82
  },
83
- "total_flos": 2075835268767744.0,
84
  "train_batch_size": 32,
85
  "trial_name": null,
86
  "trial_params": null
 
1
  {
2
+ "best_global_step": 62,
3
+ "best_metric": 0.28845715522766113,
4
+ "best_model_checkpoint": "projects/PetBERT_disease/model/checkpoint-62",
5
  "epoch": 4.0,
6
  "eval_steps": 500,
7
+ "global_step": 248,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
+ {
13
+ "epoch": 0,
14
+ "eval_f1": 0.047209471302922856,
15
+ "eval_loss": 1.8303550481796265,
16
+ "eval_precision": 0.21319458797816965,
17
+ "eval_recall": 0.22196545377896099,
18
+ "eval_runtime": 7.4968,
19
+ "eval_samples_per_second": 182.477,
20
+ "eval_steps_per_second": 5.736,
21
+ "step": 0
22
+ },
23
  {
24
  "epoch": 1.0,
25
+ "eval_f1": 0.6576773743691161,
26
+ "eval_loss": 0.28845715522766113,
27
+ "eval_precision": 0.6425181973626329,
28
+ "eval_recall": 0.7232820624123552,
29
+ "eval_runtime": 7.4773,
30
+ "eval_samples_per_second": 182.955,
31
+ "eval_steps_per_second": 5.751,
32
+ "step": 62
33
  },
34
  {
35
  "epoch": 2.0,
36
+ "eval_f1": 0.6610305313525668,
37
+ "eval_loss": 0.36211177706718445,
38
+ "eval_precision": 0.6395951146577501,
39
+ "eval_recall": 0.7429373450761562,
40
+ "eval_runtime": 7.6395,
41
+ "eval_samples_per_second": 179.068,
42
+ "eval_steps_per_second": 5.629,
43
+ "step": 124
44
  },
45
  {
46
  "epoch": 3.0,
47
+ "eval_f1": 0.6550347805744801,
48
+ "eval_loss": 0.398381769657135,
49
+ "eval_precision": 0.6346157276309076,
50
+ "eval_recall": 0.7372202656188375,
51
+ "eval_runtime": 7.6479,
52
+ "eval_samples_per_second": 178.871,
53
+ "eval_steps_per_second": 5.622,
54
+ "step": 186
55
  },
56
  {
57
  "epoch": 4.0,
58
+ "eval_f1": 0.6557993066358558,
59
+ "eval_loss": 0.4582000970840454,
60
+ "eval_precision": 0.6258838857493523,
61
+ "eval_recall": 0.7362881327432333,
62
+ "eval_runtime": 7.6977,
63
+ "eval_samples_per_second": 177.716,
64
+ "eval_steps_per_second": 5.586,
65
+ "step": 248
66
  }
67
  ],
68
  "logging_steps": 500,
69
+ "max_steps": 62000,
70
  "num_input_tokens_seen": 0,
71
  "num_train_epochs": 1000,
72
  "save_steps": 500,
 
91
  "attributes": {}
92
  }
93
  },
94
+ "total_flos": 2069526443212800.0,
95
  "train_batch_size": 32,
96
  "trial_name": null,
97
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:749c49a6f77fe67d4230dd105f729ac9490a2f4a041ed0a6f305717d9657892a
3
- size 5713
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61e31ef5bbedfcada9aa3a3b84f81f075bc19130047acf8523a3eddf1b7042f2
3
+ size 5368