selmamalak committed on
Commit
f2bb93f
·
verified ·
1 Parent(s): 6219941

Training complete for fold 8. Best accuracy: 0.9763

Browse files
README.md ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ license: apache-2.0
4
+ base_model: google/vit-base-patch16-224-in21k
5
+ tags:
6
+ - generated_from_trainer
7
+ datasets:
8
+ - medmnist-v2
9
+ metrics:
10
+ - accuracy
11
+ - precision
12
+ - recall
13
+ - f1
14
+ model-index:
15
+ - name: vit-base-patch16-224-in21k-bloodmnist-fold-8
16
+ results: []
17
+ ---
18
+
19
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
20
+ should probably proofread and complete it, then remove this comment. -->
21
+
22
+ # vit-base-patch16-224-in21k-bloodmnist-fold-8
23
+
24
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the medmnist-v2 dataset.
25
+ It achieves the following results on the evaluation set:
26
+ - Loss: 0.0810
27
+ - Accuracy: 0.9763
28
+ - Precision: 0.9753
29
+ - Recall: 0.9758
30
+ - F1: 0.9754
31
+
32
+ ## Model description
33
+
34
+ More information needed
35
+
36
+ ## Intended uses & limitations
37
+
38
+ More information needed
39
+
40
+ ## Training and evaluation data
41
+
42
+ More information needed
43
+
44
+ ## Training procedure
45
+
46
+ ### Training hyperparameters
47
+
48
+ The following hyperparameters were used during training:
49
+ - learning_rate: 0.005
50
+ - train_batch_size: 16
51
+ - eval_batch_size: 16
52
+ - seed: 42
53
+ - gradient_accumulation_steps: 4
54
+ - total_train_batch_size: 64
55
+ - optimizer: AdamW (OptimizerNames.ADAMW_TORCH) with betas=(0.9,0.999) and epsilon=1e-08; no additional optimizer arguments
56
+ - lr_scheduler_type: linear
57
+ - num_epochs: 10
58
+ - mixed_precision_training: Native AMP
59
+
60
+ ### Training results
61
+
62
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
63
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
64
+ | 0.478 | 1.0 | 196 | 0.2420 | 0.9140 | 0.9007 | 0.9087 | 0.8994 |
65
+ | 0.3796 | 2.0 | 392 | 0.2008 | 0.9271 | 0.9211 | 0.9354 | 0.9225 |
66
+ | 0.2443 | 3.0 | 588 | 0.1970 | 0.9359 | 0.9236 | 0.9235 | 0.9216 |
67
+ | 0.3441 | 4.0 | 784 | 0.2070 | 0.9359 | 0.9267 | 0.9406 | 0.9320 |
68
+ | 0.2523 | 5.0 | 980 | 0.1415 | 0.9517 | 0.9453 | 0.9502 | 0.9471 |
69
+ | 0.2062 | 6.0 | 1176 | 0.1345 | 0.9561 | 0.9510 | 0.9495 | 0.9492 |
70
+ | 0.2034 | 7.0 | 1372 | 0.1323 | 0.9535 | 0.9575 | 0.9420 | 0.9473 |
71
+ | 0.1798 | 8.0 | 1568 | 0.0902 | 0.9675 | 0.9629 | 0.9652 | 0.9639 |
72
+ | 0.1539 | 9.0 | 1764 | 0.0943 | 0.9684 | 0.9640 | 0.9705 | 0.9669 |
73
+ | 0.1262 | 10.0 | 1960 | 0.0810 | 0.9763 | 0.9753 | 0.9758 | 0.9754 |
74
+
75
+
76
+ ### Framework versions
77
+
78
+ - PEFT 0.15.2
79
+ - Transformers 4.52.4
80
+ - Pytorch 2.6.0+cu124
81
+ - Datasets 3.6.0
82
+ - Tokenizers 0.21.2
adapter_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "ViTForImageClassification",
5
+ "parent_library": "transformers.models.vit.modeling_vit"
6
+ },
7
+ "base_model_name_or_path": "google/vit-base-patch16-224-in21k",
8
+ "bias": "none",
9
+ "corda_config": null,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 16,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.1,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": [
25
+ "classifier"
26
+ ],
27
+ "peft_type": "LORA",
28
+ "r": 16,
29
+ "rank_pattern": {},
30
+ "revision": null,
31
+ "target_modules": [
32
+ "value",
33
+ "query"
34
+ ],
35
+ "task_type": null,
36
+ "trainable_token_indices": null,
37
+ "use_dora": false,
38
+ "use_rslora": false
39
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:574ffbe028d082fb607e76bfb12387988c68a38bd701b851c2dd826975a842b6
3
+ size 2391056
preprocessor_config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.5,
8
+ 0.5,
9
+ 0.5
10
+ ],
11
+ "image_processor_type": "ViTImageProcessor",
12
+ "image_std": [
13
+ 0.5,
14
+ 0.5,
15
+ 0.5
16
+ ],
17
+ "resample": 2,
18
+ "rescale_factor": 0.00392156862745098,
19
+ "size": {
20
+ "height": 224,
21
+ "width": 224
22
+ }
23
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:336af24c35808d7e3023f30a0a8b424840003f366ea5decfe69ac562011e4fd9
3
+ size 5496