Marszzibros committed on
Commit
553a4a2
·
verified ·
1 Parent(s): ca958cb

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -25,74 +25,74 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "language_model.layers.4.self_attn.q_proj",
29
- "language_model.layers.16.self_attn.k_proj",
30
- "language_model.layers.33.self_attn.q_proj",
31
- "language_model.layers.31.self_attn.k_proj",
32
- "language_model.layers.29.self_attn.k_proj",
33
- "language_model.layers.10.self_attn.k_proj",
34
- "language_model.layers.2.self_attn.q_proj",
35
- "language_model.layers.19.self_attn.q_proj",
36
- "language_model.layers.0.self_attn.k_proj",
37
- "language_model.layers.11.self_attn.k_proj",
38
- "language_model.layers.1.self_attn.k_proj",
39
- "language_model.layers.14.self_attn.k_proj",
40
- "language_model.layers.20.self_attn.k_proj",
41
  "language_model.layers.12.self_attn.k_proj",
42
- "language_model.layers.27.self_attn.q_proj",
43
- "language_model.layers.14.self_attn.q_proj",
44
- "language_model.layers.15.self_attn.k_proj",
 
45
  "language_model.layers.7.self_attn.k_proj",
46
- "language_model.layers.20.self_attn.q_proj",
47
- "language_model.layers.19.self_attn.k_proj",
48
- "language_model.layers.17.self_attn.k_proj",
 
49
  "language_model.layers.12.self_attn.q_proj",
50
- "language_model.layers.23.self_attn.q_proj",
51
  "language_model.layers.24.self_attn.k_proj",
52
- "language_model.layers.1.self_attn.q_proj",
53
- "language_model.layers.0.self_attn.q_proj",
54
- "language_model.layers.22.self_attn.q_proj",
55
- "language_model.layers.13.self_attn.k_proj",
56
- "language_model.layers.28.self_attn.k_proj",
57
- "language_model.layers.30.self_attn.q_proj",
58
- "language_model.layers.33.self_attn.k_proj",
59
- "language_model.layers.2.self_attn.k_proj",
60
- "language_model.layers.24.self_attn.q_proj",
61
- "language_model.layers.21.self_attn.k_proj",
62
- "language_model.layers.23.self_attn.k_proj",
63
- "language_model.layers.4.self_attn.k_proj",
64
- "language_model.layers.3.self_attn.k_proj",
65
- "language_model.layers.28.self_attn.q_proj",
66
- "language_model.layers.6.self_attn.q_proj",
67
  "language_model.layers.8.self_attn.q_proj",
68
- "language_model.layers.9.self_attn.k_proj",
69
- "language_model.layers.13.self_attn.q_proj",
70
- "language_model.layers.25.self_attn.k_proj",
 
 
 
 
 
 
 
71
  "language_model.layers.27.self_attn.k_proj",
72
- "language_model.layers.9.self_attn.q_proj",
73
  "language_model.layers.8.self_attn.k_proj",
74
- "language_model.layers.3.self_attn.q_proj",
75
- "language_model.layers.7.self_attn.q_proj",
76
- "language_model.layers.11.self_attn.q_proj",
77
- "language_model.layers.16.self_attn.q_proj",
78
  "language_model.layers.18.self_attn.k_proj",
79
- "language_model.layers.26.self_attn.k_proj",
 
 
 
 
 
80
  "language_model.layers.5.self_attn.k_proj",
 
 
 
 
 
 
81
  "language_model.layers.22.self_attn.k_proj",
82
- "language_model.layers.32.self_attn.q_proj",
 
 
 
 
 
 
 
 
 
83
  "language_model.layers.32.self_attn.k_proj",
 
 
 
84
  "language_model.layers.26.self_attn.q_proj",
 
 
85
  "language_model.layers.6.self_attn.k_proj",
86
- "language_model.layers.21.self_attn.q_proj",
87
- "language_model.layers.10.self_attn.q_proj",
88
- "language_model.layers.5.self_attn.q_proj",
89
- "language_model.layers.25.self_attn.q_proj",
90
- "language_model.layers.18.self_attn.q_proj",
91
- "language_model.layers.30.self_attn.k_proj",
92
- "language_model.layers.15.self_attn.q_proj",
93
- "language_model.layers.17.self_attn.q_proj",
94
- "language_model.layers.29.self_attn.q_proj",
95
- "language_model.layers.31.self_attn.q_proj"
96
  ],
97
  "target_parameters": null,
98
  "task_type": "CAUSAL_LM",
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
+ "language_model.layers.2.self_attn.k_proj",
29
+ "language_model.layers.16.self_attn.q_proj",
30
+ "language_model.layers.3.self_attn.q_proj",
31
+ "language_model.layers.22.self_attn.q_proj",
 
 
 
 
 
 
 
 
 
32
  "language_model.layers.12.self_attn.k_proj",
33
+ "language_model.layers.0.self_attn.k_proj",
34
+ "language_model.layers.5.self_attn.q_proj",
35
+ "language_model.layers.31.self_attn.q_proj",
36
+ "language_model.layers.0.self_attn.q_proj",
37
  "language_model.layers.7.self_attn.k_proj",
38
+ "language_model.layers.9.self_attn.k_proj",
39
+ "language_model.layers.3.self_attn.k_proj",
40
+ "language_model.layers.13.self_attn.q_proj",
41
+ "language_model.layers.23.self_attn.k_proj",
42
  "language_model.layers.12.self_attn.q_proj",
43
+ "language_model.layers.20.self_attn.k_proj",
44
  "language_model.layers.24.self_attn.k_proj",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
45
  "language_model.layers.8.self_attn.q_proj",
46
+ "language_model.layers.23.self_attn.q_proj",
47
+ "language_model.layers.14.self_attn.k_proj",
48
+ "language_model.layers.15.self_attn.k_proj",
49
+ "language_model.layers.10.self_attn.k_proj",
50
+ "language_model.layers.26.self_attn.k_proj",
51
+ "language_model.layers.4.self_attn.k_proj",
52
+ "language_model.layers.11.self_attn.q_proj",
53
+ "language_model.layers.13.self_attn.k_proj",
54
+ "language_model.layers.18.self_attn.q_proj",
55
+ "language_model.layers.29.self_attn.q_proj",
56
  "language_model.layers.27.self_attn.k_proj",
57
+ "language_model.layers.30.self_attn.q_proj",
58
  "language_model.layers.8.self_attn.k_proj",
59
+ "language_model.layers.31.self_attn.k_proj",
60
+ "language_model.layers.28.self_attn.k_proj",
61
+ "language_model.layers.32.self_attn.q_proj",
 
62
  "language_model.layers.18.self_attn.k_proj",
63
+ "language_model.layers.20.self_attn.q_proj",
64
+ "language_model.layers.30.self_attn.k_proj",
65
+ "language_model.layers.21.self_attn.q_proj",
66
+ "language_model.layers.7.self_attn.q_proj",
67
+ "language_model.layers.19.self_attn.k_proj",
68
+ "language_model.layers.1.self_attn.q_proj",
69
  "language_model.layers.5.self_attn.k_proj",
70
+ "language_model.layers.25.self_attn.k_proj",
71
+ "language_model.layers.33.self_attn.q_proj",
72
+ "language_model.layers.6.self_attn.q_proj",
73
+ "language_model.layers.2.self_attn.q_proj",
74
+ "language_model.layers.14.self_attn.q_proj",
75
+ "language_model.layers.24.self_attn.q_proj",
76
  "language_model.layers.22.self_attn.k_proj",
77
+ "language_model.layers.4.self_attn.q_proj",
78
+ "language_model.layers.27.self_attn.q_proj",
79
+ "language_model.layers.19.self_attn.q_proj",
80
+ "language_model.layers.10.self_attn.q_proj",
81
+ "language_model.layers.17.self_attn.q_proj",
82
+ "language_model.layers.15.self_attn.q_proj",
83
+ "language_model.layers.16.self_attn.k_proj",
84
+ "language_model.layers.11.self_attn.k_proj",
85
+ "language_model.layers.17.self_attn.k_proj",
86
+ "language_model.layers.25.self_attn.q_proj",
87
  "language_model.layers.32.self_attn.k_proj",
88
+ "language_model.layers.28.self_attn.q_proj",
89
+ "language_model.layers.9.self_attn.q_proj",
90
+ "language_model.layers.21.self_attn.k_proj",
91
  "language_model.layers.26.self_attn.q_proj",
92
+ "language_model.layers.33.self_attn.k_proj",
93
+ "language_model.layers.1.self_attn.k_proj",
94
  "language_model.layers.6.self_attn.k_proj",
95
+ "language_model.layers.29.self_attn.k_proj"
 
 
 
 
 
 
 
 
 
96
  ],
97
  "target_parameters": null,
98
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:225642201f9d1c1bca8303db29b7dda867044e1847c4ba94bec880b253220c62
3
  size 17846024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81bdd65868be01652215114e4f52a3bbb31e8a90bb86fdbee66ce1473917cd1f
3
  size 17846024
runs/Oct10_11-41-29_raymondlab-MS-7D41/events.out.tfevents.1760110890.raymondlab-MS-7D41.2229692.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6f4ec0b104dae74d692110acb2fe4f164fb8cc6d7972171b453166269cfb973
3
+ size 8778
runs/Oct10_11-44-11_raymondlab-MS-7D41/events.out.tfevents.1760111051.raymondlab-MS-7D41.2231175.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ec5f06f7c9248823dc677fecb43b0d6e791feafbe795eb7dda4baf031d22fa6
3
+ size 8778
runs/Oct10_11-48-51_raymondlab-MS-7D41/events.out.tfevents.1760111331.raymondlab-MS-7D41.2233867.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de3d85420e009bfcbc88f4a8721e287e45850465977c460675a1599b26f4e372
3
+ size 10106
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4955c1a9d27b67b743b93c03743383c266ab7e166bcdd09964978b0526c040f3
3
  size 6225
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f3bbc87383d8a8bfebf51cb1193e609256a288e3d9e21820a4221175627b9f2
3
  size 6225