A2Amir commited on
Commit
5c51a10
·
verified ·
1 Parent(s): 4166960

Training in progress, step 179

Browse files
adapter_config.json CHANGED
@@ -1,175 +1,172 @@
1
  {
2
  "alpha_pattern": {},
3
- "auto_mapping": null,
 
 
 
4
  "base_model_name_or_path": "llava-hf/llava-v1.6-mistral-7b-hf",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
- "inference_mode": false,
8
  "init_lora_weights": "gaussian",
9
  "layer_replication": null,
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
- "lora_alpha": 64,
14
  "lora_dropout": 0.1,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
- "r": 128,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "vision_tower.vision_model.encoder.layers.6.self_attn.out_proj",
24
- "vision_tower.vision_model.encoder.layers.12.self_attn.k_proj",
25
- "vision_tower.vision_model.encoder.layers.3.self_attn.k_proj",
26
- "vision_tower.vision_model.encoder.layers.2.self_attn.v_proj",
27
- "vision_tower.vision_model.encoder.layers.5.self_attn.q_proj",
28
- "vision_tower.vision_model.encoder.layers.16.mlp.fc1",
29
- "vision_tower.vision_model.encoder.layers.18.mlp.fc2",
30
- "vision_tower.vision_model.encoder.layers.3.mlp.fc1",
 
 
 
31
  "vision_tower.vision_model.encoder.layers.8.mlp.fc2",
32
- "vision_tower.vision_model.encoder.layers.17.mlp.fc2",
33
- "vision_tower.vision_model.encoder.layers.9.self_attn.q_proj",
34
- "vision_tower.vision_model.encoder.layers.0.self_attn.k_proj",
35
- "vision_tower.vision_model.encoder.layers.5.self_attn.k_proj",
36
- "vision_tower.vision_model.encoder.layers.15.mlp.fc2",
37
- "vision_tower.vision_model.encoder.layers.7.self_attn.q_proj",
38
- "vision_tower.vision_model.encoder.layers.22.self_attn.out_proj",
39
- "vision_tower.vision_model.encoder.layers.20.self_attn.k_proj",
40
- "vision_tower.vision_model.encoder.layers.8.mlp.fc1",
41
- "vision_tower.vision_model.encoder.layers.3.mlp.fc2",
42
- "vision_tower.vision_model.encoder.layers.13.self_attn.q_proj",
43
  "vision_tower.vision_model.encoder.layers.19.mlp.fc2",
44
- "vision_tower.vision_model.encoder.layers.19.self_attn.k_proj",
 
 
 
 
 
 
 
 
 
 
 
 
 
45
  "vision_tower.vision_model.encoder.layers.15.self_attn.out_proj",
46
- "vision_tower.vision_model.encoder.layers.22.self_attn.v_proj",
47
- "vision_tower.vision_model.encoder.layers.21.mlp.fc1",
48
- "vision_tower.vision_model.encoder.layers.14.self_attn.q_proj",
49
  "vision_tower.vision_model.encoder.layers.8.self_attn.v_proj",
50
- "vision_tower.vision_model.encoder.layers.17.self_attn.out_proj",
51
- "vision_tower.vision_model.encoder.layers.23.self_attn.v_proj",
 
 
52
  "vision_tower.vision_model.encoder.layers.16.self_attn.v_proj",
53
- "vision_tower.vision_model.encoder.layers.9.mlp.fc2",
54
- "vision_tower.vision_model.encoder.layers.5.mlp.fc1",
55
- "vision_tower.vision_model.encoder.layers.0.mlp.fc2",
56
- "vision_tower.vision_model.encoder.layers.11.mlp.fc1",
57
- "vision_tower.vision_model.encoder.layers.0.self_attn.v_proj",
58
- "vision_tower.vision_model.encoder.layers.4.self_attn.v_proj",
59
- "vision_tower.vision_model.encoder.layers.21.self_attn.k_proj",
60
- "vision_tower.vision_model.encoder.layers.20.mlp.fc2",
61
- "vision_tower.vision_model.encoder.layers.13.self_attn.v_proj",
62
- "vision_tower.vision_model.encoder.layers.15.self_attn.q_proj",
63
- "vision_tower.vision_model.encoder.layers.14.self_attn.v_proj",
64
- "vision_tower.vision_model.encoder.layers.19.self_attn.q_proj",
65
- "vision_tower.vision_model.encoder.layers.12.self_attn.v_proj",
66
- "vision_tower.vision_model.encoder.layers.18.self_attn.q_proj",
67
  "vision_tower.vision_model.encoder.layers.4.mlp.fc1",
68
- "vision_tower.vision_model.encoder.layers.6.mlp.fc1",
69
- "multi_modal_projector.linear_1.lora_A.default",
70
- "vision_tower.vision_model.encoder.layers.7.mlp.fc1",
71
- "vision_tower.vision_model.encoder.layers.7.self_attn.v_proj",
72
- "vision_tower.vision_model.encoder.layers.23.mlp.fc1",
73
- "vision_tower.vision_model.encoder.layers.4.mlp.fc2",
74
- "vision_tower.vision_model.encoder.layers.21.self_attn.q_proj",
75
  "vision_tower.vision_model.encoder.layers.2.self_attn.out_proj",
76
- "vision_tower.vision_model.encoder.layers.19.self_attn.v_proj",
77
- "vision_tower.vision_model.encoder.layers.8.self_attn.q_proj",
78
- "vision_tower.vision_model.encoder.layers.12.self_attn.out_proj",
79
- "vision_tower.vision_model.encoder.layers.10.self_attn.v_proj",
80
- "vision_tower.vision_model.encoder.layers.6.mlp.fc2",
 
 
 
 
 
81
  "vision_tower.vision_model.encoder.layers.14.self_attn.out_proj",
82
- "vision_tower.vision_model.encoder.layers.20.self_attn.v_proj",
83
- "vision_tower.vision_model.encoder.layers.1.mlp.fc2",
 
 
 
 
 
 
 
 
 
 
 
84
  "vision_tower.vision_model.encoder.layers.13.mlp.fc1",
85
- "vision_tower.vision_model.encoder.layers.17.self_attn.k_proj",
86
- "vision_tower.vision_model.encoder.layers.3.self_attn.q_proj",
87
- "vision_tower.vision_model.encoder.layers.13.mlp.fc2",
88
- "vision_tower.vision_model.encoder.layers.9.self_attn.v_proj",
 
 
 
 
89
  "vision_tower.vision_model.encoder.layers.10.self_attn.k_proj",
90
- "vision_tower.vision_model.encoder.layers.11.self_attn.k_proj",
91
  "vision_tower.vision_model.encoder.layers.19.mlp.fc1",
92
- "vision_tower.vision_model.encoder.layers.21.self_attn.v_proj",
93
- "vision_tower.vision_model.encoder.layers.21.mlp.fc2",
94
- "multi_modal_projector.linear_1.base_layer",
95
- "vision_tower.vision_model.encoder.layers.1.self_attn.v_proj",
96
- "vision_tower.vision_model.encoder.layers.1.self_attn.out_proj",
97
- "vision_tower.vision_model.encoder.layers.9.self_attn.out_proj",
98
- "vision_tower.vision_model.encoder.layers.14.self_attn.k_proj",
99
- "vision_tower.vision_model.encoder.layers.18.self_attn.out_proj",
100
- "vision_tower.vision_model.encoder.layers.19.self_attn.out_proj",
101
  "vision_tower.vision_model.encoder.layers.10.self_attn.out_proj",
102
- "vision_tower.vision_model.encoder.layers.1.self_attn.q_proj",
103
- "multi_modal_projector.linear_2.lora_B.default",
104
- "vision_tower.vision_model.encoder.layers.23.mlp.fc2",
105
- "vision_tower.vision_model.encoder.layers.20.mlp.fc1",
106
- "vision_tower.vision_model.encoder.layers.23.self_attn.k_proj",
107
- "vision_tower.vision_model.encoder.layers.2.self_attn.k_proj",
 
 
 
 
 
 
 
108
  "vision_tower.vision_model.encoder.layers.5.self_attn.v_proj",
 
 
 
109
  "vision_tower.vision_model.encoder.layers.17.self_attn.v_proj",
110
- "vision_tower.vision_model.encoder.layers.12.mlp.fc2",
 
 
 
111
  "vision_tower.vision_model.encoder.layers.7.mlp.fc2",
112
- "vision_tower.vision_model.encoder.layers.3.self_attn.v_proj",
113
- "vision_tower.vision_model.encoder.layers.16.mlp.fc2",
114
- "vision_tower.vision_model.encoder.layers.23.self_attn.out_proj",
115
- "multi_modal_projector.linear_1.lora_B.default",
116
- "vision_tower.vision_model.encoder.layers.21.self_attn.out_proj",
117
- "vision_tower.vision_model.encoder.layers.10.mlp.fc2",
118
- "vision_tower.vision_model.encoder.layers.2.mlp.fc1",
119
  "vision_tower.vision_model.encoder.layers.0.self_attn.q_proj",
120
- "vision_tower.vision_model.encoder.layers.9.self_attn.k_proj",
121
- "vision_tower.vision_model.encoder.layers.15.self_attn.k_proj",
122
  "vision_tower.vision_model.encoder.layers.23.self_attn.q_proj",
123
- "vision_tower.vision_model.encoder.layers.7.self_attn.out_proj",
124
- "vision_tower.vision_model.encoder.layers.14.mlp.fc2",
125
- "vision_tower.vision_model.encoder.layers.11.self_attn.q_proj",
126
- "vision_tower.vision_model.encoder.layers.6.self_attn.q_proj",
127
- "multi_modal_projector.linear_2.lora_A.default",
128
  "vision_tower.vision_model.encoder.layers.16.self_attn.q_proj",
129
- "vision_tower.vision_model.encoder.layers.11.self_attn.out_proj",
130
- "vision_tower.vision_model.encoder.layers.0.self_attn.out_proj",
131
- "vision_tower.vision_model.encoder.layers.15.mlp.fc1",
132
- "vision_tower.vision_model.encoder.layers.18.self_attn.k_proj",
133
- "vision_tower.vision_model.encoder.layers.22.mlp.fc1",
134
- "vision_tower.vision_model.encoder.layers.9.mlp.fc1",
135
- "vision_tower.vision_model.encoder.layers.10.self_attn.q_proj",
136
- "vision_tower.vision_model.encoder.layers.18.self_attn.v_proj",
137
- "vision_tower.vision_model.encoder.layers.18.mlp.fc1",
138
- "vision_tower.vision_model.encoder.layers.4.self_attn.out_proj",
139
  "vision_tower.vision_model.encoder.layers.13.self_attn.k_proj",
140
- "vision_tower.vision_model.encoder.layers.4.self_attn.q_proj",
141
- "vision_tower.vision_model.encoder.layers.7.self_attn.k_proj",
142
- "vision_tower.vision_model.encoder.layers.17.mlp.fc1",
143
- "vision_tower.vision_model.encoder.layers.8.self_attn.k_proj",
144
- "vision_tower.vision_model.encoder.layers.6.self_attn.v_proj",
145
- "vision_tower.vision_model.encoder.layers.11.mlp.fc2",
146
- "vision_tower.vision_model.encoder.layers.12.mlp.fc1",
147
- "vision_tower.vision_model.encoder.layers.10.mlp.fc1",
148
- "vision_tower.vision_model.encoder.layers.6.self_attn.k_proj",
149
- "vision_tower.vision_model.encoder.layers.16.self_attn.k_proj",
150
- "vision_tower.vision_model.encoder.layers.2.mlp.fc2",
151
- "vision_tower.vision_model.encoder.layers.1.mlp.fc1",
152
- "vision_tower.vision_model.encoder.layers.8.self_attn.out_proj",
153
- "vision_tower.vision_model.encoder.layers.16.self_attn.out_proj",
154
- "vision_tower.vision_model.encoder.layers.22.mlp.fc2",
155
- "vision_tower.vision_model.encoder.layers.1.self_attn.k_proj",
156
- "vision_tower.vision_model.encoder.layers.13.self_attn.out_proj",
157
- "vision_tower.vision_model.encoder.layers.22.self_attn.q_proj",
158
- "vision_tower.vision_model.encoder.layers.11.self_attn.v_proj",
159
- "vision_tower.vision_model.encoder.layers.5.self_attn.out_proj",
160
- "vision_tower.vision_model.encoder.layers.3.self_attn.out_proj",
161
  "vision_tower.vision_model.encoder.layers.4.self_attn.k_proj",
 
 
 
 
 
 
162
  "vision_tower.vision_model.encoder.layers.15.self_attn.v_proj",
163
- "vision_tower.vision_model.encoder.layers.14.mlp.fc1",
164
- "vision_tower.vision_model.encoder.layers.2.self_attn.q_proj",
165
- "vision_tower.vision_model.encoder.layers.17.self_attn.q_proj",
166
- "vision_tower.vision_model.encoder.layers.12.self_attn.q_proj",
167
- "vision_tower.vision_model.encoder.layers.22.self_attn.k_proj",
168
- "vision_tower.vision_model.encoder.layers.5.mlp.fc2",
169
- "vision_tower.vision_model.encoder.layers.0.mlp.fc1",
170
- "multi_modal_projector.linear_2.base_layer",
171
- "vision_tower.vision_model.encoder.layers.20.self_attn.q_proj",
172
- "vision_tower.vision_model.encoder.layers.20.self_attn.out_proj"
173
  ],
174
  "task_type": null,
175
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "LlavaNextForConditionalGeneration",
5
+ "parent_library": "transformers.models.llava_next.modeling_llava_next"
6
+ },
7
  "base_model_name_or_path": "llava-hf/llava-v1.6-mistral-7b-hf",
8
  "bias": "none",
9
  "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
  "init_lora_weights": "gaussian",
12
  "layer_replication": null,
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
+ "lora_alpha": 32,
17
  "lora_dropout": 0.1,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
21
  "peft_type": "LORA",
22
+ "r": 64,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "vision_tower.vision_model.encoder.layers.18.self_attn.v_proj",
27
+ "vision_tower.vision_model.encoder.layers.12.self_attn.out_proj",
28
+ "vision_tower.vision_model.encoder.layers.18.mlp.fc1",
29
+ "vision_tower.vision_model.encoder.layers.21.mlp.fc1",
30
+ "vision_tower.vision_model.encoder.layers.8.self_attn.out_proj",
31
+ "vision_tower.vision_model.encoder.layers.13.self_attn.out_proj",
32
+ "vision_tower.vision_model.encoder.layers.10.self_attn.q_proj",
33
+ "vision_tower.vision_model.encoder.layers.11.mlp.fc1",
34
+ "vision_tower.vision_model.encoder.layers.6.mlp.fc2",
35
+ "vision_tower.vision_model.encoder.layers.22.mlp.fc2",
36
+ "vision_tower.vision_model.encoder.layers.3.self_attn.out_proj",
37
  "vision_tower.vision_model.encoder.layers.8.mlp.fc2",
38
+ "vision_tower.vision_model.encoder.layers.7.self_attn.k_proj",
39
+ "vision_tower.vision_model.encoder.layers.12.self_attn.v_proj",
40
+ "vision_tower.vision_model.encoder.layers.14.self_attn.k_proj",
41
+ "vision_tower.vision_model.encoder.layers.22.mlp.fc1",
42
+ "vision_tower.vision_model.encoder.layers.12.self_attn.q_proj",
43
+ "vision_tower.vision_model.encoder.layers.6.self_attn.q_proj",
44
+ "vision_tower.vision_model.encoder.layers.21.mlp.fc2",
45
+ "vision_tower.vision_model.encoder.layers.5.self_attn.out_proj",
46
+ "vision_tower.vision_model.encoder.layers.5.self_attn.q_proj",
47
+ "vision_tower.vision_model.encoder.layers.18.self_attn.out_proj",
48
+ "vision_tower.vision_model.encoder.layers.12.mlp.fc2",
49
  "vision_tower.vision_model.encoder.layers.19.mlp.fc2",
50
+ "vision_tower.vision_model.encoder.layers.16.self_attn.k_proj",
51
+ "vision_tower.vision_model.encoder.layers.19.self_attn.q_proj",
52
+ "vision_tower.vision_model.encoder.layers.15.mlp.fc1",
53
+ "vision_tower.vision_model.encoder.layers.20.self_attn.v_proj",
54
+ "vision_tower.vision_model.encoder.layers.15.self_attn.q_proj",
55
+ "vision_tower.vision_model.encoder.layers.23.self_attn.v_proj",
56
+ "vision_tower.vision_model.encoder.layers.4.self_attn.out_proj",
57
+ "vision_tower.vision_model.encoder.layers.3.self_attn.k_proj",
58
+ "vision_tower.vision_model.encoder.layers.3.self_attn.q_proj",
59
+ "vision_tower.vision_model.encoder.layers.2.mlp.fc1",
60
+ "vision_tower.vision_model.encoder.layers.3.mlp.fc2",
61
+ "vision_tower.vision_model.encoder.layers.10.mlp.fc1",
62
+ "vision_tower.vision_model.encoder.layers.0.mlp.fc2",
63
+ "vision_tower.vision_model.encoder.layers.11.self_attn.k_proj",
64
  "vision_tower.vision_model.encoder.layers.15.self_attn.out_proj",
65
+ "vision_tower.vision_model.encoder.layers.7.mlp.fc1",
66
+ "vision_tower.vision_model.encoder.layers.16.mlp.fc2",
67
+ "vision_tower.vision_model.encoder.layers.11.self_attn.out_proj",
68
  "vision_tower.vision_model.encoder.layers.8.self_attn.v_proj",
69
+ "vision_tower.vision_model.encoder.layers.17.self_attn.k_proj",
70
+ "vision_tower.vision_model.encoder.layers.20.mlp.fc1",
71
+ "vision_tower.vision_model.encoder.layers.15.self_attn.k_proj",
72
+ "vision_tower.vision_model.encoder.layers.8.self_attn.q_proj",
73
  "vision_tower.vision_model.encoder.layers.16.self_attn.v_proj",
74
+ "vision_tower.vision_model.encoder.layers.0.mlp.fc1",
75
+ "vision_tower.vision_model.encoder.layers.1.mlp.fc2",
76
+ "vision_tower.vision_model.encoder.layers.9.self_attn.q_proj",
77
+ "vision_tower.vision_model.encoder.layers.14.mlp.fc1",
78
+ "vision_tower.vision_model.encoder.layers.23.mlp.fc2",
 
 
 
 
 
 
 
 
 
79
  "vision_tower.vision_model.encoder.layers.4.mlp.fc1",
80
+ "vision_tower.vision_model.encoder.layers.9.self_attn.v_proj",
81
+ "vision_tower.vision_model.encoder.layers.7.self_attn.q_proj",
82
+ "vision_tower.vision_model.encoder.layers.22.self_attn.v_proj",
83
+ "vision_tower.vision_model.encoder.layers.16.mlp.fc1",
84
+ "vision_tower.vision_model.encoder.layers.10.mlp.fc2",
85
+ "vision_tower.vision_model.encoder.layers.17.self_attn.out_proj",
 
86
  "vision_tower.vision_model.encoder.layers.2.self_attn.out_proj",
87
+ "vision_tower.vision_model.encoder.layers.8.self_attn.k_proj",
88
+ "vision_tower.vision_model.encoder.layers.4.self_attn.q_proj",
89
+ "vision_tower.vision_model.encoder.layers.23.self_attn.out_proj",
90
+ "vision_tower.vision_model.encoder.layers.17.mlp.fc1",
91
+ "vision_tower.vision_model.encoder.layers.18.mlp.fc2",
92
+ "vision_tower.vision_model.encoder.layers.1.mlp.fc1",
93
+ "vision_tower.vision_model.encoder.layers.2.mlp.fc2",
94
+ "vision_tower.vision_model.encoder.layers.4.mlp.fc2",
95
+ "vision_tower.vision_model.encoder.layers.6.self_attn.k_proj",
96
+ "vision_tower.vision_model.encoder.layers.8.mlp.fc1",
97
  "vision_tower.vision_model.encoder.layers.14.self_attn.out_proj",
98
+ "vision_tower.vision_model.encoder.layers.19.self_attn.k_proj",
99
+ "vision_tower.vision_model.encoder.layers.17.self_attn.q_proj",
100
+ "vision_tower.vision_model.encoder.layers.21.self_attn.k_proj",
101
+ "vision_tower.vision_model.encoder.layers.21.self_attn.out_proj",
102
+ "vision_tower.vision_model.encoder.layers.19.self_attn.v_proj",
103
+ "vision_tower.vision_model.encoder.layers.17.mlp.fc2",
104
+ "vision_tower.vision_model.encoder.layers.4.self_attn.v_proj",
105
+ "vision_tower.vision_model.encoder.layers.1.self_attn.q_proj",
106
+ "vision_tower.vision_model.encoder.layers.0.self_attn.k_proj",
107
+ "vision_tower.vision_model.encoder.layers.23.self_attn.k_proj",
108
+ "vision_tower.vision_model.encoder.layers.21.self_attn.v_proj",
109
+ "vision_tower.vision_model.encoder.layers.6.self_attn.v_proj",
110
+ "vision_tower.vision_model.encoder.layers.13.self_attn.v_proj",
111
  "vision_tower.vision_model.encoder.layers.13.mlp.fc1",
112
+ "vision_tower.vision_model.encoder.layers.3.self_attn.v_proj",
113
+ "vision_tower.vision_model.encoder.layers.0.self_attn.out_proj",
114
+ "vision_tower.vision_model.encoder.layers.6.self_attn.out_proj",
115
+ "vision_tower.vision_model.encoder.layers.5.mlp.fc2",
116
+ "vision_tower.vision_model.encoder.layers.1.self_attn.out_proj",
117
+ "vision_tower.vision_model.encoder.layers.21.self_attn.q_proj",
118
+ "vision_tower.vision_model.encoder.layers.22.self_attn.k_proj",
119
+ "vision_tower.vision_model.encoder.layers.14.mlp.fc2",
120
  "vision_tower.vision_model.encoder.layers.10.self_attn.k_proj",
121
+ "vision_tower.vision_model.encoder.layers.5.mlp.fc1",
122
  "vision_tower.vision_model.encoder.layers.19.mlp.fc1",
 
 
 
 
 
 
 
 
 
123
  "vision_tower.vision_model.encoder.layers.10.self_attn.out_proj",
124
+ "vision_tower.vision_model.encoder.layers.12.self_attn.k_proj",
125
+ "vision_tower.vision_model.encoder.layers.16.self_attn.out_proj",
126
+ "vision_tower.vision_model.encoder.layers.9.mlp.fc2",
127
+ "vision_tower.vision_model.encoder.layers.19.self_attn.out_proj",
128
+ "vision_tower.vision_model.encoder.layers.11.self_attn.q_proj",
129
+ "vision_tower.vision_model.encoder.layers.11.mlp.fc2",
130
+ "vision_tower.vision_model.encoder.layers.5.self_attn.k_proj",
131
+ "vision_tower.vision_model.encoder.layers.15.mlp.fc2",
132
+ "vision_tower.vision_model.encoder.layers.10.self_attn.v_proj",
133
+ "vision_tower.vision_model.encoder.layers.18.self_attn.q_proj",
134
+ "vision_tower.vision_model.encoder.layers.1.self_attn.v_proj",
135
+ "vision_tower.vision_model.encoder.layers.11.self_attn.v_proj",
136
+ "vision_tower.vision_model.encoder.layers.22.self_attn.q_proj",
137
  "vision_tower.vision_model.encoder.layers.5.self_attn.v_proj",
138
+ "vision_tower.vision_model.encoder.layers.9.self_attn.k_proj",
139
+ "vision_tower.vision_model.encoder.layers.9.self_attn.out_proj",
140
+ "vision_tower.vision_model.encoder.layers.12.mlp.fc1",
141
  "vision_tower.vision_model.encoder.layers.17.self_attn.v_proj",
142
+ "vision_tower.vision_model.encoder.layers.14.self_attn.q_proj",
143
+ "vision_tower.vision_model.encoder.layers.20.self_attn.q_proj",
144
+ "vision_tower.vision_model.encoder.layers.0.self_attn.v_proj",
145
+ "vision_tower.vision_model.encoder.layers.22.self_attn.out_proj",
146
  "vision_tower.vision_model.encoder.layers.7.mlp.fc2",
147
+ "vision_tower.vision_model.encoder.layers.2.self_attn.q_proj",
 
 
 
 
 
 
148
  "vision_tower.vision_model.encoder.layers.0.self_attn.q_proj",
149
+ "vision_tower.vision_model.encoder.layers.3.mlp.fc1",
150
+ "vision_tower.vision_model.encoder.layers.18.self_attn.k_proj",
151
  "vision_tower.vision_model.encoder.layers.23.self_attn.q_proj",
152
+ "vision_tower.vision_model.encoder.layers.23.mlp.fc1",
 
 
 
 
153
  "vision_tower.vision_model.encoder.layers.16.self_attn.q_proj",
154
+ "vision_tower.vision_model.encoder.layers.2.self_attn.k_proj",
155
+ "vision_tower.vision_model.encoder.layers.13.mlp.fc2",
 
 
 
 
 
 
 
 
156
  "vision_tower.vision_model.encoder.layers.13.self_attn.k_proj",
157
+ "vision_tower.vision_model.encoder.layers.14.self_attn.v_proj",
158
+ "vision_tower.vision_model.encoder.layers.2.self_attn.v_proj",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
159
  "vision_tower.vision_model.encoder.layers.4.self_attn.k_proj",
160
+ "vision_tower.vision_model.encoder.layers.20.self_attn.k_proj",
161
+ "vision_tower.vision_model.encoder.layers.20.mlp.fc2",
162
+ "vision_tower.vision_model.encoder.layers.6.mlp.fc1",
163
+ "vision_tower.vision_model.encoder.layers.7.self_attn.out_proj",
164
+ "vision_tower.vision_model.encoder.layers.20.self_attn.out_proj",
165
+ "vision_tower.vision_model.encoder.layers.13.self_attn.q_proj",
166
  "vision_tower.vision_model.encoder.layers.15.self_attn.v_proj",
167
+ "vision_tower.vision_model.encoder.layers.9.mlp.fc1",
168
+ "vision_tower.vision_model.encoder.layers.1.self_attn.k_proj",
169
+ "vision_tower.vision_model.encoder.layers.7.self_attn.v_proj"
 
 
 
 
 
 
 
170
  ],
171
  "task_type": null,
172
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f59ae13a37f36880d80f4c06f49304f0499d913fbd2ec59bbffbd6cfabd6a00
3
- size 1589496912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71d9f909c588fcb4cbd8af332ec53312c6241f9617da477d3d16fade3fa0feff
3
+ size 1462354992
tokenizer.json CHANGED
@@ -1,21 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 1137,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 1137
12
- },
13
- "direction": "Right",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 32001,
16
- "pad_type_id": 0,
17
- "pad_token": "<pad>"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d52bfa99adfc8e14db8dae4b8f84c3ce5b4f50170d945cf980d78cbfbbcb36fe
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6c0ba574922dd4f46b05820c0bac27fb7a773f344a5e09fd088147e1ba493f5
3
  size 5560