hermeschen-ezcon committed on
Commit
7d29f6c
·
verified ·
1 Parent(s): 1bd3e95

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -13,7 +13,7 @@ library_name: transformers
13
  ---
14
 
15
  # EZCon/Qwen2.5-VL-7B-Instruct-4bit-mlx
16
- This model was converted to MLX format from [`unsloth/Qwen2.5-VL-7B-Instruct`]() using mlx-vlm version **0.3.2**.
17
  Refer to the [original model card](https://huggingface.co/unsloth/Qwen2.5-VL-7B-Instruct) for more details on the model.
18
  ## Use with mlx
19
 
 
13
  ---
14
 
15
  # EZCon/Qwen2.5-VL-7B-Instruct-4bit-mlx
16
+ This model was converted to MLX format from [`unsloth/Qwen2.5-VL-7B-Instruct`](https://huggingface.co/unsloth/Qwen2.5-VL-7B-Instruct) using mlx-vlm version **0.3.3**.
17
  Refer to the [original model card](https://huggingface.co/unsloth/Qwen2.5-VL-7B-Instruct) for more details on the model.
18
  ## Use with mlx
19
 
config.json CHANGED
@@ -12,6 +12,7 @@
12
  "decoder_start_token_id": null,
13
  "diversity_penalty": 0.0,
14
  "do_sample": false,
 
15
  "early_stopping": false,
16
  "encoder_no_repeat_ngram_size": 0,
17
  "eos_token_id": 151645,
@@ -36,7 +37,7 @@
36
  },
37
  "length_penalty": 1.0,
38
  "max_length": 20,
39
- "max_position_embeddings": 128000,
40
  "max_window_layers": 28,
41
  "min_length": 0,
42
  "model_type": "qwen2_5_vl",
@@ -56,11 +57,13 @@
56
  "pruned_heads": {},
57
  "quantization": {
58
  "group_size": 64,
59
- "bits": 4
 
60
  },
61
  "quantization_config": {
62
  "group_size": 64,
63
- "bits": 4
 
64
  },
65
  "remove_invalid_values": false,
66
  "repetition_penalty": 1.0,
@@ -143,7 +146,7 @@
143
  "return_dict": true,
144
  "output_hidden_states": false,
145
  "torchscript": false,
146
- "torch_dtype": "bfloat16",
147
  "pruned_heads": {},
148
  "tie_word_embeddings": false,
149
  "chunk_size_feed_forward": 0,
@@ -168,8 +171,8 @@
168
  "problem_type": null,
169
  "tokenizer_class": null,
170
  "prefix": null,
171
- "bos_token_id": null,
172
- "pad_token_id": 151654,
173
  "eos_token_id": 151645,
174
  "sep_token_id": null,
175
  "decoder_start_token_id": null,
@@ -178,8 +181,6 @@
178
  "do_sample": false,
179
  "early_stopping": false,
180
  "num_beams": 1,
181
- "num_beam_groups": 1,
182
- "diversity_penalty": 0.0,
183
  "temperature": 1.0,
184
  "top_k": 50,
185
  "top_p": 1.0,
@@ -198,27 +199,24 @@
198
  "exponential_decay_length_penalty": null,
199
  "suppress_tokens": null,
200
  "begin_suppress_tokens": null,
 
 
201
  "_name_or_path": "",
202
  "model_type": "qwen2_5_vl_text",
203
- "unsloth_fixed": true,
204
  "vision_end_token_id": 151653,
205
  "vision_start_token_id": 151652,
206
  "vision_token_id": 151654,
207
- "tf_legacy_loss": false,
208
- "use_bfloat16": false,
209
  "output_attentions": false
210
  },
211
- "tf_legacy_loss": false,
212
  "tie_encoder_decoder": false,
213
  "tie_word_embeddings": false,
214
  "tokenizer_class": null,
215
  "top_k": 50,
216
  "top_p": 1.0,
217
  "torchscript": false,
218
- "transformers_version": "4.56.0.dev0",
219
  "typical_p": 1.0,
220
  "unsloth_fixed": true,
221
- "use_bfloat16": false,
222
  "use_cache": true,
223
  "use_sliding_window": false,
224
  "video_token_id": 151656,
@@ -226,7 +224,7 @@
226
  "return_dict": true,
227
  "output_hidden_states": false,
228
  "torchscript": false,
229
- "torch_dtype": "bfloat16",
230
  "pruned_heads": {},
231
  "tie_word_embeddings": true,
232
  "chunk_size_feed_forward": 0,
@@ -259,8 +257,6 @@
259
  "do_sample": false,
260
  "early_stopping": false,
261
  "num_beams": 1,
262
- "num_beam_groups": 1,
263
- "diversity_penalty": 0.0,
264
  "temperature": 1.0,
265
  "top_k": 50,
266
  "top_p": 1.0,
@@ -279,12 +275,12 @@
279
  "exponential_decay_length_penalty": null,
280
  "suppress_tokens": null,
281
  "begin_suppress_tokens": null,
 
 
282
  "_name_or_path": "",
283
  "in_chans": 3,
284
  "model_type": "qwen2_5_vl",
285
  "spatial_patch_size": 14,
286
- "tf_legacy_loss": false,
287
- "use_bfloat16": false,
288
  "depth": 32,
289
  "hidden_size": 1280,
290
  "hidden_act": "silu",
 
12
  "decoder_start_token_id": null,
13
  "diversity_penalty": 0.0,
14
  "do_sample": false,
15
+ "dtype": "bfloat16",
16
  "early_stopping": false,
17
  "encoder_no_repeat_ngram_size": 0,
18
  "eos_token_id": 151645,
 
37
  },
38
  "length_penalty": 1.0,
39
  "max_length": 20,
40
+ "max_position_embeddings": 32768,
41
  "max_window_layers": 28,
42
  "min_length": 0,
43
  "model_type": "qwen2_5_vl",
 
57
  "pruned_heads": {},
58
  "quantization": {
59
  "group_size": 64,
60
+ "bits": 4,
61
+ "mode": "affine"
62
  },
63
  "quantization_config": {
64
  "group_size": 64,
65
+ "bits": 4,
66
+ "mode": "affine"
67
  },
68
  "remove_invalid_values": false,
69
  "repetition_penalty": 1.0,
 
146
  "return_dict": true,
147
  "output_hidden_states": false,
148
  "torchscript": false,
149
+ "dtype": "bfloat16",
150
  "pruned_heads": {},
151
  "tie_word_embeddings": false,
152
  "chunk_size_feed_forward": 0,
 
171
  "problem_type": null,
172
  "tokenizer_class": null,
173
  "prefix": null,
174
+ "bos_token_id": 151643,
175
+ "pad_token_id": null,
176
  "eos_token_id": 151645,
177
  "sep_token_id": null,
178
  "decoder_start_token_id": null,
 
181
  "do_sample": false,
182
  "early_stopping": false,
183
  "num_beams": 1,
 
 
184
  "temperature": 1.0,
185
  "top_k": 50,
186
  "top_p": 1.0,
 
199
  "exponential_decay_length_penalty": null,
200
  "suppress_tokens": null,
201
  "begin_suppress_tokens": null,
202
+ "num_beam_groups": 1,
203
+ "diversity_penalty": 0.0,
204
  "_name_or_path": "",
205
  "model_type": "qwen2_5_vl_text",
 
206
  "vision_end_token_id": 151653,
207
  "vision_start_token_id": 151652,
208
  "vision_token_id": 151654,
 
 
209
  "output_attentions": false
210
  },
 
211
  "tie_encoder_decoder": false,
212
  "tie_word_embeddings": false,
213
  "tokenizer_class": null,
214
  "top_k": 50,
215
  "top_p": 1.0,
216
  "torchscript": false,
217
+ "transformers_version": "4.57.0.dev0",
218
  "typical_p": 1.0,
219
  "unsloth_fixed": true,
 
220
  "use_cache": true,
221
  "use_sliding_window": false,
222
  "video_token_id": 151656,
 
224
  "return_dict": true,
225
  "output_hidden_states": false,
226
  "torchscript": false,
227
+ "dtype": "bfloat16",
228
  "pruned_heads": {},
229
  "tie_word_embeddings": true,
230
  "chunk_size_feed_forward": 0,
 
257
  "do_sample": false,
258
  "early_stopping": false,
259
  "num_beams": 1,
 
 
260
  "temperature": 1.0,
261
  "top_k": 50,
262
  "top_p": 1.0,
 
275
  "exponential_decay_length_penalty": null,
276
  "suppress_tokens": null,
277
  "begin_suppress_tokens": null,
278
+ "num_beam_groups": 1,
279
+ "diversity_penalty": 0.0,
280
  "_name_or_path": "",
281
  "in_chans": 3,
282
  "model_type": "qwen2_5_vl",
283
  "spatial_patch_size": 14,
 
 
284
  "depth": 32,
285
  "hidden_size": 1280,
286
  "hidden_act": "silu",
generation_config.json CHANGED
@@ -5,9 +5,9 @@
5
  151645,
6
  151643
7
  ],
8
- "max_length": 128000,
9
  "pad_token_id": 151654,
10
  "repetition_penalty": 1.05,
11
  "temperature": 1e-06,
12
- "transformers_version": "4.51.3"
13
  }
 
5
  151645,
6
  151643
7
  ],
8
+ "max_length": 32768,
9
  "pad_token_id": 151654,
10
  "repetition_penalty": 1.05,
11
  "temperature": 1e-06,
12
+ "transformers_version": "4.56.1"
13
  }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cf0528116e672daa72b6623dbfd2e006438de499a1821e78aefa22f8f29cc11
3
  size 5330941330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccc45d5108d1f396b0572e9adac725c5bbc37aacf383a5b97316846e168e6aec
3
  size 5330941330
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c04dc53c361cb18cf2975990700dee5e92b6414b0930b037c6d56c8107658b3b
3
  size 306561371
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c11d35d4fb4df53bd39c0cc3baebdfd312168ee9a24873cec45aa4847e101255
3
  size 306561371
model.safetensors.index.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "metadata": {
 
3
  "total_size": 16584333312
4
  },
5
  "weight_map": {
 
1
  {
2
  "metadata": {
3
+ "total_parameters": 8292166656,
4
  "total_size": 16584333312
5
  },
6
  "weight_map": {
preprocessor_config.json CHANGED
@@ -7,6 +7,7 @@
7
  "do_center_crop": null,
8
  "do_convert_rgb": true,
9
  "do_normalize": true,
 
10
  "do_rescale": true,
11
  "do_resize": true,
12
  "image_mean": [
@@ -24,6 +25,7 @@
24
  "max_pixels": 12845056,
25
  "merge_size": 2,
26
  "min_pixels": 3136,
 
27
  "patch_size": 14,
28
  "processor_class": "Qwen2_5_VLProcessor",
29
  "resample": 3,
 
7
  "do_center_crop": null,
8
  "do_convert_rgb": true,
9
  "do_normalize": true,
10
+ "do_pad": null,
11
  "do_rescale": true,
12
  "do_resize": true,
13
  "image_mean": [
 
25
  "max_pixels": 12845056,
26
  "merge_size": 2,
27
  "min_pixels": 3136,
28
+ "pad_size": null,
29
  "patch_size": 14,
30
  "processor_class": "Qwen2_5_VLProcessor",
31
  "resample": 3,
tokenizer_config.json CHANGED
@@ -199,7 +199,7 @@
199
  "eos_token": "<|im_end|>",
200
  "errors": "replace",
201
  "extra_special_tokens": {},
202
- "model_max_length": 128000,
203
  "pad_token": "<|vision_pad|>",
204
  "padding_side": "left",
205
  "processor_class": "Qwen2_5_VLProcessor",
 
199
  "eos_token": "<|im_end|>",
200
  "errors": "replace",
201
  "extra_special_tokens": {},
202
+ "model_max_length": 32768,
203
  "pad_token": "<|vision_pad|>",
204
  "padding_side": "left",
205
  "processor_class": "Qwen2_5_VLProcessor",
video_preprocessor_config.json CHANGED
@@ -28,10 +28,12 @@
28
  "min_frames": 4,
29
  "min_pixels": 3136,
30
  "num_frames": null,
 
31
  "patch_size": 14,
32
  "processor_class": "Qwen2_5_VLProcessor",
33
  "resample": 3,
34
  "rescale_factor": 0.00392156862745098,
 
35
  "size": {
36
  "longest_edge": 12845056,
37
  "shortest_edge": 3136
 
28
  "min_frames": 4,
29
  "min_pixels": 3136,
30
  "num_frames": null,
31
+ "pad_size": null,
32
  "patch_size": 14,
33
  "processor_class": "Qwen2_5_VLProcessor",
34
  "resample": 3,
35
  "rescale_factor": 0.00392156862745098,
36
+ "return_metadata": false,
37
  "size": {
38
  "longest_edge": 12845056,
39
  "shortest_edge": 3136