snake7gun committed on
Commit
b6a0a63
·
verified ·
1 Parent(s): cadde21

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -16,20 +16,19 @@
16
  "image_start_token_id": 151339,
17
  "image_token_id": 151343,
18
  "initializer_range": 0.02,
19
- "intermediate_size": 128,
20
  "max_position_embeddings": 65536,
21
  "model_type": "glm4v",
22
- "num_attention_heads": 2,
23
- "num_hidden_layers": 2,
24
- "num_key_value_heads": 1,
25
  "pad_token_id": 151329,
26
  "partial_rotary_factor": 0.5,
27
  "rms_norm_eps": 1e-05,
28
  "rope_scaling": {
29
  "mrope_section": [
30
- 2,
31
- 2,
32
- 4
33
  ],
34
  "rope_type": "default",
35
  "type": "default"
@@ -51,33 +50,32 @@
51
  "hidden_size": 64,
52
  "image_token_id": null,
53
  "initializer_range": 0.02,
54
- "intermediate_size": 128,
55
  "max_position_embeddings": 65536,
56
  "model_type": "glm4v_text",
57
- "num_attention_heads": 2,
58
- "num_hidden_layers": 2,
59
- "num_key_value_heads": 1,
60
  "pad_token_id": 151329,
61
  "partial_rotary_factor": 0.5,
62
  "rms_norm_eps": 1e-05,
63
  "rope_scaling": {
64
  "mrope_section": [
65
- 2,
66
- 2,
67
- 4
68
  ],
69
  "rope_type": "default",
70
  "type": "default"
71
  },
72
  "rope_theta": 10000.0,
73
- "tie_word_embeddings": true,
74
  "torch_dtype": "bfloat16",
75
  "use_cache": true,
76
  "video_token_id": null,
77
  "vocab_size": 151552
78
  },
79
- "torch_dtype": "bfloat16",
80
- "transformers_version": "4.54.0.dev0",
 
81
  "use_cache": true,
82
  "video_end_token_id": 151342,
83
  "video_start_token_id": 151341,
@@ -85,17 +83,17 @@
85
  "vision_config": {
86
  "attention_bias": false,
87
  "attention_dropout": 0.0,
88
- "depth": 2,
89
  "hidden_act": "silu",
90
  "hidden_dropout_prob": 0.0,
91
  "hidden_size": 64,
92
  "image_size": 336,
93
  "in_channels": 3,
94
  "initializer_range": 0.02,
95
- "intermediate_size": 128,
96
  "model_type": "glm4v",
97
- "num_heads": 2,
98
- "out_hidden_size": 64,
99
  "patch_size": 14,
100
  "rms_norm_eps": 1e-05,
101
  "spatial_merge_size": 2,
 
16
  "image_start_token_id": 151339,
17
  "image_token_id": 151343,
18
  "initializer_range": 0.02,
19
+ "intermediate_size": 64,
20
  "max_position_embeddings": 65536,
21
  "model_type": "glm4v",
22
+ "num_attention_heads": 8,
23
+ "num_hidden_layers": 3,
24
+ "num_key_value_heads": 2,
25
  "pad_token_id": 151329,
26
  "partial_rotary_factor": 0.5,
27
  "rms_norm_eps": 1e-05,
28
  "rope_scaling": {
29
  "mrope_section": [
30
+ 1,
31
+ 1
 
32
  ],
33
  "rope_type": "default",
34
  "type": "default"
 
50
  "hidden_size": 64,
51
  "image_token_id": null,
52
  "initializer_range": 0.02,
53
+ "intermediate_size": 64,
54
  "max_position_embeddings": 65536,
55
  "model_type": "glm4v_text",
56
+ "num_attention_heads": 8,
57
+ "num_hidden_layers": 3,
58
+ "num_key_value_heads": 2,
59
  "pad_token_id": 151329,
60
  "partial_rotary_factor": 0.5,
61
  "rms_norm_eps": 1e-05,
62
  "rope_scaling": {
63
  "mrope_section": [
64
+ 1,
65
+ 1
 
66
  ],
67
  "rope_type": "default",
68
  "type": "default"
69
  },
70
  "rope_theta": 10000.0,
 
71
  "torch_dtype": "bfloat16",
72
  "use_cache": true,
73
  "video_token_id": null,
74
  "vocab_size": 151552
75
  },
76
+ "tie_word_embeddings": false,
77
+ "torch_dtype": "float32",
78
+ "transformers_version": "4.54.1",
79
  "use_cache": true,
80
  "video_end_token_id": 151342,
81
  "video_start_token_id": 151341,
 
83
  "vision_config": {
84
  "attention_bias": false,
85
  "attention_dropout": 0.0,
86
+ "depth": 4,
87
  "hidden_act": "silu",
88
  "hidden_dropout_prob": 0.0,
89
  "hidden_size": 64,
90
  "image_size": 336,
91
  "in_channels": 3,
92
  "initializer_range": 0.02,
93
+ "intermediate_size": 64,
94
  "model_type": "glm4v",
95
+ "num_heads": 4,
96
+ "out_hidden_size": 4096,
97
  "patch_size": 14,
98
  "rms_norm_eps": 1e-05,
99
  "spatial_merge_size": 2,
generation_config.json CHANGED
@@ -7,5 +7,5 @@
7
  151348
8
  ],
9
  "pad_token_id": 151329,
10
- "transformers_version": "4.54.0.dev0"
11
  }
 
7
  151348
8
  ],
9
  "pad_token_id": 151329,
10
+ "transformers_version": "4.54.1"
11
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a51b22dc53e1de592646c2a898839abada0c547804444a118dac2508ec322d5c
3
- size 19984480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91d6edb23f856c096ba6962b6c7ea1d8d8336e16ef4dee2bcb8ae08733b66ea9
3
+ size 146137472
preprocessor_config.json CHANGED
@@ -1,27 +1,11 @@
1
  {
2
- "do_convert_rgb": true,
3
- "do_normalize": true,
4
- "do_rescale": true,
5
- "do_resize": true,
6
- "image_mean": [
7
- 0.48145466,
8
- 0.4578275,
9
- 0.40821073
10
- ],
11
- "image_processor_type": "Glm4vImageProcessor",
12
- "image_std": [
13
- 0.26862954,
14
- 0.26130258,
15
- 0.27577711
16
- ],
17
- "merge_size": 2,
18
- "patch_size": 14,
19
- "processor_class": "Glm4vProcessor",
20
- "resample": 3,
21
- "rescale_factor": 0.00392156862745098,
22
- "size": {
23
- "longest_edge": 11760000,
24
- "shortest_edge": 12544
25
- },
26
- "temporal_patch_size": 2
27
- }
 
1
  {
2
+ "size": {"shortest_edge": 12544, "longest_edge": 9633792},
3
+ "do_rescale": true,
4
+ "patch_size": 14,
5
+ "temporal_patch_size": 2,
6
+ "merge_size": 2,
7
+ "image_mean": [0.48145466, 0.4578275, 0.40821073],
8
+ "image_std": [0.26862954, 0.26130258, 0.27577711],
9
+ "image_processor_type": "Glm4vImageProcessor",
10
+ "processor_class": "Glm4vProcessor"
11
+ }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcc742fc44db1f0870d7320b495e6240cc40e202565fc96786220fa0d9ddb41c
3
- size 19968183
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76ebeac0d8bd7879ead7b43c16b44981f277e47225de2bd7de9ae1a6cc664a8c
3
+ size 19966496
tokenizer_config.json CHANGED
@@ -112,7 +112,7 @@
112
  "single_word": false,
113
  "special": true
114
  },
115
- "151343": {
116
  "content": "<|image|>",
117
  "lstrip": false,
118
  "normalized": false,
@@ -128,7 +128,7 @@
128
  "single_word": false,
129
  "special": true
130
  },
131
- "151345": {
132
  "content": "<think>",
133
  "lstrip": false,
134
  "normalized": false,
@@ -136,7 +136,7 @@
136
  "single_word": false,
137
  "special": false
138
  },
139
- "151346": {
140
  "content": "</think>",
141
  "lstrip": false,
142
  "normalized": false,
@@ -144,7 +144,7 @@
144
  "single_word": false,
145
  "special": false
146
  },
147
- "151347": {
148
  "content": "<answer>",
149
  "lstrip": false,
150
  "normalized": false,
@@ -152,7 +152,7 @@
152
  "single_word": false,
153
  "special": false
154
  },
155
- "151348": {
156
  "content": "</answer>",
157
  "lstrip": false,
158
  "normalized": false,
@@ -206,15 +206,13 @@
206
  "clean_up_tokenization_spaces": false,
207
  "do_lower_case": false,
208
  "eos_token": "<|endoftext|>",
209
- "extra_special_tokens": {},
210
  "model_input_names": [
211
  "input_ids",
212
  "attention_mask"
213
  ],
214
  "model_max_length": 65536,
215
- "pad_token": "<|endoftext|>",
216
  "padding_side": "left",
217
- "processor_class": "Glm4vProcessor",
218
  "remove_space": false,
219
- "tokenizer_class": "PreTrainedTokenizerFast"
220
  }
 
112
  "single_word": false,
113
  "special": true
114
  },
115
+ "151343": {
116
  "content": "<|image|>",
117
  "lstrip": false,
118
  "normalized": false,
 
128
  "single_word": false,
129
  "special": true
130
  },
131
+ "151345": {
132
  "content": "<think>",
133
  "lstrip": false,
134
  "normalized": false,
 
136
  "single_word": false,
137
  "special": false
138
  },
139
+ "151346": {
140
  "content": "</think>",
141
  "lstrip": false,
142
  "normalized": false,
 
144
  "single_word": false,
145
  "special": false
146
  },
147
+ "151347": {
148
  "content": "<answer>",
149
  "lstrip": false,
150
  "normalized": false,
 
152
  "single_word": false,
153
  "special": false
154
  },
155
+ "151348": {
156
  "content": "</answer>",
157
  "lstrip": false,
158
  "normalized": false,
 
206
  "clean_up_tokenization_spaces": false,
207
  "do_lower_case": false,
208
  "eos_token": "<|endoftext|>",
209
+ "pad_token": "<|endoftext|>",
210
  "model_input_names": [
211
  "input_ids",
212
  "attention_mask"
213
  ],
214
  "model_max_length": 65536,
 
215
  "padding_side": "left",
 
216
  "remove_space": false,
217
+ "tokenizer_class": "PreTrainedTokenizer"
218
  }
video_preprocessor_config.json CHANGED
@@ -1,42 +1,11 @@
1
  {
2
- "crop_size": null,
3
- "data_format": "channels_first",
4
- "default_to_square": true,
5
- "device": null,
6
- "do_center_crop": null,
7
- "do_convert_rgb": true,
8
- "do_normalize": true,
9
- "do_pad": null,
10
- "do_rescale": true,
11
- "do_resize": true,
12
- "do_sample_frames": true,
13
- "fps": 2,
14
- "image_mean": [
15
- 0.48145466,
16
- 0.4578275,
17
- 0.40821073
18
- ],
19
- "image_std": [
20
- 0.26862954,
21
- 0.26130258,
22
- 0.27577711
23
- ],
24
- "input_data_format": null,
25
- "max_image_size": {
26
- "longest_edge": 47040000
27
- },
28
- "merge_size": 2,
29
- "num_frames": 16,
30
- "patch_size": 14,
31
- "processor_class": "Glm4vProcessor",
32
- "resample": 3,
33
- "rescale_factor": 0.00392156862745098,
34
- "size": {
35
- "longest_edge": 47040000,
36
- "shortest_edge": 12544
37
- },
38
- "size_divisor": null,
39
- "temporal_patch_size": 2,
40
- "video_metadata": null,
41
- "video_processor_type": "Glm4vVideoProcessor"
42
- }
 
1
  {
2
+ "size": {"shortest_edge": 12544, "longest_edge": 47040000},
3
+ "do_rescale": true,
4
+ "patch_size": 14,
5
+ "temporal_patch_size": 2,
6
+ "merge_size": 2,
7
+ "image_mean": [0.48145466, 0.4578275, 0.40821073],
8
+ "image_std": [0.26862954, 0.26130258, 0.27577711],
9
+ "video_processor_type": "Glm4vVideoProcessor",
10
+ "processor_class": "Glm4vProcessor"
11
+ }