Commit · e9d93a4
1 Parent(s): a9bc1da
Switch model weights to safetensors format
Browse files
- config.json +9 -4
- generation_config.json +4 -0
- pytorch_model-00001-of-00004.bin → model-00001-of-00003.safetensors +2 -2
- pytorch_model-00002-of-00004.bin → model-00002-of-00003.safetensors +2 -2
- pytorch_model-00003-of-00004.bin → model-00003-of-00003.safetensors +2 -2
- pytorch_model.bin.index.json → model.safetensors.index.json +0 -0
- pytorch_model-00004-of-00004.bin +0 -3
config.json
CHANGED
@@ -15,6 +15,8 @@
|
|
15 |
"ignore_index": -100,
|
16 |
"img_start_id": 100271,
|
17 |
"language_config": {
|
|
|
|
|
18 |
"add_cross_attention": false,
|
19 |
"architectures": [
|
20 |
"LlamaForCausalLM"
|
@@ -94,31 +96,34 @@
|
|
94 |
"top_p": 1.0,
|
95 |
"torch_dtype": "bfloat16",
|
96 |
"torchscript": false,
|
97 |
-
"transformers_version": "4.
|
98 |
"typical_p": 1.0,
|
99 |
"use_bfloat16": false,
|
100 |
"use_cache": true,
|
101 |
"vocab_size": 110592
|
102 |
},
|
|
|
103 |
"max_num_grids": 9,
|
104 |
"model_type": "hyperclovax_vlm",
|
105 |
-
"max_image_cnt": 12,
|
106 |
"num_queries_vis_abstractor": 81,
|
107 |
"proj_pos_emb": true,
|
108 |
"proj_prenorm": false,
|
109 |
"q_former_model_name_or_path": null,
|
110 |
"torch_dtype": "float32",
|
111 |
-
"transformers_version": "4.
|
112 |
"unpad": true,
|
113 |
"use_1x1_grid": true,
|
114 |
"use_nth_layer": -2,
|
115 |
"vision_config": {
|
|
|
|
|
116 |
"add_cross_attention": false,
|
117 |
"anyres": true,
|
118 |
"architectures": [
|
119 |
"SiglipVisionModel"
|
120 |
],
|
121 |
"attention_dropout": 0.0,
|
|
|
122 |
"bad_words_ids": null,
|
123 |
"begin_suppress_tokens": null,
|
124 |
"bos_token_id": null,
|
@@ -186,7 +191,7 @@
|
|
186 |
"top_p": 1.0,
|
187 |
"torch_dtype": "bfloat16",
|
188 |
"torchscript": false,
|
189 |
-
"transformers_version": "4.
|
190 |
"typical_p": 1.0,
|
191 |
"use_bfloat16": true
|
192 |
}
|
|
|
15 |
"ignore_index": -100,
|
16 |
"img_start_id": 100271,
|
17 |
"language_config": {
|
18 |
+
"_attn_implementation_autoset": true,
|
19 |
+
"_name_or_path": "",
|
20 |
"add_cross_attention": false,
|
21 |
"architectures": [
|
22 |
"LlamaForCausalLM"
|
|
|
96 |
"top_p": 1.0,
|
97 |
"torch_dtype": "bfloat16",
|
98 |
"torchscript": false,
|
99 |
+
"transformers_version": "4.48.2",
|
100 |
"typical_p": 1.0,
|
101 |
"use_bfloat16": false,
|
102 |
"use_cache": true,
|
103 |
"vocab_size": 110592
|
104 |
},
|
105 |
+
"max_image_cnt": 12,
|
106 |
"max_num_grids": 9,
|
107 |
"model_type": "hyperclovax_vlm",
|
|
|
108 |
"num_queries_vis_abstractor": 81,
|
109 |
"proj_pos_emb": true,
|
110 |
"proj_prenorm": false,
|
111 |
"q_former_model_name_or_path": null,
|
112 |
"torch_dtype": "float32",
|
113 |
+
"transformers_version": "4.48.2",
|
114 |
"unpad": true,
|
115 |
"use_1x1_grid": true,
|
116 |
"use_nth_layer": -2,
|
117 |
"vision_config": {
|
118 |
+
"_attn_implementation_autoset": true,
|
119 |
+
"_name_or_path": "",
|
120 |
"add_cross_attention": false,
|
121 |
"anyres": true,
|
122 |
"architectures": [
|
123 |
"SiglipVisionModel"
|
124 |
],
|
125 |
"attention_dropout": 0.0,
|
126 |
+
"auto_map": {},
|
127 |
"bad_words_ids": null,
|
128 |
"begin_suppress_tokens": null,
|
129 |
"bos_token_id": null,
|
|
|
191 |
"top_p": 1.0,
|
192 |
"torch_dtype": "bfloat16",
|
193 |
"torchscript": false,
|
194 |
+
"transformers_version": "4.48.2",
|
195 |
"typical_p": 1.0,
|
196 |
"use_bfloat16": true
|
197 |
}
|
generation_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"transformers_version": "4.48.2"
|
4 |
+
}
|
pytorch_model-00001-of-00004.bin → model-00001-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:340b93b87f93c98b62d2c96ef56e4656d9d68ec8a1cd178fe6812c925f8d8d88
|
3 |
+
size 4997245472
|
pytorch_model-00002-of-00004.bin → model-00002-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f85a5d24cadbb3d235c670a88f9b0757ff50b226819ba0a3cece51a72a2891e4
|
3 |
+
size 4920253536
|
pytorch_model-00003-of-00004.bin → model-00003-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4efe99ddd60fc020ad202df4ed089ab0a280c7b17d5376f011888fde8dd2c44
|
3 |
+
size 4967583384
|
pytorch_model.bin.index.json → model.safetensors.index.json
RENAMED
The diff for this file is too large to render.
See raw diff
|
|
pytorch_model-00004-of-00004.bin
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:1c50467661833482053fbbac1ea806cc818f09cde08545b731c7836667e91a99
|
3 |
-
size 1495999777
|
|
|
|
|
|
|
|