Switch model weights to safetensors format

Files changed (7) hide show

config.json CHANGED Viewed

@@ -15,6 +15,8 @@
   "ignore_index": -100,
   "img_start_id": 100271,
   "language_config": {
     "add_cross_attention": false,
     "architectures": [
       "LlamaForCausalLM"
@@ -94,31 +96,34 @@
     "top_p": 1.0,
     "torch_dtype": "bfloat16",
     "torchscript": false,
-    "transformers_version": "4.45.0",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
     "vocab_size": 110592
   },
   "max_num_grids": 9,
   "model_type": "hyperclovax_vlm",
-  "max_image_cnt": 12,
   "num_queries_vis_abstractor": 81,
   "proj_pos_emb": true,
   "proj_prenorm": false,
   "q_former_model_name_or_path": null,
   "torch_dtype": "float32",
-  "transformers_version": "4.45.0",
   "unpad": true,
   "use_1x1_grid": true,
   "use_nth_layer": -2,
   "vision_config": {
     "add_cross_attention": false,
     "anyres": true,
     "architectures": [
       "SiglipVisionModel"
     ],
     "attention_dropout": 0.0,
     "bad_words_ids": null,
     "begin_suppress_tokens": null,
     "bos_token_id": null,
@@ -186,7 +191,7 @@
     "top_p": 1.0,
     "torch_dtype": "bfloat16",
     "torchscript": false,
-    "transformers_version": "4.45.0",
     "typical_p": 1.0,
     "use_bfloat16": true
   }

   "ignore_index": -100,
   "img_start_id": 100271,
   "language_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "",
     "add_cross_attention": false,
     "architectures": [
       "LlamaForCausalLM"
     "top_p": 1.0,
     "torch_dtype": "bfloat16",
     "torchscript": false,
+    "transformers_version": "4.48.2",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
     "vocab_size": 110592
   },
+  "max_image_cnt": 12,
   "max_num_grids": 9,
   "model_type": "hyperclovax_vlm",
   "num_queries_vis_abstractor": 81,
   "proj_pos_emb": true,
   "proj_prenorm": false,
   "q_former_model_name_or_path": null,
   "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
   "unpad": true,
   "use_1x1_grid": true,
   "use_nth_layer": -2,
   "vision_config": {
+    "_attn_implementation_autoset": true,
+    "_name_or_path": "",
     "add_cross_attention": false,
     "anyres": true,
     "architectures": [
       "SiglipVisionModel"
     ],
     "attention_dropout": 0.0,
+    "auto_map": {},
     "bad_words_ids": null,
     "begin_suppress_tokens": null,
     "bos_token_id": null,
     "top_p": 1.0,
     "torch_dtype": "bfloat16",
     "torchscript": false,
+    "transformers_version": "4.48.2",
     "typical_p": 1.0,
     "use_bfloat16": true
   }

generation_config.json ADDED Viewed

+{
+  "_from_model_config": true,
+  "transformers_version": "4.48.2"
+}

pytorch_model-00001-of-00004.bin → model-00001-of-00003.safetensors RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b34c808a1106a2d41f4a7202226d86d01a74b70fb267b2aa6a5e118b81806248
-size 1995404833

 version https://git-lfs.github.com/spec/v1
+oid sha256:340b93b87f93c98b62d2c96ef56e4656d9d68ec8a1cd178fe6812c925f8d8d88
+size 4997245472

pytorch_model-00002-of-00004.bin → model-00002-of-00003.safetensors RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c461a7f04797ab043c9a28dc90f8f60d5607e97a0a67b7d7660f760128d586df
-size 1963104270

 version https://git-lfs.github.com/spec/v1
+oid sha256:f85a5d24cadbb3d235c670a88f9b0757ff50b226819ba0a3cece51a72a2891e4
+size 4920253536

pytorch_model-00003-of-00004.bin → model-00003-of-00003.safetensors RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:21b2e6e12f24b28beb82ddc329bc3177f6a8f3f105540801edb6c50cb7233276
-size 1988270158

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4efe99ddd60fc020ad202df4ed089ab0a280c7b17d5376f011888fde8dd2c44
+size 4967583384

pytorch_model.bin.index.json → model.safetensors.index.json RENAMED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model-00004-of-00004.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:1c50467661833482053fbbac1ea806cc818f09cde08545b731c7836667e91a99
-size 1495999777