Upload Qwen3ForCausalLM

Browse files

Files changed (5)

config.json +44 -4
generation_config.json +1 -1
pytorch_model-00001-of-00002.bin +2 -2
pytorch_model-00002-of-00002.bin +2 -2
pytorch_model.bin.index.json +1 -0

config.json CHANGED

@@ -11,6 +11,44 @@
   "hidden_size": 4096,
   "initializer_range": 0.02,
   "intermediate_size": 12288,
   "max_position_embeddings": 40960,
   "max_window_layers": 36,
   "model_type": "qwen3",
@@ -18,13 +56,14 @@
   "num_hidden_layers": 36,
   "num_key_value_heads": 8,
   "quantization_config": {
-    "include_embedding": false,
     "modules_to_not_convert": null,
     "quant_method": "torchao",
     "quant_type": {
       "default": {
         "_data": {
           "group_size": 128,
           "layout": {
             "_data": {
               "inner_k_tiles": 8
@@ -32,16 +71,17 @@
             "_type": "TensorCoreTiledLayout",
             "_version": 1
           },
           "preserve_zero": null,
           "set_inductor_config": true,
-          "use_hqq": true,
           "zero_point_domain": {
             "_data": "NONE",
             "_type": "ZeroPointDomain"
           }
         },
         "_type": "Int4WeightOnlyConfig",
-        "_version": 1
       }
     },
     "quant_type_kwargs": {},
@@ -53,7 +93,7 @@
   "sliding_window": null,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.52.0.dev0",
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151936

   "hidden_size": 4096,
   "initializer_range": 0.02,
   "intermediate_size": 12288,
+  "layer_types": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
   "max_position_embeddings": 40960,
   "max_window_layers": 36,
   "model_type": "qwen3",
   "num_hidden_layers": 36,
   "num_key_value_heads": 8,
   "quantization_config": {
+    "include_input_output_embeddings": false,
     "modules_to_not_convert": null,
     "quant_method": "torchao",
     "quant_type": {
       "default": {
         "_data": {
           "group_size": 128,
+          "int4_choose_qparams_algorithm": "hqq",
           "layout": {
             "_data": {
               "inner_k_tiles": 8
             "_type": "TensorCoreTiledLayout",
             "_version": 1
           },
+          "packing_format": "tile_packed_to_4d",
           "preserve_zero": null,
           "set_inductor_config": true,
+          "use_hqq": false,
           "zero_point_domain": {
             "_data": "NONE",
             "_type": "ZeroPointDomain"
           }
         },
         "_type": "Int4WeightOnlyConfig",
+        "_version": 2
       }
     },
     "quant_type_kwargs": {},
   "sliding_window": null,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.55.4",
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151936

generation_config.json CHANGED

@@ -9,5 +9,5 @@
   "temperature": 0.6,
   "top_k": 20,
   "top_p": 0.95,
-  "transformers_version": "4.52.0.dev0"
 }

   "temperature": 0.6,
   "top_k": 20,
   "top_p": 0.95,
+  "transformers_version": "4.55.4"
 }

pytorch_model-00001-of-00002.bin CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c1cd775b881e92b5210c6deb171a6768f277907079ef65b0e2f94c6e72df326a
-size 4935497756

 version https://git-lfs.github.com/spec/v1
+oid sha256:5e9cb30fa015b2d0075bc753865281b93b861b404b044bd852b3611ce0a4a020
+size 4935466523

pytorch_model-00002-of-00002.bin CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4fb405e09d822b45d676275cf6d4a22df256e0e21ac9be3d3e199b24610ab53e
-size 1244661125

 version https://git-lfs.github.com/spec/v1
+oid sha256:f41a2ea7d01f35ed3c0ecd8cab39da1cd7bc2ad48be7c46dc8fab80b5628bfa9
+size 1244661564

pytorch_model.bin.index.json CHANGED

@@ -1,5 +1,6 @@
 {
   "metadata": {
     "total_size": 6179874816
   },
   "weight_map": {

 {
   "metadata": {
+    "total_parameters": 8190735360,
     "total_size": 6179874816
   },
   "weight_map": {