Update models
Browse files- .gitattributes +13 -0
- Qwen3-0.6B-Q2_K.gguf +3 -0
- Qwen3-0.6B-Q3_K_L.gguf +3 -0
- Qwen3-0.6B-Q3_K_M.gguf +3 -0
- Qwen3-0.6B-Q3_K_S.gguf +3 -0
- Qwen3-0.6B-Q4_0.gguf +3 -0
- Qwen3-0.6B-Q4_K_M.gguf +3 -0
- Qwen3-0.6B-Q4_K_S.gguf +3 -0
- Qwen3-0.6B-Q5_0.gguf +3 -0
- Qwen3-0.6B-Q5_K_M.gguf +3 -0
- Qwen3-0.6B-Q5_K_S.gguf +3 -0
- Qwen3-0.6B-Q6_K.gguf +3 -0
- Qwen3-0.6B-Q8_0.gguf +3 -0
- Qwen3-0.6B-f16.gguf +3 -0
- config.json +30 -0
.gitattributes
CHANGED
@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
Qwen3-0.6B-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
37 |
+
Qwen3-0.6B-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
38 |
+
Qwen3-0.6B-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
39 |
+
Qwen3-0.6B-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
40 |
+
Qwen3-0.6B-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
41 |
+
Qwen3-0.6B-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
42 |
+
Qwen3-0.6B-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
43 |
+
Qwen3-0.6B-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
44 |
+
Qwen3-0.6B-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
45 |
+
Qwen3-0.6B-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
46 |
+
Qwen3-0.6B-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
47 |
+
Qwen3-0.6B-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
48 |
+
Qwen3-0.6B-f16.gguf filter=lfs diff=lfs merge=lfs -text
|
Qwen3-0.6B-Q2_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb043f7932161baa0587727de13e50e884def5aeff5335110f0a5ce4e4d22335
|
3 |
+
size 347288224
|
Qwen3-0.6B-Q3_K_L.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65f8f9f73cca28b812e9626c31f72021cf3e87e82c37c5e0f2e6ce48115cc128
|
3 |
+
size 435343008
|
Qwen3-0.6B-Q3_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df588f102a9d6e240e86a9106fbef127e4eaa63c9c8ae40668d60daa2c456059
|
3 |
+
size 413978272
|
Qwen3-0.6B-Q3_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4b88c3b3e68a239a553306673401814fd1bd1a71f0eaa43539d0633aac1f14e
|
3 |
+
size 389926560
|
Qwen3-0.6B-Q4_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f734719e95510c7dff9ec1a7bc4d509d5fc63f7b4c8f72ed5b092f60df5c7ad8
|
3 |
+
size 469080736
|
Qwen3-0.6B-Q4_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd6df9d5627007fa6e29cf2fff3464b1ab01a789fa8220c61ff5f3cf4989ce0e
|
3 |
+
size 484219552
|
Qwen3-0.6B-Q4_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:564ee2ec7c066bf45498ba4aa431c259b1fada0cde0c79017fae79eff5374d1b
|
3 |
+
size 470784672
|
Qwen3-0.6B-Q5_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1297e04eb8e6da8f4ef8569c6bbe4f2b1c5712f545b683408bb2238cd4a6c2d
|
3 |
+
size 543578784
|
Qwen3-0.6B-Q5_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb4229cda08109a83c3b3a142f446443b811986562de49b3a0075b6732817355
|
3 |
+
size 551377568
|
Qwen3-0.6B-Q5_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f35abb4832ee1ad95161cf4679494fc0d96f2627e40e65c27a07542aa8da96f
|
3 |
+
size 543578784
|
Qwen3-0.6B-Q6_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f849a77a5eddcb3705b3495993c43b36f0c504409f47bf651925062ad94c8477
|
3 |
+
size 622732960
|
Qwen3-0.6B-Q8_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a475ffd89c94e46fbd9f7a2a1a6a6123e570ad1fe1511652b9923e9f1f651ba
|
3 |
+
size 804753056
|
Qwen3-0.6B-f16.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25fb880334987a71db728fb43af8568a4682208059f754a2735781f5d0970143
|
3 |
+
size 1509346976
|
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"Qwen3ForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_bias": false,
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"eos_token_id": 151645,
|
9 |
+
"head_dim": 128,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1024,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"max_position_embeddings": 40960,
|
15 |
+
"max_window_layers": 28,
|
16 |
+
"model_type": "qwen3",
|
17 |
+
"num_attention_heads": 16,
|
18 |
+
"num_hidden_layers": 28,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"rms_norm_eps": 1e-06,
|
21 |
+
"rope_scaling": null,
|
22 |
+
"rope_theta": 1000000,
|
23 |
+
"sliding_window": null,
|
24 |
+
"tie_word_embeddings": true,
|
25 |
+
"torch_dtype": "bfloat16",
|
26 |
+
"transformers_version": "4.51.0",
|
27 |
+
"use_cache": true,
|
28 |
+
"use_sliding_window": false,
|
29 |
+
"vocab_size": 151936
|
30 |
+
}
|