Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- config.json +40 -0
- model-00001-of-00049.safetensors +3 -0
- model-00002-of-00049.safetensors +3 -0
- model-00003-of-00049.safetensors +3 -0
- model-00004-of-00049.safetensors +3 -0
- model-00005-of-00049.safetensors +3 -0
- model-00006-of-00049.safetensors +3 -0
- model-00007-of-00049.safetensors +3 -0
- model-00008-of-00049.safetensors +3 -0
- model-00009-of-00049.safetensors +3 -0
- model-00010-of-00049.safetensors +3 -0
- model-00011-of-00049.safetensors +3 -0
- model-00012-of-00049.safetensors +3 -0
- model-00013-of-00049.safetensors +3 -0
- model-00014-of-00049.safetensors +3 -0
- model-00015-of-00049.safetensors +3 -0
- model-00016-of-00049.safetensors +3 -0
- model-00017-of-00049.safetensors +3 -0
- model-00018-of-00049.safetensors +3 -0
- model-00019-of-00049.safetensors +3 -0
- model-00020-of-00049.safetensors +3 -0
- model-00021-of-00049.safetensors +3 -0
- model-00022-of-00049.safetensors +3 -0
- model-00023-of-00049.safetensors +3 -0
- model-00024-of-00049.safetensors +3 -0
- model-00025-of-00049.safetensors +3 -0
- model-00026-of-00049.safetensors +3 -0
- model-00027-of-00049.safetensors +3 -0
- model-00028-of-00049.safetensors +3 -0
- model-00029-of-00049.safetensors +3 -0
- model-00030-of-00049.safetensors +3 -0
- model-00031-of-00049.safetensors +3 -0
- model-00032-of-00049.safetensors +3 -0
- model-00033-of-00049.safetensors +3 -0
- model-00034-of-00049.safetensors +3 -0
- model-00035-of-00049.safetensors +3 -0
- model-00036-of-00049.safetensors +3 -0
- model-00037-of-00049.safetensors +3 -0
- model-00038-of-00049.safetensors +3 -0
- model-00039-of-00049.safetensors +3 -0
- model-00040-of-00049.safetensors +3 -0
- model-00041-of-00049.safetensors +3 -0
- model-00042-of-00049.safetensors +3 -0
- model-00043-of-00049.safetensors +3 -0
- model-00044-of-00049.safetensors +3 -0
- model-00045-of-00049.safetensors +3 -0
- model-00046-of-00049.safetensors +3 -0
- model-00047-of-00049.safetensors +3 -0
- model-00048-of-00049.safetensors +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"Cohere2ForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_bias": false,
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 5,
|
8 |
+
"cache_implementation": "hybrid",
|
9 |
+
"eos_token_id": 255001,
|
10 |
+
"head_dim": 128,
|
11 |
+
"hidden_act": "silu",
|
12 |
+
"hidden_size": 12288,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 36864,
|
15 |
+
"layer_norm_eps": 1e-05,
|
16 |
+
"logit_scale": 0.25,
|
17 |
+
"max_position_embeddings": 262144,
|
18 |
+
"model_type": "cohere2",
|
19 |
+
"num_attention_heads": 96,
|
20 |
+
"num_hidden_layers": 64,
|
21 |
+
"num_key_value_heads": 8,
|
22 |
+
"order_of_interleaved_layers": "local_attn_first",
|
23 |
+
"pad_token_id": 0,
|
24 |
+
"position_embedding_type": "rope_gptj",
|
25 |
+
"rope_scaling": null,
|
26 |
+
"rope_theta": 50000,
|
27 |
+
"rotary_pct": 1.0,
|
28 |
+
"sliding_window": 4096,
|
29 |
+
"sliding_window_pattern": 4,
|
30 |
+
"torch_dtype": "bfloat16",
|
31 |
+
"transformers_version": "4.50.3",
|
32 |
+
"unsloth_fixed": true,
|
33 |
+
"unsloth_version": "2025.3.19",
|
34 |
+
"use_cache": true,
|
35 |
+
"use_embedding_sharing": true,
|
36 |
+
"use_gated_activation": true,
|
37 |
+
"use_parallel_block": true,
|
38 |
+
"use_parallel_embedding": true,
|
39 |
+
"vocab_size": 256000
|
40 |
+
}
|
model-00001-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8b510a976376c61d1387063aec33104a962b451416d69d901089758bb00d9e8
|
3 |
+
size 6291456144
|
model-00002-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:485573b6df21b07e5abfe52465ee630254cfd95c92c5a326a09cad1bd7c34b82
|
3 |
+
size 4932527624
|
model-00003-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4e26dc2c3b74642c46975070a267243ffa438f98cf70583dd26cd14717e63d2
|
3 |
+
size 4278215728
|
model-00004-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60e7286aa5eabbe9e0f357fd6f82ff31f58399b46e7e0f1f5858fe54f95fce99
|
3 |
+
size 4932552312
|
model-00005-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4be97e749586fdf2b47d84b39c2a823f8ea6b2d929b9498d54b57cbaf3a2921
|
3 |
+
size 4278215728
|
model-00006-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c01c6be21720b6d902078429a53302320ad41521d07e92700a3a44ea180bd0a4
|
3 |
+
size 4278215728
|
model-00007-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0627f4d85516d9053859829d10f4a563948dece10186d91a5ceeab74295d728
|
3 |
+
size 4932552312
|
model-00008-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89eafea8d952fd04e65eacb9df5b4bf94f8c46baa4154d86c30094e8dba52e7a
|
3 |
+
size 4278215728
|
model-00009-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:457e1d57147b0c14c0e34f027195168922bfaf7f3445f2af28dc9f9004e2b669
|
3 |
+
size 4278215744
|
model-00010-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82b261740e39b6b6954229517e27f828c0fe5eb214f48e9755e9f4bcd99ce38a
|
3 |
+
size 4932552328
|
model-00011-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:545568b5a803b5257212a35bc1ac0736d9f37905245f755f4e06b3850c24f56a
|
3 |
+
size 4278215736
|
model-00012-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a13f5f89ca0b1fea3b1bdee3bb13e16720be21f218f0dbb7218ac5b908f635fc
|
3 |
+
size 4278215736
|
model-00013-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f296046a3bbbbb3b5017ed980e616d4ad05c73d096a853e54dcf894927ad67f
|
3 |
+
size 4932552328
|
model-00014-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b30c04bfce0e5aaabad43a9fbdb2d8d41f18efce2e894fd931018076f615219e
|
3 |
+
size 4278215736
|
model-00015-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e416d1349c91bbe5d0092bcad15d713700790b624ed086a20df1fd04163556af
|
3 |
+
size 4278215736
|
model-00016-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f9ec56197319edecbbdff22f944878882fadb374d5f13f5c44bb08cb2f3a33e
|
3 |
+
size 4932552328
|
model-00017-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:096c5fbf956a3079843fac773deb062ed7f62bb3fbdeb3444f368d979b867d76
|
3 |
+
size 4278215736
|
model-00018-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b253dc17d4deaec0b2d7b1c109a1c3d4544d3e0f073a36427015b1c38bd40d82
|
3 |
+
size 4278215736
|
model-00019-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9603a1d5f3c7da0dd4cc8991e2cd127960ba2225971ec5b31d6c4c467ee7960
|
3 |
+
size 4932552328
|
model-00020-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5391fe292aff4f8c44a92bc3cabf0abc6977eef57b8a078d3c3cc5cbcf5e6f4f
|
3 |
+
size 4278215736
|
model-00021-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6dffff92b839db4c87a8b63e3d2f0ec74c8b5cfa7f996fbcdbbb2f4663c0927
|
3 |
+
size 4278215736
|
model-00022-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ec1409b81d39255adf574b503eeebd8835381b14f91618a140d739da40ee48c
|
3 |
+
size 4932552328
|
model-00023-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ee7cf45bdea89cf73f4d6a587324afc1ef88dc26dde0b3cb587916dbe54cdcb
|
3 |
+
size 4278215736
|
model-00024-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18417d0c9376fdf5aaa77c9d47eb8a505962c80da1ad6f0bfaa713e3e0c0d5ee
|
3 |
+
size 4278215736
|
model-00025-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3363af6ffa39e1d7fbf5488cff6f358c248788ca6871ca0df08c436ec06d257
|
3 |
+
size 4932552328
|
model-00026-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da1100f0d0de95a5eb6ccefba32c58bc7a692c6d1e8d00e7ce9e24da06eb1eab
|
3 |
+
size 4278215736
|
model-00027-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52fe4a19d17611006fa62c5beb7f85f8211527cd829420f3d52b8fec6fbb163a
|
3 |
+
size 4278215736
|
model-00028-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3b06d697dca0655fc69d8c2e5e100ff9a7ca4c105e8684d755d17b623297380
|
3 |
+
size 4932552328
|
model-00029-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4c675c6becb47b8960df36772eeca74a965328a79e76995ec7b99fb1b56ff10
|
3 |
+
size 4278215736
|
model-00030-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df68be08ed81f4ae1dfc01191078df24ae82256a31727c79319492e6912fefd2
|
3 |
+
size 4278215736
|
model-00031-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecff21c1a0c7fb2818608a2ec1b2aa3dfe8c47b8768c1d1d531195f39d3b9e65
|
3 |
+
size 4932552328
|
model-00032-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d90353213c0865c246c0e2f11ea2475ff67a3685e44ef081795677fca7f9305a
|
3 |
+
size 4278215736
|
model-00033-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fee733dddd12515c2bf44b1198d48a083d728402318b6c6a9945f5cd0eccc6f4
|
3 |
+
size 4278215736
|
model-00034-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ba24822d19b295292f5b7cadd0a285ec555a7395c534b49eb9678e5c03fe8d9
|
3 |
+
size 4932552328
|
model-00035-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ac2a0edfdfe02f15450068051c925253e92526813a14ff179ac58a19e7513a1
|
3 |
+
size 4278215736
|
model-00036-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e418b8c6c5e2e52efa9e2ad76791ebcd5fae477dd4456ff02535a20a2bab583
|
3 |
+
size 4278215736
|
model-00037-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3c61d13e9190ee802175d9e87d95eef87beb13587f371e0b5cd2b1edfee7e59
|
3 |
+
size 4932552328
|
model-00038-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:389ff526ee7f8031a464dcdaf8baf423a6b225206b5716415a4ab17dcd2d8cf7
|
3 |
+
size 4278215736
|
model-00039-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b05cda093c7a907d3b9dc57e1262ccd986fa9cfd730d8da90dfcaad79de30cfc
|
3 |
+
size 4278215736
|
model-00040-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ed1afe77efac6d4907ce1ca701fc2912c7323c95986f96f3d0fe9ff63bc8e94
|
3 |
+
size 4932552328
|
model-00041-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a622f7db46d89cecffb16d48081af286b0931bf62c8c554b5f78e60de96652fb
|
3 |
+
size 4278215736
|
model-00042-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92539d2d95dc636421101be8832055b13d49eece12b95e72a80dbe5bb913f5b5
|
3 |
+
size 4278215736
|
model-00043-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d0dd6b575104594db55420675ff6f2108ad38ae5a2dc99ea1191092dad72945
|
3 |
+
size 4932552328
|
model-00044-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:559f7b08d10e8930e911bc5eb96230c8ba87472a991d2a2d5769ff358224060e
|
3 |
+
size 4278215736
|
model-00045-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:923a0c2c46e8adfe6361ea470a650d036a887d3c7e1c258be0ea0c24a7c5cfdc
|
3 |
+
size 4278215736
|
model-00046-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab316d92fd2a4213f63f88ad9a17a28c56d165ab70ed64d6c9f7934d7addba97
|
3 |
+
size 4932552328
|
model-00047-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db9599674b74fac9daa53dac2ea4e5d477225f9143d7b6655bc6fb073e09de4d
|
3 |
+
size 4278215736
|
model-00048-of-00049.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70721e08b4b847d92739fecb7cdf1c9718d1be434f59e02941d69a62154b40c9
|
3 |
+
size 4278215736
|