roslein committed on
Commit
d39be35
·
verified ·
1 Parent(s): 23589eb

Initial commit msg

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. config.json +38 -0
  3. generation_config.json +8 -0
  4. model-00001-of-00049.safetensors +3 -0
  5. model-00002-of-00049.safetensors +3 -0
  6. model-00003-of-00049.safetensors +3 -0
  7. model-00004-of-00049.safetensors +3 -0
  8. model-00005-of-00049.safetensors +3 -0
  9. model-00006-of-00049.safetensors +3 -0
  10. model-00007-of-00049.safetensors +3 -0
  11. model-00008-of-00049.safetensors +3 -0
  12. model-00009-of-00049.safetensors +3 -0
  13. model-00010-of-00049.safetensors +3 -0
  14. model-00011-of-00049.safetensors +3 -0
  15. model-00012-of-00049.safetensors +3 -0
  16. model-00013-of-00049.safetensors +3 -0
  17. model-00014-of-00049.safetensors +3 -0
  18. model-00015-of-00049.safetensors +3 -0
  19. model-00016-of-00049.safetensors +3 -0
  20. model-00017-of-00049.safetensors +3 -0
  21. model-00018-of-00049.safetensors +3 -0
  22. model-00019-of-00049.safetensors +3 -0
  23. model-00020-of-00049.safetensors +3 -0
  24. model-00021-of-00049.safetensors +3 -0
  25. model-00022-of-00049.safetensors +3 -0
  26. model-00023-of-00049.safetensors +3 -0
  27. model-00024-of-00049.safetensors +3 -0
  28. model-00025-of-00049.safetensors +3 -0
  29. model-00026-of-00049.safetensors +3 -0
  30. model-00027-of-00049.safetensors +3 -0
  31. model-00028-of-00049.safetensors +3 -0
  32. model-00029-of-00049.safetensors +3 -0
  33. model-00030-of-00049.safetensors +3 -0
  34. model-00031-of-00049.safetensors +3 -0
  35. model-00032-of-00049.safetensors +3 -0
  36. model-00033-of-00049.safetensors +3 -0
  37. model-00034-of-00049.safetensors +3 -0
  38. model-00035-of-00049.safetensors +3 -0
  39. model-00036-of-00049.safetensors +3 -0
  40. model-00037-of-00049.safetensors +3 -0
  41. model-00038-of-00049.safetensors +3 -0
  42. model-00039-of-00049.safetensors +3 -0
  43. model-00040-of-00049.safetensors +3 -0
  44. model-00041-of-00049.safetensors +3 -0
  45. model-00042-of-00049.safetensors +3 -0
  46. model-00043-of-00049.safetensors +3 -0
  47. model-00044-of-00049.safetensors +3 -0
  48. model-00045-of-00049.safetensors +3 -0
  49. model-00046-of-00049.safetensors +3 -0
  50. model-00047-of-00049.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Cohere2ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 5,
8
+ "cache_implementation": "hybrid",
9
+ "eos_token_id": 255001,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 12288,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 36864,
15
+ "layer_norm_eps": 1e-05,
16
+ "logit_scale": 0.25,
17
+ "max_position_embeddings": 131072,
18
+ "model_type": "cohere2",
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 64,
21
+ "num_key_value_heads": 8,
22
+ "order_of_interleaved_layers": "local_attn_first",
23
+ "pad_token_id": 0,
24
+ "position_embedding_type": "rope_gptj",
25
+ "rope_scaling": null,
26
+ "rope_theta": 50000,
27
+ "rotary_pct": 1.0,
28
+ "sliding_window": 4096,
29
+ "sliding_window_pattern": 4,
30
+ "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.51.3",
32
+ "use_cache": true,
33
+ "use_embedding_sharing": true,
34
+ "use_gated_activation": true,
35
+ "use_parallel_block": true,
36
+ "use_parallel_embedding": true,
37
+ "vocab_size": 256000
38
+ }
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 5,
4
+ "cache_implementation": "hybrid",
5
+ "eos_token_id": 255001,
6
+ "pad_token_id": 0,
7
+ "transformers_version": "4.51.3"
8
+ }
model-00001-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8b510a976376c61d1387063aec33104a962b451416d69d901089758bb00d9e8
3
+ size 6291456144
model-00002-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0ea81efb8d0de2b89d93b739050dadef418c9ae4e4c6f03371823237a3d5937
3
+ size 4932527624
model-00003-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f044481b393603e9cc97f7cdc800a998d67540c0a9c7d2b655fb88109f2bade
3
+ size 4278215728
model-00004-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47cd7432a1bb6b3ee8c1a81527f970b8c0634ca970ac50ed7564302ca86b0fd7
3
+ size 4932552312
model-00005-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc136b3f90cfb7ea55f129953300d4514fa54ca0a0662f695dd949c3803d649d
3
+ size 4278215728
model-00006-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25d50f13efa6ebc7598da45602369e0b4e8e7e75e008134eed90d42ff931481d
3
+ size 4278215728
model-00007-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ec2161bcfbef3374784e39ecede6504c6e6ac2348411efe8e98841a56e888b7
3
+ size 4932552312
model-00008-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b214e8b70c6aa3d1ce2f55f7853e03ae1054866f53a9d4d83d1cb915d09eb6b1
3
+ size 4278215728
model-00009-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18ee22d0a3c246b1dcceaffe7e4bd0529df5273a8e196d54babceb7cdddc33f2
3
+ size 4278215744
model-00010-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96c9bf123254369870ab916535e22749978c04267b4a21b7f338cfc8a148df08
3
+ size 4932552328
model-00011-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ddaf1756de7c6eb27ca333c5683adf83260c8ea4f07b61cc9c6c65c02bc4eb3
3
+ size 4278215736
model-00012-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:325da7b9f1970e12ee500e7809de6e2c8ac7e20ee420e00763cd398e83b95082
3
+ size 4278215736
model-00013-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6233340996bbd6f5ece3ad294db84413358b1c3d78c4206e8a8b43e13d19d225
3
+ size 4932552328
model-00014-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68f0b7180b42654307b521a4419fab9d0694d1239127704bf49ab1bf8c0deaa3
3
+ size 4278215736
model-00015-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11eb62dd1dd2c47d6052f1e34859909ae883fcc7c684cfb65b58e6103f91557f
3
+ size 4278215736
model-00016-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efe94c7cf845ef01c9ee6740db48c83fbffaa6cf84a588db6767ad280da0d921
3
+ size 4932552328
model-00017-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14c5937be907455c1d4a7cce887eb17ccfbc7f09378a958e86414c6077a4f6ab
3
+ size 4278215736
model-00018-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cdc884e44eb8793656732b7e49ddcb8d75257145787e157b20cff46d975fa1d
3
+ size 4278215736
model-00019-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d596611ea90b2544c5961a69de12a31ac4c81503150f8ce556dc6a7704ffdaee
3
+ size 4932552328
model-00020-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c807d25b7c3eccb8722aa4c1f478e616598025377c191aff499de01495956c94
3
+ size 4278215736
model-00021-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89c8fde8c54bad65a5ac62b9f9410186d0706b61f73cf017028b24b409a98c37
3
+ size 4278215736
model-00022-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cae35cbeccdfb97c79b32db485785d312f97436903097d687d543c3ea33ded0b
3
+ size 4932552328
model-00023-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c48a592815fa59548f87b232538f9c3f8b5c8a46292d69bdea7dc32af9a6e579
3
+ size 4278215736
model-00024-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f94f541e57515c8cbdc752b95559c444ab2d62a7598e257e933a50f215a16c8
3
+ size 4278215736
model-00025-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90c60206ef473df82600e7aa1a976350880ab096fee65f665b4d833845855083
3
+ size 4932552328
model-00026-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7241ce5f8501f7840fa8f2c92830417651c006bbdbf44ae6878cdd4c15de0360
3
+ size 4278215736
model-00027-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92be22ec815d2943c6504e6070b5b57700ccdc84c750258708ca5d8b0e0038c8
3
+ size 4278215736
model-00028-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aadf5fcb1f66ade1a843e81e390ec66e6ad5cd4dbe465f45842bc85595193913
3
+ size 4932552328
model-00029-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70d18188981e5c1a6d11ff1f03be832dc3a01a14de3364ed438f0faffe33a8ac
3
+ size 4278215736
model-00030-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e877487f0708084ec100620788d6ff9282cfa419067b223cb88193ee10cf56da
3
+ size 4278215736
model-00031-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64241a7fa49275902ee1e6deb8625c291c935e4bbb22ef0dd2e29b2f95e14d66
3
+ size 4932552328
model-00032-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc5eda9ab38b90fa836b1686c53a92f4bc46fdcdbafebbd26302b056a9f69937
3
+ size 4278215736
model-00033-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac0d234db1352ce2a4918adf731d7c0f37b28d27eff2f0d75152d286ed9689ef
3
+ size 4278215736
model-00034-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2971412914273cbea936eff56ef6ba761c6bbcd86ff8921a807aa347d022c2eb
3
+ size 4932552328
model-00035-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52ecae7da51ad27ef7f72dd31a980e553ca008abca8248757b9694956f109836
3
+ size 4278215736
model-00036-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3daa3ee111063a613d45a99441c8b175105743405625e0c8435614063f2b7243
3
+ size 4278215736
model-00037-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:877916e2241263428305db382c8aeb44f945a75f30b87b4a194bacae9cdb2e20
3
+ size 4932552328
model-00038-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6780d6c019fe95ff8de0cdb828d1999daa53d419832621e4b107f939319d4c4
3
+ size 4278215736
model-00039-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6c70dfa6c18f6d16327258de6a1bc3bf3a93600059f9d90cabe6227ebb3e9fc
3
+ size 4278215736
model-00040-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ce6d501bc3942293a5dd9239a0ed6b6e074b1195569af1293b2295aca66e7f5
3
+ size 4932552328
model-00041-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc1cad1ca8d82eb544c5fd1284f3e3865f5d81238c3a6f087844b59ee7c49a62
3
+ size 4278215736
model-00042-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a609ce1376e99744b837b24a52ae58246f384c8bc47debb3779330bc98a978cf
3
+ size 4278215736
model-00043-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caf19220e673d82310d383b5faee6bb4ab9a6783bf7e9fe7c143df1c7df393b9
3
+ size 4932552328
model-00044-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d431492a0ce20191423fa19c5e41f7fe6d15e02a82ae613a02ac32869dc7744
3
+ size 4278215736
model-00045-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30cf59f634cec3fbf2281904a61c44d4f1cb08c64c404725c93eb18a8ed82101
3
+ size 4278215736
model-00046-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4df006e73a32e6f3c17fa6019cb3f04df433f1b66590eeb4c5dbc7ce99e10d49
3
+ size 4932552328
model-00047-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddbfc14a0cc030453f92941a07af59c32942081c011d334de208e3c8c19b219b
3
+ size 4278215736