chrisjcundy committed on
Commit
5603653
·
verified ·
1 Parent(s): 9c4edc7

Upload LlamaForCausalLM

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +39 -0
  2. generation_config.json +12 -0
  3. model-00001-of-00062.safetensors +3 -0
  4. model-00002-of-00062.safetensors +3 -0
  5. model-00003-of-00062.safetensors +3 -0
  6. model-00004-of-00062.safetensors +3 -0
  7. model-00005-of-00062.safetensors +3 -0
  8. model-00006-of-00062.safetensors +3 -0
  9. model-00007-of-00062.safetensors +3 -0
  10. model-00008-of-00062.safetensors +3 -0
  11. model-00009-of-00062.safetensors +3 -0
  12. model-00010-of-00062.safetensors +3 -0
  13. model-00011-of-00062.safetensors +3 -0
  14. model-00012-of-00062.safetensors +3 -0
  15. model-00013-of-00062.safetensors +3 -0
  16. model-00014-of-00062.safetensors +3 -0
  17. model-00015-of-00062.safetensors +3 -0
  18. model-00016-of-00062.safetensors +3 -0
  19. model-00017-of-00062.safetensors +3 -0
  20. model-00018-of-00062.safetensors +3 -0
  21. model-00019-of-00062.safetensors +3 -0
  22. model-00020-of-00062.safetensors +3 -0
  23. model-00021-of-00062.safetensors +3 -0
  24. model-00022-of-00062.safetensors +3 -0
  25. model-00023-of-00062.safetensors +3 -0
  26. model-00024-of-00062.safetensors +3 -0
  27. model-00025-of-00062.safetensors +3 -0
  28. model-00026-of-00062.safetensors +3 -0
  29. model-00027-of-00062.safetensors +3 -0
  30. model-00028-of-00062.safetensors +3 -0
  31. model-00029-of-00062.safetensors +3 -0
  32. model-00030-of-00062.safetensors +3 -0
  33. model-00031-of-00062.safetensors +3 -0
  34. model-00032-of-00062.safetensors +3 -0
  35. model-00033-of-00062.safetensors +3 -0
  36. model-00034-of-00062.safetensors +3 -0
  37. model-00035-of-00062.safetensors +3 -0
  38. model-00036-of-00062.safetensors +3 -0
  39. model-00037-of-00062.safetensors +3 -0
  40. model-00038-of-00062.safetensors +3 -0
  41. model-00039-of-00062.safetensors +3 -0
  42. model-00040-of-00062.safetensors +3 -0
  43. model-00041-of-00062.safetensors +3 -0
  44. model-00042-of-00062.safetensors +3 -0
  45. model-00043-of-00062.safetensors +3 -0
  46. model-00044-of-00062.safetensors +3 -0
  47. model-00045-of-00062.safetensors +3 -0
  48. model-00046-of-00062.safetensors +3 -0
  49. model-00047-of-00062.safetensors +3 -0
  50. model-00048-of-00062.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "LlamaForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 128000,
8
+ "eos_token_id": [
9
+ 128001,
10
+ 128008,
11
+ 128009
12
+ ],
13
+ "head_dim": 128,
14
+ "hidden_act": "silu",
15
+ "hidden_size": 8192,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 28672,
18
+ "max_position_embeddings": 131072,
19
+ "mlp_bias": false,
20
+ "model_type": "llama",
21
+ "num_attention_heads": 64,
22
+ "num_hidden_layers": 80,
23
+ "num_key_value_heads": 8,
24
+ "pretraining_tp": 1,
25
+ "rms_norm_eps": 1e-05,
26
+ "rope_scaling": {
27
+ "factor": 8.0,
28
+ "high_freq_factor": 4.0,
29
+ "low_freq_factor": 1.0,
30
+ "original_max_position_embeddings": 8192,
31
+ "rope_type": "llama3"
32
+ },
33
+ "rope_theta": 500000.0,
34
+ "tie_word_embeddings": false,
35
+ "torch_dtype": "float32",
36
+ "transformers_version": "4.55.4",
37
+ "use_cache": true,
38
+ "vocab_size": 128256
39
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
+ "transformers_version": "4.55.4"
12
+ }
model-00001-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0508c741f14a81d48939a8914390e6c81fb7baf12c64a1229000b2fd86c4c1c
3
+ size 4806672984
model-00002-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c91c948b01faa5b782d99e80ea1e83b5be28370e52f9b40b9b1369b9771187f
3
+ size 4362142864
model-00003-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1de0ce3843e4269829108067a9847bc3ad64d067700de0ad825f9cd5db52dc09
3
+ size 4362142864
model-00004-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ba0f0fec9a0de39a7f9b052dfa22d788b297c420e8afefdd92317beb1263687
3
+ size 4966188864
model-00005-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5304375b5f6e589972dcd2f1968bf2169b85a559d7fb914691e0880f5600dfb6
3
+ size 4362142864
model-00006-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7265f7f523e64f52478da5d7d4a3f6244d0f192b5ea3a22832b5441d03ea0cf1
3
+ size 4362142864
model-00007-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd08393d2b258f739be730b0b7434eb4ace6a7b787629df6ea785df90335f7be
3
+ size 4966188864
model-00008-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84d7a8db4ea21f9d9aa7ae1556c1027a67110e49f46ecd69c299a1eb040623aa
3
+ size 4362142864
model-00009-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75720b6d95ed5476f553492fd7aa03f40c4c326c84887e8b7a1b2b764cdada90
3
+ size 4362142880
model-00010-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e3f2571c0537b4376dd758886f96d64073790fc38341412af1e9db628dc9b0f
3
+ size 4966188880
model-00011-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c256c8b0cb99d86ad83d70532b373ddfde33e1454e2f02e1fafffd25773ea766
3
+ size 4362142872
model-00012-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e900554b94df3e317eb03d3e98cff39a1fffab83152f21511e928b568f4443b4
3
+ size 4362142872
model-00013-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84a4ca0995c0f03143cbd2441b7da58231562b5ba82456e72d4e65ca50f60cc6
3
+ size 4966188880
model-00014-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ed247b06df6a41fa836b749c4f05c069b9c8d761ff9719fb38ea22b8187bea
3
+ size 4362142872
model-00015-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fdef788283d72177a9cc756244e4f3109b93f6176dfd25203188a26d32f38c4
3
+ size 4362142872
model-00016-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e01309a1d15eab168df74e3f45898247bba72bd37b121967b92e2ce78fef1d57
3
+ size 4966188880
model-00017-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89eeb359fed2a5a5464842279e38e40aeb1e7f0c35b89b4d215b23856605f2ba
3
+ size 4362142872
model-00018-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48768615c36034b987ecea279d798f7a193fce8b7abf74d81ed592536be4c505
3
+ size 4362142872
model-00019-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50fc90357fce91f42ce6cf43eb39c7d3b75fc41cd07b7a98d453137582d81b10
3
+ size 4966188880
model-00020-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2044e0d55ecff82f80915d775e0446090a6b2a80b96ddc066cb0f370638c248
3
+ size 4362142872
model-00021-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66b5ae0b5c3eb3571bb800f15e30461dee9070fb10172d0ecda7c6847082a970
3
+ size 4362142872
model-00022-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42a41a23d9fbe7e9f1e6638a9143713d04fbd876ef328acc26af5d33dd4f6ff3
3
+ size 4966188880
model-00023-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4000eb1e81a12540366dc1187cc4ad6390432e97db3829fe6f761be5b9473211
3
+ size 4362142872
model-00024-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9294f226e52ee97d21b1900366ac337704655af87e52deace45e30897da39b35
3
+ size 4362142872
model-00025-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2ee0fa5bdd45cefdd442b4e8b1135947d6b9541ff1d9459d1fc17a9bbb46a24
3
+ size 4966188880
model-00026-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba79140600211832f84d2244b4795390721f5cf5aba11aec38983df4a54147d3
3
+ size 4362142872
model-00027-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a4419b08856470bb4be66bddc136807b4418c0807af6e9d6362b390ff66c84
3
+ size 4362142872
model-00028-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca0e46def37f60864b8a801d16bfea5b7476140168995a8911c5bf49b812d502
3
+ size 4966188880
model-00029-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81faa2c4402dabfd9041e1fffb8480dcdf3e0337bc6fed8f8bd0be82240c7dd9
3
+ size 4362142872
model-00030-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d6cb8470bf5cb73bcdd0fafe57f26f1cca6fae07fdacb9b173ba9784d91f6d0
3
+ size 4362142872
model-00031-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fbda00c24f7c9a128c6f0a9f551c6a4b8668829fd68f5f2459786dc4ce420a6
3
+ size 4966188880
model-00032-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ae31c5bd1a7ce2c81b1a818c998da53cd5edf1d66dfd1673409b957344e2f93
3
+ size 4362142872
model-00033-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f05d6f3186cd7a43f6d69584c6279a98a5063c31cdeddb3265c3950debf86ce
3
+ size 4362142872
model-00034-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be840476ed2a376f0ae48f610596a45bff750f68713725b2edccfea4fb4f700d
3
+ size 4966188880
model-00035-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a6304c20e12f45834a7914cfb7d8ee4bed83e90e2554891cf87f4c1c6bf0619
3
+ size 4362142872
model-00036-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988f6d21cbade0a8cdf9bb9c087fc2ef5697605f6a99c6afc1a5fa24cb0b2983
3
+ size 4362142872
model-00037-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55c4bbb4b88a6350462849866f01f8127536ffe3686a6c91be0995f6e6f288c4
3
+ size 4966188880
model-00038-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17b2a65b2d44cbf5c232c0e6cd6e0af546e2eca0c93dbabc77aec363e31ffcd0
3
+ size 4362142872
model-00039-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bad18c25dde63d2ca5b11f11532a03dcb1cdeef7648391f60e9289798d7b7dbe
3
+ size 4362142872
model-00040-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43b91b70638c7448d29ec353315140abbc0d55f6ac32f72136b4dac9712a3e08
3
+ size 4966188880
model-00041-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:affb7608ebab90b7271143468f4ea3b1a514106e998924cb77b8c27b1752fd19
3
+ size 4362142872
model-00042-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c8f173eac47d7d5d29eaf6078aa80e746087bca5ca27bcd9e8685af4ec8ec4f
3
+ size 4362142872
model-00043-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a69220773e0b4165658dee2d9aa8afab1908de70f79463de637d90f77e74a6d
3
+ size 4966188880
model-00044-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:089153f4bb3a180467cdbbfdf647dda2d5cef97ebc97564eca809d61c942a54a
3
+ size 4362142872
model-00045-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab179e919b081cde43c215833bd920b83873e525244a77ec496efdad5bfb2648
3
+ size 4362142872
model-00046-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae114ecdfe01644eb47203fdd79a1fc0cecf8e426aa2442df04d034f6681b301
3
+ size 4966188880
model-00047-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:945af301f5b977c538039fba1edd3cda0fdba49ba6f78bbb70556594b2667a5c
3
+ size 4362142872
model-00048-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25780374dc10114e61793bdf221a1319d39a7e2336e3cacf6385a3d8e65c5d44
3
+ size 4362142872