danielhanchen committed on
Commit
6868cf2
1 Parent(s): 86c587c

Upload LlamaForCausalLM

Browse files
Files changed (47) hide show
  1. config.json +1 -3
  2. generation_config.json +0 -2
  3. model-00001-of-00044.safetensors +3 -0
  4. model-00002-of-00044.safetensors +3 -0
  5. model-00003-of-00044.safetensors +3 -0
  6. model-00004-of-00044.safetensors +3 -0
  7. model-00005-of-00044.safetensors +3 -0
  8. model-00006-of-00044.safetensors +3 -0
  9. model-00007-of-00044.safetensors +3 -0
  10. model-00008-of-00044.safetensors +3 -0
  11. model-00009-of-00044.safetensors +3 -0
  12. model-00010-of-00044.safetensors +3 -0
  13. model-00011-of-00044.safetensors +3 -0
  14. model-00012-of-00044.safetensors +3 -0
  15. model-00013-of-00044.safetensors +3 -0
  16. model-00014-of-00044.safetensors +3 -0
  17. model-00015-of-00044.safetensors +3 -0
  18. model-00016-of-00044.safetensors +3 -0
  19. model-00017-of-00044.safetensors +3 -0
  20. model-00018-of-00044.safetensors +3 -0
  21. model-00019-of-00044.safetensors +3 -0
  22. model-00020-of-00044.safetensors +3 -0
  23. model-00021-of-00044.safetensors +3 -0
  24. model-00022-of-00044.safetensors +3 -0
  25. model-00023-of-00044.safetensors +3 -0
  26. model-00024-of-00044.safetensors +3 -0
  27. model-00025-of-00044.safetensors +3 -0
  28. model-00026-of-00044.safetensors +3 -0
  29. model-00027-of-00044.safetensors +3 -0
  30. model-00028-of-00044.safetensors +3 -0
  31. model-00029-of-00044.safetensors +3 -0
  32. model-00030-of-00044.safetensors +3 -0
  33. model-00031-of-00044.safetensors +3 -0
  34. model-00032-of-00044.safetensors +3 -0
  35. model-00033-of-00044.safetensors +3 -0
  36. model-00034-of-00044.safetensors +3 -0
  37. model-00035-of-00044.safetensors +3 -0
  38. model-00036-of-00044.safetensors +3 -0
  39. model-00037-of-00044.safetensors +3 -0
  40. model-00038-of-00044.safetensors +3 -0
  41. model-00039-of-00044.safetensors +3 -0
  42. model-00040-of-00044.safetensors +3 -0
  43. model-00041-of-00044.safetensors +3 -0
  44. model-00042-of-00044.safetensors +3 -0
  45. model-00043-of-00044.safetensors +3 -0
  46. model-00044-of-00044.safetensors +3 -0
  47. model.safetensors.index.json +0 -0
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "unsloth/Meta-Llama-3.1-405B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -17,7 +17,6 @@
17
  "num_attention_heads": 128,
18
  "num_hidden_layers": 126,
19
  "num_key_value_heads": 8,
20
- "pad_token_id": 128004,
21
  "pretraining_tp": 1,
22
  "quantization_config": {
23
  "_load_in_4bit": true,
@@ -46,7 +45,6 @@
46
  "tie_word_embeddings": false,
47
  "torch_dtype": "bfloat16",
48
  "transformers_version": "4.44.2",
49
- "unsloth_version": "2024.9",
50
  "use_cache": true,
51
  "vocab_size": 128256
52
  }
 
1
  {
2
+ "_name_or_path": "meta-llama/Meta-Llama-3.1-405B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
17
  "num_attention_heads": 128,
18
  "num_hidden_layers": 126,
19
  "num_key_value_heads": 8,
 
20
  "pretraining_tp": 1,
21
  "quantization_config": {
22
  "_load_in_4bit": true,
 
45
  "tie_word_embeddings": false,
46
  "torch_dtype": "bfloat16",
47
  "transformers_version": "4.44.2",
 
48
  "use_cache": true,
49
  "vocab_size": 128256
50
  }
generation_config.json CHANGED
@@ -3,8 +3,6 @@
3
  "bos_token_id": 128000,
4
  "do_sample": true,
5
  "eos_token_id": 128001,
6
- "max_length": 131072,
7
- "pad_token_id": 128004,
8
  "temperature": 0.6,
9
  "top_p": 0.9,
10
  "transformers_version": "4.44.2"
 
3
  "bos_token_id": 128000,
4
  "do_sample": true,
5
  "eos_token_id": 128001,
 
 
6
  "temperature": 0.6,
7
  "top_p": 0.9,
8
  "transformers_version": "4.44.2"
model-00001-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94cb37dbb5f7c756f8fe94b9de244d2db18ea8f4f86ded646c1ba9868eadf9d1
3
+ size 4947019582
model-00002-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0223d0bb178a982153a7e905066d498dac06c175c991244c4ddcb41331d88ca8
3
+ size 4933502252
model-00003-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a312d1a09677592c87d0a983bed404fad9f85db0a5ee944a03ac94d586d0fc0d
3
+ size 4933502250
model-00004-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b77a4927f431105935169c509580c0702c0a61cc1454def926b9a6de9b7735d
3
+ size 4933502251
model-00005-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9175deab6aaa82721c67749c8e22ad281321686155764e4712836b5e8cd48124
3
+ size 4933502348
model-00006-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c305ef7ea3eb453d61a45ff37391d0dba389efb75afa1a6fe2e2c489f7c2b28
3
+ size 4933502387
model-00007-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51beb88c5811647c05e7a1fa957a918671b2c9f3c113f3f85c918f4cd861adf4
3
+ size 4933502390
model-00008-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd7b24bb3f0e623bdc799735389d9a89004aa45c2cee5cb4eafbbb9a3119cd3f
3
+ size 4933502390
model-00009-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23dab6f1c7ac6a4780944c27a96fb545acd9203487cd028b60e392a8eeb467f1
3
+ size 4933502388
model-00010-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d8a8368513b66ba7e495d598dc20a679b368ac5ac028eac32ba6ead4e7c73a7
3
+ size 4933502385
model-00011-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e86fbf3906a5a20f2f7d40b71f19d1dab1c211759d482530ae2f042ec890b328
3
+ size 4933502390
model-00012-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa0a2bb8724cd009caa0ab84fac493e8003b85cadaacf513e429345290319d2a
3
+ size 4933502382
model-00013-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17cc17377bb8f9a2ad19bf654a91957ba5d4056708af5b589325ef539f6c2ab2
3
+ size 4933502386
model-00014-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b77662d4d9f8c61c2e6e6e7973ca10bc35e559d837c2871a2279eb8cbbccb5c
3
+ size 4933502387
model-00015-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7780c50e2c4c00fe0150e7c6400fd8706775277e8ce4e803b0c9f70a0061afce
3
+ size 4933502387
model-00016-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af36a43efc2bd20c8a70cfe549b919dd8df5b1f508ab42d23a91d6876bc52eb
3
+ size 4933502382
model-00017-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a7b6a38befa67094a8705e730e8cc139db91265bb7f3f32628abb0e8261db62
3
+ size 4933502385
model-00018-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20e0d6efa2022afa1842236c41f25bb962cee5077dfc7b54553aff3187a168d0
3
+ size 4933502389
model-00019-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8b98346ec0651f050036faa57a8ff3065a5573d63bbba178b6ba87ec51b2fe1
3
+ size 4933502384
model-00020-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a90269648c0b4979ebb5a95dab776aeb473d6722c68ed93c3792cc33cedc86b1
3
+ size 4933502389
model-00021-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:191f3442eba5052cf01f45c54562aa397d38496deaf6124c20c1c57b432a31da
3
+ size 4933502388
model-00022-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7dd73d573f84091d31ef1afe6274feaaa91429f153fb38bd6a73d6f3ae2a83b
3
+ size 4933502388
model-00023-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7480ff2098ea16b76120cc8cfc22e663f346a96d0d723e4b59742e26cd3d3caa
3
+ size 4933502383
model-00024-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8b8a62005d62d37a94e29a4206f4e85978f6049faf83ccad649a5b758b4ce80
3
+ size 4933502385
model-00025-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b737efdfea1b699e30cdcaa5e68b164ab3798f4e70065dcb0a4e27618e54f97
3
+ size 4933502386
model-00026-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbf458e61393e8029417070d0056789bc85b43d2a25912962c8da9d0a23e7345
3
+ size 4933502388
model-00027-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ee14c28ecf23443765d8ba956948a9bbf2d34b9ef549749e1e193990d6c8e4a
3
+ size 4933502387
model-00028-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a2a4f3e05b31740768432ee73d5f423fbd020054f1c114dee96319ec06dc835
3
+ size 4933502387
model-00029-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1691cab0756e0c942159054eec547b37e39281470e5de052acfc0a9f55cc553a
3
+ size 4933502386
model-00030-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:398e090dabd847d59652f8e919a05e88fb1b6ee13ef627c0b882977f61c3c235
3
+ size 4933502391
model-00031-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5bbff0c977edcf2c3be2262a894e11a8e4383f44a60d19b3db13fe7f691f7a1
3
+ size 4933502389
model-00032-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86b900809f71220de786b24f98901b52e203a1bda3a879b78d198cff697c327a
3
+ size 4933502389
model-00033-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0de8e9fa44104372f2c1689a702546fbe8790f2d9578699e5f8b7664ce27eba
3
+ size 4933502388
model-00034-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20540e4bb34fe00cc0560e097425aa560f298e9a2de2545a52c9cd3e22ab457f
3
+ size 4933502390
model-00035-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6517c2c7e65a4e58410068dad6320d712c934046a2f2e6fe907973946bb4f550
3
+ size 4933502486
model-00036-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07554b7370f6dcf268abfb2e4bf2a9189021a455ab7480801d3b61cfe91377eb
3
+ size 4933502519
model-00037-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:187b68ea1ddc0b760fb338f66d4ab69e04bbbaa53b968859b8f630fadba7d28c
3
+ size 4933502515
model-00038-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96af7fc711f8e60f465813b7f9e36c3393523dd4ac05c3177a3ee17cb2a9eaba
3
+ size 4933502518
model-00039-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab221e030982ec9c605425af92d2129b478b58adf38b01456309bc7a163a01bf
3
+ size 4933502513
model-00040-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a30307fba3f4872e3347d8bc3b428d238e51cc8b67fe322c52b990e4995a93be
3
+ size 4933502517
model-00041-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7b1ad47f8d28bb0a5b95db27a878556f6aed167b4da791756789f2b50044a05
3
+ size 4933502512
model-00042-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f52725f959f2ce437cfc89aa993b5a573048f191fb804de20fc996c2371f8100
3
+ size 4933502514
model-00043-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:026b2bb50e06f859180872ef455b662a86bc890cbc01f66213008c3b18a1581d
3
+ size 4189208444
model-00044-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c19b417dcc7fd337f97811ce0cd49f33750240019dc873802e7e15b6ee63b428
3
+ size 4202692736
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff