morgul committed on
Commit
b25c209
1 Parent(s): 754677a

Upload folder using huggingface_hub (#1)

Browse files

- 1e81aac96809fa3ae0b242eb4211834272edac3f8e487efbc27db83b676248c8 (242fbfb42052b2a22f833a6abf78c1f78932f8a8)
- 5f693e1910e1fa136dec861716114982980eb654f85b4f386c4b6b68f502689f (90728aafc633ab7e9826b5ee4743cc15e8088dad)
- 42da350d0490ab704b3aa1963056d749dbaa74669b1cecf747230db69921664a (767d775da859c7ed9b67ae69668e067f90398cde)
- 903b0cc41485d5869dbd0ea14e650f6afee60169536830e229817aecc853323b (66fa9eea48e52062126f93ff888e5b4e0011ab8b)
- 1a7ece2d7bb78c01dfb50bf79f2e6a0cdcaa9cd2d35f314ef13800e629ac9f5d (a880e043f6f1be15aafa61b4114c2bf7ae55ef64)
- fa41d386caf5674c49dfe8742eb357d7fc056e0269e12f11caca431ecd0047ba (24d33144d96f0e60d5b41d2273a9457010c4e8f8)
- 8e89416a187ccf38e5eb950d13ca75f59ab0c173ac466cab95c31543f0e8015b (6b4becf0ec8b7ac0de6e87bf5a7dc7049a3fc3bb)
- 8588da70081b7350b4bd36fb4d1a86279420ecfad7b77a3eec27f9ef5e145710 (a9d9d95425685fe1f08b4a119d40594da2f92125)
- 85938d6657bf1c5b600df05535d5eba437151736855a1c6383b00712435d785e (f7997b11eea0e9d70dccfc1d4689b61d470e0d5f)
- 3dc10c1f91bdc50bb25d25f4fc00293d33154ed9bbb0802dcb4554b2586c4c69 (37900f09b7920adf82d9ca93abaeffa802b7b28b)
- 8c0f5e711433311b91e9a347f60f706c9114a2d7db596b5b2f5b8568ff0d65ea (0e6a9e6d290eefbad1d2d8aa0593c7ed2e24fb30)
- f6a7decc21833aa5d1689794107925afb032549ac7731eea093142fb9f989411 (9c79fa6021238e7461820cc20ae818b2443bb8aa)
- a3b2cb53b1e59f22a6141ea3822b0d07d6ab47e250391cc6e1617cbf0a50bcec (5908706a7de6b0448e1e83dc64cde8fc656ddf47)
- ddc1af1312e74bf27fa22245433441416c5d0e6fca041cbadbb63e00432dce68 (125945f4888e27dbee01cdacfd694b45fba5f4e3)
- 69ab2117d76ffd98ac524c54d61877dcdf0490c8d83d0d40f49b5547143c4139 (70b1744aab80bcb752532ed29a8e7927d2c3a462)
- 7e201964abd59fdb5912bb4a04f36867b2e6a45cbde4d04fc3ed22daee88359c (8fb171111f04308ad7d86e43fdc6ddad8bef1de9)
- f9534233eb68869db461d5115d3ab050261dd39a23cb0adc819fb8d0dec180d1 (1f6dbb73655d1c26daca113516f84381c41a0e16)
- ab9a3210ec8b289ef867f1f88c5cf520a8d73be11d3901fb967479efe68d51f7 (437f7f0cfca64a0286919ac6b9f6eaedef5e78d5)
- d537a08f5012a9381893b5c14c81575c883d3decfd52b5f11f3f6cd48d21e9fa (aaddacd67576fd2d6a157f18537f56486fd85869)
- de8291dfb236027cd6270fce493a9644d1cf1f39a7b566295cd0aa3c732747c0 (e355d40a03d4531babfe9fa3ce31e0ba29e00b6f)
- cb1b1893a28b935d41aec00d6be2147b71ef8220f8527238268da86e7293f428 (cda8c4e4add1bac1aa345df7d7e07b763ddc4fa7)
- babd5a9375327e0006a5b8f83dc815684fbaaa320a5fc6daee90cabe330bab6a (cde068980befde4b3c0150f7645fbbba220a4440)
- 16378b2fb4e5d0259947efb0a17209e5ba298b83c9641ed296357d5f1ecce09a (78355667469384d488dc09556d34f948ac7beb34)
- ab58b10ddb459fcfcf00b2c1f11948ce8bc9f0cd0636173dd2a404161de76af0 (ce2d1283acde40da58c296c67acab4dce53c9a3f)
- 5d6c78deb881d1cea073baf85297f9d84433316b5ba17a8266e7dbc07fd999a3 (34541ca8bcf34d270fbe545e8272df87c30c16b1)
- 086668beb549a1fbc8f042dec818bdda778e535210e803c8bab54899b2e0f170 (bb9f096f85f11febadc612caa666f65502a84ae9)
- c11da3afd1a29656370279cfcc6fa6d87d73f17ad7f05d8dae6f9be48ed08e75 (60f35ba2524badd174bc2e8b83e43c76e8feadc4)
- 40c4c547a199cd13b4f88586b6159f48c874c505d41dbec2925329e1678b8382 (329e481d9d17e1b8ded1e100ddf7f29e8bc99d04)
- 43dd48783069ac9579fff185a58bec16f6b1ddd56176e79dbe7e22669e1a0b07 (1c9bb9d314b0e9b19f2bc8fbec9eebc85a1ee286)

README.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: rAIfle/SorcererLM-8x22b-bf16
3
+ license: apache-2.0
4
+ tags:
5
+ - mlx
6
+ ---
7
+
8
+ # mlx-community/SorcererLM-8x22b-bf16
9
+
10
+ The model [mlx-community/SorcererLM-8x22b-bf16](https://huggingface.co/mlx-community/SorcererLM-8x22b-bf16) was converted to MLX format from [rAIfle/SorcererLM-8x22b-bf16](https://huggingface.co/rAIfle/SorcererLM-8x22b-bf16) using mlx-lm version **0.19.0**.
11
+
12
+ ## Use with mlx
13
+
14
+ ```bash
15
+ pip install mlx-lm
16
+ ```
17
+
18
+ ```python
19
+ from mlx_lm import load, generate
20
+
21
+ model, tokenizer = load("mlx-community/SorcererLM-8x22b-bf16")
22
+
23
+ prompt = "hello"
24
+
25
+ if hasattr(tokenizer, "apply_chat_template") and tokenizer.chat_template is not None:
26
+     messages = [{"role": "user", "content": prompt}]
27
+     prompt = tokenizer.apply_chat_template(
28
+         messages, tokenize=False, add_generation_prompt=True
29
+     )
30
+
31
+ response = generate(model, tokenizer, prompt=prompt, verbose=True)
32
+ ```
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MixtralForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 1,
7
+ "eos_token_id": 2,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 6144,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 16384,
12
+ "max_position_embeddings": 65536,
13
+ "model_type": "mixtral",
14
+ "num_attention_heads": 48,
15
+ "num_experts_per_tok": 2,
16
+ "num_hidden_layers": 56,
17
+ "num_key_value_heads": 8,
18
+ "num_local_experts": 8,
19
+ "output_router_logits": false,
20
+ "quantization": {
21
+ "group_size": 64,
22
+ "bits": 8
23
+ },
24
+ "quantization_config": {
25
+ "group_size": 64,
26
+ "bits": 8
27
+ },
28
+ "rms_norm_eps": 1e-05,
29
+ "rope_theta": 1000000,
30
+ "router_aux_loss_coef": 0.001,
31
+ "router_jitter_noise": 0.0,
32
+ "sliding_window": null,
33
+ "tie_word_embeddings": false,
34
+ "torch_dtype": "bfloat16",
35
+ "transformers_version": "4.45.0.dev0",
36
+ "use_cache": false,
37
+ "vocab_size": 32000
38
+ }
model-00001-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ba964d1309abec4d4eac78c90573e032071cd59eb310e6a0c1665a69ec7300f
3
+ size 4674392006
model-00002-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61b821cb2d6b2bdac663530e4b091cb378d707e07c946274a899d18a3e6a42c9
3
+ size 5321158926
model-00003-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5c6d48a28980ac0dc6bd063464b3ad5a2ce38600d3b18b0e87aaca517bd9f30
3
+ size 5321158930
model-00004-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74873815902f131ed3a60d4e57511bab64ce750e9d83d9e23e9e1e10fed4c378
3
+ size 5321158888
model-00005-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b8f6e80caf4a0137a6601e51451a2ebe8ae7635450a3dd3fee6dde08bfc1c79
3
+ size 5321158932
model-00006-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8549a2e46c763a101d0482a0b66fad319f78051bb726058fef103d727a37ea1
3
+ size 5321158935
model-00007-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08fe1248263b59ea7ecb6c6966f416ec4c769d8f41c326ccf7a2224a82a1596e
3
+ size 5321158948
model-00008-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a1f30bb22d90f774a6514928de1b5eba75f6231572a56706aa7c504d7da4943
3
+ size 5321158982
model-00009-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:469fb655dc07e8114c5b209ff20a160c905424deb08db2431f3b80bc2eb04aca
3
+ size 5321158942
model-00010-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d9c2636eb31b1b567b725d113c04c626588e4bd2f7185ccc08a414fcc244f5b
3
+ size 5321158978
model-00011-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0c43521cb3e9334e399e9dbaedcbcfe061303dc7aebbfa87a7fb3beda5b4eae
3
+ size 5321158952
model-00012-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:561512c39f72681308e4106d440fa70aeac26d7384bf4b57f2747416fc930248
3
+ size 5321158940
model-00013-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0e547bf5215d0fcf96fd9f5104218fb8fbc0ad862313661c62cabe93a26903d
3
+ size 5321158950
model-00014-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b2cf82d40a02510f03eb6a0304e0711ed7bab7b88b96496b370d18f2c49192a
3
+ size 5321158974
model-00015-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec0a3fb81c84ab2f73853d29f98d640950068510d5167e0e867c05144a009ff4
3
+ size 5321158958
model-00016-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22f67a8f5ff20ae62d645f590a588f8bde007915cf5810ebc9e88ca56b61065b
3
+ size 5321158948
model-00017-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2737db403795501f4e4657000e2e26ba02b8011892499ce66c72c7de4c7956b8
3
+ size 5321158972
model-00018-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d10d08556cefb5959a20afac8c3fe5789e18f239e20367f5b43e4cfe0770758a
3
+ size 5321158976
model-00019-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08c1a157a7574b1216dfd62dd4e7a208a19d7db3e83240fc9f746904eaf44b23
3
+ size 5321158970
model-00020-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e136c221ddba2c182c9f985616b2e56b9b28441f462c980775f4f07decdf5775
3
+ size 5321158978
model-00021-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4f870e0fedf04d94bac758d840e37c77fd029a44c52a7b904d0fa8b5c2e71bd
3
+ size 5321158928
model-00022-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a648d442b367235686614170b440dfedaabe3e43e0107ddd455815a79b495bd3
3
+ size 5321158974
model-00023-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:436630120002bb54769830f64ba5fdbac7c47071dbd05351cad7762746c95e05
3
+ size 5321158948
model-00024-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53bb51ac6943fd7735d76fb4e23b91b6bbcc84704bfd3c2fa147911533b1f648
3
+ size 5321158952
model-00025-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:291cbf0dc1c3a85d44ab8b90d8e26bcec70ee65cb5cfc201f65372e390930f4f
3
+ size 5321158978
model-00026-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44e5b7aa45e268076baa7201142e76b5ababeec017772dc2d77251e94177530e
3
+ size 5321158982
model-00027-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ca89e48215ed3588187f0e4d0289a36f02ab7b13fe029414a885e60d17f0cbf
3
+ size 5321158952
model-00028-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cc73380988da9f65303688f83920d08f312c0d6940bba46301421a98b373513
3
+ size 5321158976
model-00029-of-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78a1f82d2a2beb60e17958f9c12dd4c6182740ec183558f71fef3d575de4e7d4
3
+ size 1064571904
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<unk>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
tokenizer_config.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_prefix_space": true,
5
+ "added_tokens_decoder": {
6
+ "0": {
7
+ "content": "<unk>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false,
12
+ "special": true
13
+ },
14
+ "1": {
15
+ "content": "<s>",
16
+ "lstrip": false,
17
+ "normalized": false,
18
+ "rstrip": false,
19
+ "single_word": false,
20
+ "special": true
21
+ },
22
+ "2": {
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": false,
26
+ "rstrip": false,
27
+ "single_word": false,
28
+ "special": true
29
+ }
30
+ },
31
+ "additional_special_tokens": [],
32
+ "bos_token": "<s>",
33
+ "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{{ messages[0]['content'].strip() }}{% else %}{% set loop_messages = messages %}{{ 'A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user\\'s questions.' }}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{% if message['role'] == 'system' or message['role'] == 'user' %}{{ ' USER: ' + message['content'].strip() }}{% else %}{{ ' ASSISTANT: ' + message['content'].strip() + eos_token }}{% endif %}{% else %}{% if message['role'] == 'system' or message['role'] == 'user' %}{{ '\nUSER: ' + message['content'].strip() }}{% else %}{{ ' ASSISTANT: ' + message['content'].strip() + eos_token }}{% endif %}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ ' ASSISTANT:' }}{% endif %}",
34
+ "clean_up_tokenization_spaces": false,
35
+ "eos_token": "</s>",
36
+ "legacy": true,
37
+ "model_max_length": 1000000000000000019884624838656,
38
+ "pad_token": "<unk>",
39
+ "padding_side": "right",
40
+ "sp_model_kwargs": {},
41
+ "spaces_between_special_tokens": false,
42
+ "tokenizer_class": "LlamaTokenizer",
43
+ "unk_token": "<unk>",
44
+ "use_default_system_prompt": true
45
+ }