morriszms committed on
Commit
1319e5f
·
verified ·
1 Parent(s): 908dcb6

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Mixtral_34Bx2_MoE_60B-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ Mixtral_34Bx2_MoE_60B-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ Mixtral_34Bx2_MoE_60B-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ Mixtral_34Bx2_MoE_60B-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ Mixtral_34Bx2_MoE_60B-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ Mixtral_34Bx2_MoE_60B-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ Mixtral_34Bx2_MoE_60B-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ Mixtral_34Bx2_MoE_60B-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ Mixtral_34Bx2_MoE_60B-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Mixtral_34Bx2_MoE_60B-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Mixtral_34Bx2_MoE_60B-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Mixtral_34Bx2_MoE_60B-Q8_0/Mixtral_34Bx2_MoE_60B-Q8_0-00001-of-00002.gguf filter=lfs diff=lfs merge=lfs -text
Mixtral_34Bx2_MoE_60B-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97b5ac32507cf5c7d74b84a86a042e4eff8f6c415556d368b9d7bad77a3f554a
3
+ size 22393660064
Mixtral_34Bx2_MoE_60B-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dac24e88e70afbdad1ccaadfc3408ee58cf4d7128f378f116c11e3ba7bc80a3
3
+ size 31767827104
Mixtral_34Bx2_MoE_60B-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e332c8766029847dc9fb2d84ba8f87fcd63427da2584f2f7a4330b2a8aacb7a
3
+ size 29237351072
Mixtral_34Bx2_MoE_60B-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35805c733a73b3c00ee0b3af8e024b40f4f56f4654efe720d8f3a85334da18ce
3
+ size 26317853344
Mixtral_34Bx2_MoE_60B-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd8464df56e5755c77af5a3e86f658bda7455bd13dfe635e8923383327008b74
3
+ size 34333541024
Mixtral_34Bx2_MoE_60B-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43ca2a54d0d030ed5bd26435ce6883f921fdec605b5c922c9aa0cdd7cc96c261
3
+ size 36661133984
Mixtral_34Bx2_MoE_60B-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec8a78e59fef8a0e1cddd0213c0af78cefe0fc922247140a3307064f5d3b5989
3
+ size 34594112160
Mixtral_34Bx2_MoE_60B-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6ffe1f6474b6a6bf8b528e51753aacc4b9e2aaad65f8fe900c0361beec15b44
3
+ size 41877717664
Mixtral_34Bx2_MoE_60B-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951763279c79a55f5d827947bbde8d50c2d400da3ece4579629a86a1d8daad22
3
+ size 43076780704
Mixtral_34Bx2_MoE_60B-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd517e549fe50a43cd1841f30fbba0b645bae8902350ef1ca5e05144c7524f77
3
+ size 41877717664
Mixtral_34Bx2_MoE_60B-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb0bbf2e0f447dcb5e2c63116e61696f3b77993f0a2f6f7aaba805f297578a17
3
+ size 49893405344
Mixtral_34Bx2_MoE_60B-Q8_0/Mixtral_34Bx2_MoE_60B-Q8_0-00001-of-00002.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a4b510e558cca99107106c89a14fd45c3cb5baa481a5b8aeb336c71073240e2
3
+ size 959213568
README.md ADDED
@@ -0,0 +1,173 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - yi
5
+ - moe
6
+ - TensorBlock
7
+ - GGUF
8
+ base_model: cloudyu/Mixtral_34Bx2_MoE_60B
9
+ model-index:
10
+ - name: Mixtral_34Bx2_MoE_60B
11
+ results:
12
+ - task:
13
+ type: text-generation
14
+ name: Text Generation
15
+ dataset:
16
+ name: IFEval (0-Shot)
17
+ type: HuggingFaceH4/ifeval
18
+ args:
19
+ num_few_shot: 0
20
+ metrics:
21
+ - type: inst_level_strict_acc and prompt_level_strict_acc
22
+ value: 45.38
23
+ name: strict accuracy
24
+ source:
25
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
26
+ name: Open LLM Leaderboard
27
+ - task:
28
+ type: text-generation
29
+ name: Text Generation
30
+ dataset:
31
+ name: BBH (3-Shot)
32
+ type: BBH
33
+ args:
34
+ num_few_shot: 3
35
+ metrics:
36
+ - type: acc_norm
37
+ value: 41.21
38
+ name: normalized accuracy
39
+ source:
40
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
41
+ name: Open LLM Leaderboard
42
+ - task:
43
+ type: text-generation
44
+ name: Text Generation
45
+ dataset:
46
+ name: MATH Lvl 5 (4-Shot)
47
+ type: hendrycks/competition_math
48
+ args:
49
+ num_few_shot: 4
50
+ metrics:
51
+ - type: exact_match
52
+ value: 6.57
53
+ name: exact match
54
+ source:
55
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
56
+ name: Open LLM Leaderboard
57
+ - task:
58
+ type: text-generation
59
+ name: Text Generation
60
+ dataset:
61
+ name: GPQA (0-shot)
62
+ type: Idavidrein/gpqa
63
+ args:
64
+ num_few_shot: 0
65
+ metrics:
66
+ - type: acc_norm
67
+ value: 11.74
68
+ name: acc_norm
69
+ source:
70
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
71
+ name: Open LLM Leaderboard
72
+ - task:
73
+ type: text-generation
74
+ name: Text Generation
75
+ dataset:
76
+ name: MuSR (0-shot)
77
+ type: TAUR-Lab/MuSR
78
+ args:
79
+ num_few_shot: 0
80
+ metrics:
81
+ - type: acc_norm
82
+ value: 17.78
83
+ name: acc_norm
84
+ source:
85
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
86
+ name: Open LLM Leaderboard
87
+ - task:
88
+ type: text-generation
89
+ name: Text Generation
90
+ dataset:
91
+ name: MMLU-PRO (5-shot)
92
+ type: TIGER-Lab/MMLU-Pro
93
+ config: main
94
+ split: test
95
+ args:
96
+ num_few_shot: 5
97
+ metrics:
98
+ - type: acc
99
+ value: 41.85
100
+ name: accuracy
101
+ source:
102
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
103
+ name: Open LLM Leaderboard
104
+ ---
105
+
106
+ <div style="width: auto; margin-left: auto; margin-right: auto">
107
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
108
+ </div>
109
+ <div style="display: flex; justify-content: space-between; width: 100%;">
110
+ <div style="display: flex; flex-direction: column; align-items: flex-start;">
111
+ <p style="margin-top: 0.5em; margin-bottom: 0em;">
112
+ Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
113
+ </p>
114
+ </div>
115
+ </div>
116
+
117
+ ## cloudyu/Mixtral_34Bx2_MoE_60B - GGUF
118
+
119
+ This repo contains GGUF format model files for [cloudyu/Mixtral_34Bx2_MoE_60B](https://huggingface.co/cloudyu/Mixtral_34Bx2_MoE_60B).
120
+
121
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4242](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
122
+
123
+ <div style="text-align: left; margin: 20px 0;">
124
+ <a href="https://tensorblock.co/waitlist/client" style="display: inline-block; padding: 10px 20px; background-color: #007bff; color: white; text-decoration: none; border-radius: 5px; font-weight: bold;">
125
+ Run them on the TensorBlock client using your local machine ↗
126
+ </a>
127
+ </div>
128
+
129
+ ## Prompt template
130
+
131
+ ```
132
+
133
+ ```
134
+
135
+ ## Model file specification
136
+
137
+ | Filename | Quant type | File Size | Description |
138
+ | -------- | ---------- | --------- | ----------- |
139
+ | [Mixtral_34Bx2_MoE_60B-Q2_K.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q2_K.gguf) | Q2_K | 22.394 GB | smallest, significant quality loss - not recommended for most purposes |
140
+ | [Mixtral_34Bx2_MoE_60B-Q3_K_S.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q3_K_S.gguf) | Q3_K_S | 26.318 GB | very small, high quality loss |
141
+ | [Mixtral_34Bx2_MoE_60B-Q3_K_M.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q3_K_M.gguf) | Q3_K_M | 29.237 GB | very small, high quality loss |
142
+ | [Mixtral_34Bx2_MoE_60B-Q3_K_L.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q3_K_L.gguf) | Q3_K_L | 31.768 GB | small, substantial quality loss |
143
+ | [Mixtral_34Bx2_MoE_60B-Q4_0.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q4_0.gguf) | Q4_0 | 34.334 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
144
+ | [Mixtral_34Bx2_MoE_60B-Q4_K_S.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q4_K_S.gguf) | Q4_K_S | 34.594 GB | small, greater quality loss |
145
+ | [Mixtral_34Bx2_MoE_60B-Q4_K_M.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q4_K_M.gguf) | Q4_K_M | 36.661 GB | medium, balanced quality - recommended |
146
+ | [Mixtral_34Bx2_MoE_60B-Q5_0.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q5_0.gguf) | Q5_0 | 41.878 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
147
+ | [Mixtral_34Bx2_MoE_60B-Q5_K_S.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q5_K_S.gguf) | Q5_K_S | 41.878 GB | large, low quality loss - recommended |
148
+ | [Mixtral_34Bx2_MoE_60B-Q5_K_M.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q5_K_M.gguf) | Q5_K_M | 43.077 GB | large, very low quality loss - recommended |
149
+ | [Mixtral_34Bx2_MoE_60B-Q6_K.gguf](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q6_K.gguf) | Q6_K | 49.893 GB | very large, extremely low quality loss |
150
+ | [Mixtral_34Bx2_MoE_60B-Q8_0](https://huggingface.co/tensorblock/Mixtral_34Bx2_MoE_60B-GGUF/blob/main/Mixtral_34Bx2_MoE_60B-Q8_0) | Q8_0 | 0.959 GB | very large, extremely low quality loss - not recommended |
151
+
152
+
153
+ ## Download instructions
154
+
155
+ ### Command line
156
+
157
+ First, install the Hugging Face CLI client:
158
+
159
+ ```shell
160
+ pip install -U "huggingface_hub[cli]"
161
+ ```
162
+
163
+ Then, download an individual model file to a local directory:
164
+
165
+ ```shell
166
+ huggingface-cli download tensorblock/Mixtral_34Bx2_MoE_60B-GGUF --include "Mixtral_34Bx2_MoE_60B-Q2_K.gguf" --local-dir MY_LOCAL_DIR
167
+ ```
168
+
169
+ If you want to download multiple model files matching a pattern (e.g., `*Q4_K*gguf`), you can try:
170
+
171
+ ```shell
172
+ huggingface-cli download tensorblock/Mixtral_34Bx2_MoE_60B-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
173
+ ```