morriszms committed on
Commit
20dba86
·
verified ·
1 Parent(s): ae4d912

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ megatron_v1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ megatron_v1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ megatron_v1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ megatron_v1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ megatron_v1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ megatron_v1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ megatron_v1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ megatron_v1-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ megatron_v1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ megatron_v1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ megatron_v1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ megatron_v1-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,181 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - moe
5
+ - merge
6
+ - TensorBlock
7
+ - GGUF
8
+ base_model: Eurdem/megatron_v1
9
+ model-index:
10
+ - name: megatron_v1
11
+ results:
12
+ - task:
13
+ type: text-generation
14
+ name: Text Generation
15
+ dataset:
16
+ name: AI2 Reasoning Challenge (25-Shot)
17
+ type: ai2_arc
18
+ config: ARC-Challenge
19
+ split: test
20
+ args:
21
+ num_few_shot: 25
22
+ metrics:
23
+ - type: acc_norm
24
+ value: 65.96
25
+ name: normalized accuracy
26
+ source:
27
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Eurdem/megatron_v1
28
+ name: Open LLM Leaderboard
29
+ - task:
30
+ type: text-generation
31
+ name: Text Generation
32
+ dataset:
33
+ name: HellaSwag (10-Shot)
34
+ type: hellaswag
35
+ split: validation
36
+ args:
37
+ num_few_shot: 10
38
+ metrics:
39
+ - type: acc_norm
40
+ value: 84.8
41
+ name: normalized accuracy
42
+ source:
43
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Eurdem/megatron_v1
44
+ name: Open LLM Leaderboard
45
+ - task:
46
+ type: text-generation
47
+ name: Text Generation
48
+ dataset:
49
+ name: MMLU (5-Shot)
50
+ type: cais/mmlu
51
+ config: all
52
+ split: test
53
+ args:
54
+ num_few_shot: 5
55
+ metrics:
56
+ - type: acc
57
+ value: 65.02
58
+ name: accuracy
59
+ source:
60
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Eurdem/megatron_v1
61
+ name: Open LLM Leaderboard
62
+ - task:
63
+ type: text-generation
64
+ name: Text Generation
65
+ dataset:
66
+ name: TruthfulQA (0-shot)
67
+ type: truthful_qa
68
+ config: multiple_choice
69
+ split: validation
70
+ args:
71
+ num_few_shot: 0
72
+ metrics:
73
+ - type: mc2
74
+ value: 60.32
75
+ source:
76
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Eurdem/megatron_v1
77
+ name: Open LLM Leaderboard
78
+ - task:
79
+ type: text-generation
80
+ name: Text Generation
81
+ dataset:
82
+ name: Winogrande (5-shot)
83
+ type: winogrande
84
+ config: winogrande_xl
85
+ split: validation
86
+ args:
87
+ num_few_shot: 5
88
+ metrics:
89
+ - type: acc
90
+ value: 79.79
91
+ name: accuracy
92
+ source:
93
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Eurdem/megatron_v1
94
+ name: Open LLM Leaderboard
95
+ - task:
96
+ type: text-generation
97
+ name: Text Generation
98
+ dataset:
99
+ name: GSM8k (5-shot)
100
+ type: gsm8k
101
+ config: main
102
+ split: test
103
+ args:
104
+ num_few_shot: 5
105
+ metrics:
106
+ - type: acc
107
+ value: 57.01
108
+ name: accuracy
109
+ source:
110
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Eurdem/megatron_v1
111
+ name: Open LLM Leaderboard
112
+ ---
113
+
114
+ <div style="width: auto; margin-left: auto; margin-right: auto">
115
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
116
+ </div>
117
+ <div style="display: flex; justify-content: space-between; width: 100%;">
118
+ <div style="display: flex; flex-direction: column; align-items: flex-start;">
119
+ <p style="margin-top: 0.5em; margin-bottom: 0em;">
120
+ Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
121
+ </p>
122
+ </div>
123
+ </div>
124
+
125
+ ## Eurdem/megatron_v1 - GGUF
126
+
127
+ This repo contains GGUF format model files for [Eurdem/megatron_v1](https://huggingface.co/Eurdem/megatron_v1).
128
+
129
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4242](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
130
+
131
+ <div style="text-align: left; margin: 20px 0;">
132
+ <a href="https://tensorblock.co/waitlist/client" style="display: inline-block; padding: 10px 20px; background-color: #007bff; color: white; text-decoration: none; border-radius: 5px; font-weight: bold;">
133
+ Run them on the TensorBlock client using your local machine ↗
134
+ </a>
135
+ </div>
136
+
137
+ ## Prompt template
138
+
139
+ ```
140
+ <s>GPT4 Correct System: {system_prompt}<|end_of_turn|>GPT4 Correct User: {prompt}<|end_of_turn|>GPT4 Correct Assistant:
141
+ ```
142
+
143
+ ## Model file specification
144
+
145
+ | Filename | Quant type | File Size | Description |
146
+ | -------- | ---------- | --------- | ----------- |
147
+ | [megatron_v1-Q2_K.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q2_K.gguf) | Q2_K | 4.761 GB | smallest, significant quality loss - not recommended for most purposes |
148
+ | [megatron_v1-Q3_K_S.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q3_K_S.gguf) | Q3_K_S | 5.588 GB | very small, high quality loss |
149
+ | [megatron_v1-Q3_K_M.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q3_K_M.gguf) | Q3_K_M | 6.207 GB | very small, high quality loss |
150
+ | [megatron_v1-Q3_K_L.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q3_K_L.gguf) | Q3_K_L | 6.730 GB | small, substantial quality loss |
151
+ | [megatron_v1-Q4_0.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q4_0.gguf) | Q4_0 | 7.281 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
152
+ | [megatron_v1-Q4_K_S.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q4_K_S.gguf) | Q4_K_S | 7.342 GB | small, greater quality loss |
153
+ | [megatron_v1-Q4_K_M.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q4_K_M.gguf) | Q4_K_M | 7.783 GB | medium, balanced quality - recommended |
154
+ | [megatron_v1-Q5_0.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q5_0.gguf) | Q5_0 | 8.874 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
155
+ | [megatron_v1-Q5_K_S.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q5_K_S.gguf) | Q5_K_S | 8.874 GB | large, low quality loss - recommended |
156
+ | [megatron_v1-Q5_K_M.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q5_K_M.gguf) | Q5_K_M | 9.133 GB | large, very low quality loss - recommended |
157
+ | [megatron_v1-Q6_K.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q6_K.gguf) | Q6_K | 10.567 GB | very large, extremely low quality loss |
158
+ | [megatron_v1-Q8_0.gguf](https://huggingface.co/tensorblock/megatron_v1-GGUF/blob/main/megatron_v1-Q8_0.gguf) | Q8_0 | 13.686 GB | very large, extremely low quality loss - not recommended |
159
+
160
+
161
+ ## Download instructions
162
+
163
+ ### Command line
164
+
165
+ First, install the Hugging Face Hub command-line client:
166
+
167
+ ```shell
168
+ pip install -U "huggingface_hub[cli]"
169
+ ```
170
+
171
+ Then, download an individual model file to a local directory:
172
+
173
+ ```shell
174
+ huggingface-cli download tensorblock/megatron_v1-GGUF --include "megatron_v1-Q2_K.gguf" --local-dir MY_LOCAL_DIR
175
+ ```
176
+
177
+ If you want to download multiple model files matching a pattern (e.g., `*Q4_K*gguf`), you can try:
178
+
179
+ ```shell
180
+ huggingface-cli download tensorblock/megatron_v1-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
181
+ ```
megatron_v1-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4524197646f8ffd6c89ffed00067530df82039059b5bbfdf6630d19d33a0233d
3
+ size 4760833024
megatron_v1-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79c169a7184301362b74de7c4a18f267ba1c47d86a4e10509db361089271d728
3
+ size 6729740096
megatron_v1-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5082cb08d4feca19c49c3a544ad62a11a24b36668db7419fdb63e927550a91b2
3
+ size 6206500672
megatron_v1-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8611463ad97818755f01aee2fa75b15085974cb9df770303e78b56d429039d3c
3
+ size 5587840832
megatron_v1-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a999ac7ab3480820399ce3b220be63fbb85304e329ec018666e777833e2e495
3
+ size 7280874368
megatron_v1-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c1c285752bcbf220218ca11db90a42c5217c8c116a7e6ed84882b2f0f05c153
3
+ size 7782617984
megatron_v1-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c34552cc296bd5b203f4ef5ba8abb4b7710bc3c399e1535b5619da835eb0e92f
3
+ size 7341691776
megatron_v1-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:966900eec8ff1752b453276089a4766d09b01f98154deee23ca7eb136bb3c439
3
+ size 8874317696
megatron_v1-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5be817bc6ac3ee053984b912833e6c794177d6db9c0b7ba9ac23512c586eada
3
+ size 9132791680
megatron_v1-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88431d4c4ea3bb27905a4874700660d2d13dce5647ec2f3a169f0881c2cfbfd7
3
+ size 8874317696
megatron_v1-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79bb0b93da8e4af2b407b338fddb023386d12375cbdec06b3a56a7366bf20b73
3
+ size 10567351232
megatron_v1-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b428b5df572897821ce53335855a4aa836165b494c1e93ce9aa7bc296a2eb46e
3
+ size 13686393664