Upload with huggingface_hub
Browse files- .gitattributes +4 -0
- README.md +34 -0
- ggml-model-q4_0.bin.4 +3 -0
- ggml-model-q4_0.bin.5 +3 -0
- ggml-model-q4_0.bin.6 +3 -0
- ggml-model-q4_0.bin.7 +3 -0
.gitattributes
CHANGED
@@ -35,3 +35,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
35 |
ggml-model-q4_0.bin.1 filter=lfs diff=lfs merge=lfs -text
|
36 |
ggml-model-q4_0.bin.2 filter=lfs diff=lfs merge=lfs -text
|
37 |
ggml-model-q4_0.bin.3 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
35 |
ggml-model-q4_0.bin.1 filter=lfs diff=lfs merge=lfs -text
|
36 |
ggml-model-q4_0.bin.2 filter=lfs diff=lfs merge=lfs -text
|
37 |
ggml-model-q4_0.bin.3 filter=lfs diff=lfs merge=lfs -text
|
38 |
+
ggml-model-q4_0.bin.4 filter=lfs diff=lfs merge=lfs -text
|
39 |
+
ggml-model-q4_0.bin.5 filter=lfs diff=lfs merge=lfs -text
|
40 |
+
ggml-model-q4_0.bin.6 filter=lfs diff=lfs merge=lfs -text
|
41 |
+
ggml-model-q4_0.bin.7 filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
### alpaca.cpp 65B ggml model weights
|
3 |
+
### How the 65B ggml model was made
|
4 |
+
#### 1. clone 65B model data
|
5 |
+
```shell
|
6 |
+
git clone https://huggingface.co/datasets/nyanko7/LLaMA-65B/
|
7 |
+
```
|
8 |
+
#### 2. clone alpaca.cpp
|
9 |
+
```shell
|
10 |
+
git clone https://github.com/antimatter15/alpaca.cpp
|
11 |
+
```
|
12 |
+
#### 3. Quantize the weights with quantize.sh
|
13 |
+
```shell
|
14 |
+
|
15 |
+
mv LLaMA-65B/tokenizer.model ./
|
16 |
+
python convert-pth-to-ggml.py ../LLaMA-65B/ 1
|
17 |
+
|
18 |
+
cd alpaca.cpp
|
19 |
+
mkdir -p models/65B
|
20 |
+
mv ../LLaMA-65B/ggml-model-f16.bin models/65B/
|
21 |
+
mv ../LLaMA-65B/ggml-model-f16.bin.* models/65B/
|
22 |
+
bash quantize.sh 65B
|
23 |
+
```
|
24 |
+
|
25 |
+
#### 4. upload weight file
|
26 |
+
##### Uploading directly is slow — it was going to take almost 2 days, so I decided to work around the direct upload
|
27 |
+
##### I used https://tmp.link/ as a temporary store
|
28 |
+
##### I used Colab and the Hugging Face Hub API to upload
|
29 |
+
|
30 |
+
### run
|
31 |
+
```shell
|
32 |
+
git clone https://github.com/antimatter15/alpaca.cpp
|
33 |
+
./chat -m alpaca.cpp_65b_ggml/ggml-model-q4_0.bin
|
34 |
+
```
|
ggml-model-q4_0.bin.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ee474051e418c5732b7949190b084d9d679db447f83c1de0d2a82daaa1a0cfa
|
3 |
+
size 5105954665
|
ggml-model-q4_0.bin.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a45aa05e7212bd6782790722d68056c5419667ea6b564ccc94bbcb8111d79b8b
|
3 |
+
size 5105954665
|
ggml-model-q4_0.bin.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a58fda714b759c28ad5e4c1d8bf8fda7b158fd5e4c4a49f851f36342fa97a105
|
3 |
+
size 5105954665
|
ggml-model-q4_0.bin.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3540cfcbcda33c223c6b0d606034adbd78f17e0e5de1582b78795e78754f7a8
|
3 |
+
size 5105954665
|