dengcao committed on
Commit
0159070
·
verified ·
1 Parent(s): 4c87098

Upload 7 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ ERNIE-4.5-0.3B-PT-F16.gguf filter=lfs diff=lfs merge=lfs -text
37
+ ernie-4.5-0.3b-pt-q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text
38
+ ernie-4.5-0.3b-pt-q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text
39
+ ERNIE-4.5-0.3B-PT-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
40
+ ernie-4.5-0.3b-pt-q8_0.gguf filter=lfs diff=lfs merge=lfs -text
ERNIE-4.5-0.3B-PT-F16.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aee25587d9f4843661bf61eb064cd67b7915a73c1317fb833952de9754eada01
3
+ size 723954720
ERNIE-4.5-0.3B-PT-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6bdd700c4b088c07d600d6c1e4cb6fb9d1a63698b7d1546e24c2a93aac5ed7b
3
+ size 268662240
README.md CHANGED
@@ -1,3 +1,57 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ language:
4
+ - en
5
+ - zh
6
+ pipeline_tag: text-generation
7
+ tags:
8
+ - ERNIE4.5
9
+ - llama-cpp
10
+ - gguf-my-repo
11
+ library_name: transformers
12
+ base_model: baidu/ERNIE-4.5-0.3B-PT
13
+ ---
14
+
15
+ # dengcao/ERNIE-4.5-0.3B-PT-GGUF
16
+ This model was converted to GGUF format from [`baidu/ERNIE-4.5-0.3B-PT`](https://huggingface.co/baidu/ERNIE-4.5-0.3B-PT) using llama.cpp via ggml.ai's [GGUF-my-repo](https://huggingface.co/spaces/ggml-org/gguf-my-repo) space.
17
+ Refer to the [original model card](https://huggingface.co/baidu/ERNIE-4.5-0.3B-PT) for more details on the model.
18
+
19
+ ## Use with llama.cpp
20
+ Install llama.cpp through Homebrew (works on macOS and Linux):
21
+
22
+ ```bash
23
+ brew install llama.cpp
24
+
25
+ ```
26
+ Invoke the llama.cpp server or the CLI.
27
+
28
+ ### CLI:
29
+ ```bash
30
+ llama-cli --hf-repo dengcao/ERNIE-4.5-0.3B-PT-GGUF --hf-file ernie-4.5-0.3b-pt-q4_k_m.gguf -p "The meaning to life and the universe is"
31
+ ```
32
+
33
+ ### Server:
34
+ ```bash
35
+ llama-server --hf-repo dengcao/ERNIE-4.5-0.3B-PT-GGUF --hf-file ernie-4.5-0.3b-pt-q4_k_m.gguf -c 2048
36
+ ```
37
+
38
+ Note: You can also use this checkpoint directly through the [usage steps](https://github.com/ggerganov/llama.cpp?tab=readme-ov-file#usage) listed in the llama.cpp repo.
39
+
40
+ Step 1: Clone llama.cpp from GitHub.
41
+ ```
42
+ git clone https://github.com/ggerganov/llama.cpp
43
+ ```
44
+
45
+ Step 2: Move into the llama.cpp folder and build it with the `LLAMA_CURL=1` flag, along with any other hardware-specific flags (e.g., `LLAMA_CUDA=1` for Nvidia GPUs on Linux).
46
+ ```
47
+ cd llama.cpp && LLAMA_CURL=1 make
48
+ ```
49
+
50
+ Step 3: Run inference through the main binary.
51
+ ```
52
+ ./llama-cli --hf-repo dengcao/ERNIE-4.5-0.3B-PT-GGUF --hf-file ernie-4.5-0.3b-pt-q4_k_m.gguf -p "The meaning to life and the universe is"
53
+ ```
54
+ or
55
+ ```
56
+ ./llama-server --hf-repo dengcao/ERNIE-4.5-0.3B-PT-GGUF --hf-file ernie-4.5-0.3b-pt-q4_k_m.gguf -c 2048
57
+ ```
ernie-4.5-0.3b-pt-q3_k_m.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a65e10d5e6c215cd13121ea7d9c096d5f4850f7b19c3997466bf1744279465d9
3
+ size 212515872
ernie-4.5-0.3b-pt-q4_k_m.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c29ced3fdde116b9b626345a156c2638402090bd267af8c8f9b6d38888997557
3
+ size 240645152
ernie-4.5-0.3b-pt-q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d492d453e980e6b30b7a3dfb6062a8cafdd90cf583a411135f6f298f2fe5623
3
+ size 385788960
gitattributes ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.gguf filter=lfs diff=lfs merge=lfs -text