teknium committed on
Commit
cf716d4
·
verified ·
1 Parent(s): c8c7341

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ DeepHermes-3-Llama-3-3B-Preview-q4.gguf filter=lfs diff=lfs merge=lfs -text
37
+ DeepHermes-3-Llama-3-3B-Preview-q5.gguf filter=lfs diff=lfs merge=lfs -text
38
+ DeepHermes-3-Llama-3-3B-Preview-q6.gguf filter=lfs diff=lfs merge=lfs -text
39
+ DeepHermes-3-Llama-3-3B-Preview-q8.gguf filter=lfs diff=lfs merge=lfs -text
DeepHermes-3-Llama-3-3B-Preview-q4.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cff70f3a76a72a668e9584afafe06610b259820e724a45aebee087a2dfd2d2d1
3
+ size 1917192608
DeepHermes-3-Llama-3-3B-Preview-q5.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0fe60ce94a8243e6d79ad82ba8ac23016937eb459664cf98a967872bbc04c71
3
+ size 2269514144
DeepHermes-3-Llama-3-3B-Preview-q6.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce615b26be4f1321e7557f86da3c90f4393a46c4ae1988c8936d0c80e04f42b4
3
+ size 2643855776
DeepHermes-3-Llama-3-3B-Preview-q8.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88eb0d7bcd002b48225f45fc3c0a18c11201985e9b5ce685eb791cd19149c012
3
+ size 3421901216
README.md ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # GGUF Quantized Models
2
+
3
+ This repository contains GGUF quantized versions of the DeepHermes-3-Llama-3-3B-Preview language model for efficient inference.
4
+
5
+ ## Files
6
+
7
+ The following GGUF files are available in this repository:
8
+
9
+ - `DeepHermes-3-Llama-3-3B-Preview-q4.gguf` (1.8G)
10
+ - `DeepHermes-3-Llama-3-3B-Preview-q5.gguf` (2.2G)
11
+ - `DeepHermes-3-Llama-3-3B-Preview-q6.gguf` (2.5G)
12
+ - `DeepHermes-3-Llama-3-3B-Preview-q8.gguf` (3.2G)
13
+
14
+ ## Usage
15
+
16
+ These models are compatible with [llama.cpp](https://github.com/ggerganov/llama.cpp) and similar frameworks.
17
+
18
+ Example usage with llama.cpp:
19
+ ```bash
20
+ ./llama-cli -m /path/to/model.gguf -p "Hello, I am a language model" -n 128
21
+ ```
22
+
23
+ ## Upload Information
24
+ Files were uploaded on Tue Mar 11 04:28:49 PDT 2025