GGUF
Inference Endpoints
imatrix
File size: 4,063 Bytes
38388f0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1e7170f
7a881e3
72d3578
dd6d82d
12132ac
3a8eea0
e735694
217a4b5
cbba92f
67e7392
bfc98e0
2e66c0b
0b8339f
cd880fb
48f3f39
755f25b
7600cbb
e142c56
f1a7171
290fd6c
e24a300
aea49df
6391b75
12e2a19
b351f35
4a85c6a
47147ed
c3d64a8
6585cfd
1894899
a8b6592
cf64c33
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
# Git LFS tracking rules.
#
# Every rule below assigns the same attribute set:
#   filter=lfs  - content is passed through the "lfs" clean/smudge filter
#   diff=lfs    - diffs use the "lfs" diff driver
#   merge=lfs   - merges use the "lfs" merge driver
#   -text       - the text attribute is unset (no end-of-line conversion)
#
# Patterns that contain no "/" match against the file name at any directory
# level of the repository.

# Archives, serialized arrays/tables and generic model/checkpoint formats.
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text

# Tracked by exact file name (its extension is not covered by a glob above).
imatrix.dat filter=lfs diff=lfs merge=lfs -text

# All GGUF files. This single glob replaces the former one-line-per-file
# entries for each Llama-3.1-Minitron-4B-Width-Base-*.gguf quantization, so
# newly added .gguf files are tracked without editing this file again.
*.gguf filter=lfs diff=lfs merge=lfs -text