cstr committed on
Commit
f64b401
·
verified ·
1 Parent(s): a06c7df

Add model card for jina-v5-small GGUF

Browse files
Files changed (1) hide show
  1. README.md +5 -4
README.md CHANGED
@@ -16,6 +16,7 @@ Jina Embeddings v5 Small. Full-size decoder model, 1024-dimensional.
16
 
17
  | File | Quantization | Size |
18
  |------|-------------|------|
 
19
  | [jina-v5-small-q8_0.gguf](https://huggingface.co/cstr/jina-v5-small-GGUF/resolve/main/jina-v5-small-q8_0.gguf) | Q8_0 | 609 MB |
20
  | [jina-v5-small.gguf](https://huggingface.co/cstr/jina-v5-small-GGUF/resolve/main/jina-v5-small.gguf) | F32 | 2279 MB |
21
 
@@ -24,10 +25,10 @@ Jina Embeddings v5 Small. Full-size decoder model, 1024-dimensional.
24
 
25
  ```bash
26
  # Download
27
- huggingface-cli download cstr/jina-v5-small-GGUF jina-v5-small-q8_0.gguf --local-dir .
28
 
29
  # Run with CrispEmbed
30
- ./crispembed -m jina-v5-small-q8_0.gguf "Hello world"
31
 
32
  # Or with auto-download
33
  ./crispembed -m jina-v5-small "Hello world"
@@ -61,10 +62,10 @@ cd CrispEmbed
61
  cmake -S . -B build && cmake --build build -j
62
 
63
  # Encode
64
- ./build/crispembed -m jina-v5-small-q8_0.gguf "query text"
65
 
66
  # Server mode
67
- ./build/crispembed-server -m jina-v5-small-q8_0.gguf --port 8080
68
  curl -X POST http://localhost:8080/v1/embeddings \
69
  -d '{"input": ["Hello world"], "model": "jina-v5-small"}'
70
  ```
 
16
 
17
  | File | Quantization | Size |
18
  |------|-------------|------|
19
+ | [jina-v5-small-q4_k.gguf](https://huggingface.co/cstr/jina-v5-small-GGUF/resolve/main/jina-v5-small-q4_k.gguf) | Q4_K | 835 MB |
20
  | [jina-v5-small-q8_0.gguf](https://huggingface.co/cstr/jina-v5-small-GGUF/resolve/main/jina-v5-small-q8_0.gguf) | Q8_0 | 609 MB |
21
  | [jina-v5-small.gguf](https://huggingface.co/cstr/jina-v5-small-GGUF/resolve/main/jina-v5-small.gguf) | F32 | 2279 MB |
22
 
 
25
 
26
  ```bash
27
  # Download
28
+ huggingface-cli download cstr/jina-v5-small-GGUF jina-v5-small-q4_k.gguf --local-dir .
29
 
30
  # Run with CrispEmbed
31
+ ./crispembed -m jina-v5-small-q4_k.gguf "Hello world"
32
 
33
  # Or with auto-download
34
  ./crispembed -m jina-v5-small "Hello world"
 
62
  cmake -S . -B build && cmake --build build -j
63
 
64
  # Encode
65
+ ./build/crispembed -m jina-v5-small-q4_k.gguf "query text"
66
 
67
  # Server mode
68
+ ./build/crispembed-server -m jina-v5-small-q4_k.gguf --port 8080
69
  curl -X POST http://localhost:8080/v1/embeddings \
70
  -d '{"input": ["Hello world"], "model": "jina-v5-small"}'
71
  ```