Skip to content

Commit 572daa6

Browse files
committed
fix: update embedding model references to jina-embeddings-v4 in configuration files
1 parent 37cc993 commit 572daa6

File tree

4 files changed

+13
-8
lines changed

4 files changed

+13
-8
lines changed

.env.example

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -133,8 +133,9 @@ CODEGRAPH_EMBEDDING_PROVIDER=auto
133133
# - Jina: Variable Matryoshka dimensions depending on model: 2048, 1024, 512, 256
134134
# - OpenAI: Small 1536 dimensions, Large 3072 dimensions
135135
# - Local ONNX: typically 384 qdrant/all-mini-llm-onnx
136-
# - Local Ollama: qwen3-embedder:0.6b-8b 1024, 2048, 4096
136+
# - Local Ollama: qwen3-embedding:0.6b-8b 1024, 2048, 4096; embeddingsgemma 768; all-minilm 384
137137
# - 384 (all-minilm:latest)
138+
# - 768 (embeddingsgemma:latest)
138139
# - 1024 (qwen3-embedding:0.6b)
139140
# - 1536 (text-embedding-3-small)
140141
# - 2048 (qwen3-embedding:4b, jina-embeddings-v4)

config/.codegraph.toml.example

Lines changed: 8 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -13,10 +13,10 @@ provider = "lmstudio"
1313
# Model path or identifier
1414
# For ONNX: Absolute path to model directory (auto-detected from HuggingFace cache)
1515
# For Ollama: Model name (e.g., "all-minilm:latest")
16-
# For LM Studio: Model name (e.g., "jinaai/jina-embeddings-v3")
16+
# For LM Studio: Model name (e.g., "jinaai/jina-embeddings-v4")
1717
# For OpenAI: Model name (e.g., "text-embedding-3-small")
18-
# Recommended: jinaai/jina-embeddings-v3 (1536-dim, optimized for code)
19-
model = "jinaai/jina-embeddings-v3"
18+
# Recommended: jinaai/jina-embeddings-v4 (2048-dim, optimized for code)
19+
model = "jinaai/jina-embeddings-v4"
2020

2121
# LM Studio URL (default port 1234)
2222
lmstudio_url = "http://localhost:1234"
@@ -28,8 +28,11 @@ ollama_url = "http://localhost:11434"
2828
# Can also be set via OPENAI_API_KEY environment variable
2929
# openai_api_key = "sk-..."
3030

31-
# Embedding dimension (1536 for jina-code-embeddings-1.5b, 384 for all-MiniLM)
32-
dimension = 1536
31+
# Embedding dimension (2048 for jina-embeddings-v4, 384 for all-MiniLM, 1024 for qwen3-embedding:0.6b, etc.). Check your model's output dimension and which dimensions the schema supports.
32+
# all-minilm:latest (Ollama, for speed)
33+
# embeddingsgemma or qwen3-embedding:0.6b, 4b, or 8b for local SOTA
34+
# Jina for SOTA accuracy
35+
dimension = 2048
3336

3437
# Batch size for embedding generation (GPU optimization)
3538
batch_size = 64

crates/codegraph-mcp/src/bin/codegraph.rs

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1294,7 +1294,8 @@ async fn handle_index(
12941294
println!(
12951295
"{}\n • {}\n • {}\n • {}\n • {}",
12961296
"🧠 Using Local Embeddings".green(),
1297-
"384-dim all-mini-llm".green(),
1297+
"384-dim all-minilm:latest".green(),
1298+
"768-dim embeddingsgemma:latest".green(),
12981299
"1024-dim qwen3-embedding:0.6b".green(),
12991300
"2048-dim qwen3-embedding:4b".green(),
13001301
"4096-dim qwen3-embedding:8b".green()

crates/codegraph-napi/README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -106,7 +106,7 @@ dimension = 384
106106

107107
# Optional: Jina AI cloud embeddings
108108
jina_api_key = "jina_xxx" # Or use JINA_API_KEY env var
109-
jina_model = "jina-embeddings-v3"
109+
jina_model = "jina-embeddings-v4"
110110
jina_task_type = "retrieval.query"
111111
jina_enable_reranking = true
112112

0 commit comments

Comments
 (0)