We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 44b83ca, commit 1e20be6 (Copy full SHA for 1e20be6)
llama_cpp/server/app.py
@@ -48,6 +48,10 @@ class Settings(BaseSettings):
48
description="Use mmap.",
49
)
50
embedding: bool = Field(default=True, description="Whether to use embeddings.")
51
+ low_vram: bool = Field(
52
+ default=False,
53
+ description="Whether to use less VRAM. This will reduce performance.",
54
+ )
55
last_n_tokens_size: int = Field(
56
default=64,
57
ge=0,
0 commit comments