rishikanthc · EdrisT · Dec 3, 2025 · Dec 3, 2025 · Dec 4, 2025 · Dec 5, 2025
diff --git a/internal/api/chat_handlers.go b/internal/api/chat_handlers.go
@@ -88,7 +88,7 @@ func (h *Handler) getLLMService(ctx context.Context) (llm.Service, string, error
 		if cfg.APIKey == nil || *cfg.APIKey == "" {
 			return nil, cfg.Provider, fmt.Errorf("OpenAI API key not configured")
 		}
-		return llm.NewOpenAIService(*cfg.APIKey), cfg.Provider, nil
+		return llm.NewOpenAIService(*cfg.APIKey, cfg.OpenAIBaseURL), cfg.Provider, nil
 	case "ollama":
 		if cfg.BaseURL == nil || *cfg.BaseURL == "" {
 			return nil, cfg.Provider, fmt.Errorf("Ollama base URL not configured")

diff --git a/internal/api/handlers.go b/internal/api/handlers.go
@@ -171,21 +171,23 @@ type YouTubeDownloadResponse struct {
 
 // LLMConfigRequest represents the LLM configuration request
 type LLMConfigRequest struct {
-	Provider string  `json:"provider" binding:"required,oneof=ollama openai"`
-	BaseURL  *string `json:"base_url,omitempty"`
-	APIKey   *string `json:"api_key,omitempty"`
-	IsActive bool    `json:"is_active"`
+	Provider      string  `json:"provider" binding:"required,oneof=ollama openai"`
+	BaseURL       *string `json:"base_url,omitempty"`
+	OpenAIBaseURL *string `json:"openai_base_url,omitempty"`
+	APIKey        *string `json:"api_key,omitempty"`
+	IsActive      bool    `json:"is_active"`
 }
 
 // LLMConfigResponse represents the LLM configuration response
 type LLMConfigResponse struct {
-	ID        uint    `json:"id"`
-	Provider  string  `json:"provider"`
-	BaseURL   *string `json:"base_url,omitempty"`
-	HasAPIKey bool    `json:"has_api_key"` // Don't return actual API key
-	IsActive  bool    `json:"is_active"`
-	CreatedAt string  `json:"created_at"`
-	UpdatedAt string  `json:"updated_at"`
+	ID            uint    `json:"id"`
+	Provider      string  `json:"provider"`
+	BaseURL       *string `json:"base_url,omitempty"`
+	OpenAIBaseURL *string `json:"openai_base_url,omitempty"`
+	HasAPIKey     bool    `json:"has_api_key"` // Don't return actual API key
+	IsActive      bool    `json:"is_active"`
+	CreatedAt     string  `json:"created_at"`
+	UpdatedAt     string  `json:"updated_at"`
 }
 
 // APIKeyListResponse represents an API key in the list (without the actual key)
@@ -1880,13 +1882,14 @@ func (h *Handler) GetLLMConfig(c *gin.Context) {
 	}
 
 	response := LLMConfigResponse{
-		ID:        config.ID,
-		Provider:  config.Provider,
-		BaseURL:   config.BaseURL,
-		HasAPIKey: config.APIKey != nil && *config.APIKey != "",
-		IsActive:  config.IsActive,
-		CreatedAt: config.CreatedAt.Format("2006-01-02 15:04:05"),
-		UpdatedAt: config.UpdatedAt.Format("2006-01-02 15:04:05"),
+		ID:            config.ID,
+		Provider:      config.Provider,
+		BaseURL:       config.BaseURL,
+		OpenAIBaseURL: config.OpenAIBaseURL,
+		HasAPIKey:     config.APIKey != nil && *config.APIKey != "",
+		IsActive:      config.IsActive,
+		CreatedAt:     config.CreatedAt.Format("2006-01-02 15:04:05"),
+		UpdatedAt:     config.UpdatedAt.Format("2006-01-02 15:04:05"),
 	}
 
 	c.JSON(http.StatusOK, response)
@@ -1914,10 +1917,6 @@ func (h *Handler) SaveLLMConfig(c *gin.Context) {
 		c.JSON(http.StatusBadRequest, gin.H{"error": "Base URL is required for Ollama provider"})
 		return
 	}
-	if req.Provider == "openai" && (req.APIKey == nil || *req.APIKey == "") {
-		c.JSON(http.StatusBadRequest, gin.H{"error": "API key is required for OpenAI provider"})
-		return
-	}
 
 	// Check if there's an existing active configuration
 	existingConfig, err := h.llmConfigRepo.GetActive(c.Request.Context())
@@ -1926,15 +1925,32 @@ func (h *Handler) SaveLLMConfig(c *gin.Context) {
 		return
 	}
 
+	// Handle API Key logic for OpenAI
+	var apiKeyToSave *string
+	if req.Provider == "openai" {
+		if req.APIKey != nil && *req.APIKey != "" {
+			// New key provided
+			apiKeyToSave = req.APIKey
+		} else if existingConfig != nil && existingConfig.APIKey != nil && *existingConfig.APIKey != "" {
+			// Reuse existing key
+			apiKeyToSave = existingConfig.APIKey
+		} else {
+			// No key provided and no existing key
+			c.JSON(http.StatusBadRequest, gin.H{"error": "API key is required for OpenAI provider"})
+			return
+		}
+	}
+
 	var config *models.LLMConfig
 
 	if err == gorm.ErrRecordNotFound {
 		// No existing active config, create new one
 		config = &models.LLMConfig{
-			Provider: req.Provider,
-			BaseURL:  req.BaseURL,
-			APIKey:   req.APIKey,
-			IsActive: req.IsActive,
+			Provider:      req.Provider,
+			BaseURL:       req.BaseURL,
+			OpenAIBaseURL: req.OpenAIBaseURL,
+			APIKey:        apiKeyToSave,
+			IsActive:      req.IsActive,
 		}
 
 		if err := h.llmConfigRepo.Create(c.Request.Context(), config); err != nil {
@@ -1945,7 +1961,8 @@ func (h *Handler) SaveLLMConfig(c *gin.Context) {
 		// Update existing config
 		existingConfig.Provider = req.Provider
 		existingConfig.BaseURL = req.BaseURL
-		existingConfig.APIKey = req.APIKey
+		existingConfig.OpenAIBaseURL = req.OpenAIBaseURL
+		existingConfig.APIKey = apiKeyToSave
 		existingConfig.IsActive = req.IsActive
 
 		if err := h.llmConfigRepo.Update(c.Request.Context(), existingConfig); err != nil {
@@ -1956,13 +1973,14 @@ func (h *Handler) SaveLLMConfig(c *gin.Context) {
 	}
 
 	response := LLMConfigResponse{
-		ID:        config.ID,
-		Provider:  config.Provider,
-		BaseURL:   config.BaseURL,
-		HasAPIKey: config.APIKey != nil && *config.APIKey != "",
-		IsActive:  config.IsActive,
-		CreatedAt: config.CreatedAt.Format("2006-01-02 15:04:05"),
-		UpdatedAt: config.UpdatedAt.Format("2006-01-02 15:04:05"),
+		ID:            config.ID,
+		Provider:      config.Provider,
+		BaseURL:       config.BaseURL,
+		OpenAIBaseURL: config.OpenAIBaseURL,
+		HasAPIKey:     config.APIKey != nil && *config.APIKey != "",
+		IsActive:      config.IsActive,
+		CreatedAt:     config.CreatedAt.Format("2006-01-02 15:04:05"),
+		UpdatedAt:     config.UpdatedAt.Format("2006-01-02 15:04:05"),
 	}
 
 	c.JSON(http.StatusOK, response)

diff --git a/internal/llm/openai.go b/internal/llm/openai.go
@@ -21,10 +21,14 @@ type OpenAIService struct {
 }
 
 // NewOpenAIService creates a new OpenAI service
-func NewOpenAIService(apiKey string) *OpenAIService {
+func NewOpenAIService(apiKey string, baseURL *string) *OpenAIService {
+	url := "https://api.openai.com/v1"
+	if baseURL != nil && *baseURL != "" {
+		url = *baseURL
+	}
 	return &OpenAIService{
 		apiKey:  apiKey,
-		baseURL: "https://api.openai.com/v1",
+		baseURL: url,
 		client: &http.Client{
 			Timeout: 300 * time.Second,
 		},

diff --git a/internal/models/transcription.go b/internal/models/transcription.go
@@ -202,13 +202,14 @@ func (tp *TranscriptionProfile) BeforeSave(tx *gorm.DB) error {
 
 // LLMConfig represents LLM configuration settings
 type LLMConfig struct {
-	ID        uint      `json:"id" gorm:"primaryKey"`
-	Provider  string    `json:"provider" gorm:"not null;type:varchar(50)"` // "ollama" or "openai"
-	BaseURL   *string   `json:"base_url,omitempty" gorm:"type:text"`       // For Ollama
-	APIKey    *string   `json:"api_key,omitempty" gorm:"type:text"`        // For OpenAI (encrypted)
-	IsActive  bool      `json:"is_active" gorm:"type:boolean;default:false"`
-	CreatedAt time.Time `json:"created_at" gorm:"autoCreateTime"`
-	UpdatedAt time.Time `json:"updated_at" gorm:"autoUpdateTime"`
+	ID            uint      `json:"id" gorm:"primaryKey"`
+	Provider      string    `json:"provider" gorm:"not null;type:varchar(50)"` // "ollama" or "openai"
+	BaseURL       *string   `json:"base_url,omitempty" gorm:"type:text"`       // For Ollama
+	OpenAIBaseURL *string   `json:"openai_base_url,omitempty" gorm:"type:text"` // For OpenAI custom endpoint
+	APIKey        *string   `json:"api_key,omitempty" gorm:"type:text"`        // For OpenAI (encrypted)
+	IsActive      bool      `json:"is_active" gorm:"type:boolean;default:false"`
+	CreatedAt     time.Time `json:"created_at" gorm:"autoCreateTime"`
+	UpdatedAt     time.Time `json:"updated_at" gorm:"autoUpdateTime"`
 }
 
 // BeforeSave ensures only one LLM config can be active

diff --git a/internal/transcription/adapters/whisperx_adapter.go b/internal/transcription/adapters/whisperx_adapter.go
@@ -64,8 +64,8 @@ func NewWhisperXAdapter(envPath string) *WhisperXAdapter {
 			Name:        "model",
 			Type:        "string",
 			Required:    false,
-			Default:     "small",
-			Options:     []string{"tiny", "tiny.en", "base", "base.en", "small", "small.en", "medium", "medium.en", "large", "large-v1", "large-v2", "large-v3"},
+			Default:     "KBLab/kb-whisper-large",
+			Options:     []string{"KBLab/kb-whisper-large","KBLab/kb-whisper-medium","KBLab/kb-whisper-small","KBLab/kb-whisper-base","KBLab/kb-whisper-tiny","tiny", "tiny.en", "base", "base.en", "small", "small.en", "medium", "medium.en", "large", "large-v1", "large-v2", "large-v3"},
 			Description: "Whisper model size to use",
 			Group:       "basic",
 		},
@@ -75,7 +75,7 @@ func NewWhisperXAdapter(envPath string) *WhisperXAdapter {
 			Name:        "device",
 			Type:        "string",
 			Required:    false,
-			Default:     "cpu",
+			Default:     "cuda",
 			Options:     []string{"cpu", "cuda"},
 			Description: "Device to use for computation",
 			Group:       "basic",
@@ -104,7 +104,7 @@ func NewWhisperXAdapter(envPath string) *WhisperXAdapter {
 			Name:        "compute_type",
 			Type:        "string",
 			Required:    false,
-			Default:     "float32",
+			Default:     "float16",
 			Options:     []string{"float16", "float32", "int8"},
 			Description: "Computation precision",
 			Group:       "advanced",
@@ -125,7 +125,7 @@ func NewWhisperXAdapter(envPath string) *WhisperXAdapter {
 			Name:        "language",
 			Type:        "string",
 			Required:    false,
-			Default:     nil,
+			Default:     "sv",
 			Description: "Language code (auto-detect if not specified)",
 			Group:       "basic",
 		},
@@ -144,7 +144,7 @@ func NewWhisperXAdapter(envPath string) *WhisperXAdapter {
 			Name:        "diarize",
 			Type:        "bool",
 			Required:    false,
-			Default:     false,
+			Default:     true,
 			Description: "Enable speaker diarization",
 			Group:       "basic",
 		},
@@ -258,6 +258,16 @@ func NewWhisperXAdapter(envPath string) *WhisperXAdapter {
 			Description: "VAD offset threshold",
 			Group:       "advanced",
 		},
+
+		// Custom Alignment Model
+		{
+			Name:        "align_model",
+			Type:        "string",
+			Required:    false,
+			Default:     nil,
+			Description: "Custom alignment model (e.g. KBLab/wav2vec2-large-voxrex-swedish)",
+			Group:       "advanced",
+		},
 	}
 
 	baseAdapter := NewBaseAdapter("whisperx", filepath.Join(envPath, "WhisperX"), capabilities, schema)
@@ -273,6 +283,11 @@ func NewWhisperXAdapter(envPath string) *WhisperXAdapter {
 // GetSupportedModels returns the list of Whisper models supported
 func (w *WhisperXAdapter) GetSupportedModels() []string {
 	return []string{
+		"KBLab/kb-whisper-large",
+		"KBLab/kb-whisper-medium",
+		"KBLab/kb-whisper-small",
+		"KBLab/kb-whisper-base",
+		"KBLab/kb-whisper-tiny",
 		"tiny", "tiny.en",
 		"base", "base.en",
 		"small", "small.en",
@@ -484,6 +499,11 @@ func (w *WhisperXAdapter) buildWhisperXArgs(input interfaces.AudioInput, params
 	args = append(args, "--vad_onset", fmt.Sprintf("%.3f", w.GetFloatParameter(params, "vad_onset")))
 	args = append(args, "--vad_offset", fmt.Sprintf("%.3f", w.GetFloatParameter(params, "vad_offset")))
 
+	// Custom alignment model
+	if alignModel := w.GetStringParameter(params, "align_model"); alignModel != "" {
+		args = append(args, "--align_model", alignModel)
+	}
+
 	// Diarization
 	if w.GetBoolParameter(params, "diarize") {
 		args = append(args, "--diarize")

diff --git a/web/frontend/src/components/LLMSettings.tsx b/web/frontend/src/components/LLMSettings.tsx
@@ -10,6 +10,7 @@ interface LLMConfig {
 	id?: number;
 	provider: string;
 	base_url?: string;
+	openai_base_url?: string;
 	has_api_key?: boolean;
 	is_active: boolean;
 	created_at?: string;
@@ -22,6 +23,7 @@ export function LLMSettings() {
 		is_active: false,
 	});
 	const [baseUrl, setBaseUrl] = useState("");
+	const [openAIBaseUrl, setOpenAIBaseUrl] = useState("");
 	const [apiKey, setApiKey] = useState("");
 	const [loading, setLoading] = useState(true);
 	const [saving, setSaving] = useState(false);
@@ -42,6 +44,7 @@ export function LLMSettings() {
 				const data = await response.json();
 				setConfig(data);
 				setBaseUrl(data.base_url || "");
+				setOpenAIBaseUrl(data.openai_base_url || "");
 				// Don't set API key from response for security
 			} else if (response.status !== 404) {
 				console.error("Failed to fetch LLM config");
@@ -61,7 +64,10 @@ export function LLMSettings() {
 			provider: config.provider,
 			is_active: true, // Always set to active when saving
 			...(config.provider === "ollama" && { base_url: baseUrl }),
-			...(config.provider === "openai" && { api_key: apiKey }),
+			...(config.provider === "openai" && {
+				api_key: apiKey,
+				openai_base_url: openAIBaseUrl
+			}),
 		};
 
 		try {
@@ -228,27 +234,44 @@ export function LLMSettings() {
 						)}
 
 						{config.provider === "openai" && (
-							<div>
-								<Label htmlFor="apiKey" className="flex items-center gap-2">
-									<Key className="h-4 w-4" />
-									OpenAI API Key *
-									{config.has_api_key && (
-										<span className="text-xs bg-green-100 dark:bg-green-900/30 text-green-700 dark:text-green-300 px-2 py-1 rounded">
-											Already configured
-										</span>
-									)}
-								</Label>
-								<Input
-									id="apiKey"
-									type="password"
-									placeholder={config.has_api_key ? "Enter new API key to update" : "sk-..."}
-									value={apiKey}
-									onChange={(e) => setApiKey(e.target.value)}
-									className="mt-1"
-								/>
-								<p className="text-xs text-carbon-500 dark:text-carbon-400 mt-1">
-									Your OpenAI API key. {config.has_api_key ? "Leave blank to keep current key." : ""}
-								</p>
+							<div className="space-y-4">
+								<div>
+									<Label htmlFor="apiKey" className="flex items-center gap-2">
+										<Key className="h-4 w-4" />
+										OpenAI API Key *
+										{config.has_api_key && (
+											<span className="text-xs bg-green-100 dark:bg-green-900/30 text-green-700 dark:text-green-300 px-2 py-1 rounded">
+												Already configured
+											</span>
+										)}
+									</Label>
+									<Input
+										id="apiKey"
+										type="password"
+										placeholder={config.has_api_key ? "Enter new API key to update" : "sk-..."}
+										value={apiKey}
+										onChange={(e) => setApiKey(e.target.value)}
+										className="mt-1"
+									/>
+									<p className="text-xs text-carbon-500 dark:text-carbon-400 mt-1">
+										Your OpenAI API key. {config.has_api_key ? "Leave blank to keep current key." : ""}
+									</p>
+								</div>
+
+								<div>
+									<Label htmlFor="openAIBaseUrl">OpenAI Base URL (Optional)</Label>
+									<Input
+										id="openAIBaseUrl"
+										type="url"
+										placeholder="https://api.openai.com/v1"
+										value={openAIBaseUrl}
+										onChange={(e) => setOpenAIBaseUrl(e.target.value)}
+										className="mt-1"
+									/>
+									<p className="text-xs text-carbon-500 dark:text-carbon-400 mt-1">
+										Custom endpoint URL for OpenAI-compatible services. Leave blank for default.
+									</p>
+								</div>
 							</div>
 						)}
 					</div>