Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions src/database/repositories/SettingsRepository.ts
Original file line number Diff line number Diff line change
Expand Up @@ -80,8 +80,8 @@ export class SettingsRepository {
private async createDefaultInterviewerSettings(): Promise<InterviewerSettings> {
const defaults: InterviewerSettings = {
modelProvider: 'lemonade-server',
modelName: 'gpt-oss-mxp4',
extractionModelName: 'gpt-oss-mxp4',
modelName: 'Qwen3-Coder-30B-A3B-Instruct-GGUF',
extractionModelName: 'Qwen3-Coder-30B-A3B-Instruct-GGUF',
temperature: 0.7,
maxTokens: 2000,
interviewStyle: 'conversational',
Expand Down
8 changes: 5 additions & 3 deletions src/services/LemonadeClient.ts
Original file line number Diff line number Diff line change
Expand Up @@ -97,7 +97,7 @@ export class LemonadeClient {
/**
* Send a message and get AI response
*/
async sendMessage(conversationHistory: Message[], options?: { maxTokens?: number; maxInputTokens?: number }): Promise<string> {
async sendMessage(conversationHistory: Message[], options?: { maxTokens?: number; maxInputTokens?: number; model?: string }): Promise<string> {
try {
// Check server connection first
if (!this.isConnected) {
Expand Down Expand Up @@ -132,8 +132,10 @@ export class LemonadeClient {
const sentInputChars = truncatedHistory.reduce((s, m) => s + m.content.length, 0);
const wasTruncated = truncatedHistory.length < conversationHistory.length;

const modelToUse = options?.model ?? this.settings.modelName;

console.log(`[LLM:sendMessage] ── Request ─────────────────────────────────`);
console.log(`[LLM:sendMessage] model=${this.settings.modelName}`);
console.log(`[LLM:sendMessage] model=${modelToUse}`);
console.log(`[LLM:sendMessage] maxInputTokens=${maxInputTokens}, maxOutputTokens=${options?.maxTokens ?? this.settings.maxTokens}`);
console.log(`[LLM:sendMessage] messages: ${conversationHistory.length} total → ${truncatedHistory.length} sent${wasTruncated ? ' (TRUNCATED)' : ''}`);
console.log(`[LLM:sendMessage] input chars: ${totalInputChars} total → ${sentInputChars} sent (~${Math.round(sentInputChars/4)} tokens)`);
Expand All @@ -151,7 +153,7 @@ export class LemonadeClient {
// consume tokens for chain-of-thought before producing visible content.
const maxTokens = options?.maxTokens ?? this.settings.maxTokens;
const completion = await this.client.chat.completions.create({
model: this.settings.modelName,
model: modelToUse,
messages: messages,
temperature: this.settings.temperature,
max_tokens: maxTokens,
Expand Down
3 changes: 3 additions & 0 deletions src/services/StructuredExtractionService.ts
Original file line number Diff line number Diff line change
Expand Up @@ -60,6 +60,7 @@ export class StructuredExtractionService {

const response = await this.lemonadeClient.sendMessage(messages, {
maxTokens: 2048,
model: this.extractionModel,
});

console.log('[StructuredExtractionService] Feedback extraction raw response:', response.substring(0, 500));
Expand Down Expand Up @@ -135,6 +136,7 @@ export class StructuredExtractionService {

const response = await this.lemonadeClient.sendMessage(messages, {
maxTokens: 1024,
model: this.extractionModel,
});

const parsed = this.parseJSON(response);
Expand Down Expand Up @@ -206,6 +208,7 @@ export class StructuredExtractionService {
// 2048 gives sufficient headroom for thinking + a compact JSON response.
const response = await this.lemonadeClient.sendMessage(messages, {
maxTokens: 2048,
model: this.extractionModel,
});

const parsed = this.parseJSON(response);
Expand Down
6 changes: 3 additions & 3 deletions src/ui/main.tsx
Original file line number Diff line number Diff line change
@@ -1,14 +1,14 @@
import React from 'react';
import ReactDOM from 'react-dom/client';
import { BrowserRouter } from 'react-router-dom';
import { HashRouter } from 'react-router-dom';
import App from './App';
import './index.css';

// Application entry point: creates a React root on the DOM element with id
// "root" and renders <App /> inside a router, wrapped in <React.StrictMode>.
// The `!` only asserts to the type checker that the element exists; no runtime
// null check is performed here.
// The `future` prop passes the v7_startTransition and v7_relativeSplatPath
// flags to the router (presumably React Router's v7 opt-in flags — confirm
// against the installed react-router-dom version); the @ts-expect-error
// directive below suppresses the type error that prop currently produces.
// NOTE(review): this span comes from a rendered diff without +/- markers. The
// BrowserRouter open/close lines look like the removed side and the HashRouter
// lines the added side; only one pair should exist in the real file — confirm.
ReactDOM.createRoot(document.getElementById('root')!).render(
<React.StrictMode>
{/* @ts-expect-error: Suppressing future flag type error until types catch up */}
<BrowserRouter future={{ v7_startTransition: true, v7_relativeSplatPath: true }}>
<HashRouter future={{ v7_startTransition: true, v7_relativeSplatPath: true }}>
<App />
</BrowserRouter>
</HashRouter>
</React.StrictMode>,
);