diff --git a/src/commons/modelInfo.ts b/src/commons/modelInfo.ts index 5f7521e..48c960d 100644 --- a/src/commons/modelInfo.ts +++ b/src/commons/modelInfo.ts @@ -1,7 +1,7 @@ export const DEFAULT_MODEL_INFO = new Map(); [{ - id: 'nomic-embed-text:latest', - size: '274MB', + id: 'granite-embedding:278m', + size: '563MB', digest: '' }, { diff --git a/src/commons/modelRequirements.ts b/src/commons/modelRequirements.ts index cd0003e..d9decbc 100644 --- a/src/commons/modelRequirements.ts +++ b/src/commons/modelRequirements.ts @@ -1,4 +1,4 @@ -import { GB } from "./sizeUtils"; +import { GB, MB } from "./sizeUtils"; import { hasDiscreteGPU, isHighEndApple, SystemInfo } from "./sysInfo"; import { formatSize } from './textUtils'; @@ -34,11 +34,11 @@ export const MODEL_REQUIREMENTS: Record = { gpuRecommended: true, sizeBytes: Math.ceil(4.6 * GB) }, - "nomic-embed-text:latest": { + "granite-embedding:278m": { minMemoryBytes: 2 * GB, recommendedMemoryBytes: 4 * GB, gpuRecommended: false, - sizeBytes: Math.ceil(0.274 * GB) + sizeBytes: Math.ceil(563 * MB) } }; diff --git a/src/commons/sysInfo.ts b/src/commons/sysInfo.ts index cf487b8..9f6a1b3 100644 --- a/src/commons/sysInfo.ts +++ b/src/commons/sysInfo.ts @@ -65,6 +65,6 @@ export function getRecommendedModels(systemInfo: SystemInfo) { return { defaultChatModel: defaultGraniteModel, defaultTabModel: defaultGraniteModel, - defaultEmbeddingsModel: "nomic-embed-text:latest" + defaultEmbeddingsModel: "granite-embedding:278m" }; } \ No newline at end of file diff --git a/src/configureAssistant.ts b/src/configureAssistant.ts index 939ac22..1355e90 100644 --- a/src/configureAssistant.ts +++ b/src/configureAssistant.ts @@ -82,7 +82,7 @@ const modelConfigs: ModelConfig[] = [ ...baseGraniteConfig, }, { - model: "nomic-embed-text", + model: "granite-embedding:278m", ...baseConfig, } ]; @@ -90,7 +90,7 @@ const modelConfigs: ModelConfig[] = [ function getModelConfig(model: string): ModelConfig { let modelConfig = modelConfigs.find(m => m.model === model); if (!modelConfig) { - const configTemplate = model.includes("granite") ? baseGraniteConfig : baseConfig; + const configTemplate = model.includes("embed") ? baseConfig : baseGraniteConfig; modelConfig = { ...configTemplate, model, diff --git a/src/ollama/mockServer.ts b/src/ollama/mockServer.ts index beadd10..8d1f706 100644 --- a/src/ollama/mockServer.ts +++ b/src/ollama/mockServer.ts @@ -39,7 +39,7 @@ export class MockServer extends OllamaServer implements IModelServer { ["granite-code:8b", new MockModel("granite-code:8b", 4000)], ["granite-code:20b", new MockModel("granite-code:20b", 11000, ModelStatus.installed)], ["granite-code:34b", new MockModel("granite-code:34b", 20000)], - ["nomic-embed-text:latest", new MockModel("nomic-embed-text:latest", 274, ModelStatus.stale)], + ["granite-embedding:278m", new MockModel("granite-embedding:278m", 563, ModelStatus.stale)], ]); /** diff --git a/webviews/src/App.test.tsx b/webviews/src/App.test.tsx index bfa0a44..0d62b7a 100644 --- a/webviews/src/App.test.tsx +++ b/webviews/src/App.test.tsx @@ -83,7 +83,7 @@ describe("App Component", () => { data: { chatModelId: "granite3.1-dense:2b", tabModelId: "granite3.1-dense:2b", - embeddingsModelId: "nomic-embed-text:latest", + embeddingsModelId: "granite-embedding:278m", }, }); }); @@ -164,7 +164,7 @@ describe("App Component", () => { data: { chatModelId: "granite3.1-dense:2b", tabModelId: "granite3.1-dense:2b", - embeddingsModelId: "nomic-embed-text:latest", + embeddingsModelId: "granite-embedding:278m", }, }); }); diff --git a/webviews/src/App.tsx b/webviews/src/App.tsx index b18a0b7..c2ce0a5 100644 --- a/webviews/src/App.tsx +++ b/webviews/src/App.tsx @@ -40,9 +40,9 @@ function App() { const embeddingsOptions: ModelOption[] = [ { - label: "nomic-embed-text", - value: "nomic-embed-text:latest", - info: formatSize(MODEL_REQUIREMENTS["nomic-embed-text:latest"].sizeBytes), + label: "granite-embedding", + value: "granite-embedding:278m", + info: formatSize(MODEL_REQUIREMENTS["granite-embedding:278m"].sizeBytes), }, { label: "Keep existing configuration", value: null, info: null }, ];