feat: add intelligent provider profile recommendation

Author: Vasanthdev2004
Date: 2026-04-01 11:10:51 +05:30
parent 2d7aa9c841
commit 174eb8ad3b
9 changed files with 945 additions and 40 deletions

View File

@@ -1,6 +1,16 @@
// @ts-nocheck
import { writeFileSync } from 'node:fs'
import { resolve } from 'node:path'
import {
getGoalDefaultOpenAIModel,
normalizeRecommendationGoal,
recommendOllamaModel,
} from '../src/utils/providerRecommendation.ts'
import {
getOllamaChatBaseUrl,
hasLocalOllama,
listOllamaModels,
} from './provider-discovery.ts'
type ProviderProfile = 'openai' | 'ollama'
@@ -27,51 +37,55 @@ function parseProviderArg(): ProviderProfile | 'auto' {
return 'auto'
}
function sanitizeApiKey(key: string | null): string | undefined {
// 'SUA_CHAVE' ("YOUR_KEY" in Portuguese) is treated as an unset placeholder.
if (!key || key === 'SUA_CHAVE') return undefined
return key
}
async function resolveOllamaModel(
argModel: string | null,
argBaseUrl: string | null,
goal: ReturnType<typeof normalizeRecommendationGoal>,
): Promise<string> {
if (argModel) return argModel
const discovered = await listOllamaModels(argBaseUrl || undefined)
const recommended = recommendOllamaModel(discovered, goal)
if (recommended) {
return recommended.name
}
return process.env.OPENAI_MODEL || 'llama3.1:8b'
}
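
Note: the helpers imported from ../src/utils/providerRecommendation.ts are referenced throughout this commit but not shown in this view. A minimal sketch of their assumed shape, for orientation only (the goal values, default models, and scoring heuristic are illustrative assumptions, not the committed implementation; only OllamaModelDescriptor's fields are confirmed by the mapping in provider-discovery.ts below):

// Hypothetical sketch of src/utils/providerRecommendation.ts -- illustrative only.
export type RecommendationGoal = 'coding' | 'chat' | 'fast' // assumed goal set

// Field names match the descriptors built by listOllamaModels below.
export type OllamaModelDescriptor = {
  name: string
  sizeBytes: number | null
  family: string | null
  families: string[]
  parameterSize: string | null
  quantizationLevel: string | null
}

export function normalizeRecommendationGoal(
  raw: string | null | undefined,
): RecommendationGoal {
  const value = raw?.toLowerCase()
  if (value === 'chat' || value === 'fast') return value
  return 'coding' // assumed fallback goal
}

export function getGoalDefaultOpenAIModel(goal: RecommendationGoal): string {
  // Assumed mapping; the real table may differ. 'gpt-4o' was the old hardcoded default.
  return goal === 'fast' ? 'gpt-4o-mini' : 'gpt-4o'
}

export function recommendOllamaModel(
  models: OllamaModelDescriptor[],
  goal: RecommendationGoal,
): OllamaModelDescriptor | null {
  // Toy heuristic: coder-family names win for 'coding'; smaller wins for 'fast'.
  const scored = models.map(model => {
    let score = (model.sizeBytes ?? 0) / 1e9
    if (goal === 'fast') score = -score
    if (goal === 'coding' && /coder/i.test(model.name)) score += 10
    return { model, score }
  })
  scored.sort((a, b) => b.score - a.score)
  return scored[0]?.model ?? null
}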
async function main(): Promise<void> {
const provider = parseProviderArg()
const argModel = parseArg('--model')
const argBaseUrl = parseArg('--base-url')
const argApiKey = parseArg('--api-key')
const goal = normalizeRecommendationGoal(
parseArg('--goal') || process.env.OPENCLAUDE_PROFILE_GOAL,
)
let selected: ProviderProfile
if (provider === 'auto') {
selected = (await hasLocalOllama(argBaseUrl || undefined)) ? 'ollama' : 'openai'
} else {
selected = provider
}
const env: ProfileFile['env'] = {}
if (selected === 'ollama') {
env.OPENAI_BASE_URL = getOllamaChatBaseUrl(argBaseUrl || undefined)
env.OPENAI_MODEL = await resolveOllamaModel(argModel, argBaseUrl, goal)
const key = sanitizeApiKey(argApiKey || process.env.OPENAI_API_KEY || null)
if (key) env.OPENAI_API_KEY = key
} else {
env.OPENAI_BASE_URL = argBaseUrl || process.env.OPENAI_BASE_URL || 'https://api.openai.com/v1'
env.OPENAI_MODEL =
argModel ||
process.env.OPENAI_MODEL ||
getGoalDefaultOpenAIModel(goal)
const key = sanitizeApiKey(argApiKey || process.env.OPENAI_API_KEY || null)
if (!key) {
console.error('OpenAI profile requires a real API key. Use --api-key or set OPENAI_API_KEY.')
@@ -90,6 +104,8 @@ async function main(): Promise<void> {
writeFileSync(outputPath, JSON.stringify(profile, null, 2), 'utf8')
console.log(`Saved profile: ${selected}`)
console.log(`Goal: ${goal}`)
console.log(`Model: ${profile.env.OPENAI_MODEL}`)
console.log(`Path: ${outputPath}`)
console.log('Next: bun run dev:profile')
}
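
For reference, the profile this script writes follows the ProfileFile shape shared by all of these scripts (the .openclaude-profile.json path appears in the recommend script below). A hypothetical Ollama result, values illustrative:

// Illustrative contents of .openclaude-profile.json, expressed as the ProfileFile type:
const exampleProfile: ProfileFile = {
  profile: 'ollama',
  env: {
    OPENAI_BASE_URL: 'http://localhost:11434/v1',
    OPENAI_MODEL: 'qwen2.5-coder:7b', // whatever resolveOllamaModel picked
  },
  createdAt: '2026-04-01T05:40:51.000Z',
}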

View File

@@ -0,0 +1,129 @@
import type { OllamaModelDescriptor } from '../src/utils/providerRecommendation.ts'
export const DEFAULT_OLLAMA_BASE_URL = 'http://localhost:11434'
function withTimeoutSignal(timeoutMs: number): {
signal: AbortSignal
clear: () => void
} {
const controller = new AbortController()
const timeout = setTimeout(() => controller.abort(), timeoutMs)
return {
signal: controller.signal,
clear: () => clearTimeout(timeout),
}
}
function trimTrailingSlash(value: string): string {
return value.replace(/\/+$/, '')
}
export function getOllamaApiBaseUrl(baseUrl?: string): string {
const parsed = new URL(
baseUrl || process.env.OLLAMA_BASE_URL || DEFAULT_OLLAMA_BASE_URL,
)
const pathname = trimTrailingSlash(parsed.pathname)
parsed.pathname = pathname.endsWith('/v1')
? pathname.slice(0, -3) || '/'
: pathname || '/'
parsed.search = ''
parsed.hash = ''
return trimTrailingSlash(parsed.toString())
}
export function getOllamaChatBaseUrl(baseUrl?: string): string {
return `${getOllamaApiBaseUrl(baseUrl)}/v1`
}
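
getOllamaApiBaseUrl normalizes away any trailing /v1, trailing slashes, query, and hash, so the native API root and the OpenAI-compatible /v1 endpoint can both be derived from one user-supplied URL:

getOllamaApiBaseUrl('http://localhost:11434/v1/') // -> 'http://localhost:11434'
getOllamaChatBaseUrl('http://localhost:11434')    // -> 'http://localhost:11434/v1'
getOllamaChatBaseUrl() // -> OLLAMA_BASE_URL (or the default) with '/v1' appended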
export async function hasLocalOllama(baseUrl?: string): Promise<boolean> {
const { signal, clear } = withTimeoutSignal(1200)
try {
const response = await fetch(`${getOllamaApiBaseUrl(baseUrl)}/api/tags`, {
method: 'GET',
signal,
})
return response.ok
} catch {
return false
} finally {
clear()
}
}
export async function listOllamaModels(
baseUrl?: string,
): Promise<OllamaModelDescriptor[]> {
const { signal, clear } = withTimeoutSignal(5000)
try {
const response = await fetch(`${getOllamaApiBaseUrl(baseUrl)}/api/tags`, {
method: 'GET',
signal,
})
if (!response.ok) {
return []
}
const data = await response.json() as {
models?: Array<{
name?: string
size?: number
details?: {
family?: string
families?: string[]
parameter_size?: string
quantization_level?: string
}
}>
}
return (data.models ?? [])
.filter(model => Boolean(model.name))
.map(model => ({
name: model.name!,
sizeBytes: typeof model.size === 'number' ? model.size : null,
family: model.details?.family ?? null,
families: model.details?.families ?? [],
parameterSize: model.details?.parameter_size ?? null,
quantizationLevel: model.details?.quantization_level ?? null,
}))
} catch {
return []
} finally {
clear()
}
}
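
For orientation, a hypothetical /api/tags payload and the descriptor it maps to (field values illustrative; the shape matches the type assertion above):

// { "models": [ { "name": "llama3.1:8b", "size": 4920000000,
//     "details": { "family": "llama", "families": ["llama"],
//       "parameter_size": "8.0B", "quantization_level": "Q4_K_M" } } ] }
// ...becomes:
const example: OllamaModelDescriptor = {
  name: 'llama3.1:8b',
  sizeBytes: 4_920_000_000,
  family: 'llama',
  families: ['llama'],
  parameterSize: '8.0B',
  quantizationLevel: 'Q4_K_M',
}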
export async function benchmarkOllamaModel(
modelName: string,
baseUrl?: string,
): Promise<number | null> {
const start = Date.now()
const { signal, clear } = withTimeoutSignal(20000)
try {
const response = await fetch(`${getOllamaApiBaseUrl(baseUrl)}/api/chat`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
},
signal,
body: JSON.stringify({
model: modelName,
stream: false,
messages: [{ role: 'user', content: 'Reply with OK.' }],
options: {
temperature: 0,
num_predict: 8,
},
}),
})
if (!response.ok) {
return null
}
await response.json()
return Date.now() - start
} catch {
return null
} finally {
clear()
}
}
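
A quick usage sketch for the benchmark probe (model name illustrative; a local daemon must be running). The num_predict: 8 cap and 20s timeout keep the probe cheap, though a cold model load still counts against the measured latency:

import { benchmarkOllamaModel } from './provider-discovery.ts'

const ms = await benchmarkOllamaModel('llama3.1:8b')
console.log(ms === null ? 'unreachable, failed, or timed out' : `round trip: ${ms}ms`)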

View File

@@ -2,6 +2,16 @@
import { spawn } from 'node:child_process'
import { existsSync, readFileSync } from 'node:fs'
import { resolve } from 'node:path'
import {
getGoalDefaultOpenAIModel,
normalizeRecommendationGoal,
recommendOllamaModel,
} from '../src/utils/providerRecommendation.ts'
import {
getOllamaChatBaseUrl,
hasLocalOllama,
listOllamaModels,
} from './provider-discovery.ts'
type ProviderProfile = 'openai' | 'ollama'
@@ -18,20 +28,29 @@ type LaunchOptions = {
requestedProfile: ProviderProfile | 'auto' | null
passthroughArgs: string[]
fast: boolean
goal: ReturnType<typeof normalizeRecommendationGoal>
}
function parseLaunchOptions(argv: string[]): LaunchOptions {
let requestedProfile: ProviderProfile | 'auto' | null = 'auto'
const passthroughArgs: string[] = []
let fast = false
let goal = normalizeRecommendationGoal(process.env.OPENCLAUDE_PROFILE_GOAL)
for (let i = 0; i < argv.length; i++) {
const arg = argv[i]!
const lower = arg.toLowerCase()
if (lower === '--fast') {
fast = true
continue
}
if (lower === '--goal') {
goal = normalizeRecommendationGoal(argv[i + 1] ?? null)
i++
continue
}
if ((lower === 'auto' || lower === 'openai' || lower === 'ollama') && requestedProfile === 'auto') {
requestedProfile = lower as ProviderProfile | 'auto'
continue
@@ -54,6 +73,7 @@ function parseLaunchOptions(argv: string[]): LaunchOptions {
requestedProfile,
passthroughArgs,
fast,
goal,
}
}
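
Given this parser, a launch line can mix a positional profile with the new flags ('coding' is assumed to be a valid goal; the dev:profile alias comes from the scripts' own hints):

// bun run dev:profile -- ollama --fast --goal coding
// -> requestedProfile: 'ollama', fast: true, goal: 'coding';
//    anything unrecognized is forwarded via passthroughArgs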
@@ -71,18 +91,12 @@ function loadPersistedProfile(): ProfileFile | null {
}
}
async function resolveOllamaDefaultModel(
goal: ReturnType<typeof normalizeRecommendationGoal>,
): Promise<string> {
const models = await listOllamaModels()
const recommended = recommendOllamaModel(models, goal)
return recommended?.name || process.env.OPENAI_MODEL || 'llama3.1:8b'
}
function runCommand(command: string, env: NodeJS.ProcessEnv): Promise<number> {
@@ -99,7 +113,11 @@ function runCommand(command: string, env: NodeJS.ProcessEnv): Promise<number> {
})
}
async function buildEnv(
profile: ProviderProfile,
persisted: ProfileFile | null,
goal: ReturnType<typeof normalizeRecommendationGoal>,
): Promise<NodeJS.ProcessEnv> {
const persistedEnv = persisted?.env ?? {}
const env: NodeJS.ProcessEnv = {
...process.env,
@@ -107,8 +125,14 @@ function buildEnv(profile: ProviderProfile, persisted: ProfileFile | null): Node
}
if (profile === 'ollama') {
env.OPENAI_BASE_URL =
persistedEnv.OPENAI_BASE_URL ||
process.env.OPENAI_BASE_URL ||
getOllamaChatBaseUrl()
env.OPENAI_MODEL =
persistedEnv.OPENAI_MODEL ||
process.env.OPENAI_MODEL ||
await resolveOllamaDefaultModel(goal)
if (!process.env.OPENAI_API_KEY || process.env.OPENAI_API_KEY === 'SUA_CHAVE') {
delete env.OPENAI_API_KEY
}
@@ -116,7 +140,10 @@ function buildEnv(profile: ProviderProfile, persisted: ProfileFile | null): Node
}
env.OPENAI_BASE_URL = process.env.OPENAI_BASE_URL || persistedEnv.OPENAI_BASE_URL || 'https://api.openai.com/v1'
env.OPENAI_MODEL =
process.env.OPENAI_MODEL ||
persistedEnv.OPENAI_MODEL ||
getGoalDefaultOpenAIModel(goal)
env.OPENAI_API_KEY = process.env.OPENAI_API_KEY || persistedEnv.OPENAI_API_KEY
return env
}
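
Note the asymmetric precedence here: the Ollama branch lets the persisted profile override the live environment, while the OpenAI branch prefers the live environment. A worked example (values illustrative):

// Suppose .openclaude-profile.json persisted OPENAI_MODEL: 'qwen2.5-coder:7b'
// and the shell exports OPENAI_MODEL='llama3.1:8b'. Then:
//   buildEnv('ollama', persisted, goal) -> OPENAI_MODEL 'qwen2.5-coder:7b' (persisted wins)
//   buildEnv('openai', persisted, goal) -> OPENAI_MODEL 'llama3.1:8b'      (process.env wins)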
@@ -165,7 +192,7 @@ async function main(): Promise<void> {
profile = requestedProfile
}
const env = await buildEnv(profile, persisted, options.goal)
if (options.fast) {
applyFastFlags(env)
}

View File

@@ -0,0 +1,277 @@
// @ts-nocheck
import { writeFileSync } from 'node:fs'
import { resolve } from 'node:path'
import {
applyBenchmarkLatency,
getGoalDefaultOpenAIModel,
normalizeRecommendationGoal,
rankOllamaModels,
type BenchmarkedOllamaModel,
type RecommendationGoal,
} from '../src/utils/providerRecommendation.ts'
import {
benchmarkOllamaModel,
getOllamaChatBaseUrl,
hasLocalOllama,
listOllamaModels,
} from './provider-discovery.ts'
type ProviderProfile = 'openai' | 'ollama'
type ProfileFile = {
profile: ProviderProfile
env: {
OPENAI_BASE_URL?: string
OPENAI_MODEL?: string
OPENAI_API_KEY?: string
}
createdAt: string
}
type CliOptions = {
apply: boolean
benchmark: boolean
goal: RecommendationGoal
json: boolean
provider: ProviderProfile | 'auto'
baseUrl: string | null
}
function parseOptions(argv: string[]): CliOptions {
const options: CliOptions = {
apply: false,
benchmark: false,
goal: normalizeRecommendationGoal(process.env.OPENCLAUDE_PROFILE_GOAL),
json: false,
provider: 'auto',
baseUrl: null,
}
for (let i = 0; i < argv.length; i++) {
const arg = argv[i]?.toLowerCase()
if (!arg) continue
if (arg === '--apply') {
options.apply = true
continue
}
if (arg === '--benchmark') {
options.benchmark = true
continue
}
if (arg === '--json') {
options.json = true
continue
}
if (arg === '--goal') {
options.goal = normalizeRecommendationGoal(argv[i + 1] ?? null)
i++
continue
}
if (arg === '--provider') {
const provider = argv[i + 1]?.toLowerCase()
if (
provider === 'openai' ||
provider === 'ollama' ||
provider === 'auto'
) {
options.provider = provider
}
i++
continue
}
if (arg === '--base-url') {
options.baseUrl = argv[i + 1] ?? null
i++
}
}
return options
}
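
Putting the flags together (invocations shown against a hypothetical script alias, since package.json is not part of this view):

// Inspect recommendations, machine-readable:
//   bun run <recommend-script> -- --goal coding --json
// Benchmark the top-ranked local models, then persist the winner:
//   bun run <recommend-script> -- --goal coding --benchmark --apply
// Force a provider against a remote Ollama host:
//   bun run <recommend-script> -- --provider ollama --base-url http://192.168.0.10:11434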
function sanitizeApiKey(key: string | undefined): string | undefined {
if (!key || key === 'SUA_CHAVE') return undefined
return key
}
function printHumanSummary(payload: {
goal: RecommendationGoal
recommendedProfile: ProviderProfile
recommendedModel: string
rankedModels: BenchmarkedOllamaModel[]
benchmarked: boolean
applied: boolean
}): void {
console.log(`Recommendation goal: ${payload.goal}`)
console.log(`Recommended profile: ${payload.recommendedProfile}`)
console.log(`Recommended model: ${payload.recommendedModel}`)
if (payload.rankedModels.length > 0) {
console.log('\nRanked Ollama models:')
for (const [index, model] of payload.rankedModels.slice(0, 5).entries()) {
const benchmarkPart =
payload.benchmarked && model.benchmarkMs !== null
? ` | ${Math.round(model.benchmarkMs)}ms`
: ''
console.log(
`${index + 1}. ${model.name} | score=${model.score}${benchmarkPart} | ${model.summary}`,
)
}
}
if (payload.applied) {
console.log('\nSaved .openclaude-profile.json with the recommended profile.')
console.log('Next: bun run dev:profile')
} else {
console.log(
'\nTip: run `bun run profile:auto -- --goal ' +
payload.goal +
'` to apply this automatically.',
)
}
}
async function maybeApplyProfile(
profile: ProviderProfile,
model: string,
goal: RecommendationGoal,
baseUrl: string | null,
): Promise<boolean> {
const env: ProfileFile['env'] = {}
if (profile === 'ollama') {
env.OPENAI_BASE_URL = getOllamaChatBaseUrl(baseUrl ?? undefined)
env.OPENAI_MODEL = model
const key = sanitizeApiKey(process.env.OPENAI_API_KEY)
if (key) env.OPENAI_API_KEY = key
} else {
const key = sanitizeApiKey(process.env.OPENAI_API_KEY)
if (!key) {
console.error('Cannot apply an OpenAI profile without OPENAI_API_KEY.')
return false
}
env.OPENAI_BASE_URL =
process.env.OPENAI_BASE_URL || 'https://api.openai.com/v1'
env.OPENAI_MODEL = model || getGoalDefaultOpenAIModel(goal)
env.OPENAI_API_KEY = key
}
const profileFile: ProfileFile = {
profile,
env,
createdAt: new Date().toISOString(),
}
writeFileSync(
resolve(process.cwd(), '.openclaude-profile.json'),
JSON.stringify(profileFile, null, 2),
'utf8',
)
return true
}
async function main(): Promise<void> {
const options = parseOptions(process.argv.slice(2))
const ollamaAvailable =
options.provider !== 'openai' &&
(await hasLocalOllama(options.baseUrl ?? undefined))
const ollamaModels = ollamaAvailable
? await listOllamaModels(options.baseUrl ?? undefined)
: []
const heuristicRanked = rankOllamaModels(ollamaModels, options.goal)
const benchmarkInput = options.benchmark ? heuristicRanked.slice(0, 3) : []
const benchmarkResults: Record<string, number | null> = {}
for (const model of benchmarkInput) {
benchmarkResults[model.name] = await benchmarkOllamaModel(
model.name,
options.baseUrl ?? undefined,
)
}
const rankedModels: BenchmarkedOllamaModel[] = options.benchmark
? applyBenchmarkLatency(heuristicRanked, benchmarkResults, options.goal)
: heuristicRanked.map(model => ({
...model,
benchmarkMs: null,
}))
const recommendedOllama = rankedModels[0] ?? null
const openAIConfigured = Boolean(sanitizeApiKey(process.env.OPENAI_API_KEY))
let recommendedProfile: ProviderProfile
let recommendedModel: string
if (options.provider === 'openai') {
recommendedProfile = 'openai'
recommendedModel = getGoalDefaultOpenAIModel(options.goal)
} else if (options.provider === 'ollama') {
if (!recommendedOllama) {
console.error(
'No Ollama models were discovered. Pull a model first or switch to --provider openai.',
)
process.exit(1)
}
recommendedProfile = 'ollama'
recommendedModel = recommendedOllama.name
} else if (recommendedOllama) {
recommendedProfile = 'ollama'
recommendedModel = recommendedOllama.name
} else {
recommendedProfile = 'openai'
recommendedModel = getGoalDefaultOpenAIModel(options.goal)
}
let applied = false
if (options.apply) {
applied = await maybeApplyProfile(
recommendedProfile,
recommendedModel,
options.goal,
options.baseUrl,
)
if (!applied) {
process.exit(1)
}
}
const payload = {
goal: options.goal,
provider: options.provider,
ollamaAvailable,
openAIConfigured,
recommendedProfile,
recommendedModel,
benchmarked: options.benchmark,
rankedModels,
applied,
}
if (options.json) {
console.log(JSON.stringify(payload, null, 2))
return
}
printHumanSummary({
goal: options.goal,
recommendedProfile,
recommendedModel,
rankedModels,
benchmarked: options.benchmark,
applied,
})
if (!recommendedOllama && !openAIConfigured) {
console.log(
'\nNo local Ollama model was detected and OPENAI_API_KEY is unset.',
)
console.log(
'Next steps: `ollama pull qwen2.5-coder:7b` or set OPENAI_API_KEY.',
)
}
}
await main()
export {}
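
Finally, rankOllamaModels and applyBenchmarkLatency are likewise imported without being shown in this view. A minimal sketch of the assumed blending step, continuing the earlier sketch's types (weights invented for illustration; the ranked entries do carry the score, summary, and benchmarkMs fields this script prints):

// Hypothetical sketch -- the committed implementation may differ.
type RankedOllamaModel = OllamaModelDescriptor & { score: number; summary: string }
type BenchmarkedOllamaModel = RankedOllamaModel & { benchmarkMs: number | null }

export function applyBenchmarkLatency(
  ranked: RankedOllamaModel[],
  results: Record<string, number | null>,
  goal: RecommendationGoal,
): BenchmarkedOllamaModel[] {
  // Blend measured latency into the heuristic score: faster replies gain
  // points, weighted more heavily when the goal is 'fast'.
  const weight = goal === 'fast' ? 2 : 1
  return ranked
    .map(model => {
      const benchmarkMs = results[model.name] ?? null
      const bonus = benchmarkMs === null ? 0 : weight * (10_000 / (benchmarkMs + 100))
      return { ...model, benchmarkMs, score: Math.round(model.score + bonus) }
    })
    .sort((a, b) => b.score - a.score)
}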