model.ts
utils/model/model.ts
619
Lines
21409
Bytes
30
Exports
13
Imports
10
Keywords
What this is
This page documents one file from the repository and includes its full source so you can read it without leaving the docs site.
Beginner explanation
This file is one piece of the larger system. Its name, directory, imports, and exports show where it fits. Start by reading the exports and related files first.
How it is used
Start from the exports list and related files. Those are the easiest clues for where this file fits into the system.
Expert explanation
Architecturally, this file intersects with modes. It contains 619 lines, 13 detected imports, and 30 detected exports.
Important relationships
Detected exports
ModelShortNameModelNameModelSettinggetSmallFastModelisNonCustomOpusModelgetUserSpecifiedModelSettinggetMainLoopModelgetBestModelgetDefaultOpusModelgetDefaultSonnetModelgetDefaultHaikuModelgetRuntimeMainLoopModelgetDefaultMainLoopModelSettinggetDefaultMainLoopModelfirstPartyNameToCanonicalgetCanonicalNamegetClaudeAiUserDefaultModelDescriptionrenderDefaultModelSettinggetOpus46PricingSuffixisOpus1mMergeEnabledrenderModelSettinggetPublicModelDisplayNamerenderModelNamegetPublicModelNameparseUserSpecifiedModelresolveSkillModelOverrideisLegacyModelRemapEnabledmodelDisplayStringgetMarketingNameForModelnormalizeModelStringForAPI
Keywords
modelnameopussonnetincludesgetmodelstringsmodelnamecasecanonicalcontext
Detected imports
../../bootstrap/state.js../auth.js../context.js../envUtils.js./modelStrings.js../modelCost.js../settings/settings.js../permissions/PermissionMode.js./providers.js../../constants/figures.js./modelAllowlist.js./aliases.js../stringUtils.js
Source notes
This page embeds the full file contents. Small or leaf files are still indexed honestly instead of being over-explained.
Full source
// biome-ignore-all assist/source/organizeImports: ANT-ONLY import markers must not be reordered
/**
* Ensure that any model codenames introduced here are also added to
* scripts/excluded-strings.txt to avoid leaking them. Wrap any codename string
* literals with process.env.USER_TYPE === 'ant' for Bun to remove the codenames
* during dead code elimination
*/
import { getMainLoopModelOverride } from '../../bootstrap/state.js'
import {
getSubscriptionType,
isClaudeAISubscriber,
isMaxSubscriber,
isProSubscriber,
isTeamPremiumSubscriber,
} from '../auth.js'
import {
has1mContext,
is1mContextDisabled,
modelSupports1M,
} from '../context.js'
import { isEnvTruthy } from '../envUtils.js'
import { getModelStrings, resolveOverriddenModel } from './modelStrings.js'
import { formatModelPricing, getOpus46CostTier } from '../modelCost.js'
import { getSettings_DEPRECATED } from '../settings/settings.js'
import type { PermissionMode } from '../permissions/PermissionMode.js'
import { getAPIProvider } from './providers.js'
import { LIGHTNING_BOLT } from '../../constants/figures.js'
import { isModelAllowed } from './modelAllowlist.js'
import { type ModelAlias, isModelAlias } from './aliases.js'
import { capitalize } from '../stringUtils.js'
export type ModelShortName = string
export type ModelName = string
export type ModelSetting = ModelName | ModelAlias | null
export function getSmallFastModel(): ModelName {
return process.env.ANTHROPIC_SMALL_FAST_MODEL || getDefaultHaikuModel()
}
export function isNonCustomOpusModel(model: ModelName): boolean {
return (
model === getModelStrings().opus40 ||
model === getModelStrings().opus41 ||
model === getModelStrings().opus45 ||
model === getModelStrings().opus46
)
}
/**
* Helper to get the model from /model (including via /config), the --model flag, environment variable,
* or the saved settings. The returned value can be a model alias if that's what the user specified.
* Undefined if the user didn't configure anything, in which case we fall back to
* the default (null).
*
* Priority order within this function:
* 1. Model override during session (from /model command) - highest priority
* 2. Model override at startup (from --model flag)
* 3. ANTHROPIC_MODEL environment variable
* 4. Settings (from user's saved settings)
*/
export function getUserSpecifiedModelSetting(): ModelSetting | undefined {
let specifiedModel: ModelSetting | undefined
const modelOverride = getMainLoopModelOverride()
if (modelOverride !== undefined) {
specifiedModel = modelOverride
} else {
const settings = getSettings_DEPRECATED() || {}
specifiedModel = process.env.ANTHROPIC_MODEL || settings.model || undefined
}
// Ignore the user-specified model if it's not in the availableModels allowlist.
if (specifiedModel && !isModelAllowed(specifiedModel)) {
return undefined
}
return specifiedModel
}
/**
* Get the main loop model to use for the current session.
*
* Model Selection Priority Order:
* 1. Model override during session (from /model command) - highest priority
* 2. Model override at startup (from --model flag)
* 3. ANTHROPIC_MODEL environment variable
* 4. Settings (from user's saved settings)
* 5. Built-in default
*
* @returns The resolved model name to use
*/
export function getMainLoopModel(): ModelName {
const model = getUserSpecifiedModelSetting()
if (model !== undefined && model !== null) {
return parseUserSpecifiedModel(model)
}
return getDefaultMainLoopModel()
}
export function getBestModel(): ModelName {
return getDefaultOpusModel()
}
// @[MODEL LAUNCH]: Update the default Opus model (3P providers may lag so keep defaults unchanged).
export function getDefaultOpusModel(): ModelName {
if (process.env.ANTHROPIC_DEFAULT_OPUS_MODEL) {
return process.env.ANTHROPIC_DEFAULT_OPUS_MODEL
}
// 3P providers (Bedrock, Vertex, Foundry) — kept as a separate branch
// even when values match, since 3P availability lags firstParty and
// these will diverge again at the next model launch.
if (getAPIProvider() !== 'firstParty') {
return getModelStrings().opus46
}
return getModelStrings().opus46
}
// @[MODEL LAUNCH]: Update the default Sonnet model (3P providers may lag so keep defaults unchanged).
export function getDefaultSonnetModel(): ModelName {
if (process.env.ANTHROPIC_DEFAULT_SONNET_MODEL) {
return process.env.ANTHROPIC_DEFAULT_SONNET_MODEL
}
// Default to Sonnet 4.5 for 3P since they may not have 4.6 yet
if (getAPIProvider() !== 'firstParty') {
return getModelStrings().sonnet45
}
return getModelStrings().sonnet46
}
// @[MODEL LAUNCH]: Update the default Haiku model (3P providers may lag so keep defaults unchanged).
export function getDefaultHaikuModel(): ModelName {
if (process.env.ANTHROPIC_DEFAULT_HAIKU_MODEL) {
return process.env.ANTHROPIC_DEFAULT_HAIKU_MODEL
}
// Haiku 4.5 is available on all platforms (first-party, Foundry, Bedrock, Vertex)
return getModelStrings().haiku45
}
/**
* Get the model to use for runtime, depending on the runtime context.
* @param params Subset of the runtime context to determine the model to use.
* @returns The model to use
*/
export function getRuntimeMainLoopModel(params: {
permissionMode: PermissionMode
mainLoopModel: string
exceeds200kTokens?: boolean
}): ModelName {
const { permissionMode, mainLoopModel, exceeds200kTokens = false } = params
// opusplan uses Opus in plan mode without [1m] suffix.
if (
getUserSpecifiedModelSetting() === 'opusplan' &&
permissionMode === 'plan' &&
!exceeds200kTokens
) {
return getDefaultOpusModel()
}
// sonnetplan by default
if (getUserSpecifiedModelSetting() === 'haiku' && permissionMode === 'plan') {
return getDefaultSonnetModel()
}
return mainLoopModel
}
/**
* Get the default main loop model setting.
*
* This handles the built-in default:
* - Opus for Max and Team Premium users
* - Sonnet 4.6 for all other users (including Team Standard, Pro, Enterprise)
*
* @returns The default model setting to use
*/
export function getDefaultMainLoopModelSetting(): ModelName | ModelAlias {
// Ants default to defaultModel from flag config, or Opus 1M if not configured
if (process.env.USER_TYPE === 'ant') {
return (
getAntModelOverrideConfig()?.defaultModel ??
getDefaultOpusModel() + '[1m]'
)
}
// Max users get Opus as default
if (isMaxSubscriber()) {
return getDefaultOpusModel() + (isOpus1mMergeEnabled() ? '[1m]' : '')
}
// Team Premium gets Opus (same as Max)
if (isTeamPremiumSubscriber()) {
return getDefaultOpusModel() + (isOpus1mMergeEnabled() ? '[1m]' : '')
}
// PAYG (1P and 3P), Enterprise, Team Standard, and Pro get Sonnet as default
// Note that PAYG (3P) may default to an older Sonnet model
return getDefaultSonnetModel()
}
/**
* Synchronous operation to get the default main loop model to use
* (bypassing any user-specified values).
*/
export function getDefaultMainLoopModel(): ModelName {
return parseUserSpecifiedModel(getDefaultMainLoopModelSetting())
}
// @[MODEL LAUNCH]: Add a canonical name mapping for the new model below.
/**
* Pure string-match that strips date/provider suffixes from a first-party model
* name. Input must already be a 1P-format ID (e.g. 'claude-3-7-sonnet-20250219',
* 'us.anthropic.claude-opus-4-6-v1:0'). Does not touch settings, so safe at
* module top-level (see MODEL_COSTS in modelCost.ts).
*/
export function firstPartyNameToCanonical(name: ModelName): ModelShortName {
name = name.toLowerCase()
// Special cases for Claude 4+ models to differentiate versions
// Order matters: check more specific versions first (4-5 before 4)
if (name.includes('claude-opus-4-6')) {
return 'claude-opus-4-6'
}
if (name.includes('claude-opus-4-5')) {
return 'claude-opus-4-5'
}
if (name.includes('claude-opus-4-1')) {
return 'claude-opus-4-1'
}
if (name.includes('claude-opus-4')) {
return 'claude-opus-4'
}
if (name.includes('claude-sonnet-4-6')) {
return 'claude-sonnet-4-6'
}
if (name.includes('claude-sonnet-4-5')) {
return 'claude-sonnet-4-5'
}
if (name.includes('claude-sonnet-4')) {
return 'claude-sonnet-4'
}
if (name.includes('claude-haiku-4-5')) {
return 'claude-haiku-4-5'
}
// Claude 3.x models use a different naming scheme (claude-3-{family})
if (name.includes('claude-3-7-sonnet')) {
return 'claude-3-7-sonnet'
}
if (name.includes('claude-3-5-sonnet')) {
return 'claude-3-5-sonnet'
}
if (name.includes('claude-3-5-haiku')) {
return 'claude-3-5-haiku'
}
if (name.includes('claude-3-opus')) {
return 'claude-3-opus'
}
if (name.includes('claude-3-sonnet')) {
return 'claude-3-sonnet'
}
if (name.includes('claude-3-haiku')) {
return 'claude-3-haiku'
}
const match = name.match(/(claude-(\d+-\d+-)?\w+)/)
if (match && match[1]) {
return match[1]
}
// Fall back to the original name if no pattern matches
return name
}
/**
* Maps a full model string to a shorter canonical version that's unified across 1P and 3P providers.
* For example, 'claude-3-5-haiku-20241022' and 'us.anthropic.claude-3-5-haiku-20241022-v1:0'
* would both be mapped to 'claude-3-5-haiku'.
* @param fullModelName The full model name (e.g., 'claude-3-5-haiku-20241022')
* @returns The short name (e.g., 'claude-3-5-haiku') if found, or the original name if no mapping exists
*/
export function getCanonicalName(fullModelName: ModelName): ModelShortName {
// Resolve overridden model IDs (e.g. Bedrock ARNs) back to canonical names.
// resolved is always a 1P-format ID, so firstPartyNameToCanonical can handle it.
return firstPartyNameToCanonical(resolveOverriddenModel(fullModelName))
}
// @[MODEL LAUNCH]: Update the default model description strings shown to users.
export function getClaudeAiUserDefaultModelDescription(
fastMode = false,
): string {
if (isMaxSubscriber() || isTeamPremiumSubscriber()) {
if (isOpus1mMergeEnabled()) {
return `Opus 4.6 with 1M context · Most capable for complex work${fastMode ? getOpus46PricingSuffix(true) : ''}`
}
return `Opus 4.6 · Most capable for complex work${fastMode ? getOpus46PricingSuffix(true) : ''}`
}
return 'Sonnet 4.6 · Best for everyday tasks'
}
export function renderDefaultModelSetting(
setting: ModelName | ModelAlias,
): string {
if (setting === 'opusplan') {
return 'Opus 4.6 in plan mode, else Sonnet 4.6'
}
return renderModelName(parseUserSpecifiedModel(setting))
}
export function getOpus46PricingSuffix(fastMode: boolean): string {
if (getAPIProvider() !== 'firstParty') return ''
const pricing = formatModelPricing(getOpus46CostTier(fastMode))
const fastModeIndicator = fastMode ? ` (${LIGHTNING_BOLT})` : ''
return ` ·${fastModeIndicator} ${pricing}`
}
export function isOpus1mMergeEnabled(): boolean {
if (
is1mContextDisabled() ||
isProSubscriber() ||
getAPIProvider() !== 'firstParty'
) {
return false
}
// Fail closed when a subscriber's subscription type is unknown. The VS Code
// config-loading subprocess can have OAuth tokens with valid scopes but no
// subscriptionType field (stale or partial refresh). Without this guard,
// isProSubscriber() returns false for such users and the merge leaks
// opus[1m] into the model dropdown — the API then rejects it with a
// misleading "rate limit reached" error.
if (isClaudeAISubscriber() && getSubscriptionType() === null) {
return false
}
return true
}
export function renderModelSetting(setting: ModelName | ModelAlias): string {
if (setting === 'opusplan') {
return 'Opus Plan'
}
if (isModelAlias(setting)) {
return capitalize(setting)
}
return renderModelName(setting)
}
// @[MODEL LAUNCH]: Add display name cases for the new model (base + [1m] variant if applicable).
/**
* Returns a human-readable display name for known public models, or null
* if the model is not recognized as a public model.
*/
export function getPublicModelDisplayName(model: ModelName): string | null {
switch (model) {
case getModelStrings().opus46:
return 'Opus 4.6'
case getModelStrings().opus46 + '[1m]':
return 'Opus 4.6 (1M context)'
case getModelStrings().opus45:
return 'Opus 4.5'
case getModelStrings().opus41:
return 'Opus 4.1'
case getModelStrings().opus40:
return 'Opus 4'
case getModelStrings().sonnet46 + '[1m]':
return 'Sonnet 4.6 (1M context)'
case getModelStrings().sonnet46:
return 'Sonnet 4.6'
case getModelStrings().sonnet45 + '[1m]':
return 'Sonnet 4.5 (1M context)'
case getModelStrings().sonnet45:
return 'Sonnet 4.5'
case getModelStrings().sonnet40:
return 'Sonnet 4'
case getModelStrings().sonnet40 + '[1m]':
return 'Sonnet 4 (1M context)'
case getModelStrings().sonnet37:
return 'Sonnet 3.7'
case getModelStrings().sonnet35:
return 'Sonnet 3.5'
case getModelStrings().haiku45:
return 'Haiku 4.5'
case getModelStrings().haiku35:
return 'Haiku 3.5'
default:
return null
}
}
function maskModelCodename(baseName: string): string {
// Mask only the first dash-separated segment (the codename), preserve the rest
// e.g. capybara-v2-fast → cap*****-v2-fast
const [codename = '', ...rest] = baseName.split('-')
const masked =
codename.slice(0, 3) + '*'.repeat(Math.max(0, codename.length - 3))
return [masked, ...rest].join('-')
}
export function renderModelName(model: ModelName): string {
const publicName = getPublicModelDisplayName(model)
if (publicName) {
return publicName
}
if (process.env.USER_TYPE === 'ant') {
const resolved = parseUserSpecifiedModel(model)
const antModel = resolveAntModel(model)
if (antModel) {
const baseName = antModel.model.replace(/\[1m\]$/i, '')
const masked = maskModelCodename(baseName)
const suffix = has1mContext(resolved) ? '[1m]' : ''
return masked + suffix
}
if (resolved !== model) {
return `${model} (${resolved})`
}
return resolved
}
return model
}
/**
* Returns a safe author name for public display (e.g., in git commit trailers).
* Returns "Claude {ModelName}" for publicly known models, or "Claude ({model})"
* for unknown/internal models so the exact model name is preserved.
*
* @param model The full model name
* @returns "Claude {ModelName}" for public models, or "Claude ({model})" for non-public models
*/
export function getPublicModelName(model: ModelName): string {
const publicName = getPublicModelDisplayName(model)
if (publicName) {
return `Claude ${publicName}`
}
return `Claude (${model})`
}
/**
* Returns a full model name for use in this session, possibly after resolving
* a model alias.
*
* This function intentionally does not support version numbers to align with
* the model switcher.
*
* Supports [1m] suffix on any model alias (e.g., haiku[1m], sonnet[1m]) to enable
* 1M context window without requiring each variant to be in MODEL_ALIASES.
*
* @param modelInput The model alias or name provided by the user.
*/
export function parseUserSpecifiedModel(
modelInput: ModelName | ModelAlias,
): ModelName {
const modelInputTrimmed = modelInput.trim()
const normalizedModel = modelInputTrimmed.toLowerCase()
const has1mTag = has1mContext(normalizedModel)
const modelString = has1mTag
? normalizedModel.replace(/\[1m]$/i, '').trim()
: normalizedModel
if (isModelAlias(modelString)) {
switch (modelString) {
case 'opusplan':
return getDefaultSonnetModel() + (has1mTag ? '[1m]' : '') // Sonnet is default, Opus in plan mode
case 'sonnet':
return getDefaultSonnetModel() + (has1mTag ? '[1m]' : '')
case 'haiku':
return getDefaultHaikuModel() + (has1mTag ? '[1m]' : '')
case 'opus':
return getDefaultOpusModel() + (has1mTag ? '[1m]' : '')
case 'best':
return getBestModel()
default:
}
}
// Opus 4/4.1 are no longer available on the first-party API (same as
// Claude.ai) — silently remap to the current Opus default. The 'opus'
// alias already resolves to 4.6, so the only users on these explicit
// strings pinned them in settings/env/--model/SDK before 4.5 launched.
// 3P providers may not yet have 4.6 capacity, so pass through unchanged.
if (
getAPIProvider() === 'firstParty' &&
isLegacyOpusFirstParty(modelString) &&
isLegacyModelRemapEnabled()
) {
return getDefaultOpusModel() + (has1mTag ? '[1m]' : '')
}
if (process.env.USER_TYPE === 'ant') {
const has1mAntTag = has1mContext(normalizedModel)
const baseAntModel = normalizedModel.replace(/\[1m]$/i, '').trim()
const antModel = resolveAntModel(baseAntModel)
if (antModel) {
const suffix = has1mAntTag ? '[1m]' : ''
return antModel.model + suffix
}
// Fall through to the alias string if we cannot load the config. The API calls
// will fail with this string, but we should hear about it through feedback and
// can tell the user to restart/wait for flag cache refresh to get the latest values.
}
// Preserve original case for custom model names (e.g., Azure Foundry deployment IDs)
// Only strip [1m] suffix if present, maintaining case of the base model
if (has1mTag) {
return modelInputTrimmed.replace(/\[1m\]$/i, '').trim() + '[1m]'
}
return modelInputTrimmed
}
/**
* Resolves a skill's `model:` frontmatter against the current model, carrying
* the `[1m]` suffix over when the target family supports it.
*
* A skill author writing `model: opus` means "use opus-class reasoning" — not
* "downgrade to 200K". If the user is on opus[1m] at 230K tokens and invokes a
* skill with `model: opus`, passing the bare alias through drops the effective
* context window from 1M to 200K, which trips autocompact at 23% apparent usage
* and surfaces "Context limit reached" even though nothing overflowed.
*
* We only carry [1m] when the target actually supports it (sonnet/opus). A skill
* with `model: haiku` on a 1M session still downgrades — haiku has no 1M variant,
* so the autocompact that follows is correct. Skills that already specify [1m]
* are left untouched.
*/
export function resolveSkillModelOverride(
skillModel: string,
currentModel: string,
): string {
if (has1mContext(skillModel) || !has1mContext(currentModel)) {
return skillModel
}
// modelSupports1M matches on canonical IDs ('claude-opus-4-6', 'claude-sonnet-4');
// a bare 'opus' alias falls through getCanonicalName unmatched. Resolve first.
if (modelSupports1M(parseUserSpecifiedModel(skillModel))) {
return skillModel + '[1m]'
}
return skillModel
}
const LEGACY_OPUS_FIRSTPARTY = [
'claude-opus-4-20250514',
'claude-opus-4-1-20250805',
'claude-opus-4-0',
'claude-opus-4-1',
]
function isLegacyOpusFirstParty(model: string): boolean {
return LEGACY_OPUS_FIRSTPARTY.includes(model)
}
/**
* Opt-out for the legacy Opus 4.0/4.1 → current Opus remap.
*/
export function isLegacyModelRemapEnabled(): boolean {
return !isEnvTruthy(process.env.CLAUDE_CODE_DISABLE_LEGACY_MODEL_REMAP)
}
export function modelDisplayString(model: ModelSetting): string {
if (model === null) {
if (process.env.USER_TYPE === 'ant') {
return `Default for Ants (${renderDefaultModelSetting(getDefaultMainLoopModelSetting())})`
} else if (isClaudeAISubscriber()) {
return `Default (${getClaudeAiUserDefaultModelDescription()})`
}
return `Default (${getDefaultMainLoopModel()})`
}
const resolvedModel = parseUserSpecifiedModel(model)
return model === resolvedModel ? resolvedModel : `${model} (${resolvedModel})`
}
// @[MODEL LAUNCH]: Add a marketing name mapping for the new model below.
export function getMarketingNameForModel(modelId: string): string | undefined {
if (getAPIProvider() === 'foundry') {
// deployment ID is user-defined in Foundry, so it may have no relation to the actual model
return undefined
}
const has1m = modelId.toLowerCase().includes('[1m]')
const canonical = getCanonicalName(modelId)
if (canonical.includes('claude-opus-4-6')) {
return has1m ? 'Opus 4.6 (with 1M context)' : 'Opus 4.6'
}
if (canonical.includes('claude-opus-4-5')) {
return 'Opus 4.5'
}
if (canonical.includes('claude-opus-4-1')) {
return 'Opus 4.1'
}
if (canonical.includes('claude-opus-4')) {
return 'Opus 4'
}
if (canonical.includes('claude-sonnet-4-6')) {
return has1m ? 'Sonnet 4.6 (with 1M context)' : 'Sonnet 4.6'
}
if (canonical.includes('claude-sonnet-4-5')) {
return has1m ? 'Sonnet 4.5 (with 1M context)' : 'Sonnet 4.5'
}
if (canonical.includes('claude-sonnet-4')) {
return has1m ? 'Sonnet 4 (with 1M context)' : 'Sonnet 4'
}
if (canonical.includes('claude-3-7-sonnet')) {
return 'Claude 3.7 Sonnet'
}
if (canonical.includes('claude-3-5-sonnet')) {
return 'Claude 3.5 Sonnet'
}
if (canonical.includes('claude-haiku-4-5')) {
return 'Haiku 4.5'
}
if (canonical.includes('claude-3-5-haiku')) {
return 'Claude 3.5 Haiku'
}
return undefined
}
export function normalizeModelStringForAPI(model: string): string {
return model.replace(/\[(1|2)m\]/gi, '')
}