Skip to content

Commit 68e5d89

Browse files
authored
chore: bump and switch LLM models per query complexity (CM-1051) (#3944)
Signed-off-by: Yeganathan S <63534555+skwowet@users.noreply.github.com>
1 parent e2e09fa commit 68e5d89

2 files changed

Lines changed: 21 additions & 15 deletions

File tree

services/libs/types/src/enums/llm.ts

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -3,6 +3,7 @@ export enum LlmModelType {
33
CLAUDE_3_5_SONNET_V2 = 'anthropic.claude-3-5-sonnet-20241022-v2:0',
44
CLAUDE_3_OPUS = 'anthropic.claude-3-opus-20240229-v1:0',
55
CLAUDE_SONNET_4 = 'us.anthropic.claude-sonnet-4-20250514-v1:0',
6+
CLAUDE_HAIKU_4_5 = 'us.anthropic.claude-haiku-4-5-20251001-v1:0',
67
}
78

89
export enum LlmQueryType {

services/libs/types/src/llm.ts

Lines changed: 20 additions & 15 deletions
Original file line number | Diff line number | Diff line change
@@ -32,6 +32,7 @@ export const LLM_MODEL_REGION_MAP: Record<LlmModelType, string> = {
3232
[LlmModelType.CLAUDE_3_5_SONNET]: 'us-east-1',
3333
[LlmModelType.CLAUDE_3_5_SONNET_V2]: 'us-west-2',
3434
[LlmModelType.CLAUDE_SONNET_4]: 'us-east-1',
35+
[LlmModelType.CLAUDE_HAIKU_4_5]: 'us-east-1',
3536
}
3637

3738
// to estimate costs - these numbers can change
@@ -52,67 +53,71 @@ export const LLM_MODEL_PRICING_MAP: Record<LlmModelType, ILlmPricing> = {
5253
costPer1000InputTokens: 0.003,
5354
costPer1000OutputTokens: 0.015,
5455
},
56+
[LlmModelType.CLAUDE_HAIKU_4_5]: {
57+
costPer1000InputTokens: 0.001,
58+
costPer1000OutputTokens: 0.005,
59+
},
5560
}
5661

5762
export const LLM_SETTINGS: Record<LlmQueryType, ILlmSettings> = {
5863
[LlmQueryType.MEMBER_ENRICHMENT]: {
59-
modelId: LlmModelType.CLAUDE_3_5_SONNET,
64+
modelId: LlmModelType.CLAUDE_SONNET_4,
6065
arguments: {
61-
max_tokens: 200000,
66+
max_tokens: 65536,
6267
anthropic_version: 'bedrock-2023-05-31',
6368
temperature: 0,
6469
},
6570
},
6671
[LlmQueryType.MEMBER_ENRICHMENT_FIND_RELATED_LINKEDIN_PROFILES]: {
67-
modelId: LlmModelType.CLAUDE_3_5_SONNET_V2,
72+
modelId: LlmModelType.CLAUDE_HAIKU_4_5,
6873
arguments: {
69-
max_tokens: 200000,
74+
max_tokens: 2000,
7075
anthropic_version: 'bedrock-2023-05-31',
7176
temperature: 0,
7277
},
7378
},
7479
[LlmQueryType.MEMBER_ENRICHMENT_SQUASH_MULTIPLE_VALUE_ATTRIBUTES]: {
75-
modelId: LlmModelType.CLAUDE_3_5_SONNET_V2,
80+
modelId: LlmModelType.CLAUDE_SONNET_4,
7681
arguments: {
77-
max_tokens: 200000,
82+
max_tokens: 40000,
7883
anthropic_version: 'bedrock-2023-05-31',
7984
temperature: 0,
8085
},
8186
},
8287
[LlmQueryType.MEMBER_ENRICHMENT_SQUASH_WORK_EXPERIENCES_FROM_MULTIPLE_SOURCES]: {
83-
modelId: LlmModelType.CLAUDE_3_5_SONNET_V2,
88+
modelId: LlmModelType.CLAUDE_SONNET_4,
8489
arguments: {
85-
max_tokens: 200000,
90+
max_tokens: 40000,
8691
anthropic_version: 'bedrock-2023-05-31',
8792
temperature: 0,
8893
},
8994
},
9095
[LlmQueryType.MATCH_MAIN_GITHUB_ORGANIZATION_AND_DESCRIPTION]: {
91-
modelId: LlmModelType.CLAUDE_3_5_SONNET_V2,
96+
modelId: LlmModelType.CLAUDE_HAIKU_4_5,
9297
arguments: {
93-
max_tokens: 200000,
98+
max_tokens: 5000,
9499
anthropic_version: 'bedrock-2023-05-31',
95100
temperature: 0,
96101
},
97102
},
98103
[LlmQueryType.REPO_CATEGORIES]: {
99-
modelId: LlmModelType.CLAUDE_3_5_SONNET_V2,
104+
modelId: LlmModelType.CLAUDE_SONNET_4,
100105
arguments: {
101-
max_tokens: 200000,
106+
max_tokens: 2000,
102107
anthropic_version: 'bedrock-2023-05-31',
103108
temperature: 0,
104109
},
105110
},
106111
[LlmQueryType.REPO_COLLECTIONS]: {
107-
modelId: LlmModelType.CLAUDE_3_5_SONNET_V2,
112+
modelId: LlmModelType.CLAUDE_SONNET_4,
108113
arguments: {
109-
max_tokens: 200000,
114+
max_tokens: 2000,
110115
anthropic_version: 'bedrock-2023-05-31',
111116
temperature: 0,
112117
},
113118
},
114119
[LlmQueryType.MEMBER_BOT_VALIDATION]: {
115-
modelId: LlmModelType.CLAUDE_SONNET_4,
120+
modelId: LlmModelType.CLAUDE_HAIKU_4_5,
116121
arguments: {
117122
max_tokens: 2000,
118123
anthropic_version: 'bedrock-2023-05-31',

0 commit comments

Comments
 (0)