From 632ba05e001131ee3e9dcf2df6e1d34dca9c4d94 Mon Sep 17 00:00:00 2001 From: Yeganathan S <63534555+skwowet@users.noreply.github.com> Date: Mon, 23 Mar 2026 17:18:42 +0530 Subject: [PATCH 1/3] feat: use Claude Haiku 4.5 for low-complexity llm queries Signed-off-by: Yeganathan S <63534555+skwowet@users.noreply.github.com> --- services/libs/types/src/enums/llm.ts | 1 + services/libs/types/src/llm.ts | 13 +++++++++---- 2 files changed, 10 insertions(+), 4 deletions(-) diff --git a/services/libs/types/src/enums/llm.ts b/services/libs/types/src/enums/llm.ts index b95b8dc3c5..1a5a7bd340 100644 --- a/services/libs/types/src/enums/llm.ts +++ b/services/libs/types/src/enums/llm.ts @@ -3,6 +3,7 @@ export enum LlmModelType { CLAUDE_3_5_SONNET_V2 = 'anthropic.claude-3-5-sonnet-20241022-v2:0', CLAUDE_3_OPUS = 'anthropic.claude-3-opus-20240229-v1:0', CLAUDE_SONNET_4 = 'us.anthropic.claude-sonnet-4-20250514-v1:0', + CLAUDE_HAIKU_4_5 = 'us.anthropic.claude-haiku-4-5-20251001-v1:0', } export enum LlmQueryType { diff --git a/services/libs/types/src/llm.ts b/services/libs/types/src/llm.ts index 2e79cd2ff3..13546c984d 100644 --- a/services/libs/types/src/llm.ts +++ b/services/libs/types/src/llm.ts @@ -32,6 +32,7 @@ export const LLM_MODEL_REGION_MAP: Record = { [LlmModelType.CLAUDE_3_5_SONNET]: 'us-east-1', [LlmModelType.CLAUDE_3_5_SONNET_V2]: 'us-west-2', [LlmModelType.CLAUDE_SONNET_4]: 'us-east-1', + [LlmModelType.CLAUDE_HAIKU_4_5]: 'us-east-1', } // to estimate costs - these numbers can change @@ -52,6 +53,10 @@ export const LLM_MODEL_PRICING_MAP: Record = { costPer1000InputTokens: 0.003, costPer1000OutputTokens: 0.015, }, + [LlmModelType.CLAUDE_HAIKU_4_5]: { + costPer1000InputTokens: 0.001, + costPer1000OutputTokens: 0.005, + }, } export const LLM_SETTINGS: Record = { @@ -64,7 +69,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.MEMBER_ENRICHMENT_FIND_RELATED_LINKEDIN_PROFILES]: { - modelId: LlmModelType.CLAUDE_3_5_SONNET_V2, + modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -72,7 +77,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.MEMBER_ENRICHMENT_SQUASH_MULTIPLE_VALUE_ATTRIBUTES]: { - modelId: LlmModelType.CLAUDE_3_5_SONNET_V2, + modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -96,7 +101,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.REPO_CATEGORIES]: { - modelId: LlmModelType.CLAUDE_3_5_SONNET_V2, + modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -104,7 +109,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.REPO_COLLECTIONS]: { - modelId: LlmModelType.CLAUDE_3_5_SONNET_V2, + modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', From 7627b6d5e0da62fee96ed0e41639914e757f4db6 Mon Sep 17 00:00:00 2001 From: Yeganathan S <63534555+skwowet@users.noreply.github.com> Date: Wed, 25 Mar 2026 19:37:54 +0530 Subject: [PATCH 2/3] chore: optimize llm model usage across query types Signed-off-by: Yeganathan S <63534555+skwowet@users.noreply.github.com> --- services/libs/types/src/llm.ts | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/services/libs/types/src/llm.ts b/services/libs/types/src/llm.ts index 13546c984d..ec28ddc168 100644 --- a/services/libs/types/src/llm.ts +++ b/services/libs/types/src/llm.ts @@ -61,7 +61,7 @@ export const LLM_MODEL_PRICING_MAP: Record = { export const LLM_SETTINGS: Record = { [LlmQueryType.MEMBER_ENRICHMENT]: { - modelId: LlmModelType.CLAUDE_3_5_SONNET, + modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -77,7 +77,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.MEMBER_ENRICHMENT_SQUASH_MULTIPLE_VALUE_ATTRIBUTES]: { - modelId: LlmModelType.CLAUDE_HAIKU_4_5, + modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -85,7 +85,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.MEMBER_ENRICHMENT_SQUASH_WORK_EXPERIENCES_FROM_MULTIPLE_SOURCES]: { - modelId: LlmModelType.CLAUDE_3_5_SONNET_V2, + modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -93,7 +93,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.MATCH_MAIN_GITHUB_ORGANIZATION_AND_DESCRIPTION]: { - modelId: LlmModelType.CLAUDE_3_5_SONNET_V2, + modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -101,7 +101,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.REPO_CATEGORIES]: { - modelId: LlmModelType.CLAUDE_HAIKU_4_5, + modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -109,7 +109,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.REPO_COLLECTIONS]: { - modelId: LlmModelType.CLAUDE_HAIKU_4_5, + modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { max_tokens: 200000, anthropic_version: 'bedrock-2023-05-31', @@ -117,7 +117,7 @@ export const LLM_SETTINGS: Record = { }, }, [LlmQueryType.MEMBER_BOT_VALIDATION]: { - modelId: LlmModelType.CLAUDE_SONNET_4, + modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { max_tokens: 2000, anthropic_version: 'bedrock-2023-05-31', From ec0aa27046ccfea0e5f7c84fde0c8ab3a2aeb40e Mon Sep 17 00:00:00 2001 From: Yeganathan S <63534555+skwowet@users.noreply.github.com> Date: Wed, 25 Mar 2026 20:34:58 +0530 Subject: [PATCH 3/3] chore: update max_tokens for LLM settings to improve performance Signed-off-by: Yeganathan S <63534555+skwowet@users.noreply.github.com> --- services/libs/types/src/llm.ts | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/services/libs/types/src/llm.ts b/services/libs/types/src/llm.ts index ec28ddc168..dc02ba8d7d 100644 --- a/services/libs/types/src/llm.ts +++ b/services/libs/types/src/llm.ts @@ -63,7 +63,7 @@ export const LLM_SETTINGS: Record = { [LlmQueryType.MEMBER_ENRICHMENT]: { modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { - max_tokens: 200000, + max_tokens: 65536, anthropic_version: 'bedrock-2023-05-31', temperature: 0, }, @@ -71,7 +71,7 @@ export const LLM_SETTINGS: Record = { [LlmQueryType.MEMBER_ENRICHMENT_FIND_RELATED_LINKEDIN_PROFILES]: { modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { - max_tokens: 200000, + max_tokens: 2000, anthropic_version: 'bedrock-2023-05-31', temperature: 0, }, @@ -79,7 +79,7 @@ export const LLM_SETTINGS: Record = { [LlmQueryType.MEMBER_ENRICHMENT_SQUASH_MULTIPLE_VALUE_ATTRIBUTES]: { modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { - max_tokens: 200000, + max_tokens: 40000, anthropic_version: 'bedrock-2023-05-31', temperature: 0, }, @@ -87,7 +87,7 @@ export const LLM_SETTINGS: Record = { [LlmQueryType.MEMBER_ENRICHMENT_SQUASH_WORK_EXPERIENCES_FROM_MULTIPLE_SOURCES]: { modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { - max_tokens: 200000, + max_tokens: 40000, anthropic_version: 'bedrock-2023-05-31', temperature: 0, }, @@ -95,7 +95,7 @@ export const LLM_SETTINGS: Record = { [LlmQueryType.MATCH_MAIN_GITHUB_ORGANIZATION_AND_DESCRIPTION]: { modelId: LlmModelType.CLAUDE_HAIKU_4_5, arguments: { - max_tokens: 200000, + max_tokens: 5000, anthropic_version: 'bedrock-2023-05-31', temperature: 0, }, @@ -103,7 +103,7 @@ export const LLM_SETTINGS: Record = { [LlmQueryType.REPO_CATEGORIES]: { modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { - max_tokens: 200000, + max_tokens: 2000, anthropic_version: 'bedrock-2023-05-31', temperature: 0, }, @@ -111,7 +111,7 @@ export const LLM_SETTINGS: Record = { [LlmQueryType.REPO_COLLECTIONS]: { modelId: LlmModelType.CLAUDE_SONNET_4, arguments: { - max_tokens: 200000, + max_tokens: 2000, anthropic_version: 'bedrock-2023-05-31', temperature: 0, },