Skip to content

Commit 8d7dddd

Browse files
authored
Qwen3 model (#1311)
1 parent 53bda27 commit 8d7dddd

File tree

5 files changed

+86
-0
lines changed

5 files changed

+86
-0
lines changed

docs/en/DEPLOY_OPTION.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -980,6 +980,10 @@ This solution supports the following text generation models:
980980
"apac.anthropic.claude-3-5-sonnet-20240620-v1:0",
981981
"apac.anthropic.claude-3-5-sonnet-20241022-v2:0",
982982
"us.deepseek.r1-v1:0",
983+
"qwen.qwen3-235b-a22b-2507-v1:0",
984+
"qwen.qwen3-32b-v1:0",
985+
"qwen.qwen3-coder-480b-a35b-v1:0",
986+
"qwen.qwen3-coder-30b-a3b-v1:0",
983987
"us.writer.palmyra-x5-v1:0",
984988
"us.writer.palmyra-x4-v1:0",
985989
"amazon.titan-text-premier-v1:0",

docs/ja/DEPLOY_OPTION.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -995,6 +995,10 @@ const envs: Record<string, Partial<StackInput>> = {
995995
"apac.anthropic.claude-3-5-sonnet-20240620-v1:0",
996996
"apac.anthropic.claude-3-5-sonnet-20241022-v2:0",
997997
"us.deepseek.r1-v1:0",
998+
"qwen.qwen3-235b-a22b-2507-v1:0",
999+
"qwen.qwen3-32b-v1:0",
1000+
"qwen.qwen3-coder-480b-a35b-v1:0",
1001+
"qwen.qwen3-coder-30b-a3b-v1:0",
9981002
"us.writer.palmyra-x5-v1:0",
9991003
"us.writer.palmyra-x4-v1:0",
10001004
"amazon.titan-text-premier-v1:0",

docs/ko/DEPLOY_OPTION.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -976,6 +976,10 @@ const envs: Record<string, Partial<StackInput>> = {
976976
"apac.anthropic.claude-3-5-sonnet-20240620-v1:0",
977977
"apac.anthropic.claude-3-5-sonnet-20241022-v2:0",
978978
"us.deepseek.r1-v1:0",
979+
"qwen.qwen3-235b-a22b-2507-v1:0",
980+
"qwen.qwen3-32b-v1:0",
981+
"qwen.qwen3-coder-480b-a35b-v1:0",
982+
"qwen.qwen3-coder-30b-a3b-v1:0",
979983
"us.writer.palmyra-x5-v1:0",
980984
"us.writer.palmyra-x4-v1:0",
981985
"amazon.titan-text-premier-v1:0",

packages/cdk/lambda/utils/models.ts

Lines changed: 57 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -206,6 +206,31 @@ const DEEPSEEK_DEFAULT_PARAMS: ConverseInferenceParams = {
206206
},
207207
};
208208

209+
// Qwen3 model parameters based on actual AWS Bedrock limits
210+
const QWEN_16K_DEFAULT_PARAMS: ConverseInferenceParams = {
211+
inferenceConfig: {
212+
maxTokens: 16384,
213+
temperature: 0.7,
214+
topP: 0.9,
215+
},
216+
};
217+
218+
const QWEN_64K_DEFAULT_PARAMS: ConverseInferenceParams = {
219+
inferenceConfig: {
220+
maxTokens: 65536,
221+
temperature: 0.7,
222+
topP: 0.9,
223+
},
224+
};
225+
226+
const QWEN_192K_DEFAULT_PARAMS: ConverseInferenceParams = {
227+
inferenceConfig: {
228+
maxTokens: 196608,
229+
temperature: 0.7,
230+
topP: 0.9,
231+
},
232+
};
233+
209234
const PALMYRA_DEFAULT_PARAMS: ConverseInferenceParams = {
210235
inferenceConfig: {
211236
maxTokens: 8192,
@@ -1491,6 +1516,38 @@ export const BEDROCK_TEXT_GEN_MODELS: {
14911516
extractConverseOutput: extractConverseOutput,
14921517
extractConverseStreamOutput: extractConverseStreamOutput,
14931518
},
1519+
'qwen.qwen3-235b-a22b-2507-v1:0': {
1520+
defaultParams: QWEN_192K_DEFAULT_PARAMS,
1521+
usecaseParams: USECASE_DEFAULT_PARAMS,
1522+
createConverseCommandInput: createConverseCommandInput,
1523+
createConverseStreamCommandInput: createConverseStreamCommandInput,
1524+
extractConverseOutput: extractConverseOutput,
1525+
extractConverseStreamOutput: extractConverseStreamOutput,
1526+
},
1527+
'qwen.qwen3-32b-v1:0': {
1528+
defaultParams: QWEN_16K_DEFAULT_PARAMS,
1529+
usecaseParams: USECASE_DEFAULT_PARAMS,
1530+
createConverseCommandInput: createConverseCommandInput,
1531+
createConverseStreamCommandInput: createConverseStreamCommandInput,
1532+
extractConverseOutput: extractConverseOutput,
1533+
extractConverseStreamOutput: extractConverseStreamOutput,
1534+
},
1535+
'qwen.qwen3-coder-480b-a35b-v1:0': {
1536+
defaultParams: QWEN_64K_DEFAULT_PARAMS,
1537+
usecaseParams: USECASE_DEFAULT_PARAMS,
1538+
createConverseCommandInput: createConverseCommandInput,
1539+
createConverseStreamCommandInput: createConverseStreamCommandInput,
1540+
extractConverseOutput: extractConverseOutput,
1541+
extractConverseStreamOutput: extractConverseStreamOutput,
1542+
},
1543+
'qwen.qwen3-coder-30b-a3b-v1:0': {
1544+
defaultParams: QWEN_192K_DEFAULT_PARAMS,
1545+
usecaseParams: USECASE_DEFAULT_PARAMS,
1546+
createConverseCommandInput: createConverseCommandInput,
1547+
createConverseStreamCommandInput: createConverseStreamCommandInput,
1548+
extractConverseOutput: extractConverseOutput,
1549+
extractConverseStreamOutput: extractConverseStreamOutput,
1550+
},
14941551
// Although Palmyra supports system context, the model seems to work best without it.
14951552
'us.writer.palmyra-x4-v1:0': {
14961553
defaultParams: PALMYRA_DEFAULT_PARAMS,

packages/common/src/application/model.ts

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -384,6 +384,23 @@ export const modelMetadata: Record<string, ModelMetadata> = {
384384
flags: MODEL_FEATURE.TEXT_DOC_REASONING,
385385
displayName: 'DeepSeek-R1',
386386
},
387+
// Qwen
388+
'qwen.qwen3-235b-a22b-2507-v1:0': {
389+
flags: MODEL_FEATURE.TEXT_ONLY,
390+
displayName: 'Qwen3 235B A22B 2507',
391+
},
392+
'qwen.qwen3-32b-v1:0': {
393+
flags: MODEL_FEATURE.TEXT_ONLY,
394+
displayName: 'Qwen3 32B',
395+
},
396+
'qwen.qwen3-coder-480b-a35b-v1:0': {
397+
flags: MODEL_FEATURE.TEXT_ONLY,
398+
displayName: 'Qwen3-Coder 480B A35B Instruct',
399+
},
400+
'qwen.qwen3-coder-30b-a3b-v1:0': {
401+
flags: MODEL_FEATURE.TEXT_ONLY,
402+
displayName: 'Qwen3-Coder 30B A3B Instruct',
403+
},
387404
// Writer
388405
'us.writer.palmyra-x4-v1:0': {
389406
flags: MODEL_FEATURE.TEXT_DOC,

0 commit comments

Comments
 (0)