@@ -2333,15 +2333,21 @@ def pad_hf_embedding_layer(input_tensor, target_shape):
23332333 "gemma3-12b" : GEMMA3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23342334 "gemma3-27b" : GEMMA3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23352335 "qwen3-0.6b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
2336+ "qwen3-1.7b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
2337+ "qwen3-1.7b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23362338 "qwen3-4b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
2339+ "qwen3-4b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23372340 "qwen3-4b-thinking-2507" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23382341 "qwen3-8b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
2342+ "qwen3-8b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23392343 "qwen3-14b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
2344+ "qwen3-14b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23402345 "qwen3-32b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23412346 "llama3.1-8b" : LLAMA31_MAXTEXT_TO_HF_PARAM_MAPPING ,
23422347 "llama3.1-70b" : LLAMA31_MAXTEXT_TO_HF_PARAM_MAPPING ,
23432348 "llama3.1-405b" : LLAMA31_MAXTEXT_TO_HF_PARAM_MAPPING ,
23442349 "qwen3-30b-a3b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
2350+ "qwen3-30b-a3b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23452351 "qwen3-235b-a22b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23462352 "qwen3-coder-480b-a35b" : QWEN3_MAXTEXT_TO_HF_PARAM_MAPPING ,
23472353 "deepseek3-671b" : DEEPSEEK_MAXTEXT_TO_HF_PARAM_MAPPING ,
@@ -2365,15 +2371,21 @@ def pad_hf_embedding_layer(input_tensor, target_shape):
23652371 "gemma3-12b" : GEMMA3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23662372 "gemma3-27b" : GEMMA3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23672373 "qwen3-0.6b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
2374+ "qwen3-1.7b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
2375+ "qwen3-1.7b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23682376 "qwen3-4b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
2377+ "qwen3-4b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23692378 "qwen3-4b-thinking-2507" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23702379 "qwen3-8b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
2380+ "qwen3-8b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23712381 "qwen3-14b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
2382+ "qwen3-14b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23722383 "qwen3-32b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23732384 "llama3.1-8b" : LLAMA31_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23742385 "llama3.1-70b" : LLAMA31_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23752386 "llama3.1-405b" : LLAMA31_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23762387 "qwen3-30b-a3b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
2388+ "qwen3-30b-a3b-base" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23772389 "qwen3-235b-a22b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23782390 "qwen3-coder-480b-a35b" : QWEN3_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
23792391 "deepseek3-671b" : DEEPSEEK_MAXTEXT_TO_HF_PARAM_HOOK_FN ,
0 commit comments