From 7b195e474c1c762a99a80211a82ec806b72a8510 Mon Sep 17 00:00:00 2001
From: Jack Zhang <32371937+jackzhxng@users.noreply.github.com>
Date: Thu, 1 May 2025 17:03:47 -0700
Subject: [PATCH] Qwen3 doc and config tweaks

---
 examples/models/qwen3/4b_config.json | 2 +-
 examples/models/qwen3/README.md      | 3 +++
 2 files changed, 4 insertions(+), 1 deletion(-)

diff --git a/examples/models/qwen3/4b_config.json b/examples/models/qwen3/4b_config.json
index 0874682bd80..a7a710c7779 100644
--- a/examples/models/qwen3/4b_config.json
+++ b/examples/models/qwen3/4b_config.json
@@ -13,5 +13,5 @@
   "use_hf_rope": true,
   "attention_qkv_bias": false,
   "use_qk_norm": true,
-  "qk_norm_before_repo": true
+  "qk_norm_before_rope": true
 }
diff --git a/examples/models/qwen3/README.md b/examples/models/qwen3/README.md
index 767cbafe03d..d5507d79f2f 100644
--- a/examples/models/qwen3/README.md
+++ b/examples/models/qwen3/README.md
@@ -25,6 +25,7 @@ python -m examples.models.llama.export_llama \
   -X \
   --xnnpack-extended-ops \
   -qmode 8da4w \
+  --metadata '{"get_bos_id": 151644, "get_eos_ids":[151645]}' \
   --output_name="qwen3-0_6b.pte" \
   --verbose
 ```
@@ -40,6 +41,7 @@ python -m examples.models.llama.export_llama \
   -X \
   --xnnpack-extended-ops \
   -qmode 8da4w \
+  --metadata '{"get_bos_id": 151644, "get_eos_ids":[151645]}' \
   --output_name="qwen3-1_7b.pte" \
   --verbose
 ```
@@ -55,6 +57,7 @@ python -m examples.models.llama.export_llama \
   -X \
   --xnnpack-extended-ops \
   -qmode 8da4w \
+  --metadata '{"get_bos_id": 151644, "get_eos_ids":[151645]}' \
   --output_name="qwen3-4b.pte" \
   --verbose
 ```