Clean up and fix issues with text encoder quants. (#10872)

2025-11-24 22:48:53 -08:00
parent 22a2644e57
commit 25022e0b09
7 changed files with 128 additions and 102 deletions
@@ -18,6 +18,9 @@ def llama_detect(state_dict, prefix=""):
    if scaled_fp8_key in state_dict:
        out["llama_scaled_fp8"] = state_dict[scaled_fp8_key].dtype

+    if "_quantization_metadata" in state_dict:
+        out["llama_quantization_metadata"] = state_dict["_quantization_metadata"]
+
    return out