Revert "install quant docker"

This reverts commit 1523e08a9e0dd749f758a181a9f4df010c3a3d27.
add script
2025-10-21 01:23:56 +08:00 · 2024-11-22 17:42:30 +01:00 · 2024-11-22 17:40:16 +01:00 · 2024-11-22 17:39:57 +01:00 · 2024-11-21 15:27:59 +01:00
1 changed files with 36 additions and 0 deletions
--- a/src/transformers/models/llama/quantize_fp8_llama.py
+++ b/src/transformers/models/llama/quantize_fp8_llama.py
@ -0,0 +1,36 @@
+# Copyright 2024 The HuggingFace Inc. team. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import torch
+
+from transformers import FbgemmFp8Config, LlamaForCausalLM
+
+
+modules_to_not_convert = []
+
+# As defined by Meta, we don't quantize the first and last layers as well as the lm_head. Also, we don't quantize the self_attn layers.
+modules_to_not_convert.append("model.layers.0")
+modules_to_not_convert.append("model.layers.125")
+modules_to_not_convert.append("lm_head")
+for layer_i in range(1, 125):
+    modules_to_not_convert.append(f"model.layers.{layer_i}.self_attn")
+
+quantization_config = FbgemmFp8Config(modules_to_not_convert=modules_to_not_convert)
+model_name = "meta-llama/Llama-3.1-405B"
+
+model = LlamaForCausalLM.from_pretrained(
+    model_name, torch_dtype=torch.bfloat16, device_map="auto", quantization_config=quantization_config
+)
+
+model.save_pretrained(f"{model_name}-FP8")
Author	SHA1	Message	Date
Marc Sun	624add74b1	Revert "install quant docker" This reverts commit 1523e08a9e0dd749f758a181a9f4df010c3a3d27.	2024-11-22 17:42:30 +01:00
Marc Sun	1a989b7e22	add script	2024-11-22 17:40:16 +01:00
Marc Sun	3f4d7ef6ad	Merge branch 'main' of github.com:huggingface/transformers into main	2024-11-22 17:39:57 +01:00
Marc Sun	1523e08a9e	install quant docker	2024-11-21 15:27:59 +01:00