We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 814d7a3, commit c18f0ef (Copy full SHA for c18f0ef)
examples/quantization_w4a4_fp4/trinity_large_nvfp4.py
@@ -21,7 +21,7 @@
21
DATASET_ID = "HuggingFaceH4/ultrachat_200k"
22
DATASET_SPLIT = "train_sft"
23
24
-NUM_CALIBRATION_SAMPLES = 100
+NUM_CALIBRATION_SAMPLES = 256
25
MAX_SEQUENCE_LENGTH = 2048
26
27
# Load dataset and preprocess.
@@ -89,6 +89,6 @@ def tokenize(sample):
89
90
91
# Save to disk in compressed-tensors format.
92
-SAVE_DIR = "/raid/engine/dsikka/" + MODEL_ID.rstrip("/").split("/")[-1] + "-NVFP4"
93
-model.save_pretrained(SAVE_DIR, save_compressed=True)
+SAVE_DIR = MODEL_ID.rstrip("/").split("/")[-1] + "-NVFP4"
+model.save_pretrained(SAVE_DIR)
94
tokenizer.save_pretrained(SAVE_DIR)
0 commit comments