Skip to content

Commit 5203864

Browse files
authored
add MXFP4 size and description
1 parent 3887e3c commit 5203864

File tree

1 file changed

+5
-0
lines changed

1 file changed

+5
-0
lines changed

packages/gguf/src/quant-descriptions.ts

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -132,6 +132,10 @@ export const GGUF_QUANT_DESCRIPTIONS: Record<GGMLQuantizationType, { txt: string
132132
txt: "Ternary quantization.",
133133
src_url: "https://github.com/ggml-org/llama.cpp/pull/8151",
134134
},
135+
[GGMLQuantizationType.MXFP4]: {
136+
txt: "4-bit Microscaling Block Floating Point.",
137+
src_url: "https://github.com/ggml-org/llama.cpp/pull/15091",
138+
},
135139
};
136140

137141
const QK_K = 256;
@@ -173,4 +177,5 @@ export const GGML_QUANT_SIZES = {
173177
[GGMLQuantizationType.BF16]: calcBPW(1, 2),
174178
[GGMLQuantizationType.TQ1_0]: calcBPW(256, 2 + 4 * 13),
175179
[GGMLQuantizationType.TQ2_0]: calcBPW(256, 2 + 64),
180+
[GGMLQuantizationType.MXFP4]: calcBPW(32, 1 + 16),
176181
};

0 commit comments

Comments
 (0)