From 29f9e18fad9a6dda681cea66f79ce0b8f44e0b91 Mon Sep 17 00:00:00 2001 From: Hyukjin Jeong Date: Tue, 5 Nov 2024 09:32:58 +0900 Subject: [PATCH 1/4] [nnpackage] Add mx dtypes to schema This adds mxfp4 and mxint8 to circle schema. ONE-DCO-1.0-Signed-off-by: Hyukjin Jeong --- nnpackage/schema/circle_schema.fbs | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/nnpackage/schema/circle_schema.fbs b/nnpackage/schema/circle_schema.fbs index e13bd3842cb..97e71789e3e 100644 --- a/nnpackage/schema/circle_schema.fbs +++ b/nnpackage/schema/circle_schema.fbs @@ -78,6 +78,11 @@ enum TensorType : byte { GGML_Q4_1 = -3, GGML_Q8_0 = -4, GGML_Q8_1 = -5, + + + // MX dtypes + MXFP4 = -6, + MXINT8 = -7, } // Custom quantization parameters for experimenting with new quantization From f44f7317061dd6b4edfbf5b8161119d9cf800d64 Mon Sep 17 00:00:00 2001 From: Hyukjin Jeong Date: Tue, 5 Nov 2024 10:26:38 +0900 Subject: [PATCH 2/4] Update version history --- nnpackage/schema/circle_schema.fbs | 1 + 1 file changed, 1 insertion(+) diff --git a/nnpackage/schema/circle_schema.fbs b/nnpackage/schema/circle_schema.fbs index 97e71789e3e..437a00fce65 100644 --- a/nnpackage/schema/circle_schema.fbs +++ b/nnpackage/schema/circle_schema.fbs @@ -35,6 +35,7 @@ // Version 0.8: GRU op is added. UINT4 is added. // Version 0.9: GGML_Q{X}_{Y} types are added. Weight compression option is added. // ROPE op is added. +// Version 0.10: MXFP4, MXINT8 types are added. namespace circle; From b6db12ab283a68a8ae0a55127b7dd3997be865c3 Mon Sep 17 00:00:00 2001 From: Hyukjin Jeong Date: Tue, 5 Nov 2024 11:11:38 +0900 Subject: [PATCH 3/4] Stick to 0.9 --- nnpackage/schema/circle_schema.fbs | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/nnpackage/schema/circle_schema.fbs b/nnpackage/schema/circle_schema.fbs index 437a00fce65..ccbd6cb8440 100644 --- a/nnpackage/schema/circle_schema.fbs +++ b/nnpackage/schema/circle_schema.fbs @@ -34,8 +34,7 @@ // Version 0.7: Base up to TensorFlow Lite v2.15.0 schema, deprecate data_format in Subgraph table // Version 0.8: GRU op is added. UINT4 is added. // Version 0.9: GGML_Q{X}_{Y} types are added. Weight compression option is added. -// ROPE op is added. -// Version 0.10: MXFP4, MXINT8 types are added. +// ROPE op is added. MXFP4, MXINT8 types are added. namespace circle; From 802851af54edd1142e5d8829311d09f91fd2ea10 Mon Sep 17 00:00:00 2001 From: Hyukjin Jeong Date: Tue, 5 Nov 2024 12:17:34 +0900 Subject: [PATCH 4/4] Remove empty line --- nnpackage/schema/circle_schema.fbs | 1 - 1 file changed, 1 deletion(-) diff --git a/nnpackage/schema/circle_schema.fbs b/nnpackage/schema/circle_schema.fbs index ccbd6cb8440..118a8198dbb 100644 --- a/nnpackage/schema/circle_schema.fbs +++ b/nnpackage/schema/circle_schema.fbs @@ -79,7 +79,6 @@ enum TensorType : byte { GGML_Q8_0 = -4, GGML_Q8_1 = -5, - // MX dtypes MXFP4 = -6, MXINT8 = -7,