From 427e02696f1ede596ef6dce82787a37e122efa78 Mon Sep 17 00:00:00 2001 From: Nathan Bailey Date: Tue, 27 Feb 2024 12:46:52 +0000 Subject: feat: Implement the clustering rewrite for fp32 Implements a clustering rewrite for fully connected layers for fp32 models Resolves: MLIA-1079 Signed-off-by: Nathan Bailey Change-Id: I4c12f0bf911219b4066f0760976e424ebe900a0b --- src/mlia/nn/rewrite/core/rewrite.py | 24 ++++++++++++++++++++++-- 1 file changed, 22 insertions(+), 2 deletions(-) (limited to 'src/mlia/nn/rewrite/core/rewrite.py') diff --git a/src/mlia/nn/rewrite/core/rewrite.py b/src/mlia/nn/rewrite/core/rewrite.py index a8084e8..6a3695a 100644 --- a/src/mlia/nn/rewrite/core/rewrite.py +++ b/src/mlia/nn/rewrite/core/rewrite.py @@ -23,6 +23,9 @@ from mlia.nn.common import Optimizer from mlia.nn.common import OptimizerConfiguration from mlia.nn.rewrite.core.train import train from mlia.nn.rewrite.core.train import TrainingParameters +from mlia.nn.rewrite.library.fc_clustering_layer import ( + get_keras_model_clus as fc_clustering_rewrite, +) from mlia.nn.rewrite.library.fc_layer import get_keras_model as fc_rewrite from mlia.nn.rewrite.library.fc_sparsity24_layer import ( get_keras_model as fc_rewrite_sparsity24, @@ -63,6 +66,24 @@ class Rewrite(ABC): """Return default post-processing rewrite options.""" +class ClusteringRewrite(Rewrite): + """Graph clustering rewrite logic to be used by RewritingOptimizer.""" + + strip_pruning_wrapper = staticmethod(tfmot.clustering.keras.strip_clustering) + + def quantize(self, model: keras.Model) -> keras.Model: + """Return a quantized model.""" + return model + + def post_process(self, model: keras.Model) -> keras.Model: + """Return the clustering stripped model.""" + return self.strip_pruning_wrapper(model) + + def training_callbacks(self) -> list: + """Return default rewrite callbacks.""" + return [] + + class QATRewrite(Rewrite): """Logic for rewrites requiring quantization-aware training.""" @@ -157,7 +178,7 @@ class RewritingOptimizer(Optimizer): [ FullyConnectedRewrite("fully-connected", fc_rewrite), Sparsity24Rewrite("fully-connected-sparsity24", fc_rewrite_sparsity24), - FullyConnectedRewrite("fully-connected-clustering", fc_rewrite), + ClusteringRewrite("fully-connected-clustering", fc_clustering_rewrite), ] ) @@ -191,7 +212,6 @@ class RewritingOptimizer(Optimizer): raise ConfigurationError( "Input and output tensor names need to be set for rewrite." ) - orig_vs_repl_stats, total_stats = train( source_model=tflite_model, unmodified_model=tflite_model if use_unmodified_model else None, -- cgit v1.2.1