about | summary | refs | log | tree | commit | diff
path: root/src
diff options
context:
space:
mode:
author Nathan Bailey <nathan.bailey@arm.com> 2024-02-27 12:46:52 +0000
committer Nathan Bailey <nathan.bailey@arm.com> 2024-04-16 12:57:10 +0100
commit 427e02696f1ede596ef6dce82787a37e122efa78 (patch)
tree 1fae7f7c8cb10af4f7c5119b73371b709c2c7caa /src
parent 2973b6d52914023f9b8797aec8309957457d4189 (diff)
download mlia-427e02696f1ede596ef6dce82787a37e122efa78.tar.gz
feat: Implement the clustering rewrite for fp32
Implements a clustering rewrite for fully connected layers for fp32 models

Resolves: MLIA-1079
Signed-off-by: Nathan Bailey <nathan.bailey@arm.com>
Change-Id: I4c12f0bf911219b4066f0760976e424ebe900a0b
Diffstat (limited to 'src')
-rw-r--r-- src/mlia/nn/rewrite/core/rewrite.py | 24
-rw-r--r-- src/mlia/nn/rewrite/library/fc_clustering_layer.py | 19
2 files changed, 38 insertions, 5 deletions
diff --git a/src/mlia/nn/rewrite/core/rewrite.py b/src/mlia/nn/rewrite/core/rewrite.py
index a8084e8..6a3695a 100644
--- a/src/mlia/nn/rewrite/core/rewrite.py
+++ b/src/mlia/nn/rewrite/core/rewrite.py
@@ -23,6 +23,9 @@ from mlia.nn.common import Optimizer
from mlia.nn.common import OptimizerConfiguration
from mlia.nn.rewrite.core.train import train
from mlia.nn.rewrite.core.train import TrainingParameters
+from mlia.nn.rewrite.library.fc_clustering_layer import (
+ get_keras_model_clus as fc_clustering_rewrite,
+)
from mlia.nn.rewrite.library.fc_layer import get_keras_model as fc_rewrite
from mlia.nn.rewrite.library.fc_sparsity24_layer import (
get_keras_model as fc_rewrite_sparsity24,
@@ -63,6 +66,24 @@ class Rewrite(ABC):
"""Return default post-processing rewrite options."""
+class ClusteringRewrite(Rewrite):
+ """Graph clustering rewrite logic to be used by RewritingOptimizer."""
+
+ strip_pruning_wrapper = staticmethod(tfmot.clustering.keras.strip_clustering)
+
+ def quantize(self, model: keras.Model) -> keras.Model:
+ """Return a quantized model."""
+ return model
+
+ def post_process(self, model: keras.Model) -> keras.Model:
+ """Return the clustering stripped model."""
+ return self.strip_pruning_wrapper(model)
+
+ def training_callbacks(self) -> list:
+ """Return default rewrite callbacks."""
+ return []
+
+
class QATRewrite(Rewrite):
"""Logic for rewrites requiring quantization-aware training."""
@@ -157,7 +178,7 @@ class RewritingOptimizer(Optimizer):
[
FullyConnectedRewrite("fully-connected", fc_rewrite),
Sparsity24Rewrite("fully-connected-sparsity24", fc_rewrite_sparsity24),
- FullyConnectedRewrite("fully-connected-clustering", fc_rewrite),
+ ClusteringRewrite("fully-connected-clustering", fc_clustering_rewrite),
]
)
@@ -191,7 +212,6 @@ class RewritingOptimizer(Optimizer):
raise ConfigurationError(
"Input and output tensor names need to be set for rewrite."
)
-
orig_vs_repl_stats, total_stats = train(
source_model=tflite_model,
unmodified_model=tflite_model if use_unmodified_model else None,
diff --git a/src/mlia/nn/rewrite/library/fc_clustering_layer.py b/src/mlia/nn/rewrite/library/fc_clustering_layer.py
index 07c07ac..72931c0 100644
--- a/src/mlia/nn/rewrite/library/fc_clustering_layer.py
+++ b/src/mlia/nn/rewrite/library/fc_clustering_layer.py
@@ -3,11 +3,24 @@
"""Example rewrite with one fully connected clustered layer."""
from typing import Any
+import tensorflow_model_optimization as tfmot
from keras.api._v2 import keras # Temporary workaround for now: MLIA-1107
-from mlia.nn.rewrite.library.fc_layer import get_keras_model
-
def get_keras_model_clus(input_shape: Any, output_shape: Any) -> keras.Model:
"""Generate TensorFlow Lite model for clustering rewrite."""
- return get_keras_model(input_shape, output_shape)
+ clustering_params = {
+ "number_of_clusters": 32,
+ "cluster_centroids_init": tfmot.clustering.keras.CentroidInitialization.LINEAR,
+ }
+ model = tfmot.clustering.keras.cluster_weights(
+ to_cluster=keras.Sequential(
+ [
+ keras.layers.InputLayer(input_shape=input_shape),
+ keras.layers.Flatten(),
+ keras.layers.Dense(units=output_shape),
+ ]
+ ),
+ **clustering_params
+ )
+ return model