chore: add readme in root folder of deployment use case + fix cifar (#876)

Showing 8 changed files with 406 additions and 3 deletions.
@@ -0,0 +1,42 @@
# Deployment Examples

This folder contains examples of how to deploy Concrete ML models using Fully Homomorphic Encryption (FHE). These examples demonstrate the process of training, compiling, and deploying models for various use cases.

## Overview

The deployment process generally follows these steps:

1. Train the model (optional, depending on the use case)
2. Compile the model to an FHE circuit (see the sketch after this list)
3. Deploy the model using Docker
4. Run inference using a client (locally or in Docker)

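The exact scripts differ per example, but the compile-and-save step typically looks like the following minimal sketch. It assumes a built-in Concrete ML model (`LogisticRegression` here), the scikit-learn breast-cancer dataset, and the `FHEModelDev` helper from `concrete.ml.deployment`; the `./dev` path is a placeholder.

```python
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split

from concrete.ml.deployment import FHEModelDev
from concrete.ml.sklearn import LogisticRegression

# Train a built-in Concrete ML model (step 1)
X, y = load_breast_cancer(return_X_y=True)
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=42)
model = LogisticRegression()
model.fit(X_train, y_train)

# Compile the model to an FHE circuit (step 2)
model.compile(X_train)

# Save the deployment artifacts (client.zip, server.zip) used by the Docker server (step 3)
FHEModelDev(path_dir="./dev", model=model).save()
```
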
## Available Examples

We provide three different use cases to demonstrate the deployment process:

1. [Breast Cancer Classification](./breast_cancer/README.md)
2. [Sentiment Analysis](./sentiment_analysis/README.md)
3. [CIFAR-10 Image Classification](./cifar/README.md)

## Getting Started

Each example folder contains its own README with specific instructions. However, the general process is similar:

1. Train or compile the model using the provided scripts
2. Deploy the model using `deploy_to_docker.py` from the `server` folder
3. Build the client Docker image
4. Run the client to interact with the deployed model (see the client/server sketch below)

For detailed instructions, please refer to the README in each example folder.

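For reference, the client/server exchange behind step 4 can be sketched as below. This is a simplified, in-process version of what the Docker client and server do over HTTP; it assumes the artifacts saved by `FHEModelDev` above and uses the `FHEModelClient`/`FHEModelServer` helpers from `concrete.ml.deployment`, with placeholder paths and input data.

```python
import numpy as np

from concrete.ml.deployment import FHEModelClient, FHEModelServer

# Client side: generate keys and encrypt one input (placeholder data)
client = FHEModelClient(path_dir="./dev", key_dir="./keys")
client.generate_private_and_evaluation_keys()
evaluation_keys = client.get_serialized_evaluation_keys()
x = np.random.rand(1, 30)  # one clear sample with the model's input size
encrypted_input = client.quantize_encrypt_serialize(x)

# Server side: run the FHE circuit on the encrypted input
server = FHEModelServer(path_dir="./dev")
server.load()
encrypted_result = server.run(encrypted_input, evaluation_keys)

# Client side: decrypt and de-quantize the prediction
prediction = client.deserialize_decrypt_dequantize(encrypted_result)
print(prediction)
```
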
## Requirements

- Docker
- Python 3.8 or later
- Concrete ML library installed

## Additional Resources

- [Client-Server Guide](../../docs/guides/client_server.md)
- [Server Deployment Scripts](./server/README.md)

@@ -0,0 +1,64 @@
# MIT License
#
# Copyright (c) 2019 Xilinx
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
# Original file can be found at https://github.com/Xilinx/brevitas/blob/8c3d9de0113528cf6693c6474a13d802a66682c6/src/brevitas_examples/bnn_pynq/models/__init__.py

import os
from configparser import ConfigParser

import torch
from torch import hub

__all__ = ["cnv_2w2a"]

from .model import cnv

# Map the ARCH name used in the .ini files to the model factory
model_impl = {
    "CNV": cnv,
}


def get_model_cfg(name):
    # Load the <name>.ini configuration file that sits next to this module
    cfg = ConfigParser()
    current_dir = os.path.dirname(os.path.abspath(__file__))
    config_path = os.path.join(current_dir, name.lower() + ".ini")
    assert os.path.exists(config_path), f"Missing model config: {config_path}"
    cfg.read(config_path)
    return cfg


def model_with_cfg(name, pre_trained):
    # Build the architecture named in the config, optionally loading released weights
    cfg = get_model_cfg(name)
    arch = cfg.get("MODEL", "ARCH")
    model = model_impl[arch](cfg)
    if pre_trained:
        checkpoint = cfg.get("MODEL", "PRETRAINED_URL")
        state_dict = hub.load_state_dict_from_url(checkpoint, progress=True, map_location="cpu")
        model.load_state_dict(state_dict, strict=True)
    return model, cfg


def cnv_2w2a(pre_trained=False):
    # Pre-trained weights must be loaded via --resume with a local checkpoint, not downloaded
    assert not pre_trained, (
        "No online pre-trained network is available. Use --resume instead with a valid checkpoint."
    )
    model, _ = model_with_cfg("cnv_2w2a", pre_trained)
    return model

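As a quick orientation (not part of the diff), the factory above could be used as in the sketch below; it assumes this package is importable as `models` (a hypothetical import path) and that Brevitas is installed.

```python
from models import model_with_cfg  # hypothetical import path for this package

# Build the CNV architecture described by cnv_2w2a.ini, without downloading weights
model, cfg = model_with_cfg("cnv_2w2a", pre_trained=False)

print(cfg.get("MODEL", "DATASET"))              # CIFAR10
print(cfg.getint("QUANT", "WEIGHT_BIT_WIDTH"))  # 2
```
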
@@ -0,0 +1,13 @@
[MODEL]
ARCH: CNV
PRETRAINED_URL: https://github.com/Xilinx/brevitas/releases/download/bnn_pynq-r0/cnv_2w2a-0702987f.pth
EVAL_LOG: https://github.com/Xilinx/brevitas/releases/download/cnv_test_ref-r0/cnv_2w2a_eval-5aaca4c6.txt
DATASET: CIFAR10
IN_CHANNELS: 3
NUM_CLASSES: 10

[QUANT]
WEIGHT_BIT_WIDTH: 2
ACT_BIT_WIDTH: 2
IN_BIT_WIDTH: 8

@@ -0,0 +1,79 @@
# MIT License
#
# Copyright (c) 2019 Xilinx
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
# Original file can be found at https://github.com/Xilinx/brevitas/blob/8c3d9de0113528cf6693c6474a13d802a66682c6/src/brevitas_examples/bnn_pynq/models/common.py
from brevitas.core.bit_width import BitWidthImplType
from brevitas.core.quant import QuantType
from brevitas.core.restrict_val import FloatToIntImplType, RestrictValueType
from brevitas.core.scaling import ScalingImplType
from brevitas.core.zero_point import ZeroZeroPoint
from brevitas.inject import ExtendedInjector
from brevitas.quant import Int8WeightPerTensorFloat
from brevitas.quant.solver import ActQuantSolver, WeightQuantSolver
from dependencies import value


# Shared quantizer settings: constant scaling, symmetric signed values, round-to-nearest
class CommonQuant(ExtendedInjector):
    bit_width_impl_type = BitWidthImplType.CONST
    scaling_impl_type = ScalingImplType.CONST
    restrict_scaling_type = RestrictValueType.FP
    zero_point_impl = ZeroZeroPoint
    float_to_int_impl_type = FloatToIntImplType.ROUND
    scaling_per_output_channel = False
    narrow_range = True
    signed = True

    @value
    def quant_type(bit_width):
        # Select the quantization mode from the requested bit-width
        if bit_width is None:
            return QuantType.FP
        elif bit_width == 1:
            return QuantType.BINARY
        else:
            return QuantType.INT


class CommonIntWeightPerTensorQuant(Int8WeightPerTensorFloat):
    """
    Common per-tensor weight quantizer with bit-width set to None so that it is forced to be
    specified by each layer.
    """

    scaling_min_val = 2e-16
    bit_width = None


class CommonIntWeightPerChannelQuant(CommonIntWeightPerTensorQuant):
    """
    Common per-channel weight quantizer with bit-width set to None so that it is forced to be
    specified by each layer.
    """

    scaling_per_output_channel = True


# Weight quantizer with a constant unit scale
class CommonWeightQuant(CommonQuant, WeightQuantSolver):
    scaling_const = 1.0


# Activation quantizer constrained to the [-1, 1] range
class CommonActQuant(CommonQuant, ActQuantSolver):
    min_val = -1.0
    max_val = 1.0

@@ -0,0 +1,141 @@
# MIT License
#
# Copyright (c) 2019 Xilinx
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
# Original file can be found at https://github.com/Xilinx/brevitas/blob/8c3d9de0113528cf6693c6474a13d802a66682c6/src/brevitas_examples/bnn_pynq/models/CNV.py

import torch
from brevitas.core.restrict_val import RestrictValueType
from brevitas.nn import QuantConv2d, QuantIdentity, QuantLinear
from torch.nn import AvgPool2d, BatchNorm1d, BatchNorm2d, Module, ModuleList

from .common import CommonActQuant, CommonWeightQuant
from .tensor_norm import TensorNorm

# (out_channels, apply pooling after this block) for each convolutional block
CNV_OUT_CH_POOL = [(64, False), (64, True), (128, False), (128, True), (256, False), (256, False)]
INTERMEDIATE_FC_FEATURES = [(256, 512), (512, 512)]
LAST_FC_IN_FEATURES = 512
LAST_FC_PER_OUT_CH_SCALING = False
POOL_SIZE = 2
KERNEL_SIZE = 3


class CNV(Module):
    def __init__(self, num_classes, weight_bit_width, act_bit_width, in_bit_width, in_ch):
        super().__init__()

        self.conv_features = ModuleList()
        self.linear_features = ModuleList()

        self.conv_features.append(
            QuantIdentity(  # for Q1.7 input format
                act_quant=CommonActQuant,
                return_quant_tensor=True,
                bit_width=in_bit_width,
                min_val=-1.0,
                max_val=1.0 - 2.0 ** (-7),
                narrow_range=False,
                restrict_scaling_type=RestrictValueType.POWER_OF_TWO,
            )
        )

        # Convolutional feature extractor: QuantConv2d -> BatchNorm2d -> QuantIdentity (+ AvgPool2d)
        for out_ch, is_pool_enabled in CNV_OUT_CH_POOL:
            self.conv_features.append(
                QuantConv2d(
                    kernel_size=KERNEL_SIZE,
                    in_channels=in_ch,
                    out_channels=out_ch,
                    bias=False,
                    weight_quant=CommonWeightQuant,
                    weight_bit_width=weight_bit_width,
                )
            )
            in_ch = out_ch
            self.conv_features.append(BatchNorm2d(in_ch, eps=1e-4))
            self.conv_features.append(
                QuantIdentity(act_quant=CommonActQuant, bit_width=act_bit_width)
            )
            if is_pool_enabled:
                self.conv_features.append(AvgPool2d(kernel_size=POOL_SIZE))
                self.conv_features.append(
                    QuantIdentity(act_quant=CommonActQuant, bit_width=act_bit_width)
                )

        # Quantized fully-connected classifier head
        for in_features, out_features in INTERMEDIATE_FC_FEATURES:
            self.linear_features.append(
                QuantLinear(
                    in_features=in_features,
                    out_features=out_features,
                    bias=False,
                    weight_quant=CommonWeightQuant,
                    weight_bit_width=weight_bit_width,
                )
            )
            self.linear_features.append(BatchNorm1d(out_features, eps=1e-4))
            self.linear_features.append(
                QuantIdentity(act_quant=CommonActQuant, bit_width=act_bit_width)
            )

        self.linear_features.append(
            QuantLinear(
                in_features=LAST_FC_IN_FEATURES,
                out_features=num_classes,
                bias=False,
                weight_quant=CommonWeightQuant,
                weight_bit_width=weight_bit_width,
            )
        )
        self.linear_features.append(TensorNorm())

        for m in self.modules():
            if isinstance(m, (QuantConv2d, QuantLinear)):
                torch.nn.init.uniform_(m.weight.data, -1, 1)

    def clip_weights(self, min_val, max_val):
        # Clamp quantized layer weights in place (used during training)
        for mod in self.conv_features:
            if isinstance(mod, QuantConv2d):
                mod.weight.data.clamp_(min_val, max_val)
        for mod in self.linear_features:
            if isinstance(mod, QuantLinear):
                mod.weight.data.clamp_(min_val, max_val)

    def forward(self, x):
        for mod in self.conv_features:
            x = mod(x)
        x = torch.flatten(x, 1)
        for mod in self.linear_features:
            x = mod(x)
        return x


def cnv(cfg):
    # Build a CNV model from the [QUANT] and [MODEL] sections of a .ini config
    weight_bit_width = cfg.getint("QUANT", "WEIGHT_BIT_WIDTH")
    act_bit_width = cfg.getint("QUANT", "ACT_BIT_WIDTH")
    in_bit_width = cfg.getint("QUANT", "IN_BIT_WIDTH")
    num_classes = cfg.getint("MODEL", "NUM_CLASSES")
    in_channels = cfg.getint("MODEL", "IN_CHANNELS")
    net = CNV(
        weight_bit_width=weight_bit_width,
        act_bit_width=act_bit_width,
        in_bit_width=in_bit_width,
        num_classes=num_classes,
        in_ch=in_channels,
    )
    return net

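Not part of the diff, but as an illustration of the expected shapes: with the `cnv_2w2a.ini` settings above, the model consumes CIFAR-10-sized inputs scaled to roughly [-1, 1) and outputs one logit per class. A minimal sketch, assuming the `CNV` class above is in scope and Brevitas is installed:

```python
import torch

# Instantiate the 2-bit weight / 2-bit activation CNV directly, mirroring cnv_2w2a.ini
model = CNV(num_classes=10, weight_bit_width=2, act_bit_width=2, in_bit_width=8, in_ch=3)
model.eval()

# Dummy CIFAR-10 batch in the [-1, 1) range expected by the input quantizer
x = torch.rand(4, 3, 32, 32) * 2 - 1
with torch.no_grad():
    logits = model(x)
print(logits.shape)  # torch.Size([4, 10])
```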