import os
import xml.etree.ElementTree as ET

import numpy as np
import torch
import torch.nn.functional as F
import torchvision
from PIL import Image
from segment_anything.utils.transforms import ResizeLongestSide

# Pad an image tensor to a square - based on SAM's preprocessing
def pad_image(x: torch.Tensor, square_length=1024) -> torch.Tensor:
    # x has shape (..., H, W)
    h, w = x.shape[-2:]
    padh = square_length - h
    padw = square_length - w
    x = F.pad(x, (0, padw, 0, padh))  # pad on the right and bottom only
    return x

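# A minimal sketch of what pad_image does (shapes are illustrative):
#   x = torch.zeros(3, 600, 800)
#   pad_image(x).shape  # -> torch.Size([3, 1024, 1024]), zeros on the bottom/right
# F.pad takes the padding as (left, right, top, bottom) over the last two dims.
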
# Custom dataset
class INC_SAMVOC2012Dataset(object):
    def __init__(self, voc_root, type):
        self.voc_root = voc_root
        self.num_of_data = -1
        self.dataset = {}  # Each item is ["filename", "class_name", [xmin, ymin, xmax, ymax]]
        self.resizelongestside = ResizeLongestSide(target_length=1024)
        pixel_mean = [123.675, 116.28, 103.53]
        pixel_std = [58.395, 57.12, 57.375]
        self.pixel_mean = torch.Tensor(pixel_mean).view(-1, 1, 1)
        self.pixel_std = torch.Tensor(pixel_std).view(-1, 1, 1)

        # Read through all the annotation files and build a dictionary.
        # Key of the dictionary is a running index (idx).
        # Value of the dictionary is the filename, class name and bounding box of one object.
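        # e.g. self.dataset[0] = ['2007_000032', 'aeroplane', [104, 78, 375, 183]]
        # (illustrative values - one entry is created per <object> in each XML file)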
        annotation_dir = os.path.join(voc_root, "Annotations")
        files = os.listdir(annotation_dir)
        files = [f for f in files if os.path.isfile(os.path.join(annotation_dir, f))]  # filter out directories
        annotation_files = [os.path.join(annotation_dir, x) for x in files]

        # Get the name list of the segmentation files
        segmentation_dir = os.path.join(voc_root, "SegmentationObject")
        files = os.listdir(segmentation_dir)
        files = [f for f in files if os.path.isfile(os.path.join(segmentation_dir, f))]  # filter out directories
        segmentation_files = files

        # Based on the type (train/val), select the data split
        train_val_dir = os.path.join(voc_root, 'ImageSets/Segmentation/')
        if type == 'train':
            txt_file_name = 'train.txt'
        elif type == 'val':
            txt_file_name = 'val.txt'
        else:
            raise ValueError("Type of dataset should be 'train' or 'val'")

        with open(os.path.join(train_val_dir, txt_file_name), 'r') as f:
            permitted_files = [row.rstrip('\n') for row in f]

        for file in annotation_files:
            file_name = os.path.basename(file).split('.xml')[0]

            if file_name not in permitted_files:
                continue  # skip files that are not in the selected split

            # Check whether there is a matching segmentation file for this annotation
            if file_name + '.png' in segmentation_files:
                tree = ET.parse(file)
                root = tree.getroot()
                for child in root:
                    if child.tag == 'object':
                        details = [file_name]
                        for node in child:
                            if node.tag == 'name':
                                object_name = node.text
                            if node.tag == 'bndbox':
                                for coordinates in node:
                                    if coordinates.tag == 'xmax':
                                        xmax = int(coordinates.text)
                                    if coordinates.tag == 'xmin':
                                        xmin = int(coordinates.text)
                                    if coordinates.tag == 'ymax':
                                        ymax = int(coordinates.text)
                                    if coordinates.tag == 'ymin':
                                        ymin = int(coordinates.text)
                                boundary = [xmin, ymin, xmax, ymax]
                        details.append(object_name)
                        details.append(boundary)
                        self.num_of_data += 1
                        self.dataset[self.num_of_data] = details

    def __len__(self):
        # num_of_data is a 0-based running index, so the sample count is len(self.dataset)
        return len(self.dataset)

    # Preprocess the segmentation mask. Output the binary mask of a single object.
    def preprocess_segmentation(self, filename, bounding_box, pad=True):

        # Read the object segmentation mask (pil_to_tensor returns a (1, H, W) torch tensor)
        segment_mask = Image.open(self.voc_root + 'SegmentationObject/' + filename + '.png')
        segment_mask_np = torchvision.transforms.functional.pil_to_tensor(segment_mask)

        # Crop the segmentation based on the bounding box
        xmin, ymin = int(bounding_box[0]), int(bounding_box[1])
        xmax, ymax = int(bounding_box[2]), int(bounding_box[3])
        cropped_mask = segment_mask.crop((xmin, ymin, xmax, ymax))
        cropped_mask_np = torchvision.transforms.functional.pil_to_tensor(cropped_mask)

        # Count the majority element inside the box
        bincount = np.bincount(cropped_mask_np.reshape(-1))
        bincount[0] = 0  # ignore the black (background) pixels
        if bincount.shape[0] >= 256:
            bincount[255] = 0  # ignore the white (object-boundary) pixels
        majority_element = bincount.argmax()
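        # Illustrative example: if the cropped box contains pixel values
        # [0, 0, 5, 5, 5, 9, 255], zeroing the counts of 0 and 255 leaves
        # 5 as the majority object id for this bounding box.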

        # Based on the majority element, binarize the segmentation mask
        segment_mask_np[(segment_mask_np != 0) & (segment_mask_np != majority_element)] = 0
        segment_mask_np[segment_mask_np == majority_element] = 1

        # Pad the segmentation mask to 1024x1024 (for batching in a dataloader)
        if pad:
            segment_mask_np = pad_image(segment_mask_np)

        return segment_mask_np

    # Preprocess the image into an appropriate format for SAM
    def preprocess_image(self, img):
        # Mirrors SamPredictor.set_image() in predictor.py
        img = np.array(img)
        input_image = self.resizelongestside.apply_image(img)
        input_image_torch = torch.as_tensor(input_image, device='cpu')
        input_image_torch = input_image_torch.permute(2, 0, 1).contiguous()
        input_image_torch = (input_image_torch - self.pixel_mean) / self.pixel_std  # normalize
        original_size = img.shape[:2]
        input_size = tuple(input_image_torch.shape[-2:])

        return pad_image(input_image_torch), original_size, input_size
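    # Illustrative shapes: for a 500x375 (WxH) JPEG, the array is (375, 500, 3);
    # ResizeLongestSide scales the longest side to 1024, so original_size == (375, 500),
    # input_size == (768, 1024), and the returned image is padded to (3, 1024, 1024).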

    def __getitem__(self, idx):
        data = self.dataset[idx]
        filename, classname = data[0], data[1]
        bounding_box = data[2]

        # Ground-truth mask: preprocessing without padding
        mask_gt = self.preprocess_segmentation(filename, bounding_box, pad=False)

        # Read and preprocess the image
        image, original_size, input_size = self.preprocess_image(Image.open(self.voc_root + 'JPEGImages/' + filename + '.jpg'))
        prompt = bounding_box  # bounding box prompt - input_boxes x1, y1, x2, y2
        training_data = {}
        training_data['image'] = image
        training_data['original_size'] = original_size
        training_data['input_size'] = input_size
        training_data['ground_truth_mask'] = mask_gt
        training_data['prompt'] = prompt
        return (training_data, mask_gt)  # data, label


class INC_SAMVOC2012Dataloader:
    def __init__(self, batch_size, **kwargs):
        self.batch_size = batch_size
        self.dataset = []
        ds = INC_SAMVOC2012Dataset(kwargs['voc_root'], kwargs['type'])
        # Add (input_data, label) pairs into self.dataset
        for i in range(len(ds)):
            self.dataset.append(ds[i])

    def __iter__(self):
        # Samples are yielded one at a time; batch_size is kept for the
        # dataloader interface, but no batching is performed here.
        for input_data, label in self.dataset:
            yield input_data, label
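
# Minimal usage sketch (the VOC root below is an illustrative local path,
# not part of this module; it should point at an extracted VOC2012 devkit):
if __name__ == '__main__':
    dataloader = INC_SAMVOC2012Dataloader(batch_size=1,
                                          voc_root='./VOCdevkit/VOC2012/',
                                          type='val')
    for input_data, label in dataloader:
        print(input_data['image'].shape, label.shape)
        break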