# quantization/image_classification/migraphx/resnet50/e2e_migraphx_resnet_example.py

import os
import onnx
import glob
import scipy.io
import numpy as np
import logging
from PIL import Image
import onnx
import argparse
import onnxruntime
from onnxruntime.quantization import CalibrationDataReader, create_calibrator, write_calibration_table

def parse_input_args():
    """Parse the command-line options of the MIGraphX ResNet50 example.

    Options are read from ``sys.argv``.

    Returns:
        argparse.Namespace with the attributes ``model``, ``fp16``, ``fp32``,
        ``fp8``, ``image_dir``, ``batch``, ``cal_size``, ``exhaustive_tune``,
        ``cache`` and ``cache_name``.
    """
    parser = argparse.ArgumentParser()

    parser.add_argument(
        "--model",
        required=False,
        default='./resnet50-v2-7.onnx',
        help='Path of the ONNX model. Default is ./resnet50-v2-7.onnx',
    )

    parser.add_argument(
        "--fp16",
        action="store_true",
        required=False,
        default=False,
        help='Perform fp16 quantization in addition to int8',
    )

    parser.add_argument(
        "--fp32",
        action="store_true",
        required=False,
        default=False,
        help='Perform no quantization',
    )

    parser.add_argument(
        "--fp8",
        action="store_true",
        required=False,
        default=False,
        help='Perform fp8 quantization instead of int8',
    )

    parser.add_argument(
        "--image_dir",
        required=False,
        default="./ILSVRC2012",
        help='Target DIR for images to infer. Default is ./ILSVRC2012',
    )

    parser.add_argument(
        "--batch",
        required=False,
        default=20,
        help='Batch size of images per inference',
        type=int,
    )

    parser.add_argument(
        "--cal_size",
        required=False,
        default=1000,
        help='Number of images used for calibration',
        type=int,
    )

    parser.add_argument(
        "--exhaustive_tune",
        action="store_true",
        required=False,
        default=False,
        help='Enable MIGraphX Exhaustive tune before compile. Default False',
    )

    # "--cache" is kept for backward compatibility. Because it is a store_true
    # flag whose default is already True, it cannot switch caching off on its
    # own; "--no_cache" below writes False into the same destination.
    parser.add_argument(
        "--cache",
        action="store_true",
        required=False,
        default=True,
        help='cache the compiled model between runs. Saves quantization and compile time. Default true',
    )

    parser.add_argument(
        "--no_cache",
        dest="cache",
        action="store_false",
        required=False,
        help='Do not cache the compiled model between runs',
    )

    parser.add_argument(
        "--cache_name",
        required=False,
        default="./cached_model.mxr",
        help='Name and path of the compiled model cache. Default: ./cached_model.mxr',
    )

    return parser.parse_args()

class ImageNetDataReader(CalibrationDataReader):
    """Data reader that feeds preprocessed images from ``<image_folder>/val``.

    Images are taken in sorted filename order. Each refill of the internal
    iterator loads ``stride`` images starting at ``start_index`` and then
    advances ``start_index`` by ``stride``; reading stops once ``start_index``
    reaches ``end_index``.
    """

    def __init__(self,
                 image_folder,
                 width=224,
                 height=224,
                 start_index=0,
                 end_index=0,
                 stride=1,
                 batch_size=1,
                 model_path='augmented_model.onnx',
                 input_name='data'):
        '''
        :param image_folder: dataset root folder; images are read from its "val" sub-folder
        :param width: image width after resizing
        :param height: image height after resizing
        :param start_index: index (in sorted filename order) of the first image to read
        :param end_index: index at which reading stops; 0 means the number of entries in the folder
        :param stride: number of images loaded per refill; values below 1 are treated as 1
        :param batch_size: number of images per inference input
        :param model_path: model name and path
        :param input_name: model input name
        '''

        self.image_folder = image_folder + "/val"
        self.model_path = model_path
        self.preprocess_flag = True
        self.enum_data_dicts = iter([])
        self.datasize = 0
        self.width = width
        self.height = height
        self.start_index = start_index
        self.end_index = len(os.listdir(self.image_folder)) if end_index == 0 else end_index
        self.stride = stride if stride >= 1 else 1
        self.batch_size = batch_size
        self.input_name = input_name

    def get_dataset_size(self):
        """Return the number of entries in the image folder."""
        return len(os.listdir(self.image_folder))

    def get_input_name(self):
        """Fill in ``self.input_name`` from the model when it is not set.

        Nothing is returned; the name of the model's first input is stored on
        the instance. When a name is already set, the model is not loaded.
        """
        if self.input_name:
            return
        session = onnxruntime.InferenceSession(self.model_path, providers=['CPUExecutionProvider'])
        self.input_name = session.get_inputs()[0].name

    def get_next(self):
        """Return the next ``{input_name: data}`` dict, or None when exhausted."""
        iter_data = next(self.enum_data_dicts, None)
        if iter_data:
            return iter_data

        # Reset to an empty iterator rather than None so that calling
        # get_next() again after exhaustion keeps returning None instead of
        # raising TypeError from next(None, ...).
        self.enum_data_dicts = iter([])
        if self.start_index >= self.end_index:
            return None

        data = self.load_serial() if self.batch_size == 1 else self.load_batches()
        self.start_index += self.stride
        self.enum_data_dicts = iter(data)
        return next(self.enum_data_dicts, None)

    def load_serial(self):
        """Load ``stride`` images and return one single-image input dict per image."""
        nchw_data_list, _, _ = self.preprocess_imagenet(self.image_folder, self.height, self.width,
                                                        self.start_index, self.stride)
        # Each element already carries a leading axis of size 1.
        return [{self.input_name: nchw_data} for nchw_data in nchw_data_list]

    def load_batches(self):
        """Load ``stride`` images and return them as a list of batched input dicts.

        Loading stops early at the first batch for which no image could be read.
        """
        batches = []
        for offset in range(0, self.stride, self.batch_size):
            nchw_data_list, _, _ = self.preprocess_imagenet(self.image_folder, self.height, self.width,
                                                            self.start_index + offset, self.batch_size)
            if nchw_data_list.size == 0:
                break

            # preprocess_imagenet returns (N, 1, C, H, W); drop the per-image
            # singleton axis to obtain an (N, C, H, W) batch.
            batches.append({self.input_name: np.squeeze(nchw_data_list, axis=1)})

        return batches

    @staticmethod
    def _preprocess_image(image, height=224, width=224):
        """Resize and normalize one PIL image into a float32 (3, height, width) array.

        Returns None (after printing the offending shape) when the image does
        not end up with exactly three channels.
        """
        resized = image.resize((width, height), Image.Resampling.LANCZOS)
        if resized.mode in ("CMYK", "RGBA"):
            resized = resized.convert("RGB")
        pixels = np.asarray(resized).astype(np.float32)
        if pixels.ndim == 2:
            # Single-channel image: replicate it into three identical channels.
            pixels = np.stack([pixels] * 3)
        else:
            # HWC -> CHW
            pixels = pixels.transpose([2, 0, 1])

        if pixels.shape[0] != 3:
            print(pixels.shape)
            return None

        # Per-channel mean/std; the sums evaluate to roughly
        # [0.485, 0.456, 0.406] and [0.229, 0.224, 0.225].
        mean = np.array([0.079, 0.05, 0]) + 0.406
        std = np.array([0.005, 0, 0.001]) + 0.224
        for channel in range(3):
            plane = pixels[channel, :, :]
            pixels[channel, :, :] = (plane / 255 - mean[channel]) / std[channel]
        return pixels

    def preprocess_imagenet(self, images_folder, height, width, start_index=0, size_limit=0):
        '''
        Loads a batch of images and preprocess them
        parameter images_folder: path to folder storing images
        parameter height: image height in pixels
        parameter width: image width in pixels
        parameter start_index: image index to start with
        parameter size_limit: number of images to load. Default is 0 which means all images are picked.
                              All images are also picked when the folder holds fewer than size_limit images.
        return: tuple (batch_data, filenames, image_size_list). batch_data has shape (N, 1, 3, height, width),
                or shape (0,) when no image was loaded. filenames and image_size_list only cover the images
                that were loaded successfully; image_size_list holds the original (height, width) of each.
        '''
        image_names = sorted(os.listdir(images_folder))
        if size_limit > 0 and len(image_names) >= size_limit:
            end_index = min(start_index + size_limit, len(image_names))
            batch_filenames = image_names[start_index:end_index]
        else:
            batch_filenames = image_names

        unconcatenated_batch_data = []
        loaded_filenames = []
        image_size_list = []

        for image_name in batch_filenames:
            image_filepath = images_folder + '/' + image_name
            # The context manager closes the underlying file once the pixels are read.
            with Image.open(image_filepath) as img:
                image_data = self._preprocess_image(img, height=height, width=width)
                original_width, original_height = img.size
            if image_data is None:
                print(image_name)
                continue
            unconcatenated_batch_data.append(np.expand_dims(image_data, 0))
            loaded_filenames.append(image_name)
            image_size_list.append(np.array([original_height, original_width], dtype=np.float32).reshape(1, 2))

        if unconcatenated_batch_data:
            batch_data = np.stack(unconcatenated_batch_data, axis=0)
        else:
            # Callers detect "nothing loaded" through batch_data.size == 0.
            batch_data = np.empty((0,), dtype=np.float32)
        return batch_data, loaded_filenames, image_size_list

    def get_synset_id(self, image_folder, offset, dataset_size):
        """Build one-hot ground-truth labels for a slice of the validation images.

        :param image_folder: dataset root containing "val", "devkit/data" and "synset_words.txt"
        :param offset: index (in sorted filename order) of the first image of the slice
        :param dataset_size: number of images in the slice
        :return: float32 array of shape (number of images in the slice, 1000)
        """
        ilsvrc2012_meta = scipy.io.loadmat(image_folder + "/devkit/data/meta.mat")
        id_to_synset = {}
        for i in range(1000):
            entry = ilsvrc2012_meta["synsets"][i, 0]
            id_to_synset[int(entry[0][0][0])] = entry[1][0]

        # The line number of a synset in synset_words.txt is used as its class index.
        synset_to_id = {}
        with open(image_folder + "/synset_words.txt", "r") as words_file:
            for index, line in enumerate(words_file):
                synset_to_id[line.split(" ")[0]] = index

        with open(image_folder + "/devkit/data/ILSVRC2012_validation_ground_truth.txt", "r") as truth_file:
            ground_truth = [int(value) for value in truth_file.read().strip().split("\n")]

        image_names = sorted(os.listdir(image_folder + "/val"))[offset:offset + dataset_size]
        # The 1-based sequence number is the last "_"-separated field of the file name.
        seq_num = [int(name.split("_")[-1].split(".")[0]) for name in image_names]
        ilsvrc_ids = [ground_truth[seq - 1] for seq in seq_num]
        synset_id = np.array([synset_to_id[id_to_synset[ilsvrc_id]] for ilsvrc_id in ilsvrc_ids],
                             dtype=np.int64)

        # one-hot encoding
        synset_id_onehot = np.zeros((len(synset_id), 1000), dtype=np.float32)
        synset_id_onehot[np.arange(len(synset_id)), synset_id] = 1.0
        return synset_id_onehot


class ImageClassificationEvaluator:
    """Run a model over a data reader and report top-1 / top-5 accuracy."""

    def __init__(self,
                 model_path,
                 synset_id,
                 flags,
                 data_reader: "CalibrationDataReader",
                 providers=None):
        '''
        :param model_path: ONNX model to validate
        :param synset_id: one-hot ground truth, one row per evaluated image
        :param flags: parsed command-line options; predict() reads fp8, fp16, fp32, cache, cache_name,
                      exhaustive_tune and, when present, calibration_table / native_calibration_table
        :param data_reader: user implemented object to read in and preprocess calibration dataset
                            based on CalibrationDataReader Interface
        :param providers: ORT execution providers in priority order. Defaults to
                          ["MIGraphXExecutionProvider"].
        '''

        self.model_path = model_path
        self.data_reader = data_reader
        # Keep the options on the instance instead of relying on a module-level global.
        self.flags = flags
        # A fresh list per instance avoids sharing one mutable default between instances.
        self.providers = ["MIGraphXExecutionProvider"] if providers is None else list(providers)
        self.prediction_result_list = []
        self.synset_id = synset_id

    def get_result(self):
        """Return the list of raw outputs collected by the last predict() call."""
        return self.prediction_result_list

    def _migraphx_options(self):
        """Build the MIGraphX provider options dict from the stored flags."""
        flags = self.flags
        options = {
            "migraphx_fp8_enable": flags.fp8 and not flags.fp32,
            "migraphx_int8_enable": not (flags.fp8 or flags.fp32),
            "migraphx_fp16_enable": flags.fp16 and not flags.fp32,
            "migraphx_save_compiled_model": flags.cache,
            "migraphx_save_model_path": flags.cache_name,
            "migraphx_load_compiled_model": flags.cache,
            "migraphx_load_model_path": flags.cache_name,
            "migraphx_exhaustive_tune": flags.exhaustive_tune,
        }
        # The calibration attributes may be missing from the flags (e.g. when
        # no quantization was requested); only forward them when they exist.
        calibration_table = getattr(flags, "calibration_table", None)
        if calibration_table is not None:
            options["migraphx_int8_calibration_table_name"] = calibration_table
            options["migraphx_use_native_calibration_table"] = getattr(
                flags, "native_calibration_table", "False")
        return options

    def predict(self):
        """Run inference on every input of the data reader and store the outputs."""
        sess_options = onnxruntime.SessionOptions()
        sess_options.log_severity_level = 2
        sess_options.log_verbosity_level = 2
        sess_options.graph_optimization_level = onnxruntime.GraphOptimizationLevel.ORT_DISABLE_ALL

        migraphx_options = self._migraphx_options()
        # Attach the options to the MIGraphX entry; other providers are passed through as given.
        providers = [
            (provider, migraphx_options) if provider == "MIGraphXExecutionProvider" else provider
            for provider in self.providers
        ]
        session = onnxruntime.InferenceSession(self.model_path, sess_options=sess_options,
                                               providers=providers)

        inference_outputs_list = []
        while True:
            inputs = self.data_reader.get_next()
            if not inputs:
                break
            inference_outputs_list.append(session.run(None, inputs))
        self.prediction_result_list = inference_outputs_list

    def top_k_accuracy(self, truth, prediction, k=1):
        '''From https://github.com/chainer/chainer/issues/606

        :param truth: one-hot ground truth of shape (N, classes)
        :param prediction: scores of shape (N, classes)
        :param k: a sample counts as correct when its true class is among the k highest scores
        :return: fraction of correct samples
        '''
        y = np.argsort(prediction)[:, -k:]
        return np.any(y.T == truth.argmax(axis=1), axis=0).mean()

    def evaluate(self, prediction_results):
        """Print top-1 and top-5 accuracy of ``prediction_results`` against ``synset_id``.

        :param prediction_results: list with one entry per batch; the first element of each
                                   entry is the (batch, classes) score array
        """
        if not prediction_results:
            logging.warning("No prediction results to evaluate")
            return

        # Concatenating the per-batch outputs copes with a smaller final batch
        # and with any number of classes.
        y_prediction = np.concatenate(
            [np.asarray(res[0], dtype=np.float32) for res in prediction_results], axis=0)
        print("top 1: ", self.top_k_accuracy(self.synset_id, y_prediction, k=1))
        print("top 5: ", self.top_k_accuracy(self.synset_id, y_prediction, k=5))


def convert_model_batch_to_dynamic(model_path):
    """Make the first dimension of the model's first real input symbolic.

    Graph inputs that are also initializers are skipped. When the first
    dimension of the first remaining input has no symbolic name yet, it is
    named 'N', shapes are re-inferred and the model is saved next to the
    original as "<model path without extension>_dynamic.onnx". Otherwise the
    model is left untouched.

    :param model_path: path of the ONNX model to load
    :return: [path of the model to use, name of the first real input]
    """
    model = onnx.load(model_path)
    initializer_names = {initializer.name for initializer in model.graph.initializer}
    inputs = [node for node in model.graph.input if node.name not in initializer_names]
    input_name = inputs[0].name
    dim = inputs[0].type.tensor_type.shape.dim
    if not dim[0].dim_param:
        dim[0].dim_param = 'N'
        model = onnx.shape_inference.infer_shapes(model)
        # splitext only strips the extension. Splitting on the first "." would
        # turn a path such as "./resnet50-v2-7.onnx" into an empty base name.
        base_path, _ = os.path.splitext(model_path)
        model_path = base_path + "_dynamic.onnx"
        onnx.save(model, model_path)
    return [model_path, input_name]


def get_dataset_size(dataset_path, calibration_dataset_size, batch_size=None):
    """Split the images under ``<dataset_path>/val`` into calibration and prediction sets.

    Both sizes are rounded down to a multiple of the batch size.

    :param dataset_path: dataset root folder containing the "val" sub-folder
    :param calibration_dataset_size: requested number of calibration images; when it exceeds
                                     the dataset, half of the dataset is used instead
    :param batch_size: images per batch. When omitted, the module-level ``batch_size``
                       is used if it exists (as when run as a script), otherwise 1.
    :return: [calibration_dataset_size, prediction_dataset_size]
    :raises ValueError: if the batch size is smaller than 1
    """
    if batch_size is None:
        # Backward compatibility: earlier callers relied on a global set by the script.
        batch_size = globals().get("batch_size", 1)
    if batch_size < 1:
        raise ValueError("batch_size must be at least 1, got {}".format(batch_size))

    total_dataset_size = len(os.listdir(os.path.join(dataset_path, "val")))
    if calibration_dataset_size > total_dataset_size:
        logging.warning(
            "calibration data size is bigger than available dataset. Will assign half of the dataset for calibration")
        calibration_dataset_size = total_dataset_size // 2
    calibration_dataset_size = (calibration_dataset_size // batch_size) * batch_size
    if calibration_dataset_size == 0:
        logging.warning("No dataset is assigned for calibration. Please use bigger dataset")

    prediction_dataset_size = ((total_dataset_size - calibration_dataset_size) // batch_size) * batch_size
    if prediction_dataset_size <= 0:
        logging.warning("No dataset is assigned for evaluation. Please use bigger dataset")
    return [calibration_dataset_size, prediction_dataset_size]


if __name__ == '__main__':
    '''
    MIGraphX EP INT8 Inference on Resnet model

    The script is using ILSVRC2012 ImageNet dataset for calibration and prediction.
    Please prepare the dataset as below, 
    1. Create dataset folder 'ILSVRC2012' in workspace.
    2. Download ILSVRC2012 validation dataset and development kit from http://www.image-net.org/challenges/LSVRC/2012/downloads.
    3. Extract validation dataset JPEG files to 'ILSVRC2012/val'.
    4. Extract development kit to 'ILSVRC2012/devkit'. Two files in the development kit are used, 'ILSVRC2012_validation_ground_truth.txt' and 'meta.mat'.
       These are also available to download at https://github.com/miraclewkf/MobileNetV2-PyTorch/tree/master/ImageNet/ILSVRC2012_devkit_t12/data
    5. Download 'synset_words.txt' from https://github.com/HoldenCaulfieldRye/caffe/blob/master/data/ilsvrc12/synset_words.txt into 'ILSVRC2012/'.

    Please download Resnet50 model from ONNX model zoo https://github.com/onnx/models/blob/master/vision/classification/resnet/model/resnet50-v2-7.tar.gz
    Untar the model into the workspace
    '''
    # NOTE: `flags` and `batch_size` are deliberately left at module scope;
    # other definitions in this file may read them as globals.
    flags = parse_input_args()

    # Dataset settings
    model_path = flags.model
    ilsvrc2012_dataset_path = flags.image_dir
    augmented_model_path = "./augmented_model.onnx"
    batch_size = flags.batch
    calibration_dataset_size = 0 if flags.fp32 else flags.cal_size  # Size of dataset for calibration

    # Suffix describing the requested precision, e.g. "_int8", "_fp8" or
    # "_fp16_int8"; it stays empty when --fp32 disables quantization.
    precision = ""
    if not flags.fp32:
        precision = "_fp8" if flags.fp8 else "_int8"
        if flags.fp16:
            precision = "_fp16" + precision

    # Always define the calibration attributes: they are read when the
    # inference session is configured, even if quantization is disabled.
    flags.calibration_table = "calibration_cal" + str(flags.cal_size) + precision + ".flatbuffers"
    flags.native_calibration_table = "False"

    # A calibration table is only needed when quantization is requested, and
    # an existing table from a previous run is reused.
    calibration_table_generation_enable = not flags.fp32
    if calibration_table_generation_enable and os.path.isfile("./" + flags.calibration_table):
        calibration_table_generation_enable = False
        print("Found previous calibration: " + flags.calibration_table + ". Skipping generating table")

    execution_provider = ["MIGraphXExecutionProvider"]

    # Convert static batch to dynamic batch
    [new_model_path, input_name] = convert_model_batch_to_dynamic(model_path)

    # Get calibration and prediction dataset size
    [calibration_dataset_size, prediction_dataset_size] = get_dataset_size(ilsvrc2012_dataset_path,
                                                                           calibration_dataset_size)

    # Generate the calibration table
    if calibration_table_generation_enable:
        print("Generating Calibration Table")
        calibrator = create_calibrator(new_model_path, [], augmented_model_path=augmented_model_path)
        calibrator.set_execution_providers(["ROCMExecutionProvider"])
        data_reader = ImageNetDataReader(ilsvrc2012_dataset_path,
                                         start_index=0,
                                         end_index=calibration_dataset_size,
                                         stride=calibration_dataset_size,
                                         batch_size=batch_size,
                                         model_path=augmented_model_path,
                                         input_name=input_name)
        calibrator.collect_data(data_reader)
        cal_tensors = calibrator.compute_data()

        # Flatten each tensor's range into a list of plain floats for serialization.
        serial_cal_tensors = {}
        for tensor_name, tensor_data in cal_tensors.data.items():
            serial_cal_tensors[tensor_name] = [float(x[0]) for x in tensor_data.range_value]

        print("Writing calibration table to:" + flags.calibration_table)
        write_calibration_table(serial_cal_tensors)
        # Give the freshly written "./calibration.flatbuffers" its precision-specific name.
        os.rename("./calibration.flatbuffers", flags.calibration_table)
        print("Write complete")

    # Run prediction in MIGraphX EP on the images that follow the calibration set
    data_reader = ImageNetDataReader(ilsvrc2012_dataset_path,
                                     start_index=calibration_dataset_size,
                                     end_index=calibration_dataset_size + prediction_dataset_size,
                                     stride=prediction_dataset_size,
                                     batch_size=batch_size,
                                     model_path=new_model_path,
                                     input_name=input_name)
    print("Completed Data Reader")
    synset_id = data_reader.get_synset_id(ilsvrc2012_dataset_path, calibration_dataset_size,
                                          prediction_dataset_size)  # Generate synset id
    print("Prepping Evalulator")
    evaluator = ImageClassificationEvaluator(new_model_path, synset_id, flags, data_reader, providers=execution_provider)
    print("Performing Predictions")
    evaluator.predict()
    print("Read out answer")
    result = evaluator.get_result()
    evaluator.evaluate(result)