openvino/tools/pot/tests/test_scales.py

# Copyright (C) 2020-2022 Intel Corporation
# SPDX-License-Identifier: Apache-2.0

import json
import os

from copy import deepcopy
import numpy as np
import pytest
from addict import Dict

from openvino.tools.pot.algorithms.algorithm_selector import COMPRESSION_ALGORITHMS
from openvino.tools.pot.engines.ac_engine import ACEngine
from openvino.tools.pot.graph import load_model
from openvino.tools.pot.graph.node_utils import get_node_inputs, get_node_input, get_node_value
from openvino.tools.pot.graph import model_utils as mu
from openvino.tools.pot.statistics.collector import StatisticsCollector

class NumpyEncoder(json.JSONEncoder):
    """ Special json encoder for numpy types """
    # pylint: disable=W0221, E0202
    def default(self, o):
        if isinstance(o, np.integer):
            return int(o)
        if isinstance(o, np.floating):
            return float(o)
        if isinstance(o, np.ndarray):
            return o.tolist()
        return json.JSONEncoder.default(self, o)

def get_fq_nodes_stats_algo(model, preset, bits, is_weights, clipping_value=None):
    test_dir = os.path.join(os.path.dirname(os.path.realpath(__file__)),
                            './data/reference_scale/test_data')

    config = _get_pytorch_accuracy_checker_config(test_dir)

    compression_config = Dict(
        {
            'name': 'MinMaxQuantization',
            'stat_subset_size': 1,
            'preset': preset,
            'target_device': 'CPU',
            'activations': {
                'bits': bits,
                'range_estimator': {
                    'max': {
                        'clipping_value': clipping_value
                    }
                }

            },
            'weights': {
                'bits': bits,
                'mode': 'symmetric' if preset == 'performance' else 'asymmetric'
            }
        })

    engine = ACEngine(config)
    compression_config.subset_indices = [0]
    algo = COMPRESSION_ALGORITHMS.get('MinMaxQuantization')(compression_config, engine)

    model = load_model(model.model_params)

    stats_collector = StatisticsCollector(engine)
    algo.register_statistics(model, stats_collector)
    stats_collector.compute_statistics(model)

    model = algo.run(model)
    out = {}
    for fq in mu.get_nodes_by_type(model, ['FakeQuantize']):
        fq_inputs = get_node_inputs(fq)
        if is_weights and fq_inputs[0].type == 'Const':
            min_weights = np.reshape(fq_inputs[1].value, (fq_inputs[1].value.shape[0]))
            max_weights = np.reshape(fq_inputs[2].value, (fq_inputs[2].value.shape[0]))
            out[fq.name] = {'low_level': min_weights, 'high_level': max_weights}
        elif not is_weights and fq_inputs[0].type != 'Const':
            if not fq_inputs[1].value.shape:
                out[fq.name] = {'low_level': fq_inputs[1].value, 'high_level': fq_inputs[2].value}
            else:
                min_act = np.reshape(fq_inputs[1].value, (fq_inputs[1].value.shape[1]))
                max_act = np.reshape(fq_inputs[2].value, (fq_inputs[2].value.shape[1]))
                out[fq.name] = {'low_level': min_act, 'high_level': max_act}
    return out


def get_ref_stats(stats_path):
    with open(stats_path) as json_file:
        return json.load(json_file)


CONFIGURATIONS = [('performance', 8,
                   os.path.join(os.path.dirname(os.path.realpath(__file__)),
                                './data/reference_scale/mobilenet-v2-pytorch_performance_activations.json'), None),
                  ('performance', 8,
                   os.path.join(os.path.dirname(os.path.realpath(__file__)),
                                './data/reference_scale/mobilenet-v2-pytorch_clipped_activations.json'), 3.0),
                  ('accuracy', 8,
                   os.path.join(os.path.dirname(os.path.realpath(__file__)),
                                './data/reference_scale/mobilenet-v2-pytorch_accuracy_activations.json'), None)
                  ]


@pytest.mark.parametrize(
    'preset, bits, stats_path, clipping_value', CONFIGURATIONS,
    ids=['symmetric_{}_bits_{}_clipping_value_{}'.format(m[0], m[1], m[3]) for m in CONFIGURATIONS]
)
def test_activation_scales(tmp_path, models, preset, bits, stats_path, clipping_value):

    def normalize(_list):
        norm_coef = 0
        for fq_name in _list:
            min_level, max_level = _list[fq_name]['low_level'], _list[fq_name]['high_level']
            norm_coef = max(norm_coef, max(abs(np.mean(min_level)), abs(np.mean(max_level))))

        res = {}
        for item_name in _list:
            res[item_name] = (np.mean(_list[item_name]['low_level']) / norm_coef,
                              np.mean(_list[item_name]['high_level']) / norm_coef)

        return res

    model = models.get('mobilenet-v2-pytorch', 'pytorch', tmp_path)

    ref_nodes = get_ref_stats(stats_path)
    nodes = normalize(get_fq_nodes_stats_algo(model, preset, bits, False,
                                              clipping_value=clipping_value))
    local_path = os.path.join(tmp_path, '{}.json'.format(stats_path.split("_")[-2]))
    dump_intermediate_scales(local_path, nodes)

    assert len(ref_nodes) == len(nodes)
    processed_nodes = []
    eps = 1e-3
    for ref_name in ref_nodes:

        ref_min, ref_max = ref_nodes[ref_name]
        node_min, node_max = nodes[ref_name]

        error = max(abs(node_min - ref_min), abs(node_max - ref_max))

        if error <= eps and ref_name not in processed_nodes:
            processed_nodes.append((
                ref_name, abs(node_min - ref_min), abs(node_max - ref_max)))

    assert len(processed_nodes) == len(ref_nodes)


def test_weights_scales(tmp_path, models):
    path_to_weights = os.path.join(os.path.dirname(os.path.realpath(__file__)),
                                   './data/reference_scale/mobilenet-v2-pytorch_weights.json')

    model = models.get('mobilenet-v2-pytorch', 'pytorch', tmp_path)
    ref_weights = get_ref_stats(path_to_weights)
    weights = get_fq_nodes_stats_algo(model, False, 8, True)
    local_path = os.path.join(tmp_path, '{}.json'.format('mv2_weights'))
    dump_intermediate_scales(local_path, weights)

    for fq_name in weights:
        item_min, item_max = weights[fq_name]['low_level'], weights[fq_name]['high_level']
        if not item_min.shape:
            continue
        shape = item_min.shape[0]

        ref_min, ref_max = ref_weights[fq_name]['low_level'], ref_weights[fq_name]['high_level']
        assert_flag = False

        if np.array_equal(ref_min, item_min) and \
                np.array_equal(ref_max, item_max):
            assert_flag = True

        if not assert_flag:
            print(shape)

        assert assert_flag


def load_refs(path_to_refs):
    with open(path_to_refs) as json_file:
        return json.load(json_file)


CONFIGURATIONS = [
    ('mobilenet-v2-pytorch', 'pytorch', 'symmetric'),
    ('mobilenet-v2-pytorch', 'pytorch', 'asymmetric'),
    ('mobilenet-v2-pytorch', 'pytorch', 'mixed'),
    ('resnet-50-pytorch', 'pytorch', 'symmetric'),
    ('resnet-50-pytorch', 'pytorch', 'asymmetric'),
    ('resnet-50-pytorch', 'pytorch', 'mixed'),
    ('googlenet-v3', 'tf', 'symmetric'),
    ('googlenet-v3', 'tf', 'asymmetric'),
    ('googlenet-v3', 'tf', 'mixed'),
]

REFERENCES_DIR = os.path.join(os.path.dirname(os.path.realpath(__file__)),
                              './data/reference_fake_quantize_conf')


@pytest.mark.parametrize(
    'model_name, model_framework, algo_mode', CONFIGURATIONS,
    ids=['{}_{}_{}'.format(m[0], m[1], m[2]) for m in CONFIGURATIONS]
)
def test_fake_quantize_configurations(tmp_path, models, model_name, model_framework, algo_mode):
    test_dir = os.path.join(os.path.dirname(os.path.realpath(__file__)),
                            './data/reference_scale/test_data')

    config = _get_pytorch_accuracy_checker_config(test_dir) \
        if model_framework == 'pytorch' else _get_tf_accuracy_checker_config(test_dir)

    if algo_mode == 'symmetric':
        activations_mode, weights_mode, level_low = 'symmetric', 'symmetric', -127
    elif algo_mode == 'asymmetric':
        activations_mode, weights_mode, level_low = 'asymmetric', 'asymmetric', -128
    else:
        activations_mode, weights_mode, level_low = 'asymmetric', 'symmetric', -127

    compression_config = Dict({
        'name': 'MinMaxQuantization',
        'stat_subset_size': 1,
        'preset': 'performance',
        'target_device': 'CPU',
        'activations': {
            'bits': 8,
            'mode': activations_mode
        },
        'weights': {
            'bits': 8,
            'mode': weights_mode,
            'granularity': 'perchannel',
            'level_low': level_low,
            'level_high': 127
        }
    })

    def _make_list(x):
        if isinstance(x, np.ndarray):
            x = x.tolist()
        if isinstance(x, list):
            return x
        return [x]

    engine = ACEngine(config)
    compression_config.subset_indices = [0]
    algo = COMPRESSION_ALGORITHMS.get('MinMaxQuantization')(compression_config, engine)
    model = models.get(model_name, model_framework, tmp_path)
    model = load_model(model.model_params)

    stats_collector = StatisticsCollector(engine)
    algo.register_statistics(model, stats_collector)
    stats_collector.compute_statistics(model)

    model = algo.run(model)

    refs_path = os.path.join(REFERENCES_DIR, '{}_{}.json'.format(model_name, algo_mode))
    local_path = os.path.join(tmp_path, '{}.json'.format(model_name))

    ref_exists = os.path.isfile(refs_path)

    refs = load_refs(refs_path) if ref_exists else {}
    ref_file = None if ref_exists else open(refs_path, 'w')
    local_file = open(local_path, 'w')
    model_values = {}

    eps = 1e-3
    fq_list = mu.get_nodes_by_type(model, ['FakeQuantize'])
    for fq in sorted(fq_list, key=lambda item: item.name):
        min_levels, max_levels = tuple([get_node_value(node)
                                        for node in get_node_inputs(fq)[1:3]])
        fq_name = fq.name
        if get_node_input(fq, 0).type == 'Const':
            min_levels = min_levels.reshape(min_levels.shape[0])
            max_levels = max_levels.reshape(max_levels.shape[0])
        else:
            if not min_levels.shape and not max_levels.shape:
                pass
            else:
                min_levels = min_levels.reshape(min_levels.shape[1])
                max_levels = max_levels.reshape(max_levels.shape[1])

        min_levels = _make_list(min_levels)
        max_levels = _make_list(max_levels)
        model_values[fq_name] = {'max': max_levels, 'min': min_levels}

    if not ref_exists:
        json.dump(model_values, ref_file)
        return
    json.dump(model_values, local_file)

    for ref_name in refs:
        refs_min_levels = _make_list(refs[ref_name]['min'])
        refs_max_levels = _make_list(refs[ref_name]['max'])
        min_levels = model_values[ref_name]['min']
        max_levels = model_values[ref_name]['max']

        for min_level, max_level, ref_min, ref_max in zip(
                min_levels, max_levels, refs_min_levels, refs_max_levels):
            assert abs(min_level - ref_min) < eps
            assert abs(max_level - ref_max) < eps


def _get_pytorch_accuracy_checker_config(path_to_dataset):
    return Dict({
        'log_dir': './logs',
        'models': [{
            'name': 'test_conf',
            'launchers': [{
                'framework': 'dlsdk',
                'device': 'CPU',
                'adapter': 'classification'}],
            'datasets': [
                {
                    'name': 'test_dataset',
                    'data_source': path_to_dataset,
                    'reader': 'pillow_imread',
                    'preprocessing':
                        [
                            {
                                'type': 'resize',
                                'size': 256,
                                'aspect_ratio_scale': 'greater',
                                'interpolation': 'BILINEAR',
                                'use_pillow': True
                            },
                            {
                                'type': 'crop',
                                'size': 224,
                                'use_pillow': True
                            },
                            {
                                'type': 'bgr_to_rgb'
                            }]
                }
            ]}]})


def _get_tf_accuracy_checker_config(path_to_dataset):
    return Dict({
        'log_dir': './logs',
        'models': [{
            'name': 'test_conf',
            'launchers': [{
                'framework': 'dlsdk',
                'device': 'CPU',
                'adapter': 'classification'}],
            'datasets': [
                {
                    'name': 'test_dataset',
                    'data_source': path_to_dataset,
                    'reader': 'pillow_imread',
                    'preprocessing':
                        [
                            {
                                'type': 'crop',
                                'central_fraction': 0.875
                            },
                            {
                                'type': 'resize',
                                'size': 299
                            }]
                }
            ]}]})


def dump_intermediate_scales(local_path, data):
    data = json.dumps(deepcopy(data), cls=NumpyEncoder)
    local_file = open(local_path, 'w')
    json.dump(data, local_file)