/*
 * Copyright (c) 2017-2022 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#ifndef ARM_COMPUTE_TEST_GEMMLOWP_FIXTURE
#define ARM_COMPUTE_TEST_GEMMLOWP_FIXTURE

#include "arm_compute/core/utils/quantization/AsymmHelpers.h"
#include "tests/framework/Fixture.h"
#include "tests/validation/Validation.h"
#include "tests/validation/reference/GEMMLowp.h"

namespace arm_compute
{
namespace test
{
namespace validation
{
namespace
{
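/** Fill a tensor (or accessor) with values appropriate to its data type.
 *
 * @param[in,out] tensor Tensor to fill.
 * @param[in]     i      Seed offset forwarded to the library fill, so different tensors get different data.
 */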
template <typename U>
void fill(U &&tensor, int i)
{
    switch(tensor.data_type())
    {
        case DataType::QSYMM8_PER_CHANNEL:
        {
            int min_bound = 128;
            int max_bound = -127;
            for(size_t j = 0; j < tensor.quantization_info().scale().size(); j++)
            {
                std::pair<int, int> bounds = get_symm_quantized_per_channel_bounds(tensor.quantization_info(), -1.0f, 1.0f, j);
                if(bounds.first < min_bound)
                {
                    min_bound = bounds.first;
                }
                if(bounds.second > max_bound)
                {
                    max_bound = bounds.second;
                }
            }
            std::uniform_int_distribution<int32_t> distribution(min_bound, max_bound);
            library->fill(tensor, distribution, i);
            break;
        }
        case DataType::QASYMM8:
        {
            std::uniform_int_distribution<uint32_t> distribution(1, 254);
            library->fill(tensor, distribution, i);
            break;
        }
        case DataType::S32:
        {
            std::uniform_int_distribution<int32_t> distribution(-20000, 20000);
            library->fill(tensor, distribution, i);
            break;
        }
        case DataType::F16:
        {
            arm_compute::utils::uniform_real_distribution_16bit<half> distribution{ -1.0f, 1.0f };
            library->fill(tensor, distribution, i);
            break;
        }
        case DataType::F32:
        {
            std::uniform_real_distribution<float> distribution(-1.0f, 1.0f);
            library->fill(tensor, distribution, i);
            break;
        }
        default:
            library->fill_tensor_uniform(tensor, i);
    }
}

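/** Configure, allocate, fill and run the GEMMLowp function under test and return its output tensor.
 *
 * The output data type is S32 unless an output stage other than NONE is requested, in which case it matches
 * the data type of input A. When @p run_twice is true the function is run once, the inputs are re-filled with
 * new seeds, and it is run again so that variable inputs are exercised.
 */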
template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d, bool reinterpret_output_as_3d, typename OutputType, bool is_fused = false, bool run_twice = false>
TensorType compute_gemmlowp_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, int32_t a_offset, int32_t b_offset,
                                   GEMMLowpOutputStageInfo output_stage = GEMMLowpOutputStageInfo(), DataType data_type_a = DataType::QASYMM8, DataType data_type_b = DataType::QASYMM8,
                                   QuantizationInfo b_qinfo = QuantizationInfo(), bool reshape_b_only_on_first_run = false)
{
    // Create tensors
    DataType data_type_output = output_stage.type == GEMMLowpOutputStageType::NONE ? DataType::S32 : data_type_a;

    TensorType a      = create_tensor<TensorType>(shape_a, data_type_a, 1);
    TensorType b      = create_tensor<TensorType>(shape_b, data_type_b, 1); // The GEMM output before the output stage mismatches if data_type_output is passed here; to be investigated
    TensorType output = create_tensor<TensorType>(shape_output, data_type_output, 1);

    a.info()->set_quantization_info(QuantizationInfo(1.0f / 255, a_offset));

    if(data_type_b == DataType::QSYMM8_PER_CHANNEL)
    {
        b.info()->set_quantization_info(b_qinfo);
    }
    else
    {
        b.info()->set_quantization_info(QuantizationInfo(1.0f / 255, b_offset));
    }
    TensorType bias;
    if(is_fused)
    {
        TensorShape bias_shape(shape_b[0]);
        bias = create_tensor<TensorType>(bias_shape, DataType::S32, 1);
    }

    // Create and configure function
    // The GEMMInfo includes the depth values used when the input/output is reinterpreted as 3D
    FunctionType gemmlowp;
    gemmlowp.configure(&a, &b, is_fused ? &bias : nullptr, &output, GEMMInfo(false, false, reshape_b_only_on_first_run, (reinterpret_output_as_3d ? shape_output[2] : 0), reinterpret_input_as_3d, false,
                                                                             output_stage));

    ARM_COMPUTE_ASSERT(a.info()->is_resizable());
    ARM_COMPUTE_ASSERT(b.info()->is_resizable());
    ARM_COMPUTE_ASSERT(output.info()->is_resizable());

    add_padding_x({ &a, &b, &output });

    // Allocate tensors
    a.allocator()->allocate();
    b.allocator()->allocate();
    output.allocator()->allocate();

    ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
    ARM_COMPUTE_ASSERT(!b.info()->is_resizable());
    ARM_COMPUTE_ASSERT(!output.info()->is_resizable());

    // Fill tensors
    fill(AccessorType(a), 0);
    fill(AccessorType(b), 1);

    if(is_fused)
    {
        ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
        bias.allocator()->allocate();
        ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
        fill(AccessorType(bias), 2);
    }

    // Run with variable inputs.
    if(run_twice)
    {
        gemmlowp.run();
        fill(AccessorType(a), 3); // Fill tensors with new seed after run
        fill(AccessorType(b), 4);
        if(is_fused)
        {
            fill(AccessorType(bias), 5);
        }
    }

    // Compute GEMM function
    gemmlowp.run();
    return output;
}

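/** Compute the reference result with reference::gemmlowp_matrix_multiply_core.
 *
 * The same fill seeds as compute_gemmlowp_target are used so that target and reference operate on identical data.
 * When @p pretranspose_A / @p pretranspose_B are set, the inputs are transposed back to the layout expected by the
 * reference implementation (see the note inside the function).
 */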
template <bool reinterpret_input_as_3d, typename TI = uint8_t, typename TW = uint8_t, bool pretranspose_A = false, bool pretranspose_B = false, bool run_twice = false>
SimpleTensor<int32_t> compute_gemmlowp_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, int32_t a_offset, int32_t b_offset,
                                                 DataType data_type_a = DataType::QASYMM8, DataType data_type_b = DataType::QASYMM8, QuantizationInfo b_qinfo = QuantizationInfo())
{
    TensorShape shape_a_to_use = shape_a;
    if(reinterpret_input_as_3d)
    {
        // Collapse the second and third dimension if the input is 3D
        shape_a_to_use.collapse(2U, 1U);
    }

    // Create reference
    SimpleTensor<TI> a{ shape_a_to_use, data_type_a, 1 };
    SimpleTensor<TW> b{ shape_b, data_type_b, 1, data_type_b == DataType::QSYMM8_PER_CHANNEL ? b_qinfo : QuantizationInfo(1.0f / 255, b_offset) };

    TensorShape shape_a_to_use_transposed{ shape_a_to_use };
    TensorShape shape_b_transposed{ shape_b };

    shape_a_to_use_transposed.set(0, shape_a_to_use[1]);
    shape_a_to_use_transposed.set(1, shape_a_to_use[0]);
    shape_b_transposed.set(0, shape_b[1]);
    shape_b_transposed.set(1, shape_b[0]);

    SimpleTensor<TI> a_transposed{ shape_a_to_use_transposed, data_type_a, 1 };
    SimpleTensor<TW> b_transposed{ shape_b_transposed, data_type_b, 1, data_type_b == DataType::QSYMM8_PER_CHANNEL ? b_qinfo : QuantizationInfo(1.0f / 255, b_offset) };

    // Fill reference
    fill(a, 0);
    fill(b, 1);

    // Transpose reference if required
    /* Note: Assuming the usual batch matmul dimensions A = (B x M x K), B = (B x K x N), if pretranspose_A is set to true, then A is assumed to be (B x K x M),
       so A must be pre-transposed before being passed to the fixture. The fixture then transposes A again to make it (B x M x K)
       so that the reference implementation, which works with (B x M x K) input, can be called.
       Similarly, if pretranspose_B is set to true, then B is assumed to be (B x N x K) and must be pre-transposed before being passed to the fixture. */
    if(pretranspose_A)
    {
        transpose_matrix<TI>(a, a_transposed);
    }

    if(pretranspose_B)
    {
        transpose_matrix<TW>(b, b_transposed);
    }

    // Run with variable inputs.
    if(run_twice)
    {
        reference::gemmlowp_matrix_multiply_core<int32_t, TI, TW>((pretranspose_A ? a_transposed : a), (pretranspose_B ? b_transposed : b), shape_output, a_offset, b_offset);
        fill((pretranspose_A) ? a_transposed : a, 3);
        fill((pretranspose_B) ? b_transposed : b, 4);
    }

    return reference::gemmlowp_matrix_multiply_core<int32_t, TI, TW>((pretranspose_A ? a_transposed : a), (pretranspose_B ? b_transposed : b), shape_output, a_offset, b_offset);
}
}

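/** Fixture that validates a GEMMLowp matrix multiply core function against the S32 reference implementation.
 *
 * Illustrative usage only (the concrete tensor, accessor, function and dataset types depend on the backend under test):
 *
 *     using NEGEMMLowpFixture = GEMMLowpMatrixMultiplyCoreValidationFixture<Tensor, Accessor, NEGEMMLowpMatrixMultiplyCore>;
 *     FIXTURE_DATA_TEST_CASE(RunSmall, NEGEMMLowpFixture, framework::DatasetMode::ALL, datasets::SmallGEMMLowpDataset())
 *     {
 *         validate(Accessor(_target), _reference);
 *     }
 */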
template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, bool run_twice = false>
class GEMMLowpMatrixMultiplyCoreValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, int32_t a_offset, int32_t b_offset)
    {
        _target    = compute_target(shape_a, shape_b, shape_output, a_offset, b_offset);
        _reference = compute_reference(shape_a, shape_b, shape_output, a_offset, b_offset);
    }

protected:
    TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, int32_t a_offset, int32_t b_offset)
    {
        return compute_gemmlowp_target<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, int32_t, false, run_twice>(shape_a, shape_b, shape_output, a_offset,
                b_offset);
    }

    SimpleTensor<int32_t> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, int32_t a_offset, int32_t b_offset)
    {
        return compute_gemmlowp_reference<reinterpret_input_as_3d, uint8_t, uint8_t, false, false, run_twice>(shape_a, shape_b, shape_output, a_offset, b_offset);
    }

    TensorType            _target{};
    SimpleTensor<int32_t> _reference{};
};

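/** Fixture with a fused output stage: the output stage type must not be NONE. For QSYMM8_PER_CHANNEL weights,
 *  random per-channel scales are generated and converted to quantized multipliers/shifts before running.
 */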
template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, typename TI = uint8_t, typename TW = uint8_t, bool run_twice = false>
class GEMMLowpMatrixMultiplyCoreFusedOffsetOutputGenericValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, int32_t a_offset, int32_t b_offset, GEMMLowpOutputStageInfo output_stage, DataType data_type_b,
               bool reshape_b_only_on_first_run)
    {
        ARM_COMPUTE_ASSERT(output_stage.type != GEMMLowpOutputStageType::NONE);
        DataType data_type_a = data_type_b == DataType::QASYMM8_SIGNED ? DataType::QASYMM8_SIGNED : DataType::QASYMM8;

        if(data_type_b == DataType::QSYMM8_PER_CHANNEL)
        {
            output_stage.is_quantized_per_channel              = true;
            const size_t                          num_channels = shape_b[0];
            std::vector<float>                    scales(num_channels);
            std::uniform_real_distribution<float> distribution(0.f, 1.f);
            library->fill(scales, distribution, 0);
            output_stage.gemmlowp_multipliers.resize(num_channels);
            output_stage.gemmlowp_shifts.resize(num_channels);
            for(size_t i = 0; i < num_channels; ++i)
            {
                quantization::calculate_quantized_multiplier(scales[i], &output_stage.gemmlowp_multipliers[i], &output_stage.gemmlowp_shifts[i]);
            }

            _reference = compute_reference(shape_a, shape_b, shape_output, a_offset, 0, output_stage, data_type_a, data_type_b, QuantizationInfo(scales));
            _target    = compute_target(shape_a, shape_b, shape_output, a_offset, 0, output_stage, data_type_a, data_type_b, QuantizationInfo(scales), reshape_b_only_on_first_run);
        }
        else
        {
            _reference = compute_reference(shape_a, shape_b, shape_output, a_offset, b_offset, output_stage, data_type_a, data_type_b, QuantizationInfo());
            _target    = compute_target(shape_a, shape_b, shape_output, a_offset, b_offset, output_stage, data_type_a, data_type_b, QuantizationInfo(), reshape_b_only_on_first_run);
        }
    }

protected:
    TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, int32_t a_offset, int32_t b_offset, GEMMLowpOutputStageInfo output_stage,
                              DataType data_type_a, DataType data_type_b, QuantizationInfo b_qinfo, bool reshape_b_only_on_first_run = false)
    {
        return compute_gemmlowp_target<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, qasymm8_t, true, run_twice>(shape_a, shape_b, shape_output, a_offset,
                b_offset,
                output_stage, data_type_a, data_type_b, b_qinfo, reshape_b_only_on_first_run);
    }

    SimpleTensor<TI> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, int32_t a_offset, int32_t b_offset,
                                       GEMMLowpOutputStageInfo output_stage, DataType data_type_a, DataType data_type_b, QuantizationInfo b_qinfo)
    {
        SimpleTensor<int32_t> output = compute_gemmlowp_reference<reinterpret_input_as_3d, TI, TW, false, false, run_twice>(shape_a, shape_b, shape_output, a_offset, b_offset, data_type_a, data_type_b,
                                                                                                                            b_qinfo);

        TensorShape           bias_shape(shape_b[0]);
        SimpleTensor<int32_t> bias{ bias_shape, DataType::S32, 1 };
        (run_twice) ? fill(bias, 5) : fill(bias, 2); // Fill bias with same seed as last run of gemmlowp_target

        switch(output_stage.type)
        {
            case GEMMLowpOutputStageType::QUANTIZE_DOWN:
                return reference::gemmlowp_quantize_down_scale<int32_t, TW>(output, bias,
                                                                            output_stage.gemmlowp_offset, output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);
                break;
            case GEMMLowpOutputStageType::QUANTIZE_DOWN_FIXEDPOINT:
                return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, TW>(output, bias,
                                                                                          output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_offset, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);
                break;
            default:
                ARM_COMPUTE_ERROR("Not Supported!");
        }
    }

    TensorType       _target{};
    SimpleTensor<TI> _reference{};
};

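/** Convenience wrapper around the generic fused-offset-output fixture that always passes
 *  reshape_b_only_on_first_run = false.
 */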
template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, typename TI = uint8_t, typename TW = uint8_t>
class GEMMLowpMatrixMultiplyCoreFusedOffsetOutputValidationFixture : public
    GEMMLowpMatrixMultiplyCoreFusedOffsetOutputGenericValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW>
{
public:
    template <typename...>
    void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, int32_t a_offset, int32_t b_offset, GEMMLowpOutputStageInfo output_stage, DataType data_type_b)
    {
        GEMMLowpMatrixMultiplyCoreFusedOffsetOutputGenericValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW>::setup(shape_a, shape_b,
                shape_output, a_offset, b_offset, output_stage, data_type_b, false);
    }
};

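/** Validates the QUANTIZE_DOWN output stage (integer multiplier and shift) producing QASYMM8 output. */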
template <typename TensorType, typename AccessorType, typename FunctionType>
class GEMMLowpQuantizeDownInt32ToUint8ScaleValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
    {
        _target    = compute_target(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);
        _reference = compute_reference(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_int_distribution<> distribution(-6000, 6000);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
    {
        TensorShape shape_bias(shape[0]);

        // Create tensors
        TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);
        TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);
        TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8, 1);

        // Create and configure function
        FunctionType            output_stage;
        GEMMLowpOutputStageInfo output_stage_info = GEMMLowpOutputStageInfo();
        output_stage_info.type                    = GEMMLowpOutputStageType::QUANTIZE_DOWN;
        output_stage_info.gemmlowp_offset         = result_offset;
        output_stage_info.gemmlowp_multiplier     = result_mult_int;
        output_stage_info.gemmlowp_shift          = result_shift;
        output_stage_info.gemmlowp_min_bound      = min;
        output_stage_info.gemmlowp_max_bound      = max;
        output_stage_info.output_data_type        = DataType::QASYMM8;
        output_stage.configure(&a, add_bias ? &b : nullptr, &c, output_stage_info);

        ARM_COMPUTE_ASSERT(a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(c.info()->is_resizable());

        // Allocate tensors
        a.allocator()->allocate();
        c.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

        // Fill tensor
        fill(AccessorType(a), 0);

        if(add_bias)
        {
            ARM_COMPUTE_ASSERT(b.info()->is_resizable());

            // Allocate bias tensor
            b.allocator()->allocate();

            ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

            // Fill tensor
            fill(AccessorType(b), 1);
        }

        // Compute GEMM function
        output_stage.run();
        return c;
    }

    SimpleTensor<uint8_t> compute_reference(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
    {
        // Create reference
        TensorShape shape_bias(shape[0]);

        SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };
        SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

        // Fill reference
        fill(a, 0);

        const std::vector<int32_t> result_mult_int_vec = { result_mult_int };
        const std::vector<int32_t> result_shift_vec    = { result_shift };

        if(add_bias)
        {
            // Fill bias
            fill(b, 1);

            return reference::gemmlowp_quantize_down_scale<int32_t, uint8_t>(a, b, result_offset, result_mult_int_vec, result_shift_vec, min, max);
        }
        else
        {
            return reference::gemmlowp_quantize_down_scale<int32_t, uint8_t>(a, result_offset, result_mult_int_vec, result_shift_vec, min, max);
        }
    }

    TensorType            _target{};
    SimpleTensor<uint8_t> _reference{};
};

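/** Validates the QUANTIZE_DOWN output stage (integer multiplier and shift) producing QASYMM8_SIGNED output. */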
template <typename TensorType, typename AccessorType, typename FunctionType>
class GEMMLowpQuantizeDownInt32ToInt8ScaleValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
    {
        _target    = compute_target(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);
        _reference = compute_reference(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_int_distribution<> distribution(-6000, 6000);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
    {
        TensorShape shape_bias(shape[0]);

        // Create tensors
        TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);
        TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);
        TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8_SIGNED, 1);

        // Create and configure function
        FunctionType            output_stage;
        GEMMLowpOutputStageInfo output_stage_info = GEMMLowpOutputStageInfo();
        output_stage_info.type                    = GEMMLowpOutputStageType::QUANTIZE_DOWN;
        output_stage_info.gemmlowp_offset         = result_offset;
        output_stage_info.gemmlowp_multiplier     = result_mult_int;
        output_stage_info.gemmlowp_shift          = result_shift;
        output_stage_info.gemmlowp_min_bound      = min;
        output_stage_info.gemmlowp_max_bound      = max;
        output_stage_info.output_data_type        = DataType::QASYMM8_SIGNED;
        output_stage.configure(&a, add_bias ? &b : nullptr, &c, output_stage_info);

        ARM_COMPUTE_ASSERT(a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(c.info()->is_resizable());

        // Allocate tensors
        a.allocator()->allocate();
        c.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

        // Fill tensor
        fill(AccessorType(a), 0);

        if(add_bias)
        {
            ARM_COMPUTE_ASSERT(b.info()->is_resizable());

            // Allocate bias tensor
            b.allocator()->allocate();

            ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

            // Fill tensor
            fill(AccessorType(b), 1);
        }

        // Compute GEMM function
        output_stage.run();
        return c;
    }

    SimpleTensor<int8_t> compute_reference(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
    {
        // Create reference
        TensorShape shape_bias(shape[0]);

        SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };
        SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

        // Fill reference
        fill(a, 0);

        const std::vector<int32_t> result_mult_int_vec = { result_mult_int };
        const std::vector<int32_t> result_shift_vec    = { result_shift };

        if(add_bias)
        {
            // Fill bias
            fill(b, 1);

            return reference::gemmlowp_quantize_down_scale<int32_t, int8_t>(a, b, result_offset, result_mult_int_vec, result_shift_vec, min, max);
        }
        else
        {
            return reference::gemmlowp_quantize_down_scale<int32_t, int8_t>(a, result_offset, result_mult_int_vec, result_shift_vec, min, max);
        }
    }

    TensorType           _target{};
    SimpleTensor<int8_t> _reference{};
};

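/** Validates the fixed-point requantization output stage producing QASYMM8_SIGNED output. */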
template <typename TensorType, typename AccessorType, typename FunctionType>
class GEMMLowpQuantizeDownInt32ToInt8ScaleByFixedPointValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)
    {
        _target    = compute_target(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);
        _reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_int_distribution<> distribution(-6000, 6000);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)
    {
        TensorShape shape_bias(shape[0]);

        // Create tensors
        TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);
        TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);
        TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8_SIGNED, 1);

        // Create and configure function
        FunctionType output_stage;
        output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max);

        ARM_COMPUTE_ASSERT(a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(c.info()->is_resizable());

        // Allocate tensors
        a.allocator()->allocate();
        c.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

        // Fill tensor
        fill(AccessorType(a), 0);

        if(add_bias)
        {
            ARM_COMPUTE_ASSERT(b.info()->is_resizable());

            // Allocate bias tensor
            b.allocator()->allocate();

            ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

            // Fill tensor
            fill(AccessorType(b), 1);
        }

        // Compute GEMM function
        output_stage.run();
        return c;
    }

    SimpleTensor<int8_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max,
                                           bool add_bias)
    {
        // Create reference
        TensorShape shape_bias(shape[0]);

        SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };
        SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

        // Fill reference
        fill(a, 0);

        const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };
        const std::vector<int32_t> result_shift_vec                  = { result_shift };

        if(add_bias)
        {
            // Fill bias
            fill(b, 1);

            return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int8_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);
        }
        else
        {
            return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int8_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);
        }
    }

    TensorType           _target{};
    SimpleTensor<int8_t> _reference{};
};

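/** Validates the fixed-point requantization output stage producing QASYMM8 output. */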
template <typename TensorType, typename AccessorType, typename FunctionType>
class GEMMLowpQuantizeDownInt32ToUint8ScaleByFixedPointValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)
    {
        _target    = compute_target(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);
        _reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_int_distribution<> distribution(-6000, 6000);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)
    {
        TensorShape shape_bias(shape[0]);

        // Create tensors
        TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);
        TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);
        TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8, 1);

        // Create and configure function
        FunctionType output_stage;
        output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max);

        ARM_COMPUTE_ASSERT(a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(c.info()->is_resizable());

        // Allocate tensors
        a.allocator()->allocate();
        c.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

        // Fill tensor
        fill(AccessorType(a), 0);

        if(add_bias)
        {
            ARM_COMPUTE_ASSERT(b.info()->is_resizable());

            // Allocate bias tensor
            b.allocator()->allocate();

            ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

            // Fill tensor
            fill(AccessorType(b), 1);
        }

        // Compute GEMM function
        output_stage.run();
        return c;
    }

    SimpleTensor<uint8_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max,
                                            bool add_bias)
    {
        // Create reference
        TensorShape shape_bias(shape[0]);

        SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };
        SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

        // Fill reference
        fill(a, 0);

        const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };
        const std::vector<int32_t> result_shift_vec                  = { result_shift };

        if(add_bias)
        {
            // Fill bias
            fill(b, 1);

            return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, uint8_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);
        }
        else
        {
            return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, uint8_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);
        }
    }

    TensorType            _target{};
    SimpleTensor<uint8_t> _reference{};
};

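/** Validates the QUANTIZE_DOWN_FLOAT output stage, which requantizes with a real (floating-point) multiplier;
 *  the output data type is supplied at setup time.
 */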
template <typename TensorType, typename AccessorType, typename FunctionType, typename T>
class GEMMLowpQuantizeDownInt32ScaleByFloatValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(DataType data_type, TensorShape shape, float result_real_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)
    {
        _target    = compute_target(data_type, shape, result_real_multiplier, result_offset, min, max, add_bias);
        _reference = compute_reference(shape, result_real_multiplier, result_offset, min, max, add_bias);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        // To avoid all data being clamped
753*c217d954SCole Faust         std::uniform_int_distribution<> distribution(-500, 500);
754*c217d954SCole Faust         library->fill(tensor, distribution, i);
755*c217d954SCole Faust     }
756*c217d954SCole Faust 
compute_target(DataType data_type,const TensorShape & shape,float result_multiplier,int32_t result_offset,int32_t min,int32_t max,bool add_bias)757*c217d954SCole Faust     TensorType compute_target(DataType data_type, const TensorShape &shape, float result_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)
758*c217d954SCole Faust     {
759*c217d954SCole Faust         TensorShape shape_bias(shape[0]);
760*c217d954SCole Faust 
761*c217d954SCole Faust         // Create tensors
762*c217d954SCole Faust         TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);
763*c217d954SCole Faust         TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);
764*c217d954SCole Faust         TensorType c = create_tensor<TensorType>(shape, data_type, 1);
765*c217d954SCole Faust 
766*c217d954SCole Faust         // create output stage info
767*c217d954SCole Faust         GEMMLowpOutputStageInfo info;
768*c217d954SCole Faust         info.gemmlowp_max_bound       = max;
769*c217d954SCole Faust         info.gemmlowp_min_bound       = min;
770*c217d954SCole Faust         info.gemmlowp_real_multiplier = result_multiplier;
771*c217d954SCole Faust         info.gemmlowp_offset          = result_offset;
772*c217d954SCole Faust         info.type                     = GEMMLowpOutputStageType::QUANTIZE_DOWN_FLOAT;
773*c217d954SCole Faust         info.output_data_type         = data_type;
774*c217d954SCole Faust 
775*c217d954SCole Faust         // Create and configure function
776*c217d954SCole Faust         FunctionType output_stage;
777*c217d954SCole Faust         output_stage.configure(&a, add_bias ? &b : nullptr, &c, info);
778*c217d954SCole Faust 
779*c217d954SCole Faust         ARM_COMPUTE_ASSERT(a.info()->is_resizable());
780*c217d954SCole Faust         ARM_COMPUTE_ASSERT(c.info()->is_resizable());
781*c217d954SCole Faust 
782*c217d954SCole Faust         // Allocate tensors
783*c217d954SCole Faust         a.allocator()->allocate();
784*c217d954SCole Faust         c.allocator()->allocate();
785*c217d954SCole Faust 
786*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
787*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!c.info()->is_resizable());
788*c217d954SCole Faust 
789*c217d954SCole Faust         // Fill tensor
790*c217d954SCole Faust         fill(AccessorType(a), 0);
791*c217d954SCole Faust 
792*c217d954SCole Faust         if(add_bias)
793*c217d954SCole Faust         {
794*c217d954SCole Faust             ARM_COMPUTE_ASSERT(b.info()->is_resizable());
795*c217d954SCole Faust 
796*c217d954SCole Faust             // Allocate bias tensor
797*c217d954SCole Faust             b.allocator()->allocate();
798*c217d954SCole Faust 
799*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!b.info()->is_resizable());
800*c217d954SCole Faust 
801*c217d954SCole Faust             // Fill tensor
802*c217d954SCole Faust             fill(AccessorType(b), 1);
803*c217d954SCole Faust         }
804*c217d954SCole Faust 
805*c217d954SCole Faust         // Compute GEMM function
806*c217d954SCole Faust         output_stage.run();
807*c217d954SCole Faust         return c;
808*c217d954SCole Faust     }
809*c217d954SCole Faust 
810*c217d954SCole Faust     SimpleTensor<T> compute_reference(const TensorShape &shape, float_t result_real_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)
811*c217d954SCole Faust     {
812*c217d954SCole Faust         // Create reference
813*c217d954SCole Faust         TensorShape shape_bias(shape[0]);
814*c217d954SCole Faust 
815*c217d954SCole Faust         SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };
816*c217d954SCole Faust         SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };
817*c217d954SCole Faust 
818*c217d954SCole Faust         // Fill reference
819*c217d954SCole Faust         fill(a, 0);
820*c217d954SCole Faust 
821*c217d954SCole Faust         const std::vector<float_t> result_float_multiplier_vec = { result_real_multiplier };
822*c217d954SCole Faust 
823*c217d954SCole Faust         if(add_bias)
824*c217d954SCole Faust         {
825*c217d954SCole Faust             // Fill bias
826*c217d954SCole Faust             fill(b, 1);
827*c217d954SCole Faust 
828*c217d954SCole Faust             return reference::gemmlowp_quantize_down_scale_by_float<int32_t, T>(a, b, result_float_multiplier_vec, result_offset, min, max);
829*c217d954SCole Faust         }
830*c217d954SCole Faust         else
831*c217d954SCole Faust         {
832*c217d954SCole Faust             return reference::gemmlowp_quantize_down_scale_by_float<int32_t, T>(a, result_float_multiplier_vec, result_offset, min, max);
833*c217d954SCole Faust         }
834*c217d954SCole Faust     }
835*c217d954SCole Faust 
836*c217d954SCole Faust     TensorType      _target{};
837*c217d954SCole Faust     SimpleTensor<T> _reference{};
838*c217d954SCole Faust };
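
// A minimal sketch of the per-element computation that the QUANTIZE_DOWN_FLOAT output stage tested
// above performs, assuming the usual convention of (accumulator + bias) * real_multiplier + offset,
// clamped to [min, max]. This helper is illustrative only (it is not used by the fixtures), its name
// is made up for this example, and the exact rounding mode of the backends may differ.
inline int32_t example_quantize_down_float_sketch(int32_t acc, int32_t bias, float result_multiplier, int32_t result_offset, int32_t min, int32_t max)
{
    // Add the bias (pass 0 when add_bias is false), scale by the real multiplier and add the offset
    const float scaled = static_cast<float>(acc + bias) * result_multiplier;
    int32_t     out    = static_cast<int32_t>(scaled >= 0.f ? scaled + 0.5f : scaled - 0.5f) + result_offset;
    // Clamp to the requested output range before the cast to the narrow output data type
    out = out < min ? min : out;
    out = out > max ? max : out;
    return out;
}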
839*c217d954SCole Faust 
840*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename FunctionType>
841*c217d954SCole Faust class GEMMLowpQuantizeDownInt32ToInt16ScaleByFixedPointValidationFixture : public framework::Fixture
842*c217d954SCole Faust {
843*c217d954SCole Faust public:
844*c217d954SCole Faust     template <typename...>
845*c217d954SCole Faust     void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
846*c217d954SCole Faust     {
847*c217d954SCole Faust         _target    = compute_target(shape, result_fixedpoint_multiplier, result_shift, min, max, add_bias);
848*c217d954SCole Faust         _reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, min, max, add_bias);
849*c217d954SCole Faust     }
850*c217d954SCole Faust 
851*c217d954SCole Faust protected:
852*c217d954SCole Faust     template <typename U>
853*c217d954SCole Faust     void fill(U &&tensor, int i)
854*c217d954SCole Faust     {
855*c217d954SCole Faust         std::uniform_int_distribution<> distribution(-6000, 6000);
856*c217d954SCole Faust         library->fill(tensor, distribution, i);
857*c217d954SCole Faust     }
858*c217d954SCole Faust 
859*c217d954SCole Faust     TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t min, int32_t max, bool add_bias)
860*c217d954SCole Faust     {
861*c217d954SCole Faust         TensorShape shape_bias(shape[0]);
862*c217d954SCole Faust 
863*c217d954SCole Faust         // Create tensors
864*c217d954SCole Faust         TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);
865*c217d954SCole Faust         TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);
866*c217d954SCole Faust         TensorType c = create_tensor<TensorType>(shape, DataType::QSYMM16, 1);
867*c217d954SCole Faust 
868*c217d954SCole Faust         // Create and configure function
869*c217d954SCole Faust         FunctionType output_stage;
870*c217d954SCole Faust         output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, min, max);
871*c217d954SCole Faust 
872*c217d954SCole Faust         ARM_COMPUTE_ASSERT(a.info()->is_resizable());
873*c217d954SCole Faust         ARM_COMPUTE_ASSERT(c.info()->is_resizable());
874*c217d954SCole Faust 
875*c217d954SCole Faust         // Allocate tensors
876*c217d954SCole Faust         a.allocator()->allocate();
877*c217d954SCole Faust         c.allocator()->allocate();
878*c217d954SCole Faust 
879*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
880*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!c.info()->is_resizable());
881*c217d954SCole Faust 
882*c217d954SCole Faust         // Fill tensor
883*c217d954SCole Faust         fill(AccessorType(a), 0);
884*c217d954SCole Faust 
885*c217d954SCole Faust         if(add_bias)
886*c217d954SCole Faust         {
887*c217d954SCole Faust             ARM_COMPUTE_ASSERT(b.info()->is_resizable());
888*c217d954SCole Faust 
889*c217d954SCole Faust             // Allocate bias tensor
890*c217d954SCole Faust             b.allocator()->allocate();
891*c217d954SCole Faust 
892*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!b.info()->is_resizable());
893*c217d954SCole Faust 
894*c217d954SCole Faust             // Fill tensor
895*c217d954SCole Faust             fill(AccessorType(b), 1);
896*c217d954SCole Faust         }
897*c217d954SCole Faust 
898*c217d954SCole Faust         // Run the output stage
899*c217d954SCole Faust         output_stage.run();
900*c217d954SCole Faust         return c;
901*c217d954SCole Faust     }
902*c217d954SCole Faust 
903*c217d954SCole Faust     SimpleTensor<int16_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t min, int32_t max,
904*c217d954SCole Faust                                             bool add_bias)
905*c217d954SCole Faust     {
906*c217d954SCole Faust         // Create reference
907*c217d954SCole Faust         TensorShape shape_bias(shape[0]);
908*c217d954SCole Faust 
909*c217d954SCole Faust         SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };
910*c217d954SCole Faust         SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };
911*c217d954SCole Faust 
912*c217d954SCole Faust         // Fill reference
913*c217d954SCole Faust         fill(a, 0);
914*c217d954SCole Faust 
915*c217d954SCole Faust         const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };
916*c217d954SCole Faust         const std::vector<int32_t> result_shift_vec                  = { result_shift };
917*c217d954SCole Faust 
918*c217d954SCole Faust         if(add_bias)
919*c217d954SCole Faust         {
920*c217d954SCole Faust             // Fill bias
921*c217d954SCole Faust             fill(b, 1);
922*c217d954SCole Faust 
923*c217d954SCole Faust             return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int16_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, 0, min, max);
924*c217d954SCole Faust         }
925*c217d954SCole Faust         else
926*c217d954SCole Faust         {
927*c217d954SCole Faust             return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int16_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, 0, min, max);
928*c217d954SCole Faust         }
929*c217d954SCole Faust     }
930*c217d954SCole Faust 
931*c217d954SCole Faust     TensorType            _target{};
932*c217d954SCole Faust     SimpleTensor<int16_t> _reference{};
933*c217d954SCole Faust };
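
// A minimal sketch of the fixed-point requantization exercised by the QSYMM16 fixture above, assuming
// the usual GEMMLowp scheme: a saturating rounding doubling high multiply by result_fixedpoint_multiplier
// followed by a rounding arithmetic shift right by result_shift and a clamp to [min, max]. Illustrative
// only; the helper name is made up, the INT32_MIN saturation edge case is omitted, and the library
// kernels may differ in detail.
inline int32_t example_fixedpoint_requant_sketch(int32_t acc, int32_t multiplier, int32_t shift, int32_t min, int32_t max)
{
    // Keep the upper 32 bits of 2 * acc * multiplier, rounded to nearest
    const int64_t ab    = static_cast<int64_t>(acc) * static_cast<int64_t>(multiplier);
    const int64_t nudge = (ab >= 0) ? (static_cast<int64_t>(1) << 30) : (1 - (static_cast<int64_t>(1) << 30));
    int32_t       res   = static_cast<int32_t>((ab + nudge) / (static_cast<int64_t>(1) << 31));
    // Rounding arithmetic shift right by 'shift'
    if(shift > 0)
    {
        const int32_t mask      = (1 << shift) - 1;
        const int32_t remainder = res & mask;
        const int32_t threshold = (mask >> 1) + ((res < 0) ? 1 : 0);
        res                     = (res >> shift) + ((remainder > threshold) ? 1 : 0);
    }
    // Clamp before the final cast to int16_t done by the output stage
    res = res < min ? min : res;
    res = res > max ? max : res;
    return res;
}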
934*c217d954SCole Faust 
935*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>
936*c217d954SCole Faust class GEMMLowpMatrixMultiplyReshapedValidationFixture : public framework::Fixture
937*c217d954SCole Faust {
938*c217d954SCole Faust public:
939*c217d954SCole Faust     template <typename...>
940*c217d954SCole Faust     void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,
941*c217d954SCole Faust                bool interleave_rhs, DataType data_type)
942*c217d954SCole Faust     {
943*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
944*c217d954SCole Faust         lhs_info.m0         = m0;
945*c217d954SCole Faust         lhs_info.k0         = k0;
946*c217d954SCole Faust         lhs_info.v0         = v0;
947*c217d954SCole Faust         lhs_info.interleave = interleave_lhs;
948*c217d954SCole Faust         lhs_info.transpose  = false;
949*c217d954SCole Faust 
950*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
951*c217d954SCole Faust         rhs_info.n0         = n0;
952*c217d954SCole Faust         rhs_info.k0         = k0;
953*c217d954SCole Faust         rhs_info.h0         = h0;
954*c217d954SCole Faust         rhs_info.interleave = interleave_rhs;
955*c217d954SCole Faust         rhs_info.transpose  = true;
956*c217d954SCole Faust 
957*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
958*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
959*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
960*c217d954SCole Faust 
961*c217d954SCole Faust         _target    = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);
962*c217d954SCole Faust         _reference = compute_reference(lhs_shape, rhs_shape, data_type);
963*c217d954SCole Faust     }
964*c217d954SCole Faust 
965*c217d954SCole Faust protected:
966*c217d954SCole Faust     template <typename U>
967*c217d954SCole Faust     void fill(U &&tensor, int i)
968*c217d954SCole Faust     {
969*c217d954SCole Faust         switch(tensor.data_type())
970*c217d954SCole Faust         {
971*c217d954SCole Faust             case DataType::QASYMM8:
972*c217d954SCole Faust             {
973*c217d954SCole Faust                 // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
974*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(1, 254);
975*c217d954SCole Faust                 library->fill(tensor, distribution, i);
976*c217d954SCole Faust             }
977*c217d954SCole Faust             break;
978*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
979*c217d954SCole Faust             {
980*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(-127, 126);
981*c217d954SCole Faust                 library->fill(tensor, distribution, i);
982*c217d954SCole Faust             }
983*c217d954SCole Faust             break;
984*c217d954SCole Faust             default:
985*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
986*c217d954SCole Faust         }
987*c217d954SCole Faust     }
988*c217d954SCole Faust 
989*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, DataType data_type)
990*c217d954SCole Faust     {
991*c217d954SCole Faust         // Create tensors
992*c217d954SCole Faust         TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
993*c217d954SCole Faust         TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
994*c217d954SCole Faust         TensorType lhs_reshaped;
995*c217d954SCole Faust         TensorType rhs_reshaped;
996*c217d954SCole Faust         TensorType dst;
997*c217d954SCole Faust 
998*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
999*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
1000*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
1001*c217d954SCole Faust 
1002*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
1003*c217d954SCole Faust 
1004*c217d954SCole Faust         // Create and configure function
1005*c217d954SCole Faust         ReshapeLHSOperatorType reshape_lhs;
1006*c217d954SCole Faust         ReshapeRHSOperatorType reshape_rhs;
1007*c217d954SCole Faust         GEMMFunctionType       gemm;
1008*c217d954SCole Faust         reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);
1009*c217d954SCole Faust         reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1010*c217d954SCole Faust         gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K));
1011*c217d954SCole Faust 
1012*c217d954SCole Faust         ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1013*c217d954SCole Faust         ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1014*c217d954SCole Faust 
1015*c217d954SCole Faust         add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &dst });
1016*c217d954SCole Faust 
1017*c217d954SCole Faust         // Allocate tensors
1018*c217d954SCole Faust         lhs.allocator()->allocate();
1019*c217d954SCole Faust         rhs.allocator()->allocate();
1020*c217d954SCole Faust         lhs_reshaped.allocator()->allocate();
1021*c217d954SCole Faust         rhs_reshaped.allocator()->allocate();
1022*c217d954SCole Faust         dst.allocator()->allocate();
1023*c217d954SCole Faust 
1024*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1025*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1026*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());
1027*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1028*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1029*c217d954SCole Faust 
1030*c217d954SCole Faust         // Fill tensors
1031*c217d954SCole Faust         fill(AccessorType(lhs), 0);
1032*c217d954SCole Faust         fill(AccessorType(rhs), 1);
1033*c217d954SCole Faust 
1034*c217d954SCole Faust         // Compute GEMM
1035*c217d954SCole Faust         ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };
1036*c217d954SCole Faust         reshape_lhs.run(reshape_lhs_pack);
1037*c217d954SCole Faust         ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1038*c217d954SCole Faust         reshape_rhs.run(reshape_rhs_pack);
1039*c217d954SCole Faust         ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });
1040*c217d954SCole Faust         gemm.run(gemm_pack);
1041*c217d954SCole Faust 
1042*c217d954SCole Faust         return dst;
1043*c217d954SCole Faust     }
1044*c217d954SCole Faust 
1045*c217d954SCole Faust     SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)
1046*c217d954SCole Faust     {
1047*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
1048*c217d954SCole Faust         dst_shape[0]          = rhs_shape[0];
1049*c217d954SCole Faust         dst_shape[1]          = lhs_shape[1];
1050*c217d954SCole Faust 
1051*c217d954SCole Faust         switch(data_type)
1052*c217d954SCole Faust         {
1053*c217d954SCole Faust             case DataType::QASYMM8:
1054*c217d954SCole Faust             {
1055*c217d954SCole Faust                 // Create reference
1056*c217d954SCole Faust                 SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };
1057*c217d954SCole Faust                 SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };
1058*c217d954SCole Faust 
1059*c217d954SCole Faust                 // Fill reference
1060*c217d954SCole Faust                 fill(lhs, 0);
1061*c217d954SCole Faust                 fill(rhs, 1);
1062*c217d954SCole Faust 
1063*c217d954SCole Faust                 return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);
1064*c217d954SCole Faust             }
1065*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
1066*c217d954SCole Faust             {
1067*c217d954SCole Faust                 // Create reference
1068*c217d954SCole Faust                 SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };
1069*c217d954SCole Faust                 SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };
1070*c217d954SCole Faust 
1071*c217d954SCole Faust                 // Fill reference
1072*c217d954SCole Faust                 fill(lhs, 0);
1073*c217d954SCole Faust                 fill(rhs, 1);
1074*c217d954SCole Faust 
1075*c217d954SCole Faust                 return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);
1076*c217d954SCole Faust             }
1077*c217d954SCole Faust             default:
1078*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
1079*c217d954SCole Faust         }
1080*c217d954SCole Faust     }
1081*c217d954SCole Faust 
1082*c217d954SCole Faust     TensorType            _target{};
1083*c217d954SCole Faust     SimpleTensor<int32_t> _reference{};
1084*c217d954SCole Faust };
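
// The reshaped GEMMLowp fixtures above build their inputs with the innermost dimension first:
// for an M x N x K multiplication, lhs_shape = (K, M, batches) and rhs_shape = (N, K, batches),
// and the reference output therefore has shape (N, M, batches). A minimal sketch that restates
// this convention; the helper is illustrative only and is not used by the fixtures.
inline TensorShape example_gemmlowp_dst_shape_sketch(const TensorShape &lhs_shape, const TensorShape &rhs_shape)
{
    TensorShape dst_shape = lhs_shape;
    dst_shape[0]          = rhs_shape[0]; // N columns come from the RHS
    dst_shape[1]          = lhs_shape[1]; // M rows come from the LHS
    return dst_shape;                     // remaining dimensions (batches) follow the LHS
}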
1085*c217d954SCole Faust 
1086*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>
1087*c217d954SCole Faust class GEMMLowpMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture
1088*c217d954SCole Faust {
1089*c217d954SCole Faust public:
1090*c217d954SCole Faust     template <typename...>
1091*c217d954SCole Faust     void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,
1092*c217d954SCole Faust                bool interleave_lhs, bool interleave_rhs, DataType data_type)
1093*c217d954SCole Faust     {
1094*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
1095*c217d954SCole Faust         lhs_info.m0         = m0;
1096*c217d954SCole Faust         lhs_info.k0         = k0;
1097*c217d954SCole Faust         lhs_info.v0         = v0;
1098*c217d954SCole Faust         lhs_info.interleave = interleave_lhs;
1099*c217d954SCole Faust         lhs_info.transpose  = false;
1100*c217d954SCole Faust 
1101*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
1102*c217d954SCole Faust         rhs_info.n0         = n0;
1103*c217d954SCole Faust         rhs_info.k0         = k0;
1104*c217d954SCole Faust         rhs_info.h0         = h0;
1105*c217d954SCole Faust         rhs_info.interleave = interleave_rhs;
1106*c217d954SCole Faust         rhs_info.transpose  = true;
1107*c217d954SCole Faust 
1108*c217d954SCole Faust         // In the GEMM3D case, m is the product of m_w and m_h
1109*c217d954SCole Faust         const unsigned int m = m_w * m_h;
1110*c217d954SCole Faust 
1111*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
1112*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
1113*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
1114*c217d954SCole Faust 
1115*c217d954SCole Faust         _target    = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h, data_type);
1116*c217d954SCole Faust         _reference = compute_reference(lhs_shape, rhs_shape, m_h, data_type);
1117*c217d954SCole Faust     }
1118*c217d954SCole Faust 
1119*c217d954SCole Faust protected:
1120*c217d954SCole Faust     template <typename U>
1121*c217d954SCole Faust     void fill(U &&tensor, int i)
1122*c217d954SCole Faust     {
1123*c217d954SCole Faust         switch(tensor.data_type())
1124*c217d954SCole Faust         {
1125*c217d954SCole Faust             case DataType::QASYMM8:
1126*c217d954SCole Faust             {
1127*c217d954SCole Faust                 // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
1128*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(1, 254);
1129*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1130*c217d954SCole Faust             }
1131*c217d954SCole Faust             break;
1132*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
1133*c217d954SCole Faust             {
1134*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(-127, 126);
1135*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1136*c217d954SCole Faust             }
1137*c217d954SCole Faust             break;
1138*c217d954SCole Faust             default:
1139*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
1140*c217d954SCole Faust         }
1141*c217d954SCole Faust     }
1142*c217d954SCole Faust 
1143*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h,
1144*c217d954SCole Faust                               DataType data_type)
1145*c217d954SCole Faust     {
1146*c217d954SCole Faust         // Create tensors
1147*c217d954SCole Faust         TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1148*c217d954SCole Faust         TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1149*c217d954SCole Faust         TensorType lhs_reshaped;
1150*c217d954SCole Faust         TensorType rhs_reshaped;
1151*c217d954SCole Faust         TensorType dst;
1152*c217d954SCole Faust 
1153*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
1154*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
1155*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
1156*c217d954SCole Faust 
1157*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
1158*c217d954SCole Faust 
1159*c217d954SCole Faust         // Create and configure function
1160*c217d954SCole Faust         ReshapeLHSOperatorType reshape_lhs;
1161*c217d954SCole Faust         ReshapeRHSOperatorType reshape_rhs;
1162*c217d954SCole Faust         GEMMFunctionType       gemm;
1163*c217d954SCole Faust         reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);
1164*c217d954SCole Faust         reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1165*c217d954SCole Faust         gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K, 1, 1, m_h));
1166*c217d954SCole Faust 
1167*c217d954SCole Faust         ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1168*c217d954SCole Faust         ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1169*c217d954SCole Faust 
1170*c217d954SCole Faust         add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &dst });
1171*c217d954SCole Faust 
1172*c217d954SCole Faust         // Allocate tensors
1173*c217d954SCole Faust         lhs.allocator()->allocate();
1174*c217d954SCole Faust         rhs.allocator()->allocate();
1175*c217d954SCole Faust         lhs_reshaped.allocator()->allocate();
1176*c217d954SCole Faust         rhs_reshaped.allocator()->allocate();
1177*c217d954SCole Faust         dst.allocator()->allocate();
1178*c217d954SCole Faust 
1179*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1180*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1181*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());
1182*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1183*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1184*c217d954SCole Faust 
1185*c217d954SCole Faust         // Fill tensors
1186*c217d954SCole Faust         fill(AccessorType(lhs), 0);
1187*c217d954SCole Faust         fill(AccessorType(rhs), 1);
1188*c217d954SCole Faust 
1189*c217d954SCole Faust         // Compute GEMM
1190*c217d954SCole Faust         ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };
1191*c217d954SCole Faust         reshape_lhs.run(reshape_lhs_pack);
1192*c217d954SCole Faust         ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1193*c217d954SCole Faust         reshape_rhs.run(reshape_rhs_pack);
1194*c217d954SCole Faust         ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });
1195*c217d954SCole Faust         gemm.run(gemm_pack);
1196*c217d954SCole Faust 
1197*c217d954SCole Faust         return dst;
1198*c217d954SCole Faust     }
1199*c217d954SCole Faust 
1200*c217d954SCole Faust     SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h, DataType data_type)
1201*c217d954SCole Faust     {
1202*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
1203*c217d954SCole Faust         dst_shape.set(0, rhs_shape[0]);
1204*c217d954SCole Faust         dst_shape.set(1, lhs_shape[1] / m_h);
1205*c217d954SCole Faust         dst_shape.set(2, m_h);
1206*c217d954SCole Faust         dst_shape.set(3, lhs_shape[2]);
1207*c217d954SCole Faust 
1208*c217d954SCole Faust         switch(data_type)
1209*c217d954SCole Faust         {
1210*c217d954SCole Faust             case DataType::QASYMM8:
1211*c217d954SCole Faust             {
1212*c217d954SCole Faust                 // Create reference
1213*c217d954SCole Faust                 SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };
1214*c217d954SCole Faust                 SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };
1215*c217d954SCole Faust 
1216*c217d954SCole Faust                 // Fill reference
1217*c217d954SCole Faust                 fill(lhs, 0);
1218*c217d954SCole Faust                 fill(rhs, 1);
1219*c217d954SCole Faust 
1220*c217d954SCole Faust                 return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);
1221*c217d954SCole Faust             }
1222*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
1223*c217d954SCole Faust             {
1224*c217d954SCole Faust                 // Create reference
1225*c217d954SCole Faust                 SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };
1226*c217d954SCole Faust                 SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };
1227*c217d954SCole Faust 
1228*c217d954SCole Faust                 // Fill reference
1229*c217d954SCole Faust                 fill(lhs, 0);
1230*c217d954SCole Faust                 fill(rhs, 1);
1231*c217d954SCole Faust 
1232*c217d954SCole Faust                 return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);
1233*c217d954SCole Faust             }
1234*c217d954SCole Faust             default:
1235*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
1236*c217d954SCole Faust         }
1237*c217d954SCole Faust     }
1238*c217d954SCole Faust 
1239*c217d954SCole Faust     TensorType            _target{};
1240*c217d954SCole Faust     SimpleTensor<int32_t> _reference{};
1241*c217d954SCole Faust };
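
// In the GEMM3D variant above, the reference first computes a flat (N, m_w * m_h, batches) output and
// then reinterprets it in 3D, exactly as done in compute_reference(): dimension 1 is split into
// (m_w, m_h) and the batch dimension moves to index 3. A minimal sketch of that reshaping logic
// (illustrative only; the helper name is made up and it is not used by the fixtures):
inline TensorShape example_gemm3d_dst_shape_sketch(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h)
{
    TensorShape dst_shape = lhs_shape;
    dst_shape.set(0, rhs_shape[0]);       // N
    dst_shape.set(1, lhs_shape[1] / m_h); // m_w
    dst_shape.set(2, m_h);                // m_h
    dst_shape.set(3, lhs_shape[2]);       // batches
    return dst_shape;
}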
1242*c217d954SCole Faust 
1243*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>
1244*c217d954SCole Faust class GEMMLowpMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture
1245*c217d954SCole Faust {
1246*c217d954SCole Faust public:
1247*c217d954SCole Faust     template <typename...>
1248*c217d954SCole Faust     void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,
1249*c217d954SCole Faust                unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)
1250*c217d954SCole Faust     {
1251*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
1252*c217d954SCole Faust         lhs_info.m0 = m0;
1253*c217d954SCole Faust         lhs_info.k0 = k0;
1254*c217d954SCole Faust 
1255*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
1256*c217d954SCole Faust         rhs_info.n0         = n0;
1257*c217d954SCole Faust         rhs_info.k0         = k0;
1258*c217d954SCole Faust         rhs_info.h0         = h0;
1259*c217d954SCole Faust         rhs_info.interleave = interleave_rhs;
1260*c217d954SCole Faust         rhs_info.transpose  = transpose_rhs;
1261*c217d954SCole Faust 
1262*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
1263*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
1264*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
1265*c217d954SCole Faust 
1266*c217d954SCole Faust         _target    = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);
1267*c217d954SCole Faust         _reference = compute_reference(lhs_shape, rhs_shape, data_type);
1268*c217d954SCole Faust     }
1269*c217d954SCole Faust 
1270*c217d954SCole Faust protected:
1271*c217d954SCole Faust     template <typename U>
1272*c217d954SCole Faust     void fill(U &&tensor, int i)
1273*c217d954SCole Faust     {
1274*c217d954SCole Faust         switch(tensor.data_type())
1275*c217d954SCole Faust         {
1276*c217d954SCole Faust             case DataType::QASYMM8:
1277*c217d954SCole Faust             {
1278*c217d954SCole Faust                 // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
1279*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(1, 254);
1280*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1281*c217d954SCole Faust             }
1282*c217d954SCole Faust             break;
1283*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
1284*c217d954SCole Faust             {
1285*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(-127, 126);
1286*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1287*c217d954SCole Faust             }
1288*c217d954SCole Faust             break;
1289*c217d954SCole Faust             default:
1290*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
1291*c217d954SCole Faust         }
1292*c217d954SCole Faust     }
1293*c217d954SCole Faust 
1294*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,
1295*c217d954SCole Faust                               const GEMMRHSMatrixInfo &rhs_info, DataType data_type)
1296*c217d954SCole Faust     {
1297*c217d954SCole Faust         // Create tensors
1298*c217d954SCole Faust         TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1299*c217d954SCole Faust         TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1300*c217d954SCole Faust         TensorType rhs_reshaped;
1301*c217d954SCole Faust         TensorType dst;
1302*c217d954SCole Faust 
1303*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
1304*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
1305*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
1306*c217d954SCole Faust 
1307*c217d954SCole Faust         GEMMKernelInfo gemm_info;
1308*c217d954SCole Faust         gemm_info.m        = M;
1309*c217d954SCole Faust         gemm_info.n        = N;
1310*c217d954SCole Faust         gemm_info.k        = K;
1311*c217d954SCole Faust         gemm_info.lhs_info = lhs_info;
1312*c217d954SCole Faust         gemm_info.rhs_info = rhs_info;
1313*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
1314*c217d954SCole Faust 
1315*c217d954SCole Faust         // Create and configure function
1316*c217d954SCole Faust         ReshapeRHSOperatorType reshape_rhs;
1317*c217d954SCole Faust         GEMMFunctionType       gemm;
1318*c217d954SCole Faust         reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1319*c217d954SCole Faust         gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info);
1320*c217d954SCole Faust 
1321*c217d954SCole Faust         ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1322*c217d954SCole Faust         ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1323*c217d954SCole Faust 
1324*c217d954SCole Faust         add_padding_x({ &lhs, &rhs, &rhs_reshaped, &dst });
1325*c217d954SCole Faust 
1326*c217d954SCole Faust         // Allocate tensors
1327*c217d954SCole Faust         lhs.allocator()->allocate();
1328*c217d954SCole Faust         rhs.allocator()->allocate();
1329*c217d954SCole Faust         rhs_reshaped.allocator()->allocate();
1330*c217d954SCole Faust         dst.allocator()->allocate();
1331*c217d954SCole Faust 
1332*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1333*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1334*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1335*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1336*c217d954SCole Faust 
1337*c217d954SCole Faust         // Fill tensors
1338*c217d954SCole Faust         fill(AccessorType(lhs), 0);
1339*c217d954SCole Faust         fill(AccessorType(rhs), 1);
1340*c217d954SCole Faust 
1341*c217d954SCole Faust         // Compute GEMM
1342*c217d954SCole Faust         ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1343*c217d954SCole Faust         reshape_rhs.run(reshape_rhs_pack);
1344*c217d954SCole Faust         ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });
1345*c217d954SCole Faust         gemm.run(gemm_pack);
1346*c217d954SCole Faust 
1347*c217d954SCole Faust         return dst;
1348*c217d954SCole Faust     }
1349*c217d954SCole Faust 
1350*c217d954SCole Faust     SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)
1351*c217d954SCole Faust     {
1352*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
1353*c217d954SCole Faust         dst_shape[0]          = rhs_shape[0];
1354*c217d954SCole Faust         dst_shape[1]          = lhs_shape[1];
1355*c217d954SCole Faust 
1356*c217d954SCole Faust         if(data_type == DataType::QASYMM8)
1357*c217d954SCole Faust         {
1358*c217d954SCole Faust             // Create reference
1359*c217d954SCole Faust             SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };
1360*c217d954SCole Faust             SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };
1361*c217d954SCole Faust 
1362*c217d954SCole Faust             // Fill reference
1363*c217d954SCole Faust             fill(lhs, 0);
1364*c217d954SCole Faust             fill(rhs, 1);
1365*c217d954SCole Faust 
1366*c217d954SCole Faust             return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);
1367*c217d954SCole Faust         }
1368*c217d954SCole Faust         else
1369*c217d954SCole Faust         {
1370*c217d954SCole Faust             // Create reference
1371*c217d954SCole Faust             SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };
1372*c217d954SCole Faust             SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };
1373*c217d954SCole Faust 
1374*c217d954SCole Faust             // Fill reference
1375*c217d954SCole Faust             fill(lhs, 0);
1376*c217d954SCole Faust             fill(rhs, 1);
1377*c217d954SCole Faust 
1378*c217d954SCole Faust             return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);
1379*c217d954SCole Faust         }
1380*c217d954SCole Faust     }
1381*c217d954SCole Faust 
1382*c217d954SCole Faust     TensorType            _target{};
1383*c217d954SCole Faust     SimpleTensor<int32_t> _reference{};
1384*c217d954SCole Faust };
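
// All of the matrix-multiply fixtures above validate against reference::gemmlowp_matrix_multiply_core,
// which accumulates the quantized inputs in int32 after adding the input offsets (the fixtures in this
// block pass offsets of 0). A minimal, naive sketch of that accumulation for row-major data, assuming
// the usual GEMMLowp convention; the helper is illustrative only and is not the library's reference
// implementation.
template <typename TIn>
inline void example_gemmlowp_core_sketch(const TIn *lhs, const TIn *rhs, int32_t *dst,
                                         unsigned int M, unsigned int N, unsigned int K,
                                         int32_t a_offset, int32_t b_offset)
{
    for(unsigned int m = 0; m < M; ++m)
    {
        for(unsigned int n = 0; n < N; ++n)
        {
            // dst(m, n) = sum_k (lhs(m, k) + a_offset) * (rhs(k, n) + b_offset)
            int32_t acc = 0;
            for(unsigned int k = 0; k < K; ++k)
            {
                acc += (static_cast<int32_t>(lhs[m * K + k]) + a_offset) * (static_cast<int32_t>(rhs[k * N + n]) + b_offset);
            }
            dst[m * N + n] = acc;
        }
    }
}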
1385*c217d954SCole Faust 
1386*c217d954SCole Faust template <typename T, typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType, typename ReduceOperation, typename CastOperation>
1387*c217d954SCole Faust class GEMMLowpMatrixMultiplyReshapedOnlyRHSMMULOutputStageValidationFixture : public framework::Fixture
1388*c217d954SCole Faust {
1389*c217d954SCole Faust public:
1390*c217d954SCole Faust     template <typename...>
1391*c217d954SCole Faust     void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,
1392*c217d954SCole Faust                unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, bool broadcast_bias, DataType data_type)
1393*c217d954SCole Faust     {
1394*c217d954SCole Faust         GEMMLowpOutputStageInfo output_stage;
1395*c217d954SCole Faust         output_stage.type                    = GEMMLowpOutputStageType::QUANTIZE_DOWN_FIXEDPOINT;
1396*c217d954SCole Faust         output_stage.output_data_type        = data_type;
1397*c217d954SCole Faust         output_stage.gemmlowp_multipliers    = std::vector<int32_t> { 1 };
1398*c217d954SCole Faust         output_stage.gemmlowp_shifts         = std::vector<int32_t> { 1 };
1399*c217d954SCole Faust         output_stage.gemmlowp_multipliers[0] = 1;
1400*c217d954SCole Faust         output_stage.gemmlowp_shifts[0]      = 1;
1401*c217d954SCole Faust         output_stage.gemmlowp_offset         = 0;
1402*c217d954SCole Faust         constexpr float scale                = 0.001f;
1403*c217d954SCole Faust         quantization::calculate_quantized_multiplier(scale, &output_stage.gemmlowp_multipliers[0], &output_stage.gemmlowp_shifts[0]);
1404*c217d954SCole Faust         output_stage.gemmlowp_min_bound = -100;
1405*c217d954SCole Faust         output_stage.gemmlowp_max_bound = 100;
1406*c217d954SCole Faust 
1407*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
1408*c217d954SCole Faust         lhs_info.m0 = m0;
1409*c217d954SCole Faust         lhs_info.k0 = k0;
1410*c217d954SCole Faust 
1411*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
1412*c217d954SCole Faust         rhs_info.n0         = n0;
1413*c217d954SCole Faust         rhs_info.k0         = k0;
1414*c217d954SCole Faust         rhs_info.h0         = h0;
1415*c217d954SCole Faust         rhs_info.interleave = interleave_rhs;
1416*c217d954SCole Faust         rhs_info.transpose  = transpose_rhs;
1417*c217d954SCole Faust 
1418*c217d954SCole Faust         int a_offset = 1;
1419*c217d954SCole Faust         int b_offset = 1;
1420*c217d954SCole Faust 
1421*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
1422*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
1423*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
1424*c217d954SCole Faust         const TensorShape bias_shape(n,
1425*c217d954SCole Faust                                      broadcast_bias ? 1 : m,
1426*c217d954SCole Faust                                      broadcast_bias ? 1 : batch_size);
1427*c217d954SCole Faust 
1428*c217d954SCole Faust         _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, output_stage, a_offset, b_offset);
1429*c217d954SCole Faust         if(gemm_validated == true)
1430*c217d954SCole Faust         {
1431*c217d954SCole Faust             _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, output_stage, a_offset, b_offset);
1432*c217d954SCole Faust         }
1433*c217d954SCole Faust     }
1434*c217d954SCole Faust 
1435*c217d954SCole Faust protected:
1436*c217d954SCole Faust     template <typename U>
1437*c217d954SCole Faust     void fill(U &&tensor, int i)
1438*c217d954SCole Faust     {
1439*c217d954SCole Faust         switch(tensor.data_type())
1440*c217d954SCole Faust         {
1441*c217d954SCole Faust             case DataType::QASYMM8:
1442*c217d954SCole Faust             {
1443*c217d954SCole Faust                 // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
1444*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(1, 254);
1445*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1446*c217d954SCole Faust             }
1447*c217d954SCole Faust             break;
1448*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
1449*c217d954SCole Faust             {
1450*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(-127, 126);
1451*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1452*c217d954SCole Faust             }
1453*c217d954SCole Faust             break;
1454*c217d954SCole Faust             case DataType::S32:
1455*c217d954SCole Faust             {
1456*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(-10000, 10000);
1457*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1458*c217d954SCole Faust             }
1459*c217d954SCole Faust             break;
1460*c217d954SCole Faust             default:
1461*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
1462*c217d954SCole Faust         }
1463*c217d954SCole Faust     }
1464*c217d954SCole Faust 
1465*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info,
1466*c217d954SCole Faust                               const GEMMRHSMatrixInfo &rhs_info, DataType data_type, GEMMLowpOutputStageInfo output_stage, const int a_offset, const int b_offset)
1467*c217d954SCole Faust     {
1468*c217d954SCole Faust         // Create tensors
1469*c217d954SCole Faust         TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, a_offset));
1470*c217d954SCole Faust         TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, b_offset));
1471*c217d954SCole Faust         TensorType bias = create_tensor<TensorType>(bias_shape, DataType::S32, 1);
1472*c217d954SCole Faust         TensorType dst;
1473*c217d954SCole Faust         TensorType rhs_reshaped;
1474*c217d954SCole Faust 
1475*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
1476*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
1477*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
1478*c217d954SCole Faust 
1479*c217d954SCole Faust         // Tensors for precomputing sum of lhs rows / rhs columns
1480*c217d954SCole Faust         TensorType vec_sum_rows = create_tensor<TensorType>(TensorShape(M, 1, lhs_shape[2]), DataType::S32, 1);
1481*c217d954SCole Faust         TensorType vec_sum_cols = create_tensor<TensorType>(TensorShape(N, 1, rhs_shape[2]), DataType::S32, 1);
1482*c217d954SCole Faust 
1483*c217d954SCole Faust         GEMMKernelInfo gemm_info;
1484*c217d954SCole Faust         gemm_info.m            = M;
1485*c217d954SCole Faust         gemm_info.n            = N;
1486*c217d954SCole Faust         gemm_info.k            = K;
1487*c217d954SCole Faust         gemm_info.lhs_info     = lhs_info;
1488*c217d954SCole Faust         gemm_info.rhs_info     = rhs_info;
1489*c217d954SCole Faust         gemm_info.output_stage = output_stage;
1490*c217d954SCole Faust         gemm_info.a_offset     = a_offset;
1491*c217d954SCole Faust         gemm_info.b_offset     = b_offset;
1492*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
1493*c217d954SCole Faust 
1494*c217d954SCole Faust         // Create and configure function
1495*c217d954SCole Faust         ReshapeRHSOperatorType reshape_rhs;
1496*c217d954SCole Faust         GEMMFunctionType       gemm;
1497*c217d954SCole Faust         reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1498*c217d954SCole Faust 
1499*c217d954SCole Faust         // If GEMM is not validated, do not try to run: validation checks whether the target
1500*c217d954SCole Faust         // supports the required extension. If it does not, the test will be skipped; running
1501*c217d954SCole Faust         // it anyway would only make the test fail because target and reference would not
1502*c217d954SCole Faust         // match.
1503*c217d954SCole Faust         gemm_validated = bool(gemm.validate(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, vec_sum_cols.info(), vec_sum_rows.info(), bias.info()));
1504*c217d954SCole Faust         if(gemm_validated == true)
1505*c217d954SCole Faust         {
1506*c217d954SCole Faust             gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, vec_sum_cols.info(), vec_sum_rows.info(), bias.info());
1507*c217d954SCole Faust 
1508*c217d954SCole Faust             ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1509*c217d954SCole Faust             ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1510*c217d954SCole Faust             ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
1511*c217d954SCole Faust 
1512*c217d954SCole Faust             // Allocate tensors
1513*c217d954SCole Faust             lhs.allocator()->allocate();
1514*c217d954SCole Faust             rhs.allocator()->allocate();
1515*c217d954SCole Faust             rhs_reshaped.allocator()->allocate();
1516*c217d954SCole Faust             bias.allocator()->allocate();
1517*c217d954SCole Faust             vec_sum_cols.allocator()->allocate();
1518*c217d954SCole Faust             vec_sum_rows.allocator()->allocate();
1519*c217d954SCole Faust             dst.allocator()->allocate();
1520*c217d954SCole Faust 
1521*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1522*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1523*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1524*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
1525*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!vec_sum_cols.info()->is_resizable());
1526*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!vec_sum_rows.info()->is_resizable());
1527*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1528*c217d954SCole Faust 
1529*c217d954SCole Faust             // Fill tensors
1530*c217d954SCole Faust             fill(AccessorType(lhs), 0);
1531*c217d954SCole Faust             fill(AccessorType(rhs), 1);
1532*c217d954SCole Faust             fill(AccessorType(bias), 2);
1533*c217d954SCole Faust 
1534*c217d954SCole Faust             TensorType    lhs_32 = create_tensor<TensorType>(lhs_shape, DataType::S32, 1);
1535*c217d954SCole Faust             TensorType    rhs_32 = create_tensor<TensorType>(rhs_shape, DataType::S32, 1);
1536*c217d954SCole Faust             CastOperation cast_lhs;
1537*c217d954SCole Faust             CastOperation cast_rhs;
1538*c217d954SCole Faust             cast_lhs.configure(&lhs, &lhs_32, ConvertPolicy::SATURATE);
1539*c217d954SCole Faust             cast_rhs.configure(&rhs, &rhs_32, ConvertPolicy::SATURATE);
1540*c217d954SCole Faust             lhs_32.allocator()->allocate();
1541*c217d954SCole Faust             rhs_32.allocator()->allocate();
1542*c217d954SCole Faust             cast_lhs.run();
1543*c217d954SCole Faust             cast_rhs.run();
1544*c217d954SCole Faust 
1545*c217d954SCole Faust             ReduceOperation lhs_sum_rows;
1546*c217d954SCole Faust             ReduceOperation rhs_sum_cols;
1547*c217d954SCole Faust 
1548*c217d954SCole Faust             lhs_sum_rows.configure(&lhs_32, &vec_sum_rows, 0, ReductionOperation::SUM, false);
1549*c217d954SCole Faust             rhs_sum_cols.configure(&rhs_32, &vec_sum_cols, 1, ReductionOperation::SUM);
1550*c217d954SCole Faust 
1551*c217d954SCole Faust             lhs_sum_rows.run();
1552*c217d954SCole Faust             rhs_sum_cols.run();
1553*c217d954SCole Faust 
1554*c217d954SCole Faust             // Compute GEMM
1555*c217d954SCole Faust             ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1556*c217d954SCole Faust             reshape_rhs.run(reshape_rhs_pack);
1557*c217d954SCole Faust             ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_SRC_2, &bias }, { ACL_DST, &dst }, { ACL_VEC_COL_SUM, &vec_sum_cols }, { ACL_VEC_ROW_SUM, &vec_sum_rows } });
1558*c217d954SCole Faust             gemm.run(gemm_pack);
1559*c217d954SCole Faust         }
1560*c217d954SCole Faust 
1561*c217d954SCole Faust         return dst;
1562*c217d954SCole Faust     }
1563*c217d954SCole Faust 
1564*c217d954SCole Faust     SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, GEMMLowpOutputStageInfo output_stage,
1565*c217d954SCole Faust                                       const int a_offset, const int b_offset)
1566*c217d954SCole Faust     {
1567*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
1568*c217d954SCole Faust         dst_shape[0]          = rhs_shape[0];
1569*c217d954SCole Faust         dst_shape[1]          = lhs_shape[1];
1570*c217d954SCole Faust 
1571*c217d954SCole Faust         // Create reference
1572*c217d954SCole Faust         SimpleTensor<T>       lhs{ lhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, a_offset) };
1573*c217d954SCole Faust         SimpleTensor<T>       rhs{ rhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, b_offset) };
1574*c217d954SCole Faust         SimpleTensor<int32_t> bias{ bias_shape, DataType::S32, 1 };
1575*c217d954SCole Faust         SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };
1576*c217d954SCole Faust         SimpleTensor<T>       dst_final{ dst_shape, data_type, 1 };
1577*c217d954SCole Faust 
1578*c217d954SCole Faust         // Fill reference
1579*c217d954SCole Faust         fill(lhs, 0);
1580*c217d954SCole Faust         fill(rhs, 1);
1581*c217d954SCole Faust         fill(bias, 2);
1582*c217d954SCole Faust 
1583*c217d954SCole Faust         dst       = reference::gemmlowp_matrix_multiply_core<int32_t, T>(lhs, rhs, dst_shape, a_offset, b_offset);
1584*c217d954SCole Faust         dst_final = reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, T>(dst, bias,
1585*c217d954SCole Faust                                                                                       output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_offset, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);
1586*c217d954SCole Faust         return dst_final;
1587*c217d954SCole Faust     }
1588*c217d954SCole Faust 
1589*c217d954SCole Faust     bool            gemm_validated = true;
1590*c217d954SCole Faust     TensorType      _target{};
1591*c217d954SCole Faust     SimpleTensor<T> _reference{};
1592*c217d954SCole Faust };
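
// The MMUL output-stage fixture above precomputes vec_sum_rows (per-row sums of the LHS over K) and
// vec_sum_cols (per-column sums of the RHS over K) so that the kernel can fold the quantization
// offsets into the raw int32 dot products. A minimal sketch of that algebra, assuming the usual
// offset-contribution identity obtained by expanding sum_k (lhs + a_offset) * (rhs + b_offset);
// the helper and its parameter names are made up for this example and are not used by the fixtures.
inline int32_t example_offset_contribution_sketch(int32_t raw_dot, int32_t lhs_row_sum, int32_t rhs_col_sum,
                                                  int32_t a_offset, int32_t b_offset, int32_t k)
{
    // raw_dot     : sum_k lhs(m, k) * rhs(k, n) without any offsets
    // lhs_row_sum : sum_k lhs(m, k), one value per output row
    // rhs_col_sum : sum_k rhs(k, n), one value per output column
    return raw_dot + a_offset * rhs_col_sum + b_offset * lhs_row_sum + k * a_offset * b_offset;
}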
1593*c217d954SCole Faust 
1594*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>
1595*c217d954SCole Faust class GEMMLowpMatrixMultiplyReshapedOnlyRHSMMULValidationFixture : public framework::Fixture
1596*c217d954SCole Faust {
1597*c217d954SCole Faust public:
1598*c217d954SCole Faust     template <typename...>
1599*c217d954SCole Faust     void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,
1600*c217d954SCole Faust                unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)
1601*c217d954SCole Faust     {
1602*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
1603*c217d954SCole Faust         lhs_info.m0 = m0;
1604*c217d954SCole Faust         lhs_info.k0 = k0;
1605*c217d954SCole Faust 
1606*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
1607*c217d954SCole Faust         rhs_info.n0         = n0;
1608*c217d954SCole Faust         rhs_info.k0         = k0;
1609*c217d954SCole Faust         rhs_info.h0         = h0;
1610*c217d954SCole Faust         rhs_info.interleave = interleave_rhs;
1611*c217d954SCole Faust         rhs_info.transpose  = transpose_rhs;
1612*c217d954SCole Faust 
1613*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
1614*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
1615*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
1616*c217d954SCole Faust 
1617*c217d954SCole Faust         _target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);
1618*c217d954SCole Faust         if(gemm_validated == true)
1619*c217d954SCole Faust         {
1620*c217d954SCole Faust             _reference = compute_reference(lhs_shape, rhs_shape, data_type);
1621*c217d954SCole Faust         }
1622*c217d954SCole Faust     }
1623*c217d954SCole Faust 
1624*c217d954SCole Faust protected:
1625*c217d954SCole Faust     template <typename U>
1626*c217d954SCole Faust     void fill(U &&tensor, int i)
1627*c217d954SCole Faust     {
1628*c217d954SCole Faust         switch(tensor.data_type())
1629*c217d954SCole Faust         {
1630*c217d954SCole Faust             case DataType::QASYMM8:
1631*c217d954SCole Faust             {
1632*c217d954SCole Faust                 // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
1633*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(1, 254);
1634*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1635*c217d954SCole Faust             }
1636*c217d954SCole Faust             break;
1637*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
1638*c217d954SCole Faust             {
1639*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(-127, 126);
1640*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1641*c217d954SCole Faust             }
1642*c217d954SCole Faust             break;
1643*c217d954SCole Faust             default:
1644*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
1645*c217d954SCole Faust         }
1646*c217d954SCole Faust     }
1647*c217d954SCole Faust 
1648*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,
1649*c217d954SCole Faust                               const GEMMRHSMatrixInfo &rhs_info, DataType data_type)
1650*c217d954SCole Faust     {
1651*c217d954SCole Faust         // Create tensors
1652*c217d954SCole Faust         TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1653*c217d954SCole Faust         TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1654*c217d954SCole Faust         TensorType rhs_reshaped;
1655*c217d954SCole Faust         TensorType dst;
1656*c217d954SCole Faust 
1657*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
1658*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
1659*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
1660*c217d954SCole Faust 
1661*c217d954SCole Faust         GEMMKernelInfo gemm_info;
1662*c217d954SCole Faust         gemm_info.m        = M;
1663*c217d954SCole Faust         gemm_info.n        = N;
1664*c217d954SCole Faust         gemm_info.k        = K;
1665*c217d954SCole Faust         gemm_info.lhs_info = lhs_info;
1666*c217d954SCole Faust         gemm_info.rhs_info = rhs_info;
1667*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
1668*c217d954SCole Faust 
1669*c217d954SCole Faust         // Create and configure function
1670*c217d954SCole Faust         ReshapeRHSOperatorType reshape_rhs;
1671*c217d954SCole Faust         GEMMFunctionType       gemm;
1672*c217d954SCole Faust         reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1673*c217d954SCole Faust 
1674*c217d954SCole Faust         // If GEMM does not validate, do not try to configure or run it. Validation checks
1675*c217d954SCole Faust         // whether the target supports the required extension; if it does not, the test is
1676*c217d954SCole Faust         // effectively skipped. Running without that support would make the test fail anyway,
1677*c217d954SCole Faust         // because target and reference would not match.
1678*c217d954SCole Faust         gemm_validated = bool(gemm.validate(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, nullptr, nullptr, nullptr));
1679*c217d954SCole Faust         if(gemm_validated == true)
1680*c217d954SCole Faust         {
1681*c217d954SCole Faust             gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, nullptr, nullptr, nullptr);
1682*c217d954SCole Faust 
1683*c217d954SCole Faust             ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1684*c217d954SCole Faust             ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1685*c217d954SCole Faust 
1686*c217d954SCole Faust             // Allocate tensors
1687*c217d954SCole Faust             lhs.allocator()->allocate();
1688*c217d954SCole Faust             rhs.allocator()->allocate();
1689*c217d954SCole Faust             rhs_reshaped.allocator()->allocate();
1690*c217d954SCole Faust             dst.allocator()->allocate();
1691*c217d954SCole Faust 
1692*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1693*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1694*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1695*c217d954SCole Faust             ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1696*c217d954SCole Faust 
1697*c217d954SCole Faust             // Fill tensors
1698*c217d954SCole Faust             fill(AccessorType(lhs), 0);
1699*c217d954SCole Faust             fill(AccessorType(rhs), 1);
1700*c217d954SCole Faust 
1701*c217d954SCole Faust             // Compute GEMM
1702*c217d954SCole Faust             ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1703*c217d954SCole Faust             reshape_rhs.run(reshape_rhs_pack);
1704*c217d954SCole Faust             ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });
1705*c217d954SCole Faust             gemm.run(gemm_pack);
1706*c217d954SCole Faust         }
1707*c217d954SCole Faust 
1708*c217d954SCole Faust         return dst;
1709*c217d954SCole Faust     }
1710*c217d954SCole Faust 
1711*c217d954SCole Faust     SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)
1712*c217d954SCole Faust     {
1713*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
1714*c217d954SCole Faust         dst_shape[0]          = rhs_shape[0];
1715*c217d954SCole Faust         dst_shape[1]          = lhs_shape[1];
1716*c217d954SCole Faust 
1717*c217d954SCole Faust         if(data_type == DataType::QASYMM8)
1718*c217d954SCole Faust         {
1719*c217d954SCole Faust             // Create reference
1720*c217d954SCole Faust             SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };
1721*c217d954SCole Faust             SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };
1722*c217d954SCole Faust             SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };
1723*c217d954SCole Faust 
1724*c217d954SCole Faust             // Fill reference
1725*c217d954SCole Faust             fill(lhs, 0);
1726*c217d954SCole Faust             fill(rhs, 1);
1727*c217d954SCole Faust 
1728*c217d954SCole Faust             return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);
1729*c217d954SCole Faust         }
1730*c217d954SCole Faust         else
1731*c217d954SCole Faust         {
1732*c217d954SCole Faust             // Create reference
1733*c217d954SCole Faust             SimpleTensor<int8_t>  lhs{ lhs_shape, data_type, 1 };
1734*c217d954SCole Faust             SimpleTensor<int8_t>  rhs{ rhs_shape, data_type, 1 };
1735*c217d954SCole Faust             SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };
1736*c217d954SCole Faust 
1737*c217d954SCole Faust             // Fill reference
1738*c217d954SCole Faust             fill(lhs, 0);
1739*c217d954SCole Faust             fill(rhs, 1);
1740*c217d954SCole Faust 
1741*c217d954SCole Faust             return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);
1742*c217d954SCole Faust         }
1743*c217d954SCole Faust     }
1744*c217d954SCole Faust 
1745*c217d954SCole Faust     bool                  gemm_validated = true;
1746*c217d954SCole Faust     TensorType            _target{};
1747*c217d954SCole Faust     SimpleTensor<int32_t> _reference{};
1748*c217d954SCole Faust };
1749*c217d954SCole Faust 
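// Fixture for the GEMMLowp matrix multiplication with reshaped-only-RHS and a 3D output:
// the flat M dimension (m_w * m_h) of the 2D GEMM result is re-interpreted as m_h slices of
// height m_w via GEMMKernelInfo::depth_output_gemm3d.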
1750*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>
1751*c217d954SCole Faust class GEMMLowpMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture
1752*c217d954SCole Faust {
1753*c217d954SCole Faust public:
1754*c217d954SCole Faust     template <typename...>
1755*c217d954SCole Faust     void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,
1756*c217d954SCole Faust                unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)
1757*c217d954SCole Faust     {
1758*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
1759*c217d954SCole Faust         lhs_info.m0 = m0;
1760*c217d954SCole Faust         lhs_info.k0 = k0;
1761*c217d954SCole Faust 
1762*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
1763*c217d954SCole Faust         rhs_info.n0         = n0;
1764*c217d954SCole Faust         rhs_info.k0         = k0;
1765*c217d954SCole Faust         rhs_info.h0         = h0;
1766*c217d954SCole Faust         rhs_info.interleave = interleave_rhs;
1767*c217d954SCole Faust         rhs_info.transpose  = transpose_rhs;
1768*c217d954SCole Faust 
1769*c217d954SCole Faust         // In case of GEMM3D, m is the product between m_w and m_h
1770*c217d954SCole Faust         const unsigned int m = m_w * m_h;
1771*c217d954SCole Faust 
1772*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
1773*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
1774*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
1775*c217d954SCole Faust 
1776*c217d954SCole Faust         _target    = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h, data_type);
1777*c217d954SCole Faust         _reference = compute_reference(lhs_shape, rhs_shape, m_h, data_type);
1778*c217d954SCole Faust     }
1779*c217d954SCole Faust 
1780*c217d954SCole Faust protected:
1781*c217d954SCole Faust     template <typename U>
1782*c217d954SCole Faust     void fill(U &&tensor, int i)
1783*c217d954SCole Faust     {
1784*c217d954SCole Faust         switch(tensor.data_type())
1785*c217d954SCole Faust         {
1786*c217d954SCole Faust             case DataType::QASYMM8:
1787*c217d954SCole Faust             {
1788*c217d954SCole Faust                 // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
1789*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(1, 254);
1790*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1791*c217d954SCole Faust             }
1792*c217d954SCole Faust             break;
1793*c217d954SCole Faust             case DataType::QASYMM8_SIGNED:
1794*c217d954SCole Faust             {
1795*c217d954SCole Faust                 std::uniform_int_distribution<> distribution(-127, 126);
1796*c217d954SCole Faust                 library->fill(tensor, distribution, i);
1797*c217d954SCole Faust             }
1798*c217d954SCole Faust             break;
1799*c217d954SCole Faust             default:
1800*c217d954SCole Faust                 ARM_COMPUTE_ERROR("Unsupported data type");
1801*c217d954SCole Faust         }
1802*c217d954SCole Faust     }
1803*c217d954SCole Faust 
1804*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,
1805*c217d954SCole Faust                               const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h, DataType data_type)
1806*c217d954SCole Faust     {
1807*c217d954SCole Faust         // Create tensors
1808*c217d954SCole Faust         TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1809*c217d954SCole Faust         TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1810*c217d954SCole Faust         TensorType rhs_reshaped;
1811*c217d954SCole Faust         TensorType dst;
1812*c217d954SCole Faust 
1813*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
1814*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
1815*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
1816*c217d954SCole Faust 
1817*c217d954SCole Faust         GEMMKernelInfo gemm_info;
1818*c217d954SCole Faust         gemm_info.m                   = M;
1819*c217d954SCole Faust         gemm_info.n                   = N;
1820*c217d954SCole Faust         gemm_info.k                   = K;
1821*c217d954SCole Faust         gemm_info.depth_output_gemm3d = m_h;
1822*c217d954SCole Faust         gemm_info.lhs_info            = lhs_info;
1823*c217d954SCole Faust         gemm_info.rhs_info            = rhs_info;
1824*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
1825*c217d954SCole Faust 
1826*c217d954SCole Faust         // Create and configure function
1827*c217d954SCole Faust         ReshapeRHSOperatorType reshape_rhs;
1828*c217d954SCole Faust         GEMMFunctionType       gemm;
1829*c217d954SCole Faust         reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1830*c217d954SCole Faust         gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info);
1831*c217d954SCole Faust 
1832*c217d954SCole Faust         ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1833*c217d954SCole Faust         ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1834*c217d954SCole Faust 
1835*c217d954SCole Faust         add_padding_x({ &lhs, &rhs, &rhs_reshaped, &dst });
1836*c217d954SCole Faust 
1837*c217d954SCole Faust         // Allocate tensors
1838*c217d954SCole Faust         lhs.allocator()->allocate();
1839*c217d954SCole Faust         rhs.allocator()->allocate();
1840*c217d954SCole Faust         rhs_reshaped.allocator()->allocate();
1841*c217d954SCole Faust         dst.allocator()->allocate();
1842*c217d954SCole Faust 
1843*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1844*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1845*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1846*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1847*c217d954SCole Faust 
1848*c217d954SCole Faust         // Fill tensors
1849*c217d954SCole Faust         fill(AccessorType(lhs), 0);
1850*c217d954SCole Faust         fill(AccessorType(rhs), 1);
1851*c217d954SCole Faust 
1852*c217d954SCole Faust         // Compute GEMM
1853*c217d954SCole Faust         ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1854*c217d954SCole Faust         reshape_rhs.run(reshape_rhs_pack);
1855*c217d954SCole Faust         ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });
1856*c217d954SCole Faust         gemm.run(gemm_pack);
1857*c217d954SCole Faust 
1858*c217d954SCole Faust         return dst;
1859*c217d954SCole Faust     }
1860*c217d954SCole Faust 
1861*c217d954SCole Faust     SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h, DataType data_type)
1862*c217d954SCole Faust     {
1863*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
1864*c217d954SCole Faust         dst_shape.set(0, rhs_shape[0]);
1865*c217d954SCole Faust         dst_shape.set(1, lhs_shape[1] / m_h);
1866*c217d954SCole Faust         dst_shape.set(2, m_h);
1867*c217d954SCole Faust         dst_shape.set(3, lhs_shape[2]);
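        // The reference is still a plain 2D GEMM; only the output shape is re-interpreted.
        // For example (hypothetical sizes), with m_w = 4, m_h = 3 and batch_size = 2 the flat
        // result (N, 12, 2) is viewed as (N, 4, 3, 2).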
1868*c217d954SCole Faust 
1869*c217d954SCole Faust         if(data_type == DataType::QASYMM8)
1870*c217d954SCole Faust         {
1871*c217d954SCole Faust             // Create reference
1872*c217d954SCole Faust             SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };
1873*c217d954SCole Faust             SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };
1874*c217d954SCole Faust 
1875*c217d954SCole Faust             // Fill reference
1876*c217d954SCole Faust             fill(lhs, 0);
1877*c217d954SCole Faust             fill(rhs, 1);
1878*c217d954SCole Faust 
1879*c217d954SCole Faust             return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);
1880*c217d954SCole Faust         }
1881*c217d954SCole Faust         else
1882*c217d954SCole Faust         {
1883*c217d954SCole Faust             // Create reference
1884*c217d954SCole Faust             SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };
1885*c217d954SCole Faust             SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };
1886*c217d954SCole Faust 
1887*c217d954SCole Faust             // Fill reference
1888*c217d954SCole Faust             fill(lhs, 0);
1889*c217d954SCole Faust             fill(rhs, 1);
1890*c217d954SCole Faust 
1891*c217d954SCole Faust             return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);
1892*c217d954SCole Faust         }
1893*c217d954SCole Faust     }
1894*c217d954SCole Faust 
1895*c217d954SCole Faust     TensorType            _target{};
1896*c217d954SCole Faust     SimpleTensor<int32_t> _reference{};
1897*c217d954SCole Faust };
1898*c217d954SCole Faust 
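// Fixture for the native (non-reshaped) GEMMLowp matrix multiplication; inputs are always
// QASYMM8 and the raw S32 accumulation is compared against the reference.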
1899*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename GEMMFunctionType>
1900*c217d954SCole Faust class GEMMLowpMatrixMultiplyNativeValidationFixture : public framework::Fixture
1901*c217d954SCole Faust {
1902*c217d954SCole Faust public:
1903*c217d954SCole Faust     template <typename...>
1904*c217d954SCole Faust     void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0)
1905*c217d954SCole Faust     {
1906*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
1907*c217d954SCole Faust         lhs_info.m0 = m0;
1908*c217d954SCole Faust         lhs_info.k0 = k0;
1909*c217d954SCole Faust 
1910*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
1911*c217d954SCole Faust         rhs_info.n0 = n0;
1912*c217d954SCole Faust         rhs_info.k0 = k0;
1913*c217d954SCole Faust 
1914*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
1915*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
1916*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
1917*c217d954SCole Faust 
1918*c217d954SCole Faust         _target    = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info);
1919*c217d954SCole Faust         _reference = compute_reference(lhs_shape, rhs_shape);
1920*c217d954SCole Faust     }
1921*c217d954SCole Faust 
1922*c217d954SCole Faust protected:
1923*c217d954SCole Faust     template <typename U>
1924*c217d954SCole Faust     void fill(U &&tensor, int i)
1925*c217d954SCole Faust     {
1926*c217d954SCole Faust         // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
1927*c217d954SCole Faust         std::uniform_int_distribution<> distribution(1, 254);
1928*c217d954SCole Faust         library->fill(tensor, distribution, i);
1929*c217d954SCole Faust     }
1930*c217d954SCole Faust 
1931*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info)
1932*c217d954SCole Faust     {
1933*c217d954SCole Faust         // Create tensors
1934*c217d954SCole Faust         TensorType lhs = create_tensor<TensorType>(lhs_shape, DataType::QASYMM8, 1);
1935*c217d954SCole Faust         TensorType rhs = create_tensor<TensorType>(rhs_shape, DataType::QASYMM8, 1);
1936*c217d954SCole Faust         TensorType dst;
1937*c217d954SCole Faust 
1938*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
1939*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
1940*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
1941*c217d954SCole Faust 
1942*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
1943*c217d954SCole Faust 
1944*c217d954SCole Faust         // Create and configure function
1945*c217d954SCole Faust         GEMMFunctionType gemm;
1946*c217d954SCole Faust         gemm.configure(lhs.info(), rhs.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K));
1947*c217d954SCole Faust 
1948*c217d954SCole Faust         ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1949*c217d954SCole Faust         ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1950*c217d954SCole Faust 
1951*c217d954SCole Faust         add_padding_x({ &lhs, &rhs, &dst });
1952*c217d954SCole Faust 
1953*c217d954SCole Faust         // Allocate tensors
1954*c217d954SCole Faust         lhs.allocator()->allocate();
1955*c217d954SCole Faust         rhs.allocator()->allocate();
1956*c217d954SCole Faust         dst.allocator()->allocate();
1957*c217d954SCole Faust 
1958*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1959*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1960*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1961*c217d954SCole Faust 
1962*c217d954SCole Faust         // Fill tensors
1963*c217d954SCole Faust         fill(AccessorType(lhs), 0);
1964*c217d954SCole Faust         fill(AccessorType(rhs), 1);
1965*c217d954SCole Faust 
1966*c217d954SCole Faust         // Compute GEMM
1967*c217d954SCole Faust         ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs }, { ACL_DST, &dst } });
1968*c217d954SCole Faust         gemm.run(gemm_pack);
1969*c217d954SCole Faust 
1970*c217d954SCole Faust         return dst;
1971*c217d954SCole Faust     }
1972*c217d954SCole Faust 
1973*c217d954SCole Faust     SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape)
1974*c217d954SCole Faust     {
1975*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
1976*c217d954SCole Faust         dst_shape[0]          = rhs_shape[0];
1977*c217d954SCole Faust         dst_shape[1]          = lhs_shape[1];
1978*c217d954SCole Faust 
1979*c217d954SCole Faust         // Create reference
1980*c217d954SCole Faust         SimpleTensor<uint8_t> lhs{ lhs_shape, DataType::QASYMM8, 1 };
1981*c217d954SCole Faust         SimpleTensor<uint8_t> rhs{ rhs_shape, DataType::QASYMM8, 1 };
1982*c217d954SCole Faust 
1983*c217d954SCole Faust         // Fill reference
1984*c217d954SCole Faust         fill(lhs, 0);
1985*c217d954SCole Faust         fill(rhs, 1);
1986*c217d954SCole Faust 
1987*c217d954SCole Faust         return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);
1988*c217d954SCole Faust     }
1989*c217d954SCole Faust 
1990*c217d954SCole Faust     TensorType            _target{};
1991*c217d954SCole Faust     SimpleTensor<int32_t> _reference{};
1992*c217d954SCole Faust };
1993*c217d954SCole Faust 
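// 3D variant of the native GEMMLowp fixture: as above, the flat M dimension (m_w * m_h) of
// the 2D result is re-interpreted as m_h slices of height m_w, here through GEMMReshapeInfo.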
1994*c217d954SCole Faust template <typename TensorType, typename AccessorType, typename GEMMFunctionType>
1995*c217d954SCole Faust class GEMMLowpMatrixMultiplyNative3DValidationFixture : public framework::Fixture
1996*c217d954SCole Faust {
1997*c217d954SCole Faust public:
1998*c217d954SCole Faust     template <typename...>
1999*c217d954SCole Faust     void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0)
2000*c217d954SCole Faust     {
2001*c217d954SCole Faust         GEMMLHSMatrixInfo lhs_info;
2002*c217d954SCole Faust         lhs_info.m0 = m0;
2003*c217d954SCole Faust         lhs_info.k0 = k0;
2004*c217d954SCole Faust 
2005*c217d954SCole Faust         GEMMRHSMatrixInfo rhs_info;
2006*c217d954SCole Faust         rhs_info.n0 = n0;
2007*c217d954SCole Faust         rhs_info.k0 = k0;
2008*c217d954SCole Faust 
2009*c217d954SCole Faust         // In case of GEMM3D, m is the product between m_w and m_h
2010*c217d954SCole Faust         const unsigned int m = m_w * m_h;
2011*c217d954SCole Faust 
2012*c217d954SCole Faust         // Set the tensor shapes for LHS and RHS matrices
2013*c217d954SCole Faust         const TensorShape lhs_shape(k, m, batch_size);
2014*c217d954SCole Faust         const TensorShape rhs_shape(n, k, batch_size);
2015*c217d954SCole Faust 
2016*c217d954SCole Faust         _target    = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h);
2017*c217d954SCole Faust         _reference = compute_reference(lhs_shape, rhs_shape, m_h);
2018*c217d954SCole Faust     }
2019*c217d954SCole Faust 
2020*c217d954SCole Faust protected:
2021*c217d954SCole Faust     template <typename U>
2022*c217d954SCole Faust     void fill(U &&tensor, int i)
2023*c217d954SCole Faust     {
2024*c217d954SCole Faust         // Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path
2025*c217d954SCole Faust         std::uniform_int_distribution<> distribution(1, 254);
2026*c217d954SCole Faust         library->fill(tensor, distribution, i);
2027*c217d954SCole Faust     }
2028*c217d954SCole Faust 
2029*c217d954SCole Faust     TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h)
2030*c217d954SCole Faust     {
2031*c217d954SCole Faust         // Create tensors
2032*c217d954SCole Faust         TensorType lhs = create_tensor<TensorType>(lhs_shape, DataType::QASYMM8, 1);
2033*c217d954SCole Faust         TensorType rhs = create_tensor<TensorType>(rhs_shape, DataType::QASYMM8, 1);
2034*c217d954SCole Faust         TensorType dst;
2035*c217d954SCole Faust 
2036*c217d954SCole Faust         const unsigned int M = lhs_shape[1];
2037*c217d954SCole Faust         const unsigned int N = rhs_shape[0];
2038*c217d954SCole Faust         const unsigned int K = lhs_shape[0];
2039*c217d954SCole Faust 
2040*c217d954SCole Faust         // The output tensor will be auto-initialized within the function
2041*c217d954SCole Faust 
2042*c217d954SCole Faust         // Create and configure function
2043*c217d954SCole Faust         GEMMFunctionType gemm;
2044*c217d954SCole Faust         gemm.configure(lhs.info(), rhs.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K, 1, 1, m_h));
2045*c217d954SCole Faust 
2046*c217d954SCole Faust         ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
2047*c217d954SCole Faust         ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
2048*c217d954SCole Faust 
2049*c217d954SCole Faust         add_padding_x({ &lhs, &rhs, &dst });
2050*c217d954SCole Faust 
2051*c217d954SCole Faust         // Allocate tensors
2052*c217d954SCole Faust         lhs.allocator()->allocate();
2053*c217d954SCole Faust         rhs.allocator()->allocate();
2054*c217d954SCole Faust         dst.allocator()->allocate();
2055*c217d954SCole Faust 
2056*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
2057*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
2058*c217d954SCole Faust         ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
2059*c217d954SCole Faust 
2060*c217d954SCole Faust         // Fill tensors
2061*c217d954SCole Faust         fill(AccessorType(lhs), 0);
2062*c217d954SCole Faust         fill(AccessorType(rhs), 1);
2063*c217d954SCole Faust 
2064*c217d954SCole Faust         // Compute GEMM
2065*c217d954SCole Faust         ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs }, { ACL_DST, &dst } });
2066*c217d954SCole Faust         gemm.run(gemm_pack);
2067*c217d954SCole Faust 
2068*c217d954SCole Faust         return dst;
2069*c217d954SCole Faust     }
2070*c217d954SCole Faust 
2071*c217d954SCole Faust     SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h)
2072*c217d954SCole Faust     {
2073*c217d954SCole Faust         TensorShape dst_shape = lhs_shape;
2074*c217d954SCole Faust         dst_shape.set(0, rhs_shape[0]);
2075*c217d954SCole Faust         dst_shape.set(1, lhs_shape[1] / m_h);
2076*c217d954SCole Faust         dst_shape.set(2, m_h);
2077*c217d954SCole Faust         dst_shape.set(3, lhs_shape[2]);
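        // As in the reshaped-RHS 3D fixture above, only the shape changes: e.g. (hypothetical
        // sizes) m_w = 4, m_h = 3 and batch_size = 2 turn the flat (N, 12, 2) result into (N, 4, 3, 2).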
2078*c217d954SCole Faust 
2079*c217d954SCole Faust         // Create reference
2080*c217d954SCole Faust         SimpleTensor<uint8_t> lhs{ lhs_shape, DataType::QASYMM8, 1 };
2081*c217d954SCole Faust         SimpleTensor<uint8_t> rhs{ rhs_shape, DataType::QASYMM8, 1 };
2082*c217d954SCole Faust 
2083*c217d954SCole Faust         // Fill reference
2084*c217d954SCole Faust         fill(lhs, 0);
2085*c217d954SCole Faust         fill(rhs, 1);
2086*c217d954SCole Faust 
2087*c217d954SCole Faust         return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);
2088*c217d954SCole Faust     }
2089*c217d954SCole Faust 
2090*c217d954SCole Faust     TensorType            _target{};
2091*c217d954SCole Faust     SimpleTensor<int32_t> _reference{};
2092*c217d954SCole Faust };
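// A minimal usage sketch (not part of the library: the fixture/kernel type names below are
// hypothetical placeholders; real instantiations live in the backend-specific test suites):
//
//   using ExampleNativeFixture =
//       GEMMLowpMatrixMultiplyNativeValidationFixture<Tensor, Accessor, SomeGEMMLowpNativeKernel>;
//
//   FIXTURE_DATA_TEST_CASE(RunSmall, ExampleNativeFixture, framework::DatasetMode::ALL, some_dataset)
//   {
//       // The fixture exposes the computed target and reference for comparison
//       validate(Accessor(_target), _reference);
//   }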
2093*c217d954SCole Faust } // namespace validation
2094*c217d954SCole Faust } // namespace test
2095*c217d954SCole Faust } // namespace arm_compute
2096*c217d954SCole Faust #endif /* ARM_COMPUTE_TEST_GEMMLOWP_FIXTURE */