vktSpvAsmFloatControlsTests.cpp (revision 35238bce31c2a825756842865a792f8cf7f89930) - OpenGrok cross reference for /aosp_15_r20/external/deqp/external/vulkancts/modules/vulkan/spirv_assembly/vktSpvAsmFloatControlsTests.cpp

/*-------------------------------------------------------------------------
 * Vulkan Conformance Tests
 * ------------------------
 *
 * Copyright (c) 2018 The Khronos Group Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 *//*!
 * \file
 * \brief VK_KHR_shader_float_controls tests.
 *//*--------------------------------------------------------------------*/

#define _USE_MATH_DEFINES

#include "vktSpvAsmFloatControlsTests.hpp"
#include "vktSpvAsmComputeShaderCase.hpp"
#include "vktSpvAsmGraphicsShaderTestUtil.hpp"
#include "vktTestGroupUtil.hpp"
#include "tcuFloat.hpp"
#include "tcuFloatFormat.hpp"
#include "tcuStringTemplate.hpp"
#include "deUniquePtr.hpp"
#include "deFloat16.h"
#include "vkQueryUtil.hpp"
#include "vkRefUtil.hpp"
#include <cstring>
#include <vector>
#include <limits>
#include <cstdint>
#include <fenv.h>
#include <cstdint>
#include <cmath>

namespace vkt
{
namespace SpirVAssembly
{

namespace
{

using namespace std;
using namespace tcu;

enum VariableType
{
    FP16 = 0,
    FP32,
    FP64,
    UINT32,
    UINT64,
    INT32,
    INT64
};

enum class BufferDataType
{
    DATA_UNKNOWN = 0,
    DATA_FP16    = 1,
    DATA_FP32    = 2,
    DATA_FP64    = 3,
};

enum FloatUsage
{
    // If the float type is 16bit, then the use of the type is supported by
    // VK_KHR_16bit_storage.
    FLOAT_STORAGE_ONLY = 0,
    // Use of the float type goes beyond VK_KHR_16bit_storage.
    FLOAT_ARITHMETIC
};

enum FloatStatementUsageBits
{
    B_STATEMENT_USAGE_ARGS_CONST_FLOAT     = (1 << 0),
    B_STATEMENT_USAGE_ARGS_CONST_FP16      = (1 << 1),
    B_STATEMENT_USAGE_ARGS_CONST_FP32      = (1 << 2),
    B_STATEMENT_USAGE_ARGS_CONST_FP64      = (1 << 3),
    B_STATEMENT_USAGE_TYPES_TYPE_FLOAT     = (1 << 4),
    B_STATEMENT_USAGE_TYPES_TYPE_FP16      = (1 << 5),
    B_STATEMENT_USAGE_TYPES_TYPE_FP32      = (1 << 6),
    B_STATEMENT_USAGE_TYPES_TYPE_FP64      = (1 << 7),
    B_STATEMENT_USAGE_CONSTS_TYPE_FLOAT    = (1 << 8),
    B_STATEMENT_USAGE_CONSTS_TYPE_FP16     = (1 << 9),
    B_STATEMENT_USAGE_CONSTS_TYPE_FP32     = (1 << 10),
    B_STATEMENT_USAGE_CONSTS_TYPE_FP64     = (1 << 11),
    B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT = (1 << 12),
    B_STATEMENT_USAGE_COMMANDS_CONST_FP16  = (1 << 13),
    B_STATEMENT_USAGE_COMMANDS_CONST_FP32  = (1 << 14),
    B_STATEMENT_USAGE_COMMANDS_CONST_FP64  = (1 << 15),
    B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT  = (1 << 16),
    B_STATEMENT_USAGE_COMMANDS_TYPE_FP16   = (1 << 17),
    B_STATEMENT_USAGE_COMMANDS_TYPE_FP32   = (1 << 18),
    B_STATEMENT_USAGE_COMMANDS_TYPE_FP64   = (1 << 19),
};

typedef uint32_t FloatStatementUsageFlags;

// Enum containing float behaviors that its possible to test.
enum BehaviorFlagBits
{
    B_DENORM_PRESERVE = 0x00000001, // DenormPreserve
    B_DENORM_FLUSH    = 0x00000002, // DenormFlushToZero
    B_ZIN_PRESERVE    = 0x00000004, // SignedZeroInfNanPreserve
    B_RTE_ROUNDING    = 0x00000008, // RoundingModeRTE
    B_RTZ_ROUNDING    = 0x00000010  // RoundingModeRTZ
};

typedef uint32_t BehaviorFlags;

// Codes for all float values used in tests as arguments and operation results
// This approach allows to replace values with different types reducing complexity of the tests implementation
enum ValueId
{
    // common values used as both arguments and results
    V_UNUSED = 0, // used to mark arguments that are not used in operation
    V_MINUS_INF,  //    or results of tests cases that should be skipped
    V_MINUS_ONE,  // -1.0
    V_MINUS_ZERO, // -0.0
    V_ZERO,       //  0.0
    V_HALF,       //  0.5
    V_ONE,        //  1.0
    V_INF,
    V_DENORM,
    V_NAN,

    // arguments for rounding mode tests - used only when arguments are passed from input
    V_ADD_ARG_A,
    V_ADD_ARG_B,
    V_SUB_ARG_A,
    V_SUB_ARG_B,
    V_MUL_ARG_A,
    V_MUL_ARG_B,
    V_DOT_ARG_A,
    V_DOT_ARG_B,

    // arguments of conversion operations - used only when arguments are passed from input
    // Subcases are:
    //    ...UP: rounds away from zero, e.g. trailing bits are 101..
    //    ...DOWN: rounds toward zero, e.g. trailing bits are 011..
    //    ...TIE_UP: rounds up to even, e.g. preserved bit is 1, trailing are 10*
    //    ...TIE_DOWN: rounds up to even, e.g. preserved bit is 0, trailing are 10*
    V_CONV_FROM_FP32_TO_FP16_UP_ARG,
    V_CONV_FROM_FP32_TO_FP16_DOWN_ARG,
    V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG,
    V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG,
    V_CONV_FROM_FP64_TO_FP16_UP_ARG,
    V_CONV_FROM_FP64_TO_FP16_DOWN_ARG,
    V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG,
    V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG,
    V_CONV_FROM_FP64_TO_FP32_UP_ARG,
    V_CONV_FROM_FP64_TO_FP32_DOWN_ARG,
    V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG,
    V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG,

    // arguments of integer conversion rounding, not all values can be represented by all integer sizes
    // and only those that can will be used for testing
    // Subcases are:
    //    ...UP: rounds away from zero, e.g. integer's value is closer to higher float value even
    //    ...DOWN: rounds towards zero, e.g. integer's value is closer to lower float value even
    //    ...TIE: rounds towards zero, e.g. integer's value is equidistant to lower and higher float value
    // 16 bit values can only use width-conversions -> No rounding testing
    V_CONV_FROM_UINT_TO_FP32_UP_ARG,
    V_CONV_FROM_UINT_TO_FP32_DOWN_ARG,
    V_CONV_FROM_UINT_TO_FP32_TIE_ARG,
    V_CONV_FROM_UINT_TO_FP64_UP_ARG,
    V_CONV_FROM_UINT_TO_FP64_DOWN_ARG,
    V_CONV_FROM_UINT_TO_FP64_TIE_ARG,

    // Same as UINT but will only test with negative values
    V_CONV_FROM_INT_TO_FP32_UP_ARG,
    V_CONV_FROM_INT_TO_FP32_DOWN_ARG,
    V_CONV_FROM_INT_TO_FP32_TIE_ARG,
    V_CONV_FROM_INT_TO_FP64_UP_ARG,
    V_CONV_FROM_INT_TO_FP64_DOWN_ARG,
    V_CONV_FROM_INT_TO_FP64_TIE_ARG,

    // arguments of rounding operations
    V_ADD_RTZ_RESULT,
    V_ADD_RTE_RESULT,
    V_SUB_RTZ_RESULT,
    V_SUB_RTE_RESULT,
    V_MUL_RTZ_RESULT,
    V_MUL_RTE_RESULT,
    V_DOT_RTZ_RESULT,
    V_DOT_RTE_RESULT,

    // non comon results of some operation - corner cases
    V_ZERO_OR_DENORM_TIMES_TWO, // fp16 addition of non-flushed denorm with itself (or equivalent dot-product or vector-matrix multiply)
    V_MINUS_ONE_OR_CLOSE, // value used only for fp16 subtraction result of preserved denorm and one
    V_PI_DIV_2,
    V_ZERO_OR_MINUS_ZERO,          // both +0 and -0 are accepted
    V_ZERO_OR_ONE,                 // both +0 and 1 are accepted
    V_ZERO_OR_FP16_DENORM_TO_FP32, // both 0 and fp32 representation of fp16 denorm are accepted
    V_ZERO_OR_FP16_DENORM_TO_FP64,
    V_ZERO_OR_FP32_DENORM_TO_FP64,
    V_DENORM_TIMES_TWO,
    V_DEGREES_DENORM,
    V_TRIG_ONE, // 1.0 trigonometric operations, including precision margin
    V_MINUS_INF_OR_LOG_DENORM,
    V_MINUS_INF_OR_LOG2_DENORM,
    V_ZERO_OR_SQRT_DENORM,
    V_INF_OR_INV_SQRT_DENORM,

    // Results of conversion operations: RTZ
    V_CONV_FROM_FP32_TO_FP16_UP_RTZ_RESULT,
    V_CONV_FROM_FP32_TO_FP16_DOWN_RTZ_RESULT,
    V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTZ_RESULT,
    V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP16_UP_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP16_DOWN_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP32_UP_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP32_DOWN_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTZ_RESULT,
    V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTZ_RESULT,
    // Results of conversion operations: RTE
    V_CONV_FROM_FP32_TO_FP16_UP_RTE_RESULT,
    V_CONV_FROM_FP32_TO_FP16_DOWN_RTE_RESULT,
    V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTE_RESULT,
    V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP16_UP_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP16_DOWN_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP32_UP_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP32_DOWN_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTE_RESULT,
    V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTE_RESULT,

    // Results of conversion operations: RTZ
    // 16 bit values can only use width-conversions -> No rounding testing
    V_CONV_FROM_UINT32_UP_RTZ_RESULT,
    V_CONV_FROM_UINT32_DOWN_RTZ_RESULT,
    V_CONV_FROM_UINT32_TIE_RTZ_RESULT,
    V_CONV_FROM_UINT64_UP_RTZ_RESULT,
    V_CONV_FROM_UINT64_DOWN_RTZ_RESULT,
    V_CONV_FROM_UINT64_TIE_RTZ_RESULT,
    // Results of conversion operations: RTE
    // 16 bit values can only use width-conversions -> No rounding testing
    V_CONV_FROM_UINT32_UP_RTE_RESULT,
    V_CONV_FROM_UINT32_DOWN_RTE_RESULT,
    V_CONV_FROM_UINT32_TIE_RTE_RESULT,
    V_CONV_FROM_UINT64_UP_RTE_RESULT,
    V_CONV_FROM_UINT64_DOWN_RTE_RESULT,
    V_CONV_FROM_UINT64_TIE_RTE_RESULT,

    // Same as UINT but will only test with negative values
    // Results of conversion operations: RTZ
    V_CONV_FROM_INT32_UP_RTZ_RESULT,
    V_CONV_FROM_INT32_DOWN_RTZ_RESULT,
    V_CONV_FROM_INT32_TIE_RTZ_RESULT,
    V_CONV_FROM_INT64_UP_RTZ_RESULT,
    V_CONV_FROM_INT64_DOWN_RTZ_RESULT,
    V_CONV_FROM_INT64_TIE_RTZ_RESULT,
    // Results of conversion operations: RTE
    V_CONV_FROM_INT32_UP_RTE_RESULT,
    V_CONV_FROM_INT32_DOWN_RTE_RESULT,
    V_CONV_FROM_INT32_TIE_RTE_RESULT,
    V_CONV_FROM_INT64_UP_RTE_RESULT,
    V_CONV_FROM_INT64_DOWN_RTE_RESULT,
    V_CONV_FROM_INT64_TIE_RTE_RESULT,

    V_CONV_DENORM_SMALLER, // used e.g. when converting fp16 denorm to fp32
    V_CONV_DENORM_BIGGER,
};

// Enum containing all tested operations. Operations are defined in generic way so that
// they can be used to generate tests operating on arguments with different values of
// specified float type.
enum OperationId
{
    // spir-v unary operations
    OID_NEGATE = 0,
    OID_COMPOSITE,
    OID_COMPOSITE_INS,
    OID_COPY,
    OID_D_EXTRACT,
    OID_D_INSERT,
    OID_SHUFFLE,
    OID_TRANSPOSE,
    OID_CONV_FROM_UINT_TO_FP32,
    OID_CONV_FROM_UINT_TO_FP64,
    OID_CONV_FROM_INT_TO_FP32,
    OID_CONV_FROM_INT_TO_FP64,
    // No SCONST_CONV_FROM_UINT since it requires Kernel Capability and Vulkan does not expose it
    OID_CONV_FROM_FP16,
    OID_CONV_FROM_FP32,
    OID_CONV_FROM_FP64,
    OID_SCONST_CONV_FROM_FP32_TO_FP16_UP,       // Round::UP case
    OID_SCONST_CONV_FROM_FP32_TO_FP16_DOWN,     // Round::DOWN case
    OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_UP,   // Round::TIE_DOWN case
    OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_DOWN, // Round::TIE_DOWN case
    OID_SCONST_CONV_FROM_FP64_TO_FP32_UP,
    OID_SCONST_CONV_FROM_FP64_TO_FP32_DOWN,
    OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_UP,
    OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_DOWN,
    OID_SCONST_CONV_FROM_FP64_TO_FP16_UP,
    OID_SCONST_CONV_FROM_FP64_TO_FP16_DOWN,
    OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_UP,
    OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_DOWN,
    OID_RETURN_VAL,

    // spir-v binary operations
    OID_ADD,
    OID_SUB,
    OID_MUL,
    OID_DIV,
    OID_REM,
    OID_MOD,
    OID_PHI,
    OID_SELECT,
    OID_DOT,
    OID_VEC_MUL_S,
    OID_VEC_MUL_M,
    OID_MAT_MUL_S,
    OID_MAT_MUL_V,
    OID_MAT_MUL_M,
    OID_OUT_PROD,
    OID_ORD_EQ,
    OID_UORD_EQ,
    OID_ORD_NEQ,
    OID_UORD_NEQ,
    OID_ORD_LS,
    OID_UORD_LS,
    OID_ORD_GT,
    OID_UORD_GT,
    OID_ORD_LE,
    OID_UORD_LE,
    OID_ORD_GE,
    OID_UORD_GE,

    // glsl unary operations
    OID_ROUND,
    OID_ROUND_EV,
    OID_TRUNC,
    OID_ABS,
    OID_SIGN,
    OID_FLOOR,
    OID_CEIL,
    OID_FRACT,
    OID_RADIANS,
    OID_DEGREES,
    OID_SIN,
    OID_COS,
    OID_TAN,
    OID_ASIN,
    OID_ACOS,
    OID_ATAN,
    OID_SINH,
    OID_COSH,
    OID_TANH,
    OID_ASINH,
    OID_ACOSH,
    OID_ATANH,
    OID_EXP,
    OID_LOG,
    OID_EXP2,
    OID_LOG2,
    OID_SQRT,
    OID_INV_SQRT,
    OID_MODF,
    OID_MODF_ST,
    OID_FREXP,
    OID_FREXP_ST,
    OID_LENGTH,
    OID_NORMALIZE,
    OID_REFLECT,
    OID_REFRACT,
    OID_MAT_DET,
    OID_MAT_INV,
    OID_PH_DENORM, // PackHalf2x16
    OID_UPH_DENORM,
    OID_PD_DENORM, // PackDouble2x32
    OID_UPD_DENORM_FLUSH,
    OID_UPD_DENORM_PRESERVE,

    // glsl binary operations
    OID_ATAN2,
    OID_POW,
    OID_MIX,
    OID_FMA,
    OID_MIN,
    OID_MAX,
    OID_CLAMP,
    OID_STEP,
    OID_SSTEP,
    OID_DIST,
    OID_CROSS,
    OID_FACE_FWD,
    OID_NMIN,
    OID_NMAX,
    OID_NCLAMP,

    OID_ORTE_ROUND,
    OID_ORTZ_ROUND
};

// Structures storing data required to test DenormPreserve and DenormFlushToZero modes.
// Operations are separated into binary and unary lists because binary operations can be tested with
// two attributes and thus denorms can be tested in combination with value, denorm, inf and nan.
// Unary operations are only tested with denorms.
struct BinaryCase
{
    OperationId operationId;
    ValueId opVarResult;
    ValueId opDenormResult;
    ValueId opInfResult;
    ValueId opNanResult;
};
struct UnaryCase
{
    OperationId operationId;
    ValueId result;
};

// Function replacing all occurrences of substring with string passed in last parameter.
string replace(string str, const string &from, const string &to)
{
    // to keep spir-v code clean and easier to read parts of it are processed
    // with this method instead of StringTemplate; main usage of this method is the
    // replacement of "float_" with "f16_", "f32_" or "f64_" depending on test case

    size_t start_pos = 0;
    while ((start_pos = str.find(from, start_pos)) != std::string::npos)
    {
        str.replace(start_pos, from.length(), to);
        start_pos += to.length();
    }
    return str;
}

// Structure used to perform bits conversion int type <-> float type.
template <typename FLOAT_TYPE, typename UINT_TYPE>
struct RawConvert
{
    union Value
    {
        FLOAT_TYPE fp;
        UINT_TYPE ui;
    };
};

// Traits used to get int type that can store equivalent float type.
template <typename FLOAT_TYPE>
struct GetCoresponding
{
    typedef uint16_t uint_type;
};
template <>
struct GetCoresponding<float>
{
    typedef uint32_t uint_type;
};
template <>
struct GetCoresponding<double>
{
    typedef uint64_t uint_type;
};

// All values used for arguments and operation results are stored in single map.
// Each float type (fp16, fp32, fp64) has its own map that is used during
// test setup and during verification. TypeValuesBase is interface to that map.
class TypeValuesBase
{
public:
    TypeValuesBase();
    virtual ~TypeValuesBase() = default;

    virtual BufferSp constructInputBuffer(const ValueId *twoArguments) const                                     = 0;
    virtual BufferSp constructOutputBuffer(ValueId result) const                                                 = 0;
    virtual void fillInputData(const ValueId *twoArguments, vector<uint8_t> &bufferData, uint32_t &offset) const = 0;
};

TypeValuesBase::TypeValuesBase()
{
}

typedef de::SharedPtr<TypeValuesBase> TypeValuesSP;

template <typename FLOAT_TYPE>
class TypeValues : public TypeValuesBase
{
public:
    TypeValues();

    BufferSp constructInputBuffer(const ValueId *twoArguments) const override;
    BufferSp constructOutputBuffer(ValueId result) const override;
    void fillInputData(const ValueId *twoArguments, vector<uint8_t> &bufferData, uint32_t &offset) const override;

    FLOAT_TYPE getValue(ValueId id) const;

    template <typename UINT_TYPE>
    FLOAT_TYPE exactByteEquivalent(UINT_TYPE byteValue) const;

private:
    typedef map<ValueId, FLOAT_TYPE> ValueMap;
    ValueMap m_valueIdToVariableType;
};

template <typename FLOAT_TYPE>
BufferSp TypeValues<FLOAT_TYPE>::constructInputBuffer(const ValueId *twoArguments) const
{
    std::vector<FLOAT_TYPE> inputData(2);
    inputData[0] = m_valueIdToVariableType.at(twoArguments[0]);
    inputData[1] = m_valueIdToVariableType.at(twoArguments[1]);
    return BufferSp(new Buffer<FLOAT_TYPE>(inputData));
}

template <typename FLOAT_TYPE>
BufferSp TypeValues<FLOAT_TYPE>::constructOutputBuffer(ValueId result) const
{
    // note: we are not doing maping here, ValueId is directly saved in
    // float type in order to be able to retireve it during verification

    typedef typename GetCoresponding<FLOAT_TYPE>::uint_type uint_t;
    uint_t value = static_cast<uint_t>(result);

    // For FP16 we increase the buffer size to hold an unsigned integer, as
    // we can be in the no 16bit_storage case.
    const uint_t outputSize = sizeof(FLOAT_TYPE) == 2u ? 2u : 1u;
    std::vector<FLOAT_TYPE> outputData(outputSize, exactByteEquivalent<uint_t>(value));
    return BufferSp(new Buffer<FLOAT_TYPE>(outputData));
}

template <typename FLOAT_TYPE>
void TypeValues<FLOAT_TYPE>::fillInputData(const ValueId *twoArguments, vector<uint8_t> &bufferData,
                                           uint32_t &offset) const
{
    uint32_t typeSize = sizeof(FLOAT_TYPE);

    FLOAT_TYPE argA = getValue(twoArguments[0]);
    deMemcpy(&bufferData[offset], &argA, typeSize);
    offset += typeSize;

    FLOAT_TYPE argB = getValue(twoArguments[1]);
    deMemcpy(&bufferData[offset], &argB, typeSize);
    offset += typeSize;
}

template <typename FLOAT_TYPE>
FLOAT_TYPE TypeValues<FLOAT_TYPE>::getValue(ValueId id) const
{
    return m_valueIdToVariableType.at(id);
}

template <typename FLOAT_TYPE>
template <typename UINT_TYPE>
FLOAT_TYPE TypeValues<FLOAT_TYPE>::exactByteEquivalent(UINT_TYPE byteValue) const
{
    typename RawConvert<FLOAT_TYPE, UINT_TYPE>::Value value;
    value.ui = byteValue;
    return value.fp;
}

// For floating point conversions, rounding modes only matter when
// doing a narrowing conversion, i.e. from more mantissa bits
// to fewer.
//
// There are four rounding cases, depending on the value of the
// least significant mantissa bit that is preserved, and the
// mantissa bits that are eliminated:
//
// Least significant  | Eliminated bit     |  Produces which
// retained bit       | string             |  Rounding Case
// -------------------|--------------------|-----------------
//   don't care       | 0y, y is anything  |  DOWN: Round toward zero
//   don't care       | 1y, y is non-zero  |  UP: Round away from zero
//   0                | 1y, y is zero      |  TIE_DOWN: Round toward zero
//   1                | 1y, y is zero      |  TIE_UP: Round away from zero
enum class Round
{
    DOWN,
    UP,
    TIE_DOWN,
    TIE_UP
};

template <typename FROM_FLOAT_TYPE, typename TO_FLOAT_TYPE>
struct conversionDetail
{
    typedef typename FROM_FLOAT_TYPE::StorageType FromInt;
    typedef typename TO_FLOAT_TYPE::StorageType ToInt;

    // How many bits will be removed from the mantissa by the conversion?
    static const int excessWidth = FROM_FLOAT_TYPE::MANTISSA_BITS - TO_FLOAT_TYPE::MANTISSA_BITS;

    // 'tie' contains the bits for the "1y, y is 0" case in RoundCase table.
    // All the positions in tie32 will be thrown away, but help determine
    // the rounding direction.
    static const FromInt tie         = ((FromInt)1) << (excessWidth - 1);
    static const FromInt down        = tie - 1;          // bits to trigger down case
    static const FromInt up          = tie + 1;          // bits to trigger up case
    static const FromInt tieDown     = tie;              // bits to trigger tie-down case
    static const FromInt tieUp       = (tie << 1) | tie; // bits to trigger tie-up case
    static const int exampleSign     = 1;                // Could be -1
    static const int exampleExponent = TO_FLOAT_TYPE::EXPONENT_BIAS;

    // Not all platforms will support 16 or 64 bit values. We need to detect those cases
    // and make the tests pass through since we cannot validate them.
    static bool hasExcessBits(void)
    {
        return 0 < excessWidth;
    }

    // Returns arbitrary but nontrivial bits for the mantissa of the conversion
    // result. This has TO_FLOAT_TYPE::MANTISSA_BITS. The bottom bit must be
    // zero so it can be filled in later.
    static ToInt exampleMSBBits(void)
    {
        switch (int(TO_FLOAT_TYPE::MANTISSA_BITS))
        {
        case 10: // Float16
            // The Mantissa has 10 explicitly represented bits, and 1 bit
            // that is normally hidden, but required here.
            // The upper 9 are arbitrary, and the bottom bit is 0, to be filled
            // in later.
            return static_cast<ToInt>((1 << 10) | 0x39a);
        case 23: // Float32
            // The Mantissa has 23 explicitly represented bits, and 1 bit
            // that is normally hidden, but required here.
            // The upper 22 are arbitrary, and the bottom bit is 0, to be filled
            // in later.
            return static_cast<ToInt>((1 << 23) | 0x3a5a5a);
        }
        DE_ASSERT(false && "Expected Float16 or Float32");
        return 0;
    }

    static FromInt inputMantissa(Round r)
    {
        const FromInt base = static_cast<FromInt>(exampleMSBBits()) << excessWidth;
        switch (r)
        {
        case Round::DOWN:
            return base | down;
        case Round::UP:
            return base | up;
        case Round::TIE_DOWN:
            return base | tieDown;
        case Round::TIE_UP:
            return base | tieUp;
        }
        DE_ASSERT(false);
        return 0; // Unreachable
    }

    static ToInt outputMantissa(FromInt mantissa, Round r)
    {
        const ToInt base = static_cast<ToInt>(mantissa >> excessWidth);
        switch (r)
        {
        case Round::DOWN:
        case Round::TIE_DOWN:
            return base;
        case Round::UP:
        case Round::TIE_UP:
            return static_cast<ToInt>(base + 1);
        }
        DE_ASSERT(false);
        return 0; // Unreachable
    }

    // Returns the value for the sample input, for an intended rounding outcome.
    static FROM_FLOAT_TYPE from(Round r)
    {
        return FROM_FLOAT_TYPE::construct(exampleSign, exampleExponent, inputMantissa(r));
    }

    // Returns the value of from(r) in string form as a sequence of 32 bit words.
    static std::string fromStr(Round r)
    {
        const FromInt value = from(r).bits();
        switch (sizeof(FromInt))
        {
        case 8:
            // Return low word first, high word second
            return to_string(value & 0xFFFFFFFFu) + " " + to_string(value >> 16 >> 16);
        case 4:
            return to_string(value);
        }
        DE_ASSERT(false);
        return "";
    }

    // Return the float value expected for a RTZ conversion.
    static TO_FLOAT_TYPE resultRTZ(Round r)
    {
        // Reconstruct the original input, then round toward zero.
        const ToInt mantissa = outputMantissa(inputMantissa(r), Round::DOWN);
        return TO_FLOAT_TYPE::construct(exampleSign, exampleExponent, mantissa);
    }
    // Return the bits for the float value expected for a RTZ conversion.
    static ToInt resultRTZBits(Round r)
    {
        return resultRTZ(r).bits();
    }
    // Return the float value expected for a RTE conversion.
    static TO_FLOAT_TYPE resultRTE(Round r)
    {
        // Reconstruct the original input, then round as specified.
        const ToInt mantissa = outputMantissa(inputMantissa(r), r);
        return TO_FLOAT_TYPE::construct(exampleSign, exampleExponent, mantissa);
    }
    // Return the bits for the float value expected for a RTE conversion.
    static ToInt resultRTEBits(Round r)
    {
        return resultRTE(r).bits();
    }
};

template <>
TypeValues<deFloat16>::TypeValues() : TypeValuesBase()
{
    // NOTE: when updating entries in m_valueIdToVariableType make sure to
    // update also valueIdToSnippetArgMap defined in updateSpirvSnippets()
    ValueMap &vm     = m_valueIdToVariableType;
    vm[V_UNUSED]     = deFloat32To16(0.0f);
    vm[V_MINUS_INF]  = 0xfc00;
    vm[V_MINUS_ONE]  = deFloat32To16(-1.0f);
    vm[V_MINUS_ZERO] = 0x8000;
    vm[V_ZERO]       = 0x0000;
    vm[V_HALF]       = deFloat32To16(0.5f);
    vm[V_ONE]        = deFloat32To16(1.0f);
    vm[V_INF]        = 0x7c00;
    vm[V_DENORM]     = 0x03f0; // this value should be the same as the result of denormBase - epsilon
    vm[V_NAN]        = 0x7cf0;

    vm[V_PI_DIV_2]         = deFloat32To16((float)M_PI_2);
    vm[V_DENORM_TIMES_TWO] = 0x07e0;
    vm[V_DEGREES_DENORM]   = 0x1b0c;

    vm[V_ADD_ARG_A] = 0x3c03;
    vm[V_ADD_ARG_B] = vm[V_ONE];
    vm[V_SUB_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_SUB_ARG_B] = 0x4203;
    vm[V_MUL_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_MUL_ARG_B] = 0x1900;
    vm[V_DOT_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_DOT_ARG_B] = vm[V_MUL_ARG_B];

    // Float16 is not the source type for a narrowing conversion, so these
    // entries are unused.
    vm[V_CONV_FROM_FP32_TO_FP16_UP_ARG]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_ARG]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_ARG]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_ARG]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_ARG]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_ARG]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG] = vm[V_UNUSED];

    // 16 values can only be used for width-conversions
    vm[V_CONV_FROM_UINT_TO_FP32_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT_TO_FP32_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT_TO_FP32_TIE_ARG]  = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT_TO_FP64_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT_TO_FP64_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT_TO_FP64_TIE_ARG]  = vm[V_UNUSED];

    vm[V_CONV_FROM_INT_TO_FP32_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT_TO_FP32_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT_TO_FP32_TIE_ARG]  = vm[V_UNUSED];
    vm[V_CONV_FROM_INT_TO_FP64_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT_TO_FP64_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT_TO_FP64_TIE_ARG]  = vm[V_UNUSED];

    vm[V_ADD_RTZ_RESULT] = 0x4001; // deFloat16Add(vm[V_ADD_ARG_A], vm[V_ADD_ARG_B], rtz)
    vm[V_SUB_RTZ_RESULT] = 0xc001; // deFloat16Sub(vm[V_SUB_ARG_A], vm[V_SUB_ARG_B], rtz)
    vm[V_MUL_RTZ_RESULT] = 0x1903; // deFloat16Mul(vm[V_MUL_ARG_A], vm[V_MUL_ARG_B], rtz)
    vm[V_DOT_RTZ_RESULT] = 0x1d03;

    vm[V_ADD_RTE_RESULT] = 0x4002; // deFloat16Add(vm[V_ADD_ARG_A], vm[V_ADD_ARG_B], rte)
    vm[V_SUB_RTE_RESULT] = 0xc002; // deFloat16Sub(vm[V_SUB_ARG_A], vm[V_SUB_ARG_B], rte)
    vm[V_MUL_RTE_RESULT] = 0x1904; // deFloat16Mul(vm[V_MUL_ARG_A], vm[V_MUL_ARG_B], rte)
    vm[V_DOT_RTE_RESULT] = 0x1d04;

    typedef conversionDetail<Float32, Float16> from32;
    typedef conversionDetail<Float64, Float16> from64;
    vm[V_CONV_FROM_FP32_TO_FP16_UP_RTZ_RESULT] =
        from32::hasExcessBits() ? from32::resultRTZBits(Round::UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_RTZ_RESULT] =
        from32::hasExcessBits() ? from32::resultRTZBits(Round::DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTZ_RESULT] =
        from32::hasExcessBits() ? from32::resultRTZBits(Round::TIE_UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTZ_RESULT] =
        from32::hasExcessBits() ? from32::resultRTZBits(Round::TIE_DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZBits(Round::UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZBits(Round::DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZBits(Round::TIE_UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZBits(Round::TIE_DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_RTZ_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_RTZ_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTZ_RESULT] = vm[V_UNUSED];

    vm[V_CONV_FROM_FP32_TO_FP16_UP_RTE_RESULT] =
        from32::hasExcessBits() ? from32::resultRTEBits(Round::UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_RTE_RESULT] =
        from32::hasExcessBits() ? from32::resultRTEBits(Round::DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTE_RESULT] =
        from32::hasExcessBits() ? from32::resultRTEBits(Round::TIE_UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTE_RESULT] =
        from32::hasExcessBits() ? from32::resultRTEBits(Round::TIE_DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTEBits(Round::UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTEBits(Round::DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTEBits(Round::TIE_UP) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTEBits(Round::TIE_DOWN) : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_RTE_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_RTE_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTE_RESULT] = vm[V_UNUSED];

    // 16 values can only be used for width-conversions
    vm[V_CONV_FROM_UINT32_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_TIE_RTZ_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_TIE_RTZ_RESULT]  = vm[V_UNUSED];

    vm[V_CONV_FROM_UINT32_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_TIE_RTE_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_TIE_RTE_RESULT]  = vm[V_UNUSED];

    vm[V_CONV_FROM_INT32_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_TIE_RTZ_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_TIE_RTZ_RESULT]  = vm[V_UNUSED];

    vm[V_CONV_FROM_INT32_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_TIE_RTE_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_TIE_RTE_RESULT]  = vm[V_UNUSED];

    // there is no precision to store fp32 denorm nor fp64 denorm
    vm[V_CONV_DENORM_SMALLER] = vm[V_ZERO];
    vm[V_CONV_DENORM_BIGGER]  = vm[V_ZERO];
}

template <>
TypeValues<float>::TypeValues() : TypeValuesBase()
{
    // NOTE: when updating entries in m_valueIdToVariableType make sure to
    // update also valueIdToSnippetArgMap defined in updateSpirvSnippets()
    ValueMap &vm     = m_valueIdToVariableType;
    vm[V_UNUSED]     = 0.0f;
    vm[V_MINUS_INF]  = -std::numeric_limits<float>::infinity();
    vm[V_MINUS_ONE]  = -1.0f;
    vm[V_MINUS_ZERO] = -0.0f;
    vm[V_ZERO]       = 0.0f;
    vm[V_HALF]       = 0.5f;
    vm[V_ONE]        = 1.0f;
    vm[V_INF]        = std::numeric_limits<float>::infinity();
    vm[V_DENORM]     = static_cast<float>(1.413e-42); // 0x000003f0
    vm[V_NAN]        = std::numeric_limits<float>::quiet_NaN();

    vm[V_PI_DIV_2]         = static_cast<float>(M_PI_2);
    vm[V_DENORM_TIMES_TWO] = vm[V_DENORM] + vm[V_DENORM];
    vm[V_DEGREES_DENORM]   = deFloatDegrees(vm[V_DENORM]);

    float e         = std::numeric_limits<float>::epsilon();
    vm[V_ADD_ARG_A] = 1.0f + 3 * e;
    vm[V_ADD_ARG_B] = 1.0f;
    vm[V_SUB_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_SUB_ARG_B] = 3.0f + 6 * e;
    vm[V_MUL_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_MUL_ARG_B] = 5 * e;
    vm[V_DOT_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_DOT_ARG_B] = 5 * e;

    // Float32 is the source of a narrowing conversionsto Float16.
    typedef conversionDetail<Float32, Float16> from32;
    vm[V_CONV_FROM_FP32_TO_FP16_UP_ARG] = from32::hasExcessBits() ? from32::from(Round::UP).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_ARG] =
        from32::hasExcessBits() ? from32::from(Round::DOWN).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG] =
        from32::hasExcessBits() ? from32::from(Round::TIE_UP).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG] =
        from32::hasExcessBits() ? from32::from(Round::TIE_DOWN).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_ARG]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_ARG]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_ARG]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_ARG]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG] = vm[V_UNUSED];

    vm[V_CONV_FROM_UINT_TO_FP32_UP_ARG]   = exactByteEquivalent(0x02000003); // 33554435
    vm[V_CONV_FROM_UINT_TO_FP32_DOWN_ARG] = exactByteEquivalent(0x02000001); // 33554433
    vm[V_CONV_FROM_UINT_TO_FP32_TIE_ARG]  = exactByteEquivalent(0x02000002); // 33554434
    vm[V_CONV_FROM_UINT_TO_FP64_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT_TO_FP64_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT_TO_FP64_TIE_ARG]  = vm[V_UNUSED];

    vm[V_CONV_FROM_INT_TO_FP32_UP_ARG]   = exactByteEquivalent(0xfdfffffd); // -33554435
    vm[V_CONV_FROM_INT_TO_FP32_DOWN_ARG] = exactByteEquivalent(0xfdffffff); // -33554433
    vm[V_CONV_FROM_INT_TO_FP32_TIE_ARG]  = exactByteEquivalent(0xfdfffffe); // -33554434
    vm[V_CONV_FROM_INT_TO_FP64_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT_TO_FP64_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT_TO_FP64_TIE_ARG]  = vm[V_UNUSED];

    int prevRound = fegetround();
    fesetround(FE_TOWARDZERO);
    vm[V_ADD_RTZ_RESULT] = vm[V_ADD_ARG_A] + vm[V_ADD_ARG_B];
    vm[V_SUB_RTZ_RESULT] = vm[V_SUB_ARG_A] - vm[V_SUB_ARG_B];
    vm[V_MUL_RTZ_RESULT] = vm[V_MUL_ARG_A] * vm[V_MUL_ARG_B];
    vm[V_DOT_RTZ_RESULT] = vm[V_MUL_RTZ_RESULT] + vm[V_MUL_RTZ_RESULT];

    fesetround(FE_TONEAREST);
    vm[V_ADD_RTE_RESULT] = vm[V_ADD_ARG_A] + vm[V_ADD_ARG_B];
    vm[V_SUB_RTE_RESULT] = vm[V_SUB_ARG_A] - vm[V_SUB_ARG_B];
    vm[V_MUL_RTE_RESULT] = vm[V_MUL_ARG_A] * vm[V_MUL_ARG_B];
    vm[V_DOT_RTE_RESULT] = vm[V_MUL_RTE_RESULT] + vm[V_MUL_RTE_RESULT];
    fesetround(prevRound);

    typedef conversionDetail<Float64, Float32> from64;
    vm[V_CONV_FROM_FP32_TO_FP16_UP_RTZ_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_RTZ_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_RTZ_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_RTZ_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZ(Round::UP).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZ(Round::DOWN).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZ(Round::TIE_UP).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTZ_RESULT] =
        from64::hasExcessBits() ? from64::resultRTZ(Round::TIE_DOWN).asFloat() : vm[V_UNUSED];

    vm[V_CONV_FROM_FP32_TO_FP16_UP_RTE_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_RTE_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_RTE_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_RTE_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTE(Round::UP).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTE(Round::DOWN).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTE(Round::TIE_UP).asFloat() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTE_RESULT] =
        from64::hasExcessBits() ? from64::resultRTE(Round::TIE_DOWN).asFloat() : vm[V_UNUSED];

    vm[V_CONV_FROM_UINT32_UP_RTZ_RESULT]   = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT32_DOWN_RTZ_RESULT] = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT32_TIE_RTZ_RESULT]  = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT64_UP_RTZ_RESULT]   = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT64_DOWN_RTZ_RESULT] = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT64_TIE_RTZ_RESULT]  = exactByteEquivalent(0x4c000000); // 33554432.0

    vm[V_CONV_FROM_UINT32_UP_RTE_RESULT]   = exactByteEquivalent(0x4c000001); // 33554434.0
    vm[V_CONV_FROM_UINT32_DOWN_RTE_RESULT] = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT32_TIE_RTE_RESULT]  = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT64_UP_RTE_RESULT]   = exactByteEquivalent(0x4c000001); // 33554434.0
    vm[V_CONV_FROM_UINT64_DOWN_RTE_RESULT] = exactByteEquivalent(0x4c000000); // 33554432.0
    vm[V_CONV_FROM_UINT64_TIE_RTE_RESULT]  = exactByteEquivalent(0x4c000000); // 33554432.0

    vm[V_CONV_FROM_INT32_UP_RTZ_RESULT]   = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT32_DOWN_RTZ_RESULT] = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT32_TIE_RTZ_RESULT]  = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT64_UP_RTZ_RESULT]   = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT64_DOWN_RTZ_RESULT] = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT64_TIE_RTZ_RESULT]  = exactByteEquivalent(0xcc000000); // -33554432.0

    vm[V_CONV_FROM_INT32_UP_RTE_RESULT]   = exactByteEquivalent(0xcc000001); // -33554434.0
    vm[V_CONV_FROM_INT32_DOWN_RTE_RESULT] = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT32_TIE_RTE_RESULT]  = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT64_UP_RTE_RESULT]   = exactByteEquivalent(0xcc000001); // -33554434.0
    vm[V_CONV_FROM_INT64_DOWN_RTE_RESULT] = exactByteEquivalent(0xcc000000); // -33554432.0
    vm[V_CONV_FROM_INT64_TIE_RTE_RESULT]  = exactByteEquivalent(0xcc000000); // -33554432.0

    // there is no precision to store fp64 denorm
    vm[V_CONV_DENORM_SMALLER] = exactByteEquivalent<uint32_t>(0x387c0000); // fp16 denorm
    vm[V_CONV_DENORM_BIGGER]  = vm[V_ZERO];
}

template <>
TypeValues<double>::TypeValues() : TypeValuesBase()
{
    // NOTE: when updating entries in m_valueIdToVariableType make sure to
    // update also valueIdToSnippetArgMap defined in updateSpirvSnippets()
    ValueMap &vm     = m_valueIdToVariableType;
    vm[V_UNUSED]     = 0.0;
    vm[V_MINUS_INF]  = -std::numeric_limits<double>::infinity();
    vm[V_MINUS_ONE]  = -1.0;
    vm[V_MINUS_ZERO] = -0.0;
    vm[V_ZERO]       = 0.0;
    vm[V_HALF]       = 0.5;
    vm[V_ONE]        = 1.0;
    vm[V_INF]        = std::numeric_limits<double>::infinity();
    vm[V_DENORM]     = 4.98e-321; // 0x00000000000003F0
    vm[V_NAN]        = std::numeric_limits<double>::quiet_NaN();

    vm[V_PI_DIV_2]         = M_PI_2;
    vm[V_DENORM_TIMES_TWO] = vm[V_DENORM] + vm[V_DENORM];
    vm[V_DEGREES_DENORM]   = vm[V_UNUSED];

    double e        = std::numeric_limits<double>::epsilon();
    vm[V_ADD_ARG_A] = 1.0 + 3 * e;
    vm[V_ADD_ARG_B] = 1.0;
    vm[V_SUB_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_SUB_ARG_B] = 3.0 + 6 * e;
    vm[V_MUL_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_MUL_ARG_B] = 5 * e;
    vm[V_DOT_ARG_A] = vm[V_ADD_ARG_A];
    vm[V_DOT_ARG_B] = 5 * e;

    // Float64 is the source of narrowing conversions to Float32 and Float16.
    typedef conversionDetail<Float64, Float16> to16;
    typedef conversionDetail<Float64, Float32> to32;
    vm[V_CONV_FROM_FP32_TO_FP16_UP_ARG]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_ARG]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_ARG]       = to16::hasExcessBits() ? to16::from(Round::UP).asDouble() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_ARG] = to16::hasExcessBits() ? to16::from(Round::DOWN).asDouble() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG] =
        to16::hasExcessBits() ? to16::from(Round::TIE_UP).asDouble() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG] =
        to16::hasExcessBits() ? to16::from(Round::TIE_DOWN).asDouble() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_ARG]   = to32::hasExcessBits() ? to32::from(Round::UP).asDouble() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_ARG] = to32::hasExcessBits() ? to32::from(Round::DOWN).asDouble() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG] =
        to32::hasExcessBits() ? to32::from(Round::TIE_UP).asDouble() : vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG] =
        to32::hasExcessBits() ? to32::from(Round::TIE_DOWN).asDouble() : vm[V_UNUSED];

    vm[V_CONV_FROM_UINT_TO_FP32_UP_ARG]   = exactByteEquivalent(static_cast<uint64_t>(0x0000000002000003)); // 33554435
    vm[V_CONV_FROM_UINT_TO_FP32_DOWN_ARG] = exactByteEquivalent(static_cast<uint64_t>(0x0000000002000001)); // 33554433
    vm[V_CONV_FROM_UINT_TO_FP32_TIE_ARG]  = exactByteEquivalent(static_cast<uint64_t>(0x0000000002000002)); // 33554434
    vm[V_CONV_FROM_UINT_TO_FP64_UP_ARG] =
        exactByteEquivalent(static_cast<uint64_t>(0x0040000000000003)); // 18014398509481987
    vm[V_CONV_FROM_UINT_TO_FP64_DOWN_ARG] =
        exactByteEquivalent(static_cast<uint64_t>(0x0040000000000001)); // 18014398509481985
    vm[V_CONV_FROM_UINT_TO_FP64_TIE_ARG] =
        exactByteEquivalent(static_cast<uint64_t>(0x0040000000000002)); // 18014398509481986

    vm[V_CONV_FROM_INT_TO_FP32_UP_ARG]   = exactByteEquivalent(static_cast<uint64_t>(0xfffffffffdfffffd)); // -33554435
    vm[V_CONV_FROM_INT_TO_FP32_DOWN_ARG] = exactByteEquivalent(static_cast<uint64_t>(0xfffffffffdffffff)); // -33554433
    vm[V_CONV_FROM_INT_TO_FP32_TIE_ARG]  = exactByteEquivalent(static_cast<uint64_t>(0xfffffffffdfffffe)); // -33554434
    vm[V_CONV_FROM_INT_TO_FP64_UP_ARG] =
        exactByteEquivalent(static_cast<uint64_t>(0xffbffffffffffffd)); // -18014398509481987
    vm[V_CONV_FROM_INT_TO_FP64_DOWN_ARG] =
        exactByteEquivalent(static_cast<uint64_t>(0xffbfffffffffffff)); // -18014398509481985
    vm[V_CONV_FROM_INT_TO_FP64_TIE_ARG] =
        exactByteEquivalent(static_cast<uint64_t>(0xffbffffffffffffe)); // -18014398509481986

    int prevRound = fegetround();
    fesetround(FE_TOWARDZERO);
    vm[V_ADD_RTZ_RESULT] = vm[V_ADD_ARG_A] + vm[V_ADD_ARG_B];
    vm[V_SUB_RTZ_RESULT] = vm[V_SUB_ARG_A] - vm[V_SUB_ARG_B];
    vm[V_MUL_RTZ_RESULT] = vm[V_MUL_ARG_A] * vm[V_MUL_ARG_B];
    vm[V_DOT_RTZ_RESULT] = vm[V_MUL_RTZ_RESULT] + vm[V_MUL_RTZ_RESULT];

    fesetround(FE_TONEAREST);
    vm[V_ADD_RTE_RESULT] = vm[V_ADD_ARG_A] + vm[V_ADD_ARG_B];
    vm[V_SUB_RTE_RESULT] = vm[V_SUB_ARG_A] - vm[V_SUB_ARG_B];
    vm[V_MUL_RTE_RESULT] = vm[V_MUL_ARG_A] * vm[V_MUL_ARG_B];
    vm[V_DOT_RTE_RESULT] = vm[V_MUL_RTE_RESULT] + vm[V_MUL_RTE_RESULT];
    fesetround(prevRound);

    // Float64 is not the destination of any narrowing conversions.
    vm[V_CONV_FROM_FP32_TO_FP16_UP_RTZ_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_RTZ_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_RTZ_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_RTZ_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_RTZ_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_RTZ_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTZ_RESULT] = vm[V_UNUSED];

    vm[V_CONV_FROM_FP32_TO_FP16_UP_RTE_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_DOWN_RTE_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_UP_RTE_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_DOWN_RTE_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_UP_RTE_RESULT]       = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_DOWN_RTE_RESULT]     = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTE_RESULT] = vm[V_UNUSED];

    vm[V_CONV_FROM_UINT32_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_TIE_RTZ_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_UP_RTZ_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0x4350000000000000)); // 18014398509481984.0
    vm[V_CONV_FROM_UINT64_DOWN_RTZ_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0x4350000000000000)); // 18014398509481984.0
    vm[V_CONV_FROM_UINT64_TIE_RTZ_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0x4350000000000000)); // 18014398509481984.0

    vm[V_CONV_FROM_UINT32_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT32_TIE_RTE_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_UINT64_UP_RTE_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0x4350000000000001)); // 18014398509481988.0
    vm[V_CONV_FROM_UINT64_DOWN_RTE_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0x4350000000000000)); // 18014398509481984.0
    vm[V_CONV_FROM_UINT64_TIE_RTE_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0x4350000000000000)); // 18014398509481984.0

    vm[V_CONV_FROM_INT32_UP_RTZ_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_DOWN_RTZ_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_TIE_RTZ_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_UP_RTZ_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0xc350000000000000)); // -18014398509481984.0
    vm[V_CONV_FROM_INT64_DOWN_RTZ_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0xc350000000000000)); // -18014398509481984.0
    vm[V_CONV_FROM_INT64_TIE_RTZ_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0xc350000000000000)); // -18014398509481984.0

    vm[V_CONV_FROM_INT32_UP_RTE_RESULT]   = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_DOWN_RTE_RESULT] = vm[V_UNUSED];
    vm[V_CONV_FROM_INT32_TIE_RTE_RESULT]  = vm[V_UNUSED];
    vm[V_CONV_FROM_INT64_UP_RTE_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0xc350000000000001)); // -18014398509481988.0
    vm[V_CONV_FROM_INT64_DOWN_RTE_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0xc350000000000000)); // -18014398509481984.0
    vm[V_CONV_FROM_INT64_TIE_RTE_RESULT] =
        exactByteEquivalent(static_cast<uint64_t>(0xc350000000000000)); // -18014398509481984.0

    vm[V_CONV_DENORM_SMALLER] = exactByteEquivalent<uint64_t>(0x3f0f800000000000); // 0x03f0 is fp16 denorm
    vm[V_CONV_DENORM_BIGGER]  = exactByteEquivalent<uint64_t>(0x373f800000000000); // 0x000003f0 is fp32 denorm
}

// Each type (fp16, fp32, fp64, uint16, uint32, uint64, int16, int32, int64)
// has specific set of SPIR-V snippets that was extracted to separate template
// specialization. Those snippets are used to compose final test shaders.
// With this approach parameterization can be done just once per type and reused
// for many tests.
class TypeSnippetsBase
{
public:
    TypeSnippetsBase(bool floatType, bool signedInteger) : isFloatType(floatType), isSignedInteger(signedInteger)
    {
    }

    virtual ~TypeSnippetsBase() = default;

    const char *getValueTypeString() const
    {
        return isFloatType ? "f" : (isSignedInteger ? "i" : "u");
    }

protected:
    void updateSpirvSnippets();

public: // Type specific data:
    // Number of bits consumed by float type
    string bitWidth;

    // Minimum positive normal
    string epsilon;

    // denormBase is a normal value (found empirically) used to generate denorm value.
    // Denorm is generated by substracting epsilon from denormBase.
    // denormBase is not a denorm - it is used to create denorm.
    // This value is needed when operations are tested with arguments that were
    // generated in the code. Generated denorm should be the same as denorm
    // used when arguments are passed via input (m_valueIdToVariableType[V_DENORM]).
    // This is required as result of some operations depends on actual denorm value
    // e.g. OpRadians(0x0001) is 0 but OpRadians(0x03f0) is denorm.
    string denormBase;

    string capabilities;
    string extensions;
    string capabilitiesFp16Without16BitStorage;
    string extensionsFp16Without16BitStorage;
    string arrayStride;

    bool loadStoreRequiresShaderFloat16;
    bool isFloatType;
    bool isSignedInteger;

public: // Type specific spir-v snippets:
    // Common annotations
    string typeAnnotationsSnippet;

    // Definitions of all types commonly used by operation tests
    string typeDefinitionsSnippet;

    // Definitions of all types commonly used by settings tests
    string minTypeDefinitionsSnippet;

    // Definitions of all constants commonly used by tests
    string constantsDefinitionsSnippet;

    // Map that stores instructions that generate arguments of specified value.
    // Every test that uses generated inputod will select up to two items from this map
    typedef map<ValueId, string> SnippetMap;
    SnippetMap valueIdToSnippetArgMap;

    // Spir-v snippets that read argument from SSBO
    string argumentsFromInputSnippet;
    string multiArgumentsFromInputSnippet;

    // SSBO with stage input/output definitions
    string inputAnnotationsSnippet;
    string inputDefinitionsSnippet;
    string outputAnnotationsSnippet;
    string multiOutputAnnotationsSnippet;
    string outputDefinitionsSnippet;
    string multiOutputDefinitionsSnippet;

    // Varying is required to pass result from vertex stage to fragment stage,
    // one of requirements was to not use SSBO writes in vertex stage so we
    // need to do that in fragment stage; we also cant pass operation result
    // directly because of interpolation, to avoid it we do a bitcast to uint
    string varyingsTypesSnippet;
    string inputVaryingsSnippet;
    string outputVaryingsSnippet;
    string storeVertexResultSnippet;
    string loadVertexResultSnippet;

    string storeResultsSnippet;
    string multiStoreResultsSnippet;

    string argumentsFromInputFp16Snippet;
    string storeResultsFp16Snippet;
    string multiArgumentsFromInputFp16Snippet;
    string multiOutputAnnotationsFp16Snippet;
    string multiStoreResultsFp16Snippet;
    string multiOutputDefinitionsFp16Snippet;
    string inputDefinitionsFp16Snippet;
    string outputDefinitionsFp16Snippet;
    string typeAnnotationsFp16Snippet;
    string typeDefinitionsFp16Snippet;
};

void TypeSnippetsBase::updateSpirvSnippets()
{
    // annotations to types that are commonly used by tests
    const string typeAnnotationsTemplate = "OpDecorate %type_valueType_arr_1 ArrayStride " + arrayStride +
                                           "\n"
                                           "OpDecorate %type_valueType_arr_2 ArrayStride " +
                                           arrayStride + "\n";

    // definition off all types that are commonly used by tests
    const string floatTypeDefinition = "%type_valueType             = OpTypeFloat " + bitWidth +
                                       "\n"
                                       "%type_valueType_uptr        = OpTypePointer Uniform %type_valueType\n"
                                       "%type_valueType_fptr        = OpTypePointer Function %type_valueType\n"
                                       "%type_valueType_vec2        = OpTypeVector %type_valueType 2\n"
                                       "%type_valueType_vec3        = OpTypeVector %type_valueType 3\n"
                                       "%type_valueType_vec4        = OpTypeVector %type_valueType 4\n"
                                       "%type_valueType_vec4_iptr   = OpTypePointer Input %type_valueType_vec4\n"
                                       "%type_valueType_vec4_optr   = OpTypePointer Output %type_valueType_vec4\n"
                                       "%type_valueType_mat2x2      = OpTypeMatrix %type_valueType_vec2 2\n"
                                       "%type_valueType_arr_1       = OpTypeArray %type_valueType %c_i32_1\n"
                                       "%type_valueType_arr_2       = OpTypeArray %type_valueType %c_i32_2\n";
    const string uintTypeDefinition =
        (bitWidth == "32" ? "" : // 32 bit values are already defined
             "%type_valueType             = OpTypeInt " + bitWidth + " " + (isSignedInteger ? "1" : "0") + "\n") +
        "%type_valueType_uptr        = OpTypePointer Uniform %type_valueType\n" +
        (bitWidth == "32" ? "" : // 32 bit values are already defined
                            "%type_valueType_fptr        = OpTypePointer Function %type_valueType\n"
                            "%type_valueType_vec2        = OpTypeVector %type_valueType 2\n"
                            "%type_valueType_vec3        = OpTypeVector %type_valueType 3\n") +
        "%type_valueType_vec4        = OpTypeVector %type_valueType 4\n"
        "%type_valueType_vec4_iptr   = OpTypePointer Input %type_valueType_vec4\n"
        "%type_valueType_vec4_optr   = OpTypePointer Output %type_valueType_vec4\n"
        "%type_valueType_arr_1       = OpTypeArray %type_valueType %c_i32_1\n"
        "%type_valueType_arr_2       = OpTypeArray %type_valueType %c_i32_2\n";

    const string typeDefinitionsTemplate = isFloatType ? floatTypeDefinition : uintTypeDefinition;

    // minimal type definition set that is used by settings tests
    const string minTypeDefinitionsTemplate = "%type_valueType             = OpTypeFloat " + bitWidth +
                                              "\n"
                                              "%type_valueType_uptr        = OpTypePointer Uniform %type_valueType\n"
                                              "%type_valueType_arr_2       = OpTypeArray %type_valueType %c_i32_2\n";

    // definition off all constants that are used by tests
    const string constantsDefinitionsTemplate = "%c_valueType_n1             = OpConstant %type_valueType -1\n"
                                                "%c_valueType_0              = OpConstant %type_valueType 0.0\n"
                                                "%c_valueType_0_5            = OpConstant %type_valueType 0.5\n"
                                                "%c_valueType_1              = OpConstant %type_valueType 1\n"
                                                "%c_valueType_2              = OpConstant %type_valueType 2\n"
                                                "%c_valueType_3              = OpConstant %type_valueType 3\n"
                                                "%c_valueType_4              = OpConstant %type_valueType 4\n"
                                                "%c_valueType_5              = OpConstant %type_valueType 5\n"
                                                "%c_valueType_6              = OpConstant %type_valueType 6\n"
                                                "%c_valueType_eps            = OpConstant %type_valueType " +
                                                epsilon +
                                                "\n"
                                                "%c_valueType_denorm_base    = OpConstant %type_valueType " +
                                                denormBase + "\n";

    // when arguments are read from SSBO this snipped is placed in main function
    const string argumentsFromInputTemplate =
        "%arg1loc                = OpAccessChain %type_valueType_uptr %ssbo_in %c_i32_0 %c_i32_0\n"
        "%arg1                   = OpLoad %type_valueType %arg1loc\n"
        "%arg2loc                = OpAccessChain %type_valueType_uptr %ssbo_in %c_i32_0 %c_i32_1\n"
        "%arg2                   = OpLoad %type_valueType %arg2loc\n";

    const string multiArgumentsFromInputTemplate =
        "%arg1_valueType_loc         = OpAccessChain %type_valueType_uptr %ssbo_in %c_i32_${attr} %c_i32_0\n"
        "%arg2_valueType_loc         = OpAccessChain %type_valueType_uptr %ssbo_in %c_i32_${attr} %c_i32_1\n"
        "%arg1_valueType             = OpLoad %type_valueType %arg1_valueType_loc\n"
        "%arg2_valueType             = OpLoad %type_valueType %arg2_valueType_loc\n";

    // when tested shader stage reads from SSBO it has to have this snippet
    inputAnnotationsSnippet = "OpMemberDecorate %SSBO_in 0 Offset 0\n"
                              "OpDecorate %SSBO_in BufferBlock\n"
                              "OpDecorate %ssbo_in DescriptorSet 0\n"
                              "OpDecorate %ssbo_in Binding 0\n"
                              "OpDecorate %ssbo_in NonWritable\n";

    const string inputDefinitionsTemplate = "%SSBO_in              = OpTypeStruct %type_valueType_arr_2\n"
                                            "%up_SSBO_in           = OpTypePointer Uniform %SSBO_in\n"
                                            "%ssbo_in              = OpVariable %up_SSBO_in Uniform\n";

    outputAnnotationsSnippet = "OpMemberDecorate %SSBO_out 0 Offset 0\n"
                               "OpDecorate %SSBO_out BufferBlock\n"
                               "OpDecorate %ssbo_out DescriptorSet 0\n"
                               "OpDecorate %ssbo_out Binding 1\n";

    const string multiOutputAnnotationsTemplate = "OpMemberDecorate %SSBO_valueType_out 0 Offset 0\n"
                                                  "OpDecorate %type_valueType_arr_2 ArrayStride " +
                                                  arrayStride +
                                                  "\n"
                                                  "OpDecorate %SSBO_valueType_out BufferBlock\n"
                                                  "OpDecorate %ssbo_valueType_out DescriptorSet 0\n";

    const string outputDefinitionsTemplate = "%SSBO_out             = OpTypeStruct %type_valueType_arr_1\n"
                                             "%up_SSBO_out          = OpTypePointer Uniform %SSBO_out\n"
                                             "%ssbo_out             = OpVariable %up_SSBO_out Uniform\n";

    const string multiOutputDefinitionsTemplate =
        "%SSBO_valueType_out         = OpTypeStruct %type_valueType\n"
        "%up_SSBO_valueType_out      = OpTypePointer Uniform %SSBO_valueType_out\n"
        "%ssbo_valueType_out         = OpVariable %up_SSBO_valueType_out Uniform\n";

    // this snippet is used by compute and fragment stage but not by vertex stage
    const string storeResultsTemplate =
        "%outloc               = OpAccessChain %type_valueType_uptr %ssbo_out %c_i32_0 %c_i32_0\n"
        "OpStore %outloc %result\n";

    const string multiStoreResultsTemplate =
        "%outloc" + bitWidth +
        "             = OpAccessChain %type_valueType_uptr %ssbo_valueType_out %c_i32_0\n"
        "                        OpStore %outloc" +
        bitWidth + " %result" + bitWidth + "\n";

    const string typeToken = "_valueType";
    const string typeName  = string("_") + getValueTypeString() + bitWidth;

    typeAnnotationsSnippet         = replace(typeAnnotationsTemplate, typeToken, typeName);
    typeDefinitionsSnippet         = replace(typeDefinitionsTemplate, typeToken, typeName);
    minTypeDefinitionsSnippet      = replace(minTypeDefinitionsTemplate, typeToken, typeName);
    constantsDefinitionsSnippet    = isFloatType ? replace(constantsDefinitionsTemplate, typeToken, typeName) :
                                                   ""; // Not needed for int conversion tests
    argumentsFromInputSnippet      = replace(argumentsFromInputTemplate, typeToken, typeName);
    multiArgumentsFromInputSnippet = replace(multiArgumentsFromInputTemplate, typeToken, typeName);
    inputDefinitionsSnippet        = replace(inputDefinitionsTemplate, typeToken, typeName);
    multiOutputAnnotationsSnippet  = replace(multiOutputAnnotationsTemplate, typeToken, typeName);
    outputDefinitionsSnippet       = replace(outputDefinitionsTemplate, typeToken, typeName);
    multiOutputDefinitionsSnippet  = replace(multiOutputDefinitionsTemplate, typeToken, typeName);
    storeResultsSnippet            = replace(storeResultsTemplate, typeToken, typeName);
    multiStoreResultsSnippet       = replace(multiStoreResultsTemplate, typeToken, typeName);

    argumentsFromInputFp16Snippet      = "";
    storeResultsFp16Snippet            = "";
    multiArgumentsFromInputFp16Snippet = "";
    multiOutputAnnotationsFp16Snippet  = "";
    multiStoreResultsFp16Snippet       = "";
    multiOutputDefinitionsFp16Snippet  = "";
    inputDefinitionsFp16Snippet        = "";
    typeAnnotationsFp16Snippet         = "";
    outputDefinitionsFp16Snippet       = "";
    typeDefinitionsFp16Snippet         = "";

    if (bitWidth.compare("16") == 0)
    {
        typeDefinitionsFp16Snippet = "%type_u32_uptr       = OpTypePointer Uniform %type_u32\n"
                                     "%type_u32_arr_1      = OpTypeArray %type_u32 %c_i32_1\n";

        typeAnnotationsFp16Snippet  = "OpDecorate %type_u32_arr_1 ArrayStride 4\n";
        const string inputToken     = "_f16_arr_2";
        const string inputName      = "_u32_arr_1";
        inputDefinitionsFp16Snippet = replace(inputDefinitionsSnippet, inputToken, inputName);

        argumentsFromInputFp16Snippet = "%argloc            = OpAccessChain %type_u32_uptr %ssbo_in %c_i32_0 %c_i32_0\n"
                                        "%inval             = OpLoad %type_u32 %argloc\n"
                                        "%arg               = OpBitcast %type_f16_vec2 %inval\n"
                                        "%arg1              = OpCompositeExtract %type_f16 %arg 0\n"
                                        "%arg2              = OpCompositeExtract %type_f16 %arg 1\n";

        const string outputToken     = "_f16_arr_1";
        const string outputName      = "_u32_arr_1";
        outputDefinitionsFp16Snippet = replace(outputDefinitionsSnippet, outputToken, outputName);

        storeResultsFp16Snippet = "%result_f16_vec2   = OpCompositeConstruct %type_f16_vec2 %result %c_f16_0\n"
                                  "%result_u32 = OpBitcast %type_u32 %result_f16_vec2\n"
                                  "%outloc            = OpAccessChain %type_u32_uptr %ssbo_out %c_i32_0 %c_i32_0\n"
                                  "OpStore %outloc %result_u32\n";

        multiArgumentsFromInputFp16Snippet =
            "%arg_u32_loc         = OpAccessChain %type_u32_uptr %ssbo_in %c_i32_${attr} %c_i32_0\n"
            "%arg_u32             = OpLoad %type_u32 %arg_u32_loc\n"
            "%arg_f16_vec2        = OpBitcast %type_f16_vec2 %arg_u32\n"
            "%arg1_f16            = OpCompositeExtract %type_f16 %arg_f16_vec2 0\n"
            "%arg2_f16            = OpCompositeExtract %type_f16 %arg_f16_vec2 1\n";

        multiOutputAnnotationsFp16Snippet = "OpMemberDecorate %SSBO_u32_out 0 Offset 0\n"
                                            "OpDecorate %type_u32_arr_1 ArrayStride 4\n"
                                            "OpDecorate %SSBO_u32_out BufferBlock\n"
                                            "OpDecorate %ssbo_u32_out DescriptorSet 0\n";

        multiStoreResultsFp16Snippet = "%outloc_u32            = OpAccessChain %type_u32_uptr %ssbo_u32_out %c_i32_0\n"
                                       "%result16_vec2 = OpCompositeConstruct %type_f16_vec2 %result16 %c_f16_0\n"
                                       "%result_u32            = OpBitcast %type_u32 %result16_vec2\n"
                                       "                        OpStore %outloc_u32 %result_u32\n";

        multiOutputDefinitionsFp16Snippet = "%c_f16_0              = OpConstant %type_f16 0.0\n"
                                            "%SSBO_u32_out         = OpTypeStruct %type_u32\n"
                                            "%up_SSBO_u32_out      = OpTypePointer Uniform %SSBO_u32_out\n"
                                            "%ssbo_u32_out         = OpVariable %up_SSBO_u32_out Uniform\n";
    }

    // NOTE: only values used as _generated_ arguments in test operations
    // need to be in this map, arguments that are only used by tests,
    // that grab arguments from input, do need to be in this map
    // NOTE: when updating entries in valueIdToSnippetArgMap make
    // sure to update also m_valueIdToVariableType for all valueType width
    SnippetMap &sm   = valueIdToSnippetArgMap;
    sm[V_UNUSED]     = "OpFSub %type_valueType %c_valueType_0 %c_valueType_0\n";
    sm[V_MINUS_INF]  = "OpFDiv %type_valueType %c_valueType_n1 %c_valueType_0\n";
    sm[V_MINUS_ONE]  = "OpFAdd %type_valueType %c_valueType_n1 %c_valueType_0\n";
    sm[V_MINUS_ZERO] = "OpFMul %type_valueType %c_valueType_n1 %c_valueType_0\n";
    sm[V_ZERO]       = "OpFMul %type_valueType %c_valueType_0 %c_valueType_0\n";
    sm[V_HALF]       = "OpFAdd %type_valueType %c_valueType_0_5 %c_valueType_0\n";
    sm[V_ONE]        = "OpFAdd %type_valueType %c_valueType_1 %c_valueType_0\n";
    sm[V_INF]        = "OpFDiv %type_valueType %c_valueType_1 %c_valueType_0\n"; // x / 0 == Inf
    sm[V_DENORM]     = "OpFSub %type_valueType %c_valueType_denorm_base %c_valueType_eps\n";
    sm[V_NAN]        = "OpFDiv %type_valueType %c_valueType_0 %c_valueType_0\n"; // 0 / 0 == Nan

    map<ValueId, string>::iterator it;
    for (it = sm.begin(); it != sm.end(); it++)
        sm[it->first] = replace(it->second, typeToken, typeName);
}

typedef de::SharedPtr<TypeSnippetsBase> TypeSnippetsSP;

template <typename FLOAT_TYPE>
class TypeSnippets : public TypeSnippetsBase
{
public:
    TypeSnippets(bool floatType = true, bool signedInteger = false);
};

template <>
TypeSnippets<deFloat16>::TypeSnippets(bool floatType, bool signedInteger) : TypeSnippetsBase(floatType, signedInteger)
{
    bitWidth = "16";
    epsilon  = "6.104e-5"; // 2^-14 = 0x0400

    // 1.2113e-4 is 0x07f0 which after substracting epsilon will give 0x03f0 (same as vm[V_DENORM])
    // NOTE: constants in SPIR-V cant be specified as exact fp16 - there is conversion from double to fp16
    denormBase = "1.2113e-4";

    capabilities = "OpCapability StorageUniform16\n";
    extensions   = "OpExtension \"SPV_KHR_16bit_storage\"\n";

    capabilitiesFp16Without16BitStorage = "OpCapability Float16\n";
    extensionsFp16Without16BitStorage   = "";

    arrayStride = "2";

    varyingsTypesSnippet     = "%type_u32_iptr        = OpTypePointer Input %type_u32\n"
                               "%type_u32_optr        = OpTypePointer Output %type_u32\n";
    inputVaryingsSnippet     = "%BP_vertex_result    = OpVariable %type_u32_iptr Input\n";
    outputVaryingsSnippet    = "%BP_vertex_result    = OpVariable %type_u32_optr Output\n";
    storeVertexResultSnippet = "%tmp_vec2            = OpCompositeConstruct %type_f16_vec2 %result %c_f16_0\n"
                               "%packed_result       = OpBitcast %type_u32 %tmp_vec2\n"
                               "OpStore %BP_vertex_result %packed_result\n";
    loadVertexResultSnippet  = "%packed_result       = OpLoad %type_u32 %BP_vertex_result\n"
                               "%tmp_vec2            = OpBitcast %type_f16_vec2 %packed_result\n"
                               "%result              = OpCompositeExtract %type_f16 %tmp_vec2 0\n";

    loadStoreRequiresShaderFloat16 = true;

    updateSpirvSnippets();
}

template <>
TypeSnippets<float>::TypeSnippets(bool floatType, bool signedInteger) : TypeSnippetsBase(floatType, signedInteger)
{
    bitWidth                            = "32";
    epsilon                             = "1.175494351e-38";
    denormBase                          = "1.1756356e-38";
    capabilities                        = "";
    extensions                          = "";
    capabilitiesFp16Without16BitStorage = "";
    extensionsFp16Without16BitStorage   = "";
    arrayStride                         = "4";

    varyingsTypesSnippet     = "%type_u32_iptr        = OpTypePointer Input %type_u32\n"
                               "%type_u32_optr        = OpTypePointer Output %type_u32\n";
    inputVaryingsSnippet     = "%BP_vertex_result    = OpVariable %type_u32_iptr Input\n";
    outputVaryingsSnippet    = "%BP_vertex_result    = OpVariable %type_u32_optr Output\n";
    storeVertexResultSnippet = "%packed_result       = OpBitcast %type_u32 %result\n"
                               "OpStore %BP_vertex_result %packed_result\n";
    loadVertexResultSnippet  = "%packed_result       = OpLoad %type_u32 %BP_vertex_result\n"
                               "%result              = OpBitcast %type_f32 %packed_result\n";

    loadStoreRequiresShaderFloat16 = false;

    updateSpirvSnippets();
}

template <>
TypeSnippets<double>::TypeSnippets(bool floatType, bool signedInteger) : TypeSnippetsBase(floatType, signedInteger)
{
    const string float64Capability      = "OpCapability Float64\n";
    const string int64Capability        = "OpCapability Int64\n";
    bitWidth                            = "64";
    epsilon                             = "2.2250738585072014e-308"; // 0x0010000000000000
    denormBase                          = "2.2250738585076994e-308"; // 0x00100000000003F0
    capabilities                        = floatType ? float64Capability : int64Capability;
    extensions                          = "";
    capabilitiesFp16Without16BitStorage = "";
    extensionsFp16Without16BitStorage   = "";
    arrayStride                         = "8";

    varyingsTypesSnippet     = "%type_u32_vec2_iptr   = OpTypePointer Input %type_u32_vec2\n"
                               "%type_u32_vec2_optr   = OpTypePointer Output %type_u32_vec2\n";
    inputVaryingsSnippet     = "%BP_vertex_result     = OpVariable %type_u32_vec2_iptr Input\n";
    outputVaryingsSnippet    = "%BP_vertex_result     = OpVariable %type_u32_vec2_optr Output\n";
    storeVertexResultSnippet = "%packed_result        = OpBitcast %type_u32_vec2 %result\n"
                               "OpStore %BP_vertex_result %packed_result\n";
    loadVertexResultSnippet  = "%packed_result        = OpLoad %type_u32_vec2 %BP_vertex_result\n"
                               "%result               = OpBitcast %type_f64 %packed_result\n";

    loadStoreRequiresShaderFloat16 = false;

    updateSpirvSnippets();
}

class TypeTestResultsBase
{
public:
    virtual ~TypeTestResultsBase()
    {
    }
    VariableType variableType() const;

protected:
    VariableType m_variableType;

public:
    // Vectors containing test data for float controls
    vector<BinaryCase> binaryOpFTZ;
    vector<UnaryCase> unaryOpFTZ;
    vector<BinaryCase> binaryOpDenormPreserve;
    vector<UnaryCase> unaryOpDenormPreserve;
};

VariableType TypeTestResultsBase::variableType() const
{
    return m_variableType;
}

typedef de::SharedPtr<TypeTestResultsBase> TypeTestResultsSP;

template <typename FLOAT_TYPE>
class TypeTestResults : public TypeTestResultsBase
{
public:
    TypeTestResults();
};

template <>
TypeTestResults<deFloat16>::TypeTestResults()
{
    m_variableType = FP16;

    // note: there are many FTZ test cases that can produce diferent result depending
    // on input denorm being flushed or not; because of that FTZ tests can be limited
    // to those that return denorm as those are the ones affected by tested extension
    const BinaryCase binaryOpFTZArr[] = {
        //operation            den op one        den op den        den op inf        den op nan
        {OID_ADD, V_ONE, V_ZERO_OR_DENORM_TIMES_TWO, V_INF, V_UNUSED},
        {OID_SUB, V_MINUS_ONE, V_ZERO, V_MINUS_INF, V_UNUSED},
        {OID_MUL, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_DIV, V_ZERO, V_UNUSED, V_ZERO, V_UNUSED},
        {OID_REM, V_ZERO, V_UNUSED, V_UNUSED, V_UNUSED},
        {OID_MOD, V_ZERO, V_UNUSED, V_UNUSED, V_UNUSED},
        {OID_VEC_MUL_S, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_VEC_MUL_M, V_ZERO_OR_DENORM_TIMES_TWO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_S, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_V, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_M, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_OUT_PROD, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_DOT, V_ZERO_OR_DENORM_TIMES_TWO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_ATAN2, V_ZERO, V_UNUSED, V_ZERO, V_UNUSED},
        {OID_POW, V_ZERO, V_UNUSED, V_ZERO, V_UNUSED},
        {OID_MIX, V_HALF, V_ZERO, V_INF, V_UNUSED},
        {OID_MIN, V_ZERO, V_ZERO, V_ZERO, V_UNUSED},
        {OID_MAX, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_CLAMP, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_STEP, V_ONE, V_ONE, V_ONE, V_UNUSED},
        {OID_SSTEP, V_HALF, V_ONE, V_ZERO, V_UNUSED},
        {OID_FMA, V_HALF, V_HALF, V_UNUSED, V_UNUSED},
        {OID_FACE_FWD, V_MINUS_ONE, V_MINUS_ONE, V_MINUS_ONE, V_MINUS_ONE},
        {OID_NMIN, V_ZERO, V_ZERO, V_ZERO, V_ZERO},
        {OID_NMAX, V_ONE, V_ZERO, V_INF, V_ZERO},
        {OID_NCLAMP, V_ONE, V_ZERO, V_INF, V_ZERO},
        {OID_DIST, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_CROSS, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
    };

    const UnaryCase unaryOpFTZArr[] = {
        //operation            op den
        {OID_NEGATE, V_MINUS_ZERO},
        {OID_ROUND, V_ZERO},
        {OID_ROUND_EV, V_ZERO},
        {OID_TRUNC, V_ZERO},
        {OID_ABS, V_ZERO},
        {OID_FLOOR, V_ZERO},
        {OID_CEIL, V_ZERO_OR_ONE},
        {OID_FRACT, V_ZERO},
        {OID_RADIANS, V_ZERO},
        {OID_DEGREES, V_ZERO},
        {OID_SIN, V_ZERO},
        {OID_COS, V_TRIG_ONE},
        {OID_TAN, V_ZERO},
        {OID_ASIN, V_ZERO},
        {OID_ACOS, V_PI_DIV_2},
        {OID_ATAN, V_ZERO},
        {OID_SINH, V_ZERO},
        {OID_COSH, V_ONE},
        {OID_TANH, V_ZERO},
        {OID_ASINH, V_ZERO},
        {OID_ACOSH, V_UNUSED},
        {OID_ATANH, V_ZERO},
        {OID_EXP, V_ONE},
        {OID_LOG, V_MINUS_INF_OR_LOG_DENORM},
        {OID_EXP2, V_ONE},
        {OID_LOG2, V_MINUS_INF_OR_LOG2_DENORM},
        {OID_SQRT, V_ZERO_OR_SQRT_DENORM},
        {OID_INV_SQRT, V_INF_OR_INV_SQRT_DENORM},
        {OID_MAT_DET, V_ZERO},
        {OID_MAT_INV, V_ZERO_OR_MINUS_ZERO},
        {OID_MODF, V_ZERO},
        {OID_MODF_ST, V_ZERO},
        {OID_NORMALIZE, V_ZERO},
        {OID_REFLECT, V_ZERO},
        {OID_REFRACT, V_ZERO},
        {OID_LENGTH, V_ZERO},
    };

    const BinaryCase binaryOpDenormPreserveArr[] = {
        //operation            den op one                den op den                den op inf        den op nan
        {OID_PHI, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_SELECT, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_ADD, V_ONE, V_DENORM_TIMES_TWO, V_INF, V_NAN},
        {OID_SUB, V_MINUS_ONE_OR_CLOSE, V_ZERO, V_MINUS_INF, V_NAN},
        {OID_MUL, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_VEC_MUL_S, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_VEC_MUL_M, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_MAT_MUL_S, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_MAT_MUL_V, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_MAT_MUL_M, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_OUT_PROD, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_DOT, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_MIX, V_HALF, V_DENORM, V_INF, V_NAN},
        {OID_FMA, V_HALF, V_HALF, V_INF, V_NAN},
        {OID_MIN, V_DENORM, V_DENORM, V_DENORM, V_UNUSED},
        {OID_MAX, V_ONE, V_DENORM, V_INF, V_UNUSED},
        {OID_CLAMP, V_ONE, V_DENORM, V_INF, V_UNUSED},
        {OID_NMIN, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_NMAX, V_ONE, V_DENORM, V_INF, V_DENORM},
        {OID_NCLAMP, V_ONE, V_DENORM, V_INF, V_DENORM},
    };

    const UnaryCase unaryOpDenormPreserveArr[] = {
        //operation                op den
        {OID_RETURN_VAL, V_DENORM},
        {OID_D_EXTRACT, V_DENORM},
        {OID_D_INSERT, V_DENORM},
        {OID_SHUFFLE, V_DENORM},
        {OID_COMPOSITE, V_DENORM},
        {OID_COMPOSITE_INS, V_DENORM},
        {OID_COPY, V_DENORM},
        {OID_TRANSPOSE, V_DENORM},
        {OID_NEGATE, V_DENORM},
        {OID_ABS, V_DENORM},
        {OID_SIGN, V_ONE},
        {OID_RADIANS, V_DENORM},
        {OID_DEGREES, V_DEGREES_DENORM},
    };

    binaryOpFTZ.insert(binaryOpFTZ.begin(), binaryOpFTZArr, binaryOpFTZArr + DE_LENGTH_OF_ARRAY(binaryOpFTZArr));
    unaryOpFTZ.insert(unaryOpFTZ.begin(), unaryOpFTZArr, unaryOpFTZArr + DE_LENGTH_OF_ARRAY(unaryOpFTZArr));
    binaryOpDenormPreserve.insert(binaryOpDenormPreserve.begin(), binaryOpDenormPreserveArr,
                                  binaryOpDenormPreserveArr + DE_LENGTH_OF_ARRAY(binaryOpDenormPreserveArr));
    unaryOpDenormPreserve.insert(unaryOpDenormPreserve.begin(), unaryOpDenormPreserveArr,
                                 unaryOpDenormPreserveArr + DE_LENGTH_OF_ARRAY(unaryOpDenormPreserveArr));
}

template <>
TypeTestResults<float>::TypeTestResults()
{
    m_variableType = FP32;

    const BinaryCase binaryOpFTZArr[] = {
        //operation            den op one        den op den        den op inf        den op nan
        {OID_ADD, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_SUB, V_MINUS_ONE, V_ZERO, V_MINUS_INF, V_UNUSED},
        {OID_MUL, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_DIV, V_ZERO, V_UNUSED, V_ZERO, V_UNUSED},
        {OID_REM, V_ZERO, V_UNUSED, V_UNUSED, V_UNUSED},
        {OID_MOD, V_ZERO, V_UNUSED, V_UNUSED, V_UNUSED},
        {OID_VEC_MUL_S, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_VEC_MUL_M, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_S, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_V, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_M, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_OUT_PROD, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_DOT, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_ATAN2, V_ZERO, V_UNUSED, V_ZERO, V_UNUSED},
        {OID_POW, V_ZERO, V_UNUSED, V_ZERO, V_UNUSED},
        {OID_MIX, V_HALF, V_ZERO, V_INF, V_UNUSED},
        {OID_MIN, V_ZERO, V_ZERO, V_ZERO, V_UNUSED},
        {OID_MAX, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_CLAMP, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_STEP, V_ONE, V_ONE, V_ONE, V_UNUSED},
        {OID_SSTEP, V_HALF, V_ONE, V_ZERO, V_UNUSED},
        {OID_FMA, V_HALF, V_HALF, V_UNUSED, V_UNUSED},
        {OID_FACE_FWD, V_MINUS_ONE, V_MINUS_ONE, V_MINUS_ONE, V_MINUS_ONE},
        {OID_NMIN, V_ZERO, V_ZERO, V_ZERO, V_ZERO},
        {OID_NMAX, V_ONE, V_ZERO, V_INF, V_ZERO},
        {OID_NCLAMP, V_ONE, V_ZERO, V_INF, V_ZERO},
        {OID_DIST, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_CROSS, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
    };

    const UnaryCase unaryOpFTZArr[] = {
        //operation            op den
        {OID_NEGATE, V_MINUS_ZERO},
        {OID_ROUND, V_ZERO},
        {OID_ROUND_EV, V_ZERO},
        {OID_TRUNC, V_ZERO},
        {OID_ABS, V_ZERO},
        {OID_FLOOR, V_ZERO},
        {OID_CEIL, V_ZERO_OR_ONE},
        {OID_FRACT, V_ZERO},
        {OID_RADIANS, V_ZERO},
        {OID_DEGREES, V_ZERO},
        {OID_SIN, V_ZERO},
        {OID_COS, V_TRIG_ONE},
        {OID_TAN, V_ZERO},
        {OID_ASIN, V_ZERO},
        {OID_ACOS, V_PI_DIV_2},
        {OID_ATAN, V_ZERO},
        {OID_SINH, V_ZERO},
        {OID_COSH, V_ONE},
        {OID_TANH, V_ZERO},
        {OID_ASINH, V_ZERO},
        {OID_ACOSH, V_UNUSED},
        {OID_ATANH, V_ZERO},
        {OID_EXP, V_ONE},
        {OID_LOG, V_MINUS_INF_OR_LOG_DENORM},
        {OID_EXP2, V_ONE},
        {OID_LOG2, V_MINUS_INF_OR_LOG2_DENORM},
        {OID_SQRT, V_ZERO_OR_SQRT_DENORM},
        {OID_INV_SQRT, V_INF_OR_INV_SQRT_DENORM},
        {OID_MAT_DET, V_ZERO},
        {OID_MAT_INV, V_ZERO_OR_MINUS_ZERO},
        {OID_MODF, V_ZERO},
        {OID_MODF_ST, V_ZERO},
        {OID_NORMALIZE, V_ZERO},
        {OID_REFLECT, V_ZERO},
        {OID_REFRACT, V_ZERO},
        {OID_LENGTH, V_ZERO},
    };

    const BinaryCase binaryOpDenormPreserveArr[] = {
        //operation            den op one            den op den                den op inf        den op nan
        {OID_PHI, V_DENORM, V_DENORM, V_DENORM, V_DENORM},  {OID_SELECT, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_ADD, V_ONE, V_DENORM_TIMES_TWO, V_INF, V_NAN}, {OID_SUB, V_MINUS_ONE, V_ZERO, V_MINUS_INF, V_NAN},
        {OID_MUL, V_DENORM, V_ZERO, V_INF, V_NAN},          {OID_VEC_MUL_S, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_VEC_MUL_M, V_DENORM, V_ZERO, V_INF, V_NAN},    {OID_MAT_MUL_S, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_MAT_MUL_V, V_DENORM, V_ZERO, V_INF, V_NAN},    {OID_MAT_MUL_M, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_OUT_PROD, V_DENORM, V_ZERO, V_INF, V_NAN},     {OID_DOT, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_MIX, V_HALF, V_DENORM, V_INF, V_NAN},          {OID_FMA, V_HALF, V_HALF, V_INF, V_NAN},
        {OID_MIN, V_DENORM, V_DENORM, V_DENORM, V_UNUSED},  {OID_MAX, V_ONE, V_DENORM, V_INF, V_UNUSED},
        {OID_CLAMP, V_ONE, V_DENORM, V_INF, V_UNUSED},      {OID_NMIN, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_NMAX, V_ONE, V_DENORM, V_INF, V_DENORM},       {OID_NCLAMP, V_ONE, V_DENORM, V_INF, V_DENORM},
    };

    const UnaryCase unaryOpDenormPreserveArr[] = {
        //operation                op den
        {OID_RETURN_VAL, V_DENORM},
        {OID_D_EXTRACT, V_DENORM},
        {OID_D_INSERT, V_DENORM},
        {OID_SHUFFLE, V_DENORM},
        {OID_COMPOSITE, V_DENORM},
        {OID_COMPOSITE_INS, V_DENORM},
        {OID_COPY, V_DENORM},
        {OID_TRANSPOSE, V_DENORM},
        {OID_NEGATE, V_DENORM},
        {OID_ABS, V_DENORM},
        {OID_SIGN, V_ONE},
        {OID_RADIANS, V_DENORM},
        {OID_DEGREES, V_DEGREES_DENORM},
    };

    binaryOpFTZ.insert(binaryOpFTZ.begin(), binaryOpFTZArr, binaryOpFTZArr + DE_LENGTH_OF_ARRAY(binaryOpFTZArr));
    unaryOpFTZ.insert(unaryOpFTZ.begin(), unaryOpFTZArr, unaryOpFTZArr + DE_LENGTH_OF_ARRAY(unaryOpFTZArr));
    binaryOpDenormPreserve.insert(binaryOpDenormPreserve.begin(), binaryOpDenormPreserveArr,
                                  binaryOpDenormPreserveArr + DE_LENGTH_OF_ARRAY(binaryOpDenormPreserveArr));
    unaryOpDenormPreserve.insert(unaryOpDenormPreserve.begin(), unaryOpDenormPreserveArr,
                                 unaryOpDenormPreserveArr + DE_LENGTH_OF_ARRAY(unaryOpDenormPreserveArr));
}

template <>
TypeTestResults<double>::TypeTestResults()
{
    m_variableType = FP64;

    // fp64 is supported by fewer operations then fp16 and fp32
    // e.g. Radians and Degrees functions are not supported
    const BinaryCase binaryOpFTZArr[] = {
        //operation            den op one        den op den        den op inf        den op nan
        {OID_ADD, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_SUB, V_MINUS_ONE, V_ZERO, V_MINUS_INF, V_UNUSED},
        {OID_MUL, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_DIV, V_ZERO, V_UNUSED, V_ZERO, V_UNUSED},
        {OID_REM, V_ZERO, V_UNUSED, V_UNUSED, V_UNUSED},
        {OID_MOD, V_ZERO, V_UNUSED, V_UNUSED, V_UNUSED},
        {OID_VEC_MUL_S, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_VEC_MUL_M, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_S, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_V, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MAT_MUL_M, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_OUT_PROD, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_DOT, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
        {OID_MIX, V_HALF, V_ZERO, V_INF, V_UNUSED},
        {OID_MIN, V_ZERO, V_ZERO, V_ZERO, V_UNUSED},
        {OID_MAX, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_CLAMP, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_STEP, V_ONE, V_ONE, V_ONE, V_UNUSED},
        {OID_SSTEP, V_HALF, V_ONE, V_ZERO, V_UNUSED},
        {OID_FMA, V_HALF, V_HALF, V_UNUSED, V_UNUSED},
        {OID_FACE_FWD, V_MINUS_ONE, V_MINUS_ONE, V_MINUS_ONE, V_MINUS_ONE},
        {OID_NMIN, V_ZERO, V_ZERO, V_ZERO, V_ZERO},
        {OID_NMAX, V_ONE, V_ZERO, V_INF, V_ZERO},
        {OID_NCLAMP, V_ONE, V_ZERO, V_INF, V_ZERO},
        {OID_DIST, V_ONE, V_ZERO, V_INF, V_UNUSED},
        {OID_CROSS, V_ZERO, V_ZERO, V_UNUSED, V_UNUSED},
    };

    const UnaryCase unaryOpFTZArr[] = {
        //operation            op den
        {OID_NEGATE, V_MINUS_ZERO},
        {OID_ROUND, V_ZERO},
        {OID_ROUND_EV, V_ZERO},
        {OID_TRUNC, V_ZERO},
        {OID_ABS, V_ZERO},
        {OID_FLOOR, V_ZERO},
        {OID_CEIL, V_ZERO_OR_ONE},
        {OID_FRACT, V_ZERO},
        {OID_SQRT, V_ZERO_OR_SQRT_DENORM},
        {OID_INV_SQRT, V_INF_OR_INV_SQRT_DENORM},
        {OID_MAT_DET, V_ZERO},
        {OID_MAT_INV, V_ZERO_OR_MINUS_ZERO},
        {OID_MODF, V_ZERO},
        {OID_MODF_ST, V_ZERO},
        {OID_NORMALIZE, V_ZERO},
        {OID_REFLECT, V_ZERO},
        {OID_LENGTH, V_ZERO},
    };

    const BinaryCase binaryOpDenormPreserveArr[] = {
        //operation            den op one            den op den                den op inf        den op nan
        {OID_PHI, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_SELECT, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_ADD, V_ONE, V_DENORM_TIMES_TWO, V_INF, V_NAN},
        {OID_SUB, V_MINUS_ONE, V_ZERO, V_MINUS_INF, V_NAN},
        {OID_MUL, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_VEC_MUL_S, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_VEC_MUL_M, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_MAT_MUL_S, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_MAT_MUL_V, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_MAT_MUL_M, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_OUT_PROD, V_DENORM, V_ZERO, V_INF, V_NAN},
        {OID_DOT, V_DENORM_TIMES_TWO, V_ZERO, V_INF, V_NAN},
        {OID_MIX, V_HALF, V_DENORM, V_INF, V_NAN},
        {OID_FMA, V_HALF, V_HALF, V_INF, V_NAN},
        {OID_MIN, V_DENORM, V_DENORM, V_DENORM, V_UNUSED},
        {OID_MAX, V_ONE, V_DENORM, V_INF, V_UNUSED},
        {OID_CLAMP, V_ONE, V_DENORM, V_INF, V_UNUSED},
        {OID_NMIN, V_DENORM, V_DENORM, V_DENORM, V_DENORM},
        {OID_NMAX, V_ONE, V_DENORM, V_INF, V_DENORM},
        {OID_NCLAMP, V_ONE, V_DENORM, V_INF, V_DENORM},
    };

    const UnaryCase unaryOpDenormPreserveArr[] = {
        //operation                op den
        {OID_RETURN_VAL, V_DENORM}, {OID_D_EXTRACT, V_DENORM},     {OID_D_INSERT, V_DENORM}, {OID_SHUFFLE, V_DENORM},
        {OID_COMPOSITE, V_DENORM},  {OID_COMPOSITE_INS, V_DENORM}, {OID_COPY, V_DENORM},     {OID_TRANSPOSE, V_DENORM},
        {OID_NEGATE, V_DENORM},     {OID_ABS, V_DENORM},           {OID_SIGN, V_ONE},
    };

    binaryOpFTZ.insert(binaryOpFTZ.begin(), binaryOpFTZArr, binaryOpFTZArr + DE_LENGTH_OF_ARRAY(binaryOpFTZArr));
    unaryOpFTZ.insert(unaryOpFTZ.begin(), unaryOpFTZArr, unaryOpFTZArr + DE_LENGTH_OF_ARRAY(unaryOpFTZArr));
    binaryOpDenormPreserve.insert(binaryOpDenormPreserve.begin(), binaryOpDenormPreserveArr,
                                  binaryOpDenormPreserveArr + DE_LENGTH_OF_ARRAY(binaryOpDenormPreserveArr));
    unaryOpDenormPreserve.insert(unaryOpDenormPreserve.begin(), unaryOpDenormPreserveArr,
                                 unaryOpDenormPreserveArr + DE_LENGTH_OF_ARRAY(unaryOpDenormPreserveArr));
}

// Operation structure holds data needed to test specified SPIR-V operation. This class contains
// additional annotations, additional types and aditional constants that should be properly included
// in SPIR-V code. Commands attribute in this structure contains code that performs tested operation
// on given arguments, in some cases verification is also performed there.
// All snipets stroed in this structure are generic and can be specialized for fp16, fp32 or fp64,
// thanks to that this data can be shared by many OperationTestCase instances (testing diferent
// float behaviors on diferent float widths).
struct Operation
{
    // operation name is included in test case name
    const char *name;

    // How extensively is the floating point type used?
    FloatUsage floatUsage;

    // operation specific spir-v snippets that will be
    // placed in proper places in final test shader
    const char *annotations;
    const char *types;
    const char *constants;
    const char *variables;
    const char *functions;
    const char *commands;

    // conversion operations operate on one float type and produce float
    // type with different bit width; restrictedInputType is used only when
    // isInputTypeRestricted is set to true and it restricts usage of this
    // operation to specified input type
    bool isInputTypeRestricted;
    VariableType restrictedInputType;

    // arguments for OpSpecConstant need to be specified also as constant
    bool isSpecConstant;

    // set if c_float* constant is used in operation
    FloatStatementUsageFlags statementUsageFlags;

    Operation()
    {
    }

    // Minimal constructor - used by most of operations
    Operation(const char *_name, FloatUsage _floatUsage, const char *_commands,
              const FloatStatementUsageFlags _statementUsageFlags = 0)
        : name(_name)
        , floatUsage(_floatUsage)
        , annotations("")
        , types("")
        , constants("")
        , variables("")
        , functions("")
        , commands(_commands)
        , isInputTypeRestricted(false)
        , restrictedInputType(FP16) // not used as isInputTypeRestricted is false
        , isSpecConstant(false)
        , statementUsageFlags(_statementUsageFlags)
    {
    }

    // Conversion operations constructor (used also by conversions done in SpecConstantOp)
    Operation(const char *_name, FloatUsage _floatUsage, bool specConstant, VariableType _inputType,
              const char *_constants, const char *_commands, const FloatStatementUsageFlags _statementUsageFlags = 0)
        : name(_name)
        , floatUsage(_floatUsage)
        , annotations("")
        , types("")
        , constants(_constants)
        , variables("")
        , functions("")
        , commands(_commands)
        , isInputTypeRestricted(true)
        , restrictedInputType(_inputType)
        , isSpecConstant(specConstant)
        , statementUsageFlags(_statementUsageFlags)
    {
    }

    // Full constructor - used by few operations, that are more complex to test
    Operation(const char *_name, FloatUsage _floatUsage, const char *_annotations, const char *_types,
              const char *_constants, const char *_variables, const char *_functions, const char *_commands,
              const FloatStatementUsageFlags _statementUsageFlags = 0)
        : name(_name)
        , floatUsage(_floatUsage)
        , annotations(_annotations)
        , types(_types)
        , constants(_constants)
        , variables(_variables)
        , functions(_functions)
        , commands(_commands)
        , isInputTypeRestricted(false)
        , restrictedInputType(FP16) // not used as isInputTypeRestricted is false
        , isSpecConstant(false)
        , statementUsageFlags(_statementUsageFlags)
    {
    }

    // Full constructor - used by rounding override cases
    Operation(const char *_name, FloatUsage _floatUsage, VariableType _inputType, const char *_annotations,
              const char *_types, const char *_constants, const char *_commands,
              const FloatStatementUsageFlags _statementUsageFlags = 0)
        : name(_name)
        , floatUsage(_floatUsage)
        , annotations(_annotations)
        , types(_types)
        , constants(_constants)
        , variables("")
        , functions("")
        , commands(_commands)
        , isInputTypeRestricted(true)
        , restrictedInputType(_inputType)
        , isSpecConstant(false)
        , statementUsageFlags(_statementUsageFlags)
    {
    }
};

// Class storing input that will be passed to operation and expected
// output that should be generated for specified behaviour.
class OperationTestCase
{
public:
    OperationTestCase()
    {
    }

    OperationTestCase(const char *_baseName, BehaviorFlags _behaviorFlags, OperationId _operationId, ValueId _input1,
                      ValueId _input2, ValueId _expectedOutput, bool _fp16Without16BitStorage = false)
        : behaviorFlags(_behaviorFlags)
        , operationId(_operationId)
        , expectedOutput(_expectedOutput)
        , fp16Without16BitStorage(_fp16Without16BitStorage)
    {
        baseName = _baseName;
        if (fp16Without16BitStorage)
            baseName += "_nostorage";
        input[0] = _input1;
        input[1] = _input2;
    }

public:
    string baseName;
    BehaviorFlags behaviorFlags;
    OperationId operationId;
    ValueId input[2];
    ValueId expectedOutput;
    bool fp16Without16BitStorage;
};

// Helper structure used to store specialized operation
// data. This data is ready to be used during shader assembly.
struct SpecializedOperation
{
    string constants;
    string annotations;
    string types;
    string arguments;
    string variables;
    string functions;
    string commands;

    VariableType inVariableType;
    TypeSnippetsSP inTypeSnippets;
    TypeSnippetsSP outTypeSnippets;
    FloatStatementUsageFlags argumentsUsesFloatConstant;
};

// Class responsible for constructing list of test cases for specified
// float type and specified way of preparation of arguments.
// Arguments can be either read from input SSBO or generated via math
// operations in spir-v code.
class TestCasesBuilder
{
public:
    void init();
    void build(vector<OperationTestCase> &testCases, TypeTestResultsSP typeTestResults, bool argumentsFromInput);
    const Operation &getOperation(OperationId id) const;

private:
    void createUnaryTestCases(vector<OperationTestCase> &testCases, OperationId operationId,
                              ValueId denormPreserveResult, ValueId denormFTZResult,
                              bool fp16WithoutStorage = false) const;

private:
    // Operations are shared betwean test cases so they are
    // passed to them as pointers to data stored in TestCasesBuilder.
    typedef OperationTestCase OTC;
    typedef Operation Op;
    map<int, Op> m_operations;
    // SPIR-V assembly snippets that are used in m_operations
    vector<std::string> m_saved_strings;

    // We expect 12 strings: 3 kinds of narrowing conversions, with
    // 4 cases each.
    const size_t m_num_expected_strings = 12;
    // Saves the given string in m_strings, and returns a pointer to its data.
    const char *save(std::string str)
    {
        m_saved_strings.emplace_back(std::move(str));
        return m_saved_strings.back().data();
    }
};

void TestCasesBuilder::init()
{
    map<int, Op> &mo = m_operations;
    m_saved_strings.reserve(m_num_expected_strings);

    // predefine operations repeatedly used in tests; note that "_valueType"
    // in every operation command will be replaced with either "_f16",
    // "_f32", "_f64", "_ui16", "ui32", "_ui64", "_i16", "_i32", "_i64"
    // StringTemplate is not used here because it would make code less
    // readable m_operations contains generic operation definitions that
    // can be used for all float types

    mo[OID_NEGATE]    = Op("negate", FLOAT_ARITHMETIC, "%result             = OpFNegate %type_valueType %arg1\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_COMPOSITE] = Op("composite", FLOAT_ARITHMETIC,
                           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                           "%result             = OpCompositeExtract %type_valueType %vec1 0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_COMPOSITE_INS] =
        Op("comp_ins", FLOAT_ARITHMETIC,
           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %c_valueType_0 %c_valueType_0\n"
           "%vec2               = OpCompositeInsert %type_valueType_vec2 %arg1 %vec1 0\n"
           "%result             = OpCompositeExtract %type_valueType %vec2 0\n",
           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_COPY]      = Op("copy", FLOAT_STORAGE_ONLY, "%result             = OpCopyObject %type_valueType %arg1\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_D_EXTRACT] = Op("extract", FLOAT_ARITHMETIC,
                           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                           "%result             = OpVectorExtractDynamic %type_valueType %vec1 %c_i32_0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_D_INSERT] =
        Op("insert", FLOAT_ARITHMETIC,
           "%tmpVec             = OpCompositeConstruct %type_valueType_vec2 %c_valueType_2 %c_valueType_2\n"
           "%vec1               = OpVectorInsertDynamic %type_valueType_vec2 %tmpVec %arg1 %c_i32_0\n"
           "%result             = OpCompositeExtract %type_valueType %vec1 0\n",
           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SHUFFLE] = Op(
        "shuffle", FLOAT_ARITHMETIC,
        "%tmpVec1            = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
        "%tmpVec2            = OpCompositeConstruct %type_valueType_vec2 %c_valueType_2 "
        "%c_valueType_2\n" // NOTE: its impossible to test shuffle with denorms flushed
        "%vec1               = OpVectorShuffle %type_valueType_vec2 %tmpVec1 %tmpVec2 0 2\n" //       to zero as this will be done by earlier operation
        "%result             = OpCompositeExtract %type_valueType %vec1 0\n", //       (this also applies to few other operations)
        B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_TRANSPOSE]  = Op("transpose", FLOAT_ARITHMETIC,
                            "%col                = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                             "%mat                = OpCompositeConstruct %type_valueType_mat2x2 %col %col\n"
                             "%tmat               = OpTranspose %type_valueType_mat2x2 %mat\n"
                             "%tcol               = OpCompositeExtract %type_valueType_vec2 %tmat 0\n"
                             "%result             = OpCompositeExtract %type_valueType %tcol 0\n",
                            B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_RETURN_VAL] = Op("ret_val", FLOAT_ARITHMETIC, "",
                            "%type_test_fun      = OpTypeFunction %type_valueType %type_valueType\n", "", "",
                            "%test_fun = OpFunction %type_valueType None %type_test_fun\n"
                            "%param = OpFunctionParameter %type_valueType\n"
                            "%entry = OpLabel\n"
                            "OpReturnValue %param\n"
                            "OpFunctionEnd\n",
                            "%result             = OpFunctionCall %type_valueType %test_fun %arg1\n",
                            B_STATEMENT_USAGE_TYPES_TYPE_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);

    // conversion operations that are meant to be used only for single output type (defined by the second number in name)
    const char *convertSource = "%result             = OpFConvert %type_valueType %arg1\n";
    mo[OID_CONV_FROM_FP16] =
        Op("conv_from_fp16", FLOAT_STORAGE_ONLY, false, FP16, "", convertSource, B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_CONV_FROM_FP32] =
        Op("conv_from_fp32", FLOAT_STORAGE_ONLY, false, FP32, "", convertSource, B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_CONV_FROM_FP64] =
        Op("conv_from_fp64", FLOAT_STORAGE_ONLY, false, FP64, "", convertSource, B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);

    const char *convertFromUintSource = "%result             = OpConvertUToF %type_valueType %arg1\n";
    mo[OID_CONV_FROM_UINT_TO_FP32]    = Op("conv_uint_to_fp32", FLOAT_STORAGE_ONLY, false, UINT32, "",
                                           convertFromUintSource, B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_CONV_FROM_UINT_TO_FP64]    = Op("conv_uint_to_fp64", FLOAT_STORAGE_ONLY, false, UINT64, "",
                                           convertFromUintSource, B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    const char *convertFromIntSource  = "%result             = OpConvertSToF %type_valueType %arg1\n";
    mo[OID_CONV_FROM_INT_TO_FP32] = Op("conv_uint_to_fp32", FLOAT_STORAGE_ONLY, false, INT32, "", convertFromIntSource,
                                       B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_CONV_FROM_INT_TO_FP64] = Op("conv_uint_to_fp64", FLOAT_STORAGE_ONLY, false, INT64, "", convertFromIntSource,
                                       B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);

    // From all operands supported by OpSpecConstantOp we can only test FConvert opcode with literals as everything
    // else requires Karnel capability (OpenCL); values of literals used in SPIR-V code must be equivalent to
    // the values V_CONV_FROM_....  Use the feature of the SPIR-V assembler where use ! to inject raw integer
    // words into the SPIR-V binary.

    // fp32 -> fp16 with cases UP, DOWN, TIE_UP, TIE_DOWN
    typedef conversionDetail<Float32, Float16> conv32to16;
    mo[OID_SCONST_CONV_FROM_FP32_TO_FP16_UP] =
        Op("sconst_conv_from_fp32_up", FLOAT_ARITHMETIC, true, FP32,
           save("%c_arg              = OpConstant %type_f32 !" + conv32to16::fromStr(Round::UP) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP32);
    mo[OID_SCONST_CONV_FROM_FP32_TO_FP16_DOWN] =
        Op("sconst_conv_from_fp32_down", FLOAT_ARITHMETIC, true, FP32,
           save("%c_arg              = OpConstant %type_f32 !" + conv32to16::fromStr(Round::DOWN) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP32);
    mo[OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_UP] =
        Op("sconst_conv_from_fp32_tie_up", FLOAT_ARITHMETIC, true, FP32,
           save("%c_arg              = OpConstant %type_f32 !" + conv32to16::fromStr(Round::TIE_UP) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP32);
    mo[OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_DOWN] =
        Op("sconst_conv_from_fp32_tie_down", FLOAT_ARITHMETIC, true, FP32,
           save("%c_arg              = OpConstant %type_f32 !" + conv32to16::fromStr(Round::TIE_DOWN) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP32);

    // fp64 -> fp32 with cases UP, DOWN, TIE_UP, TIE_DOWN
    // To inject a 64 bit value, inject 2 32-bit words.
    typedef conversionDetail<Float64, Float32> conv64to32;
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP32_UP] =
        Op("sconst_conv_from_fp64_up", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to32::fromStr(Round::UP) +
                "\n"
                "%result             = OpSpecConstantOp %type_f32 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP32 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP32_DOWN] =
        Op("sconst_conv_from_fp64_down", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to32::fromStr(Round::DOWN) +
                "\n"
                "%result             = OpSpecConstantOp %type_f32 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP32 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_UP] =
        Op("sconst_conv_from_fp64_tie_up", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to32::fromStr(Round::TIE_UP) +
                "\n"
                "%result             = OpSpecConstantOp %type_f32 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP32 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_DOWN] =
        Op("sconst_conv_from_fp64_tie_down", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to32::fromStr(Round::TIE_DOWN) +
                "\n"
                "%result             = OpSpecConstantOp %type_f32 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP32 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);

    // fp64 -> fp16 with cases UP, DOWN, TIE_UP, TIE_DOWN
    typedef conversionDetail<Float64, Float16> conv64to16;
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP16_UP] =
        Op("sconst_conv_from_fp64_up", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to16::fromStr(Round::UP) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP16_DOWN] =
        Op("sconst_conv_from_fp64_down", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to16::fromStr(Round::DOWN) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_UP] =
        Op("sconst_conv_from_fp64_tie_up", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to16::fromStr(Round::TIE_UP) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);
    mo[OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_DOWN] =
        Op("sconst_conv_from_fp64_tie_down", FLOAT_ARITHMETIC, true, FP64,
           save("%c_arg              = OpConstant %type_f64 !" + conv64to16::fromStr(Round::TIE_DOWN) +
                "\n"
                "%result             = OpSpecConstantOp %type_f16 FConvert %c_arg\n"),
           "", B_STATEMENT_USAGE_CONSTS_TYPE_FP16 | B_STATEMENT_USAGE_CONSTS_TYPE_FP64);

    mo[OID_ADD]       = Op("add", FLOAT_ARITHMETIC, "%result             = OpFAdd %type_valueType %arg1 %arg2\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SUB]       = Op("sub", FLOAT_ARITHMETIC, "%result             = OpFSub %type_valueType %arg1 %arg2\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MUL]       = Op("mul", FLOAT_ARITHMETIC, "%result             = OpFMul %type_valueType %arg1 %arg2\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_DIV]       = Op("div", FLOAT_ARITHMETIC, "%result             = OpFDiv %type_valueType %arg1 %arg2\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_REM]       = Op("rem", FLOAT_ARITHMETIC, "%result             = OpFRem %type_valueType %arg1 %arg2\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MOD]       = Op("mod", FLOAT_ARITHMETIC, "%result             = OpFMod %type_valueType %arg1 %arg2\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_PHI]       = Op("phi", FLOAT_ARITHMETIC,
                           "%comp               = OpFOrdGreaterThan %type_bool %arg1 %arg2\n"
                                 "                      OpSelectionMerge %comp_merge None\n"
                                 "                      OpBranchConditional %comp %true_branch %false_branch\n"
                                 "%true_branch        = OpLabel\n"
                                 "                      OpBranch %comp_merge\n"
                                 "%false_branch       = OpLabel\n"
                                 "                      OpBranch %comp_merge\n"
                                 "%comp_merge         = OpLabel\n"
                                 "%result             = OpPhi %type_valueType %arg2 %true_branch %arg1 %false_branch\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SELECT]    = Op("select", FLOAT_ARITHMETIC,
                           "%always_true        = OpFOrdGreaterThan %type_bool %c_valueType_1 %c_valueType_0\n"
                              "%result             = OpSelect %type_valueType %always_true %arg1 %arg2\n",
                           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_DOT]       = Op("dot", FLOAT_ARITHMETIC,
                           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                                 "%vec2               = OpCompositeConstruct %type_valueType_vec2 %arg2 %arg2\n"
                                 "%result             = OpDot %type_valueType %vec1 %vec2\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_VEC_MUL_S] = Op("vmuls", FLOAT_ARITHMETIC,
                           "%vec                = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                           "%tmpVec             = OpVectorTimesScalar %type_valueType_vec2 %vec %arg2\n"
                           "%result             = OpCompositeExtract %type_valueType %tmpVec 0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_VEC_MUL_M] = Op("vmulm", FLOAT_ARITHMETIC,
                           "%col                = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                           "%mat                = OpCompositeConstruct %type_valueType_mat2x2 %col %col\n"
                           "%vec                = OpCompositeConstruct %type_valueType_vec2 %arg2 %arg2\n"
                           "%tmpVec             = OpVectorTimesMatrix %type_valueType_vec2 %vec %mat\n"
                           "%result             = OpCompositeExtract %type_valueType %tmpVec 0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MAT_MUL_S] = Op("mmuls", FLOAT_ARITHMETIC,
                           "%col                = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                           "%mat                = OpCompositeConstruct %type_valueType_mat2x2 %col %col\n"
                           "%mulMat             = OpMatrixTimesScalar %type_valueType_mat2x2 %mat %arg2\n"
                           "%extCol             = OpCompositeExtract %type_valueType_vec2 %mulMat 0\n"
                           "%result             = OpCompositeExtract %type_valueType %extCol 0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MAT_MUL_V] = Op("mmulv", FLOAT_ARITHMETIC,
                           "%col                = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                           "%mat                = OpCompositeConstruct %type_valueType_mat2x2 %col %col\n"
                           "%vec                = OpCompositeConstruct %type_valueType_vec2 %arg2 %arg2\n"
                           "%mulVec             = OpMatrixTimesVector %type_valueType_vec2 %mat %vec\n"
                           "%result             = OpCompositeExtract %type_valueType %mulVec 0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MAT_MUL_M] = Op("mmulm", FLOAT_ARITHMETIC,
                           "%col1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                           "%mat1               = OpCompositeConstruct %type_valueType_mat2x2 %col1 %col1\n"
                           "%col2               = OpCompositeConstruct %type_valueType_vec2 %arg2 %arg2\n"
                           "%mat2               = OpCompositeConstruct %type_valueType_mat2x2 %col2 %col2\n"
                           "%mulMat             = OpMatrixTimesMatrix %type_valueType_mat2x2 %mat1 %mat2\n"
                           "%extCol             = OpCompositeExtract %type_valueType_vec2 %mulMat 0\n"
                           "%result             = OpCompositeExtract %type_valueType %extCol 0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_OUT_PROD]  = Op("out_prod", FLOAT_ARITHMETIC,
                           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                            "%vec2               = OpCompositeConstruct %type_valueType_vec2 %arg2 %arg2\n"
                            "%mulMat             = OpOuterProduct %type_valueType_mat2x2 %vec1 %vec2\n"
                            "%extCol             = OpCompositeExtract %type_valueType_vec2 %mulMat 0\n"
                            "%result             = OpCompositeExtract %type_valueType %extCol 0\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);

    // comparison operations
    mo[OID_ORD_EQ]   = Op("ord_eq", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFOrdEqual %type_bool %arg1 %arg2\n"
                            "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_UORD_EQ]  = Op("uord_eq", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFUnordEqual %type_bool %arg1 %arg2\n"
                           "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ORD_NEQ]  = Op("ord_neq", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFOrdNotEqual %type_bool %arg1 %arg2\n"
                           "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_UORD_NEQ] = Op("uord_neq", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFUnordNotEqual %type_bool %arg1 %arg2\n"
                          "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ORD_LS]   = Op("ord_ls", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFOrdLessThan %type_bool %arg1 %arg2\n"
                            "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_UORD_LS]  = Op("uord_ls", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFUnordLessThan %type_bool %arg1 %arg2\n"
                           "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ORD_GT]   = Op("ord_gt", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFOrdGreaterThan %type_bool %arg1 %arg2\n"
                            "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_UORD_GT]  = Op("uord_gt", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFUnordGreaterThan %type_bool %arg1 %arg2\n"
                           "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ORD_LE]   = Op("ord_le", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFOrdLessThanEqual %type_bool %arg1 %arg2\n"
                            "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_UORD_LE]  = Op("uord_le", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFUnordLessThanEqual %type_bool %arg1 %arg2\n"
                           "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ORD_GE]   = Op("ord_ge", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFOrdGreaterThanEqual %type_bool %arg1 %arg2\n"
                            "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_UORD_GE]  = Op("uord_ge", FLOAT_ARITHMETIC,
                          "%boolVal           = OpFUnordGreaterThanEqual %type_bool %arg1 %arg2\n"
                           "%result            = OpSelect %type_valueType %boolVal %c_valueType_1 %c_valueType_0\n",
                          B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);

    mo[OID_ATAN2] =
        Op("atan2", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Atan2 %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_POW] =
        Op("pow", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Pow %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MIX] = Op("mix", FLOAT_ARITHMETIC,
                     "%result             = OpExtInst %type_valueType %std450 FMix %arg1 %arg2 %c_valueType_0_5\n",
                     B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_FMA] = Op("fma", FLOAT_ARITHMETIC,
                     "%result             = OpExtInst %type_valueType %std450 Fma %arg1 %arg2 %c_valueType_0_5\n",
                     B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MIN] =
        Op("min", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 FMin %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MAX] =
        Op("max", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 FMax %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_CLAMP] = Op("clamp", FLOAT_ARITHMETIC,
                       "%result             = OpExtInst %type_valueType %std450 FClamp %arg1 %arg2 %arg2\n",
                       B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_STEP] =
        Op("step", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Step %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SSTEP] =
        Op("sstep", FLOAT_ARITHMETIC,
           "%result             = OpExtInst %type_valueType %std450 SmoothStep %arg1 %arg2 %c_valueType_0_5\n",
           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_DIST]  = Op("distance", FLOAT_ARITHMETIC,
                       "%result             = OpExtInst %type_valueType %std450 Distance %arg1 %arg2\n",
                       B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_CROSS] = Op("cross", FLOAT_ARITHMETIC,
                       "%vec1               = OpCompositeConstruct %type_valueType_vec3 %arg1 %arg1 %arg1\n"
                       "%vec2               = OpCompositeConstruct %type_valueType_vec3 %arg2 %arg2 %arg2\n"
                       "%tmpVec             = OpExtInst %type_valueType_vec3 %std450 Cross %vec1 %vec2\n"
                       "%result             = OpCompositeExtract %type_valueType %tmpVec 0\n",
                       B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_FACE_FWD] =
        Op("face_fwd", FLOAT_ARITHMETIC,
           "%result             = OpExtInst %type_valueType %std450 FaceForward %c_valueType_1 %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_NMIN] =
        Op("nmin", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 NMin %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_NMAX] =
        Op("nmax", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 NMax %arg1 %arg2\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_NCLAMP] = Op("nclamp", FLOAT_ARITHMETIC,
                        "%result             = OpExtInst %type_valueType %std450 NClamp %arg2 %arg1 %arg2\n",
                        B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);

    mo[OID_ROUND] =
        Op("round", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Round %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ROUND_EV] =
        Op("round_ev", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 RoundEven %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_TRUNC] =
        Op("trunc", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Trunc %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ABS]  = Op("abs", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 FAbs %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SIGN] = Op("sign", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 FSign %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_FLOOR] =
        Op("floor", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Floor %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_CEIL] = Op("ceil", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Ceil %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_FRACT] =
        Op("fract", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Fract %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_RADIANS] =
        Op("radians", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Radians %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_DEGREES] =
        Op("degrees", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Degrees %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SIN]  = Op("sin", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Sin %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_COS]  = Op("cos", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Cos %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_TAN]  = Op("tan", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Tan %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ASIN] = Op("asin", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Asin %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ACOS] = Op("acos", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Acos %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ATAN] = Op("atan", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Atan %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SINH] = Op("sinh", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Sinh %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_COSH] = Op("cosh", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Cosh %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_TANH] = Op("tanh", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Tanh %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ASINH] =
        Op("asinh", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Asinh %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ACOSH] =
        Op("acosh", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Acosh %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_ATANH] =
        Op("atanh", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Atanh %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_EXP]  = Op("exp", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Exp %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_LOG]  = Op("log", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Log %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_EXP2] = Op("exp2", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Exp2 %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_LOG2] = Op("log2", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Log2 %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_SQRT] = Op("sqrt", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Sqrt %arg1\n",
                      B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_INV_SQRT] =
        Op("inv_sqrt", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 InverseSqrt %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MODF] =
        Op("modf", FLOAT_ARITHMETIC, "", "", "", "%tmpVarPtr          = OpVariable %type_valueType_fptr Function\n", "",
           "%result             = OpExtInst %type_valueType %std450 Modf %arg1 %tmpVarPtr\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MODF_ST] = Op("modf_st", FLOAT_ARITHMETIC,
                         "OpMemberDecorate %struct_ff 0 Offset 0\n"
                         "OpMemberDecorate %struct_ff 1 Offset ${float_width}\n",
                         "%struct_ff          = OpTypeStruct %type_valueType %type_valueType\n"
                         "%struct_ff_fptr     = OpTypePointer Function %struct_ff\n",
                         "", "%tmpStructPtr       = OpVariable %struct_ff_fptr Function\n", "",
                         "%tmpStruct          = OpExtInst %struct_ff %std450 ModfStruct %arg1\n"
                         "                      OpStore %tmpStructPtr %tmpStruct\n"
                         "%tmpLoc             = OpAccessChain %type_valueType_fptr %tmpStructPtr %c_i32_0\n"
                         "%result             = OpLoad %type_valueType %tmpLoc\n",
                         B_STATEMENT_USAGE_TYPES_TYPE_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_FREXP] =
        Op("frexp", FLOAT_ARITHMETIC, "", "", "", "%tmpVarPtr          = OpVariable %type_i32_fptr Function\n", "",
           "%result             = OpExtInst %type_valueType %std450 Frexp %arg1 %tmpVarPtr\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_FREXP_ST] = Op("frexp_st", FLOAT_ARITHMETIC,
                          "OpMemberDecorate %struct_fi 0 Offset 0\n"
                          "OpMemberDecorate %struct_fi 1 Offset ${float_width}\n",
                          "%struct_fi          = OpTypeStruct %type_valueType %type_i32\n"
                          "%struct_fi_fptr     = OpTypePointer Function %struct_fi\n",
                          "", "%tmpStructPtr       = OpVariable %struct_fi_fptr Function\n", "",
                          "%tmpStruct          = OpExtInst %struct_fi %std450 FrexpStruct %arg1\n"
                          "                      OpStore %tmpStructPtr %tmpStruct\n"
                          "%tmpLoc             = OpAccessChain %type_valueType_fptr %tmpStructPtr %c_i32_0\n"
                          "%result             = OpLoad %type_valueType %tmpLoc\n",
                          B_STATEMENT_USAGE_TYPES_TYPE_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_LENGTH] =
        Op("length", FLOAT_ARITHMETIC, "%result             = OpExtInst %type_valueType %std450 Length %arg1\n",
           B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_NORMALIZE] = Op("normalize", FLOAT_ARITHMETIC,
                           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %c_valueType_2\n"
                           "%tmpVec             = OpExtInst %type_valueType_vec2 %std450 Normalize %vec1\n"
                           "%result             = OpCompositeExtract %type_valueType %tmpVec 0\n",
                           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_REFLECT] =
        Op("reflect", FLOAT_ARITHMETIC,
           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
           "%vecN               = OpCompositeConstruct %type_valueType_vec2 %c_valueType_0 %c_valueType_n1\n"
           "%tmpVec             = OpExtInst %type_valueType_vec2 %std450 Reflect %vec1 %vecN\n"
           "%result             = OpCompositeExtract %type_valueType %tmpVec 0\n",
           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_REFRACT] =
        Op("refract", FLOAT_ARITHMETIC,
           "%vec1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
           "%vecN               = OpCompositeConstruct %type_valueType_vec2 %c_valueType_0 %c_valueType_n1\n"
           "%tmpVec             = OpExtInst %type_valueType_vec2 %std450 Refract %vec1 %vecN %c_valueType_0_5\n"
           "%result             = OpCompositeExtract %type_valueType %tmpVec 0\n",
           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MAT_DET] = Op("mat_det", FLOAT_ARITHMETIC,
                         "%col                = OpCompositeConstruct %type_valueType_vec2 %arg1 %arg1\n"
                         "%mat                = OpCompositeConstruct %type_valueType_mat2x2 %col %col\n"
                         "%result             = OpExtInst %type_valueType %std450 Determinant %mat\n",
                         B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);
    mo[OID_MAT_INV] =
        Op("mat_inv", FLOAT_ARITHMETIC,
           "%col1               = OpCompositeConstruct %type_valueType_vec2 %arg1 %c_valueType_1\n"
           "%col2               = OpCompositeConstruct %type_valueType_vec2 %c_valueType_1 %c_valueType_1\n"
           "%mat                = OpCompositeConstruct %type_valueType_mat2x2 %col1 %col2\n"
           "%invMat             = OpExtInst %type_valueType_mat2x2 %std450 MatrixInverse %mat\n"
           "%extCol             = OpCompositeExtract %type_valueType_vec2 %invMat 1\n"
           "%result             = OpCompositeExtract %type_valueType %extCol 1\n",
           B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_TYPE_FLOAT);

    // PackHalf2x16 is a special case as it operates on fp32 vec2 and returns unsigned int,
    // the verification is done in SPIR-V code (if result is correct 1.0 will be written to SSBO)
    mo[OID_PH_DENORM] =
        Op("ph_denorm", FLOAT_STORAGE_ONLY, "", "",
           "%c_fp32_denorm_fp16 = OpConstant %type_f32 6.01e-5\n" // fp32 representation of fp16 denorm value
           "%c_ref              = OpConstant %type_u32 66061296\n",
           "", "",
           "%srcVec             = OpCompositeConstruct %type_f32_vec2 %c_fp32_denorm_fp16 %c_fp32_denorm_fp16\n"
           "%packedInt          = OpExtInst %type_u32 %std450 PackHalf2x16 %srcVec\n"
           "%boolVal            = OpIEqual %type_bool %c_ref %packedInt\n"
           "%result             = OpSelect %type_f32 %boolVal %c_f32_1 %c_f32_0\n",
           B_STATEMENT_USAGE_CONSTS_TYPE_FP32 | B_STATEMENT_USAGE_COMMANDS_CONST_FP32 |
               B_STATEMENT_USAGE_COMMANDS_TYPE_FP32);

    // UnpackHalf2x16 is a special case that operates on uint32 and returns two 32-bit floats,
    // this function is tested using constants
    mo[OID_UPH_DENORM] = Op("uph_denorm", FLOAT_STORAGE_ONLY, "", "",
                            "%c_u32_2_16_pack    = OpConstant %type_u32 66061296\n", // == packHalf2x16(vec2(denorm))
                            "", "",
                            "%tmpVec             = OpExtInst %type_f32_vec2 %std450 UnpackHalf2x16 %c_u32_2_16_pack\n"
                            "%result             = OpCompositeExtract %type_f32 %tmpVec 0\n",
                            B_STATEMENT_USAGE_COMMANDS_TYPE_FP32);

    // PackDouble2x32 is a special case that operates on two uint32 and returns
    // double, this function is tested using constants
    mo[OID_PD_DENORM] = Op("pd_denorm", FLOAT_STORAGE_ONLY, "", "",
                           "%c_p1               = OpConstant %type_u32 0\n"
                           "%c_p2               = OpConstant %type_u32 262144\n", // == UnpackDouble2x32(denorm)
                           "", "",
                           "%srcVec             = OpCompositeConstruct %type_u32_vec2 %c_p1 %c_p2\n"
                           "%result             = OpExtInst %type_f64 %std450 PackDouble2x32 %srcVec\n",
                           B_STATEMENT_USAGE_COMMANDS_TYPE_FP64);

    // UnpackDouble2x32 is a special case as it operates only on FP64 and returns two ints,
    // the verification is done in SPIR-V code (if result is correct 1.0 will be written to SSBO)
    const char *unpackDouble2x32Types = "%type_bool_vec2     = OpTypeVector %type_bool 2\n";
    const char *unpackDouble2x32Source =
        "%refVec2            = OpCompositeConstruct %type_u32_vec2 %c_p1 %c_p2\n"
        "%resVec2            = OpExtInst %type_u32_vec2 %std450 UnpackDouble2x32 %arg1\n"
        "%boolVec2           = OpIEqual %type_bool_vec2 %refVec2 %resVec2\n"
        "%boolVal            = OpAll %type_bool %boolVec2\n"
        "%result             = OpSelect %type_f64 %boolVal %c_f64_1 %c_f64_0\n";
    mo[OID_UPD_DENORM_FLUSH]    = Op("upd_denorm", FLOAT_STORAGE_ONLY, "", unpackDouble2x32Types,
                                     "%c_p1               = OpConstant %type_u32 0\n"
                                        "%c_p2               = OpConstant %type_u32 0\n",
                                     "", "", unpackDouble2x32Source,
                                     B_STATEMENT_USAGE_COMMANDS_CONST_FP64 | B_STATEMENT_USAGE_COMMANDS_TYPE_FP64);
    mo[OID_UPD_DENORM_PRESERVE] = Op("upd_denorm", FLOAT_STORAGE_ONLY, "", unpackDouble2x32Types,
                                     "%c_p1               = OpConstant %type_u32 1008\n"
                                     "%c_p2               = OpConstant %type_u32 0\n",
                                     "", "", unpackDouble2x32Source,
                                     B_STATEMENT_USAGE_COMMANDS_CONST_FP64 | B_STATEMENT_USAGE_COMMANDS_TYPE_FP64);

    mo[OID_ORTE_ROUND] = Op("orte_round", FLOAT_STORAGE_ONLY, FP32, "OpDecorate %result FPRoundingMode RTE\n", "", "",
                            "%result             = OpFConvert %type_f16 %arg1\n", B_STATEMENT_USAGE_COMMANDS_TYPE_FP16);
    mo[OID_ORTZ_ROUND] = Op("ortz_round", FLOAT_STORAGE_ONLY, FP32, "OpDecorate %result FPRoundingMode RTZ\n", "", "",
                            "%result             = OpFConvert %type_f16 %arg1\n", B_STATEMENT_USAGE_COMMANDS_TYPE_FP16);

    DE_ASSERT(m_saved_strings.size() == m_num_expected_strings);
}

void TestCasesBuilder::build(vector<OperationTestCase> &testCases, TypeTestResultsSP typeTestResults,
                             bool argumentsFromInput)
{
    // this method constructs a list of test cases; this list is a bit different
    // for every combination of float type, arguments preparation method and tested float control

    testCases.reserve(750);

    bool isFP16 = typeTestResults->variableType() == FP16;

    for (int j = 0; j < 2; j++)
    {
        // fp16NoStorage tests only supported if testing fp16.
        bool fp16NoStorage = (j == 1);
        if (fp16NoStorage && !isFP16)
            continue;

        // Denorm - FlushToZero - binary operations
        for (size_t i = 0; i < typeTestResults->binaryOpFTZ.size(); ++i)
        {
            const BinaryCase &binaryCase = typeTestResults->binaryOpFTZ[i];
            OperationId operation        = binaryCase.operationId;
            testCases.push_back(OTC("denorm_op_var_flush_to_zero", B_DENORM_FLUSH, operation, V_DENORM, V_ONE,
                                    binaryCase.opVarResult, fp16NoStorage));
            testCases.push_back(OTC("denorm_op_denorm_flush_to_zero", B_DENORM_FLUSH, operation, V_DENORM, V_DENORM,
                                    binaryCase.opDenormResult, fp16NoStorage));
            testCases.push_back(OTC("denorm_op_inf_flush_to_zero", B_DENORM_FLUSH | B_ZIN_PRESERVE, operation, V_DENORM,
                                    V_INF, binaryCase.opInfResult, fp16NoStorage));
            testCases.push_back(OTC("denorm_op_nan_flush_to_zero", B_DENORM_FLUSH | B_ZIN_PRESERVE, operation, V_DENORM,
                                    V_NAN, binaryCase.opNanResult, fp16NoStorage));
        }

        // Denorm - FlushToZero - unary operations
        for (size_t i = 0; i < typeTestResults->unaryOpFTZ.size(); ++i)
        {
            const UnaryCase &unaryCase = typeTestResults->unaryOpFTZ[i];
            OperationId operation      = unaryCase.operationId;
            testCases.push_back(OTC("op_denorm_flush_to_zero", B_DENORM_FLUSH, operation, V_DENORM, V_UNUSED,
                                    unaryCase.result, fp16NoStorage));
        }

        // Denorm - Preserve - binary operations
        for (size_t i = 0; i < typeTestResults->binaryOpDenormPreserve.size(); ++i)
        {
            const BinaryCase &binaryCase = typeTestResults->binaryOpDenormPreserve[i];
            OperationId operation        = binaryCase.operationId;
            testCases.push_back(OTC("denorm_op_var_preserve", B_DENORM_PRESERVE, operation, V_DENORM, V_ONE,
                                    binaryCase.opVarResult, fp16NoStorage));
            testCases.push_back(OTC("denorm_op_denorm_preserve", B_DENORM_PRESERVE, operation, V_DENORM, V_DENORM,
                                    binaryCase.opDenormResult, fp16NoStorage));
            testCases.push_back(OTC("denorm_op_inf_preserve", B_DENORM_PRESERVE | B_ZIN_PRESERVE, operation, V_DENORM,
                                    V_INF, binaryCase.opInfResult, fp16NoStorage));
            testCases.push_back(OTC("denorm_op_nan_preserve", B_DENORM_PRESERVE | B_ZIN_PRESERVE, operation, V_DENORM,
                                    V_NAN, binaryCase.opNanResult, fp16NoStorage));
        }

        // Denorm - Preserve - unary operations
        for (size_t i = 0; i < typeTestResults->unaryOpDenormPreserve.size(); ++i)
        {
            const UnaryCase &unaryCase = typeTestResults->unaryOpDenormPreserve[i];
            OperationId operation      = unaryCase.operationId;
            testCases.push_back(OTC("op_denorm_preserve", B_DENORM_PRESERVE, operation, V_DENORM, V_UNUSED,
                                    unaryCase.result, fp16NoStorage));
        }
    }

    struct ZINCase
    {
        OperationId operationId;
        bool supportedByFP64;
        ValueId secondArgument;
        ValueId preserveZeroResult;
        ValueId preserveSZeroResult;
        ValueId preserveInfResult;
        ValueId preserveSInfResult;
        ValueId preserveNanResult;
    };

    const ZINCase binaryOpZINPreserve[] = {
        // operation        fp64    second arg        preserve zero    preserve szero        preserve inf    preserve sinf        preserve nan
        {OID_PHI, true, V_INF, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_SELECT, true, V_ONE, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_ADD, true, V_ZERO, V_ZERO, V_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_SUB, true, V_ZERO, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_MUL, true, V_ONE, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
    };

    const ZINCase unaryOpZINPreserve[] = {
        // operation                fp64    second arg        preserve zero    preserve szero        preserve inf    preserve sinf        preserve nan
        {OID_RETURN_VAL, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_D_EXTRACT, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_D_INSERT, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_SHUFFLE, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_COMPOSITE, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_COMPOSITE_INS, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_COPY, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_TRANSPOSE, true, V_UNUSED, V_ZERO, V_MINUS_ZERO, V_INF, V_MINUS_INF, V_NAN},
        {OID_NEGATE, true, V_UNUSED, V_MINUS_ZERO, V_ZERO, V_MINUS_INF, V_INF, V_NAN},
    };

    bool isFP64 = typeTestResults->variableType() == FP64;

    // Signed Zero Inf Nan - Preserve - binary operations
    for (int j = 0; j < 2; j++)
    {
        // fp16NoStorage tests only supported if testing fp16.
        bool fp16NoStorage = (j == 1);
        if (fp16NoStorage && !isFP16)
            continue;

        for (size_t i = 0; i < DE_LENGTH_OF_ARRAY(binaryOpZINPreserve); ++i)
        {
            const ZINCase &zc = binaryOpZINPreserve[i];
            if (isFP64 && !zc.supportedByFP64)
                continue;

            testCases.push_back(OTC("zero_op_var_preserve", B_ZIN_PRESERVE, zc.operationId, V_ZERO, zc.secondArgument,
                                    zc.preserveZeroResult, fp16NoStorage));
            testCases.push_back(OTC("signed_zero_op_var_preserve", B_ZIN_PRESERVE, zc.operationId, V_MINUS_ZERO,
                                    zc.secondArgument, zc.preserveSZeroResult, fp16NoStorage));
            testCases.push_back(OTC("inf_op_var_preserve", B_ZIN_PRESERVE, zc.operationId, V_INF, zc.secondArgument,
                                    zc.preserveInfResult, fp16NoStorage));
            testCases.push_back(OTC("signed_inf_op_var_preserve", B_ZIN_PRESERVE, zc.operationId, V_MINUS_INF,
                                    zc.secondArgument, zc.preserveSInfResult, fp16NoStorage));
            testCases.push_back(OTC("nan_op_var_preserve", B_ZIN_PRESERVE, zc.operationId, V_NAN, zc.secondArgument,
                                    zc.preserveNanResult, fp16NoStorage));
        }

        // Signed Zero Inf Nan - Preserve - unary operations
        for (size_t i = 0; i < DE_LENGTH_OF_ARRAY(unaryOpZINPreserve); ++i)
        {
            const ZINCase &zc = unaryOpZINPreserve[i];
            if (isFP64 && !zc.supportedByFP64)
                continue;

            testCases.push_back(OTC("op_zero_preserve", B_ZIN_PRESERVE, zc.operationId, V_ZERO, V_UNUSED,
                                    zc.preserveZeroResult, fp16NoStorage));
            testCases.push_back(OTC("op_signed_zero_preserve", B_ZIN_PRESERVE, zc.operationId, V_MINUS_ZERO, V_UNUSED,
                                    zc.preserveSZeroResult, fp16NoStorage));
            testCases.push_back(OTC("op_inf_preserve", B_ZIN_PRESERVE, zc.operationId, V_INF, V_UNUSED,
                                    zc.preserveInfResult, fp16NoStorage));
            testCases.push_back(OTC("op_signed_inf_preserve", B_ZIN_PRESERVE, zc.operationId, V_MINUS_INF, V_UNUSED,
                                    zc.preserveSInfResult, fp16NoStorage));
            testCases.push_back(OTC("op_nan_preserve", B_ZIN_PRESERVE, zc.operationId, V_NAN, V_UNUSED,
                                    zc.preserveNanResult, fp16NoStorage));
        }
    }

    // comparison operations - tested differently because they return true/false
    struct ComparisonCase
    {
        OperationId operationId;
        ValueId denormPreserveResult;
    };
    const ComparisonCase comparisonCases[] = {// operation    denorm
                                              {OID_ORD_EQ, V_ZERO},  {OID_UORD_EQ, V_ZERO}, {OID_ORD_NEQ, V_ONE},
                                              {OID_UORD_NEQ, V_ONE}, {OID_ORD_LS, V_ONE},   {OID_UORD_LS, V_ONE},
                                              {OID_ORD_GT, V_ZERO},  {OID_UORD_GT, V_ZERO}, {OID_ORD_LE, V_ONE},
                                              {OID_UORD_LE, V_ONE},  {OID_ORD_GE, V_ZERO},  {OID_UORD_GE, V_ZERO}};
    for (int op = 0; op < DE_LENGTH_OF_ARRAY(comparisonCases); ++op)
    {
        const ComparisonCase &cc = comparisonCases[op];
        testCases.push_back(
            OTC("denorm_op_var_preserve", B_DENORM_PRESERVE, cc.operationId, V_DENORM, V_ONE, cc.denormPreserveResult));
        if (isFP16)
            testCases.push_back(OTC("denorm_op_var_preserve", B_DENORM_PRESERVE, cc.operationId, V_DENORM, V_ONE,
                                    cc.denormPreserveResult, true));
    }

    if (argumentsFromInput)
    {
        struct RoundingModeCase
        {
            OperationId operationId;
            ValueId arg1;
            ValueId arg2;
            ValueId expectedRTEResult;
            ValueId expectedRTZResult;
        };

        const RoundingModeCase roundingCases[] = {
            {OID_ADD, V_ADD_ARG_A, V_ADD_ARG_B, V_ADD_RTE_RESULT, V_ADD_RTZ_RESULT},
            {OID_SUB, V_SUB_ARG_A, V_SUB_ARG_B, V_SUB_RTE_RESULT, V_SUB_RTZ_RESULT},
            {OID_MUL, V_MUL_ARG_A, V_MUL_ARG_B, V_MUL_RTE_RESULT, V_MUL_RTZ_RESULT},
            {OID_DOT, V_DOT_ARG_A, V_DOT_ARG_B, V_DOT_RTE_RESULT, V_DOT_RTZ_RESULT},

            // in vect/mat multiplication by scalar operations only first element of result is checked
            // so argument and result values prepared for multiplication can be reused for those cases
            {OID_VEC_MUL_S, V_MUL_ARG_A, V_MUL_ARG_B, V_MUL_RTE_RESULT, V_MUL_RTZ_RESULT},
            {OID_MAT_MUL_S, V_MUL_ARG_A, V_MUL_ARG_B, V_MUL_RTE_RESULT, V_MUL_RTZ_RESULT},
            {OID_OUT_PROD, V_MUL_ARG_A, V_MUL_ARG_B, V_MUL_RTE_RESULT, V_MUL_RTZ_RESULT},

            // in SPIR-V code we return first element of operation result so for following
            // cases argument and result values prepared for dot product can be reused
            {OID_VEC_MUL_M, V_DOT_ARG_A, V_DOT_ARG_B, V_DOT_RTE_RESULT, V_DOT_RTZ_RESULT},
            {OID_MAT_MUL_V, V_DOT_ARG_A, V_DOT_ARG_B, V_DOT_RTE_RESULT, V_DOT_RTZ_RESULT},
            {OID_MAT_MUL_M, V_DOT_ARG_A, V_DOT_ARG_B, V_DOT_RTE_RESULT, V_DOT_RTZ_RESULT},

            // conversion operations are added separately - depending on float type width
        };

        for (int c = 0; c < DE_LENGTH_OF_ARRAY(roundingCases); ++c)
        {
            const RoundingModeCase &rmc = roundingCases[c];
            testCases.push_back(
                OTC("rounding_rte_op", B_RTE_ROUNDING, rmc.operationId, rmc.arg1, rmc.arg2, rmc.expectedRTEResult));
            testCases.push_back(
                OTC("rounding_rtz_op", B_RTZ_ROUNDING, rmc.operationId, rmc.arg1, rmc.arg2, rmc.expectedRTZResult));
            if (isFP16)
            {
                testCases.push_back(OTC("rounding_rte_op", B_RTE_ROUNDING, rmc.operationId, rmc.arg1, rmc.arg2,
                                        rmc.expectedRTEResult, true));
                testCases.push_back(OTC("rounding_rtz_op", B_RTZ_ROUNDING, rmc.operationId, rmc.arg1, rmc.arg2,
                                        rmc.expectedRTZResult, true));
            }
        }
    }

    // special cases
    if (typeTestResults->variableType() == FP16)
    {
        if (argumentsFromInput)
        {
            for (int i = 0; i < 2; i++)
            {
                bool noStorage = (i == 1);

                //// Conversions from arguments
                // fp32 rte
                testCases.push_back(OTC("rounding_rte_conv_from_fp32_up", B_RTE_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_conv_from_fp32_down", B_RTE_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_DOWN_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_conv_from_fp32_tie_up", B_RTE_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_conv_from_fp32_tie_down", B_RTE_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTE_RESULT, noStorage));

                // fp32 rtz
                testCases.push_back(OTC("rounding_rtz_conv_from_fp32_up", B_RTZ_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_conv_from_fp32_down", B_RTZ_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_DOWN_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_conv_from_fp32_tie_up", B_RTZ_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_conv_from_fp32_tie_down", B_RTZ_ROUNDING, OID_CONV_FROM_FP32,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTZ_RESULT, noStorage));

                // fp64 rte
                testCases.push_back(OTC("rounding_rte_conv_from_fp64_up", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_conv_from_fp64_down", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_DOWN_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_conv_from_fp64_tie_up", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_conv_from_fp64_tie_down", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTE_RESULT, noStorage));

                // fp64 rtz
                testCases.push_back(OTC("rounding_rtz_conv_from_fp64_up", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_conv_from_fp64_down", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_DOWN_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_conv_from_fp64_tie_up", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_conv_from_fp64_tie_down", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTZ_RESULT, noStorage));

                //// Conversions from specialization constants
                // fp32 rte
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp32_up", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_UP, V_CONV_FROM_FP32_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp32_down", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_DOWN, V_CONV_FROM_FP32_TO_FP16_DOWN_ARG,
                                        V_UNUSED, V_CONV_FROM_FP32_TO_FP16_DOWN_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp32_tie_up", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_UP, V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG,
                                        V_UNUSED, V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp32_tie_down", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_DOWN,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTE_RESULT, noStorage));

                // fp32 rtz
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp32_up", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_UP, V_CONV_FROM_FP32_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp32_down", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_DOWN, V_CONV_FROM_FP32_TO_FP16_DOWN_ARG,
                                        V_UNUSED, V_CONV_FROM_FP32_TO_FP16_DOWN_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp32_tie_up", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_UP, V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG,
                                        V_UNUSED, V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp32_tie_down", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP32_TO_FP16_TIE_DOWN,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTZ_RESULT, noStorage));

                // fp64 rte
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_up", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_UP, V_CONV_FROM_FP64_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_down", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_DOWN, V_CONV_FROM_FP64_TO_FP16_DOWN_ARG,
                                        V_UNUSED, V_CONV_FROM_FP64_TO_FP16_DOWN_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_tie_up", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_UP, V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG,
                                        V_UNUSED, V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTE_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_tie_down", B_RTE_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_DOWN,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTE_RESULT, noStorage));

                // fp64 rtz
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_up", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_UP, V_CONV_FROM_FP64_TO_FP16_UP_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_down", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_DOWN, V_CONV_FROM_FP64_TO_FP16_DOWN_ARG,
                                        V_UNUSED, V_CONV_FROM_FP64_TO_FP16_DOWN_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_tie_up", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_UP, V_CONV_FROM_FP64_TO_FP16_TIE_UP_ARG,
                                        V_UNUSED, V_CONV_FROM_FP64_TO_FP16_TIE_UP_RTZ_RESULT, noStorage));
                testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_tie_down", B_RTZ_ROUNDING,
                                        OID_SCONST_CONV_FROM_FP64_TO_FP16_TIE_DOWN,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                        V_CONV_FROM_FP64_TO_FP16_TIE_DOWN_RTZ_RESULT, noStorage));
            }

            // verify that VkShaderFloatingPointRoundingModeKHR can be overridden for a given instruction by the FPRoundingMode decoration.
            // FPRoundingMode decoration requires VK_KHR_16bit_storage.
            testCases.push_back(OTC("rounding_rte_override_from_fp32_up", B_RTE_ROUNDING, OID_ORTZ_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_UP_ARG, V_UNUSED, V_CONV_FROM_FP32_TO_FP16_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rte_override_from_fp32_down", B_RTE_ROUNDING, OID_ORTZ_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP32_TO_FP16_DOWN_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rte_override_from_fp32_tie_up", B_RTE_ROUNDING, OID_ORTZ_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG, V_UNUSED,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rte_override_from_fp32_tie_down", B_RTE_ROUNDING, OID_ORTZ_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTZ_RESULT));
            // Missing for FP64 -> FP16
            // TODO(https://gitlab.khronos.org/Tracker/vk-gl-cts/-/issues/4539)

            testCases.push_back(OTC("rounding_rtz_override_from_fp32_up", B_RTE_ROUNDING, OID_ORTE_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_UP_ARG, V_UNUSED, V_CONV_FROM_FP32_TO_FP16_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rtz_override_from_fp32_down", B_RTE_ROUNDING, OID_ORTE_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP32_TO_FP16_DOWN_RTE_RESULT));
            testCases.push_back(OTC("rounding_rtz_override_from_fp32_tie_up", B_RTE_ROUNDING, OID_ORTE_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_UP_ARG, V_UNUSED,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rtz_override_from_fp32_tie_down", B_RTE_ROUNDING, OID_ORTE_ROUND,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP32_TO_FP16_TIE_DOWN_RTE_RESULT));
            // Missing for FP64 -> FP16
            // TODO(https://gitlab.khronos.org/Tracker/vk-gl-cts/-/issues/4539)
        }

        createUnaryTestCases(testCases, OID_CONV_FROM_FP32, V_CONV_DENORM_SMALLER, V_ZERO);
        createUnaryTestCases(testCases, OID_CONV_FROM_FP64, V_CONV_DENORM_BIGGER, V_ZERO);
        createUnaryTestCases(testCases, OID_CONV_FROM_FP32, V_CONV_DENORM_SMALLER, V_ZERO, true);
        createUnaryTestCases(testCases, OID_CONV_FROM_FP64, V_CONV_DENORM_BIGGER, V_ZERO, true);
    }
    else if (typeTestResults->variableType() == FP32)
    {
        if (argumentsFromInput)
        {
            //// Conversions from arguments
            // fp64 rte
            testCases.push_back(OTC("rounding_rte_conv_from_fp64_up", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_FP64_TO_FP32_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_fp64_down", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_DOWN_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_fp64_tie_up", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_fp64_tie_down", B_RTE_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTE_RESULT));

            // fp64 rtz
            testCases.push_back(OTC("rounding_rtz_conv_from_fp64_up", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_FP64_TO_FP32_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_fp64_down", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_DOWN_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_fp64_tie_up", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_fp64_tie_down", B_RTZ_ROUNDING, OID_CONV_FROM_FP64,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTZ_RESULT));

            //// Conversions from specialization constants
            // fp64 rte
            testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_up", B_RTE_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_UP, V_CONV_FROM_FP64_TO_FP32_UP_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_down", B_RTE_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_DOWN, V_CONV_FROM_FP64_TO_FP32_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_DOWN_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_tie_up", B_RTE_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_UP, V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG,
                                    V_UNUSED, V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_sconst_conv_from_fp64_tie_down", B_RTE_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_DOWN, V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG,
                                    V_UNUSED, V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTE_RESULT));

            // fp64 rtz
            testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_up", B_RTZ_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_UP, V_CONV_FROM_FP64_TO_FP32_UP_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_down", B_RTZ_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_DOWN, V_CONV_FROM_FP64_TO_FP32_DOWN_ARG, V_UNUSED,
                                    V_CONV_FROM_FP64_TO_FP32_DOWN_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_tie_up", B_RTZ_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_UP, V_CONV_FROM_FP64_TO_FP32_TIE_UP_ARG,
                                    V_UNUSED, V_CONV_FROM_FP64_TO_FP32_TIE_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_sconst_conv_from_fp64_tie_down", B_RTZ_ROUNDING,
                                    OID_SCONST_CONV_FROM_FP64_TO_FP32_TIE_DOWN, V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_ARG,
                                    V_UNUSED, V_CONV_FROM_FP64_TO_FP32_TIE_DOWN_RTZ_RESULT));

            // Verify that VkShaderFloatingPointRoundingModeKHR can be overridden for a given instruction by the FPRoundingMode decoration.
            // Missing for FP64 -> FP32
            // TODO(https://gitlab.khronos.org/Tracker/vk-gl-cts/-/issues/4539)

            // uint32 rtz
            testCases.push_back(OTC("rounding_rtz_conv_from_uint32_up", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP32,
                                    V_CONV_FROM_UINT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_UINT32_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_uint32_tie", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP32,
                                    V_CONV_FROM_UINT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_UINT32_TIE_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_uint32_down", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP32,
                                    V_CONV_FROM_UINT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_UINT32_DOWN_RTZ_RESULT));

            // uint64 rtz
            testCases.push_back(OTC("rounding_rtz_conv_from_uint64_up", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_UINT64_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_uint64_tie", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_UINT64_TIE_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_uint64_down", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_UINT64_DOWN_RTZ_RESULT));

            // uint32 rte
            testCases.push_back(OTC("rounding_rte_conv_from_uint32_up", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP32,
                                    V_CONV_FROM_UINT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_UINT32_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_uint32_tie", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP32,
                                    V_CONV_FROM_UINT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_UINT32_TIE_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_uint32_down", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP32,
                                    V_CONV_FROM_UINT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_UINT32_DOWN_RTE_RESULT));

            // uint64 rte
            testCases.push_back(OTC("rounding_rte_conv_from_uint64_up", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_UINT64_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_uint64_tie", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_UINT64_TIE_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_uint64_down", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_UINT64_DOWN_RTE_RESULT));

            // int32 rtz
            testCases.push_back(OTC("rounding_rtz_conv_from_int32_up", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP32,
                                    V_CONV_FROM_INT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_INT32_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_int32_tie", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP32,
                                    V_CONV_FROM_INT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_INT32_TIE_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_int32_down", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP32,
                                    V_CONV_FROM_INT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_INT32_DOWN_RTZ_RESULT));

            // int64 rtz
            testCases.push_back(OTC("rounding_rtz_conv_from_int64_up", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_INT64_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_int64_tie", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_INT64_TIE_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_int64_down", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_INT64_DOWN_RTZ_RESULT));

            // int32 rte
            testCases.push_back(OTC("rounding_rte_conv_from_int32_up", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP32,
                                    V_CONV_FROM_INT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_INT32_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_int32_tie", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP32,
                                    V_CONV_FROM_INT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_INT32_TIE_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_int32_down", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP32,
                                    V_CONV_FROM_INT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_INT32_DOWN_RTE_RESULT));

            // int64 rte
            testCases.push_back(OTC("rounding_rte_conv_from_int64_up", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP32_UP_ARG, V_UNUSED, V_CONV_FROM_INT64_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_int64_tie", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP32_TIE_ARG, V_UNUSED, V_CONV_FROM_INT64_TIE_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_int64_down", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP32_DOWN_ARG, V_UNUSED, V_CONV_FROM_INT64_DOWN_RTE_RESULT));
        }
        else
        {
            // PackHalf2x16 - verification done in SPIR-V
            testCases.push_back(
                OTC("pack_half_denorm_preserve", B_DENORM_PRESERVE, OID_PH_DENORM, V_UNUSED, V_UNUSED, V_ONE));

            // UnpackHalf2x16 - custom arguments defined as constants
            testCases.push_back(
                OTC("upack_half_denorm_flush_to_zero", B_DENORM_FLUSH, OID_UPH_DENORM, V_UNUSED, V_UNUSED, V_ZERO));
            testCases.push_back(OTC("upack_half_denorm_preserve", B_DENORM_PRESERVE, OID_UPH_DENORM, V_UNUSED, V_UNUSED,
                                    V_CONV_DENORM_SMALLER));
        }

        createUnaryTestCases(testCases, OID_CONV_FROM_FP16, V_CONV_DENORM_SMALLER, V_ZERO_OR_FP16_DENORM_TO_FP32);
        createUnaryTestCases(testCases, OID_CONV_FROM_FP16, V_CONV_DENORM_SMALLER, V_ZERO_OR_FP16_DENORM_TO_FP32, true);
        createUnaryTestCases(testCases, OID_CONV_FROM_FP64, V_CONV_DENORM_BIGGER, V_ZERO);
    }
    else // FP64
    {
        if (argumentsFromInput)
        {
            // uint64 rtz
            testCases.push_back(OTC("rounding_rtz_conv_from_uint64_up", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP64_UP_ARG, V_UNUSED, V_CONV_FROM_UINT64_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_uint64_tie", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP64_TIE_ARG, V_UNUSED, V_CONV_FROM_UINT64_TIE_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_uint64_down", B_RTZ_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP64_DOWN_ARG, V_UNUSED, V_CONV_FROM_UINT64_DOWN_RTZ_RESULT));

            // uint64 rte
            testCases.push_back(OTC("rounding_rte_conv_from_uint64_up", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP64_UP_ARG, V_UNUSED, V_CONV_FROM_UINT64_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_uint64_tie", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP64_TIE_ARG, V_UNUSED, V_CONV_FROM_UINT64_TIE_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_uint64_down", B_RTE_ROUNDING, OID_CONV_FROM_UINT_TO_FP64,
                                    V_CONV_FROM_UINT_TO_FP64_DOWN_ARG, V_UNUSED, V_CONV_FROM_UINT64_DOWN_RTE_RESULT));

            // int64 rtz
            testCases.push_back(OTC("rounding_rtz_conv_from_int64_up", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP64_UP_ARG, V_UNUSED, V_CONV_FROM_INT64_UP_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_int64_tie", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP64_TIE_ARG, V_UNUSED, V_CONV_FROM_INT64_TIE_RTZ_RESULT));
            testCases.push_back(OTC("rounding_rtz_conv_from_int64_down", B_RTZ_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP64_DOWN_ARG, V_UNUSED, V_CONV_FROM_INT64_DOWN_RTZ_RESULT));

            // int64 rte
            testCases.push_back(OTC("rounding_rte_conv_from_int64_up", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP64_UP_ARG, V_UNUSED, V_CONV_FROM_INT64_UP_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_int64_tie", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP64_TIE_ARG, V_UNUSED, V_CONV_FROM_INT64_TIE_RTE_RESULT));
            testCases.push_back(OTC("rounding_rte_conv_from_int64_down", B_RTE_ROUNDING, OID_CONV_FROM_INT_TO_FP64,
                                    V_CONV_FROM_INT_TO_FP64_DOWN_ARG, V_UNUSED, V_CONV_FROM_INT64_DOWN_RTE_RESULT));
        }
        else
        {
            // PackDouble2x32 - custom arguments defined as constants
            testCases.push_back(
                OTC("pack_double_denorm_preserve", B_DENORM_PRESERVE, OID_PD_DENORM, V_UNUSED, V_UNUSED, V_DENORM));

            // UnpackDouble2x32 - verification done in SPIR-V
            testCases.push_back(OTC("upack_double_denorm_flush_to_zero", B_DENORM_FLUSH, OID_UPD_DENORM_FLUSH, V_DENORM,
                                    V_UNUSED, V_ONE));
            testCases.push_back(OTC("upack_double_denorm_preserve", B_DENORM_PRESERVE, OID_UPD_DENORM_PRESERVE,
                                    V_DENORM, V_UNUSED, V_ONE));
        }

        createUnaryTestCases(testCases, OID_CONV_FROM_FP16, V_CONV_DENORM_SMALLER, V_ZERO_OR_FP16_DENORM_TO_FP64);
        createUnaryTestCases(testCases, OID_CONV_FROM_FP16, V_CONV_DENORM_SMALLER, V_ZERO_OR_FP16_DENORM_TO_FP64, true);
        createUnaryTestCases(testCases, OID_CONV_FROM_FP32, V_CONV_DENORM_BIGGER, V_ZERO_OR_FP32_DENORM_TO_FP64);
    }
}

const Operation &TestCasesBuilder::getOperation(OperationId id) const
{
    return m_operations.at(id);
}

void TestCasesBuilder::createUnaryTestCases(vector<OperationTestCase> &testCases, OperationId operationId,
                                            ValueId denormPreserveResult, ValueId denormFTZResult,
                                            bool fp16WithoutStorage) const
{
    // Denorm - Preserve
    testCases.push_back(OTC("op_denorm_preserve", B_DENORM_PRESERVE, operationId, V_DENORM, V_UNUSED,
                            denormPreserveResult, fp16WithoutStorage));

    // Denorm - FlushToZero
    testCases.push_back(OTC("op_denorm_flush_to_zero", B_DENORM_FLUSH, operationId, V_DENORM, V_UNUSED, denormFTZResult,
                            fp16WithoutStorage));

    // Signed Zero Inf Nan - Preserve
    testCases.push_back(
        OTC("op_zero_preserve", B_ZIN_PRESERVE, operationId, V_ZERO, V_UNUSED, V_ZERO, fp16WithoutStorage));
    testCases.push_back(OTC("op_signed_zero_preserve", B_ZIN_PRESERVE, operationId, V_MINUS_ZERO, V_UNUSED,
                            V_MINUS_ZERO, fp16WithoutStorage));
    testCases.push_back(
        OTC("op_inf_preserve", B_ZIN_PRESERVE, operationId, V_INF, V_UNUSED, V_INF, fp16WithoutStorage));
    testCases.push_back(
        OTC("op_nan_preserve", B_ZIN_PRESERVE, operationId, V_NAN, V_UNUSED, V_NAN, fp16WithoutStorage));
}

template <typename TYPE, typename FLOAT_TYPE>
bool isZeroOrOtherValue(const TYPE &returnedFloat, ValueId secondAcceptableResult, TestLog &log)
{
    if (returnedFloat.isZero() && !returnedFloat.signBit())
        return true;

    TypeValues<FLOAT_TYPE> typeValues;
    typedef typename TYPE::StorageType SType;
    typename RawConvert<FLOAT_TYPE, SType>::Value value;
    value.fp = typeValues.getValue(secondAcceptableResult);

    if (returnedFloat.bits() == value.ui)
        return true;

    log << TestLog::Message << "Expected 0 or " << toHex(value.ui) << " (" << value.fp << ")" << TestLog::EndMessage;
    return false;
}

template <typename TYPE>
bool isAcosResultCorrect(const TYPE &returnedFloat, TestLog &log)
{
    // pi/2 is result of acos(0) which in the specs is defined as equivalent to
    // atan2(sqrt(1.0 - x^2), x), where atan2 has 4096 ULP, sqrt is equivalent to
    // 1.0 /inversesqrt(), inversesqrt() is 2 ULP and rcp is another 2.5 ULP

    double precision    = 0;
    const double piDiv2 = M_PI_2;
    if (returnedFloat.MANTISSA_BITS == 23)
    {
        FloatFormat fp32Format(-126, 127, 23, true, tcu::MAYBE, tcu::YES, tcu::MAYBE);
        precision = fp32Format.ulp(piDiv2, 4096.0);
    }
    else
    {
        FloatFormat fp16Format(-14, 15, 10, true, tcu::MAYBE);
        precision = fp16Format.ulp(piDiv2, 5.0);
    }

    if (deAbs(returnedFloat.asDouble() - piDiv2) < precision)
        return true;

    log << TestLog::Message << "Expected result to be in range"
        << " (" << piDiv2 - precision << ", " << piDiv2 + precision << "), got " << returnedFloat.asDouble()
        << TestLog::EndMessage;
    return false;
}

template <typename TYPE>
bool isCosResultCorrect(const TYPE &returnedFloat, TestLog &log)
{
    // for cos(x) with x between -pi and pi, the precision error is 2^-11 for fp32 and 2^-7 for fp16.
    double precision      = returnedFloat.MANTISSA_BITS == 23 ? dePow(2, -11) : dePow(2, -7);
    const double expected = 1.0;

    if (deAbs(returnedFloat.asDouble() - expected) < precision)
        return true;

    log << TestLog::Message << "Expected result to be in range"
        << " (" << expected - precision << ", " << expected + precision << "), got " << returnedFloat.asDouble()
        << TestLog::EndMessage;
    return false;
}

template <typename FLOAT_TYPE>
double getVariableTypeAsDouble(FLOAT_TYPE param)
{
    return param;
}
template <>
double getVariableTypeAsDouble(deFloat16 param)
{
    return deFloat16To64(param);
}

double getPrecisionAt(double value, float ulp, int mantissaBits)
{
    if (mantissaBits == 23)
    {
        FloatFormat fp32Format(-126, 127, 23, true, tcu::MAYBE, tcu::YES, tcu::MAYBE);
        return fp32Format.ulp(value, ulp);
    }
    else if (mantissaBits == 52)
    {
        FloatFormat fp32Format(-1022, 1023, 52, true, tcu::MAYBE, tcu::YES, tcu::MAYBE);
        return fp32Format.ulp(value, ulp);
    }
    else
    {
        DE_ASSERT(mantissaBits == 10);
        FloatFormat fp16Format(-14, 15, 10, true, tcu::MAYBE);
        return fp16Format.ulp(value, ulp);
    }
}

template <typename TYPE, typename FLOAT_TYPE, typename REF_FUNCTION>
bool isLogResultCorrect(const TYPE &returnedFloat, FLOAT_TYPE param, REF_FUNCTION refFunction, TestLog &log)
{
    if (returnedFloat.isInf() && returnedFloat.signBit())
        return true;

    const double expected  = refFunction(getVariableTypeAsDouble(param));
    const double precision = getPrecisionAt(expected, 3.0, returnedFloat.MANTISSA_BITS);

    if (deAbs(returnedFloat.asDouble() - expected) < precision)
        return true;

    log << TestLog::Message << "Expected result to be -INF or in range"
        << " (" << expected - precision << ", " << expected + precision << "), got " << returnedFloat.asDouble()
        << TestLog::EndMessage;
    return false;
}

template <typename TYPE, typename FLOAT_TYPE>
bool isInverseSqrtResultCorrect(const TYPE &returnedFloat, FLOAT_TYPE param, TestLog &log)
{
    if (returnedFloat.isInf() && !returnedFloat.signBit())
        return true;

    const double expected  = 1.0 / deSqrt(getVariableTypeAsDouble(param));
    const double precision = getPrecisionAt(expected, 2.0, returnedFloat.MANTISSA_BITS);

    if (deAbs(returnedFloat.asDouble() - expected) < precision)
        return true;

    log << TestLog::Message << "Expected result to be INF or in range"
        << " (" << expected - precision << ", " << expected + precision << "), got " << returnedFloat.asDouble()
        << TestLog::EndMessage;
    return false;
}

template <typename TYPE, typename FLOAT_TYPE>
bool isSqrtResultCorrect(const TYPE &returnedFloat, FLOAT_TYPE param, TestLog &log)
{
    if (returnedFloat.isZero() && !returnedFloat.signBit())
        return true;

    const double expected             = deSqrt(getVariableTypeAsDouble(param));
    const double expectedInverseSqrt  = 1.0 / expected;
    const double inverseSqrtPrecision = getPrecisionAt(expectedInverseSqrt, 2.0, returnedFloat.MANTISSA_BITS);

    double expectedMin =
        deMin(1.0 / (expectedInverseSqrt - inverseSqrtPrecision), 1.0 / (expectedInverseSqrt + inverseSqrtPrecision));
    double expectedMax =
        deMax(1.0 / (expectedInverseSqrt - inverseSqrtPrecision), 1.0 / (expectedInverseSqrt + inverseSqrtPrecision));

    expectedMin -= getPrecisionAt(expectedMin, 2.5, returnedFloat.MANTISSA_BITS);
    expectedMax += getPrecisionAt(expectedMax, 2.5, returnedFloat.MANTISSA_BITS);

    if (returnedFloat.asDouble() >= expectedMin && returnedFloat.asDouble() <= expectedMax)
        return true;

    log << TestLog::Message << "Expected result to be +0 or in range"
        << " (" << expectedMin << ", " << expectedMax << "), got " << returnedFloat.asDouble() << TestLog::EndMessage;
    return false;
}

// Function used to compare test result with expected output.
// TYPE can be Float16, Float32 or Float64.
// FLOAT_TYPE can be deFloat16, float, double.
template <typename TYPE, typename FLOAT_TYPE>
bool compareBytes(vector<uint8_t> &expectedBytes, AllocationSp outputAlloc, TestLog &log)
{
    const TYPE *returned = static_cast<const TYPE *>(outputAlloc->getHostPtr());
    const TYPE *fValueId = reinterpret_cast<const TYPE *>(&expectedBytes.front());

    // all test return single value
    // Fp16 nostorage tests get their values from a uint32_t value, but we create the
    // buffer with the same size for both cases: 4 bytes.
    if (sizeof(TYPE) == 2u)
        DE_ASSERT((expectedBytes.size() / sizeof(TYPE)) == 2);
    else
        DE_ASSERT((expectedBytes.size() / sizeof(TYPE)) == 1);

    // during test setup we do not store expected value but id that can be used to
    // retrieve actual value - this is done to handle special cases like multiple
    // allowed results or epsilon checks for some cases
    // note that this is workaround - this should be done by changing
    // ComputerShaderCase and GraphicsShaderCase so that additional arguments can
    // be passed to this verification callback
    typedef typename TYPE::StorageType SType;
    SType expectedInt       = fValueId[0].bits();
    ValueId expectedValueId = static_cast<ValueId>(expectedInt);

    // something went wrong, expected value cant be V_UNUSED,
    // if this is the case then test shouldn't be created at all
    DE_ASSERT(expectedValueId != V_UNUSED);

    TYPE returnedFloat = returned[0];

    log << TestLog::Message << "Calculated result: " << toHex(returnedFloat.bits()) << " (" << returnedFloat.asFloat()
        << ")" << TestLog::EndMessage;

    if (expectedValueId == V_NAN)
    {
        if (returnedFloat.isNaN())
            return true;

        log << TestLog::Message << "Expected NaN" << TestLog::EndMessage;
        return false;
    }

    if (expectedValueId == V_DENORM)
    {
        if (returnedFloat.isDenorm())
            return true;

        log << TestLog::Message << "Expected Denorm" << TestLog::EndMessage;
        return false;
    }

    // handle multiple acceptable results cases
    if (expectedValueId == V_ZERO_OR_MINUS_ZERO)
    {
        if (returnedFloat.isZero())
            return true;

        log << TestLog::Message << "Expected 0 or -0" << TestLog::EndMessage;
        return false;
    }
    if (expectedValueId == V_ZERO_OR_ONE)
        return isZeroOrOtherValue<TYPE, FLOAT_TYPE>(returnedFloat, V_ONE, log);
    if ((expectedValueId == V_ZERO_OR_FP16_DENORM_TO_FP32) || (expectedValueId == V_ZERO_OR_FP16_DENORM_TO_FP64))
        return isZeroOrOtherValue<TYPE, FLOAT_TYPE>(returnedFloat, V_CONV_DENORM_SMALLER, log);
    if (expectedValueId == V_ZERO_OR_FP32_DENORM_TO_FP64)
        return isZeroOrOtherValue<TYPE, FLOAT_TYPE>(returnedFloat, V_CONV_DENORM_BIGGER, log);
    if (expectedValueId == V_ZERO_OR_DENORM_TIMES_TWO)
    {
        // this expected value is only needed for fp16
        DE_ASSERT(returnedFloat.EXPONENT_BIAS == 15);
        return isZeroOrOtherValue<TYPE, FLOAT_TYPE>(returnedFloat, V_DENORM_TIMES_TWO, log);
    }
    if (expectedValueId == V_MINUS_ONE_OR_CLOSE)
    {
        // this expected value is only needed for fp16
        DE_ASSERT(returnedFloat.EXPONENT_BIAS == 15);
        typename TYPE::StorageType returnedValue = returnedFloat.bits();
        return (returnedValue == 0xbc00) || (returnedValue == 0xbbff);
    }

    // handle trigonometric operations precision errors
    if (expectedValueId == V_TRIG_ONE)
        return isCosResultCorrect<TYPE>(returnedFloat, log);

    // handle acos(0) case
    if (expectedValueId == V_PI_DIV_2)
        return isAcosResultCorrect<TYPE>(returnedFloat, log);

    TypeValues<FLOAT_TYPE> typeValues;

    if (expectedValueId == V_MINUS_INF_OR_LOG_DENORM)
        return isLogResultCorrect<TYPE>(returnedFloat, typeValues.getValue(V_DENORM), deLog, log);

    if (expectedValueId == V_MINUS_INF_OR_LOG2_DENORM)
        return isLogResultCorrect<TYPE>(returnedFloat, typeValues.getValue(V_DENORM), deLog2, log);

    if (expectedValueId == V_ZERO_OR_SQRT_DENORM)
        return isSqrtResultCorrect<TYPE>(returnedFloat, typeValues.getValue(V_DENORM), log);

    if (expectedValueId == V_INF_OR_INV_SQRT_DENORM)
        return isInverseSqrtResultCorrect<TYPE>(returnedFloat, typeValues.getValue(V_DENORM), log);

    typename RawConvert<FLOAT_TYPE, SType>::Value value;
    value.fp = typeValues.getValue(expectedValueId);

    if (returnedFloat.bits() == value.ui)
        return true;

    log << TestLog::Message << "Expected " << toHex(value.ui) << " (" << value.fp << ")" << TestLog::EndMessage;
    return false;
}

template <typename TYPE, typename FLOAT_TYPE>
bool checkFloats(const vector<Resource> &, const vector<AllocationSp> &outputAllocs,
                 const vector<Resource> &expectedOutputs, TestLog &log)
{
    if (outputAllocs.size() != expectedOutputs.size())
        return false;

    for (uint32_t outputNdx = 0; outputNdx < outputAllocs.size(); ++outputNdx)
    {
        vector<uint8_t> expectedBytes;
        expectedOutputs[outputNdx].getBytes(expectedBytes);

        if (!compareBytes<TYPE, FLOAT_TYPE>(expectedBytes, outputAllocs[outputNdx], log))
            return false;
    }

    return true;
}

bool checkMixedFloats(const vector<Resource> &, const vector<AllocationSp> &outputAllocs,
                      const vector<Resource> &expectedOutputs, TestLog &log)
{
    // this function validates buffers containing floats of diferent widths, order is not important

    if (outputAllocs.size() != expectedOutputs.size())
        return false;

    // The comparison function depends on the data type stored in the resource.
    using compareFun = bool (*)(vector<uint8_t> &expectedBytes, AllocationSp outputAlloc, TestLog &log);
    const map<BufferDataType, compareFun> compareMap = {
        {BufferDataType::DATA_FP16, compareBytes<Float16, deFloat16>},
        {BufferDataType::DATA_FP32, compareBytes<Float32, float>},
        {BufferDataType::DATA_FP64, compareBytes<Float64, double>},
    };

    vector<uint8_t> expectedBytes;
    bool allResultsAreCorrect = true;
    int resultIndex           = static_cast<int>(outputAllocs.size());

    while (resultIndex--)
    {
        expectedOutputs[resultIndex].getBytes(expectedBytes);
        BufferDataType type =
            static_cast<BufferDataType>(reinterpret_cast<std::uintptr_t>(expectedOutputs[resultIndex].getUserData()));
        allResultsAreCorrect &= compareMap.at(type)(expectedBytes, outputAllocs[resultIndex], log);
    }

    return allResultsAreCorrect;
}

// Base class for ComputeTestGroupBuilder and GrephicstestGroupBuilder classes.
// It contains all functionalities that are used by both child classes.
class TestGroupBuilderBase
{
public:
    TestGroupBuilderBase();
    virtual ~TestGroupBuilderBase() = default;

    virtual void createOperationTests(TestCaseGroup *parentGroup, const char *groupName, VariableType variableType,
                                      bool argumentsFromInput) = 0;

    virtual void createSettingsTests(TestCaseGroup *parentGroup) = 0;

protected:
    typedef vector<OperationTestCase> TestCaseVect;

    // Structure containing all data required to create single operation test.
    struct OperationTestCaseInfo
    {
        VariableType outVariableType;
        bool argumentsFromInput;
        VkShaderStageFlagBits testedStage;
        const Operation &operation;
        const OperationTestCase &testCase;
    };

    // Mode used by SettingsTestCaseInfo to specify what settings do we want to test.
    enum SettingsMode
    {
        SM_ROUNDING = 0,
        SM_DENORMS
    };

    // Enum containing available options. When rounding is tested only SO_RTE and SO_RTZ
    // should be used. SO_FLUSH and SO_PRESERVE should be used only for denorm tests.
    enum SettingsOption
    {
        SO_UNUSED = 0,
        SO_RTE,
        SO_RTZ,
        SO_FLUSH,
        SO_PRESERVE
    };

    // Structure containing all data required to create single settings test.
    struct SettingsTestCaseInfo
    {
        const char *name;
        SettingsMode testedMode;
        VkShaderFloatControlsIndependence independenceSetting;

        SettingsOption fp16Option;
        SettingsOption fp32Option;
        SettingsOption fp64Option;
        bool fp16Without16BitStorage;
    };

    void specializeOperation(const OperationTestCaseInfo &testCaseInfo,
                             SpecializedOperation &specializedOperation) const;

    void getBehaviorCapabilityAndExecutionMode(BehaviorFlags behaviorFlags, const string inBitWidth,
                                               const string outBitWidth, string &capability,
                                               string &executionMode) const;

    void setupFloatControlsProperties(VariableType inVariableType, VariableType outVariableType,
                                      BehaviorFlags behaviorFlags,
                                      vk::VkPhysicalDeviceFloatControlsProperties &props) const;

protected:
    struct TypeData
    {
        TypeValuesSP values;
        TypeSnippetsSP snippets;
        TypeTestResultsSP testResults;
    };

    // Type specific parameters are stored in this map.
    map<VariableType, TypeData> m_typeData;

    // Map converting behaviuor id to OpCapability instruction
    typedef map<BehaviorFlagBits, string> BehaviorNameMap;
    BehaviorNameMap m_behaviorToName;
};

TestGroupBuilderBase::TestGroupBuilderBase()
{
    m_typeData[FP16]               = TypeData();
    m_typeData[FP16].values        = TypeValuesSP(new TypeValues<deFloat16>);
    m_typeData[FP16].snippets      = TypeSnippetsSP(new TypeSnippets<deFloat16>);
    m_typeData[FP16].testResults   = TypeTestResultsSP(new TypeTestResults<deFloat16>);
    m_typeData[FP32]               = TypeData();
    m_typeData[FP32].values        = TypeValuesSP(new TypeValues<float>);
    m_typeData[FP32].snippets      = TypeSnippetsSP(new TypeSnippets<float>);
    m_typeData[FP32].testResults   = TypeTestResultsSP(new TypeTestResults<float>);
    m_typeData[FP64]               = TypeData();
    m_typeData[FP64].values        = TypeValuesSP(new TypeValues<double>);
    m_typeData[FP64].snippets      = TypeSnippetsSP(new TypeSnippets<double>);
    m_typeData[FP64].testResults   = TypeTestResultsSP(new TypeTestResults<double>);
    m_typeData[UINT32]             = TypeData();
    m_typeData[UINT32].values      = TypeValuesSP(new TypeValues<float>);
    m_typeData[UINT32].snippets    = TypeSnippetsSP(new TypeSnippets<float>(false));
    m_typeData[UINT32].testResults = TypeTestResultsSP(new TypeTestResults<float>);
    m_typeData[UINT64]             = TypeData();
    m_typeData[UINT64].values      = TypeValuesSP(new TypeValues<double>);
    m_typeData[UINT64].snippets    = TypeSnippetsSP(new TypeSnippets<double>(false));
    m_typeData[UINT64].testResults = TypeTestResultsSP(new TypeTestResults<double>);
    m_typeData[INT32]              = TypeData();
    m_typeData[INT32].values       = TypeValuesSP(new TypeValues<float>);
    m_typeData[INT32].snippets     = TypeSnippetsSP(new TypeSnippets<float>(false, true));
    m_typeData[INT32].testResults  = TypeTestResultsSP(new TypeTestResults<float>);
    m_typeData[INT64]              = TypeData();
    m_typeData[INT64].values       = TypeValuesSP(new TypeValues<double>);
    m_typeData[INT64].snippets     = TypeSnippetsSP(new TypeSnippets<double>(false, true));
    m_typeData[INT64].testResults  = TypeTestResultsSP(new TypeTestResults<double>);

    m_behaviorToName[B_DENORM_PRESERVE] = "DenormPreserve";
    m_behaviorToName[B_DENORM_FLUSH]    = "DenormFlushToZero";
    m_behaviorToName[B_ZIN_PRESERVE]    = "SignedZeroInfNanPreserve";
    m_behaviorToName[B_RTE_ROUNDING]    = "RoundingModeRTE";
    m_behaviorToName[B_RTZ_ROUNDING]    = "RoundingModeRTZ";
}

void TestGroupBuilderBase::specializeOperation(const OperationTestCaseInfo &testCaseInfo,
                                               SpecializedOperation &specializedOperation) const
{
    const string typeToken  = "_valueType";
    const string widthToken = "${float_width}";

    VariableType outVariableType         = testCaseInfo.outVariableType;
    const Operation &operation           = testCaseInfo.operation;
    const TypeSnippetsSP outTypeSnippets = m_typeData.at(outVariableType).snippets;
    const bool inputRestricted           = operation.isInputTypeRestricted;
    VariableType inVariableType          = operation.restrictedInputType;

    // usually input type is same as output but this is not the case for conversion
    // operations; in those cases operation definitions have restricted input type
    inVariableType = inputRestricted ? inVariableType : outVariableType;

    TypeSnippetsSP inTypeSnippets = m_typeData.at(inVariableType).snippets;

    const string inTypePrefix  = string("_") + inTypeSnippets->getValueTypeString() + inTypeSnippets->bitWidth;
    const string outTypePrefix = string("_") + outTypeSnippets->getValueTypeString() + outTypeSnippets->bitWidth;

    std::string byteWidthToken = std::to_string(std::stoi(outTypeSnippets->bitWidth) / 8);

    specializedOperation.constants   = replace(operation.constants, typeToken, inTypePrefix);
    specializedOperation.annotations = replace(operation.annotations, widthToken, byteWidthToken);
    specializedOperation.types       = replace(operation.types, typeToken, outTypePrefix);
    specializedOperation.variables   = replace(operation.variables, typeToken, outTypePrefix);
    specializedOperation.functions   = replace(operation.functions, typeToken, outTypePrefix);
    specializedOperation.commands    = replace(operation.commands, typeToken, outTypePrefix);

    specializedOperation.inVariableType             = inVariableType;
    specializedOperation.inTypeSnippets             = inTypeSnippets;
    specializedOperation.outTypeSnippets            = outTypeSnippets;
    specializedOperation.argumentsUsesFloatConstant = 0;

    if (operation.isSpecConstant)
        return;

    // select way arguments are prepared
    if (testCaseInfo.argumentsFromInput)
    {
        // read arguments from input SSBO in main function
        specializedOperation.arguments = inTypeSnippets->argumentsFromInputSnippet;

        if (inVariableType == FP16 && testCaseInfo.testCase.fp16Without16BitStorage)
            specializedOperation.arguments = inTypeSnippets->argumentsFromInputFp16Snippet;
    }
    else
    {
        // generate proper values in main function
        const string arg1 = "%arg1                 = ";
        const string arg2 = "%arg2                 = ";

        const ValueId *inputArguments = testCaseInfo.testCase.input;
        if (inputArguments[0] != V_UNUSED)
        {
            specializedOperation.arguments = arg1 + inTypeSnippets->valueIdToSnippetArgMap.at(inputArguments[0]);
            specializedOperation.argumentsUsesFloatConstant |= B_STATEMENT_USAGE_ARGS_CONST_FLOAT;
        }
        if (inputArguments[1] != V_UNUSED)
        {
            specializedOperation.arguments += arg2 + inTypeSnippets->valueIdToSnippetArgMap.at(inputArguments[1]);
            specializedOperation.argumentsUsesFloatConstant |= B_STATEMENT_USAGE_ARGS_CONST_FLOAT;
        }
    }
}

void TestGroupBuilderBase::getBehaviorCapabilityAndExecutionMode(BehaviorFlags behaviorFlags, const string inBitWidth,
                                                                 const string outBitWidth, string &capability,
                                                                 string &executionMode) const
{
    // iterate over all behaviours and request those that are needed
    BehaviorNameMap::const_iterator it = m_behaviorToName.begin();
    while (it != m_behaviorToName.end())
    {
        BehaviorFlagBits behaviorId = it->first;
        string behaviorName         = it->second;

        if (behaviorFlags & behaviorId)
        {
            capability += "OpCapability " + behaviorName + "\n";

            // rounding mode should be obeyed for destination type
            bool rounding = (behaviorId == B_RTE_ROUNDING) || (behaviorId == B_RTZ_ROUNDING);
            executionMode +=
                "OpExecutionMode %main " + behaviorName + " " + (rounding ? outBitWidth : inBitWidth) + "\n";
        }

        ++it;
    }

    DE_ASSERT(!capability.empty() && !executionMode.empty());
}

void TestGroupBuilderBase::setupFloatControlsProperties(VariableType inVariableType, VariableType outVariableType,
                                                        BehaviorFlags behaviorFlags,
                                                        vk::VkPhysicalDeviceFloatControlsProperties &props) const
{
    // rounding mode should obey the destination type
    bool rteRounding = (behaviorFlags & B_RTE_ROUNDING) != 0;
    bool rtzRounding = (behaviorFlags & B_RTZ_ROUNDING) != 0;
    if (rteRounding || rtzRounding)
    {
        switch (outVariableType)
        {
        case FP16:
            props.shaderRoundingModeRTEFloat16 = rteRounding;
            props.shaderRoundingModeRTZFloat16 = rtzRounding;
            return;
        case FP32:
            props.shaderRoundingModeRTEFloat32 = rteRounding;
            props.shaderRoundingModeRTZFloat32 = rtzRounding;
            return;
        case FP64:
            props.shaderRoundingModeRTEFloat64 = rteRounding;
            props.shaderRoundingModeRTZFloat64 = rtzRounding;
            return;
        case UINT32:
        case INT32:
        case UINT64:
        case INT64:
            return;
        }
    }

    switch (inVariableType)
    {
    case FP16:
        props.shaderDenormPreserveFloat16           = behaviorFlags & B_DENORM_PRESERVE;
        props.shaderDenormFlushToZeroFloat16        = behaviorFlags & B_DENORM_FLUSH;
        props.shaderSignedZeroInfNanPreserveFloat16 = behaviorFlags & B_ZIN_PRESERVE;
        return;
    case FP32:
        props.shaderDenormPreserveFloat32           = behaviorFlags & B_DENORM_PRESERVE;
        props.shaderDenormFlushToZeroFloat32        = behaviorFlags & B_DENORM_FLUSH;
        props.shaderSignedZeroInfNanPreserveFloat32 = behaviorFlags & B_ZIN_PRESERVE;
        return;
    case FP64:
        props.shaderDenormPreserveFloat64           = behaviorFlags & B_DENORM_PRESERVE;
        props.shaderDenormFlushToZeroFloat64        = behaviorFlags & B_DENORM_FLUSH;
        props.shaderSignedZeroInfNanPreserveFloat64 = behaviorFlags & B_ZIN_PRESERVE;
        return;
    case UINT32:
    case INT32:
    case UINT64:
    case INT64:
        return;
    }
}

// Test case not related to SPIR-V but executed with compute tests. It checks if specified
// features are set to the same value when specific independence settings are used.
tcu::TestStatus verifyIndependenceSettings(Context &context)
{
    if (!context.isDeviceFunctionalitySupported("VK_KHR_shader_float_controls"))
        TCU_THROW(NotSupportedError, "VK_KHR_shader_float_controls not supported");

    vk::VkPhysicalDeviceFloatControlsProperties fcProperties;
    fcProperties.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FLOAT_CONTROLS_PROPERTIES;
    fcProperties.pNext = DE_NULL;

    vk::VkPhysicalDeviceProperties2 deviceProperties;
    deviceProperties.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PROPERTIES_2;
    deviceProperties.pNext = &fcProperties;

    auto fail = [](const string &featureGroup)
    { return tcu::TestStatus::fail(featureGroup + " features should be set to the same value"); };

    const VkPhysicalDevice physicalDevice          = context.getPhysicalDevice();
    const vk::InstanceInterface &instanceInterface = context.getInstanceInterface();
    instanceInterface.getPhysicalDeviceProperties2(physicalDevice, &deviceProperties);

    if (fcProperties.roundingModeIndependence == VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE)
    {
        vk::VkBool32 fp16rte = fcProperties.shaderRoundingModeRTEFloat16;
        vk::VkBool32 fp32rte = fcProperties.shaderRoundingModeRTEFloat32;
        vk::VkBool32 fp64rte = fcProperties.shaderRoundingModeRTEFloat64;
        if ((fp16rte != fp32rte) || (fp32rte != fp64rte))
            return fail("shaderRoundingModeRTEFloat*");

        vk::VkBool32 fp16rtz = fcProperties.shaderRoundingModeRTZFloat16;
        vk::VkBool32 fp32rtz = fcProperties.shaderRoundingModeRTZFloat32;
        vk::VkBool32 fp64rtz = fcProperties.shaderRoundingModeRTZFloat64;
        if ((fp16rtz != fp32rtz) || (fp32rtz != fp64rtz))
            return fail("shaderRoundingModeRTZFloat*");
    }
    else if (fcProperties.roundingModeIndependence == VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY)
    {
        vk::VkBool32 fp16rte = fcProperties.shaderRoundingModeRTEFloat16;
        vk::VkBool32 fp64rte = fcProperties.shaderRoundingModeRTEFloat64;
        if ((fp16rte != fp64rte))
            return fail("shaderRoundingModeRTEFloat16 and 64");

        vk::VkBool32 fp16rtz = fcProperties.shaderRoundingModeRTZFloat16;
        vk::VkBool32 fp64rtz = fcProperties.shaderRoundingModeRTZFloat64;
        if ((fp16rtz != fp64rtz))
            return fail("shaderRoundingModeRTZFloat16 and 64");
    }

    if (fcProperties.denormBehaviorIndependence == VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE)
    {
        vk::VkBool32 fp16flush = fcProperties.shaderDenormFlushToZeroFloat16;
        vk::VkBool32 fp32flush = fcProperties.shaderDenormFlushToZeroFloat32;
        vk::VkBool32 fp64flush = fcProperties.shaderDenormFlushToZeroFloat64;
        if ((fp16flush != fp32flush) || (fp32flush != fp64flush))
            return fail("shaderDenormFlushToZeroFloat*");

        vk::VkBool32 fp16preserve = fcProperties.shaderDenormPreserveFloat16;
        vk::VkBool32 fp32preserve = fcProperties.shaderDenormPreserveFloat32;
        vk::VkBool32 fp64preserve = fcProperties.shaderDenormPreserveFloat64;
        if ((fp16preserve != fp32preserve) || (fp32preserve != fp64preserve))
            return fail("shaderDenormPreserveFloat*");
    }
    else if (fcProperties.denormBehaviorIndependence == VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY)
    {
        vk::VkBool32 fp16flush = fcProperties.shaderDenormFlushToZeroFloat16;
        vk::VkBool32 fp64flush = fcProperties.shaderDenormFlushToZeroFloat64;
        if ((fp16flush != fp64flush))
            return fail("shaderDenormFlushToZeroFloat16 and 64");

        vk::VkBool32 fp16preserve = fcProperties.shaderDenormPreserveFloat16;
        vk::VkBool32 fp64preserve = fcProperties.shaderDenormPreserveFloat64;
        if ((fp16preserve != fp64preserve))
            return fail("shaderDenormPreserveFloat16 and 64");
    }

    return tcu::TestStatus::pass("Pass");
}

// ComputeTestGroupBuilder contains logic that creates compute shaders
// for all test cases. As most tests in spirv-assembly it uses functionality
// implemented in vktSpvAsmComputeShaderTestUtil.cpp.
class ComputeTestGroupBuilder : public TestGroupBuilderBase
{
public:
    void init();

    void createOperationTests(TestCaseGroup *parentGroup, const char *groupName, VariableType variableType,
                              bool argumentsFromInput) override;

    void createSettingsTests(TestCaseGroup *parentGroup) override;

protected:
    void fillShaderSpec(const OperationTestCaseInfo &testCaseInfo, ComputeShaderSpec &csSpec) const;
    void fillShaderSpec(const SettingsTestCaseInfo &testCaseInfo, ComputeShaderSpec &csSpec) const;

private:
    StringTemplate m_operationShaderTemplate;
    StringTemplate m_settingsShaderTemplate;
    TestCasesBuilder m_operationTestCaseBuilder;
};

void ComputeTestGroupBuilder::init()
{
    m_operationTestCaseBuilder.init();

    // generic compute shader template with common code for all
    // float types and all possible operations listed in OperationId enum
    m_operationShaderTemplate.setString("OpCapability Shader\n"
                                        "${capabilities}"

                                        "OpExtension \"SPV_KHR_float_controls\"\n"
                                        "${extensions}"

                                        "%std450            = OpExtInstImport \"GLSL.std.450\"\n"
                                        "OpMemoryModel Logical GLSL450\n"
                                        "OpEntryPoint GLCompute %main \"main\" %id\n"
                                        "OpExecutionMode %main LocalSize 1 1 1\n"
                                        "${execution_mode}"

                                        "OpDecorate %id BuiltIn GlobalInvocationId\n"

                                        // some tests require additional annotations
                                        "${annotations}"

                                        "%type_void            = OpTypeVoid\n"
                                        "%type_voidf           = OpTypeFunction %type_void\n"
                                        "%type_bool            = OpTypeBool\n"
                                        "%type_u32             = OpTypeInt 32 0\n"
                                        "%type_i32             = OpTypeInt 32 1\n"
                                        "%type_i32_fptr        = OpTypePointer Function %type_i32\n"
                                        "%type_u32_vec2        = OpTypeVector %type_u32 2\n"
                                        "%type_u32_vec3        = OpTypeVector %type_u32 3\n"
                                        "%type_u32_vec3_ptr    = OpTypePointer Input %type_u32_vec3\n"

                                        "%c_i32_0              = OpConstant %type_i32 0\n"
                                        "%c_i32_1              = OpConstant %type_i32 1\n"
                                        "%c_i32_2              = OpConstant %type_i32 2\n"
                                        "%c_u32_1              = OpConstant %type_u32 1\n"

                                        // if input float type has different width then output then
                                        // both types are defined here along with all types derived from
                                        // them that are commonly used by tests; some tests also define
                                        // their own types (those that are needed just by this single test)
                                        "${types}"

                                        // SSBO definitions
                                        "${io_definitions}"

                                        "%id                   = OpVariable %type_u32_vec3_ptr Input\n"

                                        // set of default constants per float type is placed here,
                                        // operation tests can also define additional constants.
                                        "${constants}"

                                        // O_RETURN_VAL defines function here and becouse
                                        // of that this token needs to be directly before main function
                                        "${functions}"

                                        "%main                 = OpFunction %type_void None %type_voidf\n"
                                        "%label                = OpLabel\n"

                                        "${variables}"

                                        // depending on test case arguments are either read from input ssbo
                                        // or generated in spir-v code - in later case shader input is not used
                                        "${arguments}"

                                        // perform test commands
                                        "${commands}"

                                        // save result to SSBO
                                        "${save_result}"

                                        "OpReturn\n"
                                        "OpFunctionEnd\n");

    m_settingsShaderTemplate.setString("OpCapability Shader\n"
                                       "${capabilities}"

                                       "OpExtension \"SPV_KHR_float_controls\"\n"
                                       "${extensions}"

                                       "%std450 = OpExtInstImport \"GLSL.std.450\"\n"
                                       "OpMemoryModel Logical GLSL450\n"
                                       "OpEntryPoint GLCompute %main \"main\" %id\n"
                                       "OpExecutionMode %main LocalSize 1 1 1\n"
                                       "${execution_modes}"

                                       // annotations
                                       "OpDecorate %SSBO_in BufferBlock\n"
                                       "OpDecorate %ssbo_in DescriptorSet 0\n"
                                       "OpDecorate %ssbo_in Binding 0\n"
                                       "OpDecorate %ssbo_in NonWritable\n"
                                       "${io_annotations}"

                                       "OpDecorate %id BuiltIn GlobalInvocationId\n"

                                       // types
                                       "%type_void            = OpTypeVoid\n"
                                       "%type_voidf           = OpTypeFunction %type_void\n"
                                       "%type_u32             = OpTypeInt 32 0\n"
                                       "%type_i32             = OpTypeInt 32 1\n"
                                       "%type_i32_fptr        = OpTypePointer Function %type_i32\n"
                                       "%type_u32_vec3        = OpTypeVector %type_u32 3\n"
                                       "%type_u32_vec3_ptr    = OpTypePointer Input %type_u32_vec3\n"

                                       "%c_i32_0              = OpConstant %type_i32 0\n"
                                       "%c_i32_1              = OpConstant %type_i32 1\n"
                                       "%c_i32_2              = OpConstant %type_i32 2\n"

                                       "${types}"

                                       // in SSBO definition
                                       "%SSBO_in              = OpTypeStruct ${in_struct}\n"
                                       "%up_SSBO_in           = OpTypePointer Uniform %SSBO_in\n"
                                       "%ssbo_in              = OpVariable %up_SSBO_in Uniform\n"

                                       // out SSBO definitions
                                       "${out_definitions}"

                                       "%id                   = OpVariable %type_u32_vec3_ptr Input\n"
                                       "%main                 = OpFunction %type_void None %type_voidf\n"
                                       "%label                = OpLabel\n"

                                       "${commands}"

                                       "${save_result}"

                                       "OpReturn\n"
                                       "OpFunctionEnd\n");
}

void ComputeTestGroupBuilder::createOperationTests(TestCaseGroup *parentGroup, const char *groupName,
                                                   VariableType variableType, bool argumentsFromInput)
{
    TestContext &testCtx = parentGroup->getTestContext();
    TestCaseGroup *group = new TestCaseGroup(testCtx, groupName);
    parentGroup->addChild(group);

    TestCaseVect testCases;
    m_operationTestCaseBuilder.build(testCases, m_typeData[variableType].testResults, argumentsFromInput);

    for (auto &testCase : testCases)
    {
        // skip cases with undefined output
        if (testCase.expectedOutput == V_UNUSED)
            continue;

        OperationTestCaseInfo testCaseInfo = {variableType, argumentsFromInput, VK_SHADER_STAGE_COMPUTE_BIT,
                                              m_operationTestCaseBuilder.getOperation(testCase.operationId), testCase};

        ComputeShaderSpec csSpec;

        fillShaderSpec(testCaseInfo, csSpec);

        string testName = replace(testCase.baseName, "op", testCaseInfo.operation.name);
        group->addChild(new SpvAsmComputeShaderCase(testCtx, testName.c_str(), csSpec));
    }
}

void ComputeTestGroupBuilder::createSettingsTests(TestCaseGroup *parentGroup)
{
    TestContext &testCtx = parentGroup->getTestContext();
    TestCaseGroup *group = new TestCaseGroup(testCtx, "independence_settings");
    parentGroup->addChild(group);

    using SFCI                 = VkShaderFloatControlsIndependence;
    const SFCI independence32  = VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY;
    const SFCI independenceAll = VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL;

    vector<SettingsTestCaseInfo> testCases = {
        // name                                                            mode            independenceSetting        fp16Option        fp32Option        fp64Option        fp16Without16bitstorage

        // test rounding modes when only two float widths are available
        {"rounding_ind_all_fp16_rte_fp32_rtz", SM_ROUNDING, independenceAll, SO_RTE, SO_RTZ, SO_UNUSED, false},
        {"rounding_ind_all_fp16_rtz_fp32_rte", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTE, SO_UNUSED, false},
        {"rounding_ind_32_fp16_rte_fp32_rtz", SM_ROUNDING, independence32, SO_RTE, SO_RTZ, SO_UNUSED, false},
        {"rounding_ind_32_fp16_rtz_fp32_rte", SM_ROUNDING, independence32, SO_RTZ, SO_RTE, SO_UNUSED, false},
        {"rounding_ind_all_fp16_rte_fp64_rtz", SM_ROUNDING, independenceAll, SO_RTE, SO_UNUSED, SO_RTZ, false},
        {"rounding_ind_all_fp16_rtz_fp64_rte", SM_ROUNDING, independenceAll, SO_RTZ, SO_UNUSED, SO_RTE, false},
        {"rounding_ind_all_fp32_rte_fp64_rtz", SM_ROUNDING, independenceAll, SO_UNUSED, SO_RTE, SO_RTZ, false},
        {"rounding_ind_all_fp32_rtz_fp64_rte", SM_ROUNDING, independenceAll, SO_UNUSED, SO_RTZ, SO_RTE, false},
        {"rounding_ind_32_fp32_rte_fp64_rtz", SM_ROUNDING, independence32, SO_UNUSED, SO_RTE, SO_RTZ, false},
        {"rounding_ind_32_fp32_rtz_fp64_rte", SM_ROUNDING, independence32, SO_UNUSED, SO_RTZ, SO_RTE, false},

        // test rounding modes when three widths are available
        {"rounding_ind_all_fp16_rtz_fp32_rte_fp64_rtz", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTE, SO_RTZ, false},
        {"rounding_ind_32_fp16_rtz_fp32_rte_fp64_rtz", SM_ROUNDING, independence32, SO_RTZ, SO_RTE, SO_RTZ, false},
        {"rounding_ind_all_fp16_rte_fp32_rtz_fp64_rte", SM_ROUNDING, independenceAll, SO_RTE, SO_RTZ, SO_RTE, false},
        {"rounding_ind_32_fp16_rte_fp32_rtz_fp64_rte", SM_ROUNDING, independence32, SO_RTE, SO_RTZ, SO_RTE, false},
        {"rounding_ind_all_fp16_rtz_fp32_rtz_fp64_rte", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTZ, SO_RTE, false},
        {"rounding_ind_all_fp16_rtz_fp32_rte_fp64_rte", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTE, SO_RTE, false},
        {"rounding_ind_all_fp16_rte_fp32_rte_fp64_rtz", SM_ROUNDING, independenceAll, SO_RTE, SO_RTE, SO_RTZ, false},
        {"rounding_ind_all_fp16_rte_fp32_rtz_fp64_rtz", SM_ROUNDING, independenceAll, SO_RTE, SO_RTZ, SO_RTZ, false},

        // test denorm settings when only two float widths are available
        {"denorm_ind_all_fp16_flush_fp32_preserve", SM_DENORMS, independenceAll, SO_FLUSH, SO_PRESERVE, SO_UNUSED,
         false},
        {"denorm_ind_all_fp16_preserve_fp32_flush", SM_DENORMS, independenceAll, SO_PRESERVE, SO_FLUSH, SO_UNUSED,
         false},
        {"denorm_ind_32_fp16_flush_fp32_preserve", SM_DENORMS, independence32, SO_FLUSH, SO_PRESERVE, SO_UNUSED, false},
        {"denorm_ind_32_fp16_preserve_fp32_flush", SM_DENORMS, independence32, SO_PRESERVE, SO_FLUSH, SO_UNUSED, false},
        {"denorm_ind_all_fp16_flush_fp64_preserve", SM_DENORMS, independenceAll, SO_FLUSH, SO_UNUSED, SO_PRESERVE,
         false},
        {"denorm_ind_all_fp16_preserve_fp64_flush", SM_DENORMS, independenceAll, SO_PRESERVE, SO_UNUSED, SO_FLUSH,
         false},
        {"denorm_ind_all_fp32_flush_fp64_preserve", SM_DENORMS, independenceAll, SO_UNUSED, SO_FLUSH, SO_PRESERVE,
         false},
        {"denorm_ind_all_fp32_preserve_fp64_flush", SM_DENORMS, independenceAll, SO_UNUSED, SO_PRESERVE, SO_FLUSH,
         false},
        {"denorm_ind_32_fp32_flush_fp64_preserve", SM_DENORMS, independence32, SO_UNUSED, SO_FLUSH, SO_PRESERVE, false},
        {"denorm_ind_32_fp32_preserve_fp64_flush", SM_DENORMS, independence32, SO_UNUSED, SO_PRESERVE, SO_FLUSH, false},

        // test denorm settings when three widths are available
        {"denorm_ind_all_fp16_preserve_fp32_flush_fp64_preserve", SM_DENORMS, independenceAll, SO_PRESERVE, SO_FLUSH,
         SO_PRESERVE, false},
        {"denorm_ind_32_fp16_preserve_fp32_flush_fp64_preserve", SM_DENORMS, independence32, SO_PRESERVE, SO_FLUSH,
         SO_PRESERVE, false},
        {"denorm_ind_all_fp16_flush_fp32_preserve_fp64_flush", SM_DENORMS, independenceAll, SO_FLUSH, SO_PRESERVE,
         SO_FLUSH, false},
        {"denorm_ind_32_fp16_flush_fp32_preserve_fp64_flush", SM_DENORMS, independence32, SO_FLUSH, SO_PRESERVE,
         SO_FLUSH, false},
        {"denorm_ind_all_fp16_preserve_fp32_preserve_fp64_flush", SM_DENORMS, independenceAll, SO_PRESERVE, SO_PRESERVE,
         SO_FLUSH, false},
        {"denorm_ind_all_fp16_preserve_fp32_flush_fp64_flush", SM_DENORMS, independenceAll, SO_PRESERVE, SO_FLUSH,
         SO_FLUSH, false},
        {"denorm_ind_all_fp16_flush_fp32_flush_fp64_preserve", SM_DENORMS, independenceAll, SO_FLUSH, SO_FLUSH,
         SO_PRESERVE, false},
        {"denorm_ind_all_fp16_flush_fp32_preserve_fp64_preserve", SM_DENORMS, independenceAll, SO_FLUSH, SO_PRESERVE,
         SO_PRESERVE, false},

        // Same fp16 tests but without requiring VK_KHR_16bit_storage
        // test rounding modes when only two float widths are available
        {"rounding_ind_all_fp16_rte_fp32_rtz_nostorage", SM_ROUNDING, independenceAll, SO_RTE, SO_RTZ, SO_UNUSED, true},
        {"rounding_ind_all_fp16_rtz_fp32_rte_nostorage", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTE, SO_UNUSED, true},
        {"rounding_ind_32_fp16_rte_fp32_rtz_nostorage", SM_ROUNDING, independence32, SO_RTE, SO_RTZ, SO_UNUSED, true},
        {"rounding_ind_32_fp16_rtz_fp32_rte_nostorage", SM_ROUNDING, independence32, SO_RTZ, SO_RTE, SO_UNUSED, true},
        {"rounding_ind_all_fp16_rte_fp64_rtz_nostorage", SM_ROUNDING, independenceAll, SO_RTE, SO_UNUSED, SO_RTZ, true},
        {"rounding_ind_all_fp16_rtz_fp64_rte_nostorage", SM_ROUNDING, independenceAll, SO_RTZ, SO_UNUSED, SO_RTE, true},

        // test rounding modes when three widths are available
        {"rounding_ind_all_fp16_rtz_fp32_rte_fp64_rtz_nostorage", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTE, SO_RTZ,
         true},
        {"rounding_ind_32_fp16_rtz_fp32_rte_fp64_rtz_nostorage", SM_ROUNDING, independence32, SO_RTZ, SO_RTE, SO_RTZ,
         true},
        {"rounding_ind_all_fp16_rte_fp32_rtz_fp64_rte_nostorage", SM_ROUNDING, independenceAll, SO_RTE, SO_RTZ, SO_RTE,
         true},
        {"rounding_ind_32_fp16_rte_fp32_rtz_fp64_rte_nostorage", SM_ROUNDING, independence32, SO_RTE, SO_RTZ, SO_RTE,
         true},
        {"rounding_ind_all_fp16_rtz_fp32_rtz_fp64_rte_nostorage", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTZ, SO_RTE,
         true},
        {"rounding_ind_all_fp16_rtz_fp32_rte_fp64_rte_nostorage", SM_ROUNDING, independenceAll, SO_RTZ, SO_RTE, SO_RTE,
         true},
        {"rounding_ind_all_fp16_rte_fp32_rte_fp64_rtz_nostorage", SM_ROUNDING, independenceAll, SO_RTE, SO_RTE, SO_RTZ,
         true},
        {"rounding_ind_all_fp16_rte_fp32_rtz_fp64_rtz_nostorage", SM_ROUNDING, independenceAll, SO_RTE, SO_RTZ, SO_RTZ,
         true},

        // test denorm settings when only two float widths are available
        {"denorm_ind_all_fp16_flush_fp32_preserve_nostorage", SM_DENORMS, independenceAll, SO_FLUSH, SO_PRESERVE,
         SO_UNUSED, true},
        {"denorm_ind_all_fp16_preserve_fp32_flush_nostorage", SM_DENORMS, independenceAll, SO_PRESERVE, SO_FLUSH,
         SO_UNUSED, true},
        {"denorm_ind_32_fp16_flush_fp32_preserve_nostorage", SM_DENORMS, independence32, SO_FLUSH, SO_PRESERVE,
         SO_UNUSED, true},
        {"denorm_ind_32_fp16_preserve_fp32_flush_nostorage", SM_DENORMS, independence32, SO_PRESERVE, SO_FLUSH,
         SO_UNUSED, true},
        {"denorm_ind_all_fp16_flush_fp64_preserve_nostorage", SM_DENORMS, independenceAll, SO_FLUSH, SO_UNUSED,
         SO_PRESERVE, true},
        {"denorm_ind_all_fp16_preserve_fp64_flush_nostorage", SM_DENORMS, independenceAll, SO_PRESERVE, SO_UNUSED,
         SO_FLUSH, true},

        // test denorm settings when three widths are available
        {"denorm_ind_all_fp16_preserve_fp32_flush_fp64_preserve_nostorage", SM_DENORMS, independenceAll, SO_PRESERVE,
         SO_FLUSH, SO_PRESERVE, true},
        {"denorm_ind_32_fp16_preserve_fp32_flush_fp64_preserve_nostorage", SM_DENORMS, independence32, SO_PRESERVE,
         SO_FLUSH, SO_PRESERVE, true},
        {"denorm_ind_all_fp16_flush_fp32_preserve_fp64_flush_nostorage", SM_DENORMS, independenceAll, SO_FLUSH,
         SO_PRESERVE, SO_FLUSH, true},
        {"denorm_ind_32_fp16_flush_fp32_preserve_fp64_flush_nostorage", SM_DENORMS, independence32, SO_FLUSH,
         SO_PRESERVE, SO_FLUSH, true},
        {"denorm_ind_all_fp16_preserve_fp32_preserve_fp64_flush_nostorage", SM_DENORMS, independenceAll, SO_PRESERVE,
         SO_PRESERVE, SO_FLUSH, true},
        {"denorm_ind_all_fp16_preserve_fp32_flush_fp64_flush_nostorage", SM_DENORMS, independenceAll, SO_PRESERVE,
         SO_FLUSH, SO_FLUSH, true},
        {"denorm_ind_all_fp16_flush_fp32_flush_fp64_preserve_nostorage", SM_DENORMS, independenceAll, SO_FLUSH,
         SO_FLUSH, SO_PRESERVE, true},
        {"denorm_ind_all_fp16_flush_fp32_preserve_fp64_preserve_nostorage", SM_DENORMS, independenceAll, SO_FLUSH,
         SO_PRESERVE, SO_PRESERVE, true},
    };

    for (const auto &testCase : testCases)
    {
        ComputeShaderSpec csSpec;
        fillShaderSpec(testCase, csSpec);
        group->addChild(new SpvAsmComputeShaderCase(testCtx, testCase.name, csSpec));
    }

    addFunctionCase(group, "independence_settings", verifyIndependenceSettings);
}

void ComputeTestGroupBuilder::fillShaderSpec(const OperationTestCaseInfo &testCaseInfo, ComputeShaderSpec &csSpec) const
{
    // LUT storing functions used to verify test results
    const VerifyIOFunc checkFloatsLUT[] = {checkFloats<Float16, deFloat16>, checkFloats<Float32, float>,
                                           checkFloats<Float64, double>};

    const Operation &testOperation    = testCaseInfo.operation;
    const OperationTestCase &testCase = testCaseInfo.testCase;
    VariableType outVariableType      = testCaseInfo.outVariableType;

    SpecializedOperation specOpData;
    specializeOperation(testCaseInfo, specOpData);

    TypeSnippetsSP inTypeSnippets  = specOpData.inTypeSnippets;
    TypeSnippetsSP outTypeSnippets = specOpData.outTypeSnippets;
    VariableType inVariableType    = specOpData.inVariableType;

    bool outFp16WithoutStorage = (outVariableType == FP16) && testCase.fp16Without16BitStorage;
    bool inFp16WithoutStorage  = (inVariableType == FP16) && testCase.fp16Without16BitStorage;

    // The feature is required if OpCapability StorageUniform16 is used in the shader.
    bool requiresUniformAndStorage16BitBufferAccess = false;

    // UnpackHalf2x16 is a corner case - it returns two 32-bit floats but
    // internaly operates on fp16 and this type should be used by float controls
    VariableType inVariableTypeForCaps = inVariableType;
    string inFloatWidthForCaps         = inTypeSnippets->bitWidth;
    if (testCase.operationId == OID_UPH_DENORM)
    {
        inVariableTypeForCaps = FP16;
        inFloatWidthForCaps   = "16";
    }

    string behaviorCapability;
    string behaviorExecutionMode;
    getBehaviorCapabilityAndExecutionMode(testCase.behaviorFlags, inFloatWidthForCaps, outTypeSnippets->bitWidth,
                                          behaviorCapability, behaviorExecutionMode);

    string capabilities = behaviorCapability + outTypeSnippets->capabilities;
    string extensions   = outTypeSnippets->extensions;
    string annotations  = inTypeSnippets->inputAnnotationsSnippet + outTypeSnippets->outputAnnotationsSnippet +
                         outTypeSnippets->typeAnnotationsSnippet;
    string types         = outTypeSnippets->typeDefinitionsSnippet;
    string constants     = outTypeSnippets->constantsDefinitionsSnippet;
    string ioDefinitions = "";

    // Getting rid of 16bit_storage dependency imply replacing lots of snippets.
    {
        if (inFp16WithoutStorage)
        {
            ioDefinitions = inTypeSnippets->inputDefinitionsFp16Snippet;
        }
        else
        {
            ioDefinitions = inTypeSnippets->inputDefinitionsSnippet;
        }

        if (outFp16WithoutStorage)
        {
            extensions   = outTypeSnippets->extensionsFp16Without16BitStorage;
            capabilities = behaviorCapability + outTypeSnippets->capabilitiesFp16Without16BitStorage;
            types += outTypeSnippets->typeDefinitionsFp16Snippet;
            annotations += outTypeSnippets->typeAnnotationsFp16Snippet;
            ioDefinitions += outTypeSnippets->outputDefinitionsFp16Snippet;
        }
        else
        {
            ioDefinitions += outTypeSnippets->outputDefinitionsSnippet;

            requiresUniformAndStorage16BitBufferAccess |= (outVariableType == FP16);
        }
    }

    bool outFp16TypeUsage = outTypeSnippets->loadStoreRequiresShaderFloat16;
    bool inFp16TypeUsage  = false;

    if (testOperation.isInputTypeRestricted)
    {
        annotations += inTypeSnippets->typeAnnotationsSnippet;
        types += inTypeSnippets->typeDefinitionsSnippet;
        constants += inTypeSnippets->constantsDefinitionsSnippet;

        if (inFp16WithoutStorage)
        {
            annotations += inTypeSnippets->typeAnnotationsFp16Snippet;
            types += inTypeSnippets->typeDefinitionsFp16Snippet;
            capabilities += inTypeSnippets->capabilitiesFp16Without16BitStorage;
            extensions += inTypeSnippets->extensionsFp16Without16BitStorage;
        }
        else
        {
            capabilities += inTypeSnippets->capabilities;
            extensions += inTypeSnippets->extensions;

            requiresUniformAndStorage16BitBufferAccess |= (inVariableType == FP16);
        }

        inFp16TypeUsage = inTypeSnippets->loadStoreRequiresShaderFloat16;
    }

    map<string, string> specializations;
    specializations["extensions"]     = extensions;
    specializations["execution_mode"] = behaviorExecutionMode;
    specializations["annotations"]    = annotations + specOpData.annotations;
    specializations["types"]          = types + specOpData.types;
    specializations["io_definitions"] = ioDefinitions;
    specializations["variables"]      = specOpData.variables;
    specializations["functions"]      = specOpData.functions;
    specializations["save_result"] =
        (outFp16WithoutStorage ? outTypeSnippets->storeResultsFp16Snippet : outTypeSnippets->storeResultsSnippet);
    specializations["arguments"] = specOpData.arguments;
    specializations["commands"]  = specOpData.commands;

    // Build constants. They are only needed sometimes.
    const FloatStatementUsageFlags argsAnyFloatConstMask =
        B_STATEMENT_USAGE_ARGS_CONST_FLOAT | B_STATEMENT_USAGE_ARGS_CONST_FP16 | B_STATEMENT_USAGE_ARGS_CONST_FP32 |
        B_STATEMENT_USAGE_ARGS_CONST_FP64;
    const bool argsUseFPConstants = (specOpData.argumentsUsesFloatConstant & argsAnyFloatConstMask) != 0;
    const FloatStatementUsageFlags commandsAnyFloatConstMask =
        B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_CONST_FP16 |
        B_STATEMENT_USAGE_COMMANDS_CONST_FP32 | B_STATEMENT_USAGE_COMMANDS_CONST_FP64;
    const bool commandsUseFPConstants = (testCaseInfo.operation.statementUsageFlags & commandsAnyFloatConstMask) != 0;
    const bool needConstants          = argsUseFPConstants || commandsUseFPConstants;
    const FloatStatementUsageFlags constsFloatTypeMask =
        B_STATEMENT_USAGE_CONSTS_TYPE_FLOAT | B_STATEMENT_USAGE_CONSTS_TYPE_FP16;
    const bool constsUsesFP16Type             = (testCaseInfo.operation.statementUsageFlags & constsFloatTypeMask) != 0;
    const bool loadStoreRequiresShaderFloat16 = inFp16TypeUsage || outFp16TypeUsage;
    const bool usesFP16Constants              = constsUsesFP16Type || (needConstants && loadStoreRequiresShaderFloat16);

    specializations["constants"] = "";
    if (needConstants || outFp16WithoutStorage)
    {
        specializations["constants"] = constants;
    }
    specializations["constants"] += specOpData.constants;

    // check which format features are needed
    bool float16FeatureRequired = (outVariableType == FP16) || (inVariableType == FP16);
    bool float64FeatureRequired = (outVariableType == FP64) || (inVariableType == FP64);
    bool int64FeatureRequired   = ((outVariableType == UINT64) || (outVariableType == INT64)) ||
                                ((inVariableType == UINT64) || (inVariableType == INT64));

    // Determine required capabilities.
    bool float16CapabilityAlreadyAdded = inFp16WithoutStorage || outFp16WithoutStorage;
    if ((testOperation.floatUsage == FLOAT_ARITHMETIC && float16FeatureRequired && !float16CapabilityAlreadyAdded) ||
        usesFP16Constants)
    {
        capabilities += "OpCapability Float16\n";
    }
    specializations["capabilities"] = capabilities;

    // specialize shader
    const string shaderCode = m_operationShaderTemplate.specialize(specializations);

    // construct input and output buffers of proper types
    TypeValuesSP inTypeValues  = m_typeData.at(inVariableType).values;
    TypeValuesSP outTypeValues = m_typeData.at(outVariableType).values;
    BufferSp inBufferSp        = inTypeValues->constructInputBuffer(testCase.input);
    BufferSp outBufferSp       = outTypeValues->constructOutputBuffer(testCase.expectedOutput);
    csSpec.inputs.push_back(Resource(inBufferSp, VK_DESCRIPTOR_TYPE_STORAGE_BUFFER));
    csSpec.outputs.push_back(Resource(outBufferSp));

    // check which features/properties are needed
    csSpec.assembly      = shaderCode;
    csSpec.numWorkGroups = IVec3(1, 1, 1);
    csSpec.verifyIO      = checkFloatsLUT[outVariableType];

    csSpec.extensions.push_back("VK_KHR_shader_float_controls");

    csSpec.requestedVulkanFeatures.coreFeatures.shaderFloat64 = float64FeatureRequired;
    csSpec.requestedVulkanFeatures.coreFeatures.shaderInt64   = int64FeatureRequired;
    csSpec.requestedVulkanFeatures.ext16BitStorage.uniformAndStorageBuffer16BitAccess =
        float16FeatureRequired && requiresUniformAndStorage16BitBufferAccess;
    csSpec.requestedVulkanFeatures.extFloat16Int8.shaderFloat16 =
        float16CapabilityAlreadyAdded || usesFP16Constants ||
        (float16FeatureRequired && requiresUniformAndStorage16BitBufferAccess &&
         testOperation.floatUsage == FLOAT_ARITHMETIC);

    setupFloatControlsProperties(
        inVariableTypeForCaps, // usualy same as inFloatType - different only for UnpackHalf2x16
        outVariableType, testCase.behaviorFlags, csSpec.requestedVulkanFeatures.floatControlsProperties);
}

void ComputeTestGroupBuilder::fillShaderSpec(const SettingsTestCaseInfo &testCaseInfo, ComputeShaderSpec &csSpec) const
{
    string capabilities;
    string fp16behaviorName;
    string fp32behaviorName;
    string fp64behaviorName;

    ValueId addArgs[2];
    ValueId fp16resultValue;
    ValueId fp32resultValue;
    ValueId fp64resultValue;

    vk::VkPhysicalDeviceFloatControlsProperties &floatControls = csSpec.requestedVulkanFeatures.floatControlsProperties;
    bool fp16Required                                          = testCaseInfo.fp16Option != SO_UNUSED;
    bool fp32Required                                          = testCaseInfo.fp32Option != SO_UNUSED;
    bool fp64Required                                          = testCaseInfo.fp64Option != SO_UNUSED;

    if (testCaseInfo.testedMode == SM_ROUNDING)
    {
        // make sure that only rounding options are used
        DE_ASSERT((testCaseInfo.fp16Option != SO_FLUSH) && (testCaseInfo.fp16Option != SO_PRESERVE) &&
                  (testCaseInfo.fp32Option != SO_FLUSH) && (testCaseInfo.fp32Option != SO_PRESERVE) &&
                  (testCaseInfo.fp64Option != SO_FLUSH) && (testCaseInfo.fp64Option != SO_PRESERVE));

        bool fp16RteRounding = testCaseInfo.fp16Option == SO_RTE;
        bool fp32RteRounding = testCaseInfo.fp32Option == SO_RTE;
        bool fp64RteRounding = testCaseInfo.fp64Option == SO_RTE;

        const string &rte = m_behaviorToName.at(B_RTE_ROUNDING);
        const string &rtz = m_behaviorToName.at(B_RTZ_ROUNDING);

        fp16behaviorName = fp16RteRounding ? rte : rtz;
        fp32behaviorName = fp32RteRounding ? rte : rtz;
        fp64behaviorName = fp64RteRounding ? rte : rtz;

        addArgs[0]      = V_ADD_ARG_A;
        addArgs[1]      = V_ADD_ARG_B;
        fp16resultValue = fp16RteRounding ? V_ADD_RTE_RESULT : V_ADD_RTZ_RESULT;
        fp32resultValue = fp32RteRounding ? V_ADD_RTE_RESULT : V_ADD_RTZ_RESULT;
        fp64resultValue = fp64RteRounding ? V_ADD_RTE_RESULT : V_ADD_RTZ_RESULT;

        capabilities = "OpCapability " + rte +
                       "\n"
                       "OpCapability " +
                       rtz + "\n";

        floatControls.roundingModeIndependence     = testCaseInfo.independenceSetting;
        floatControls.denormBehaviorIndependence   = VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE;
        floatControls.shaderRoundingModeRTEFloat16 = fp16RteRounding;
        floatControls.shaderRoundingModeRTZFloat16 = fp16Required && !fp16RteRounding;
        floatControls.shaderRoundingModeRTEFloat32 = fp32RteRounding;
        floatControls.shaderRoundingModeRTZFloat32 = fp32Required && !fp32RteRounding;
        floatControls.shaderRoundingModeRTEFloat64 = fp64RteRounding;
        floatControls.shaderRoundingModeRTZFloat64 = fp64Required && !fp64RteRounding;
    }
    else // SM_DENORMS
    {
        // make sure that only denorm options are used
        DE_ASSERT((testCaseInfo.fp16Option != SO_RTE) && (testCaseInfo.fp16Option != SO_RTZ) &&
                  (testCaseInfo.fp32Option != SO_RTE) && (testCaseInfo.fp32Option != SO_RTZ) &&
                  (testCaseInfo.fp64Option != SO_RTE) && (testCaseInfo.fp64Option != SO_RTZ));

        bool fp16DenormPreserve = testCaseInfo.fp16Option == SO_PRESERVE;
        bool fp32DenormPreserve = testCaseInfo.fp32Option == SO_PRESERVE;
        bool fp64DenormPreserve = testCaseInfo.fp64Option == SO_PRESERVE;

        const string &preserve = m_behaviorToName.at(B_DENORM_PRESERVE);
        const string &flush    = m_behaviorToName.at(B_DENORM_FLUSH);

        fp16behaviorName = fp16DenormPreserve ? preserve : flush;
        fp32behaviorName = fp32DenormPreserve ? preserve : flush;
        fp64behaviorName = fp64DenormPreserve ? preserve : flush;

        addArgs[0]      = V_DENORM;
        addArgs[1]      = V_DENORM;
        fp16resultValue = fp16DenormPreserve ? V_DENORM_TIMES_TWO : V_ZERO_OR_DENORM_TIMES_TWO;
        fp32resultValue = fp32DenormPreserve ? V_DENORM_TIMES_TWO : V_ZERO;
        fp64resultValue = fp64DenormPreserve ? V_DENORM_TIMES_TWO : V_ZERO;

        capabilities = "OpCapability " + preserve +
                       "\n"
                       "OpCapability " +
                       flush + "\n";

        floatControls.denormBehaviorIndependence     = testCaseInfo.independenceSetting;
        floatControls.roundingModeIndependence       = VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE;
        floatControls.shaderDenormPreserveFloat16    = fp16DenormPreserve;
        floatControls.shaderDenormFlushToZeroFloat16 = fp16Required && !fp16DenormPreserve;
        floatControls.shaderDenormPreserveFloat32    = fp32DenormPreserve;
        floatControls.shaderDenormFlushToZeroFloat32 = fp32Required && !fp32DenormPreserve;
        floatControls.shaderDenormPreserveFloat64    = fp64DenormPreserve;
        floatControls.shaderDenormFlushToZeroFloat64 = fp64Required && !fp64DenormPreserve;
    }

    const auto &fp64Data = m_typeData.at(FP64);
    const auto &fp32Data = m_typeData.at(FP32);
    const auto &fp16Data = m_typeData.at(FP16);

    uint32_t attributeIndex  = 0;
    uint32_t attributeOffset = 0;
    string attribute;
    string extensions     = "";
    string executionModes = "";
    string ioAnnotations  = "";
    string types          = "";
    string inStruct       = "";
    string outDefinitions = "";
    string commands       = "";
    string saveResult     = "";

    // construct single input buffer containing arguments for all float widths
    // (maxPerStageDescriptorStorageBuffers can be min 4 and we need 3 for outputs)
    uint32_t inputOffset = 0;
    std::vector<uint8_t> inputData((fp64Required * sizeof(double) + sizeof(float) + fp16Required * sizeof(deFloat16)) *
                                   2);

    // to follow storage buffer layout rules we store data in ssbo in order 64 -> 16
    if (fp64Required)
    {
        capabilities += fp64Data.snippets->capabilities;
        executionModes += "OpExecutionMode %main " + fp64behaviorName + " 64\n";
        attribute = to_string(attributeIndex);
        ioAnnotations += "OpMemberDecorate %SSBO_in " + attribute + " Offset " + to_string(attributeOffset) + "\n" +
                         fp64Data.snippets->multiOutputAnnotationsSnippet + "OpDecorate %ssbo_f64_out Binding " +
                         to_string(attributeIndex + 1) + "\n";
        types += fp64Data.snippets->minTypeDefinitionsSnippet;
        inStruct += " %type_f64_arr_2";
        outDefinitions += fp64Data.snippets->multiOutputDefinitionsSnippet;
        commands += replace(fp64Data.snippets->multiArgumentsFromInputSnippet, "${attr}", attribute) +
                    "%result64             = OpFAdd %type_f64 %arg1_f64 %arg2_f64\n";
        saveResult += fp64Data.snippets->multiStoreResultsSnippet;
        attributeOffset += 2 * static_cast<uint32_t>(sizeof(double));
        attributeIndex++;

        fp64Data.values->fillInputData(addArgs, inputData, inputOffset);

        // construct separate buffers for outputs to make validation easier
        BufferSp fp64OutBufferSp = fp64Data.values->constructOutputBuffer(fp64resultValue);
        csSpec.outputs.push_back(Resource(fp64OutBufferSp, vk::VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
                                          reinterpret_cast<void *>(BufferDataType::DATA_FP64)));

        csSpec.requestedVulkanFeatures.coreFeatures.shaderFloat64 = VK_TRUE;
    }
    if (fp32Required)
    {
        executionModes += "OpExecutionMode %main " + fp32behaviorName + " 32\n";
        attribute = to_string(attributeIndex);
        ioAnnotations += "OpMemberDecorate %SSBO_in " + attribute + " Offset " + to_string(attributeOffset) + "\n" +
                         fp32Data.snippets->multiOutputAnnotationsSnippet + "OpDecorate %ssbo_f32_out Binding " +
                         to_string(attributeIndex + 1) + "\n";
        types += fp32Data.snippets->minTypeDefinitionsSnippet;
        inStruct += " %type_f32_arr_2";
        outDefinitions += fp32Data.snippets->multiOutputDefinitionsSnippet;
        commands += replace(fp32Data.snippets->multiArgumentsFromInputSnippet, "${attr}", attribute) +
                    "%result32             = OpFAdd %type_f32 %arg1_f32 %arg2_f32\n";
        saveResult += fp32Data.snippets->multiStoreResultsSnippet;
        attributeOffset += 2 * static_cast<uint32_t>(sizeof(float));
        attributeIndex++;

        fp32Data.values->fillInputData(addArgs, inputData, inputOffset);

        BufferSp fp32OutBufferSp = fp32Data.values->constructOutputBuffer(fp32resultValue);
        csSpec.outputs.push_back(Resource(fp32OutBufferSp, vk::VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
                                          reinterpret_cast<void *>(BufferDataType::DATA_FP32)));
    }
    if (fp16Required)
    {
        if (testCaseInfo.fp16Without16BitStorage)
        {
            capabilities += fp16Data.snippets->capabilitiesFp16Without16BitStorage;
            extensions += fp16Data.snippets->extensionsFp16Without16BitStorage;
            executionModes += "OpExecutionMode %main " + fp16behaviorName + " 16\n";
            attribute = to_string(attributeIndex);
            ioAnnotations += "OpMemberDecorate %SSBO_in " + attribute + " Offset " + to_string(attributeOffset) + "\n" +
                             fp16Data.snippets->multiOutputAnnotationsFp16Snippet +
                             "OpDecorate %ssbo_u32_out Binding " + to_string(attributeIndex + 1) + "\n";
            types += fp16Data.snippets->minTypeDefinitionsSnippet + fp16Data.snippets->typeDefinitionsFp16Snippet +
                     "%type_f16_vec2        = OpTypeVector %type_f16 2\n";
            inStruct += " %type_u32_arr_1";
            outDefinitions += fp16Data.snippets->multiOutputDefinitionsFp16Snippet;
            commands += replace(fp16Data.snippets->multiArgumentsFromInputFp16Snippet, "${attr}", attribute) +
                        "%result16             = OpFAdd %type_f16 %arg1_f16 %arg2_f16\n";
            saveResult += fp16Data.snippets->multiStoreResultsFp16Snippet;

            csSpec.extensions.push_back("VK_KHR_shader_float16_int8");
            csSpec.requestedVulkanFeatures.extFloat16Int8.shaderFloat16 = true;
        }
        else
        {
            capabilities += fp16Data.snippets->capabilities + "OpCapability Float16\n";
            extensions += fp16Data.snippets->extensions;
            executionModes += "OpExecutionMode %main " + fp16behaviorName + " 16\n";
            attribute = to_string(attributeIndex);
            ioAnnotations += "OpMemberDecorate %SSBO_in " + attribute + " Offset " + to_string(attributeOffset) + "\n" +
                             fp16Data.snippets->multiOutputAnnotationsSnippet + "OpDecorate %ssbo_f16_out Binding " +
                             to_string(attributeIndex + 1) + "\n";
            types += fp16Data.snippets->minTypeDefinitionsSnippet;
            inStruct += " %type_f16_arr_2";
            outDefinitions += fp16Data.snippets->multiOutputDefinitionsSnippet;
            commands += replace(fp16Data.snippets->multiArgumentsFromInputSnippet, "${attr}", attribute) +
                        "%result16             = OpFAdd %type_f16 %arg1_f16 %arg2_f16\n";
            saveResult += fp16Data.snippets->multiStoreResultsSnippet;

            csSpec.extensions.push_back("VK_KHR_16bit_storage");
            csSpec.requestedVulkanFeatures.ext16BitStorage.uniformAndStorageBuffer16BitAccess = true;
        }

        fp16Data.values->fillInputData(addArgs, inputData, inputOffset);

        BufferSp fp16OutBufferSp = fp16Data.values->constructOutputBuffer(fp16resultValue);
        csSpec.outputs.push_back(Resource(fp16OutBufferSp, vk::VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
                                          reinterpret_cast<void *>(BufferDataType::DATA_FP16)));
    }

    BufferSp inBufferSp(new Buffer<uint8_t>(inputData));
    csSpec.inputs.push_back(Resource(inBufferSp, VK_DESCRIPTOR_TYPE_STORAGE_BUFFER));

    map<string, string> specializations = {
        {"capabilities", capabilities},      {"extensions", extensions}, {"execution_modes", executionModes},
        {"io_annotations", ioAnnotations},   {"types", types},           {"in_struct", inStruct},
        {"out_definitions", outDefinitions}, {"commands", commands},     {"save_result", saveResult}};

    // specialize shader
    const string shaderCode = m_settingsShaderTemplate.specialize(specializations);

    csSpec.assembly      = shaderCode;
    csSpec.numWorkGroups = IVec3(1, 1, 1);
    csSpec.verifyIO      = checkMixedFloats;
    csSpec.extensions.push_back("VK_KHR_shader_float_controls");
}

void getGraphicsShaderCode(vk::SourceCollections &dst, InstanceContext context)
{
    // this function is used only by GraphicsTestGroupBuilder but it couldn't
    // be implemented as a method because of how addFunctionCaseWithPrograms
    // was implemented

    SpirvVersion targetSpirvVersion = context.resources.spirvVersion;
    const uint32_t vulkanVersion    = dst.usedVulkanVersion;

    static const string vertexTemplate =
        "OpCapability Shader\n"
        "${vert_capabilities}"

        "OpExtension \"SPV_KHR_float_controls\"\n"
        "${vert_extensions}"

        "%std450            = OpExtInstImport \"GLSL.std.450\"\n"
        "OpMemoryModel Logical GLSL450\n"
        "OpEntryPoint Vertex %main \"main\" %BP_stream %BP_position %BP_color %BP_gl_VertexIndex %BP_gl_InstanceIndex "
        "%BP_vertex_color %BP_vertex_result \n"
        "${vert_execution_mode}"

        "OpMemberDecorate %BP_gl_PerVertex 0 BuiltIn Position\n"
        "OpMemberDecorate %BP_gl_PerVertex 1 BuiltIn PointSize\n"
        "OpMemberDecorate %BP_gl_PerVertex 2 BuiltIn ClipDistance\n"
        "OpMemberDecorate %BP_gl_PerVertex 3 BuiltIn CullDistance\n"
        "OpDecorate %BP_gl_PerVertex Block\n"
        "OpDecorate %BP_position Location 0\n"
        "OpDecorate %BP_color Location 1\n"
        "OpDecorate %BP_vertex_color Location 1\n"
        "OpDecorate %BP_vertex_result Location 2\n"
        "OpDecorate %BP_vertex_result Flat\n"
        "OpDecorate %BP_gl_VertexIndex BuiltIn VertexIndex\n"
        "OpDecorate %BP_gl_InstanceIndex BuiltIn InstanceIndex\n"

        // some tests require additional annotations
        "${vert_annotations}"

        // types required by most of tests
        "%type_void            = OpTypeVoid\n"
        "%type_voidf           = OpTypeFunction %type_void\n"
        "%type_bool            = OpTypeBool\n"
        "%type_i32             = OpTypeInt 32 1\n"
        "%type_u32             = OpTypeInt 32 0\n"
        "%type_u32_vec2        = OpTypeVector %type_u32 2\n"
        "%type_i32_iptr        = OpTypePointer Input %type_i32\n"
        "%type_i32_optr        = OpTypePointer Output %type_i32\n"
        "%type_i32_fptr        = OpTypePointer Function %type_i32\n"

        // constants required by most of tests
        "%c_i32_0              = OpConstant %type_i32 0\n"
        "%c_i32_1              = OpConstant %type_i32 1\n"
        "%c_i32_2              = OpConstant %type_i32 2\n"
        "%c_u32_1              = OpConstant %type_u32 1\n"

        // if input float type has different width then output then
        // both types are defined here along with all types derived from
        // them that are commonly used by tests; some tests also define
        // their own types (those that are needed just by this single test)
        "${vert_types}"

        // SSBO is not universally supported for storing
        // data in vertex stages - it is onle read here
        "${vert_io_definitions}"

        "%BP_gl_PerVertex      = OpTypeStruct %type_f32_vec4 %type_f32 %type_f32_arr_1 %type_f32_arr_1\n"
        "%BP_gl_PerVertex_optr = OpTypePointer Output %BP_gl_PerVertex\n"
        "%BP_stream            = OpVariable %BP_gl_PerVertex_optr Output\n"
        "%BP_position          = OpVariable %type_f32_vec4_iptr Input\n"
        "%BP_color             = OpVariable %type_f32_vec4_iptr Input\n"
        "%BP_gl_VertexIndex    = OpVariable %type_i32_iptr Input\n"
        "%BP_gl_InstanceIndex  = OpVariable %type_i32_iptr Input\n"
        "%BP_vertex_color      = OpVariable %type_f32_vec4_optr Output\n"

        // set of default constants per float type is placed here,
        // operation tests can also define additional constants.
        "${vert_constants}"

        // O_RETURN_VAL defines function here and because
        // of that this token needs to be directly before main function.
        "${vert_functions}"

        "%main                 = OpFunction %type_void None %type_voidf\n"
        "%label                = OpLabel\n"

        "${vert_variables}"

        "%position             = OpLoad %type_f32_vec4 %BP_position\n"
        "%gl_pos               = OpAccessChain %type_f32_vec4_optr %BP_stream %c_i32_0\n"
        "OpStore %gl_pos %position\n"
        "%color                = OpLoad %type_f32_vec4 %BP_color\n"
        "OpStore %BP_vertex_color %color\n"

        // this token is filled only when vertex stage is tested;
        // depending on test case arguments are either read from input ssbo
        // or generated in spir-v code - in later case ssbo is not used
        "${vert_arguments}"

        // when vertex shader is tested then test operations are performed
        // here and passed to fragment stage; if fragment stage ts tested
        // then ${comands} and ${vert_process_result} are rplaced with nop
        "${vert_commands}"

        "${vert_process_result}"

        "OpReturn\n"
        "OpFunctionEnd\n";

    static const string fragmentTemplate =
        "OpCapability Shader\n"
        "${frag_capabilities}"

        "OpExtension \"SPV_KHR_float_controls\"\n"
        "${frag_extensions}"

        "%std450            = OpExtInstImport \"GLSL.std.450\"\n"
        "OpMemoryModel Logical GLSL450\n"
        "OpEntryPoint Fragment %main \"main\" %BP_vertex_color %BP_vertex_result %BP_fragColor %BP_gl_FragCoord \n"
        "OpExecutionMode %main OriginUpperLeft\n"
        "${frag_execution_mode}"

        "OpDecorate %BP_fragColor Location 0\n"
        "OpDecorate %BP_vertex_color Location 1\n"
        "OpDecorate %BP_vertex_result Location 2\n"
        "OpDecorate %BP_vertex_result Flat\n"
        "OpDecorate %BP_gl_FragCoord BuiltIn FragCoord\n"

        // some tests require additional annotations
        "${frag_annotations}"

        // types required by most of tests
        "%type_void            = OpTypeVoid\n"
        "%type_voidf           = OpTypeFunction %type_void\n"
        "%type_bool            = OpTypeBool\n"
        "%type_i32             = OpTypeInt 32 1\n"
        "%type_u32             = OpTypeInt 32 0\n"
        "%type_u32_vec2        = OpTypeVector %type_u32 2\n"
        "%type_i32_iptr        = OpTypePointer Input %type_i32\n"
        "%type_i32_optr        = OpTypePointer Output %type_i32\n"
        "%type_i32_fptr        = OpTypePointer Function %type_i32\n"

        // constants required by most of tests
        "%c_i32_0              = OpConstant %type_i32 0\n"
        "%c_i32_1              = OpConstant %type_i32 1\n"
        "%c_i32_2              = OpConstant %type_i32 2\n"
        "%c_u32_1              = OpConstant %type_u32 1\n"

        // if input float type has different width then output then
        // both types are defined here along with all types derived from
        // them that are commonly used by tests; some tests also define
        // their own types (those that are needed just by this single test)
        "${frag_types}"

        "%BP_gl_FragCoord      = OpVariable %type_f32_vec4_iptr Input\n"
        "%BP_vertex_color      = OpVariable %type_f32_vec4_iptr Input\n"
        "%BP_fragColor         = OpVariable %type_f32_vec4_optr Output\n"

        // SSBO definitions
        "${frag_io_definitions}"

        // set of default constants per float type is placed here,
        // operation tests can also define additional constants.
        "${frag_constants}"

        // O_RETURN_VAL defines function here and because
        // of that this token needs to be directly before main function.
        "${frag_functions}"

        "%main                 = OpFunction %type_void None %type_voidf\n"
        "%label                = OpLabel\n"

        "${frag_variables}"

        // just pass vertex color - rendered image is not important in our case
        "%vertex_color         = OpLoad %type_f32_vec4 %BP_vertex_color\n"
        "OpStore %BP_fragColor %vertex_color\n"

        // this token is filled only when fragment stage is tested;
        // depending on test case arguments are either read from input ssbo or
        // generated in spir-v code - in later case ssbo is used only for output
        "${frag_arguments}"

        // when fragment shader is tested then test operations are performed
        // here and saved to ssbo; if vertex stage was tested then its
        // result is just saved to ssbo here
        "${frag_commands}"
        "${frag_process_result}"

        "OpReturn\n"
        "OpFunctionEnd\n";

    dst.spirvAsmSources.add("vert", DE_NULL) << StringTemplate(vertexTemplate).specialize(context.testCodeFragments)
                                             << SpirVAsmBuildOptions(vulkanVersion, targetSpirvVersion);
    dst.spirvAsmSources.add("frag", DE_NULL) << StringTemplate(fragmentTemplate).specialize(context.testCodeFragments)
                                             << SpirVAsmBuildOptions(vulkanVersion, targetSpirvVersion);
}

// GraphicsTestGroupBuilder iterates over all test cases and creates test for both
// vertex and fragment stages. As in most spirv-assembly tests, tests here are also
// executed using functionality defined in vktSpvAsmGraphicsShaderTestUtil.cpp but
// because one of requirements during development was that SSBO wont be used in
// vertex stage we couldn't use createTestForStage functions - we need a custom
// version for both vertex and fragmen shaders at the same time. This was required
// as we needed to pass result from vertex stage to fragment stage where it could
// be saved to ssbo. To achieve that InstanceContext is created manually in
// createInstanceContext method.
class GraphicsTestGroupBuilder : public TestGroupBuilderBase
{
public:
    void init();

    void createOperationTests(TestCaseGroup *parentGroup, const char *groupName, VariableType variableType,
                              bool argumentsFromInput) override;
    void createSettingsTests(TestCaseGroup *parentGroup) override;

protected:
    InstanceContext createInstanceContext(const OperationTestCaseInfo &testCaseInfo) const;

private:
    TestCasesBuilder m_testCaseBuilder;
};

void GraphicsTestGroupBuilder::init()
{
    m_testCaseBuilder.init();
}

void GraphicsTestGroupBuilder::createOperationTests(TestCaseGroup *parentGroup, const char *groupName,
                                                    VariableType variableType, bool argumentsFromInput)
{
    TestContext &testCtx = parentGroup->getTestContext();
    TestCaseGroup *group = new TestCaseGroup(testCtx, groupName);
    parentGroup->addChild(group);

    // create test cases for vertex stage
    TestCaseVect testCases;
    m_testCaseBuilder.build(testCases, m_typeData[variableType].testResults, argumentsFromInput);

    for (auto &testCase : testCases)
    {
        // skip cases with undefined output
        if (testCase.expectedOutput == V_UNUSED)
            continue;

        // FPRoundingMode decoration can be applied only to conversion instruction that is used as the object
        // argument of an OpStore storing through a pointer to a 16-bit floating-point object in Uniform, or
        // PushConstant, or Input, or Output Storage Classes. SSBO writes are not commonly supported
        // in VS so this test case needs to be skiped for vertex stage.
        if ((testCase.operationId == OID_ORTZ_ROUND) || (testCase.operationId == OID_ORTE_ROUND))
            continue;

        OperationTestCaseInfo testCaseInfo = {variableType, argumentsFromInput, VK_SHADER_STAGE_VERTEX_BIT,
                                              m_testCaseBuilder.getOperation(testCase.operationId), testCase};

        InstanceContext ctxVertex = createInstanceContext(testCaseInfo);
        string testName           = replace(testCase.baseName, "op", testCaseInfo.operation.name);

        addFunctionCaseWithPrograms<InstanceContext>(group, testName + "_vert", getGraphicsShaderCode,
                                                     runAndVerifyDefaultPipeline, ctxVertex);
    }

    // create test cases for fragment stage
    testCases.clear();
    m_testCaseBuilder.build(testCases, m_typeData[variableType].testResults, argumentsFromInput);

    for (auto &testCase : testCases)
    {
        // skip cases with undefined output
        if (testCase.expectedOutput == V_UNUSED)
            continue;

        OperationTestCaseInfo testCaseInfo = {variableType, argumentsFromInput, VK_SHADER_STAGE_FRAGMENT_BIT,
                                              m_testCaseBuilder.getOperation(testCase.operationId), testCase};

        InstanceContext ctxFragment = createInstanceContext(testCaseInfo);
        string testName             = replace(testCase.baseName, "op", testCaseInfo.operation.name);

        addFunctionCaseWithPrograms<InstanceContext>(group, testName + "_frag", getGraphicsShaderCode,
                                                     runAndVerifyDefaultPipeline, ctxFragment);
    }
}

void GraphicsTestGroupBuilder::createSettingsTests(TestCaseGroup *parentGroup)
{
    DE_UNREF(parentGroup);

    // WG decided that testing settings only for compute stage is sufficient
}

InstanceContext GraphicsTestGroupBuilder::createInstanceContext(const OperationTestCaseInfo &testCaseInfo) const
{
    // LUT storing functions used to verify test results
    const VerifyIOFunc checkFloatsLUT[] = {checkFloats<Float16, deFloat16>, checkFloats<Float32, float>,
                                           checkFloats<Float64, double>};

    // 32-bit float types are always needed for standard operations on color
    // if tested operation does not require fp32 for either input or output
    // then this minimal type definitions must be appended to types section
    const string f32TypeMinimalRequired = "%type_f32             = OpTypeFloat 32\n"
                                          "%type_f32_arr_1       = OpTypeArray %type_f32 %c_i32_1\n"
                                          "%type_f32_iptr        = OpTypePointer Input %type_f32\n"
                                          "%type_f32_optr        = OpTypePointer Output %type_f32\n"
                                          "%type_f32_vec4        = OpTypeVector %type_f32 4\n"
                                          "%type_f32_vec4_iptr   = OpTypePointer Input %type_f32_vec4\n"
                                          "%type_f32_vec4_optr   = OpTypePointer Output %type_f32_vec4\n";

    const Operation &testOperation    = testCaseInfo.operation;
    const OperationTestCase &testCase = testCaseInfo.testCase;
    VariableType outVariableType      = testCaseInfo.outVariableType;
    VkShaderStageFlagBits testedStage = testCaseInfo.testedStage;

    DE_ASSERT((testedStage == VK_SHADER_STAGE_VERTEX_BIT) || (testedStage == VK_SHADER_STAGE_FRAGMENT_BIT));

    SpecializedOperation specOpData;
    specializeOperation(testCaseInfo, specOpData);

    TypeSnippetsSP inTypeSnippets  = specOpData.inTypeSnippets;
    TypeSnippetsSP outTypeSnippets = specOpData.outTypeSnippets;
    VariableType inVariableType    = specOpData.inVariableType;

    bool outFp16WithoutStorage = (outVariableType == FP16) && testCase.fp16Without16BitStorage;
    bool inFp16WithoutStorage  = (inVariableType == FP16) && testCase.fp16Without16BitStorage;

    // The feature is required if OpCapability StorageUniform16 is used in the shader.
    bool requiresUniformAndStorage16BitBufferAccess = false;

    // There may be several reasons why we need the shaderFloat16 Vulkan feature.
    bool needsShaderFloat16 = inFp16WithoutStorage || outFp16WithoutStorage;
    // There are some weird cases where we need the constants, but would otherwise drop them.
    bool needsSpecialConstants = false;

    // UnpackHalf2x16 is a corner case - it returns two 32-bit floats but
    // internaly operates on fp16 and this type should be used by float controls
    VariableType inVariableTypeForCaps = inVariableType;
    string inFloatWidthForCaps         = inTypeSnippets->bitWidth;
    if (testCase.operationId == OID_UPH_DENORM)
    {
        inVariableTypeForCaps = FP16;
        inFloatWidthForCaps   = "16";
    }

    string behaviorCapability;
    string behaviorExecutionMode;
    getBehaviorCapabilityAndExecutionMode(testCase.behaviorFlags, inFloatWidthForCaps, outTypeSnippets->bitWidth,
                                          behaviorCapability, behaviorExecutionMode);

    // check which format features are needed
    bool float16FeatureRequired = (inVariableType == FP16) || (outVariableType == FP16);
    bool float64FeatureRequired = (inVariableType == FP64) || (outVariableType == FP64);
    bool int64FeatureRequired   = ((inVariableType == UINT64) || (inVariableType == INT64)) ||
                                ((outVariableType == UINT64) || (outVariableType == INT64));

    string vertExecutionMode;
    string fragExecutionMode;
    string vertCapabilities;
    string fragCapabilities;
    string vertExtensions;
    string fragExtensions;
    string vertAnnotations;
    string fragAnnotations;
    string vertTypes;
    string fragTypes;
    string vertConstants;
    string fragConstants;
    string vertFunctions;
    string fragFunctions;
    string vertIODefinitions;
    string fragIODefinitions;
    string vertArguments;
    string fragArguments;
    string vertVariables;
    string fragVariables;
    string vertCommands;
    string fragCommands;
    string vertProcessResult;
    string fragProcessResult;

    // check if operation should be executed in vertex stage
    if (testedStage == VK_SHADER_STAGE_VERTEX_BIT)
    {
        vertAnnotations = inTypeSnippets->inputAnnotationsSnippet + inTypeSnippets->typeAnnotationsSnippet;
        fragAnnotations = outTypeSnippets->outputAnnotationsSnippet + outTypeSnippets->typeAnnotationsSnippet;
        vertFunctions   = specOpData.functions;

        // check if input type is different from tested type (conversion operations)
        if (testOperation.isInputTypeRestricted)
        {
            vertCapabilities = behaviorCapability + inTypeSnippets->capabilities + outTypeSnippets->capabilities;
            fragCapabilities = outTypeSnippets->capabilities;
            vertExtensions   = inTypeSnippets->extensions + outTypeSnippets->extensions;
            fragExtensions   = outTypeSnippets->extensions;
            vertTypes        = inTypeSnippets->typeDefinitionsSnippet + outTypeSnippets->typeDefinitionsSnippet +
                        outTypeSnippets->varyingsTypesSnippet;
            if (inFp16WithoutStorage)
                vertTypes += inTypeSnippets->typeDefinitionsFp16Snippet;

            fragTypes     = outTypeSnippets->typeDefinitionsSnippet + outTypeSnippets->varyingsTypesSnippet;
            vertConstants = inTypeSnippets->constantsDefinitionsSnippet + outTypeSnippets->constantsDefinitionsSnippet;
            fragConstants = outTypeSnippets->constantsDefinitionsSnippet;

            requiresUniformAndStorage16BitBufferAccess |= (inVariableType == FP16);
        }
        else
        {
            // input and output types are the same (majority of operations)

            vertCapabilities = behaviorCapability + outTypeSnippets->capabilities;
            fragCapabilities = vertCapabilities;
            vertExtensions   = outTypeSnippets->extensions;
            fragExtensions   = vertExtensions;
            vertTypes        = outTypeSnippets->typeDefinitionsSnippet + outTypeSnippets->varyingsTypesSnippet;
            fragTypes        = vertTypes;
            vertConstants    = outTypeSnippets->constantsDefinitionsSnippet;
            fragConstants    = outTypeSnippets->constantsDefinitionsSnippet;
        }

        requiresUniformAndStorage16BitBufferAccess |= (outVariableType == FP16);

        if (outVariableType != FP32)
        {
            fragTypes += f32TypeMinimalRequired;
            if (inVariableType != FP32)
                vertTypes += f32TypeMinimalRequired;
        }

        vertAnnotations += specOpData.annotations;
        vertTypes += specOpData.types;
        vertConstants += specOpData.constants;

        vertExecutionMode = behaviorExecutionMode;
        fragExecutionMode = "";
        vertIODefinitions = inTypeSnippets->inputDefinitionsSnippet + outTypeSnippets->outputVaryingsSnippet;
        fragIODefinitions = outTypeSnippets->inputVaryingsSnippet + outTypeSnippets->outputDefinitionsSnippet;
        vertArguments     = specOpData.arguments;
        fragArguments     = "";
        vertVariables     = specOpData.variables;
        fragVariables     = "";
        vertCommands      = specOpData.commands;
        fragCommands      = "";
        vertProcessResult = outTypeSnippets->storeVertexResultSnippet;
        fragProcessResult = outTypeSnippets->loadVertexResultSnippet + outTypeSnippets->storeResultsSnippet;

        if (inFp16WithoutStorage)
        {
            vertAnnotations += inTypeSnippets->typeAnnotationsFp16Snippet;
            vertIODefinitions = inTypeSnippets->inputDefinitionsFp16Snippet + outTypeSnippets->outputVaryingsSnippet;
        }

        if (outFp16WithoutStorage)
        {
            vertTypes += outTypeSnippets->typeDefinitionsFp16Snippet;
            fragTypes += outTypeSnippets->typeDefinitionsFp16Snippet;
            fragAnnotations += outTypeSnippets->typeAnnotationsFp16Snippet;
            fragIODefinitions = outTypeSnippets->inputVaryingsSnippet + outTypeSnippets->outputDefinitionsFp16Snippet;
            fragProcessResult = outTypeSnippets->loadVertexResultSnippet + outTypeSnippets->storeResultsFp16Snippet;
        }

        needsShaderFloat16 |= outTypeSnippets->loadStoreRequiresShaderFloat16;
    }
    else // perform test in fragment stage - vertex stage is empty
    {
        fragFunctions = specOpData.functions;
        // check if input type is different from tested type
        if (testOperation.isInputTypeRestricted)
        {
            fragAnnotations = inTypeSnippets->inputAnnotationsSnippet + inTypeSnippets->typeAnnotationsSnippet +
                              outTypeSnippets->outputAnnotationsSnippet + outTypeSnippets->typeAnnotationsSnippet;
            fragCapabilities = behaviorCapability +
                               (inFp16WithoutStorage ? inTypeSnippets->capabilitiesFp16Without16BitStorage :
                                                       inTypeSnippets->capabilities) +
                               (outFp16WithoutStorage ? outTypeSnippets->capabilitiesFp16Without16BitStorage :
                                                        outTypeSnippets->capabilities);
            fragExtensions = (inFp16WithoutStorage ? inTypeSnippets->extensionsFp16Without16BitStorage :
                                                     inTypeSnippets->extensions) +
                             (outFp16WithoutStorage ? outTypeSnippets->extensionsFp16Without16BitStorage :
                                                      outTypeSnippets->extensions);
            fragTypes     = inTypeSnippets->typeDefinitionsSnippet + outTypeSnippets->typeDefinitionsSnippet;
            fragConstants = inTypeSnippets->constantsDefinitionsSnippet + outTypeSnippets->constantsDefinitionsSnippet;
            ;
            requiresUniformAndStorage16BitBufferAccess |=
                ((inVariableType == FP16) && (testCase.fp16Without16BitStorage == false));
        }
        else
        {
            // input and output types are the same

            fragAnnotations = inTypeSnippets->inputAnnotationsSnippet + inTypeSnippets->typeAnnotationsSnippet +
                              outTypeSnippets->outputAnnotationsSnippet;
            fragCapabilities =
                behaviorCapability + (outFp16WithoutStorage ? outTypeSnippets->capabilitiesFp16Without16BitStorage :
                                                              outTypeSnippets->capabilities);
            fragExtensions = (outFp16WithoutStorage ? outTypeSnippets->extensionsFp16Without16BitStorage :
                                                      outTypeSnippets->extensions);
            fragTypes      = outTypeSnippets->typeDefinitionsSnippet;
            fragConstants  = outTypeSnippets->constantsDefinitionsSnippet;
        }

        requiresUniformAndStorage16BitBufferAccess |=
            ((outVariableType == FP16) && (testCase.fp16Without16BitStorage == false));

        // varying is not used but it needs to be specified so lets use type_i32 for it
        string unusedVertVarying = "%BP_vertex_result     = OpVariable %type_i32_optr Output\n";
        string unusedFragVarying = "%BP_vertex_result     = OpVariable %type_i32_iptr Input\n";

        vertCapabilities = "";
        vertExtensions   = "";
        vertAnnotations  = "OpDecorate %type_f32_arr_1 ArrayStride 4\n";
        vertTypes        = f32TypeMinimalRequired;
        vertConstants    = "";

        if ((outVariableType != FP32) && (inVariableType != FP32))
            fragTypes += f32TypeMinimalRequired;

        fragAnnotations += specOpData.annotations;
        fragTypes += specOpData.types;
        fragConstants += specOpData.constants;

        vertExecutionMode = "";
        fragExecutionMode = behaviorExecutionMode;
        vertIODefinitions = unusedVertVarying;
        fragIODefinitions = unusedFragVarying;

        vertArguments     = "";
        fragArguments     = specOpData.arguments;
        vertVariables     = "";
        fragVariables     = specOpData.variables;
        vertCommands      = "";
        fragCommands      = specOpData.commands;
        vertProcessResult = "";
        fragProcessResult = outTypeSnippets->storeResultsSnippet;

        if (inFp16WithoutStorage)
        {
            fragAnnotations += inTypeSnippets->typeAnnotationsFp16Snippet;
            if (testOperation.isInputTypeRestricted)
            {
                fragTypes += inTypeSnippets->typeDefinitionsFp16Snippet;
            }
            fragIODefinitions += inTypeSnippets->inputDefinitionsFp16Snippet;
        }
        else
        {
            fragIODefinitions += inTypeSnippets->inputDefinitionsSnippet;
        }

        if (outFp16WithoutStorage)
        {
            if (testOperation.isInputTypeRestricted)
            {
                fragAnnotations += outTypeSnippets->typeAnnotationsFp16Snippet;
            }
            fragTypes += outTypeSnippets->typeDefinitionsFp16Snippet;
            fragIODefinitions += outTypeSnippets->outputDefinitionsFp16Snippet;
            fragProcessResult = outTypeSnippets->storeResultsFp16Snippet;
        }
        else
        {
            fragIODefinitions += outTypeSnippets->outputDefinitionsSnippet;
        }

        if (!testCaseInfo.argumentsFromInput)
        {
            switch (testCaseInfo.testCase.operationId)
            {
            case OID_CONV_FROM_FP32:
            case OID_CONV_FROM_FP64:
                needsSpecialConstants = true;
                break;
            default:
                break;
            }
        }
    }

    // Another reason we need shaderFloat16 is the executable instructions uses fp16
    // in a way not supported by the 16bit storage extension.
    needsShaderFloat16 |= float16FeatureRequired && testOperation.floatUsage == FLOAT_ARITHMETIC;

    // Constants are only needed sometimes.  Drop them in the fp16 case if the code doesn't need
    // them, and if we don't otherwise need shaderFloat16.
    bool needsFP16Constants = needsShaderFloat16 || needsSpecialConstants || outFp16WithoutStorage;

    if (!needsFP16Constants && float16FeatureRequired)
    {
        // Check various code fragments
        const FloatStatementUsageFlags commandsFloatConstMask =
            B_STATEMENT_USAGE_COMMANDS_CONST_FLOAT | B_STATEMENT_USAGE_COMMANDS_CONST_FP16;
        const bool commandsUsesFloatConstant =
            (testCaseInfo.operation.statementUsageFlags & commandsFloatConstMask) != 0;
        const FloatStatementUsageFlags argumentsFloatConstMask =
            B_STATEMENT_USAGE_ARGS_CONST_FLOAT | B_STATEMENT_USAGE_ARGS_CONST_FP16;
        const bool argumentsUsesFloatConstant = (specOpData.argumentsUsesFloatConstant & argumentsFloatConstMask) != 0;
        bool hasFP16ConstsInCommandsOrArguments = commandsUsesFloatConstant || argumentsUsesFloatConstant;

        needsFP16Constants |= hasFP16ConstsInCommandsOrArguments;

        if (!needsFP16Constants)
        {
            vertConstants = "";
            fragConstants = "";
        }
    }
    needsShaderFloat16 |= needsFP16Constants;

    if (needsShaderFloat16)
    {
        vertCapabilities += "OpCapability Float16\n";
        fragCapabilities += "OpCapability Float16\n";
    }

    map<string, string> specializations;
    specializations["vert_capabilities"]   = vertCapabilities;
    specializations["vert_extensions"]     = vertExtensions;
    specializations["vert_execution_mode"] = vertExecutionMode;
    specializations["vert_annotations"]    = vertAnnotations;
    specializations["vert_types"]          = vertTypes;
    specializations["vert_constants"]      = vertConstants;
    specializations["vert_io_definitions"] = vertIODefinitions;
    specializations["vert_arguments"]      = vertArguments;
    specializations["vert_variables"]      = vertVariables;
    specializations["vert_functions"]      = vertFunctions;
    specializations["vert_commands"]       = vertCommands;
    specializations["vert_process_result"] = vertProcessResult;
    specializations["frag_capabilities"]   = fragCapabilities;
    specializations["frag_extensions"]     = fragExtensions;
    specializations["frag_execution_mode"] = fragExecutionMode;
    specializations["frag_annotations"]    = fragAnnotations;
    specializations["frag_types"]          = fragTypes;
    specializations["frag_constants"]      = fragConstants;
    specializations["frag_functions"]      = fragFunctions;
    specializations["frag_io_definitions"] = fragIODefinitions;
    specializations["frag_arguments"]      = fragArguments;
    specializations["frag_variables"]      = fragVariables;
    specializations["frag_commands"]       = fragCommands;
    specializations["frag_process_result"] = fragProcessResult;

    // colors are not used by the test - input is passed via uniform buffer
    RGBA defaultColors[4] = {RGBA::white(), RGBA::red(), RGBA::green(), RGBA::blue()};

    // construct input and output buffers of proper types
    TypeValuesSP inTypeValues  = m_typeData.at(inVariableType).values;
    TypeValuesSP outTypeValues = m_typeData.at(outVariableType).values;
    BufferSp inBufferSp        = inTypeValues->constructInputBuffer(testCase.input);
    BufferSp outBufferSp       = outTypeValues->constructOutputBuffer(testCase.expectedOutput);

    vkt::SpirVAssembly::GraphicsResources resources;
    resources.inputs.push_back(Resource(inBufferSp, VK_DESCRIPTOR_TYPE_STORAGE_BUFFER));
    resources.outputs.push_back(Resource(outBufferSp, VK_DESCRIPTOR_TYPE_STORAGE_BUFFER));
    resources.verifyIO = checkFloatsLUT[outVariableType];

    StageToSpecConstantMap noSpecConstants;
    PushConstants noPushConstants;
    GraphicsInterfaces noInterfaces;

    VulkanFeatures vulkanFeatures;
    setupFloatControlsProperties(
        inVariableTypeForCaps, // usualy same as inFloatType - different only for UnpackHalf2x16
        outVariableType, testCase.behaviorFlags, vulkanFeatures.floatControlsProperties);
    vulkanFeatures.coreFeatures.fragmentStoresAndAtomics = true;
    vulkanFeatures.coreFeatures.shaderFloat64            = float64FeatureRequired;
    vulkanFeatures.coreFeatures.shaderInt64              = int64FeatureRequired;
    vulkanFeatures.extFloat16Int8.shaderFloat16          = needsShaderFloat16;
    vulkanFeatures.ext16BitStorage.uniformAndStorageBuffer16BitAccess =
        float16FeatureRequired && requiresUniformAndStorage16BitBufferAccess;

    vector<string> extensions;
    extensions.push_back("VK_KHR_shader_float_controls");

    InstanceContext ctx(defaultColors, defaultColors, specializations, noSpecConstants, noPushConstants, resources,
                        noInterfaces, extensions, vulkanFeatures, testedStage);

    ctx.moduleMap["vert"].push_back(std::make_pair("main", VK_SHADER_STAGE_VERTEX_BIT));
    ctx.moduleMap["frag"].push_back(std::make_pair("main", VK_SHADER_STAGE_FRAGMENT_BIT));

    ctx.requiredStages = static_cast<VkShaderStageFlagBits>(VK_SHADER_STAGE_VERTEX_BIT | VK_SHADER_STAGE_FRAGMENT_BIT);
    ctx.failResult     = QP_TEST_RESULT_FAIL;
    ctx.failMessageTemplate = "Output doesn't match with expected";

    return ctx;
}

} // namespace

tcu::TestCaseGroup *createFloatControlsTestGroup(TestContext &testCtx, TestGroupBuilderBase *groupBuilder)
{
    de::MovePtr<TestCaseGroup> group(new TestCaseGroup(testCtx, "float_controls"));

    struct TestGroup
    {
        VariableType variableType;
        const char *groupName;
    };
    TestGroup testGroups[] = {
        {FP16, "fp16"},
        {FP32, "fp32"},
        {FP64, "fp64"},
    };

    for (int i = 0; i < DE_LENGTH_OF_ARRAY(testGroups); ++i)
    {
        const TestGroup &testGroup = testGroups[i];
        TestCaseGroup *typeGroup   = new TestCaseGroup(testCtx, testGroup.groupName);
        group->addChild(typeGroup);

        groupBuilder->createOperationTests(typeGroup, "input_args", testGroup.variableType, true);
        groupBuilder->createOperationTests(typeGroup, "generated_args", testGroup.variableType, false);
    }

    groupBuilder->createSettingsTests(group.get());

    return group.release();
}

tcu::TestCaseGroup *createFloatControlsComputeGroup(TestContext &testCtx)
{
    ComputeTestGroupBuilder computeTestGroupBuilder;
    computeTestGroupBuilder.init();

    return createFloatControlsTestGroup(testCtx, &computeTestGroupBuilder);
}

tcu::TestCaseGroup *createFloatControlsGraphicsGroup(TestContext &testCtx)
{
    GraphicsTestGroupBuilder graphicsTestGroupBuilder;
    graphicsTestGroupBuilder.init();

    return createFloatControlsTestGroup(testCtx, &graphicsTestGroupBuilder);
}

} // namespace SpirVAssembly
} // namespace vkt