Add OpFConvert precision tests

author Ricardo Garcia <rgarcia@igalia.com>

Fri, 11 Oct 2019 12:28:30 +0000 (14:28 +0200)

committer Alexander Galazin <Alexander.Galazin@arm.com>

Fri, 25 Oct 2019 14:45:13 +0000 (10:45 -0400)
author Ricardo Garcia <rgarcia@igalia.com>
Fri, 11 Oct 2019 12:28:30 +0000 (14:28 +0200)
committer Alexander Galazin <Alexander.Galazin@arm.com>
Fri, 25 Oct 2019 14:45:13 +0000 (10:45 -0400)
diff --git a/AndroidGen.mk b/AndroidGen.mk

index 8e5c018..ec75627 100644 (file)
--- a/AndroidGen.mk
+++ b/AndroidGen.mk
@@ -268,6 +268,7 @@ LOCAL_SRC_FILES := \
         external/vulkancts/modules/vulkan/shaderexecutor/vktShaderClockTests.cpp \
         external/vulkancts/modules/vulkan/shaderexecutor/vktShaderCommonFunctionTests.cpp \
         external/vulkancts/modules/vulkan/shaderexecutor/vktShaderExecutor.cpp \
+       external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.cpp \
         external/vulkancts/modules/vulkan/shaderexecutor/vktShaderIntegerFunctionTests.cpp \
         external/vulkancts/modules/vulkan/shaderexecutor/vktShaderPackingFunctionTests.cpp \
         external/vulkancts/modules/vulkan/shaderrender/vktShaderRender.cpp \
diff --git a/android/cts/master/vk-master.txt b/android/cts/master/vk-master.txt

index a77b7b9..ab242c4 100644 (file)
--- a/android/cts/master/vk-master.txt
+++ b/android/cts/master/vk-master.txt
@@ -314198,6 +314198,30 @@ dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.scalar
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec2
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec3
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec4
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_4
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1d
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1darray
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1darrayshadow
diff --git a/external/vulkancts/modules/vulkan/image/vktImageTranscodingSupportTests.cpp b/external/vulkancts/modules/vulkan/image/vktImageTranscodingSupportTests.cpp

index 1139bd3..9e8095c 100644 (file)
--- a/external/vulkancts/modules/vulkan/image/vktImageTranscodingSupportTests.cpp
+++ b/external/vulkancts/modules/vulkan/image/vktImageTranscodingSupportTests.cpp
@@ -122,35 +122,18 @@ BasicTranscodingTestInstance::BasicTranscodingTestInstance (Context& context, co
  {
  }
  
-// The templated functions below work with specializations of tcu::Float as class T. See "tcuFloat.hpp".
-
-// Return smallest floating point normal value preserving the existing sign bit.
-// The smallest normal value has the mantissa bits zeroed out and 1 as the exponent (tough constructBits() expects something else).
-template <class T>
-inline T SmallestFloat (T value)
-{
-       return T::constructBits(value.sign(), -(T::EXPONENT_BIAS - 1), typename T::StorageType(0u));
-}
-
-// Return the largest floating point normal value preserving the existing sign bit.
-// The largest normal value has the mantissa bits all set to 1 and the exponent set to the largest even value (see constructBits() for the details).
-template <class T>
-inline T LargestFloat (T value)
-{
-       return T::constructBits(value.sign(), T::EXPONENT_BIAS, typename T::StorageType((1<<T::MANTISSA_BITS)-1));
-}
-
  // Replace Infs and NaNs with the largest normal value.
  // Replace denormal numbers with the smallest normal value.
  // Leave the rest untouched.
+// T is a tcu::Float specialization.
  template <class T>
  void fixFloatIfNeeded(deUint8* ptr_)
  {
         T* ptr = reinterpret_cast<T*>(ptr_);
         if (ptr->isInf() || ptr->isNaN())
-               *ptr = LargestFloat<T>(*ptr);
+               *ptr = T::largestNormal(ptr->sign());
         else if (ptr->isDenorm())
-               *ptr = SmallestFloat<T>(*ptr);
+               *ptr = T::smallestNormal(ptr->sign());
  }
  
  void BasicTranscodingTestInstance::generateData (deUint8* toFill, size_t size, const VkFormat format)
diff --git a/external/vulkancts/modules/vulkan/shaderexecutor/CMakeLists.txt b/external/vulkancts/modules/vulkan/shaderexecutor/CMakeLists.txt

index 6ef8eb4..015b0b5 100644 (file)
--- a/external/vulkancts/modules/vulkan/shaderexecutor/CMakeLists.txt
+++ b/external/vulkancts/modules/vulkan/shaderexecutor/CMakeLists.txt
@@ -7,6 +7,8 @@ set(DEQP_VK_SHADEREXECUTOR_SRCS
         vktShaderBuiltinTests.hpp
         vktShaderCommonFunctionTests.cpp
         vktShaderCommonFunctionTests.hpp
+       vktShaderFConvertTests.cpp
+       vktShaderFConvertTests.hpp
         vktShaderIntegerFunctionTests.cpp
         vktShaderIntegerFunctionTests.hpp
         vktShaderPackingFunctionTests.cpp
diff --git a/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderBuiltinTests.cpp b/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderBuiltinTests.cpp

index c1f98b2..0a1a4c6 100644 (file)
--- a/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderBuiltinTests.cpp
+++ b/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderBuiltinTests.cpp
@@ -31,6 +31,7 @@
  #include "vktShaderCommonFunctionTests.hpp"
  #include "vktShaderIntegerFunctionTests.hpp"
  #include "vktShaderPackingFunctionTests.hpp"
+#include "vktShaderFConvertTests.hpp"
  
  namespace vkt
  {
@@ -50,6 +51,7 @@ tcu::TestCaseGroup* createBuiltinTests (tcu::TestContext& testCtx)
         builtinTests->addChild(new BuiltinPrecisionTests(testCtx));
         builtinTests->addChild(new BuiltinPrecision16BitTests(testCtx));
         builtinTests->addChild(new BuiltinPrecision16Storage32BitTests(testCtx));
+       builtinTests->addChild(createPrecisionFconvertGroup(testCtx));
  
         return builtinTests.release();
  }
diff --git a/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.cpp b/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.cpp

new file mode 100644 (file)

index 0000000..f577c66
--- /dev/null
+++ b/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.cpp
@@ -0,0 +1,947 @@
+/*------------------------------------------------------------------------
+ * Vulkan Conformance Tests
+ * ------------------------
+ *
+ * Copyright (c) 2019 Valve Corporation.
+ * Copyright (c) 2019 The Khronos Group Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ *
+ *//*!
+ * \file
+ * \brief OpFConvert tests.
+ *//*--------------------------------------------------------------------*/
+
+#include "vktShaderFConvertTests.hpp"
+#include "vktTestCase.hpp"
+
+#include "vkBufferWithMemory.hpp"
+#include "vkObjUtil.hpp"
+#include "vkBuilderUtil.hpp"
+#include "vkCmdUtil.hpp"
+#include "vkPrograms.hpp"
+
+#include "deDefs.hpp"
+#include "deRandom.hpp"
+
+#include "tcuFloat.hpp"
+#include "tcuTestLog.hpp"
+#include "tcuFormatUtil.hpp"
+
+#include <vector>
+#include <iterator>
+#include <algorithm>
+#include <memory>
+#include <sstream>
+#include <iomanip>
+#include <string>
+#include <limits>
+
+namespace vkt
+{
+namespace shaderexecutor
+{
+
+namespace
+{
+
+constexpr deUint32     kRandomSeed                                                             = 0xdeadbeef;
+constexpr size_t       kRandomSourcesPerType                                   = 240;
+constexpr size_t       kMinVectorLength                                                = 1;
+constexpr size_t       kMaxVectorLength                                                = 4;
+constexpr size_t       kArrayAlignment                                                 = 16;                                   // Bytes.
+constexpr size_t       kEffectiveLength[kMaxVectorLength + 1]  = { 0, 1, 2, 4, 4 };    // Effective length of a vector of size i.
+constexpr size_t       kGCFNumFloats                                                   = 12;                                   // Greatest Common Factor of the number of floats in a test.
+
+// Get a random normal number.
+// Works for implementations of tcu::Float as T.
+template <class T>
+T getRandomNormal (de::Random& rnd)
+{
+       static constexpr typename T::StorageType        kLeadingMantissaBit     = (static_cast<typename T::StorageType>(1) << T::MANTISSA_BITS);
+       static constexpr int                                            kSignValues[]           = { -1, 1 };
+
+       int                                             signBit         = rnd.getInt(0, 1);
+       int                                             exponent        = rnd.getInt(1 - T::EXPONENT_BIAS, T::EXPONENT_BIAS + 1);
+       typename T::StorageType mantissa        = static_cast<typename T::StorageType>(rnd.getUint64() & static_cast<deUint64>(kLeadingMantissaBit - 1));
+
+       // Construct number.
+       return T::construct(kSignValues[signBit], exponent, (kLeadingMantissaBit | mantissa));
+}
+
+// Get a list of hand-picked interesting samples for tcu::Float class T.
+template <class T>
+const std::vector<T>& interestingSamples ()
+{
+       static const std::vector<T> samples =
+       {
+               T::zero                         (-1),
+               T::zero                         ( 1),
+               //T::inf                                (-1),
+               //T::inf                                ( 1),
+               //T::nan                                (  ),
+               T::largestNormal        (-1),
+               T::largestNormal        ( 1),
+               T::smallestNormal       (-1),
+               T::smallestNormal       ( 1),
+       };
+
+       return samples;
+}
+
+// Get some random interesting numbers.
+// Works for implementations of tcu::Float as T.
+template <class T>
+std::vector<T> getRandomInteresting (de::Random& rnd, size_t numSamples)
+{
+       auto&                   samples = interestingSamples<T>();
+       std::vector<T>  result;
+
+       result.reserve(numSamples);
+       std::generate_n(std::back_inserter(result), numSamples, [&rnd, &samples]() { return rnd.choose<T>(begin(samples), end(samples)); });
+
+       return result;
+}
+
+// Helper class to build each vector only once in a thread-safe way.
+template <class T>
+struct StaticVectorHelper
+{
+       std::vector<T> v;
+
+       StaticVectorHelper (de::Random& rnd)
+       {
+               v.reserve(kRandomSourcesPerType);
+               for (size_t i = 0; i < kRandomSourcesPerType; ++i)
+                       v.push_back(getRandomNormal<T>(rnd));
+       }
+};
+
+// Get a list of random normal input values for type T.
+template <class T>
+const std::vector<T>& getRandomNormals (de::Random& rnd)
+{
+       static StaticVectorHelper<T> helper(rnd);
+       return helper.v;
+}
+
+// Convert a vector of tcu::Float elements of type T1 to type T2.
+template <class T1, class T2>
+std::vector<T2> convertVector (const std::vector<T1>& orig)
+{
+       std::vector<T2> result;
+       result.reserve(orig.size());
+
+       std::transform(begin(orig), end(orig), std::back_inserter(result),
+               [](T1 f) { return T2::convert(f); });
+
+       return result;
+}
+
+// Get converted normal values for other tcu::Float types smaller than T, which should be exact conversions when converting back to
+// those types.
+template <class T>
+std::vector<T> getOtherNormals (de::Random& rnd);
+
+template<>
+std::vector<tcu::Float16> getOtherNormals<tcu::Float16> (de::Random&)
+{
+       // Nothing below tcu::Float16.
+       return std::vector<tcu::Float16>();
+}
+
+template<>
+std::vector<tcu::Float32> getOtherNormals<tcu::Float32> (de::Random& rnd)
+{
+       // The ones from tcu::Float16.
+       return convertVector<tcu::Float16, tcu::Float32>(getRandomNormals<tcu::Float16>(rnd));
+}
+
+template<>
+std::vector<tcu::Float64> getOtherNormals<tcu::Float64> (de::Random& rnd)
+{
+       // The ones from both tcu::Float16 and tcu::Float64.
+       auto v1 = convertVector<tcu::Float16, tcu::Float64>(getRandomNormals<tcu::Float16>(rnd));
+       auto v2 = convertVector<tcu::Float32, tcu::Float64>(getRandomNormals<tcu::Float32>(rnd));
+
+       v1.reserve(v1.size() + v2.size());
+       std::copy(begin(v2), end(v2), std::back_inserter(v1));
+       return v1;
+}
+
+// Get the full list of input values for type T.
+template <class T>
+std::vector<T> getInputValues (de::Random& rnd)
+{
+       auto&   interesting             = interestingSamples<T>();
+       auto&   normals                 = getRandomNormals<T>(rnd);
+       auto    otherNormals    = getOtherNormals<T>(rnd);
+
+       const size_t numValues          = interesting.size() + normals.size() + otherNormals.size();
+       const size_t extraValues        = numValues % kGCFNumFloats;
+       const size_t needed                     = ((extraValues == 0) ? 0 : (kGCFNumFloats - extraValues));
+
+       auto extra = getRandomInteresting<T> (rnd, needed);
+
+       std::vector<T> values;
+       values.reserve(interesting.size() + normals.size() + otherNormals.size() + extra.size());
+
+       std::copy(begin(interesting),   end(interesting),       std::back_inserter(values));
+       std::copy(begin(normals),               end(normals),           std::back_inserter(values));
+       std::copy(begin(otherNormals),  end(otherNormals),      std::back_inserter(values));
+       std::copy(begin(extra),                 end(extra),                     std::back_inserter(values));
+
+       // Shuffle samples around a bit to make it more interesting.
+       rnd.shuffle(begin(values), end(values));
+
+       return values;
+}
+
+// This singleton makes sure generated samples are stable no matter the test order.
+class InputGenerator
+{
+public:
+       static const InputGenerator& getInstance ()
+       {
+               static InputGenerator instance;
+               return instance;
+       }
+
+       const std::vector<tcu::Float16>& getInputValues16 () const
+       {
+               return m_values16;
+       }
+
+       const std::vector<tcu::Float32>& getInputValues32 () const
+       {
+               return m_values32;
+       }
+
+       const std::vector<tcu::Float64>& getInputValues64 () const
+       {
+               return m_values64;
+       }
+
+private:
+       InputGenerator ()
+               : m_rnd(kRandomSeed)
+               , m_values16(getInputValues<tcu::Float16>(m_rnd))
+               , m_values32(getInputValues<tcu::Float32>(m_rnd))
+               , m_values64(getInputValues<tcu::Float64>(m_rnd))
+       {
+       }
+
+       // Cannot copy or assign.
+       InputGenerator(const InputGenerator&)                           = delete;
+       InputGenerator& operator=(const InputGenerator&)        = delete;
+
+       de::Random                                      m_rnd;
+       std::vector<tcu::Float16>       m_values16;
+       std::vector<tcu::Float32>       m_values32;
+       std::vector<tcu::Float64>       m_values64;
+};
+
+// Check single result is as expected.
+// Works for implementations of tcu::Float as T1 and T2.
+template <class T1, class T2>
+bool validConversion (const T1& orig, const T2& result)
+{
+       const T2        acceptedResults[]       = { T2::convert(orig, tcu::ROUND_DOWNWARD), T2::convert(orig, tcu::ROUND_UPWARD) };
+       bool            valid                           = false;
+
+       for (const auto& validResult : acceptedResults)
+       {
+               if (validResult.isNaN() && result.isNaN())
+                       valid = true;
+               else if (validResult.isInf() && result.isInf())
+                       valid = true;
+               else if (validResult.isZero() && result.isZero())
+                       valid = true;
+               else if (validResult.isDenorm() && (result.isDenorm() || result.isZero()))
+                       valid = true;
+               else if (validResult.bits() == result.bits()) // Exact conversion, up or down.
+                       valid = true;
+       }
+
+       return valid;
+}
+
+// Check results vector is as expected.
+template <class T1, class T2>
+bool validConversion (const std::vector<T1>& orig, const std::vector<T2>& converted, tcu::TestLog& log)
+{
+       DE_ASSERT(orig.size() == converted.size());
+
+       bool allValid = true;
+
+       for (size_t i = 0; i < orig.size(); ++i)
+       {
+               const bool valid = validConversion(orig[i], converted[i]);
+
+               {
+                       const double origD = orig[i].asDouble();
+                       const double convD = converted[i].asDouble();
+
+                       std::ostringstream msg;
+                       msg << "[" << i << "] "
+                               << std::setprecision(std::numeric_limits<double>::digits10 + 2) << std::scientific
+                               << origD << " converted to " << convD << ": " << (valid ? "OK" : "FAILURE");
+
+                       log << tcu::TestLog::Message << msg.str() << tcu::TestLog::EndMessage;
+               }
+
+               if (!valid)
+                       allValid = false;
+       }
+
+       return allValid;
+}
+
+// Helps calculate buffer sizes and other parameters for the given number of values and vector length using a given floating point
+// type. This is mostly used in packFloats() below, but we also need this information in the iterate() method for the test instance,
+// so it has been separated.
+struct BufferSizeInfo
+{
+       template <class T>
+       static BufferSizeInfo calculate (size_t numValues_, size_t vectorLength_)
+       {
+               // The vector length must be a known number.
+               DE_ASSERT(vectorLength_ >= kMinVectorLength && vectorLength_ <= kMaxVectorLength);
+               // The number of values must be appropriate for the vector length.
+               DE_ASSERT(numValues_ % vectorLength_ == 0);
+
+               BufferSizeInfo info;
+
+               info.numValues          = numValues_;
+               info.vectorLength       = vectorLength_;
+               info.totalVectors       = numValues_ / vectorLength_;
+
+               const size_t elementSize                = sizeof(typename T::StorageType);
+               const size_t effectiveLength    = kEffectiveLength[vectorLength_];
+               const size_t vectorSize                 = elementSize * effectiveLength;
+               const size_t extraBytes                 = vectorSize % kArrayAlignment;
+
+               info.vectorStrideBytes  = vectorSize + ((extraBytes == 0) ? 0 : (kArrayAlignment - extraBytes));
+               info.memorySizeBytes    = info.vectorStrideBytes * info.totalVectors;
+
+               return info;
+       }
+
+       size_t numValues;
+       size_t vectorLength;
+       size_t totalVectors;
+       size_t vectorStrideBytes;
+       size_t memorySizeBytes;
+};
+
+// Pack an array of tcu::Float values into a buffer to be read from a shader, as if it was an array of vectors with each vector
+// having size vectorLength (e.g. 3 for a vec3). Note: assumes std140.
+template <class T>
+std::vector<deUint8> packFloats (const std::vector<T>& values, size_t vectorLength)
+{
+       BufferSizeInfo sizeInfo = BufferSizeInfo::calculate<T>(values.size(), vectorLength);
+
+       std::vector<deUint8> memory(sizeInfo.memorySizeBytes);
+       for (size_t i = 0; i < sizeInfo.totalVectors; ++i)
+       {
+               T* vectorPtr = reinterpret_cast<T*>(memory.data() + sizeInfo.vectorStrideBytes * i);
+               for (size_t j = 0; j < vectorLength; ++j)
+                       vectorPtr[j] = values[i*vectorLength + j];
+       }
+
+       return memory;
+}
+
+// Unpack an array of vectors into an array of values, undoing what packFloats would do.
+// expectedNumValues is used for verification.
+template <class T>
+std::vector<T> unpackFloats (const std::vector<deUint8>& memory, size_t vectorLength, size_t expectedNumValues)
+{
+       DE_ASSERT(vectorLength >= kMinVectorLength && vectorLength <= kMaxVectorLength);
+
+       const size_t effectiveLength    = kEffectiveLength[vectorLength];
+       const size_t elementSize                = sizeof(typename T::StorageType);
+       const size_t vectorSize                 = elementSize * effectiveLength;
+       const size_t extraBytes                 = vectorSize % kArrayAlignment;
+       const size_t vectorBlockSize    = vectorSize + ((extraBytes == 0) ? 0 : (kArrayAlignment - extraBytes));
+
+       DE_ASSERT(memory.size() % vectorBlockSize == 0);
+       const size_t numStoredVectors   = memory.size() / vectorBlockSize;
+       const size_t numStoredValues    = numStoredVectors * vectorLength;
+
+       DE_UNREF(expectedNumValues); // For release builds.
+       DE_ASSERT(numStoredValues == expectedNumValues);
+       std::vector<T> values;
+       values.reserve(numStoredValues);
+
+       for (size_t i = 0; i < numStoredVectors; ++i)
+       {
+               const T* vectorPtr = reinterpret_cast<const T*>(memory.data() + vectorBlockSize * i);
+               for (size_t j = 0; j < vectorLength; ++j)
+                       values.push_back(vectorPtr[j]);
+       }
+
+       return values;
+}
+
+enum FloatType
+{
+       FLOAT_TYPE_16_BITS = 0,
+       FLOAT_TYPE_32_BITS,
+       FLOAT_TYPE_64_BITS,
+       FLOAT_TYPE_MAX_ENUM,
+};
+
+static const char* const kFloatNames[FLOAT_TYPE_MAX_ENUM] =
+{
+       "f16",
+       "f32",
+       "f64",
+};
+
+static const char* const kGLSLTypes[][kMaxVectorLength + 1] =
+{
+       { nullptr, "float16_t", "f16vec2",      "f16vec3",      "f16vec4"       },
+       { nullptr, "float",             "vec2",         "vec3",         "vec4"          },
+       { nullptr, "double",    "dvec2",        "dvec3",        "dvec4"         },
+};
+
+struct TestParams
+{
+       FloatType       from;
+       FloatType       to;
+       size_t          vectorLength;
+
+       std::string     getInputTypeStr         () const
+       {
+               DE_ASSERT(from >= 0 && from < FLOAT_TYPE_MAX_ENUM);
+               DE_ASSERT(vectorLength >= kMinVectorLength && vectorLength <= kMaxVectorLength);
+               return kGLSLTypes[from][vectorLength];
+       }
+
+       std::string getOutputTypeStr    () const
+       {
+               DE_ASSERT(to >= 0 && to < FLOAT_TYPE_MAX_ENUM);
+               DE_ASSERT(vectorLength >= kMinVectorLength && vectorLength <= kMaxVectorLength);
+               return kGLSLTypes[to][vectorLength];
+       }
+};
+
+class FConvertTestInstance : public TestInstance
+{
+public:
+                                                       FConvertTestInstance    (Context& context, const TestParams& params)
+                                                               : TestInstance(context)
+                                                               , m_params(params)
+                                                               {}
+
+       virtual tcu::TestStatus iterate                                 (void);
+
+private:
+       TestParams      m_params;
+};
+
+class FConvertTestCase : public TestCase
+{
+public:
+                                                               FConvertTestCase        (tcu::TestContext& context, const std::string& name, const std::string& desc, const TestParams& params)
+                                                                       : TestCase      (context, name, desc)
+                                                                       , m_params      (params)
+                                                                       {}
+
+                                                               ~FConvertTestCase       (void) {}
+       virtual TestInstance*           createInstance          (Context& context) const { return new FConvertTestInstance(context, m_params); }
+       virtual void                            initPrograms            (vk::SourceCollections& programCollection) const;
+       virtual void                            checkSupport            (Context& context) const;
+
+private:
+       TestParams      m_params;
+};
+
+void FConvertTestCase::initPrograms (vk::SourceCollections& programCollection) const
+{
+       const std::string               inputType               = m_params.getInputTypeStr();
+       const std::string               outputType              = m_params.getOutputTypeStr();
+       const InputGenerator&   inputGenerator  = InputGenerator::getInstance();
+
+       size_t numValues = 0;
+       switch (m_params.from)
+       {
+       case FLOAT_TYPE_16_BITS:
+               numValues = inputGenerator.getInputValues16().size();
+               break;
+       case FLOAT_TYPE_32_BITS:
+               numValues = inputGenerator.getInputValues32().size();
+               break;
+       case FLOAT_TYPE_64_BITS:
+               numValues = inputGenerator.getInputValues64().size();
+               break;
+       default:
+               DE_ASSERT(false);
+               break;
+       }
+
+       const size_t arraySize = numValues / m_params.vectorLength;
+
+       std::ostringstream shader;
+
+       shader
+               << "#version 450 core\n"
+               << ((m_params.from == FLOAT_TYPE_16_BITS || m_params.to == FLOAT_TYPE_16_BITS) ?
+                       "#extension GL_EXT_shader_16bit_storage: require\n"                                     // This is needed to use 16-bit float types in buffers.
+                       "#extension GL_EXT_shader_explicit_arithmetic_types: require\n"         // This is needed for some conversions.
+                       : "")
+               << "layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in;\n"
+               << "layout(set = 0, binding = 0, std140) buffer issbodef { " << inputType << " val[" << arraySize << "]; } issbo;\n"
+               << "layout(set = 0, binding = 1, std140) buffer ossbodef { " << outputType << " val[" << arraySize << "]; } ossbo;\n"
+               << "void main()\n"
+               << "{\n"
+               << "    ossbo.val[gl_WorkGroupID.x] = " << outputType << "(issbo.val[gl_WorkGroupID.x]);\n"
+               << "}\n";
+
+       programCollection.glslSources.add("comp") << glu::ComputeSource(shader.str());
+}
+
+void FConvertTestCase::checkSupport (Context& context) const
+{
+       if (m_params.from == FLOAT_TYPE_64_BITS || m_params.to == FLOAT_TYPE_64_BITS)
+       {
+               // Check for 64-bit float support.
+               auto features = context.getDeviceFeatures();
+               if (!features.shaderFloat64)
+                       TCU_THROW(NotSupportedError, "64-bit floats not supported in shader code");
+       }
+
+       if (m_params.from == FLOAT_TYPE_16_BITS || m_params.to == FLOAT_TYPE_16_BITS)
+       {
+               // Check for 16-bit float support.
+               auto& features16 = context.getShaderFloat16Int8Features();
+               if (!features16.shaderFloat16)
+                       TCU_THROW(NotSupportedError, "16-bit floats not supported in shader code");
+
+               auto& storage16 = context.get16BitStorageFeatures();
+               if (!storage16.storageBuffer16BitAccess)
+                       TCU_THROW(NotSupportedError, "16-bit floats not supported for storage buffers");
+       }
+}
+
+tcu::TestStatus FConvertTestInstance::iterate (void)
+{
+       BufferSizeInfo                  inputBufferSizeInfo;
+       BufferSizeInfo                  outputBufferSizeInfo;
+       std::vector<deUint8>    inputMemory;
+
+       // Calculate buffer sizes and convert input values to a packed input memory format, depending on the input and output types.
+       switch (m_params.from)
+       {
+       case FLOAT_TYPE_16_BITS:
+               {
+                       auto& inputValues = InputGenerator::getInstance().getInputValues16();
+                       inputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float16>(inputValues.size(), m_params.vectorLength);
+                       switch (m_params.to)
+                       {
+                       case FLOAT_TYPE_32_BITS:
+                               outputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float32>(inputValues.size(), m_params.vectorLength);
+                               break;
+                       case FLOAT_TYPE_64_BITS:
+                               outputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float64>(inputValues.size(), m_params.vectorLength);
+                               break;
+                       default:
+                               DE_ASSERT(false);
+                               break;
+                       }
+                       inputMemory = packFloats(inputValues, m_params.vectorLength);
+               }
+               break;
+
+       case FLOAT_TYPE_32_BITS:
+               {
+                       auto& inputValues = InputGenerator::getInstance().getInputValues32();
+                       inputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float32>(inputValues.size(), m_params.vectorLength);
+                       switch (m_params.to)
+                       {
+                       case FLOAT_TYPE_16_BITS:
+                               outputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float16>(inputValues.size(), m_params.vectorLength);
+                               break;
+                       case FLOAT_TYPE_64_BITS:
+                               outputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float64>(inputValues.size(), m_params.vectorLength);
+                               break;
+                       default:
+                               DE_ASSERT(false);
+                               break;
+                       }
+                       inputMemory = packFloats(inputValues, m_params.vectorLength);
+               }
+               break;
+
+       case FLOAT_TYPE_64_BITS:
+               {
+                       auto& inputValues = InputGenerator::getInstance().getInputValues64();
+                       inputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float64>(inputValues.size(), m_params.vectorLength);
+                       switch (m_params.to)
+                       {
+                       case FLOAT_TYPE_16_BITS:
+                               outputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float16>(inputValues.size(), m_params.vectorLength);
+                               break;
+                       case FLOAT_TYPE_32_BITS:
+                               outputBufferSizeInfo = BufferSizeInfo::calculate<tcu::Float32>(inputValues.size(), m_params.vectorLength);
+                               break;
+                       default:
+                               DE_ASSERT(false);
+                               break;
+                       }
+                       inputMemory = packFloats(inputValues, m_params.vectorLength);
+               }
+               break;
+
+       default:
+               DE_ASSERT(false);
+               break;
+       }
+
+       // Prepare input and output buffers.
+       auto&   vkd                     = m_context.getDeviceInterface();
+       auto    device          = m_context.getDevice();
+       auto&   allocator       = m_context.getDefaultAllocator();
+
+       de::MovePtr<vk::BufferWithMemory> inputBuffer(
+               new vk::BufferWithMemory(vkd, device, allocator,
+                                                                vk::makeBufferCreateInfo(inputBufferSizeInfo.memorySizeBytes, vk::VK_BUFFER_USAGE_STORAGE_BUFFER_BIT),
+                                                                vk::MemoryRequirement::HostVisible)
+       );
+
+       de::MovePtr<vk::BufferWithMemory> outputBuffer(
+               new vk::BufferWithMemory(vkd, device, allocator,
+                                                                vk::makeBufferCreateInfo(outputBufferSizeInfo.memorySizeBytes, vk::VK_BUFFER_USAGE_STORAGE_BUFFER_BIT),
+                                                                vk::MemoryRequirement::HostVisible)
+       );
+
+       // Copy values to input buffer.
+       {
+               auto& alloc = inputBuffer->getAllocation();
+               deMemcpy(reinterpret_cast<deUint8*>(alloc.getHostPtr()) + alloc.getOffset(), inputMemory.data(), inputMemory.size());
+               vk::flushAlloc(vkd, device, alloc);
+       }
+
+       // Create an array with the input and output buffers to make it easier to iterate below.
+       const vk::VkBuffer buffers[] = { inputBuffer->get(), outputBuffer->get() };
+
+       // Create descriptor set layout.
+       std::vector<vk::VkDescriptorSetLayoutBinding> bindings;
+       for (int i = 0; i < DE_LENGTH_OF_ARRAY(buffers); ++i)
+       {
+               const vk::VkDescriptorSetLayoutBinding binding =
+               {
+                       static_cast<deUint32>(i),                                                               // uint32_t              binding;
+                       vk::VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,                                  // VkDescriptorType      descriptorType;
+                       1u,                                                                                                             // uint32_t              descriptorCount;
+                       vk::VK_SHADER_STAGE_COMPUTE_BIT,                                                // VkShaderStageFlags    stageFlags;
+                       DE_NULL,                                                                                                        // const VkSampler*      pImmutableSamplers;
+               };
+               bindings.push_back(binding);
+       }
+
+       const vk::VkDescriptorSetLayoutCreateInfo layoutCreateInfo =
+       {
+               vk::VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO,        // VkStructureType                        sType;
+               DE_NULL,                                                                                                        // const void*                            pNext;
+               0,                                                                                                                      // VkDescriptorSetLayoutCreateFlags       flags;
+               static_cast<deUint32>(bindings.size()),                                         // uint32_t                               bindingCount;
+               bindings.data()                                                                                         // const VkDescriptorSetLayoutBinding*    pBindings;
+       };
+       auto descriptorSetLayout = vk::createDescriptorSetLayout(vkd, device, &layoutCreateInfo);
+
+       // Create descriptor set.
+       vk::DescriptorPoolBuilder poolBuilder;
+       for (const auto& b : bindings)
+               poolBuilder.addType(b.descriptorType, 1u);
+       auto descriptorPool = poolBuilder.build(vkd, device, vk::VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT, 1u);
+
+       const vk::VkDescriptorSetAllocateInfo allocateInfo =
+       {
+               vk::VK_STRUCTURE_TYPE_DESCRIPTOR_SET_ALLOCATE_INFO,     // VkStructureType                 sType;
+               DE_NULL,                                                                                        // const void*                     pNext;
+               *descriptorPool,                                                                        // VkDescriptorPool                descriptorPool;
+               1u,                                                                                                     // uint32_t                        descriptorSetCount;
+               &descriptorSetLayout.get()                                                      // const VkDescriptorSetLayout*    pSetLayouts;
+       };
+       auto descriptorSet = vk::allocateDescriptorSet(vkd, device, &allocateInfo);
+
+       // Update descriptor set.
+       std::vector<vk::VkDescriptorBufferInfo> descriptorBufferInfos;
+       std::vector<vk::VkWriteDescriptorSet>   descriptorWrites;
+
+       for (const auto& buffer : buffers)
+       {
+               const vk::VkDescriptorBufferInfo bufferInfo =
+               {
+                       buffer,                 // VkBuffer        buffer;
+                       0u,                             // VkDeviceSize    offset;
+                       VK_WHOLE_SIZE,  // VkDeviceSize    range;
+               };
+               descriptorBufferInfos.push_back(bufferInfo);
+       }
+
+       for (size_t i = 0; i < bindings.size(); ++i)
+       {
+               const vk::VkWriteDescriptorSet write =
+               {
+                       vk::VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,     // VkStructureType                  sType;
+                       DE_NULL,                                                                        // const void*                      pNext;
+                       *descriptorSet,                                                         // VkDescriptorSet                  dstSet;
+                       static_cast<deUint32>(i),                                       // uint32_t                         dstBinding;
+                       0u,                                                                                     // uint32_t                         dstArrayElement;
+                       1u,                                                                                     // uint32_t                         descriptorCount;
+                       bindings[i].descriptorType,                                     // VkDescriptorType                 descriptorType;
+                       DE_NULL,                                                                        // const VkDescriptorImageInfo*     pImageInfo;
+                       &descriptorBufferInfos[i],                                      // const VkDescriptorBufferInfo*    pBufferInfo;
+                       DE_NULL,                                                                        // const VkBufferView*              pTexelBufferView;
+               };
+               descriptorWrites.push_back(write);
+       }
+       vkd.updateDescriptorSets(device, static_cast<deUint32>(descriptorWrites.size()), descriptorWrites.data(), 0u, DE_NULL);
+
+       // Prepare barriers in advance so data is visible to the shaders and the host.
+       std::vector<vk::VkBufferMemoryBarrier> hostToDevBarriers;
+       std::vector<vk::VkBufferMemoryBarrier> devToHostBarriers;
+       for (int i = 0; i < DE_LENGTH_OF_ARRAY(buffers); ++i)
+       {
+               const vk::VkBufferMemoryBarrier hostToDev =
+               {
+                       vk::VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER,                                            // VkStructureType      sType;
+                       DE_NULL,                                                                                                                        // const void*          pNext;
+                       vk::VK_ACCESS_HOST_WRITE_BIT,                                                                           // VkAccessFlags        srcAccessMask;
+                       (vk::VK_ACCESS_SHADER_READ_BIT | vk::VK_ACCESS_SHADER_WRITE_BIT),       // VkAccessFlags        dstAccessMask;
+                       VK_QUEUE_FAMILY_IGNORED,                                                                                        // deUint32                     srcQueueFamilyIndex;
+                       VK_QUEUE_FAMILY_IGNORED,                                                                                        // deUint32                     dstQueueFamilyIndex;
+                       buffers[i],                                                                                                                     // VkBuffer                     buffer;
+                       0u,                                                                                                                                     // VkDeviceSize         offset;
+                       VK_WHOLE_SIZE,                                                                                                          // VkDeviceSize         size;
+               };
+               hostToDevBarriers.push_back(hostToDev);
+
+               const vk::VkBufferMemoryBarrier devToHost =
+               {
+                       vk::VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER,                                            // VkStructureType      sType;
+                       DE_NULL,                                                                                                                        // const void*          pNext;
+                       vk::VK_ACCESS_SHADER_WRITE_BIT,                                                                         // VkAccessFlags        srcAccessMask;
+                       vk::VK_ACCESS_HOST_READ_BIT,                                                                            // VkAccessFlags        dstAccessMask;
+                       VK_QUEUE_FAMILY_IGNORED,                                                                                        // deUint32                     srcQueueFamilyIndex;
+                       VK_QUEUE_FAMILY_IGNORED,                                                                                        // deUint32                     dstQueueFamilyIndex;
+                       buffers[i],                                                                                                                     // VkBuffer                     buffer;
+                       0u,                                                                                                                                     // VkDeviceSize         offset;
+                       VK_WHOLE_SIZE,                                                                                                          // VkDeviceSize         size;
+               };
+               devToHostBarriers.push_back(devToHost);
+       }
+
+       // Create command pool and command buffer.
+       auto queueFamilyIndex = m_context.getUniversalQueueFamilyIndex();
+
+       const vk::VkCommandPoolCreateInfo cmdPoolCreateInfo =
+       {
+               vk::VK_STRUCTURE_TYPE_COMMAND_POOL_CREATE_INFO, // VkStructureType                              sType;
+               DE_NULL,                                                                                // const void*                                  pNext;
+               vk::VK_COMMAND_POOL_CREATE_TRANSIENT_BIT,               // VkCommandPoolCreateFlags             flags;
+               queueFamilyIndex,                                                               // deUint32                                             queueFamilyIndex;
+       };
+       auto cmdPool = vk::createCommandPool(vkd, device, &cmdPoolCreateInfo);
+
+       const vk::VkCommandBufferAllocateInfo cmdBufferAllocateInfo =
+       {
+               vk::VK_STRUCTURE_TYPE_COMMAND_BUFFER_ALLOCATE_INFO,     // VkStructureType                      sType;
+               DE_NULL,                                                                                        // const void*                          pNext;
+               *cmdPool,                                                                                       // VkCommandPool                        commandPool;
+               vk::VK_COMMAND_BUFFER_LEVEL_PRIMARY,                            // VkCommandBufferLevel         level;
+               1u,                                                                                                     // deUint32                                     commandBufferCount;
+       };
+       auto cmdBuffer = vk::allocateCommandBuffer(vkd, device, &cmdBufferAllocateInfo);
+
+       // Create pipeline layout.
+       const vk::VkPipelineLayoutCreateInfo pipelineLayoutCreateInfo =
+       {
+               vk::VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,      // VkStructureType                                      sType;
+               DE_NULL,                                                                                        // const void*                                          pNext;
+               0,                                                                                                      // VkPipelineLayoutCreateFlags          flags;
+               1u,                                                                                                     // deUint32                                                     setLayoutCount;
+               &descriptorSetLayout.get(),                                                     // const VkDescriptorSetLayout*         pSetLayouts;
+               0u,                                                                                                     // deUint32                                                     pushConstantRangeCount;
+               DE_NULL,                                                                                        // const VkPushConstantRange*           pPushConstantRanges;
+       };
+       auto pipelineLayout = vk::createPipelineLayout(vkd, device, &pipelineLayoutCreateInfo);
+
+       // Create compute pipeline.
+       const vk::Unique<vk::VkShaderModule> shader(vk::createShaderModule(vkd, device, m_context.getBinaryCollection().get("comp"), 0));
+
+       const vk::VkComputePipelineCreateInfo computeCreateInfo =
+       {
+               vk::VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO,     // VkStructureType                    sType;
+               DE_NULL,                                                                                        // const void*                        pNext;
+               0,                                                                                                      // VkPipelineCreateFlags              flags;
+               {                                                                                                       // VkPipelineShaderStageCreateInfo    stage;
+                       vk::VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,        // VkStructureType                     sType;
+                       DE_NULL,                                                                                                        // const void*                         pNext;
+                       0,                                                                                                                      // VkPipelineShaderStageCreateFlags    flags;
+                       vk::VK_SHADER_STAGE_COMPUTE_BIT,                                                        // VkShaderStageFlagBits               stage;
+                       *shader,                                                                                                        // VkShaderModule                      module;
+                       "main",                                                                                                         // const char*                         pName;
+                       DE_NULL,                                                                                                        // const VkSpecializationInfo*         pSpecializationInfo;
+               },
+               *pipelineLayout,                                                                        // VkPipelineLayout                   layout;
+               DE_NULL,                                                                                        // VkPipeline                         basePipelineHandle;
+               0,                                                                                                      // int32_t                            basePipelineIndex;
+       };
+       auto computePipeline = vk::createComputePipeline(vkd, device, DE_NULL, &computeCreateInfo);
+
+       // Run the shader.
+       vk::beginCommandBuffer(vkd, *cmdBuffer);
+               vkd.cmdBindPipeline(*cmdBuffer, vk::VK_PIPELINE_BIND_POINT_COMPUTE, *computePipeline);
+               vkd.cmdBindDescriptorSets(*cmdBuffer, vk::VK_PIPELINE_BIND_POINT_COMPUTE, *pipelineLayout, 0, 1u, &descriptorSet.get(), 0u, DE_NULL);
+               vkd.cmdPipelineBarrier(*cmdBuffer, vk::VK_PIPELINE_STAGE_HOST_BIT, vk::VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, 0, 0u, DE_NULL, static_cast<deUint32>(hostToDevBarriers.size()), hostToDevBarriers.data(), 0u, DE_NULL);
+               vkd.cmdDispatch(*cmdBuffer, static_cast<deUint32>(inputBufferSizeInfo.totalVectors), 1u, 1u);
+               vkd.cmdPipelineBarrier(*cmdBuffer, vk::VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, vk::VK_PIPELINE_STAGE_HOST_BIT, 0, 0u, DE_NULL, static_cast<deUint32>(devToHostBarriers.size()), devToHostBarriers.data(), 0u, DE_NULL);
+       vk::endCommandBuffer(vkd, *cmdBuffer);
+       vk::submitCommandsAndWait(vkd, device, m_context.getUniversalQueue(), *cmdBuffer);
+
+       // Invalidate output allocation.
+       vk::invalidateAlloc(vkd, device, outputBuffer->getAllocation());
+
+       // Copy output buffer data.
+       std::vector<deUint8> outputMemory(outputBufferSizeInfo.memorySizeBytes);
+       {
+               auto& alloc = outputBuffer->getAllocation();
+               deMemcpy(outputMemory.data(), reinterpret_cast<deUint8*>(alloc.getHostPtr()) + alloc.getOffset(), outputBufferSizeInfo.memorySizeBytes);
+       }
+
+       // Unpack and verify output data.
+       auto& testLog = m_context.getTestContext().getLog();
+       bool conversionOk = false;
+       switch (m_params.to)
+       {
+       case FLOAT_TYPE_16_BITS:
+               {
+                       auto outputValues = unpackFloats<tcu::Float16>(outputMemory, m_params.vectorLength, inputBufferSizeInfo.numValues);
+                       switch (m_params.from)
+                       {
+                       case FLOAT_TYPE_32_BITS:
+                               {
+                                       auto& inputValues = InputGenerator::getInstance().getInputValues32();
+                                       conversionOk = validConversion(inputValues, outputValues, testLog);
+                               }
+                               break;
+
+                       case FLOAT_TYPE_64_BITS:
+                               {
+                                       auto& inputValues = InputGenerator::getInstance().getInputValues64();
+                                       conversionOk = validConversion(inputValues, outputValues, testLog);
+                               }
+                               break;
+
+                       default:
+                               DE_ASSERT(false);
+                               break;
+                       }
+               }
+               break;
+
+       case FLOAT_TYPE_32_BITS:
+               {
+                       auto outputValues = unpackFloats<tcu::Float32>(outputMemory, m_params.vectorLength, inputBufferSizeInfo.numValues);
+                       switch (m_params.from)
+                       {
+                       case FLOAT_TYPE_16_BITS:
+                               {
+                                       auto& inputValues = InputGenerator::getInstance().getInputValues16();
+                                       conversionOk = validConversion(inputValues, outputValues, testLog);
+                               }
+                               break;
+
+                       case FLOAT_TYPE_64_BITS:
+                               {
+                                       auto& inputValues = InputGenerator::getInstance().getInputValues64();
+                                       conversionOk = validConversion(inputValues, outputValues, testLog);
+                               }
+                               break;
+
+                       default:
+                               DE_ASSERT(false);
+                               break;
+                       }
+               }
+               break;
+
+       case FLOAT_TYPE_64_BITS:
+               {
+                       auto outputValues = unpackFloats<tcu::Float64>(outputMemory, m_params.vectorLength, inputBufferSizeInfo.numValues);
+                       switch (m_params.from)
+                       {
+                       case FLOAT_TYPE_16_BITS:
+                               {
+                                       auto& inputValues = InputGenerator::getInstance().getInputValues16();
+                                       conversionOk = validConversion(inputValues, outputValues, testLog);
+                               }
+                               break;
+
+                       case FLOAT_TYPE_32_BITS:
+                               {
+                                       auto& inputValues = InputGenerator::getInstance().getInputValues32();
+                                       conversionOk = validConversion(inputValues, outputValues, testLog);
+                               }
+                               break;
+
+                       default:
+                               DE_ASSERT(false);
+                               break;
+                       }
+               }
+               break;
+
+       default:
+               DE_ASSERT(false);
+               break;
+       }
+
+       return (conversionOk ? tcu::TestStatus::pass("Pass") : tcu::TestStatus::fail("Fail"));
+}
+
+} // anonymous
+
+tcu::TestCaseGroup*    createPrecisionFconvertGroup (tcu::TestContext& testCtx)
+{
+       tcu::TestCaseGroup* newGroup = new tcu::TestCaseGroup(testCtx, "precision_fconvert", "OpFConvert precision tests");
+
+       for (int i = 0; i < FLOAT_TYPE_MAX_ENUM; ++i)
+       for (int j = 0; j < FLOAT_TYPE_MAX_ENUM; ++j)
+       for (size_t k = kMinVectorLength; k <= kMaxVectorLength; ++k)
+       {
+               // No actual conversion if the types are the same.
+               if (i == j)
+                       continue;
+
+               TestParams params = {
+                       static_cast<FloatType>(i),
+                       static_cast<FloatType>(j),
+                       k,
+               };
+
+               std::string testName = std::string() + kFloatNames[i] + "_to_" + kFloatNames[j] + "_size_" + std::to_string(k);
+               std::string testDescription = std::string("Conversion from ") + kFloatNames[i] + " to " + kFloatNames[j] + " with vectors of size " + std::to_string(k);
+
+               newGroup->addChild(new FConvertTestCase(testCtx, testName, testDescription, params));
+       }
+
+       return newGroup;
+}
+
+} // shaderexecutor
+} // vkt
diff --git a/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.hpp b/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.hpp

new file mode 100644 (file)

index 0000000..7c13e6e
--- /dev/null
+++ b/external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.hpp
@@ -0,0 +1,40 @@
+#ifndef _VKTSHADERFCONVERTTESTS_HPP
+#define _VKTSHADERFCONVERTTESTS_HPP
+/*------------------------------------------------------------------------
+ * Vulkan Conformance Tests
+ * ------------------------
+ *
+ * Copyright (c) 2019 Valve Corporation.
+ * Copyright (c) 2019 The Khronos Group Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ *
+ *//*!
+ * \file
+ * \brief OpFConvert tests.
+ *//*--------------------------------------------------------------------*/
+
+#include "tcuDefs.hpp"
+#include "tcuTestCase.hpp"
+
+namespace vkt
+{
+namespace shaderexecutor
+{
+
+tcu::TestCaseGroup*    createPrecisionFconvertGroup (tcu::TestContext& testCtx);
+
+} // shaderexecutor
+} // vkt
+
+#endif // _VKTSHADERFCONVERTTESTS_HPP
diff --git a/external/vulkancts/mustpass/master/vk-default-no-waivers.txt b/external/vulkancts/mustpass/master/vk-default-no-waivers.txt

index 1eda30e..dc158ec 100644 (file)
--- a/external/vulkancts/mustpass/master/vk-default-no-waivers.txt
+++ b/external/vulkancts/mustpass/master/vk-default-no-waivers.txt
@@ -314213,6 +314213,30 @@ dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.scalar
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec2
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec3
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec4
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_4
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1d
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1darray
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1darrayshadow
diff --git a/external/vulkancts/mustpass/master/vk-default.txt b/external/vulkancts/mustpass/master/vk-default.txt

index 42d359e..4a05237 100644 (file)
--- a/external/vulkancts/mustpass/master/vk-default.txt
+++ b/external/vulkancts/mustpass/master/vk-default.txt
@@ -314175,6 +314175,30 @@ dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.scalar
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec2
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec3
  dEQP-VK.glsl.builtin.precision_fp16_storage32b.fma.compute.vec4
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f32_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f16_to_f64_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f16_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f32_to_f64_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f16_size_4
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_1
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_2
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_3
+dEQP-VK.glsl.builtin.precision_fconvert.f64_to_f32_size_4
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1d
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1darray
  dEQP-VK.glsl.opaque_type_indexing.sampler.const_literal.vertex.sampler1darrayshadow
diff --git a/framework/common/tcuFloat.hpp b/framework/common/tcuFloat.hpp

index eb1c9c1..1b46e17 100644 (file)
--- a/framework/common/tcuFloat.hpp
+++ b/framework/common/tcuFloat.hpp
@@ -37,6 +37,13 @@ enum FloatFlags
         FLOAT_SUPPORT_DENORM    = (1<<1)
  };
  
+enum RoundingDirection
+{
+       ROUND_TO_EVEN = 0,
+       ROUND_DOWNWARD,         // Towards -Inf.
+       ROUND_UPWARD,           // Towards +Inf.
+};
+
  /*--------------------------------------------------------------------*//*!
   * \brief Floating-point format template
   *
@@ -60,13 +67,13 @@ public:
  
                                                         Float                   (void);
         explicit                                Float                   (StorageType value);
-       explicit                                Float                   (float v);
-       explicit                                Float                   (double v);
+       explicit                                Float                   (float v, RoundingDirection rd = ROUND_TO_EVEN);
+       explicit                                Float                   (double v, RoundingDirection rd = ROUND_TO_EVEN);
  
         template <typename OtherStorageType, int OtherExponentBits, int OtherMantissaBits, int OtherExponentBias, deUint32 OtherFlags>
-       static Float                    convert                 (const Float<OtherStorageType, OtherExponentBits, OtherMantissaBits, OtherExponentBias, OtherFlags>& src);
+       static Float                    convert                 (const Float<OtherStorageType, OtherExponentBits, OtherMantissaBits, OtherExponentBias, OtherFlags>& src, RoundingDirection rd = ROUND_TO_EVEN);
  
-       static inline Float             convert                 (const Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>& src) { return src; }
+       static inline Float             convert                 (const Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>& src, RoundingDirection = ROUND_TO_EVEN) { return src; }
  
         /*--------------------------------------------------------------------*//*!
          * \brief Construct floating point value
@@ -123,6 +130,9 @@ public:
         static Float                    inf                             (int sign);
         static Float                    nan                             (void);
  
+       static Float                    largestNormal   (int sign);
+       static Float                    smallestNormal  (int sign);
+
  private:
         StorageType                             m_value;
  } DE_WARN_UNUSED_TYPE;
@@ -147,21 +157,21 @@ inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::Floa
  }
  
  template <typename StorageType, int ExponentBits, int MantissaBits, int ExponentBias, deUint32 Flags>
-inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::Float (float value)
+inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::Float (float value, RoundingDirection rd)
         : m_value(0)
  {
         deUint32 u32;
         memcpy(&u32, &value, sizeof(deUint32));
-       *this = convert(Float32(u32));
+       *this = convert(Float32(u32), rd);
  }
  
  template <typename StorageType, int ExponentBits, int MantissaBits, int ExponentBias, deUint32 Flags>
-inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::Float (double value)
+inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::Float (double value, RoundingDirection rd)
         : m_value(0)
  {
         deUint64 u64;
         memcpy(&u64, &value, sizeof(deUint64));
-       *this = convert(Float64(u64));
+       *this = convert(Float64(u64), rd);
  }
  
  template <typename StorageType, int ExponentBits, int MantissaBits, int ExponentBias, deUint32 Flags>
@@ -203,6 +213,20 @@ inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags> Float
  }
  
  template <typename StorageType, int ExponentBits, int MantissaBits, int ExponentBias, deUint32 Flags>
+inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags> Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::largestNormal (int sign)
+{
+       DE_ASSERT(sign == 1 || ((Flags & FLOAT_HAS_SIGN) && sign == -1));
+       return Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::construct(sign, ExponentBias, (static_cast<StorageType>(1) << (MantissaBits + 1)) - 1);
+}
+
+template <typename StorageType, int ExponentBits, int MantissaBits, int ExponentBias, deUint32 Flags>
+inline Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags> Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::smallestNormal (int sign)
+{
+       DE_ASSERT(sign == 1 || ((Flags & FLOAT_HAS_SIGN) && sign == -1));
+       return Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::construct(sign, 1 - ExponentBias, (static_cast<StorageType>(1) << MantissaBits));
+}
+
+template <typename StorageType, int ExponentBits, int MantissaBits, int ExponentBias, deUint32 Flags>
  Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>
  Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::construct
         (int sign, int exponent, StorageType mantissa)
@@ -242,98 +266,148 @@ template <typename StorageType, int ExponentBits, int MantissaBits, int Exponent
  template <typename OtherStorageType, int OtherExponentBits, int OtherMantissaBits, int OtherExponentBias, deUint32 OtherFlags>
  Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>
  Float<StorageType, ExponentBits, MantissaBits, ExponentBias, Flags>::convert
-       (const Float<OtherStorageType, OtherExponentBits, OtherMantissaBits, OtherExponentBias, OtherFlags>& other)
+       (const Float<OtherStorageType, OtherExponentBits, OtherMantissaBits, OtherExponentBias, OtherFlags>& other, RoundingDirection rd)
  {
         if (!(Flags & FLOAT_HAS_SIGN) && other.sign() < 0)
         {
                 // Negative number, truncate to zero.
                 return zero(+1);
         }
-       else if (other.isInf())
+
+       if (other.isInf())
         {
                 return inf(other.sign());
         }
-       else if (other.isNaN())
+
+       if (other.isNaN())
         {
                 return nan();
         }
-       else if (other.isZero())
+
+       if (other.isZero())
         {
                 return zero(other.sign());
         }
-       else
-       {
-               const int                       eMin    = 1 - ExponentBias;
-               const int                       eMax    = ((1<<ExponentBits)-2) - ExponentBias;
  
-               const StorageType       s               = StorageType((StorageType(other.signBit())) << (StorageType(ExponentBits+MantissaBits))); // \note Not sign, but sign bit.
-               int                                     e               = other.exponent();
-               deUint64                        m               = other.mantissa();
+       const int                       eMin    = 1 - ExponentBias;
+       const int                       eMax    = ((1<<ExponentBits)-2) - ExponentBias;
  
-               // Normalize denormalized values prior to conversion.
-               while (!(m & (1ull<<OtherMantissaBits)))
-               {
-                       m <<= 1;
-                       e  -= 1;
-               }
+       const StorageType       s               = StorageType((StorageType(other.signBit())) << (StorageType(ExponentBits+MantissaBits))); // \note Not sign, but sign bit.
+       int                                     e               = other.exponent();
+       deUint64                        m               = other.mantissa();
  
-               if (e < eMin)
-               {
-                       // Underflow.
-                       if ((Flags & FLOAT_SUPPORT_DENORM) && (eMin-e-1 <= MantissaBits))
-                       {
-                               // Shift and round (RTE).
-                               int                     bitDiff = (OtherMantissaBits-MantissaBits) + (eMin-e);
-                               deUint64        half    = (1ull << (bitDiff - 1)) - 1;
-                               deUint64        bias    = (m >> bitDiff) & 1;
+       // Normalize denormalized values prior to conversion.
+       while (!(m & (1ull<<OtherMantissaBits)))
+       {
+               m <<= 1;
+               e  -= 1;
+       }
  
-                               return Float(StorageType(s | (m + half + bias) >> bitDiff));
-                       }
-                       else
-                               return zero(other.sign());
-               }
-               else
+       if (e < eMin)
+       {
+               // Underflow.
+               if ((Flags & FLOAT_SUPPORT_DENORM) && (eMin-e-1 <= MantissaBits))
                 {
-                       // Remove leading 1.
-                       m = m & ~(1ull<<OtherMantissaBits);
-
-                       if (MantissaBits < OtherMantissaBits)
+                       // Shift and round.
+                       int                     bitDiff                 = (OtherMantissaBits-MantissaBits) + (eMin-e);
+                       deUint64        lastBitsMask    = (1ull << bitDiff) - 1ull;
+                       deUint64        lastBits                = (static_cast<deUint64>(m) & lastBitsMask);
+                       deUint64        half                    = (1ull << (bitDiff - 1)) - 1;
+                       deUint64        bias                    = (m >> bitDiff) & 1;
+
+                       switch (rd)
                         {
-                               // Round mantissa (round to nearest even).
-                               int                     bitDiff = OtherMantissaBits-MantissaBits;
-                               deUint64        half    = (1ull << (bitDiff - 1)) - 1;
-                               deUint64        bias    = (m >> bitDiff) & 1;
+                       case ROUND_TO_EVEN:
+                               return Float(StorageType(s | (m + half + bias) >> bitDiff));
  
-                               m = (m + half + bias) >> bitDiff;
+                       case ROUND_DOWNWARD:
+                               m = (m >> bitDiff);
+                               if (lastBits != 0ull && other.sign() < 0)
+                               {
+                                       m += 1;
+                               }
+                               return Float(StorageType(s | m));
  
-                               if (m & (1ull<<MantissaBits))
+                       case ROUND_UPWARD:
+                               m = (m >> bitDiff);
+                               if (lastBits != 0ull && other.sign() > 0)
                                 {
-                                       // Overflow in mantissa.
-                                       m  = 0;
-                                       e += 1;
+                                       m += 1;
                                 }
+                               return Float(StorageType(s | m));
+
+                       default:
+                               DE_ASSERT(false);
+                               break;
                         }
-                       else
+               }
+
+               return zero(other.sign());
+       }
+
+       // Remove leading 1.
+       m = m & ~(1ull<<OtherMantissaBits);
+
+       if (MantissaBits < OtherMantissaBits)
+       {
+               // Round mantissa.
+               int                     bitDiff                 = OtherMantissaBits-MantissaBits;
+               deUint64        lastBitsMask    = (1ull << bitDiff) - 1ull;
+               deUint64        lastBits                = (static_cast<deUint64>(m) & lastBitsMask);
+               deUint64        half                    = (1ull << (bitDiff - 1)) - 1;
+               deUint64        bias                    = (m >> bitDiff) & 1;
+
+               switch (rd)
+               {
+               case ROUND_TO_EVEN:
+                       m = (m + half + bias) >> bitDiff;
+                       break;
+
+               case ROUND_DOWNWARD:
+                       m = (m >> bitDiff);
+                       if (lastBits != 0ull && other.sign() < 0)
                         {
-                               int bitDiff = MantissaBits-OtherMantissaBits;
-                               m = m << bitDiff;
+                               m += 1;
                         }
+                       break;
  
-                       if (e > eMax)
+               case ROUND_UPWARD:
+                       m = (m >> bitDiff);
+                       if (lastBits != 0ull && other.sign() > 0)
                         {
-                               // Overflow.
-                               return inf(other.sign());
+                               m += 1;
                         }
-                       else
-                       {
-                               DE_ASSERT(de::inRange(e, eMin, eMax));
-                               DE_ASSERT(((e + ExponentBias) & ~((1ull<<ExponentBits)-1)) == 0);
-                               DE_ASSERT((m & ~((1ull<<MantissaBits)-1)) == 0);
+                       break;
  
-                               return Float(StorageType(s | (StorageType(e + ExponentBias) << MantissaBits) | m));
-                       }
+               default:
+                       DE_ASSERT(false);
+                       break;
                 }
+
+               if (m & (1ull<<MantissaBits))
+               {
+                       // Overflow in mantissa.
+                       m  = 0;
+                       e += 1;
+               }
+       }
+       else
+       {
+               int bitDiff = MantissaBits-OtherMantissaBits;
+               m = m << bitDiff;
         }
+
+       if (e > eMax)
+       {
+               // Overflow.
+               return (((other.sign() < 0 && rd == ROUND_UPWARD) || (other.sign() > 0 && rd == ROUND_DOWNWARD)) ? largestNormal(other.sign()) : inf(other.sign()));
+       }
+
+       DE_ASSERT(de::inRange(e, eMin, eMax));
+       DE_ASSERT(((e + ExponentBias) & ~((1ull<<ExponentBits)-1)) == 0);
+       DE_ASSERT((m & ~((1ull<<MantissaBits)-1)) == 0);
+
+       return Float(StorageType(s | (StorageType(e + ExponentBias) << MantissaBits) | m));
  }
  
  } // tcu
author	Ricardo Garcia <rgarcia@igalia.com>
	Fri, 11 Oct 2019 12:28:30 +0000 (14:28 +0200)
committer	Alexander Galazin <Alexander.Galazin@arm.com>
	Fri, 25 Oct 2019 14:45:13 +0000 (10:45 -0400)
AndroidGen.mk		patch \| blob \| history
android/cts/master/vk-master.txt		patch \| blob \| history
external/vulkancts/modules/vulkan/image/vktImageTranscodingSupportTests.cpp		patch \| blob \| history
external/vulkancts/modules/vulkan/shaderexecutor/CMakeLists.txt		patch \| blob \| history
external/vulkancts/modules/vulkan/shaderexecutor/vktShaderBuiltinTests.cpp		patch \| blob \| history
external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.cpp	[new file with mode: 0644]	patch \| blob
external/vulkancts/modules/vulkan/shaderexecutor/vktShaderFConvertTests.hpp	[new file with mode: 0644]	patch \| blob
external/vulkancts/mustpass/master/vk-default-no-waivers.txt		patch \| blob \| history
external/vulkancts/mustpass/master/vk-default.txt		patch \| blob \| history
framework/common/tcuFloat.hpp		patch \| blob \| history