2017-08-12 15:38:17 +02:00
|
|
|
|
|
|
|
// =================================================================================================
|
|
|
|
// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This
|
|
|
|
// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max-
|
|
|
|
// width of 100 characters per line.
|
|
|
|
//
|
|
|
|
// Author(s):
|
|
|
|
// Cedric Nugteren <www.cedricnugteren.nl>
|
|
|
|
//
|
|
|
|
// This file implements the test utility functions.
|
|
|
|
//
|
|
|
|
// =================================================================================================
|
|
|
|
|
|
|
|
#include "test/test_utilities.hpp"
|
|
|
|
|
|
|
|
#include <string>
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
namespace clblast {
|
|
|
|
// =================================================================================================
|
|
|
|
|
|
|
|
// Returns whether a scalar is close to zero
|
|
|
|
template <typename T> bool IsCloseToZero(const T value) { return (value > -SmallConstant<T>()) && (value < SmallConstant<T>()); }
|
|
|
|
template bool IsCloseToZero<float>(const float);
|
|
|
|
template bool IsCloseToZero<double>(const double);
|
|
|
|
template <> bool IsCloseToZero(const half value) { return IsCloseToZero(HalfToFloat(value)); }
|
|
|
|
template <> bool IsCloseToZero(const float2 value) { return IsCloseToZero(value.real()) || IsCloseToZero(value.imag()); }
|
|
|
|
template <> bool IsCloseToZero(const double2 value) { return IsCloseToZero(value.real()) || IsCloseToZero(value.imag()); }
|
|
|
|
|
|
|
|
// =================================================================================================
|
|
|
|
|
|
|
|
template <typename T, typename U>
|
|
|
|
void DeviceToHost(const Arguments<U> &args, Buffers<T> &buffers, BuffersHost<T> &buffers_host,
|
|
|
|
Queue &queue, const std::vector<std::string> &names) {
|
|
|
|
for (auto &name: names) {
|
|
|
|
if (name == kBufVecX) {buffers_host.x_vec = std::vector<T>(args.x_size, static_cast<T>(0)); buffers.x_vec.Read(queue, args.x_size, buffers_host.x_vec); }
|
|
|
|
else if (name == kBufVecY) { buffers_host.y_vec = std::vector<T>(args.y_size, static_cast<T>(0)); buffers.y_vec.Read(queue, args.y_size, buffers_host.y_vec); }
|
|
|
|
else if (name == kBufMatA) { buffers_host.a_mat = std::vector<T>(args.a_size, static_cast<T>(0)); buffers.a_mat.Read(queue, args.a_size, buffers_host.a_mat); }
|
|
|
|
else if (name == kBufMatB) { buffers_host.b_mat = std::vector<T>(args.b_size, static_cast<T>(0)); buffers.b_mat.Read(queue, args.b_size, buffers_host.b_mat); }
|
|
|
|
else if (name == kBufMatC) { buffers_host.c_mat = std::vector<T>(args.c_size, static_cast<T>(0)); buffers.c_mat.Read(queue, args.c_size, buffers_host.c_mat); }
|
|
|
|
else if (name == kBufMatAP) { buffers_host.ap_mat = std::vector<T>(args.ap_size, static_cast<T>(0)); buffers.ap_mat.Read(queue, args.ap_size, buffers_host.ap_mat); }
|
|
|
|
else if (name == kBufScalar) { buffers_host.scalar = std::vector<T>(args.scalar_size, static_cast<T>(0)); buffers.scalar.Read(queue, args.scalar_size, buffers_host.scalar); }
|
|
|
|
else { throw std::runtime_error("Invalid buffer name"); }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename T, typename U>
|
|
|
|
void HostToDevice(const Arguments<U> &args, Buffers<T> &buffers, BuffersHost<T> &buffers_host,
|
|
|
|
Queue &queue, const std::vector<std::string> &names) {
|
|
|
|
for (auto &name: names) {
|
|
|
|
if (name == kBufVecX) { buffers.x_vec.Write(queue, args.x_size, buffers_host.x_vec); }
|
|
|
|
else if (name == kBufVecY) { buffers.y_vec.Write(queue, args.y_size, buffers_host.y_vec); }
|
|
|
|
else if (name == kBufMatA) { buffers.a_mat.Write(queue, args.a_size, buffers_host.a_mat); }
|
|
|
|
else if (name == kBufMatB) { buffers.b_mat.Write(queue, args.b_size, buffers_host.b_mat); }
|
|
|
|
else if (name == kBufMatC) { buffers.c_mat.Write(queue, args.c_size, buffers_host.c_mat); }
|
|
|
|
else if (name == kBufMatAP) { buffers.ap_mat.Write(queue, args.ap_size, buffers_host.ap_mat); }
|
|
|
|
else if (name == kBufScalar) { buffers.scalar.Write(queue, args.scalar_size, buffers_host.scalar); }
|
|
|
|
else { throw std::runtime_error("Invalid buffer name"); }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Compiles the above functions
|
|
|
|
template void DeviceToHost(const Arguments<half>&, Buffers<half>&, BuffersHost<half>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void DeviceToHost(const Arguments<float>&, Buffers<float>&, BuffersHost<float>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void DeviceToHost(const Arguments<double>&, Buffers<double>&, BuffersHost<double>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void DeviceToHost(const Arguments<float>&, Buffers<float2>&, BuffersHost<float2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void DeviceToHost(const Arguments<double>&, Buffers<double2>&, BuffersHost<double2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void DeviceToHost(const Arguments<float2>&, Buffers<float2>&, BuffersHost<float2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void DeviceToHost(const Arguments<double2>&, Buffers<double2>&, BuffersHost<double2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void HostToDevice(const Arguments<half>&, Buffers<half>&, BuffersHost<half>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void HostToDevice(const Arguments<float>&, Buffers<float>&, BuffersHost<float>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void HostToDevice(const Arguments<double>&, Buffers<double>&, BuffersHost<double>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void HostToDevice(const Arguments<float>&, Buffers<float2>&, BuffersHost<float2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void HostToDevice(const Arguments<double>&, Buffers<double2>&, BuffersHost<double2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void HostToDevice(const Arguments<float2>&, Buffers<float2>&, BuffersHost<float2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
template void HostToDevice(const Arguments<double2>&, Buffers<double2>&, BuffersHost<double2>&, Queue&, const std::vector<std::string>&);
|
|
|
|
|
|
|
|
// =================================================================================================
|
|
|
|
|
|
|
|
// Conversion between half and single-precision
|
|
|
|
std::vector<float> HalfToFloatBuffer(const std::vector<half>& source) {
|
|
|
|
auto result = std::vector<float>(source.size());
|
|
|
|
for (auto i = size_t(0); i < source.size(); ++i) { result[i] = HalfToFloat(source[i]); }
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
void FloatToHalfBuffer(std::vector<half>& result, const std::vector<float>& source) {
|
|
|
|
for (auto i = size_t(0); i < source.size(); ++i) { result[i] = FloatToHalf(source[i]); }
|
|
|
|
}
|
|
|
|
|
|
|
|
// As above, but now for OpenCL data-types instead of std::vectors
|
2017-10-15 13:56:19 +02:00
|
|
|
#ifdef OPENCL_API
|
|
|
|
Buffer<float> HalfToFloatBuffer(const Buffer<half>& source, RawCommandQueue queue_raw) {
|
|
|
|
const auto size = source.GetSize() / sizeof(half);
|
|
|
|
auto queue = Queue(queue_raw);
|
|
|
|
auto context = queue.GetContext();
|
|
|
|
auto source_cpu = std::vector<half>(size);
|
|
|
|
source.Read(queue, size, source_cpu);
|
|
|
|
auto result_cpu = HalfToFloatBuffer(source_cpu);
|
|
|
|
auto result = Buffer<float>(context, size);
|
|
|
|
result.Write(queue, size, result_cpu);
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
void FloatToHalfBuffer(Buffer<half>& result, const Buffer<float>& source, RawCommandQueue queue_raw) {
|
|
|
|
const auto size = source.GetSize() / sizeof(float);
|
|
|
|
auto queue = Queue(queue_raw);
|
|
|
|
auto context = queue.GetContext();
|
|
|
|
auto source_cpu = std::vector<float>(size);
|
|
|
|
source.Read(queue, size, source_cpu);
|
|
|
|
auto result_cpu = std::vector<half>(size);
|
|
|
|
FloatToHalfBuffer(result_cpu, source_cpu);
|
|
|
|
result.Write(queue, size, result_cpu);
|
|
|
|
}
|
|
|
|
#endif
|
2017-08-12 15:38:17 +02:00
|
|
|
|
|
|
|
// =================================================================================================
|
|
|
|
} // namespace clblast
|