This source file includes following definitions.
- is_type_supported
- test
- test_all
- main
#include "Halide.h"
#include <stdio.h>
#include <future>
using namespace Halide;
template<typename A>
const char *string_of_type();
#define DECL_SOT(name) \
template<> \
const char *string_of_type<name>() {return #name;}
DECL_SOT(uint8_t);
DECL_SOT(int8_t);
DECL_SOT(uint16_t);
DECL_SOT(int16_t);
DECL_SOT(uint32_t);
DECL_SOT(int32_t);
DECL_SOT(float);
DECL_SOT(double);
template <typename T>
bool is_type_supported(int vec_width, const Target &target) {
return target.supports_type(type_of<T>().with_lanes(vec_width));
}
template <>
bool is_type_supported<float>(int vec_width, const Target &target) {
if (target.features_any_of({Target::HVX_64, Target::HVX_128})) {
return vec_width == 1;
} else {
return true;
}
}
template <>
bool is_type_supported<double>(int vec_width, const Target &target) {
if (target.has_feature(Target::OpenCL) &&
!target.has_feature(Target::CLDoubles)) {
return false;
} else if (target.features_any_of({Target::HVX_64, Target::HVX_128})) {
return vec_width == 1;
} else {
return true;
}
}
template<typename A, typename B>
bool test(int vec_width, const Target &target) {
if (!is_type_supported<A>(vec_width, target) || !is_type_supported<B>(vec_width, target)) {
return true;
}
int W = 1024;
int H = 1;
Buffer<A> input(W, H);
for (int y = 0; y < H; y++) {
for (int x = 0; x < W; x++) {
input(x, y) = (A)((rand()&0xffff)*0.1);
}
}
Var x, y;
Func f;
f(x, y) = cast<B>(input(x, y));
if (target.has_gpu_feature()) {
Var xo, xi;
f.gpu_tile(x, xo, xi, 64);
} else {
if (target.features_any_of({Target::HVX_64, Target::HVX_128})) {
}
if (vec_width > 1) {
f.vectorize(x, vec_width);
}
}
Buffer<B> output = f.realize(W, H);
for (int y = 0; y < H; y++) {
for (int x = 0; x < W; x++) {
bool ok = ((B)(input(x, y)) == output(x, y));
if (!ok) {
fprintf(stderr, "%s x %d -> %s x %d failed\n",
string_of_type<A>(), vec_width,
string_of_type<B>(), vec_width);
fprintf(stderr, "At %d %d, %f -> %f instead of %f\n",
x, y,
(double)(input(x, y)),
(double)(output(x, y)),
(double)((B)(input(x, y))));
return false;
}
}
}
return true;
}
template<typename A>
bool test_all(int vec_width, const Target &target) {
bool success = true;
success = success && test<A, float>(vec_width, target);
success = success && test<A, double>(vec_width, target);
success = success && test<A, uint8_t>(vec_width, target);
success = success && test<A, uint16_t>(vec_width, target);
success = success && test<A, uint32_t>(vec_width, target);
success = success && test<A, int8_t>(vec_width, target);
success = success && test<A, int16_t>(vec_width, target);
success = success && test<A, int32_t>(vec_width, target);
return success;
}
int main(int argc, char **argv) {
#ifdef WIN32
printf("Not testing on windows\n");
return 0;
#endif
Target target = get_jit_target_from_environment();
Halide::Internal::ThreadPool<bool> pool;
std::vector<std::future<bool>> futures;
for (int vec_width = 1; vec_width <= 64; vec_width*=2) {
futures.push_back(pool.async([=]() {
bool success = true;
success = success && test_all<float>(vec_width, target);
success = success && test_all<double>(vec_width, target);
success = success && test_all<uint8_t>(vec_width, target);
success = success && test_all<uint16_t>(vec_width, target);
success = success && test_all<uint32_t>(vec_width, target);
success = success && test_all<int8_t>(vec_width, target);
success = success && test_all<int16_t>(vec_width, target);
success = success && test_all<int32_t>(vec_width, target);
return success;
}));
}
bool ok = true;
for (auto &f : futures) {
ok &= f.get();
}
if (!ok) return -1;
printf("Success!\n");
return 0;
}