skia2/tests/Float16Test.cpp
mtklein a525cb151b skeleton for float <-> half optimized procs
Nothing fancy yet, just calls the serial code in a loop.

I will try to folow this up with at least some of:
   - SSE2 version of serial code
   - NEON version of serial code
   - NEON version using vcvt.f32.f16/vcvt.f16.f32
   - F16C (between AVX and AVX2) version using vcvtph2ps/vcvtps2ph
The last two are fastest but need runtime detection.

BUG=skia:
GOLD_TRYBOT_URL= https://gold.skia.org/search2?unt=true&query=source_type%3Dgm&master=false&issue=1686543003

Review URL: https://codereview.chromium.org/1686543003
2016-02-09 08:18:10 -08:00

67 lines
1.9 KiB
C++

/*
* Copyright 2016 Google Inc.
*
* Use of this source code is governed by a BSD-style license that can be
* found in the LICENSE file.
*/
#include "Test.h"
#include "SkColor.h"
#include "SkHalf.h"
#include "SkOpts.h"
#include "SkPixmap.h"
static bool eq_within_half_float(float a, float b) {
const float kTolerance = 1.0f / (1 << (8 + 10));
SkHalf ha = SkFloatToHalf(a);
SkHalf hb = SkFloatToHalf(b);
float a2 = SkHalfToFloat(ha);
float b2 = SkHalfToFloat(hb);
return fabsf(a2 - b2) <= kTolerance;
}
static bool eq_within_half_float(const SkPM4f& a, const SkPM4f& b) {
for (int i = 0; i < 4; ++i) {
if (!eq_within_half_float(a.fVec[i], b.fVec[i])) {
return false;
}
}
return true;
}
DEF_TEST(color_half_float, reporter) {
const int w = 100;
const int h = 100;
SkImageInfo info = SkImageInfo::Make(w, h, kRGBA_F16_SkColorType, kPremul_SkAlphaType);
SkAutoPixmapStorage pm;
pm.alloc(info);
REPORTER_ASSERT(reporter, pm.getSafeSize() == SkToSizeT(w * h * sizeof(uint64_t)));
SkColor4f c4 { 0.5f, 1, 0.5f, 0.25f };
pm.erase(c4);
SkPM4f origpm4 = c4.premul();
for (int y = 0; y < pm.height(); ++y) {
for (int x = 0; x < pm.width(); ++x) {
SkPM4f pm4 = SkPM4f::FromF16(pm.addrF16(x, y));
REPORTER_ASSERT(reporter, eq_within_half_float(origpm4, pm4));
}
}
}
DEF_TEST(float_to_half, reporter) {
const float fs[] = { 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0 };
const uint16_t hs[] = { 0x3c00, 0x4000, 0x4200, 0x4400, 0x4500, 0x4600, 0x4700 };
uint16_t hscratch[7];
SkOpts::float_to_half(hscratch, fs, 7);
REPORTER_ASSERT(reporter, 0 == memcmp(hscratch, hs, sizeof(hs)));
float fscratch[7];
SkOpts::half_to_float(fscratch, hs, 7);
REPORTER_ASSERT(reporter, 0 == memcmp(fscratch, fs, sizeof(fs)));
}