auto-generate _d stages
Stage foo_d should always be the same logic as stage foo swapping r and dr, g and dg, b and db, a and da. This means we can infer their definitions. CQ_INCLUDE_TRYBOTS=skia.primary:Test-Ubuntu-GCC-GCE-CPU-AVX2-x86_64-Release-SKNX_NO_SIMD Change-Id: Ia0a3abb29a201c647d9ec1860211abfbc19b56ae Reviewed-on: https://skia-review.googlesource.com/6555 Reviewed-by: Mike Klein <mtklein@chromium.org> Commit-Queue: Mike Klein <mtklein@chromium.org>
This commit is contained in:
parent
2be687af58
commit
e2b66a769b
@ -70,6 +70,12 @@ SI void SK_VECTORCALL just_return(Stage*, size_t, SkNf, SkNf, SkNf, SkNf,
|
||||
name##_kernel(st->ctx, x_tail/N, x_tail%N, r,g,b,a, dr,dg,db,da); \
|
||||
next(st, x_tail, r,g,b,a, dr,dg,db,da); \
|
||||
} \
|
||||
SI void SK_VECTORCALL name##_d(Stage* st, size_t x_tail, \
|
||||
SkNf r, SkNf g, SkNf b, SkNf a, \
|
||||
SkNf dr, SkNf dg, SkNf db, SkNf da) { \
|
||||
name##_kernel(st->ctx, x_tail/N, x_tail%N, dr,dg,db,da, r,g,b,a); \
|
||||
next(st, x_tail, r,g,b,a, dr,dg,db,da); \
|
||||
} \
|
||||
static SK_ALWAYS_INLINE void name##_kernel(void* ctx, size_t x, size_t tail, \
|
||||
SkNf& r, SkNf& g, SkNf& b, SkNf& a, \
|
||||
SkNf& dr, SkNf& dg, SkNf& db, SkNf& da)
|
||||
@ -313,12 +319,6 @@ STAGE(clamp_a) {
|
||||
g = SkNf::Min(g, a);
|
||||
b = SkNf::Min(b, a);
|
||||
}
|
||||
STAGE(clamp_a_d) {
|
||||
da = SkNf::Min(da, 1.0f);
|
||||
dr = SkNf::Min(dr, da);
|
||||
dg = SkNf::Min(dg, da);
|
||||
db = SkNf::Min(db, da);
|
||||
}
|
||||
|
||||
STAGE(unpremul) {
|
||||
auto scale = (a == 0.0f).thenElse(0.0f, 1.0f/a);
|
||||
@ -352,19 +352,13 @@ STAGE(move_dst_src) {
|
||||
a = da;
|
||||
}
|
||||
|
||||
STAGE(swap_rb) { SkTSwap( r, b); }
|
||||
STAGE(swap_rb_d) { SkTSwap(dr, db); }
|
||||
STAGE(swap_rb) { SkTSwap(r, b); }
|
||||
|
||||
STAGE(from_srgb) {
|
||||
r = sk_linear_from_srgb_math(r);
|
||||
g = sk_linear_from_srgb_math(g);
|
||||
b = sk_linear_from_srgb_math(b);
|
||||
}
|
||||
STAGE(from_srgb_d) {
|
||||
dr = sk_linear_from_srgb_math(dr);
|
||||
dg = sk_linear_from_srgb_math(dg);
|
||||
db = sk_linear_from_srgb_math(db);
|
||||
}
|
||||
STAGE(to_srgb) {
|
||||
r = sk_linear_to_srgb_needs_round(r);
|
||||
g = sk_linear_to_srgb_needs_round(g);
|
||||
@ -473,11 +467,6 @@ STAGE(load_565) {
|
||||
from_565(load(tail, ptr), &r,&g,&b);
|
||||
a = 1.0f;
|
||||
}
|
||||
STAGE(load_565_d) {
|
||||
auto ptr = *(const uint16_t**)ctx + x;
|
||||
from_565(load(tail, ptr), &dr,&dg,&db);
|
||||
da = 1.0f;
|
||||
}
|
||||
STAGE(store_565) {
|
||||
auto ptr = *(uint16_t**)ctx + x;
|
||||
store(tail, SkNx_cast<uint16_t>( SkNf_round(r, SK_R16_MASK) << SK_R16_SHIFT
|
||||
@ -497,17 +486,6 @@ STAGE(load_f16) {
|
||||
}
|
||||
from_f16(src, &r, &g, &b, &a);
|
||||
}
|
||||
STAGE(load_f16_d) {
|
||||
auto ptr = *(const uint64_t**)ctx + x;
|
||||
|
||||
const void* src = ptr;
|
||||
SkNx<N, uint64_t> px;
|
||||
if (tail) {
|
||||
px = load(tail, ptr);
|
||||
src = &px;
|
||||
}
|
||||
from_f16(src, &dr, &dg, &db, &da);
|
||||
}
|
||||
STAGE(store_f16) {
|
||||
auto ptr = *(uint64_t**)ctx + x;
|
||||
|
||||
@ -536,10 +514,6 @@ STAGE(load_8888) {
|
||||
auto ptr = *(const uint32_t**)ctx + x;
|
||||
from_8888(load(tail, ptr), &r, &g, &b, &a);
|
||||
}
|
||||
STAGE(load_8888_d) {
|
||||
auto ptr = *(const uint32_t**)ctx + x;
|
||||
from_8888(load(tail, ptr), &dr, &dg, &db, &da);
|
||||
}
|
||||
STAGE(store_8888) {
|
||||
auto byte = [](const SkNf& x, int ix) {
|
||||
// Here's a neat trick: 0x47000000 == 32768.0f, and 0x470000ff == 32768.0f + (255/256.0f).
|
||||
|
Loading…
Reference in New Issue
Block a user