2022-05-10 10:06:48 +00:00
|
|
|
// Copyright (C) 2016 by Southwest Research Institute (R)
|
|
|
|
// Copyright (C) 2019 Intel Corporation.
|
|
|
|
// Copyright (C) 2020 The Qt Company Ltd.
|
|
|
|
// SPDX-License-Identifier: LicenseRef-Qt-Commercial OR LGPL-3.0-only OR GPL-2.0-only OR GPL-3.0-only
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
#include <stdint.h>
|
|
|
|
#include <stdio.h>
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-06-03 17:42:25 +00:00
|
|
|
/*
|
|
|
|
* This tool generates the tables used by qfloat16 to implement a
|
|
|
|
* software-emulated version of IEEE 754 binary16. qfloat16 automatically uses
|
|
|
|
* CPU instructions to convert to and from float (IEEE 754 binary32), but if
|
|
|
|
* the CPU is not guaranteed to have those instructions available at compile
|
|
|
|
* time, then qfloat16 needs the tables to perform the conversion with
|
|
|
|
* reasonable performance.
|
|
|
|
*
|
|
|
|
* Because Qt requires float to be IEEE 754 binary32, these tables are
|
|
|
|
* platform-independent and will never change.
|
|
|
|
*/
|
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
uint32_t convertmantissa(int32_t i)
|
2013-06-23 00:43:46 +00:00
|
|
|
{
|
2019-03-14 03:33:52 +00:00
|
|
|
uint32_t m = i << 13; // Zero pad mantissa bits
|
|
|
|
uint32_t e = 0; // Zero exponent
|
2013-06-23 00:43:46 +00:00
|
|
|
|
|
|
|
while (!(m & 0x00800000)) { // While not normalized
|
|
|
|
e -= 0x00800000; // Decrement exponent (1<<23)
|
|
|
|
m <<= 1; // Shift mantissa
|
|
|
|
}
|
|
|
|
m &= ~0x00800000; // Clear leading 1 bit
|
|
|
|
e += 0x38800000; // Adjust bias ((127-14)<<23)
|
|
|
|
return m | e; // Return combined number
|
|
|
|
}
|
|
|
|
|
|
|
|
// we first build these tables up and then print them out as a separate step in order
|
|
|
|
// to more closely map the implementation given in the paper.
|
2019-03-14 03:33:52 +00:00
|
|
|
uint32_t basetable[512];
|
|
|
|
uint32_t shifttable[512];
|
2020-07-29 10:11:35 +00:00
|
|
|
uint32_t roundtable[512];
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
int main()
|
2013-06-23 00:43:46 +00:00
|
|
|
{
|
2019-03-14 03:33:52 +00:00
|
|
|
uint32_t i;
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-06-03 17:42:25 +00:00
|
|
|
printf("/* This file was generated by util/qfloat16-tables/gen_qfloat16_tables.cpp */\n\n");
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("#include <QtCore/qfloat16.h>\n\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("QT_BEGIN_NAMESPACE\n\n");
|
2019-11-06 00:00:08 +00:00
|
|
|
printf("#if !defined(__ARM_FP16_FORMAT_IEEE)\n\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("const quint32 qfloat16::mantissatable[2048] = {\n");
|
|
|
|
printf("0,\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 1; i < 1024; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("0x%XU,\n", convertmantissa(i));
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 1024; i < 2048; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("0x%XU,\n", 0x38000000U + ((i - 1024) << 13));
|
|
|
|
printf("};\n\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("const quint32 qfloat16::exponenttable[64] = {\n");
|
|
|
|
printf("0,\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 1; i < 31; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("0x%XU,\n", i << 23);
|
|
|
|
printf("0x47800000U,\n"); // 31
|
|
|
|
printf("0x80000000U,\n"); // 32
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 33; i < 63; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("0x%XU,\n", 0x80000000U + ((i - 32) << 23));
|
|
|
|
printf("0xC7800000U,\n"); // 63
|
|
|
|
printf("};\n\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("const quint32 qfloat16::offsettable[64] = {\n");
|
|
|
|
printf("0,\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 1; i < 32; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("1024U,\n");
|
|
|
|
printf("0,\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 33; i < 64; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("1024U,\n");
|
|
|
|
printf("};\n\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
int32_t e;
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 0; i < 256; ++i) {
|
|
|
|
e = i - 127;
|
2020-07-29 10:11:35 +00:00
|
|
|
if (e < -25) { // Very small numbers map to zero
|
2013-06-23 00:43:46 +00:00
|
|
|
basetable[i | 0x000] = 0x0000;
|
|
|
|
basetable[i | 0x100] = 0x8000;
|
|
|
|
shifttable[i | 0x000] = 24;
|
|
|
|
shifttable[i | 0x100] = 24;
|
2020-07-29 10:11:35 +00:00
|
|
|
roundtable[i | 0x000] = 0;
|
|
|
|
roundtable[i | 0x100] = 0;
|
2013-06-23 00:43:46 +00:00
|
|
|
|
|
|
|
} else if (e < -14) { // Small numbers map to denorms
|
|
|
|
basetable[i | 0x000] = (0x0400 >> (-e - 14));
|
|
|
|
basetable[i | 0x100] = (0x0400 >> (-e - 14)) | 0x8000;
|
|
|
|
shifttable[i | 0x000] = -e - 1;
|
|
|
|
shifttable[i | 0x100] = -e - 1;
|
2020-07-29 10:11:35 +00:00
|
|
|
if (e == -25) {
|
|
|
|
// rounds up
|
|
|
|
roundtable[i | 0x000] = (1 << 24);
|
|
|
|
roundtable[i | 0x100] = (1 << 24);
|
|
|
|
} else if (e == -24) {
|
|
|
|
// rounds half up
|
|
|
|
roundtable[i | 0x000] = (1 << 22) + 1;
|
|
|
|
roundtable[i | 0x100] = (1 << 22) + 1;
|
|
|
|
} else {
|
|
|
|
roundtable[i | 0x000] = (1 << (-e - 2));
|
|
|
|
roundtable[i | 0x100] = (1 << (-e - 2));
|
|
|
|
}
|
2013-06-23 00:43:46 +00:00
|
|
|
|
|
|
|
} else if (e <= 15) { // Normal numbers just lose precision
|
|
|
|
basetable[i | 0x000] = ((e + 15) << 10);
|
|
|
|
basetable[i | 0x100] = ((e + 15) << 10) | 0x8000;
|
|
|
|
shifttable[i | 0x000] = 13;
|
|
|
|
shifttable[i | 0x100] = 13;
|
2020-07-29 10:11:35 +00:00
|
|
|
roundtable[i | 0x000] = (1 << 12);
|
|
|
|
roundtable[i | 0x100] = (1 << 12);
|
2013-06-23 00:43:46 +00:00
|
|
|
|
|
|
|
} else if (e < 128) { // Large numbers map to Infinity
|
|
|
|
basetable[i | 0x000] = 0x7C00;
|
|
|
|
basetable[i | 0x100] = 0xFC00;
|
|
|
|
shifttable[i | 0x000] = 24;
|
|
|
|
shifttable[i | 0x100] = 24;
|
2020-07-29 10:11:35 +00:00
|
|
|
roundtable[i | 0x000] = 0;
|
|
|
|
roundtable[i | 0x100] = 0;
|
2013-06-23 00:43:46 +00:00
|
|
|
|
|
|
|
} else { // Infinity and NaN's stay Infinity and NaN's
|
|
|
|
basetable[i | 0x000] = 0x7C00;
|
|
|
|
basetable[i | 0x100] = 0xFC00;
|
|
|
|
shifttable[i | 0x000] = 13;
|
|
|
|
shifttable[i | 0x100] = 13;
|
2020-07-29 10:11:35 +00:00
|
|
|
roundtable[i | 0x000] = 0;
|
|
|
|
roundtable[i | 0x100] = 0;
|
2013-06-23 00:43:46 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-07-29 10:11:35 +00:00
|
|
|
printf("const quint16 qfloat16::basetable[512] = {\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 0; i < 512; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("0x%XU,\n", basetable[i]);
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("};\n\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2020-07-29 10:11:35 +00:00
|
|
|
printf("const quint16 qfloat16::shifttable[512] = {\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
for (i = 0; i < 512; i++)
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("0x%XU,\n", shifttable[i]);
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("};\n\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
|
2020-07-29 10:11:35 +00:00
|
|
|
printf("const quint32 qfloat16::roundtable[512] = {\n");
|
|
|
|
for (i = 0; i < 512; i++)
|
|
|
|
printf("0x%XU,\n", roundtable[i]);
|
|
|
|
|
|
|
|
printf("};\n\n");
|
|
|
|
|
2019-11-06 00:00:08 +00:00
|
|
|
printf("#endif // !__ARM_FP16_FORMAT_IEEE\n\n");
|
2019-03-14 03:33:52 +00:00
|
|
|
printf("QT_END_NAMESPACE\n");
|
2013-06-23 00:43:46 +00:00
|
|
|
return 0;
|
|
|
|
}
|