summary | refs | log | tree | commit | diff | stats
path: root/src/corelib/global/qfloat16.h
diff options
context:
space:
mode:
author: Allan Sandfeld Jensen <allan.jensen@qt.io> 2020-07-29 12:11:35 +0200
committer: Allan Sandfeld Jensen <allan.jensen@qt.io> 2020-09-06 12:35:12 +0200
commit: d3ff95dcb84861e8f42b480910d822b4ca8715b1 (patch)
tree: 7ade0148126e83ed589258983b632fbe3488d7fb /src/corelib/global/qfloat16.h
parent: a0e0b51001edfc1c7aea113c472ce995efa833fd (diff)
Round float->qfloat16 to even
Calibrated to match F16C and ARM-FP16 hardware conversions.

Change-Id: I3bdd4d3db3046fee4aeb24e4ce8b9bc9a06e0397
Reviewed-by: Edward Welbourne <edward.welbourne@qt.io>
Reviewed-by: Thiago Macieira <thiago.macieira@intel.com>
Diffstat (limited to 'src/corelib/global/qfloat16.h')
-rw-r--r-- src/corelib/global/qfloat16.h 15
1 files changed, 10 insertions, 5 deletions
diff --git a/src/corelib/global/qfloat16.h b/src/corelib/global/qfloat16.h
index acf9220490..136571bbaf 100644
--- a/src/corelib/global/qfloat16.h
+++ b/src/corelib/global/qfloat16.h
@@ -107,8 +107,9 @@ private:
Q_CORE_EXPORT static const quint32 mantissatable[];
Q_CORE_EXPORT static const quint32 exponenttable[];
Q_CORE_EXPORT static const quint32 offsettable[];
- Q_CORE_EXPORT static const quint32 basetable[];
- Q_CORE_EXPORT static const quint32 shifttable[];
+ Q_CORE_EXPORT static const quint16 basetable[];
+ Q_CORE_EXPORT static const quint16 shifttable[];
+ Q_CORE_EXPORT static const quint32 roundtable[];
friend bool qIsNull(qfloat16 f) noexcept;
#if !defined(QT_NO_FLOAT16_OPERATORS)
@@ -173,14 +174,18 @@ inline qfloat16::qfloat16(float f) noexcept
quint32 u;
memcpy(&u, &f, sizeof(quint32));
const quint32 signAndExp = u >> 23;
- const quint32 base = basetable[signAndExp];
- const quint32 shift = shifttable[signAndExp];
+ const quint16 base = basetable[signAndExp];
+ const quint16 shift = shifttable[signAndExp];
+ const quint32 round = roundtable[signAndExp];
quint32 mantissa = (u & 0x007fffff);
if ((signAndExp & 0xff) == 0xff) {
if (mantissa) // keep nan from truncating to inf
mantissa = qMax(1U << shift, mantissa);
} else {
- mantissa += (1U << (shift - 1)) - 1; // rounding
+ // round half to even
+ mantissa += round;
+ if (mantissa & (1 << shift))
+ --mantissa;
}
// We use add as the mantissa may overflow causing