Commit c5491529 authored by Milo Yip's avatar Milo Yip

Change CountDecimalDigit32() to simple implementation

It is simple and pure C++. And it is found in performance test that it
is even faster than the original version, due to distribution of n. But
the performance gain is not obvious in RapidJSON.
parent 1900b7ba
...@@ -218,27 +218,17 @@ inline void GrisuRound(char* buffer, int len, uint64_t delta, uint64_t rest, uin ...@@ -218,27 +218,17 @@ inline void GrisuRound(char* buffer, int len, uint64_t delta, uint64_t rest, uin
} }
inline unsigned CountDecimalDigit32(uint32_t n) { inline unsigned CountDecimalDigit32(uint32_t n) {
static const uint32_t powers_of_10[] = { // Simple pure C++ implementation was faster than __builtin_clz version in this situation.
0, if (n < 10) return 1;
10, if (n < 100) return 2;
100, if (n < 1000) return 3;
1000, if (n < 10000) return 4;
10000, if (n < 100000) return 5;
100000, if (n < 1000000) return 6;
1000000, if (n < 10000000) return 7;
10000000, if (n < 100000000) return 8;
100000000, if (n < 1000000000) return 9;
1000000000 return 10;
};
#ifdef _MSC_VER
unsigned long i = 0;
_BitScanReverse(&i, n | 1);
uint32_t t = (i + 1) * 1233 >> 12;
#elif __GNUC__
uint32_t t = (32 - __builtin_clz(n | 1)) * 1233 >> 12;
#endif
return t - (n < powers_of_10[t]) + 1;
} }
inline void DigitGen(const DiyFp& W, const DiyFp& Mp, uint64_t delta, char* buffer, int* len, int* K) { inline void DigitGen(const DiyFp& W, const DiyFp& Mp, uint64_t delta, char* buffer, int* len, int* K) {
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment