1
2 /*
3 * Copyright (C) Dmitry Volyntsev
4 * Copyright (C) NGINX, Inc.
5 *
6 * An internal diy_fp implementation.
7 * For details, see Loitsch, Florian. "Printing floating-point numbers quickly
8 * and accurately with integers." ACM Sigplan Notices 45.6 (2010): 233-243.
9 */
10
11
12 #include <njs_main.h>
13 #include <njs_diyfp.h>
14
15
16 typedef struct njs_cpe_s {
17 uint64_t significand;
18 int16_t bin_exp;
19 int16_t dec_exp;
20 } njs_cpe_t;
21
22
23 static const njs_cpe_t njs_cached_powers[] = {
24 { njs_uint64(0xfa8fd5a0, 0x081c0288), -1220, -348 },
25 { njs_uint64(0xbaaee17f, 0xa23ebf76), -1193, -340 },
26 { njs_uint64(0x8b16fb20, 0x3055ac76), -1166, -332 },
27 { njs_uint64(0xcf42894a, 0x5dce35ea), -1140, -324 },
28 { njs_uint64(0x9a6bb0aa, 0x55653b2d), -1113, -316 },
29 { njs_uint64(0xe61acf03, 0x3d1a45df), -1087, -308 },
30 { njs_uint64(0xab70fe17, 0xc79ac6ca), -1060, -300 },
31 { njs_uint64(0xff77b1fc, 0xbebcdc4f), -1034, -292 },
32 { njs_uint64(0xbe5691ef, 0x416bd60c), -1007, -284 },
33 { njs_uint64(0x8dd01fad, 0x907ffc3c), -980, -276 },
34 { njs_uint64(0xd3515c28, 0x31559a83), -954, -268 },
35 { njs_uint64(0x9d71ac8f, 0xada6c9b5), -927, -260 },
36 { njs_uint64(0xea9c2277, 0x23ee8bcb), -901, -252 },
37 { njs_uint64(0xaecc4991, 0x4078536d), -874, -244 },
38 { njs_uint64(0x823c1279, 0x5db6ce57), -847, -236 },
39 { njs_uint64(0xc2109436, 0x4dfb5637), -821, -228 },
40 { njs_uint64(0x9096ea6f, 0x3848984f), -794, -220 },
41 { njs_uint64(0xd77485cb, 0x25823ac7), -768, -212 },
42 { njs_uint64(0xa086cfcd, 0x97bf97f4), -741, -204 },
43 { njs_uint64(0xef340a98, 0x172aace5), -715, -196 },
44 { njs_uint64(0xb23867fb, 0x2a35b28e), -688, -188 },
45 { njs_uint64(0x84c8d4df, 0xd2c63f3b), -661, -180 },
46 { njs_uint64(0xc5dd4427, 0x1ad3cdba), -635, -172 },
47 { njs_uint64(0x936b9fce, 0xbb25c996), -608, -164 },
48 { njs_uint64(0xdbac6c24, 0x7d62a584), -582, -156 },
49 { njs_uint64(0xa3ab6658, 0x0d5fdaf6), -555, -148 },
50 { njs_uint64(0xf3e2f893, 0xdec3f126), -529, -140 },
51 { njs_uint64(0xb5b5ada8, 0xaaff80b8), -502, -132 },
52 { njs_uint64(0x87625f05, 0x6c7c4a8b), -475, -124 },
53 { njs_uint64(0xc9bcff60, 0x34c13053), -449, -116 },
54 { njs_uint64(0x964e858c, 0x91ba2655), -422, -108 },
55 { njs_uint64(0xdff97724, 0x70297ebd), -396, -100 },
56 { njs_uint64(0xa6dfbd9f, 0xb8e5b88f), -369, -92 },
57 { njs_uint64(0xf8a95fcf, 0x88747d94), -343, -84 },
58 { njs_uint64(0xb9447093, 0x8fa89bcf), -316, -76 },
59 { njs_uint64(0x8a08f0f8, 0xbf0f156b), -289, -68 },
60 { njs_uint64(0xcdb02555, 0x653131b6), -263, -60 },
61 { njs_uint64(0x993fe2c6, 0xd07b7fac), -236, -52 },
62 { njs_uint64(0xe45c10c4, 0x2a2b3b06), -210, -44 },
63 { njs_uint64(0xaa242499, 0x697392d3), -183, -36 },
64 { njs_uint64(0xfd87b5f2, 0x8300ca0e), -157, -28 },
65 { njs_uint64(0xbce50864, 0x92111aeb), -130, -20 },
66 { njs_uint64(0x8cbccc09, 0x6f5088cc), -103, -12 },
67 { njs_uint64(0xd1b71758, 0xe219652c), -77, -4 },
68 { njs_uint64(0x9c400000, 0x00000000), -50, 4 },
69 { njs_uint64(0xe8d4a510, 0x00000000), -24, 12 },
70 { njs_uint64(0xad78ebc5, 0xac620000), 3, 20 },
71 { njs_uint64(0x813f3978, 0xf8940984), 30, 28 },
72 { njs_uint64(0xc097ce7b, 0xc90715b3), 56, 36 },
73 { njs_uint64(0x8f7e32ce, 0x7bea5c70), 83, 44 },
74 { njs_uint64(0xd5d238a4, 0xabe98068), 109, 52 },
75 { njs_uint64(0x9f4f2726, 0x179a2245), 136, 60 },
76 { njs_uint64(0xed63a231, 0xd4c4fb27), 162, 68 },
77 { njs_uint64(0xb0de6538, 0x8cc8ada8), 189, 76 },
78 { njs_uint64(0x83c7088e, 0x1aab65db), 216, 84 },
79 { njs_uint64(0xc45d1df9, 0x42711d9a), 242, 92 },
80 { njs_uint64(0x924d692c, 0xa61be758), 269, 100 },
81 { njs_uint64(0xda01ee64, 0x1a708dea), 295, 108 },
82 { njs_uint64(0xa26da399, 0x9aef774a), 322, 116 },
83 { njs_uint64(0xf209787b, 0xb47d6b85), 348, 124 },
84 { njs_uint64(0xb454e4a1, 0x79dd1877), 375, 132 },
85 { njs_uint64(0x865b8692, 0x5b9bc5c2), 402, 140 },
86 { njs_uint64(0xc83553c5, 0xc8965d3d), 428, 148 },
87 { njs_uint64(0x952ab45c, 0xfa97a0b3), 455, 156 },
88 { njs_uint64(0xde469fbd, 0x99a05fe3), 481, 164 },
89 { njs_uint64(0xa59bc234, 0xdb398c25), 508, 172 },
90 { njs_uint64(0xf6c69a72, 0xa3989f5c), 534, 180 },
91 { njs_uint64(0xb7dcbf53, 0x54e9bece), 561, 188 },
92 { njs_uint64(0x88fcf317, 0xf22241e2), 588, 196 },
93 { njs_uint64(0xcc20ce9b, 0xd35c78a5), 614, 204 },
94 { njs_uint64(0x98165af3, 0x7b2153df), 641, 212 },
95 { njs_uint64(0xe2a0b5dc, 0x971f303a), 667, 220 },
96 { njs_uint64(0xa8d9d153, 0x5ce3b396), 694, 228 },
97 { njs_uint64(0xfb9b7cd9, 0xa4a7443c), 720, 236 },
98 { njs_uint64(0xbb764c4c, 0xa7a44410), 747, 244 },
99 { njs_uint64(0x8bab8eef, 0xb6409c1a), 774, 252 },
100 { njs_uint64(0xd01fef10, 0xa657842c), 800, 260 },
101 { njs_uint64(0x9b10a4e5, 0xe9913129), 827, 268 },
102 { njs_uint64(0xe7109bfb, 0xa19c0c9d), 853, 276 },
103 { njs_uint64(0xac2820d9, 0x623bf429), 880, 284 },
104 { njs_uint64(0x80444b5e, 0x7aa7cf85), 907, 292 },
105 { njs_uint64(0xbf21e440, 0x03acdd2d), 933, 300 },
106 { njs_uint64(0x8e679c2f, 0x5e44ff8f), 960, 308 },
107 { njs_uint64(0xd433179d, 0x9c8cb841), 986, 316 },
108 { njs_uint64(0x9e19db92, 0xb4e31ba9), 1013, 324 },
109 { njs_uint64(0xeb96bf6e, 0xbadf77d9), 1039, 332 },
110 { njs_uint64(0xaf87023b, 0x9bf0ee6b), 1066, 340 },
111 };
112
113
114 #define NJS_D_1_LOG2_10 0.30102999566398114 /* 1 / log2(10). */
115
116
117 njs_diyfp_t
njs_cached_power_dec(int exp,int * dec_exp)118 njs_cached_power_dec(int exp, int *dec_exp)
119 {
120 u_int index;
121 const njs_cpe_t *cp;
122
123 index = (exp + NJS_DECIMAL_EXPONENT_OFF) / NJS_DECIMAL_EXPONENT_DIST;
124 cp = &njs_cached_powers[index];
125
126 *dec_exp = cp->dec_exp;
127
128 return njs_diyfp(cp->significand, cp->bin_exp);
129 }
130
131
132 njs_diyfp_t
njs_cached_power_bin(int exp,int * dec_exp)133 njs_cached_power_bin(int exp, int *dec_exp)
134 {
135 int k;
136 u_int index;
137 const njs_cpe_t *cp;
138
139 k = (int) ceil((-61 - exp) * NJS_D_1_LOG2_10)
140 + NJS_DECIMAL_EXPONENT_OFF - 1;
141
142 index = (unsigned) (k >> 3) + 1;
143
144 cp = &njs_cached_powers[index];
145
146 *dec_exp = -(NJS_DECIMAL_EXPONENT_MIN + (int) (index << 3));
147
148 return njs_diyfp(cp->significand, cp->bin_exp);
149 }
150