1 | /* $Id: testmath.c 18083 2009-03-19 09:16:55Z vboxsync $ */
|
---|
2 | /** @file
|
---|
3 | * Testcase for the no-crt math stuff.
|
---|
4 | */
|
---|
5 |
|
---|
6 |
|
---|
7 | /*******************************************************************************
|
---|
8 | * Header Files *
|
---|
9 | *******************************************************************************/
|
---|
10 | #ifndef MATHTEST_STANDALONE
|
---|
11 | # include <iprt/assert.h>
|
---|
12 | # include <math.h>
|
---|
13 | # undef printf
|
---|
14 | # define printf AssertMsg2
|
---|
15 | #else
|
---|
16 | # include <stdio.h>
|
---|
17 | # include <math.h>
|
---|
18 | #endif
|
---|
19 |
|
---|
/*
 * Accepted results for sinl(180.0L).  gcc starting with version 4.3 uses the
 * MPFR library, which gives more accurate results, while gcc-4.3.1 seems to
 * emit the less accurate result.  Both values are therefore allowed.
 */
#define SIN180a (-0.8011526357338304777463731115L)
#define SIN180b (-0.801152635733830477871L)
|
---|
23 |
|
---|
/**
 * Reports a long double mismatch.
 *
 * Prints the operation text with both values, followed by one line per value
 * showing its first ten bytes in hex.
 *
 * @param   pszWhat         Text identifying the failed operation.
 * @param   plrdResult      The value that was produced.
 * @param   plrdExpected    The value that was expected.
 */
static void bitch(const char *pszWhat, const long double *plrdResult, const long double *plrdExpected)
{
    const unsigned char * const pabGot  = (const unsigned char *)plrdResult;
    const unsigned char * const pabWant = (const unsigned char *)plrdExpected;

#ifdef MATHTEST_STANDALONE
    printf("error: %s - %.25f instead of %.25f\n", pszWhat, (double)*plrdResult, (double)*plrdExpected);
#else
    /* Without MATHTEST_STANDALONE the values are printed as integers scaled by 100000. */
    printf("error: %s - %d instead of %d\n", pszWhat, (int)(*plrdResult * 100000), (int)(*plrdExpected * 100000));
#endif
    printf(" %02x%02x%02x%02x-%02x%02x%02x%02x-%02x%02x\n",
           pabGot[0], pabGot[1], pabGot[2], pabGot[3], pabGot[4],
           pabGot[5], pabGot[6], pabGot[7], pabGot[8], pabGot[9]);
    printf(" %02x%02x%02x%02x-%02x%02x%02x%02x-%02x%02x\n",
           pabWant[0], pabWant[1], pabWant[2], pabWant[3], pabWant[4],
           pabWant[5], pabWant[6], pabWant[7], pabWant[8], pabWant[9]);
}
|
---|
36 |
|
---|
/**
 * Reports a long long mismatch.
 *
 * @param   pszWhat     Text identifying the failed operation.
 * @param   llResult    The value that was produced.
 * @param   llExpected  The value that was expected.
 */
static void bitchll(const char *pszWhat, long long llResult, long long llExpected)
{
#if !defined(__MINGW32__) || defined(Assert)
    printf("error: %s - %lld instead of %lld\n", pszWhat, llResult, llExpected);
#else
    /* MinGW without the Assert macro defined: use the I64 length modifier. */
    printf("error: %s - %I64d instead of %I64d\n", pszWhat, llResult, llExpected);
#endif
}
|
---|
45 |
|
---|
/**
 * Reports a long mismatch.
 *
 * @param   pszWhat     Text identifying the failed operation.
 * @param   lResult     The value that was produced.
 * @param   lExpected   The value that was expected.
 */
static void bitchl(const char *pszWhat, long lResult, long lExpected)
{
    printf("error: %s - %ld instead of %ld\n",
           pszWhat,
           lResult,
           lExpected);
}
|
---|
50 |
|
---|
51 | extern int testsin(void)
|
---|
52 | {
|
---|
53 | return sinl(180.0L) == SIN180a || sinl(180.0L) == SIN180b;
|
---|
54 | }
|
---|
55 |
|
---|
56 | extern int testremainder(void)
|
---|
57 | {
|
---|
58 | static double s_rd1 = 2.5;
|
---|
59 | static double s_rd2 = 2.0;
|
---|
60 | static double s_rd3 = 0.5;
|
---|
61 | return remainder(s_rd1, s_rd2) == s_rd3;
|
---|
62 | }
|
---|
63 |
|
---|
/**
 * Loads the x87 FPU control word using the fldcw instruction.
 *
 * @param   cw  The new control word; fldcw reads a 16-bit memory operand.
 */
static __inline__ void set_cw(unsigned cw)
{
    __asm__ __volatile__("fldcw %0"
                         : /* no outputs */
                         : "m" (cw));
}
|
---|
68 |
|
---|
/**
 * Reads the x87 FPU control word using the fstcw instruction.
 *
 * fstcw stores 16 bits to its memory operand, so the operand must be declared
 * as an output ("=m"); declaring it as an input lets the compiler assume the
 * variable is never written.  A 16-bit object is used so that no
 * uninitialised upper bits need masking.
 *
 * @returns The control word, in the low 16 bits of the return value.
 */
static __inline__ unsigned get_cw(void)
{
    unsigned short cw = 0;
    __asm__ __volatile__("fstcw %0" : "=m" (cw));
    return cw;
}
|
---|
75 |
|
---|
/**
 * Verifies the in-memory representation of a long double.
 *
 * The value is stored into a static volatile union and its first eight bytes
 * and the following two bytes are compared against @a ull and @a us.  On a
 * mismatch both representations are printed and an int3 breakpoint
 * instruction is executed.
 *
 * The raw bits are read through a union (as make_lrd() does) rather than
 * through casted pointers, which would access the object through an
 * incompatible, non-volatile lvalue.
 *
 * @returns @a lrd, unchanged.
 * @param   lrd     The value to check.
 * @param   ull     Expected content of the first eight bytes.
 * @param   us      Expected content of bytes eight and nine.
 */
static long double check_lrd(const long double lrd, const unsigned long long ull, const unsigned short us)
{
    static volatile union
    {
        long double lrd;
        struct
        {
            unsigned long long ull;
            unsigned short     us;
        } i;
    } s_u;
    unsigned long long ullActual;
    unsigned short     usActual;

    s_u.lrd   = lrd;
    ullActual = s_u.i.ull;
    usActual  = s_u.i.us;
    if (   ullActual != ull
        || usActual  != us)
    {
#if defined(__MINGW32__) && !defined(Assert)
        printf("%I64x:%04x instead of %I64x:%04x\n", ullActual, usActual, ull, us);
#else
        printf("%llx:%04x instead of %llx:%04x\n", ullActual, usActual, ull, us);
#endif
        __asm__("int3\n");
    }
    return lrd;
}
|
---|
92 |
|
---|
93 |
|
---|
/**
 * Builds a long double from its raw representation.
 *
 * @returns The long double whose first eight bytes are @a ull and whose
 *          following two bytes are @a us.
 * @param   ull     Content for the first eight bytes.
 * @param   us      Content for bytes eight and nine.
 */
static long double make_lrd(const unsigned long long ull, const unsigned short us)
{
    union
    {
        long double lrd;
        struct
        {
            unsigned long long ull;
            unsigned short     us;
        } i;
    } uBits = { .i = { .ull = ull, .us = us } };

    return uBits.lrd;
}
|
---|
110 |
|
---|
/**
 * Sets the FPU control word, verifies that it reads back unchanged, and then
 * checks the representation of @a lrd via check_lrd().
 *
 * If the control word does not read back as @a cw, a message is printed and
 * an int3 breakpoint instruction is executed.
 *
 * @returns The result of check_lrd(lrd, ull, us).
 * @param   lrd     The value to check.
 * @param   ull     Expected first eight bytes of @a lrd.
 * @param   us      Expected bytes eight and nine of @a lrd.
 * @param   cw      The control word to load.
 */
static long double check_lrd_cw(const long double lrd, const unsigned long long ull, const unsigned short us, const unsigned cw)
{
    unsigned cwActual;

    set_cw(cw);
    cwActual = get_cw();
    if (cwActual != cw)
    {
        printf("get_cw() -> %#x expected %#x\n", cwActual, cw);
        __asm__("int3\n");
    }
    return check_lrd(lrd, ull, us);
}
|
---|
121 |
|
---|
/**
 * Loads the FPU control word @a cw, builds a long double from its raw
 * representation and verifies it via check_lrd_cw().
 *
 * @returns The constructed long double.
 * @param   ull     Content for the first eight bytes.
 * @param   us      Content for bytes eight and nine.
 * @param   cw      The control word to load before constructing the value.
 */
static long double make_lrd_cw(unsigned long long ull, unsigned short us, unsigned cw)
{
    long double lrdMade;

    set_cw(cw);
    lrdMade = make_lrd(ull, us);
    return check_lrd_cw(lrdMade, ull, us, cw);
}
|
---|
127 |
|
---|
128 | extern int testmath(void)
|
---|
129 | {
|
---|
130 | unsigned cErrors = 0;
|
---|
131 | long double lrdResult;
|
---|
132 | long double lrdExpect;
|
---|
133 | long double lrd;
|
---|
134 | #define CHECK(operation, expect) \
|
---|
135 | do { \
|
---|
136 | lrdExpect = expect; \
|
---|
137 | lrdResult = operation; \
|
---|
138 | if (lrdResult != lrdExpect) \
|
---|
139 | { \
|
---|
140 | bitch(#operation, &lrdResult, &lrdExpect); \
|
---|
141 | cErrors++; \
|
---|
142 | } \
|
---|
143 | } while (0)
|
---|
144 |
|
---|
145 | long long llResult;
|
---|
146 | long long llExpect;
|
---|
147 | #define CHECKLL(operation, expect) \
|
---|
148 | do { \
|
---|
149 | llExpect = expect; \
|
---|
150 | llResult = operation; \
|
---|
151 | if (llResult != llExpect) \
|
---|
152 | { \
|
---|
153 | bitchll(#operation, llResult, llExpect); \
|
---|
154 | cErrors++; \
|
---|
155 | } \
|
---|
156 | } while (0)
|
---|
157 |
|
---|
158 | long lResult;
|
---|
159 | long lExpect;
|
---|
160 | #define CHECKL(operation, expect) \
|
---|
161 | do { \
|
---|
162 | lExpect = expect; \
|
---|
163 | lResult = operation; \
|
---|
164 | if (lResult != lExpect) \
|
---|
165 | { \
|
---|
166 | bitchl(#operation, lResult, lExpect); \
|
---|
167 | cErrors++; \
|
---|
168 | } \
|
---|
169 | } while (0)
|
---|
170 |
|
---|
171 | CHECK(atan2l(1.0L, 1.0L), 0.785398163397448309603L);
|
---|
172 | CHECK(atan2l(2.3L, 3.3L), 0.608689307327411694890L);
|
---|
173 |
|
---|
174 | CHECK(ceill(1.9L), 2.0L);
|
---|
175 | CHECK(ceill(4.5L), 5.0L);
|
---|
176 | CHECK(ceill(3.3L), 4.0L);
|
---|
177 | CHECK(ceill(6.1L), 7.0L);
|
---|
178 |
|
---|
179 | CHECK(floorl(1.9L), 1.0L);
|
---|
180 | CHECK(floorl(4.5L), 4.0L);
|
---|
181 | CHECK(floorl(7.3L), 7.0L);
|
---|
182 | CHECK(floorl(1234.1L), 1234.0L);
|
---|
183 | CHECK(floor(1233.1), 1233.0);
|
---|
184 | CHECK(floor(1239.98989898), 1239.0);
|
---|
185 | CHECK(floorf(9999.999), 9999.0);
|
---|
186 |
|
---|
187 | CHECK(ldexpl(1.0L, 1), 2.0L);
|
---|
188 | CHECK(ldexpl(1.0L, 10), 1024.0L);
|
---|
189 | CHECK(ldexpl(2.25L, 10), 2304.0L);
|
---|
190 |
|
---|
191 | CHECKLL(llrintl(1.0L), 1);
|
---|
192 | CHECKLL(llrintl(1.3L), 1);
|
---|
193 | CHECKLL(llrintl(1.5L), 2);
|
---|
194 | CHECKLL(llrintl(1.9L), 2);
|
---|
195 | CHECKLL(llrintf(123.34), 123);
|
---|
196 | CHECKLL(llrintf(-123.50), -124);
|
---|
197 | CHECKLL(llrint(42.42), 42);
|
---|
198 | CHECKLL(llrint(-2147483648.12343), -2147483648LL);
|
---|
199 | #if !defined(RT_ARCH_AMD64)
|
---|
200 | CHECKLL(lrint(-21474836499.12343), -2147483648LL);
|
---|
201 | CHECKLL(lrint(-2147483649932412.12343), -2147483648LL);
|
---|
202 | #else
|
---|
203 | CHECKLL(lrint(-21474836499.12343), -21474836499L);
|
---|
204 | CHECKLL(lrint(-2147483649932412.12343), -2147483649932412L);
|
---|
205 | #endif
|
---|
206 |
|
---|
207 | // __asm__("int3");
|
---|
208 | CHECKL(lrintl(make_lrd_cw(000000000000000000ULL,000000,0x027f)), 0L);
|
---|
209 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x027f)), 0L);
|
---|
210 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x027f)), 0L);
|
---|
211 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x067f)), 0L);
|
---|
212 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x067f)), 0L);
|
---|
213 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x0a7f)), 1L);
|
---|
214 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x0a7f)), 1L);
|
---|
215 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x0e7f)), 0L);
|
---|
216 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x3ffe,0x0e7f)), 0L);
|
---|
217 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x027f)), 0L);
|
---|
218 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x027f)), 0L);
|
---|
219 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x067f)), -1L);
|
---|
220 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x067f)), -1L);
|
---|
221 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x0a7f)), 0L);
|
---|
222 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x0a7f)), 0L);
|
---|
223 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x0e7f)), 0L);
|
---|
224 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0xbffe,0x0e7f)), 0L);
|
---|
225 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x027f)), 0L);
|
---|
226 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x027f)), 0L);
|
---|
227 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x067f)), 0L);
|
---|
228 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x067f)), 0L);
|
---|
229 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x0a7f)), 1L);
|
---|
230 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x0a7f)), 1L);
|
---|
231 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x0e7f)), 0L);
|
---|
232 | CHECKL(lrintl(make_lrd_cw(0x9249249249249000ULL,0x3ffc,0x0e7f)), 0L);
|
---|
233 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x027f)), 0L);
|
---|
234 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x027f)), 0L);
|
---|
235 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x067f)), -1L);
|
---|
236 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x067f)), -1L);
|
---|
237 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x0a7f)), 0L);
|
---|
238 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x0a7f)), 0L);
|
---|
239 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x0e7f)), 0L);
|
---|
240 | CHECKL(lrintl(make_lrd_cw(0xe38e38e38e38e000ULL,0xbffb,0x0e7f)), 0L);
|
---|
241 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x027f)), 32768L);
|
---|
242 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x027f)), 32768L);
|
---|
243 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x067f)), 32768L);
|
---|
244 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x067f)), 32768L);
|
---|
245 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x0a7f)), 32768L);
|
---|
246 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x0a7f)), 32768L);
|
---|
247 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x0e7f)), 32768L);
|
---|
248 | CHECKL(lrintl(make_lrd_cw(0x8000000000000000ULL,0x400e,0x0e7f)), 32768L);
|
---|
249 | #if !defined(RT_ARCH_AMD64)
|
---|
250 | /* c90 says that the constant is 2147483648 (which is not representable as a signed 32-bit
|
---|
251 | * value). To that constant you've then applied the negation operation. c90 doesn't have
|
---|
252 | * negative constants, only positive ones that have been negated. */
|
---|
253 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x027f)), (long)(-2147483647L - 1));
|
---|
254 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x027f)), (long)(-2147483647L - 1));
|
---|
255 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x067f)), (long)(-2147483647L - 1));
|
---|
256 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x067f)), (long)(-2147483647L - 1));
|
---|
257 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x0a7f)), (long)(-2147483647L - 1));
|
---|
258 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x0a7f)), (long)(-2147483647L - 1));
|
---|
259 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x0e7f)), (long)(-2147483647L - 1));
|
---|
260 | CHECKL(lrintl(make_lrd_cw(0xad78ebc5ac620000ULL,0xc041,0x0e7f)), (long)(-2147483647L - 1));
|
---|
261 | #endif
|
---|
262 | set_cw(0x27f);
|
---|
263 |
|
---|
264 | CHECK(logl(2.7182818284590452353602874713526625L), 1.0);
|
---|
265 |
|
---|
266 | CHECK(remainderl(1.0L, 1.0L), 0.0);
|
---|
267 | CHECK(remainderl(1.0L, 1.5L), -0.5);
|
---|
268 | CHECK(remainderl(42.0L, 34.25L), 7.75);
|
---|
269 | CHECK(remainderf(43.0, 34.25), 8.75);
|
---|
270 | CHECK(remainder(44.25, 34.25), 10.00);
|
---|
271 | double rd1 = 44.25;
|
---|
272 | double rd2 = 34.25;
|
---|
273 | CHECK(remainder(rd1, rd2), 10.00);
|
---|
274 | CHECK(remainder(2.5, 2.0), 0.5);
|
---|
275 | CHECK(remainder(2.5, 2.0), 0.5);
|
---|
276 | CHECK(remainder(2.5, 2.0), 0.5);
|
---|
277 | CHECKLL(testremainder(), 1);
|
---|
278 |
|
---|
279 |
|
---|
280 | /* Only works in extended precision, while double precesion is defaul on BSD (including Darwin) */
|
---|
281 | set_cw(0x37f);
|
---|
282 | CHECK(rintl(1.0L), 1.0);
|
---|
283 | CHECK(rintl(1.4L), 1.0);
|
---|
284 | CHECK(rintl(1.3L), 1.0);
|
---|
285 | CHECK(rintl(0.9L), 1.0);
|
---|
286 | CHECK(rintl(3123.1232L), 3123.0);
|
---|
287 | CHECK(rint(3985.13454), 3985.0);
|
---|
288 | CHECK(rintf(9999.999), 10000.0);
|
---|
289 | set_cw(0x27f);
|
---|
290 |
|
---|
291 | CHECK(sinl(1.0L), 0.84147098480789650664L);
|
---|
292 | lrd = 180.0L;
|
---|
293 | CHECK(sinl(lrd), -0.801152635733830477871L);
|
---|
294 | #if 0
|
---|
295 | CHECK(sinl(180.0L), SIN180);
|
---|
296 | #else
|
---|
297 | lrdExpect = SIN180a;
|
---|
298 | lrdResult = sinl(180.0L);
|
---|
299 | if (lrdResult != lrdExpect)
|
---|
300 | {
|
---|
301 | lrdExpect = SIN180b;
|
---|
302 | if (lrdResult != lrdExpect)
|
---|
303 | {
|
---|
304 | bitch("sinl(180.0L)", &lrdResult, &lrdExpect);
|
---|
305 | cErrors++;
|
---|
306 | }
|
---|
307 | }
|
---|
308 | #endif
|
---|
309 | CHECKLL(testsin(), 1);
|
---|
310 |
|
---|
311 | CHECK(sqrtl(1.0L), 1.0);
|
---|
312 | CHECK(sqrtl(4.0L), 2.0);
|
---|
313 | CHECK(sqrtl(1525225.0L), 1235.0);
|
---|
314 |
|
---|
315 | CHECK(tanl(0.0L), 0.0);
|
---|
316 | CHECK(tanl(0.7853981633974483096156608458198757L), 1.0);
|
---|
317 |
|
---|
318 | CHECK(powl(0.0, 0.0), 1.0);
|
---|
319 | CHECK(powl(2.0, 2.0), 4.0);
|
---|
320 | CHECK(powl(3.0, 3.0), 27.0);
|
---|
321 |
|
---|
322 | return cErrors;
|
---|
323 | }
|
---|
324 |
|
---|
325 |
|
---|
326 | /////////////////////////////////////////////////////////////////////////////////////////
|
---|
327 | /////////////////////////////////////////////////////////////////////////////////////////
|
---|
328 | /////////////////////////////////////////////////////////////////////////////////////////
|
---|
329 | #if 0
|
---|
330 |
|
---|
/* Map the generic floatx_* names onto the floatx80_* names. */
#define floatx_to_int32                 floatx80_to_int32
#define floatx_to_int64                 floatx80_to_int64
#define floatx_to_int32_round_to_zero   floatx80_to_int32_round_to_zero
#define floatx_to_int64_round_to_zero   floatx80_to_int64_round_to_zero
#define floatx_abs                      floatx80_abs
#define floatx_chs                      floatx80_chs
/* The second argument is discarded; NULL is passed in its place. */
#define floatx_round_to_int(foo, bar)   floatx80_round_to_int(foo, NULL)
#define floatx_compare                  floatx80_compare
#define floatx_compare_quiet            floatx80_compare_quiet

/* Redirect the plain math function names to their long double variants. */
#undef  sin
#define sin     sinl
#undef  cos
#define cos     cosl
#undef  sqrt
#define sqrt    sqrtl
#undef  pow
#define pow     powl
#undef  log
#define log     logl
#undef  tan
#define tan     tanl
#undef  atan2
#define atan2   atan2l
#undef  floor
#define floor   floorl
#undef  ceil
#define ceil    ceill
#undef  ldexp
#define ldexp   ldexpl
|
---|
360 |
|
---|
361 |
|
---|
/* Floating point register value type. */
typedef long double CPU86_LDouble;

/* Overlay giving access to the raw bits of a long double: the first eight
   bytes as 'lower' and the following two bytes as 'upper'. */
typedef union CPU86_LDoubleU {
    long double d;
    struct {
        unsigned long long lower;
        unsigned short     upper;
    } l;
} CPU86_LDoubleU;
|
---|
371 |
|
---|
/*
 * The following deal with x86 long double-precision numbers.  'fp' is an
 * lvalue of a type with an 'l.upper' and an 'l.lower' member, such as
 * CPU86_LDoubleU.
 *
 * The argument and the whole expansion are parenthesised so that expressions
 * such as EXPD(*p) expand correctly.
 */
#define MAXEXPD             0x7fff
#define EXPBIAS             16383
#define EXPD(fp)            ((fp).l.upper & 0x7fff)
#define SIGND(fp)           ((fp).l.upper & 0x8000)
#define MANTD(fp)           ((fp).l.lower)
/* Replaces the low 15 bits of 'upper' with EXPBIAS, keeping the top bit. */
#define BIASEXPONENT(fp)    ((fp).l.upper = (unsigned short)(((fp).l.upper & ~(0x7fff)) | EXPBIAS))
|
---|
379 |
|
---|
380 | typedef long double floatx80;
|
---|
381 | #define STATUS_PARAM , void *pv
|
---|
382 |
|
---|
383 | static floatx80 floatx80_round_to_int( floatx80 a STATUS_PARAM)
|
---|
384 | {
|
---|
385 | return rintl(a);
|
---|
386 | }
|
---|
387 |
|
---|
388 |
|
---|
389 |
|
---|
390 | struct myenv
|
---|
391 | {
|
---|
392 | unsigned int fpstt; /* top of stack index */
|
---|
393 | unsigned int fpus;
|
---|
394 | unsigned int fpuc;
|
---|
395 | unsigned char fptags[8]; /* 0 = valid, 1 = empty */
|
---|
396 | union {
|
---|
397 | #ifdef USE_X86LDOUBLE
|
---|
398 | CPU86_LDouble d __attribute__((aligned(16)));
|
---|
399 | #else
|
---|
400 | CPU86_LDouble d;
|
---|
401 | #endif
|
---|
402 | } fpregs[8];
|
---|
403 |
|
---|
404 | } my_env, env_org, env_res, *env = &my_env;
|
---|
405 |
|
---|
406 |
|
---|
/* Register stack accessors: ST(n) is the n-th entry counted from the top, modulo 8. */
#define ST(n)   (env->fpregs[(env->fpstt + (n)) & 7].d)
#define ST0     (env->fpregs[env->fpstt].d)
#define ST1     ST(1)

/* Argument magnitude limit used by the trigonometric helpers (2**63). */
#define MAXTAN  9223372036854775808.0
|
---|
411 |
|
---|
412 |
|
---|
413 | static inline void fpush(void)
|
---|
414 | {
|
---|
415 | env->fpstt = (env->fpstt - 1) & 7;
|
---|
416 | env->fptags[env->fpstt] = 0; /* validate stack entry */
|
---|
417 | }
|
---|
418 |
|
---|
419 | static inline void fpop(void)
|
---|
420 | {
|
---|
421 | env->fptags[env->fpstt] = 1; /* invvalidate stack entry */
|
---|
422 | env->fpstt = (env->fpstt + 1) & 7;
|
---|
423 | }
|
---|
424 |
|
---|
425 | static void helper_f2xm1(void)
|
---|
426 | {
|
---|
427 | ST0 = pow(2.0,ST0) - 1.0;
|
---|
428 | }
|
---|
429 |
|
---|
430 | static void helper_fyl2x(void)
|
---|
431 | {
|
---|
432 | CPU86_LDouble fptemp;
|
---|
433 |
|
---|
434 | fptemp = ST0;
|
---|
435 | if (fptemp>0.0){
|
---|
436 | fptemp = log(fptemp)/log(2.0); /* log2(ST) */
|
---|
437 | ST1 *= fptemp;
|
---|
438 | fpop();
|
---|
439 | } else {
|
---|
440 | env->fpus &= (~0x4700);
|
---|
441 | env->fpus |= 0x400;
|
---|
442 | }
|
---|
443 | }
|
---|
444 |
|
---|
445 | static void helper_fptan(void)
|
---|
446 | {
|
---|
447 | CPU86_LDouble fptemp;
|
---|
448 |
|
---|
449 | fptemp = ST0;
|
---|
450 | if((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
|
---|
451 | env->fpus |= 0x400;
|
---|
452 | } else {
|
---|
453 | ST0 = tan(fptemp);
|
---|
454 | fpush();
|
---|
455 | ST0 = 1.0;
|
---|
456 | env->fpus &= (~0x400); /* C2 <-- 0 */
|
---|
457 | /* the above code is for |arg| < 2**52 only */
|
---|
458 | }
|
---|
459 | }
|
---|
460 |
|
---|
461 | static void helper_fpatan(void)
|
---|
462 | {
|
---|
463 | CPU86_LDouble fptemp, fpsrcop;
|
---|
464 |
|
---|
465 | fpsrcop = ST1;
|
---|
466 | fptemp = ST0;
|
---|
467 | ST1 = atan2(fpsrcop,fptemp);
|
---|
468 | fpop();
|
---|
469 | }
|
---|
470 |
|
---|
471 | static void helper_fxtract(void)
|
---|
472 | {
|
---|
473 | CPU86_LDoubleU temp;
|
---|
474 | unsigned int expdif;
|
---|
475 |
|
---|
476 | temp.d = ST0;
|
---|
477 | expdif = EXPD(temp) - EXPBIAS;
|
---|
478 | /*DP exponent bias*/
|
---|
479 | ST0 = expdif;
|
---|
480 | fpush();
|
---|
481 | BIASEXPONENT(temp);
|
---|
482 | ST0 = temp.d;
|
---|
483 | }
|
---|
484 |
|
---|
485 | static void helper_fprem1(void)
|
---|
486 | {
|
---|
487 | CPU86_LDouble dblq, fpsrcop, fptemp;
|
---|
488 | CPU86_LDoubleU fpsrcop1, fptemp1;
|
---|
489 | int expdif;
|
---|
490 | int q;
|
---|
491 |
|
---|
492 | fpsrcop = ST0;
|
---|
493 | fptemp = ST1;
|
---|
494 | fpsrcop1.d = fpsrcop;
|
---|
495 | fptemp1.d = fptemp;
|
---|
496 | expdif = EXPD(fpsrcop1) - EXPD(fptemp1);
|
---|
497 | if (expdif < 53) {
|
---|
498 | dblq = fpsrcop / fptemp;
|
---|
499 | dblq = (dblq < 0.0)? ceil(dblq): floor(dblq);
|
---|
500 | ST0 = fpsrcop - fptemp*dblq;
|
---|
501 | q = (int)dblq; /* cutting off top bits is assumed here */
|
---|
502 | env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
|
---|
503 | /* (C0,C1,C3) <-- (q2,q1,q0) */
|
---|
504 | env->fpus |= (q&0x4) << 6; /* (C0) <-- q2 */
|
---|
505 | env->fpus |= (q&0x2) << 8; /* (C1) <-- q1 */
|
---|
506 | env->fpus |= (q&0x1) << 14; /* (C3) <-- q0 */
|
---|
507 | } else {
|
---|
508 | env->fpus |= 0x400; /* C2 <-- 1 */
|
---|
509 | fptemp = pow(2.0, expdif-50);
|
---|
510 | fpsrcop = (ST0 / ST1) / fptemp;
|
---|
511 | /* fpsrcop = integer obtained by rounding to the nearest */
|
---|
512 | fpsrcop = (fpsrcop-floor(fpsrcop) < ceil(fpsrcop)-fpsrcop)?
|
---|
513 | floor(fpsrcop): ceil(fpsrcop);
|
---|
514 | ST0 -= (ST1 * fpsrcop * fptemp);
|
---|
515 | }
|
---|
516 | }
|
---|
517 |
|
---|
518 | static void helper_fprem(void)
|
---|
519 | {
|
---|
520 | #if 0
|
---|
521 | LogFlow(("helper_fprem: ST0=%.*Rhxs ST1=%.*Rhxs fpus=%#x\n", sizeof(ST0), &ST0, sizeof(ST1), &ST1, env->fpus));
|
---|
522 |
|
---|
523 | __asm__ __volatile__("fldt (%2)\n"
|
---|
524 | "fldt (%1)\n"
|
---|
525 | "fprem \n"
|
---|
526 | "fnstsw (%0)\n"
|
---|
527 | "fstpt (%1)\n"
|
---|
528 | "fstpt (%2)\n"
|
---|
529 | : : "r" (&env->fpus), "r" (&ST0), "r" (&ST1) : "memory");
|
---|
530 |
|
---|
531 | LogFlow(("helper_fprem: -> ST0=%.*Rhxs fpus=%#x c\n", sizeof(ST0), &ST0, env->fpus));
|
---|
532 | #else
|
---|
533 | CPU86_LDouble dblq, fpsrcop, fptemp;
|
---|
534 | CPU86_LDoubleU fpsrcop1, fptemp1;
|
---|
535 | int expdif;
|
---|
536 | int q;
|
---|
537 |
|
---|
538 | fpsrcop = ST0;
|
---|
539 | fptemp = ST1;
|
---|
540 | fpsrcop1.d = fpsrcop;
|
---|
541 | fptemp1.d = fptemp;
|
---|
542 |
|
---|
543 | expdif = EXPD(fpsrcop1) - EXPD(fptemp1);
|
---|
544 | if ( expdif < 53 ) {
|
---|
545 | dblq = fpsrcop / fptemp;
|
---|
546 | dblq = (dblq < 0.0)? ceil(dblq): floor(dblq);
|
---|
547 | ST0 = fpsrcop - fptemp*dblq;
|
---|
548 | q = (int)dblq; /* cutting off top bits is assumed here */
|
---|
549 | env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
|
---|
550 | /* (C0,C1,C3) <-- (q2,q1,q0) */
|
---|
551 | env->fpus |= (q&0x4) << 6; /* (C0) <-- q2 */
|
---|
552 | env->fpus |= (q&0x2) << 8; /* (C1) <-- q1 */
|
---|
553 | env->fpus |= (q&0x1) << 14; /* (C3) <-- q0 */
|
---|
554 | } else {
|
---|
555 | env->fpus |= 0x400; /* C2 <-- 1 */
|
---|
556 | fptemp = pow(2.0, expdif-50);
|
---|
557 | fpsrcop = (ST0 / ST1) / fptemp;
|
---|
558 | /* fpsrcop = integer obtained by chopping */
|
---|
559 | fpsrcop = (fpsrcop < 0.0)?
|
---|
560 | -(floor(fabs(fpsrcop))): floor(fpsrcop);
|
---|
561 | ST0 -= (ST1 * fpsrcop * fptemp);
|
---|
562 | }
|
---|
563 | #endif
|
---|
564 | }
|
---|
565 |
|
---|
566 | static void helper_fyl2xp1(void)
|
---|
567 | {
|
---|
568 | CPU86_LDouble fptemp;
|
---|
569 |
|
---|
570 | fptemp = ST0;
|
---|
571 | if ((fptemp+1.0)>0.0) {
|
---|
572 | fptemp = log(fptemp+1.0) / log(2.0); /* log2(ST+1.0) */
|
---|
573 | ST1 *= fptemp;
|
---|
574 | fpop();
|
---|
575 | } else {
|
---|
576 | env->fpus &= (~0x4700);
|
---|
577 | env->fpus |= 0x400;
|
---|
578 | }
|
---|
579 | }
|
---|
580 |
|
---|
581 | static void helper_fsqrt(void)
|
---|
582 | {
|
---|
583 | CPU86_LDouble fptemp;
|
---|
584 |
|
---|
585 | fptemp = ST0;
|
---|
586 | if (fptemp<0.0) {
|
---|
587 | env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
|
---|
588 | env->fpus |= 0x400;
|
---|
589 | }
|
---|
590 | ST0 = sqrt(fptemp);
|
---|
591 | }
|
---|
592 |
|
---|
593 | static void helper_fsincos(void)
|
---|
594 | {
|
---|
595 | CPU86_LDouble fptemp;
|
---|
596 |
|
---|
597 | fptemp = ST0;
|
---|
598 | if ((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
|
---|
599 | env->fpus |= 0x400;
|
---|
600 | } else {
|
---|
601 | ST0 = sin(fptemp);
|
---|
602 | fpush();
|
---|
603 | ST0 = cos(fptemp);
|
---|
604 | env->fpus &= (~0x400); /* C2 <-- 0 */
|
---|
605 | /* the above code is for |arg| < 2**63 only */
|
---|
606 | }
|
---|
607 | }
|
---|
608 |
|
---|
609 | static void helper_frndint(void)
|
---|
610 | {
|
---|
611 | ST0 = floatx_round_to_int(ST0, &env->fp_status);
|
---|
612 | }
|
---|
613 |
|
---|
614 | static void helper_fscale(void)
|
---|
615 | {
|
---|
616 | ST0 = ldexp (ST0, (int)(ST1));
|
---|
617 | }
|
---|
618 |
|
---|
619 | static void helper_fsin(void)
|
---|
620 | {
|
---|
621 | CPU86_LDouble fptemp;
|
---|
622 |
|
---|
623 | fptemp = ST0;
|
---|
624 | if ((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
|
---|
625 | env->fpus |= 0x400;
|
---|
626 | } else {
|
---|
627 | ST0 = sin(fptemp);
|
---|
628 | env->fpus &= (~0x400); /* C2 <-- 0 */
|
---|
629 | /* the above code is for |arg| < 2**53 only */
|
---|
630 | }
|
---|
631 | }
|
---|
632 |
|
---|
633 | static void helper_fcos(void)
|
---|
634 | {
|
---|
635 | CPU86_LDouble fptemp;
|
---|
636 |
|
---|
637 | fptemp = ST0;
|
---|
638 | if((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
|
---|
639 | env->fpus |= 0x400;
|
---|
640 | } else {
|
---|
641 | ST0 = cos(fptemp);
|
---|
642 | env->fpus &= (~0x400); /* C2 <-- 0 */
|
---|
643 | /* the above code is for |arg5 < 2**63 only */
|
---|
644 | }
|
---|
645 | }
|
---|
646 |
|
---|
647 | static void helper_fxam_ST0(void)
|
---|
648 | {
|
---|
649 | CPU86_LDoubleU temp;
|
---|
650 | int expdif;
|
---|
651 |
|
---|
652 | temp.d = ST0;
|
---|
653 |
|
---|
654 | env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
|
---|
655 | if (SIGND(temp))
|
---|
656 | env->fpus |= 0x200; /* C1 <-- 1 */
|
---|
657 |
|
---|
658 | /* XXX: test fptags too */
|
---|
659 | expdif = EXPD(temp);
|
---|
660 | if (expdif == MAXEXPD) {
|
---|
661 | #ifdef USE_X86LDOUBLE
|
---|
662 | if (MANTD(temp) == 0x8000000000000000ULL)
|
---|
663 | #else
|
---|
664 | if (MANTD(temp) == 0)
|
---|
665 | #endif
|
---|
666 | env->fpus |= 0x500 /*Infinity*/;
|
---|
667 | else
|
---|
668 | env->fpus |= 0x100 /*NaN*/;
|
---|
669 | } else if (expdif == 0) {
|
---|
670 | if (MANTD(temp) == 0)
|
---|
671 | env->fpus |= 0x4000 /*Zero*/;
|
---|
672 | else
|
---|
673 | env->fpus |= 0x4400 /*Denormal*/;
|
---|
674 | } else {
|
---|
675 | env->fpus |= 0x400;
|
---|
676 | }
|
---|
677 | }
|
---|
678 |
|
---|
679 |
|
---|
680 | void check_env(void)
|
---|
681 | {
|
---|
682 | int i;
|
---|
683 | for (i = 0; i < 8; i++)
|
---|
684 | {
|
---|
685 | CPU86_LDoubleU my, res;
|
---|
686 | my.d = env->fpregs[i].d;
|
---|
687 | res.d = env_res.fpregs[i].d;
|
---|
688 |
|
---|
689 | if ( my.l.lower != res.l.lower
|
---|
690 | || my.l.upper != res.l.upper)
|
---|
691 | printf("register %i: %#018llx:%#06x\n"
|
---|
692 | " expected %#018llx:%#06x\n",
|
---|
693 | i,
|
---|
694 | my.l.lower, my.l.upper,
|
---|
695 | res.l.lower, res.l.upper);
|
---|
696 | }
|
---|
697 | for (i = 0; i < 8; i++)
|
---|
698 | if (env->fptags[i] != env_res.fptags[i])
|
---|
699 | printf("tag %i: %d != %d\n", i, env->fptags[i], env_res.fptags[i]);
|
---|
700 | if (env->fpstt != env_res.fpstt)
|
---|
701 | printf("fpstt: %#06x != %#06x\n", env->fpstt, env_res.fpstt);
|
---|
702 | if (env->fpuc != env_res.fpuc)
|
---|
703 | printf("fpuc: %#06x != %#06x\n", env->fpuc, env_res.fpuc);
|
---|
704 | if (env->fpus != env_res.fpus)
|
---|
705 | printf("fpus: %#06x != %#06x\n", env->fpus, env_res.fpus);
|
---|
706 | }
|
---|
707 | #endif /* not used. */
|
---|
708 |
|
---|
709 | #if 0 /* insert this into helper.c */
|
---|
710 | /* FPU helpers */
|
---|
711 | CPU86_LDoubleU my_st[8];
|
---|
712 | unsigned int my_fpstt;
|
---|
713 | unsigned int my_fpus;
|
---|
714 | unsigned int my_fpuc;
|
---|
715 | unsigned char my_fptags[8];
|
---|
716 |
|
---|
717 | void hlp_fpu_enter(void)
|
---|
718 | {
|
---|
719 | int i;
|
---|
720 | for (i = 0; i < 8; i++)
|
---|
721 | my_st[i].d = env->fpregs[i].d;
|
---|
722 | my_fpstt = env->fpstt;
|
---|
723 | my_fpus = env->fpus;
|
---|
724 | my_fpuc = env->fpuc;
|
---|
725 | memcpy(&my_fptags, &env->fptags, sizeof(my_fptags));
|
---|
726 | }
|
---|
727 |
|
---|
728 | void hlp_fpu_leave(const char *psz)
|
---|
729 | {
|
---|
730 | int i;
|
---|
731 | Log(("/*code*/ \n"));
|
---|
732 | for (i = 0; i < 8; i++)
|
---|
733 | Log(("/*code*/ *(unsigned long long *)&env_org.fpregs[%d] = %#018llxULL; ((unsigned short *)&env_org.fpregs[%d])[4] = %#06x; env_org.fptags[%d]=%d;\n",
|
---|
734 | i, my_st[i].l.lower, i, my_st[i].l.upper, i, my_fptags[i]));
|
---|
735 | Log(("/*code*/ env_org.fpstt=%#x;\n", my_fpstt));
|
---|
736 | Log(("/*code*/ env_org.fpus=%#x;\n", my_fpus));
|
---|
737 | Log(("/*code*/ env_org.fpuc=%#x;\n", my_fpuc));
|
---|
738 | for (i = 0; i < 8; i++)
|
---|
739 | {
|
---|
740 | CPU86_LDoubleU u;
|
---|
741 | u.d = env->fpregs[i].d;
|
---|
742 | Log(("/*code*/ *(unsigned long long *)&env_res.fpregs[%d] = %#018llxULL; ((unsigned short *)&env_res.fpregs[%d])[4] = %#06x; env_res.fptags[%d]=%d;\n",
|
---|
743 | i, u.l.lower, i, u.l.upper, i, env->fptags[i]));
|
---|
744 | }
|
---|
745 | Log(("/*code*/ env_res.fpstt=%#x;\n", env->fpstt));
|
---|
746 | Log(("/*code*/ env_res.fpus=%#x;\n", env->fpus));
|
---|
747 | Log(("/*code*/ env_res.fpuc=%#x;\n", env->fpuc));
|
---|
748 |
|
---|
749 | Log(("/*code*/ my_env = env_org;\n"));
|
---|
750 | Log(("/*code*/ %s();\n", psz));
|
---|
751 | Log(("/*code*/ check_env();\n"));
|
---|
752 | }
|
---|
753 | #endif /* helper.c */
|
---|
754 |
|
---|
/**
 * Placeholder for generated test code; the include of the generated file is
 * compiled out, so this currently does nothing.
 */
extern void testmath2(void)
{
#if 0
#include "/tmp/code.h"
#endif
}
|
---|
761 |
|
---|
762 |
|
---|
763 | /////////////////////////////////////////////////////////////////////////////////////////
|
---|
764 | /////////////////////////////////////////////////////////////////////////////////////////
|
---|
765 | /////////////////////////////////////////////////////////////////////////////////////////
|
---|
766 |
|
---|
767 | #ifdef MATHTEST_STANDALONE
|
---|
768 |
|
---|
/**
 * Prints the results of basic arithmetic and of a selection of math library
 * calls for the given operands.
 *
 * @param   a   First operand.
 * @param   b   Second operand.
 */
void test_fops(double a, double b)
{
    const double rdSum  = a + b;
    const double rdDiff = a - b;
    const double rdProd = a * b;
    const double rdQuot = a / b;

    /* basic arithmetic */
    printf("a=%f b=%f a+b=%f\n", a, b, rdSum);
    printf("a=%f b=%f a-b=%f\n", a, b, rdDiff);
    printf("a=%f b=%f a*b=%f\n", a, b, rdProd);
    printf("a=%f b=%f a/b=%f\n", a, b, rdQuot);

    /* library functions */
    printf("a=%f b=%f fmod(a, b)=%f\n", a, b, (double)fmod(a, b));
    printf("a=%f sqrt(a)=%f\n", a, (double)sqrtl(a));
    printf("a=%f sin(a)=%f\n", a, (double)sinl(a));
    printf("a=%f cos(a)=%f\n", a, (double)cos(a));
    printf("a=%f tan(a)=%f\n", a, (double)tanl(a));
    printf("a=%f log(a)=%f\n", a, (double)log(a));
    printf("a=%f exp(a)=%f\n", a, (double)exp(a));
    printf("a=%f b=%f atan2(a, b)=%f\n", a, b, atan2(a, b));

    /* just to test some op combining */
    printf("a=%f asin(sinl(a))=%f\n", a, (double)asin(sinl(a)));
    printf("a=%f acos(cos(a))=%f\n", a, (double)acos(cos(a)));
    printf("a=%f atan(tanl(a))=%f\n", a, (double)atan(tanl(a)));
}
|
---|
788 |
|
---|
/**
 * Standalone entry point: runs the checks, prints some sample operations and
 * reports the error count.
 *
 * @returns The number of failed checks reported by testmath().
 */
int main(void)
{
    /* testmath() returns int; keeping that type makes the %d conversion
       below match its argument. */
    int cErrors = testmath();

    testmath2();
    test_fops(2, 3);
    test_fops(1.4, -5);

    printf("cErrors=%d\n", cErrors);
    return cErrors;
}
|
---|
800 | #endif
|
---|
801 |
|
---|