1 /* $NetBSD: timesoftfloat.c,v 1.1 2000/06/06 08:15:11 bjh21 Exp $ */ 2 3 /* 4 =============================================================================== 5 6 This C source file is part of the SoftFloat IEC/IEEE Floating-point 7 Arithmetic Package, Release 2a. 8 9 Written by John R. Hauser. This work was made possible in part by the 10 International Computer Science Institute, located at Suite 600, 1947 Center 11 Street, Berkeley, California 94704. Funding was partially provided by the 12 National Science Foundation under grant MIP-9311980. The original version 13 of this code was written as part of a project to build a fixed-point vector 14 processor in collaboration with the University of California at Berkeley, 15 overseen by Profs. Nelson Morgan and John Wawrzynek. More information 16 is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/ 17 arithmetic/SoftFloat.html'. 18 19 THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE. Although reasonable effort 20 has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT 21 TIMES RESULT IN INCORRECT BEHAVIOR. USE OF THIS SOFTWARE IS RESTRICTED TO 22 PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY 23 AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE. 24 25 Derivative works are acceptable, even for commercial purposes, so long as 26 (1) they include prominent notice that the work is derivative, and (2) they 27 include prominent notice akin to these four paragraphs for those parts of 28 this code that are retained. 29 30 =============================================================================== 31 */ 32 33 #include <sys/cdefs.h> 34 __FBSDID("$FreeBSD$"); 35 36 #include <stdlib.h> 37 #include <stdarg.h> 38 #include <string.h> 39 #include <stdio.h> 40 #include <time.h> 41 #include "milieu.h" 42 #include "softfloat.h" 43 44 enum { 45 minIterations = 1000 46 }; 47 48 static void fail( const char *message, ... ) 49 { 50 va_list varArgs; 51 52 fputs( "timesoftfloat: ", stderr ); 53 va_start( varArgs, message ); 54 vfprintf( stderr, message, varArgs ); 55 va_end( varArgs ); 56 fputs( ".\n", stderr ); 57 exit( EXIT_FAILURE ); 58 59 } 60 61 static char *functionName; 62 static char *roundingPrecisionName, *roundingModeName, *tininessModeName; 63 64 static void reportTime( int32 count, long clocks ) 65 { 66 67 printf( 68 "%8.1f kops/s: %s", 69 ( count / ( ( (float) clocks ) / CLOCKS_PER_SEC ) ) / 1000, 70 functionName 71 ); 72 if ( roundingModeName ) { 73 if ( roundingPrecisionName ) { 74 fputs( ", precision ", stdout ); 75 fputs( roundingPrecisionName, stdout ); 76 } 77 fputs( ", rounding ", stdout ); 78 fputs( roundingModeName, stdout ); 79 if ( tininessModeName ) { 80 fputs( ", tininess ", stdout ); 81 fputs( tininessModeName, stdout ); 82 fputs( " rounding", stdout ); 83 } 84 } 85 fputc( '\n', stdout ); 86 87 } 88 89 enum { 90 numInputs_int32 = 32 91 }; 92 93 static const int32 inputs_int32[ numInputs_int32 ] = { 94 0xFFFFBB79, 0x405CF80F, 0x00000000, 0xFFFFFD04, 95 0xFFF20002, 0x0C8EF795, 0xF00011FF, 0x000006CA, 96 0x00009BFE, 0xFF4862E3, 0x9FFFEFFE, 0xFFFFFFB7, 97 0x0BFF7FFF, 0x0000F37A, 0x0011DFFE, 0x00000006, 98 0xFFF02006, 0xFFFFF7D1, 0x10200003, 0xDE8DF765, 99 0x00003E02, 0x000019E8, 0x0008FFFE, 0xFFFFFB5C, 100 0xFFDF7FFE, 0x07C42FBF, 0x0FFFE3FF, 0x040B9F13, 101 0xBFFFFFF8, 0x0001BF56, 0x000017F6, 0x000A908A 102 }; 103 104 static void time_a_int32_z_float32( float32 function( int32 ) ) 105 { 106 clock_t startClock, endClock; 107 int32 count, i; 108 int8 inputNum; 109 110 count = 0; 111 inputNum = 0; 112 startClock = clock(); 113 do { 114 for ( i = minIterations; i; --i ) { 115 function( inputs_int32[ inputNum ] ); 116 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 117 } 118 count += minIterations; 119 } while ( clock() - startClock < CLOCKS_PER_SEC ); 120 inputNum = 0; 121 startClock = clock(); 122 for ( i = count; i; --i ) { 123 function( inputs_int32[ inputNum ] ); 124 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 125 } 126 endClock = clock(); 127 reportTime( count, endClock - startClock ); 128 129 } 130 131 static void time_a_int32_z_float64( float64 function( int32 ) ) 132 { 133 clock_t startClock, endClock; 134 int32 count, i; 135 int8 inputNum; 136 137 count = 0; 138 inputNum = 0; 139 startClock = clock(); 140 do { 141 for ( i = minIterations; i; --i ) { 142 function( inputs_int32[ inputNum ] ); 143 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 144 } 145 count += minIterations; 146 } while ( clock() - startClock < CLOCKS_PER_SEC ); 147 inputNum = 0; 148 startClock = clock(); 149 for ( i = count; i; --i ) { 150 function( inputs_int32[ inputNum ] ); 151 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 152 } 153 endClock = clock(); 154 reportTime( count, endClock - startClock ); 155 156 } 157 158 #ifdef FLOATX80 159 160 static void time_a_int32_z_floatx80( floatx80 function( int32 ) ) 161 { 162 clock_t startClock, endClock; 163 int32 count, i; 164 int8 inputNum; 165 166 count = 0; 167 inputNum = 0; 168 startClock = clock(); 169 do { 170 for ( i = minIterations; i; --i ) { 171 function( inputs_int32[ inputNum ] ); 172 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 173 } 174 count += minIterations; 175 } while ( clock() - startClock < CLOCKS_PER_SEC ); 176 inputNum = 0; 177 startClock = clock(); 178 for ( i = count; i; --i ) { 179 function( inputs_int32[ inputNum ] ); 180 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 181 } 182 endClock = clock(); 183 reportTime( count, endClock - startClock ); 184 185 } 186 187 #endif 188 189 #ifdef FLOAT128 190 191 static void time_a_int32_z_float128( float128 function( int32 ) ) 192 { 193 clock_t startClock, endClock; 194 int32 count, i; 195 int8 inputNum; 196 197 count = 0; 198 inputNum = 0; 199 startClock = clock(); 200 do { 201 for ( i = minIterations; i; --i ) { 202 function( inputs_int32[ inputNum ] ); 203 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 204 } 205 count += minIterations; 206 } while ( clock() - startClock < CLOCKS_PER_SEC ); 207 inputNum = 0; 208 startClock = clock(); 209 for ( i = count; i; --i ) { 210 function( inputs_int32[ inputNum ] ); 211 inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); 212 } 213 endClock = clock(); 214 reportTime( count, endClock - startClock ); 215 216 } 217 218 #endif 219 220 enum { 221 numInputs_int64 = 32 222 }; 223 224 static const int64 inputs_int64[ numInputs_int64 ] = { 225 LIT64( 0xFBFFC3FFFFFFFFFF ), 226 LIT64( 0x0000000003C589BC ), 227 LIT64( 0x00000000400013FE ), 228 LIT64( 0x0000000000186171 ), 229 LIT64( 0xFFFFFFFFFFFEFBFA ), 230 LIT64( 0xFFFFFD79E6DFFC73 ), 231 LIT64( 0x0000000010001DFF ), 232 LIT64( 0xDD1A0F0C78513710 ), 233 LIT64( 0xFFFF83FFFFFEFFFE ), 234 LIT64( 0x00756EBD1AD0C1C7 ), 235 LIT64( 0x0003FDFFFFFFFFBE ), 236 LIT64( 0x0007D0FB2C2CA951 ), 237 LIT64( 0x0007FC0007FFFFFE ), 238 LIT64( 0x0000001F942B18BB ), 239 LIT64( 0x0000080101FFFFFE ), 240 LIT64( 0xFFFFFFFFFFFF0978 ), 241 LIT64( 0x000000000008BFFF ), 242 LIT64( 0x0000000006F5AF08 ), 243 LIT64( 0xFFDEFF7FFFFFFFFE ), 244 LIT64( 0x0000000000000003 ), 245 LIT64( 0x3FFFFFFFFF80007D ), 246 LIT64( 0x0000000000000078 ), 247 LIT64( 0xFFF80000007FDFFD ), 248 LIT64( 0x1BBC775B78016AB0 ), 249 LIT64( 0xFFF9001FFFFFFFFE ), 250 LIT64( 0xFFFD4767AB98E43F ), 251 LIT64( 0xFFFFFEFFFE00001E ), 252 LIT64( 0xFFFFFFFFFFF04EFD ), 253 LIT64( 0x07FFFFFFFFFFF7FF ), 254 LIT64( 0xFFFC9EAA38F89050 ), 255 LIT64( 0x00000020FBFFFFFE ), 256 LIT64( 0x0000099AE6455357 ) 257 }; 258 259 static void time_a_int64_z_float32( float32 function( int64 ) ) 260 { 261 clock_t startClock, endClock; 262 int32 count, i; 263 int8 inputNum; 264 265 count = 0; 266 inputNum = 0; 267 startClock = clock(); 268 do { 269 for ( i = minIterations; i; --i ) { 270 function( inputs_int64[ inputNum ] ); 271 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 272 } 273 count += minIterations; 274 } while ( clock() - startClock < CLOCKS_PER_SEC ); 275 inputNum = 0; 276 startClock = clock(); 277 for ( i = count; i; --i ) { 278 function( inputs_int64[ inputNum ] ); 279 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 280 } 281 endClock = clock(); 282 reportTime( count, endClock - startClock ); 283 284 } 285 286 static void time_a_int64_z_float64( float64 function( int64 ) ) 287 { 288 clock_t startClock, endClock; 289 int32 count, i; 290 int8 inputNum; 291 292 count = 0; 293 inputNum = 0; 294 startClock = clock(); 295 do { 296 for ( i = minIterations; i; --i ) { 297 function( inputs_int64[ inputNum ] ); 298 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 299 } 300 count += minIterations; 301 } while ( clock() - startClock < CLOCKS_PER_SEC ); 302 inputNum = 0; 303 startClock = clock(); 304 for ( i = count; i; --i ) { 305 function( inputs_int64[ inputNum ] ); 306 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 307 } 308 endClock = clock(); 309 reportTime( count, endClock - startClock ); 310 311 } 312 313 #ifdef FLOATX80 314 315 static void time_a_int64_z_floatx80( floatx80 function( int64 ) ) 316 { 317 clock_t startClock, endClock; 318 int32 count, i; 319 int8 inputNum; 320 321 count = 0; 322 inputNum = 0; 323 startClock = clock(); 324 do { 325 for ( i = minIterations; i; --i ) { 326 function( inputs_int64[ inputNum ] ); 327 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 328 } 329 count += minIterations; 330 } while ( clock() - startClock < CLOCKS_PER_SEC ); 331 inputNum = 0; 332 startClock = clock(); 333 for ( i = count; i; --i ) { 334 function( inputs_int64[ inputNum ] ); 335 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 336 } 337 endClock = clock(); 338 reportTime( count, endClock - startClock ); 339 340 } 341 342 #endif 343 344 #ifdef FLOAT128 345 346 static void time_a_int64_z_float128( float128 function( int64 ) ) 347 { 348 clock_t startClock, endClock; 349 int32 count, i; 350 int8 inputNum; 351 352 count = 0; 353 inputNum = 0; 354 startClock = clock(); 355 do { 356 for ( i = minIterations; i; --i ) { 357 function( inputs_int64[ inputNum ] ); 358 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 359 } 360 count += minIterations; 361 } while ( clock() - startClock < CLOCKS_PER_SEC ); 362 inputNum = 0; 363 startClock = clock(); 364 for ( i = count; i; --i ) { 365 function( inputs_int64[ inputNum ] ); 366 inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); 367 } 368 endClock = clock(); 369 reportTime( count, endClock - startClock ); 370 371 } 372 373 #endif 374 375 enum { 376 numInputs_float32 = 32 377 }; 378 379 static const float32 inputs_float32[ numInputs_float32 ] = { 380 0x4EFA0000, 0xC1D0B328, 0x80000000, 0x3E69A31E, 381 0xAF803EFF, 0x3F800000, 0x17BF8000, 0xE74A301A, 382 0x4E010003, 0x7EE3C75D, 0xBD803FE0, 0xBFFEFF00, 383 0x7981F800, 0x431FFFFC, 0xC100C000, 0x3D87EFFF, 384 0x4103FEFE, 0xBC000007, 0xBF01F7FF, 0x4E6C6B5C, 385 0xC187FFFE, 0xC58B9F13, 0x4F88007F, 0xDF004007, 386 0xB7FFD7FE, 0x7E8001FB, 0x46EFFBFF, 0x31C10000, 387 0xDB428661, 0x33F89B1F, 0xA3BFEFFF, 0x537BFFBE 388 }; 389 390 static void time_a_float32_z_int32( int32 function( float32 ) ) 391 { 392 clock_t startClock, endClock; 393 int32 count, i; 394 int8 inputNum; 395 396 count = 0; 397 inputNum = 0; 398 startClock = clock(); 399 do { 400 for ( i = minIterations; i; --i ) { 401 function( inputs_float32[ inputNum ] ); 402 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 403 } 404 count += minIterations; 405 } while ( clock() - startClock < CLOCKS_PER_SEC ); 406 inputNum = 0; 407 startClock = clock(); 408 for ( i = count; i; --i ) { 409 function( inputs_float32[ inputNum ] ); 410 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 411 } 412 endClock = clock(); 413 reportTime( count, endClock - startClock ); 414 415 } 416 417 static void time_a_float32_z_int64( int64 function( float32 ) ) 418 { 419 clock_t startClock, endClock; 420 int32 count, i; 421 int8 inputNum; 422 423 count = 0; 424 inputNum = 0; 425 startClock = clock(); 426 do { 427 for ( i = minIterations; i; --i ) { 428 function( inputs_float32[ inputNum ] ); 429 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 430 } 431 count += minIterations; 432 } while ( clock() - startClock < CLOCKS_PER_SEC ); 433 inputNum = 0; 434 startClock = clock(); 435 for ( i = count; i; --i ) { 436 function( inputs_float32[ inputNum ] ); 437 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 438 } 439 endClock = clock(); 440 reportTime( count, endClock - startClock ); 441 442 } 443 444 static void time_a_float32_z_float64( float64 function( float32 ) ) 445 { 446 clock_t startClock, endClock; 447 int32 count, i; 448 int8 inputNum; 449 450 count = 0; 451 inputNum = 0; 452 startClock = clock(); 453 do { 454 for ( i = minIterations; i; --i ) { 455 function( inputs_float32[ inputNum ] ); 456 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 457 } 458 count += minIterations; 459 } while ( clock() - startClock < CLOCKS_PER_SEC ); 460 inputNum = 0; 461 startClock = clock(); 462 for ( i = count; i; --i ) { 463 function( inputs_float32[ inputNum ] ); 464 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 465 } 466 endClock = clock(); 467 reportTime( count, endClock - startClock ); 468 469 } 470 471 #ifdef FLOATX80 472 473 static void time_a_float32_z_floatx80( floatx80 function( float32 ) ) 474 { 475 clock_t startClock, endClock; 476 int32 count, i; 477 int8 inputNum; 478 479 count = 0; 480 inputNum = 0; 481 startClock = clock(); 482 do { 483 for ( i = minIterations; i; --i ) { 484 function( inputs_float32[ inputNum ] ); 485 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 486 } 487 count += minIterations; 488 } while ( clock() - startClock < CLOCKS_PER_SEC ); 489 inputNum = 0; 490 startClock = clock(); 491 for ( i = count; i; --i ) { 492 function( inputs_float32[ inputNum ] ); 493 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 494 } 495 endClock = clock(); 496 reportTime( count, endClock - startClock ); 497 498 } 499 500 #endif 501 502 #ifdef FLOAT128 503 504 static void time_a_float32_z_float128( float128 function( float32 ) ) 505 { 506 clock_t startClock, endClock; 507 int32 count, i; 508 int8 inputNum; 509 510 count = 0; 511 inputNum = 0; 512 startClock = clock(); 513 do { 514 for ( i = minIterations; i; --i ) { 515 function( inputs_float32[ inputNum ] ); 516 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 517 } 518 count += minIterations; 519 } while ( clock() - startClock < CLOCKS_PER_SEC ); 520 inputNum = 0; 521 startClock = clock(); 522 for ( i = count; i; --i ) { 523 function( inputs_float32[ inputNum ] ); 524 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 525 } 526 endClock = clock(); 527 reportTime( count, endClock - startClock ); 528 529 } 530 531 #endif 532 533 static void time_az_float32( float32 function( float32 ) ) 534 { 535 clock_t startClock, endClock; 536 int32 count, i; 537 int8 inputNum; 538 539 count = 0; 540 inputNum = 0; 541 startClock = clock(); 542 do { 543 for ( i = minIterations; i; --i ) { 544 function( inputs_float32[ inputNum ] ); 545 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 546 } 547 count += minIterations; 548 } while ( clock() - startClock < CLOCKS_PER_SEC ); 549 inputNum = 0; 550 startClock = clock(); 551 for ( i = count; i; --i ) { 552 function( inputs_float32[ inputNum ] ); 553 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 554 } 555 endClock = clock(); 556 reportTime( count, endClock - startClock ); 557 558 } 559 560 static void time_ab_float32_z_flag( flag function( float32, float32 ) ) 561 { 562 clock_t startClock, endClock; 563 int32 count, i; 564 int8 inputNumA, inputNumB; 565 566 count = 0; 567 inputNumA = 0; 568 inputNumB = 0; 569 startClock = clock(); 570 do { 571 for ( i = minIterations; i; --i ) { 572 function( 573 inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); 574 inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); 575 if ( inputNumA == 0 ) ++inputNumB; 576 inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 ); 577 } 578 count += minIterations; 579 } while ( clock() - startClock < CLOCKS_PER_SEC ); 580 inputNumA = 0; 581 inputNumB = 0; 582 startClock = clock(); 583 for ( i = count; i; --i ) { 584 function( 585 inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); 586 inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); 587 if ( inputNumA == 0 ) ++inputNumB; 588 inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 ); 589 } 590 endClock = clock(); 591 reportTime( count, endClock - startClock ); 592 593 } 594 595 static void time_abz_float32( float32 function( float32, float32 ) ) 596 { 597 clock_t startClock, endClock; 598 int32 count, i; 599 int8 inputNumA, inputNumB; 600 601 count = 0; 602 inputNumA = 0; 603 inputNumB = 0; 604 startClock = clock(); 605 do { 606 for ( i = minIterations; i; --i ) { 607 function( 608 inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); 609 inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); 610 if ( inputNumA == 0 ) ++inputNumB; 611 inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 ); 612 } 613 count += minIterations; 614 } while ( clock() - startClock < CLOCKS_PER_SEC ); 615 inputNumA = 0; 616 inputNumB = 0; 617 startClock = clock(); 618 for ( i = count; i; --i ) { 619 function( 620 inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); 621 inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); 622 if ( inputNumA == 0 ) ++inputNumB; 623 inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 ); 624 } 625 endClock = clock(); 626 reportTime( count, endClock - startClock ); 627 628 } 629 630 static const float32 inputs_float32_pos[ numInputs_float32 ] = { 631 0x4EFA0000, 0x41D0B328, 0x00000000, 0x3E69A31E, 632 0x2F803EFF, 0x3F800000, 0x17BF8000, 0x674A301A, 633 0x4E010003, 0x7EE3C75D, 0x3D803FE0, 0x3FFEFF00, 634 0x7981F800, 0x431FFFFC, 0x4100C000, 0x3D87EFFF, 635 0x4103FEFE, 0x3C000007, 0x3F01F7FF, 0x4E6C6B5C, 636 0x4187FFFE, 0x458B9F13, 0x4F88007F, 0x5F004007, 637 0x37FFD7FE, 0x7E8001FB, 0x46EFFBFF, 0x31C10000, 638 0x5B428661, 0x33F89B1F, 0x23BFEFFF, 0x537BFFBE 639 }; 640 641 static void time_az_float32_pos( float32 function( float32 ) ) 642 { 643 clock_t startClock, endClock; 644 int32 count, i; 645 int8 inputNum; 646 647 count = 0; 648 inputNum = 0; 649 startClock = clock(); 650 do { 651 for ( i = minIterations; i; --i ) { 652 function( inputs_float32_pos[ inputNum ] ); 653 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 654 } 655 count += minIterations; 656 } while ( clock() - startClock < CLOCKS_PER_SEC ); 657 inputNum = 0; 658 startClock = clock(); 659 for ( i = count; i; --i ) { 660 function( inputs_float32_pos[ inputNum ] ); 661 inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); 662 } 663 endClock = clock(); 664 reportTime( count, endClock - startClock ); 665 666 } 667 668 enum { 669 numInputs_float64 = 32 670 }; 671 672 static const float64 inputs_float64[ numInputs_float64 ] = { 673 LIT64( 0x422FFFC008000000 ), 674 LIT64( 0xB7E0000480000000 ), 675 LIT64( 0xF3FD2546120B7935 ), 676 LIT64( 0x3FF0000000000000 ), 677 LIT64( 0xCE07F766F09588D6 ), 678 LIT64( 0x8000000000000000 ), 679 LIT64( 0x3FCE000400000000 ), 680 LIT64( 0x8313B60F0032BED8 ), 681 LIT64( 0xC1EFFFFFC0002000 ), 682 LIT64( 0x3FB3C75D224F2B0F ), 683 LIT64( 0x7FD00000004000FF ), 684 LIT64( 0xA12FFF8000001FFF ), 685 LIT64( 0x3EE0000000FE0000 ), 686 LIT64( 0x0010000080000004 ), 687 LIT64( 0x41CFFFFE00000020 ), 688 LIT64( 0x40303FFFFFFFFFFD ), 689 LIT64( 0x3FD000003FEFFFFF ), 690 LIT64( 0xBFD0000010000000 ), 691 LIT64( 0xB7FC6B5C16CA55CF ), 692 LIT64( 0x413EEB940B9D1301 ), 693 LIT64( 0xC7E00200001FFFFF ), 694 LIT64( 0x47F00021FFFFFFFE ), 695 LIT64( 0xBFFFFFFFF80000FF ), 696 LIT64( 0xC07FFFFFE00FFFFF ), 697 LIT64( 0x001497A63740C5E8 ), 698 LIT64( 0xC4BFFFE0001FFFFF ), 699 LIT64( 0x96FFDFFEFFFFFFFF ), 700 LIT64( 0x403FC000000001FE ), 701 LIT64( 0xFFD00000000001F6 ), 702 LIT64( 0x0640400002000000 ), 703 LIT64( 0x479CEE1E4F789FE0 ), 704 LIT64( 0xC237FFFFFFFFFDFE ) 705 }; 706 707 static void time_a_float64_z_int32( int32 function( float64 ) ) 708 { 709 clock_t startClock, endClock; 710 int32 count, i; 711 int8 inputNum; 712 713 count = 0; 714 inputNum = 0; 715 startClock = clock(); 716 do { 717 for ( i = minIterations; i; --i ) { 718 function( inputs_float64[ inputNum ] ); 719 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 720 } 721 count += minIterations; 722 } while ( clock() - startClock < CLOCKS_PER_SEC ); 723 inputNum = 0; 724 startClock = clock(); 725 for ( i = count; i; --i ) { 726 function( inputs_float64[ inputNum ] ); 727 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 728 } 729 endClock = clock(); 730 reportTime( count, endClock - startClock ); 731 732 } 733 734 static void time_a_float64_z_int64( int64 function( float64 ) ) 735 { 736 clock_t startClock, endClock; 737 int32 count, i; 738 int8 inputNum; 739 740 count = 0; 741 inputNum = 0; 742 startClock = clock(); 743 do { 744 for ( i = minIterations; i; --i ) { 745 function( inputs_float64[ inputNum ] ); 746 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 747 } 748 count += minIterations; 749 } while ( clock() - startClock < CLOCKS_PER_SEC ); 750 inputNum = 0; 751 startClock = clock(); 752 for ( i = count; i; --i ) { 753 function( inputs_float64[ inputNum ] ); 754 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 755 } 756 endClock = clock(); 757 reportTime( count, endClock - startClock ); 758 759 } 760 761 static void time_a_float64_z_float32( float32 function( float64 ) ) 762 { 763 clock_t startClock, endClock; 764 int32 count, i; 765 int8 inputNum; 766 767 count = 0; 768 inputNum = 0; 769 startClock = clock(); 770 do { 771 for ( i = minIterations; i; --i ) { 772 function( inputs_float64[ inputNum ] ); 773 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 774 } 775 count += minIterations; 776 } while ( clock() - startClock < CLOCKS_PER_SEC ); 777 inputNum = 0; 778 startClock = clock(); 779 for ( i = count; i; --i ) { 780 function( inputs_float64[ inputNum ] ); 781 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 782 } 783 endClock = clock(); 784 reportTime( count, endClock - startClock ); 785 786 } 787 788 #ifdef FLOATX80 789 790 static void time_a_float64_z_floatx80( floatx80 function( float64 ) ) 791 { 792 clock_t startClock, endClock; 793 int32 count, i; 794 int8 inputNum; 795 796 count = 0; 797 inputNum = 0; 798 startClock = clock(); 799 do { 800 for ( i = minIterations; i; --i ) { 801 function( inputs_float64[ inputNum ] ); 802 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 803 } 804 count += minIterations; 805 } while ( clock() - startClock < CLOCKS_PER_SEC ); 806 inputNum = 0; 807 startClock = clock(); 808 for ( i = count; i; --i ) { 809 function( inputs_float64[ inputNum ] ); 810 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 811 } 812 endClock = clock(); 813 reportTime( count, endClock - startClock ); 814 815 } 816 817 #endif 818 819 #ifdef FLOAT128 820 821 static void time_a_float64_z_float128( float128 function( float64 ) ) 822 { 823 clock_t startClock, endClock; 824 int32 count, i; 825 int8 inputNum; 826 827 count = 0; 828 inputNum = 0; 829 startClock = clock(); 830 do { 831 for ( i = minIterations; i; --i ) { 832 function( inputs_float64[ inputNum ] ); 833 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 834 } 835 count += minIterations; 836 } while ( clock() - startClock < CLOCKS_PER_SEC ); 837 inputNum = 0; 838 startClock = clock(); 839 for ( i = count; i; --i ) { 840 function( inputs_float64[ inputNum ] ); 841 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 842 } 843 endClock = clock(); 844 reportTime( count, endClock - startClock ); 845 846 } 847 848 #endif 849 850 static void time_az_float64( float64 function( float64 ) ) 851 { 852 clock_t startClock, endClock; 853 int32 count, i; 854 int8 inputNum; 855 856 count = 0; 857 inputNum = 0; 858 startClock = clock(); 859 do { 860 for ( i = minIterations; i; --i ) { 861 function( inputs_float64[ inputNum ] ); 862 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 863 } 864 count += minIterations; 865 } while ( clock() - startClock < CLOCKS_PER_SEC ); 866 inputNum = 0; 867 startClock = clock(); 868 for ( i = count; i; --i ) { 869 function( inputs_float64[ inputNum ] ); 870 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 871 } 872 endClock = clock(); 873 reportTime( count, endClock - startClock ); 874 875 } 876 877 static void time_ab_float64_z_flag( flag function( float64, float64 ) ) 878 { 879 clock_t startClock, endClock; 880 int32 count, i; 881 int8 inputNumA, inputNumB; 882 883 count = 0; 884 inputNumA = 0; 885 inputNumB = 0; 886 startClock = clock(); 887 do { 888 for ( i = minIterations; i; --i ) { 889 function( 890 inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); 891 inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 1 ); 892 if ( inputNumA == 0 ) ++inputNumB; 893 inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); 894 } 895 count += minIterations; 896 } while ( clock() - startClock < CLOCKS_PER_SEC ); 897 inputNumA = 0; 898 inputNumB = 0; 899 startClock = clock(); 900 for ( i = count; i; --i ) { 901 function( 902 inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); 903 inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 1 ); 904 if ( inputNumA == 0 ) ++inputNumB; 905 inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); 906 } 907 endClock = clock(); 908 reportTime( count, endClock - startClock ); 909 910 } 911 912 static void time_abz_float64( float64 function( float64, float64 ) ) 913 { 914 clock_t startClock, endClock; 915 int32 count, i; 916 int8 inputNumA, inputNumB; 917 918 count = 0; 919 inputNumA = 0; 920 inputNumB = 0; 921 startClock = clock(); 922 do { 923 for ( i = minIterations; i; --i ) { 924 function( 925 inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); 926 inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 1 ); 927 if ( inputNumA == 0 ) ++inputNumB; 928 inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); 929 } 930 count += minIterations; 931 } while ( clock() - startClock < CLOCKS_PER_SEC ); 932 inputNumA = 0; 933 inputNumB = 0; 934 startClock = clock(); 935 for ( i = count; i; --i ) { 936 function( 937 inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); 938 inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 1 ); 939 if ( inputNumA == 0 ) ++inputNumB; 940 inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); 941 } 942 endClock = clock(); 943 reportTime( count, endClock - startClock ); 944 945 } 946 947 static const float64 inputs_float64_pos[ numInputs_float64 ] = { 948 LIT64( 0x422FFFC008000000 ), 949 LIT64( 0x37E0000480000000 ), 950 LIT64( 0x73FD2546120B7935 ), 951 LIT64( 0x3FF0000000000000 ), 952 LIT64( 0x4E07F766F09588D6 ), 953 LIT64( 0x0000000000000000 ), 954 LIT64( 0x3FCE000400000000 ), 955 LIT64( 0x0313B60F0032BED8 ), 956 LIT64( 0x41EFFFFFC0002000 ), 957 LIT64( 0x3FB3C75D224F2B0F ), 958 LIT64( 0x7FD00000004000FF ), 959 LIT64( 0x212FFF8000001FFF ), 960 LIT64( 0x3EE0000000FE0000 ), 961 LIT64( 0x0010000080000004 ), 962 LIT64( 0x41CFFFFE00000020 ), 963 LIT64( 0x40303FFFFFFFFFFD ), 964 LIT64( 0x3FD000003FEFFFFF ), 965 LIT64( 0x3FD0000010000000 ), 966 LIT64( 0x37FC6B5C16CA55CF ), 967 LIT64( 0x413EEB940B9D1301 ), 968 LIT64( 0x47E00200001FFFFF ), 969 LIT64( 0x47F00021FFFFFFFE ), 970 LIT64( 0x3FFFFFFFF80000FF ), 971 LIT64( 0x407FFFFFE00FFFFF ), 972 LIT64( 0x001497A63740C5E8 ), 973 LIT64( 0x44BFFFE0001FFFFF ), 974 LIT64( 0x16FFDFFEFFFFFFFF ), 975 LIT64( 0x403FC000000001FE ), 976 LIT64( 0x7FD00000000001F6 ), 977 LIT64( 0x0640400002000000 ), 978 LIT64( 0x479CEE1E4F789FE0 ), 979 LIT64( 0x4237FFFFFFFFFDFE ) 980 }; 981 982 static void time_az_float64_pos( float64 function( float64 ) ) 983 { 984 clock_t startClock, endClock; 985 int32 count, i; 986 int8 inputNum; 987 988 count = 0; 989 inputNum = 0; 990 startClock = clock(); 991 do { 992 for ( i = minIterations; i; --i ) { 993 function( inputs_float64_pos[ inputNum ] ); 994 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 995 } 996 count += minIterations; 997 } while ( clock() - startClock < CLOCKS_PER_SEC ); 998 inputNum = 0; 999 startClock = clock(); 1000 for ( i = count; i; --i ) { 1001 function( inputs_float64_pos[ inputNum ] ); 1002 inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); 1003 } 1004 endClock = clock(); 1005 reportTime( count, endClock - startClock ); 1006 1007 } 1008 1009 #ifdef FLOATX80 1010 1011 enum { 1012 numInputs_floatx80 = 32 1013 }; 1014 1015 static const struct { 1016 bits16 high; 1017 bits64 low; 1018 } inputs_floatx80[ numInputs_floatx80 ] = { 1019 { 0xC03F, LIT64( 0xA9BE15A19C1E8B62 ) }, 1020 { 0x8000, LIT64( 0x0000000000000000 ) }, 1021 { 0x75A8, LIT64( 0xE59591E4788957A5 ) }, 1022 { 0xBFFF, LIT64( 0xFFF0000000000040 ) }, 1023 { 0x0CD8, LIT64( 0xFC000000000007FE ) }, 1024 { 0x43BA, LIT64( 0x99A4000000000000 ) }, 1025 { 0x3FFF, LIT64( 0x8000000000000000 ) }, 1026 { 0x4081, LIT64( 0x94FBF1BCEB5545F0 ) }, 1027 { 0x403E, LIT64( 0xFFF0000000002000 ) }, 1028 { 0x3FFE, LIT64( 0xC860E3C75D224F28 ) }, 1029 { 0x407E, LIT64( 0xFC00000FFFFFFFFE ) }, 1030 { 0x737A, LIT64( 0x800000007FFDFFFE ) }, 1031 { 0x4044, LIT64( 0xFFFFFF80000FFFFF ) }, 1032 { 0xBBFE, LIT64( 0x8000040000001FFE ) }, 1033 { 0xC002, LIT64( 0xFF80000000000020 ) }, 1034 { 0xDE8D, LIT64( 0xFFFFFFFFFFE00004 ) }, 1035 { 0xC004, LIT64( 0x8000000000003FFB ) }, 1036 { 0x407F, LIT64( 0x800000000003FFFE ) }, 1037 { 0xC000, LIT64( 0xA459EE6A5C16CA55 ) }, 1038 { 0x8003, LIT64( 0xC42CBF7399AEEB94 ) }, 1039 { 0xBF7F, LIT64( 0xF800000000000006 ) }, 1040 { 0xC07F, LIT64( 0xBF56BE8871F28FEA ) }, 1041 { 0xC07E, LIT64( 0xFFFF77FFFFFFFFFE ) }, 1042 { 0xADC9, LIT64( 0x8000000FFFFFFFDE ) }, 1043 { 0xC001, LIT64( 0xEFF7FFFFFFFFFFFF ) }, 1044 { 0x4001, LIT64( 0xBE84F30125C497A6 ) }, 1045 { 0xC06B, LIT64( 0xEFFFFFFFFFFFFFFF ) }, 1046 { 0x4080, LIT64( 0xFFFFFFFFBFFFFFFF ) }, 1047 { 0x87E9, LIT64( 0x81FFFFFFFFFFFBFF ) }, 1048 { 0xA63F, LIT64( 0x801FFFFFFEFFFFFE ) }, 1049 { 0x403C, LIT64( 0x801FFFFFFFF7FFFF ) }, 1050 { 0x4018, LIT64( 0x8000000000080003 ) } 1051 }; 1052 1053 static void time_a_floatx80_z_int32( int32 function( floatx80 ) ) 1054 { 1055 clock_t startClock, endClock; 1056 int32 count, i; 1057 int8 inputNum; 1058 floatx80 a; 1059 1060 count = 0; 1061 inputNum = 0; 1062 startClock = clock(); 1063 do { 1064 for ( i = minIterations; i; --i ) { 1065 a.low = inputs_floatx80[ inputNum ].low; 1066 a.high = inputs_floatx80[ inputNum ].high; 1067 function( a ); 1068 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1069 } 1070 count += minIterations; 1071 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1072 inputNum = 0; 1073 startClock = clock(); 1074 for ( i = count; i; --i ) { 1075 a.low = inputs_floatx80[ inputNum ].low; 1076 a.high = inputs_floatx80[ inputNum ].high; 1077 function( a ); 1078 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1079 } 1080 endClock = clock(); 1081 reportTime( count, endClock - startClock ); 1082 1083 } 1084 1085 static void time_a_floatx80_z_int64( int64 function( floatx80 ) ) 1086 { 1087 clock_t startClock, endClock; 1088 int32 count, i; 1089 int8 inputNum; 1090 floatx80 a; 1091 1092 count = 0; 1093 inputNum = 0; 1094 startClock = clock(); 1095 do { 1096 for ( i = minIterations; i; --i ) { 1097 a.low = inputs_floatx80[ inputNum ].low; 1098 a.high = inputs_floatx80[ inputNum ].high; 1099 function( a ); 1100 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1101 } 1102 count += minIterations; 1103 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1104 inputNum = 0; 1105 startClock = clock(); 1106 for ( i = count; i; --i ) { 1107 a.low = inputs_floatx80[ inputNum ].low; 1108 a.high = inputs_floatx80[ inputNum ].high; 1109 function( a ); 1110 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1111 } 1112 endClock = clock(); 1113 reportTime( count, endClock - startClock ); 1114 1115 } 1116 1117 static void time_a_floatx80_z_float32( float32 function( floatx80 ) ) 1118 { 1119 clock_t startClock, endClock; 1120 int32 count, i; 1121 int8 inputNum; 1122 floatx80 a; 1123 1124 count = 0; 1125 inputNum = 0; 1126 startClock = clock(); 1127 do { 1128 for ( i = minIterations; i; --i ) { 1129 a.low = inputs_floatx80[ inputNum ].low; 1130 a.high = inputs_floatx80[ inputNum ].high; 1131 function( a ); 1132 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1133 } 1134 count += minIterations; 1135 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1136 inputNum = 0; 1137 startClock = clock(); 1138 for ( i = count; i; --i ) { 1139 a.low = inputs_floatx80[ inputNum ].low; 1140 a.high = inputs_floatx80[ inputNum ].high; 1141 function( a ); 1142 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1143 } 1144 endClock = clock(); 1145 reportTime( count, endClock - startClock ); 1146 1147 } 1148 1149 static void time_a_floatx80_z_float64( float64 function( floatx80 ) ) 1150 { 1151 clock_t startClock, endClock; 1152 int32 count, i; 1153 int8 inputNum; 1154 floatx80 a; 1155 1156 count = 0; 1157 inputNum = 0; 1158 startClock = clock(); 1159 do { 1160 for ( i = minIterations; i; --i ) { 1161 a.low = inputs_floatx80[ inputNum ].low; 1162 a.high = inputs_floatx80[ inputNum ].high; 1163 function( a ); 1164 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1165 } 1166 count += minIterations; 1167 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1168 inputNum = 0; 1169 startClock = clock(); 1170 for ( i = count; i; --i ) { 1171 a.low = inputs_floatx80[ inputNum ].low; 1172 a.high = inputs_floatx80[ inputNum ].high; 1173 function( a ); 1174 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1175 } 1176 endClock = clock(); 1177 reportTime( count, endClock - startClock ); 1178 1179 } 1180 1181 #ifdef FLOAT128 1182 1183 static void time_a_floatx80_z_float128( float128 function( floatx80 ) ) 1184 { 1185 clock_t startClock, endClock; 1186 int32 count, i; 1187 int8 inputNum; 1188 floatx80 a; 1189 1190 count = 0; 1191 inputNum = 0; 1192 startClock = clock(); 1193 do { 1194 for ( i = minIterations; i; --i ) { 1195 a.low = inputs_floatx80[ inputNum ].low; 1196 a.high = inputs_floatx80[ inputNum ].high; 1197 function( a ); 1198 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1199 } 1200 count += minIterations; 1201 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1202 inputNum = 0; 1203 startClock = clock(); 1204 for ( i = count; i; --i ) { 1205 a.low = inputs_floatx80[ inputNum ].low; 1206 a.high = inputs_floatx80[ inputNum ].high; 1207 function( a ); 1208 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1209 } 1210 endClock = clock(); 1211 reportTime( count, endClock - startClock ); 1212 1213 } 1214 1215 #endif 1216 1217 static void time_az_floatx80( floatx80 function( floatx80 ) ) 1218 { 1219 clock_t startClock, endClock; 1220 int32 count, i; 1221 int8 inputNum; 1222 floatx80 a; 1223 1224 count = 0; 1225 inputNum = 0; 1226 startClock = clock(); 1227 do { 1228 for ( i = minIterations; i; --i ) { 1229 a.low = inputs_floatx80[ inputNum ].low; 1230 a.high = inputs_floatx80[ inputNum ].high; 1231 function( a ); 1232 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1233 } 1234 count += minIterations; 1235 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1236 inputNum = 0; 1237 startClock = clock(); 1238 for ( i = count; i; --i ) { 1239 a.low = inputs_floatx80[ inputNum ].low; 1240 a.high = inputs_floatx80[ inputNum ].high; 1241 function( a ); 1242 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1243 } 1244 endClock = clock(); 1245 reportTime( count, endClock - startClock ); 1246 1247 } 1248 1249 static void time_ab_floatx80_z_flag( flag function( floatx80, floatx80 ) ) 1250 { 1251 clock_t startClock, endClock; 1252 int32 count, i; 1253 int8 inputNumA, inputNumB; 1254 floatx80 a, b; 1255 1256 count = 0; 1257 inputNumA = 0; 1258 inputNumB = 0; 1259 startClock = clock(); 1260 do { 1261 for ( i = minIterations; i; --i ) { 1262 a.low = inputs_floatx80[ inputNumA ].low; 1263 a.high = inputs_floatx80[ inputNumA ].high; 1264 b.low = inputs_floatx80[ inputNumB ].low; 1265 b.high = inputs_floatx80[ inputNumB ].high; 1266 function( a, b ); 1267 inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); 1268 if ( inputNumA == 0 ) ++inputNumB; 1269 inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); 1270 } 1271 count += minIterations; 1272 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1273 inputNumA = 0; 1274 inputNumB = 0; 1275 startClock = clock(); 1276 for ( i = count; i; --i ) { 1277 a.low = inputs_floatx80[ inputNumA ].low; 1278 a.high = inputs_floatx80[ inputNumA ].high; 1279 b.low = inputs_floatx80[ inputNumB ].low; 1280 b.high = inputs_floatx80[ inputNumB ].high; 1281 function( a, b ); 1282 inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); 1283 if ( inputNumA == 0 ) ++inputNumB; 1284 inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); 1285 } 1286 endClock = clock(); 1287 reportTime( count, endClock - startClock ); 1288 1289 } 1290 1291 static void time_abz_floatx80( floatx80 function( floatx80, floatx80 ) ) 1292 { 1293 clock_t startClock, endClock; 1294 int32 count, i; 1295 int8 inputNumA, inputNumB; 1296 floatx80 a, b; 1297 1298 count = 0; 1299 inputNumA = 0; 1300 inputNumB = 0; 1301 startClock = clock(); 1302 do { 1303 for ( i = minIterations; i; --i ) { 1304 a.low = inputs_floatx80[ inputNumA ].low; 1305 a.high = inputs_floatx80[ inputNumA ].high; 1306 b.low = inputs_floatx80[ inputNumB ].low; 1307 b.high = inputs_floatx80[ inputNumB ].high; 1308 function( a, b ); 1309 inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); 1310 if ( inputNumA == 0 ) ++inputNumB; 1311 inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); 1312 } 1313 count += minIterations; 1314 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1315 inputNumA = 0; 1316 inputNumB = 0; 1317 startClock = clock(); 1318 for ( i = count; i; --i ) { 1319 a.low = inputs_floatx80[ inputNumA ].low; 1320 a.high = inputs_floatx80[ inputNumA ].high; 1321 b.low = inputs_floatx80[ inputNumB ].low; 1322 b.high = inputs_floatx80[ inputNumB ].high; 1323 function( a, b ); 1324 inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); 1325 if ( inputNumA == 0 ) ++inputNumB; 1326 inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); 1327 } 1328 endClock = clock(); 1329 reportTime( count, endClock - startClock ); 1330 1331 } 1332 1333 static const struct { 1334 bits16 high; 1335 bits64 low; 1336 } inputs_floatx80_pos[ numInputs_floatx80 ] = { 1337 { 0x403F, LIT64( 0xA9BE15A19C1E8B62 ) }, 1338 { 0x0000, LIT64( 0x0000000000000000 ) }, 1339 { 0x75A8, LIT64( 0xE59591E4788957A5 ) }, 1340 { 0x3FFF, LIT64( 0xFFF0000000000040 ) }, 1341 { 0x0CD8, LIT64( 0xFC000000000007FE ) }, 1342 { 0x43BA, LIT64( 0x99A4000000000000 ) }, 1343 { 0x3FFF, LIT64( 0x8000000000000000 ) }, 1344 { 0x4081, LIT64( 0x94FBF1BCEB5545F0 ) }, 1345 { 0x403E, LIT64( 0xFFF0000000002000 ) }, 1346 { 0x3FFE, LIT64( 0xC860E3C75D224F28 ) }, 1347 { 0x407E, LIT64( 0xFC00000FFFFFFFFE ) }, 1348 { 0x737A, LIT64( 0x800000007FFDFFFE ) }, 1349 { 0x4044, LIT64( 0xFFFFFF80000FFFFF ) }, 1350 { 0x3BFE, LIT64( 0x8000040000001FFE ) }, 1351 { 0x4002, LIT64( 0xFF80000000000020 ) }, 1352 { 0x5E8D, LIT64( 0xFFFFFFFFFFE00004 ) }, 1353 { 0x4004, LIT64( 0x8000000000003FFB ) }, 1354 { 0x407F, LIT64( 0x800000000003FFFE ) }, 1355 { 0x4000, LIT64( 0xA459EE6A5C16CA55 ) }, 1356 { 0x0003, LIT64( 0xC42CBF7399AEEB94 ) }, 1357 { 0x3F7F, LIT64( 0xF800000000000006 ) }, 1358 { 0x407F, LIT64( 0xBF56BE8871F28FEA ) }, 1359 { 0x407E, LIT64( 0xFFFF77FFFFFFFFFE ) }, 1360 { 0x2DC9, LIT64( 0x8000000FFFFFFFDE ) }, 1361 { 0x4001, LIT64( 0xEFF7FFFFFFFFFFFF ) }, 1362 { 0x4001, LIT64( 0xBE84F30125C497A6 ) }, 1363 { 0x406B, LIT64( 0xEFFFFFFFFFFFFFFF ) }, 1364 { 0x4080, LIT64( 0xFFFFFFFFBFFFFFFF ) }, 1365 { 0x07E9, LIT64( 0x81FFFFFFFFFFFBFF ) }, 1366 { 0x263F, LIT64( 0x801FFFFFFEFFFFFE ) }, 1367 { 0x403C, LIT64( 0x801FFFFFFFF7FFFF ) }, 1368 { 0x4018, LIT64( 0x8000000000080003 ) } 1369 }; 1370 1371 static void time_az_floatx80_pos( floatx80 function( floatx80 ) ) 1372 { 1373 clock_t startClock, endClock; 1374 int32 count, i; 1375 int8 inputNum; 1376 floatx80 a; 1377 1378 count = 0; 1379 inputNum = 0; 1380 startClock = clock(); 1381 do { 1382 for ( i = minIterations; i; --i ) { 1383 a.low = inputs_floatx80_pos[ inputNum ].low; 1384 a.high = inputs_floatx80_pos[ inputNum ].high; 1385 function( a ); 1386 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1387 } 1388 count += minIterations; 1389 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1390 inputNum = 0; 1391 startClock = clock(); 1392 for ( i = count; i; --i ) { 1393 a.low = inputs_floatx80_pos[ inputNum ].low; 1394 a.high = inputs_floatx80_pos[ inputNum ].high; 1395 function( a ); 1396 inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); 1397 } 1398 endClock = clock(); 1399 reportTime( count, endClock - startClock ); 1400 1401 } 1402 1403 #endif 1404 1405 #ifdef FLOAT128 1406 1407 enum { 1408 numInputs_float128 = 32 1409 }; 1410 1411 static const struct { 1412 bits64 high, low; 1413 } inputs_float128[ numInputs_float128 ] = { 1414 { LIT64( 0x3FDA200000100000 ), LIT64( 0x0000000000000000 ) }, 1415 { LIT64( 0x3FFF000000000000 ), LIT64( 0x0000000000000000 ) }, 1416 { LIT64( 0x85F14776190C8306 ), LIT64( 0xD8715F4E3D54BB92 ) }, 1417 { LIT64( 0xF2B00000007FFFFF ), LIT64( 0xFFFFFFFFFFF7FFFF ) }, 1418 { LIT64( 0x8000000000000000 ), LIT64( 0x0000000000000000 ) }, 1419 { LIT64( 0xBFFFFFFFFFE00000 ), LIT64( 0x0000008000000000 ) }, 1420 { LIT64( 0x407F1719CE722F3E ), LIT64( 0xDA6B3FE5FF29425B ) }, 1421 { LIT64( 0x43FFFF8000000000 ), LIT64( 0x0000000000400000 ) }, 1422 { LIT64( 0x401E000000000100 ), LIT64( 0x0000000000002000 ) }, 1423 { LIT64( 0x3FFED71DACDA8E47 ), LIT64( 0x4860E3C75D224F28 ) }, 1424 { LIT64( 0xBF7ECFC1E90647D1 ), LIT64( 0x7A124FE55623EE44 ) }, 1425 { LIT64( 0x0DF7007FFFFFFFFF ), LIT64( 0xFFFFFFFFEFFFFFFF ) }, 1426 { LIT64( 0x3FE5FFEFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFEFFF ) }, 1427 { LIT64( 0x403FFFFFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFFBFE ) }, 1428 { LIT64( 0xBFFB2FBF7399AFEB ), LIT64( 0xA459EE6A5C16CA55 ) }, 1429 { LIT64( 0xBDB8FFFFFFFFFFFC ), LIT64( 0x0000000000000400 ) }, 1430 { LIT64( 0x3FC8FFDFFFFFFFFF ), LIT64( 0xFFFFFFFFF0000000 ) }, 1431 { LIT64( 0x3FFBFFFFFFDFFFFF ), LIT64( 0xFFF8000000000000 ) }, 1432 { LIT64( 0x407043C11737BE84 ), LIT64( 0xDDD58212ADC937F4 ) }, 1433 { LIT64( 0x8001000000000000 ), LIT64( 0x0000001000000001 ) }, 1434 { LIT64( 0xC036FFFFFFFFFFFF ), LIT64( 0xFE40000000000000 ) }, 1435 { LIT64( 0x4002FFFFFE000002 ), LIT64( 0x0000000000000000 ) }, 1436 { LIT64( 0x4000C3FEDE897773 ), LIT64( 0x326AC4FD8EFBE6DC ) }, 1437 { LIT64( 0xBFFF0000000FFFFF ), LIT64( 0xFFFFFE0000000000 ) }, 1438 { LIT64( 0x62C3E502146E426D ), LIT64( 0x43F3CAA0DC7DF1A0 ) }, 1439 { LIT64( 0xB5CBD32E52BB570E ), LIT64( 0xBCC477CB11C6236C ) }, 1440 { LIT64( 0xE228FFFFFFC00000 ), LIT64( 0x0000000000000000 ) }, 1441 { LIT64( 0x3F80000000000000 ), LIT64( 0x0000000080000008 ) }, 1442 { LIT64( 0xC1AFFFDFFFFFFFFF ), LIT64( 0xFFFC000000000000 ) }, 1443 { LIT64( 0xC96F000000000000 ), LIT64( 0x00000001FFFBFFFF ) }, 1444 { LIT64( 0x3DE09BFE7923A338 ), LIT64( 0xBCC8FBBD7CEC1F4F ) }, 1445 { LIT64( 0x401CFFFFFFFFFFFF ), LIT64( 0xFFFFFFFEFFFFFF80 ) } 1446 }; 1447 1448 static void time_a_float128_z_int32( int32 function( float128 ) ) 1449 { 1450 clock_t startClock, endClock; 1451 int32 count, i; 1452 int8 inputNum; 1453 float128 a; 1454 1455 count = 0; 1456 inputNum = 0; 1457 startClock = clock(); 1458 do { 1459 for ( i = minIterations; i; --i ) { 1460 a.low = inputs_float128[ inputNum ].low; 1461 a.high = inputs_float128[ inputNum ].high; 1462 function( a ); 1463 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1464 } 1465 count += minIterations; 1466 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1467 inputNum = 0; 1468 startClock = clock(); 1469 for ( i = count; i; --i ) { 1470 a.low = inputs_float128[ inputNum ].low; 1471 a.high = inputs_float128[ inputNum ].high; 1472 function( a ); 1473 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1474 } 1475 endClock = clock(); 1476 reportTime( count, endClock - startClock ); 1477 1478 } 1479 1480 static void time_a_float128_z_int64( int64 function( float128 ) ) 1481 { 1482 clock_t startClock, endClock; 1483 int32 count, i; 1484 int8 inputNum; 1485 float128 a; 1486 1487 count = 0; 1488 inputNum = 0; 1489 startClock = clock(); 1490 do { 1491 for ( i = minIterations; i; --i ) { 1492 a.low = inputs_float128[ inputNum ].low; 1493 a.high = inputs_float128[ inputNum ].high; 1494 function( a ); 1495 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1496 } 1497 count += minIterations; 1498 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1499 inputNum = 0; 1500 startClock = clock(); 1501 for ( i = count; i; --i ) { 1502 a.low = inputs_float128[ inputNum ].low; 1503 a.high = inputs_float128[ inputNum ].high; 1504 function( a ); 1505 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1506 } 1507 endClock = clock(); 1508 reportTime( count, endClock - startClock ); 1509 1510 } 1511 1512 static void time_a_float128_z_float32( float32 function( float128 ) ) 1513 { 1514 clock_t startClock, endClock; 1515 int32 count, i; 1516 int8 inputNum; 1517 float128 a; 1518 1519 count = 0; 1520 inputNum = 0; 1521 startClock = clock(); 1522 do { 1523 for ( i = minIterations; i; --i ) { 1524 a.low = inputs_float128[ inputNum ].low; 1525 a.high = inputs_float128[ inputNum ].high; 1526 function( a ); 1527 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1528 } 1529 count += minIterations; 1530 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1531 inputNum = 0; 1532 startClock = clock(); 1533 for ( i = count; i; --i ) { 1534 a.low = inputs_float128[ inputNum ].low; 1535 a.high = inputs_float128[ inputNum ].high; 1536 function( a ); 1537 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1538 } 1539 endClock = clock(); 1540 reportTime( count, endClock - startClock ); 1541 1542 } 1543 1544 static void time_a_float128_z_float64( float64 function( float128 ) ) 1545 { 1546 clock_t startClock, endClock; 1547 int32 count, i; 1548 int8 inputNum; 1549 float128 a; 1550 1551 count = 0; 1552 inputNum = 0; 1553 startClock = clock(); 1554 do { 1555 for ( i = minIterations; i; --i ) { 1556 a.low = inputs_float128[ inputNum ].low; 1557 a.high = inputs_float128[ inputNum ].high; 1558 function( a ); 1559 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1560 } 1561 count += minIterations; 1562 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1563 inputNum = 0; 1564 startClock = clock(); 1565 for ( i = count; i; --i ) { 1566 a.low = inputs_float128[ inputNum ].low; 1567 a.high = inputs_float128[ inputNum ].high; 1568 function( a ); 1569 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1570 } 1571 endClock = clock(); 1572 reportTime( count, endClock - startClock ); 1573 1574 } 1575 1576 #ifdef FLOATX80 1577 1578 static void time_a_float128_z_floatx80( floatx80 function( float128 ) ) 1579 { 1580 clock_t startClock, endClock; 1581 int32 count, i; 1582 int8 inputNum; 1583 float128 a; 1584 1585 count = 0; 1586 inputNum = 0; 1587 startClock = clock(); 1588 do { 1589 for ( i = minIterations; i; --i ) { 1590 a.low = inputs_float128[ inputNum ].low; 1591 a.high = inputs_float128[ inputNum ].high; 1592 function( a ); 1593 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1594 } 1595 count += minIterations; 1596 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1597 inputNum = 0; 1598 startClock = clock(); 1599 for ( i = count; i; --i ) { 1600 a.low = inputs_float128[ inputNum ].low; 1601 a.high = inputs_float128[ inputNum ].high; 1602 function( a ); 1603 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1604 } 1605 endClock = clock(); 1606 reportTime( count, endClock - startClock ); 1607 1608 } 1609 1610 #endif 1611 1612 static void time_az_float128( float128 function( float128 ) ) 1613 { 1614 clock_t startClock, endClock; 1615 int32 count, i; 1616 int8 inputNum; 1617 float128 a; 1618 1619 count = 0; 1620 inputNum = 0; 1621 startClock = clock(); 1622 do { 1623 for ( i = minIterations; i; --i ) { 1624 a.low = inputs_float128[ inputNum ].low; 1625 a.high = inputs_float128[ inputNum ].high; 1626 function( a ); 1627 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1628 } 1629 count += minIterations; 1630 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1631 inputNum = 0; 1632 startClock = clock(); 1633 for ( i = count; i; --i ) { 1634 a.low = inputs_float128[ inputNum ].low; 1635 a.high = inputs_float128[ inputNum ].high; 1636 function( a ); 1637 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1638 } 1639 endClock = clock(); 1640 reportTime( count, endClock - startClock ); 1641 1642 } 1643 1644 static void time_ab_float128_z_flag( flag function( float128, float128 ) ) 1645 { 1646 clock_t startClock, endClock; 1647 int32 count, i; 1648 int8 inputNumA, inputNumB; 1649 float128 a, b; 1650 1651 count = 0; 1652 inputNumA = 0; 1653 inputNumB = 0; 1654 startClock = clock(); 1655 do { 1656 for ( i = minIterations; i; --i ) { 1657 a.low = inputs_float128[ inputNumA ].low; 1658 a.high = inputs_float128[ inputNumA ].high; 1659 b.low = inputs_float128[ inputNumB ].low; 1660 b.high = inputs_float128[ inputNumB ].high; 1661 function( a, b ); 1662 inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); 1663 if ( inputNumA == 0 ) ++inputNumB; 1664 inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); 1665 } 1666 count += minIterations; 1667 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1668 inputNumA = 0; 1669 inputNumB = 0; 1670 startClock = clock(); 1671 for ( i = count; i; --i ) { 1672 a.low = inputs_float128[ inputNumA ].low; 1673 a.high = inputs_float128[ inputNumA ].high; 1674 b.low = inputs_float128[ inputNumB ].low; 1675 b.high = inputs_float128[ inputNumB ].high; 1676 function( a, b ); 1677 inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); 1678 if ( inputNumA == 0 ) ++inputNumB; 1679 inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); 1680 } 1681 endClock = clock(); 1682 reportTime( count, endClock - startClock ); 1683 1684 } 1685 1686 static void time_abz_float128( float128 function( float128, float128 ) ) 1687 { 1688 clock_t startClock, endClock; 1689 int32 count, i; 1690 int8 inputNumA, inputNumB; 1691 float128 a, b; 1692 1693 count = 0; 1694 inputNumA = 0; 1695 inputNumB = 0; 1696 startClock = clock(); 1697 do { 1698 for ( i = minIterations; i; --i ) { 1699 a.low = inputs_float128[ inputNumA ].low; 1700 a.high = inputs_float128[ inputNumA ].high; 1701 b.low = inputs_float128[ inputNumB ].low; 1702 b.high = inputs_float128[ inputNumB ].high; 1703 function( a, b ); 1704 inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); 1705 if ( inputNumA == 0 ) ++inputNumB; 1706 inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); 1707 } 1708 count += minIterations; 1709 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1710 inputNumA = 0; 1711 inputNumB = 0; 1712 startClock = clock(); 1713 for ( i = count; i; --i ) { 1714 a.low = inputs_float128[ inputNumA ].low; 1715 a.high = inputs_float128[ inputNumA ].high; 1716 b.low = inputs_float128[ inputNumB ].low; 1717 b.high = inputs_float128[ inputNumB ].high; 1718 function( a, b ); 1719 inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); 1720 if ( inputNumA == 0 ) ++inputNumB; 1721 inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); 1722 } 1723 endClock = clock(); 1724 reportTime( count, endClock - startClock ); 1725 1726 } 1727 1728 static const struct { 1729 bits64 high, low; 1730 } inputs_float128_pos[ numInputs_float128 ] = { 1731 { LIT64( 0x3FDA200000100000 ), LIT64( 0x0000000000000000 ) }, 1732 { LIT64( 0x3FFF000000000000 ), LIT64( 0x0000000000000000 ) }, 1733 { LIT64( 0x05F14776190C8306 ), LIT64( 0xD8715F4E3D54BB92 ) }, 1734 { LIT64( 0x72B00000007FFFFF ), LIT64( 0xFFFFFFFFFFF7FFFF ) }, 1735 { LIT64( 0x0000000000000000 ), LIT64( 0x0000000000000000 ) }, 1736 { LIT64( 0x3FFFFFFFFFE00000 ), LIT64( 0x0000008000000000 ) }, 1737 { LIT64( 0x407F1719CE722F3E ), LIT64( 0xDA6B3FE5FF29425B ) }, 1738 { LIT64( 0x43FFFF8000000000 ), LIT64( 0x0000000000400000 ) }, 1739 { LIT64( 0x401E000000000100 ), LIT64( 0x0000000000002000 ) }, 1740 { LIT64( 0x3FFED71DACDA8E47 ), LIT64( 0x4860E3C75D224F28 ) }, 1741 { LIT64( 0x3F7ECFC1E90647D1 ), LIT64( 0x7A124FE55623EE44 ) }, 1742 { LIT64( 0x0DF7007FFFFFFFFF ), LIT64( 0xFFFFFFFFEFFFFFFF ) }, 1743 { LIT64( 0x3FE5FFEFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFEFFF ) }, 1744 { LIT64( 0x403FFFFFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFFBFE ) }, 1745 { LIT64( 0x3FFB2FBF7399AFEB ), LIT64( 0xA459EE6A5C16CA55 ) }, 1746 { LIT64( 0x3DB8FFFFFFFFFFFC ), LIT64( 0x0000000000000400 ) }, 1747 { LIT64( 0x3FC8FFDFFFFFFFFF ), LIT64( 0xFFFFFFFFF0000000 ) }, 1748 { LIT64( 0x3FFBFFFFFFDFFFFF ), LIT64( 0xFFF8000000000000 ) }, 1749 { LIT64( 0x407043C11737BE84 ), LIT64( 0xDDD58212ADC937F4 ) }, 1750 { LIT64( 0x0001000000000000 ), LIT64( 0x0000001000000001 ) }, 1751 { LIT64( 0x4036FFFFFFFFFFFF ), LIT64( 0xFE40000000000000 ) }, 1752 { LIT64( 0x4002FFFFFE000002 ), LIT64( 0x0000000000000000 ) }, 1753 { LIT64( 0x4000C3FEDE897773 ), LIT64( 0x326AC4FD8EFBE6DC ) }, 1754 { LIT64( 0x3FFF0000000FFFFF ), LIT64( 0xFFFFFE0000000000 ) }, 1755 { LIT64( 0x62C3E502146E426D ), LIT64( 0x43F3CAA0DC7DF1A0 ) }, 1756 { LIT64( 0x35CBD32E52BB570E ), LIT64( 0xBCC477CB11C6236C ) }, 1757 { LIT64( 0x6228FFFFFFC00000 ), LIT64( 0x0000000000000000 ) }, 1758 { LIT64( 0x3F80000000000000 ), LIT64( 0x0000000080000008 ) }, 1759 { LIT64( 0x41AFFFDFFFFFFFFF ), LIT64( 0xFFFC000000000000 ) }, 1760 { LIT64( 0x496F000000000000 ), LIT64( 0x00000001FFFBFFFF ) }, 1761 { LIT64( 0x3DE09BFE7923A338 ), LIT64( 0xBCC8FBBD7CEC1F4F ) }, 1762 { LIT64( 0x401CFFFFFFFFFFFF ), LIT64( 0xFFFFFFFEFFFFFF80 ) } 1763 }; 1764 1765 static void time_az_float128_pos( float128 function( float128 ) ) 1766 { 1767 clock_t startClock, endClock; 1768 int32 count, i; 1769 int8 inputNum; 1770 float128 a; 1771 1772 count = 0; 1773 inputNum = 0; 1774 startClock = clock(); 1775 do { 1776 for ( i = minIterations; i; --i ) { 1777 a.low = inputs_float128_pos[ inputNum ].low; 1778 a.high = inputs_float128_pos[ inputNum ].high; 1779 function( a ); 1780 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1781 } 1782 count += minIterations; 1783 } while ( clock() - startClock < CLOCKS_PER_SEC ); 1784 inputNum = 0; 1785 startClock = clock(); 1786 for ( i = count; i; --i ) { 1787 a.low = inputs_float128_pos[ inputNum ].low; 1788 a.high = inputs_float128_pos[ inputNum ].high; 1789 function( a ); 1790 inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); 1791 } 1792 endClock = clock(); 1793 reportTime( count, endClock - startClock ); 1794 1795 } 1796 1797 #endif 1798 1799 enum { 1800 INT32_TO_FLOAT32 = 1, 1801 INT32_TO_FLOAT64, 1802 #ifdef FLOATX80 1803 INT32_TO_FLOATX80, 1804 #endif 1805 #ifdef FLOAT128 1806 INT32_TO_FLOAT128, 1807 #endif 1808 INT64_TO_FLOAT32, 1809 INT64_TO_FLOAT64, 1810 #ifdef FLOATX80 1811 INT64_TO_FLOATX80, 1812 #endif 1813 #ifdef FLOAT128 1814 INT64_TO_FLOAT128, 1815 #endif 1816 FLOAT32_TO_INT32, 1817 FLOAT32_TO_INT32_ROUND_TO_ZERO, 1818 FLOAT32_TO_INT64, 1819 FLOAT32_TO_INT64_ROUND_TO_ZERO, 1820 FLOAT32_TO_FLOAT64, 1821 #ifdef FLOATX80 1822 FLOAT32_TO_FLOATX80, 1823 #endif 1824 #ifdef FLOAT128 1825 FLOAT32_TO_FLOAT128, 1826 #endif 1827 FLOAT32_ROUND_TO_INT, 1828 FLOAT32_ADD, 1829 FLOAT32_SUB, 1830 FLOAT32_MUL, 1831 FLOAT32_DIV, 1832 FLOAT32_REM, 1833 FLOAT32_SQRT, 1834 FLOAT32_EQ, 1835 FLOAT32_LE, 1836 FLOAT32_LT, 1837 FLOAT32_EQ_SIGNALING, 1838 FLOAT32_LE_QUIET, 1839 FLOAT32_LT_QUIET, 1840 FLOAT64_TO_INT32, 1841 FLOAT64_TO_INT32_ROUND_TO_ZERO, 1842 FLOAT64_TO_INT64, 1843 FLOAT64_TO_INT64_ROUND_TO_ZERO, 1844 FLOAT64_TO_FLOAT32, 1845 #ifdef FLOATX80 1846 FLOAT64_TO_FLOATX80, 1847 #endif 1848 #ifdef FLOAT128 1849 FLOAT64_TO_FLOAT128, 1850 #endif 1851 FLOAT64_ROUND_TO_INT, 1852 FLOAT64_ADD, 1853 FLOAT64_SUB, 1854 FLOAT64_MUL, 1855 FLOAT64_DIV, 1856 FLOAT64_REM, 1857 FLOAT64_SQRT, 1858 FLOAT64_EQ, 1859 FLOAT64_LE, 1860 FLOAT64_LT, 1861 FLOAT64_EQ_SIGNALING, 1862 FLOAT64_LE_QUIET, 1863 FLOAT64_LT_QUIET, 1864 #ifdef FLOATX80 1865 FLOATX80_TO_INT32, 1866 FLOATX80_TO_INT32_ROUND_TO_ZERO, 1867 FLOATX80_TO_INT64, 1868 FLOATX80_TO_INT64_ROUND_TO_ZERO, 1869 FLOATX80_TO_FLOAT32, 1870 FLOATX80_TO_FLOAT64, 1871 #ifdef FLOAT128 1872 FLOATX80_TO_FLOAT128, 1873 #endif 1874 FLOATX80_ROUND_TO_INT, 1875 FLOATX80_ADD, 1876 FLOATX80_SUB, 1877 FLOATX80_MUL, 1878 FLOATX80_DIV, 1879 FLOATX80_REM, 1880 FLOATX80_SQRT, 1881 FLOATX80_EQ, 1882 FLOATX80_LE, 1883 FLOATX80_LT, 1884 FLOATX80_EQ_SIGNALING, 1885 FLOATX80_LE_QUIET, 1886 FLOATX80_LT_QUIET, 1887 #endif 1888 #ifdef FLOAT128 1889 FLOAT128_TO_INT32, 1890 FLOAT128_TO_INT32_ROUND_TO_ZERO, 1891 FLOAT128_TO_INT64, 1892 FLOAT128_TO_INT64_ROUND_TO_ZERO, 1893 FLOAT128_TO_FLOAT32, 1894 FLOAT128_TO_FLOAT64, 1895 #ifdef FLOATX80 1896 FLOAT128_TO_FLOATX80, 1897 #endif 1898 FLOAT128_ROUND_TO_INT, 1899 FLOAT128_ADD, 1900 FLOAT128_SUB, 1901 FLOAT128_MUL, 1902 FLOAT128_DIV, 1903 FLOAT128_REM, 1904 FLOAT128_SQRT, 1905 FLOAT128_EQ, 1906 FLOAT128_LE, 1907 FLOAT128_LT, 1908 FLOAT128_EQ_SIGNALING, 1909 FLOAT128_LE_QUIET, 1910 FLOAT128_LT_QUIET, 1911 #endif 1912 NUM_FUNCTIONS 1913 }; 1914 1915 static struct { 1916 char *name; 1917 int8 numInputs; 1918 flag roundingPrecision, roundingMode; 1919 flag tininessMode, tininessModeAtReducedPrecision; 1920 } functions[ NUM_FUNCTIONS ] = { 1921 { 0, 0, 0, 0, 0, 0 }, 1922 { "int32_to_float32", 1, FALSE, TRUE, FALSE, FALSE }, 1923 { "int32_to_float64", 1, FALSE, FALSE, FALSE, FALSE }, 1924 #ifdef FLOATX80 1925 { "int32_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, 1926 #endif 1927 #ifdef FLOAT128 1928 { "int32_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, 1929 #endif 1930 { "int64_to_float32", 1, FALSE, TRUE, FALSE, FALSE }, 1931 { "int64_to_float64", 1, FALSE, TRUE, FALSE, FALSE }, 1932 #ifdef FLOATX80 1933 { "int64_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, 1934 #endif 1935 #ifdef FLOAT128 1936 { "int64_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, 1937 #endif 1938 { "float32_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, 1939 { "float32_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 1940 { "float32_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, 1941 { "float32_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 1942 { "float32_to_float64", 1, FALSE, FALSE, FALSE, FALSE }, 1943 #ifdef FLOATX80 1944 { "float32_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, 1945 #endif 1946 #ifdef FLOAT128 1947 { "float32_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, 1948 #endif 1949 { "float32_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, 1950 { "float32_add", 2, FALSE, TRUE, FALSE, FALSE }, 1951 { "float32_sub", 2, FALSE, TRUE, FALSE, FALSE }, 1952 { "float32_mul", 2, FALSE, TRUE, TRUE, FALSE }, 1953 { "float32_div", 2, FALSE, TRUE, FALSE, FALSE }, 1954 { "float32_rem", 2, FALSE, FALSE, FALSE, FALSE }, 1955 { "float32_sqrt", 1, FALSE, TRUE, FALSE, FALSE }, 1956 { "float32_eq", 2, FALSE, FALSE, FALSE, FALSE }, 1957 { "float32_le", 2, FALSE, FALSE, FALSE, FALSE }, 1958 { "float32_lt", 2, FALSE, FALSE, FALSE, FALSE }, 1959 { "float32_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, 1960 { "float32_le_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 1961 { "float32_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 1962 { "float64_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, 1963 { "float64_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 1964 { "float64_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, 1965 { "float64_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 1966 { "float64_to_float32", 1, FALSE, TRUE, TRUE, FALSE }, 1967 #ifdef FLOATX80 1968 { "float64_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, 1969 #endif 1970 #ifdef FLOAT128 1971 { "float64_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, 1972 #endif 1973 { "float64_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, 1974 { "float64_add", 2, FALSE, TRUE, FALSE, FALSE }, 1975 { "float64_sub", 2, FALSE, TRUE, FALSE, FALSE }, 1976 { "float64_mul", 2, FALSE, TRUE, TRUE, FALSE }, 1977 { "float64_div", 2, FALSE, TRUE, FALSE, FALSE }, 1978 { "float64_rem", 2, FALSE, FALSE, FALSE, FALSE }, 1979 { "float64_sqrt", 1, FALSE, TRUE, FALSE, FALSE }, 1980 { "float64_eq", 2, FALSE, FALSE, FALSE, FALSE }, 1981 { "float64_le", 2, FALSE, FALSE, FALSE, FALSE }, 1982 { "float64_lt", 2, FALSE, FALSE, FALSE, FALSE }, 1983 { "float64_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, 1984 { "float64_le_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 1985 { "float64_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 1986 #ifdef FLOATX80 1987 { "floatx80_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, 1988 { "floatx80_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 1989 { "floatx80_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, 1990 { "floatx80_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 1991 { "floatx80_to_float32", 1, FALSE, TRUE, TRUE, FALSE }, 1992 { "floatx80_to_float64", 1, FALSE, TRUE, TRUE, FALSE }, 1993 #ifdef FLOAT128 1994 { "floatx80_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, 1995 #endif 1996 { "floatx80_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, 1997 { "floatx80_add", 2, TRUE, TRUE, FALSE, TRUE }, 1998 { "floatx80_sub", 2, TRUE, TRUE, FALSE, TRUE }, 1999 { "floatx80_mul", 2, TRUE, TRUE, TRUE, TRUE }, 2000 { "floatx80_div", 2, TRUE, TRUE, FALSE, TRUE }, 2001 { "floatx80_rem", 2, FALSE, FALSE, FALSE, FALSE }, 2002 { "floatx80_sqrt", 1, TRUE, TRUE, FALSE, FALSE }, 2003 { "floatx80_eq", 2, FALSE, FALSE, FALSE, FALSE }, 2004 { "floatx80_le", 2, FALSE, FALSE, FALSE, FALSE }, 2005 { "floatx80_lt", 2, FALSE, FALSE, FALSE, FALSE }, 2006 { "floatx80_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, 2007 { "floatx80_le_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 2008 { "floatx80_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 2009 #endif 2010 #ifdef FLOAT128 2011 { "float128_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, 2012 { "float128_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 2013 { "float128_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, 2014 { "float128_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, 2015 { "float128_to_float32", 1, FALSE, TRUE, TRUE, FALSE }, 2016 { "float128_to_float64", 1, FALSE, TRUE, TRUE, FALSE }, 2017 #ifdef FLOATX80 2018 { "float128_to_floatx80", 1, FALSE, TRUE, TRUE, FALSE }, 2019 #endif 2020 { "float128_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, 2021 { "float128_add", 2, FALSE, TRUE, FALSE, FALSE }, 2022 { "float128_sub", 2, FALSE, TRUE, FALSE, FALSE }, 2023 { "float128_mul", 2, FALSE, TRUE, TRUE, FALSE }, 2024 { "float128_div", 2, FALSE, TRUE, FALSE, FALSE }, 2025 { "float128_rem", 2, FALSE, FALSE, FALSE, FALSE }, 2026 { "float128_sqrt", 1, FALSE, TRUE, FALSE, FALSE }, 2027 { "float128_eq", 2, FALSE, FALSE, FALSE, FALSE }, 2028 { "float128_le", 2, FALSE, FALSE, FALSE, FALSE }, 2029 { "float128_lt", 2, FALSE, FALSE, FALSE, FALSE }, 2030 { "float128_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, 2031 { "float128_le_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 2032 { "float128_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, 2033 #endif 2034 }; 2035 2036 enum { 2037 ROUND_NEAREST_EVEN = 1, 2038 ROUND_TO_ZERO, 2039 ROUND_DOWN, 2040 ROUND_UP, 2041 NUM_ROUNDINGMODES 2042 }; 2043 enum { 2044 TININESS_BEFORE_ROUNDING = 1, 2045 TININESS_AFTER_ROUNDING, 2046 NUM_TININESSMODES 2047 }; 2048 2049 static void 2050 timeFunctionVariety( 2051 uint8 functionCode, 2052 int8 roundingPrecision, 2053 int8 roundingMode, 2054 int8 tininessMode 2055 ) 2056 { 2057 uint8 roundingCode; 2058 int8 tininessCode; 2059 2060 functionName = functions[ functionCode ].name; 2061 if ( roundingPrecision == 32 ) { 2062 roundingPrecisionName = "32"; 2063 } 2064 else if ( roundingPrecision == 64 ) { 2065 roundingPrecisionName = "64"; 2066 } 2067 else if ( roundingPrecision == 80 ) { 2068 roundingPrecisionName = "80"; 2069 } 2070 else { 2071 roundingPrecisionName = 0; 2072 } 2073 #ifdef FLOATX80 2074 floatx80_rounding_precision = roundingPrecision; 2075 #endif 2076 switch ( roundingMode ) { 2077 case 0: 2078 roundingModeName = 0; 2079 roundingCode = float_round_nearest_even; 2080 break; 2081 case ROUND_NEAREST_EVEN: 2082 roundingModeName = "nearest_even"; 2083 roundingCode = float_round_nearest_even; 2084 break; 2085 case ROUND_TO_ZERO: 2086 roundingModeName = "to_zero"; 2087 roundingCode = float_round_to_zero; 2088 break; 2089 case ROUND_DOWN: 2090 roundingModeName = "down"; 2091 roundingCode = float_round_down; 2092 break; 2093 case ROUND_UP: 2094 roundingModeName = "up"; 2095 roundingCode = float_round_up; 2096 break; 2097 } 2098 float_rounding_mode = roundingCode; 2099 switch ( tininessMode ) { 2100 case 0: 2101 tininessModeName = 0; 2102 tininessCode = float_tininess_after_rounding; 2103 break; 2104 case TININESS_BEFORE_ROUNDING: 2105 tininessModeName = "before"; 2106 tininessCode = float_tininess_before_rounding; 2107 break; 2108 case TININESS_AFTER_ROUNDING: 2109 tininessModeName = "after"; 2110 tininessCode = float_tininess_after_rounding; 2111 break; 2112 } 2113 float_detect_tininess = tininessCode; 2114 switch ( functionCode ) { 2115 case INT32_TO_FLOAT32: 2116 time_a_int32_z_float32( int32_to_float32 ); 2117 break; 2118 case INT32_TO_FLOAT64: 2119 time_a_int32_z_float64( int32_to_float64 ); 2120 break; 2121 #ifdef FLOATX80 2122 case INT32_TO_FLOATX80: 2123 time_a_int32_z_floatx80( int32_to_floatx80 ); 2124 break; 2125 #endif 2126 #ifdef FLOAT128 2127 case INT32_TO_FLOAT128: 2128 time_a_int32_z_float128( int32_to_float128 ); 2129 break; 2130 #endif 2131 case INT64_TO_FLOAT32: 2132 time_a_int64_z_float32( int64_to_float32 ); 2133 break; 2134 case INT64_TO_FLOAT64: 2135 time_a_int64_z_float64( int64_to_float64 ); 2136 break; 2137 #ifdef FLOATX80 2138 case INT64_TO_FLOATX80: 2139 time_a_int64_z_floatx80( int64_to_floatx80 ); 2140 break; 2141 #endif 2142 #ifdef FLOAT128 2143 case INT64_TO_FLOAT128: 2144 time_a_int64_z_float128( int64_to_float128 ); 2145 break; 2146 #endif 2147 case FLOAT32_TO_INT32: 2148 time_a_float32_z_int32( float32_to_int32 ); 2149 break; 2150 case FLOAT32_TO_INT32_ROUND_TO_ZERO: 2151 time_a_float32_z_int32( float32_to_int32_round_to_zero ); 2152 break; 2153 case FLOAT32_TO_INT64: 2154 time_a_float32_z_int64( float32_to_int64 ); 2155 break; 2156 case FLOAT32_TO_INT64_ROUND_TO_ZERO: 2157 time_a_float32_z_int64( float32_to_int64_round_to_zero ); 2158 break; 2159 case FLOAT32_TO_FLOAT64: 2160 time_a_float32_z_float64( float32_to_float64 ); 2161 break; 2162 #ifdef FLOATX80 2163 case FLOAT32_TO_FLOATX80: 2164 time_a_float32_z_floatx80( float32_to_floatx80 ); 2165 break; 2166 #endif 2167 #ifdef FLOAT128 2168 case FLOAT32_TO_FLOAT128: 2169 time_a_float32_z_float128( float32_to_float128 ); 2170 break; 2171 #endif 2172 case FLOAT32_ROUND_TO_INT: 2173 time_az_float32( float32_round_to_int ); 2174 break; 2175 case FLOAT32_ADD: 2176 time_abz_float32( float32_add ); 2177 break; 2178 case FLOAT32_SUB: 2179 time_abz_float32( float32_sub ); 2180 break; 2181 case FLOAT32_MUL: 2182 time_abz_float32( float32_mul ); 2183 break; 2184 case FLOAT32_DIV: 2185 time_abz_float32( float32_div ); 2186 break; 2187 case FLOAT32_REM: 2188 time_abz_float32( float32_rem ); 2189 break; 2190 case FLOAT32_SQRT: 2191 time_az_float32_pos( float32_sqrt ); 2192 break; 2193 case FLOAT32_EQ: 2194 time_ab_float32_z_flag( float32_eq ); 2195 break; 2196 case FLOAT32_LE: 2197 time_ab_float32_z_flag( float32_le ); 2198 break; 2199 case FLOAT32_LT: 2200 time_ab_float32_z_flag( float32_lt ); 2201 break; 2202 case FLOAT32_EQ_SIGNALING: 2203 time_ab_float32_z_flag( float32_eq_signaling ); 2204 break; 2205 case FLOAT32_LE_QUIET: 2206 time_ab_float32_z_flag( float32_le_quiet ); 2207 break; 2208 case FLOAT32_LT_QUIET: 2209 time_ab_float32_z_flag( float32_lt_quiet ); 2210 break; 2211 case FLOAT64_TO_INT32: 2212 time_a_float64_z_int32( float64_to_int32 ); 2213 break; 2214 case FLOAT64_TO_INT32_ROUND_TO_ZERO: 2215 time_a_float64_z_int32( float64_to_int32_round_to_zero ); 2216 break; 2217 case FLOAT64_TO_INT64: 2218 time_a_float64_z_int64( float64_to_int64 ); 2219 break; 2220 case FLOAT64_TO_INT64_ROUND_TO_ZERO: 2221 time_a_float64_z_int64( float64_to_int64_round_to_zero ); 2222 break; 2223 case FLOAT64_TO_FLOAT32: 2224 time_a_float64_z_float32( float64_to_float32 ); 2225 break; 2226 #ifdef FLOATX80 2227 case FLOAT64_TO_FLOATX80: 2228 time_a_float64_z_floatx80( float64_to_floatx80 ); 2229 break; 2230 #endif 2231 #ifdef FLOAT128 2232 case FLOAT64_TO_FLOAT128: 2233 time_a_float64_z_float128( float64_to_float128 ); 2234 break; 2235 #endif 2236 case FLOAT64_ROUND_TO_INT: 2237 time_az_float64( float64_round_to_int ); 2238 break; 2239 case FLOAT64_ADD: 2240 time_abz_float64( float64_add ); 2241 break; 2242 case FLOAT64_SUB: 2243 time_abz_float64( float64_sub ); 2244 break; 2245 case FLOAT64_MUL: 2246 time_abz_float64( float64_mul ); 2247 break; 2248 case FLOAT64_DIV: 2249 time_abz_float64( float64_div ); 2250 break; 2251 case FLOAT64_REM: 2252 time_abz_float64( float64_rem ); 2253 break; 2254 case FLOAT64_SQRT: 2255 time_az_float64_pos( float64_sqrt ); 2256 break; 2257 case FLOAT64_EQ: 2258 time_ab_float64_z_flag( float64_eq ); 2259 break; 2260 case FLOAT64_LE: 2261 time_ab_float64_z_flag( float64_le ); 2262 break; 2263 case FLOAT64_LT: 2264 time_ab_float64_z_flag( float64_lt ); 2265 break; 2266 case FLOAT64_EQ_SIGNALING: 2267 time_ab_float64_z_flag( float64_eq_signaling ); 2268 break; 2269 case FLOAT64_LE_QUIET: 2270 time_ab_float64_z_flag( float64_le_quiet ); 2271 break; 2272 case FLOAT64_LT_QUIET: 2273 time_ab_float64_z_flag( float64_lt_quiet ); 2274 break; 2275 #ifdef FLOATX80 2276 case FLOATX80_TO_INT32: 2277 time_a_floatx80_z_int32( floatx80_to_int32 ); 2278 break; 2279 case FLOATX80_TO_INT32_ROUND_TO_ZERO: 2280 time_a_floatx80_z_int32( floatx80_to_int32_round_to_zero ); 2281 break; 2282 case FLOATX80_TO_INT64: 2283 time_a_floatx80_z_int64( floatx80_to_int64 ); 2284 break; 2285 case FLOATX80_TO_INT64_ROUND_TO_ZERO: 2286 time_a_floatx80_z_int64( floatx80_to_int64_round_to_zero ); 2287 break; 2288 case FLOATX80_TO_FLOAT32: 2289 time_a_floatx80_z_float32( floatx80_to_float32 ); 2290 break; 2291 case FLOATX80_TO_FLOAT64: 2292 time_a_floatx80_z_float64( floatx80_to_float64 ); 2293 break; 2294 #ifdef FLOAT128 2295 case FLOATX80_TO_FLOAT128: 2296 time_a_floatx80_z_float128( floatx80_to_float128 ); 2297 break; 2298 #endif 2299 case FLOATX80_ROUND_TO_INT: 2300 time_az_floatx80( floatx80_round_to_int ); 2301 break; 2302 case FLOATX80_ADD: 2303 time_abz_floatx80( floatx80_add ); 2304 break; 2305 case FLOATX80_SUB: 2306 time_abz_floatx80( floatx80_sub ); 2307 break; 2308 case FLOATX80_MUL: 2309 time_abz_floatx80( floatx80_mul ); 2310 break; 2311 case FLOATX80_DIV: 2312 time_abz_floatx80( floatx80_div ); 2313 break; 2314 case FLOATX80_REM: 2315 time_abz_floatx80( floatx80_rem ); 2316 break; 2317 case FLOATX80_SQRT: 2318 time_az_floatx80_pos( floatx80_sqrt ); 2319 break; 2320 case FLOATX80_EQ: 2321 time_ab_floatx80_z_flag( floatx80_eq ); 2322 break; 2323 case FLOATX80_LE: 2324 time_ab_floatx80_z_flag( floatx80_le ); 2325 break; 2326 case FLOATX80_LT: 2327 time_ab_floatx80_z_flag( floatx80_lt ); 2328 break; 2329 case FLOATX80_EQ_SIGNALING: 2330 time_ab_floatx80_z_flag( floatx80_eq_signaling ); 2331 break; 2332 case FLOATX80_LE_QUIET: 2333 time_ab_floatx80_z_flag( floatx80_le_quiet ); 2334 break; 2335 case FLOATX80_LT_QUIET: 2336 time_ab_floatx80_z_flag( floatx80_lt_quiet ); 2337 break; 2338 #endif 2339 #ifdef FLOAT128 2340 case FLOAT128_TO_INT32: 2341 time_a_float128_z_int32( float128_to_int32 ); 2342 break; 2343 case FLOAT128_TO_INT32_ROUND_TO_ZERO: 2344 time_a_float128_z_int32( float128_to_int32_round_to_zero ); 2345 break; 2346 case FLOAT128_TO_INT64: 2347 time_a_float128_z_int64( float128_to_int64 ); 2348 break; 2349 case FLOAT128_TO_INT64_ROUND_TO_ZERO: 2350 time_a_float128_z_int64( float128_to_int64_round_to_zero ); 2351 break; 2352 case FLOAT128_TO_FLOAT32: 2353 time_a_float128_z_float32( float128_to_float32 ); 2354 break; 2355 case FLOAT128_TO_FLOAT64: 2356 time_a_float128_z_float64( float128_to_float64 ); 2357 break; 2358 #ifdef FLOATX80 2359 case FLOAT128_TO_FLOATX80: 2360 time_a_float128_z_floatx80( float128_to_floatx80 ); 2361 break; 2362 #endif 2363 case FLOAT128_ROUND_TO_INT: 2364 time_az_float128( float128_round_to_int ); 2365 break; 2366 case FLOAT128_ADD: 2367 time_abz_float128( float128_add ); 2368 break; 2369 case FLOAT128_SUB: 2370 time_abz_float128( float128_sub ); 2371 break; 2372 case FLOAT128_MUL: 2373 time_abz_float128( float128_mul ); 2374 break; 2375 case FLOAT128_DIV: 2376 time_abz_float128( float128_div ); 2377 break; 2378 case FLOAT128_REM: 2379 time_abz_float128( float128_rem ); 2380 break; 2381 case FLOAT128_SQRT: 2382 time_az_float128_pos( float128_sqrt ); 2383 break; 2384 case FLOAT128_EQ: 2385 time_ab_float128_z_flag( float128_eq ); 2386 break; 2387 case FLOAT128_LE: 2388 time_ab_float128_z_flag( float128_le ); 2389 break; 2390 case FLOAT128_LT: 2391 time_ab_float128_z_flag( float128_lt ); 2392 break; 2393 case FLOAT128_EQ_SIGNALING: 2394 time_ab_float128_z_flag( float128_eq_signaling ); 2395 break; 2396 case FLOAT128_LE_QUIET: 2397 time_ab_float128_z_flag( float128_le_quiet ); 2398 break; 2399 case FLOAT128_LT_QUIET: 2400 time_ab_float128_z_flag( float128_lt_quiet ); 2401 break; 2402 #endif 2403 } 2404 2405 } 2406 2407 static void 2408 timeFunction( 2409 uint8 functionCode, 2410 int8 roundingPrecisionIn, 2411 int8 roundingModeIn, 2412 int8 tininessModeIn 2413 ) 2414 { 2415 int8 roundingPrecision, roundingMode, tininessMode; 2416 2417 roundingPrecision = 32; 2418 for (;;) { 2419 if ( ! functions[ functionCode ].roundingPrecision ) { 2420 roundingPrecision = 0; 2421 } 2422 else if ( roundingPrecisionIn ) { 2423 roundingPrecision = roundingPrecisionIn; 2424 } 2425 for ( roundingMode = 1; 2426 roundingMode < NUM_ROUNDINGMODES; 2427 ++roundingMode 2428 ) { 2429 if ( ! functions[ functionCode ].roundingMode ) { 2430 roundingMode = 0; 2431 } 2432 else if ( roundingModeIn ) { 2433 roundingMode = roundingModeIn; 2434 } 2435 for ( tininessMode = 1; 2436 tininessMode < NUM_TININESSMODES; 2437 ++tininessMode 2438 ) { 2439 if ( ( roundingPrecision == 32 ) 2440 || ( roundingPrecision == 64 ) ) { 2441 if ( ! functions[ functionCode ] 2442 .tininessModeAtReducedPrecision 2443 ) { 2444 tininessMode = 0; 2445 } 2446 else if ( tininessModeIn ) { 2447 tininessMode = tininessModeIn; 2448 } 2449 } 2450 else { 2451 if ( ! functions[ functionCode ].tininessMode ) { 2452 tininessMode = 0; 2453 } 2454 else if ( tininessModeIn ) { 2455 tininessMode = tininessModeIn; 2456 } 2457 } 2458 timeFunctionVariety( 2459 functionCode, roundingPrecision, roundingMode, tininessMode 2460 ); 2461 if ( tininessModeIn || ! tininessMode ) break; 2462 } 2463 if ( roundingModeIn || ! roundingMode ) break; 2464 } 2465 if ( roundingPrecisionIn || ! roundingPrecision ) break; 2466 if ( roundingPrecision == 80 ) { 2467 break; 2468 } 2469 else if ( roundingPrecision == 64 ) { 2470 roundingPrecision = 80; 2471 } 2472 else if ( roundingPrecision == 32 ) { 2473 roundingPrecision = 64; 2474 } 2475 } 2476 2477 } 2478 2479 main( int argc, char **argv ) 2480 { 2481 char *argPtr; 2482 flag functionArgument; 2483 uint8 functionCode; 2484 int8 operands, roundingPrecision, roundingMode, tininessMode; 2485 2486 if ( argc <= 1 ) goto writeHelpMessage; 2487 functionArgument = FALSE; 2488 functionCode = 0; 2489 operands = 0; 2490 roundingPrecision = 0; 2491 roundingMode = 0; 2492 tininessMode = 0; 2493 --argc; 2494 ++argv; 2495 while ( argc && ( argPtr = argv[ 0 ] ) ) { 2496 if ( argPtr[ 0 ] == '-' ) ++argPtr; 2497 if ( strcmp( argPtr, "help" ) == 0 ) { 2498 writeHelpMessage: 2499 fputs( 2500 "timesoftfloat [<option>...] <function>\n" 2501 " <option>: (* is default)\n" 2502 " -help --Write this message and exit.\n" 2503 #ifdef FLOATX80 2504 " -precision32 --Only time rounding precision equivalent to float32.\n" 2505 " -precision64 --Only time rounding precision equivalent to float64.\n" 2506 " -precision80 --Only time maximum rounding precision.\n" 2507 #endif 2508 " -nearesteven --Only time rounding to nearest/even.\n" 2509 " -tozero --Only time rounding to zero.\n" 2510 " -down --Only time rounding down.\n" 2511 " -up --Only time rounding up.\n" 2512 " -tininessbefore --Only time underflow tininess before rounding.\n" 2513 " -tininessafter --Only time underflow tininess after rounding.\n" 2514 " <function>:\n" 2515 " int32_to_<float> <float>_add <float>_eq\n" 2516 " <float>_to_int32 <float>_sub <float>_le\n" 2517 " <float>_to_int32_round_to_zero <float>_mul <float>_lt\n" 2518 " int64_to_<float> <float>_div <float>_eq_signaling\n" 2519 " <float>_to_int64 <float>_rem <float>_le_quiet\n" 2520 " <float>_to_int64_round_to_zero <float>_lt_quiet\n" 2521 " <float>_to_<float>\n" 2522 " <float>_round_to_int\n" 2523 " <float>_sqrt\n" 2524 " -all1 --All 1-operand functions.\n" 2525 " -all2 --All 2-operand functions.\n" 2526 " -all --All functions.\n" 2527 " <float>:\n" 2528 " float32 --Single precision.\n" 2529 " float64 --Double precision.\n" 2530 #ifdef FLOATX80 2531 " floatx80 --Extended double precision.\n" 2532 #endif 2533 #ifdef FLOAT128 2534 " float128 --Quadruple precision.\n" 2535 #endif 2536 , 2537 stdout 2538 ); 2539 return EXIT_SUCCESS; 2540 } 2541 #ifdef FLOATX80 2542 else if ( strcmp( argPtr, "precision32" ) == 0 ) { 2543 roundingPrecision = 32; 2544 } 2545 else if ( strcmp( argPtr, "precision64" ) == 0 ) { 2546 roundingPrecision = 64; 2547 } 2548 else if ( strcmp( argPtr, "precision80" ) == 0 ) { 2549 roundingPrecision = 80; 2550 } 2551 #endif 2552 else if ( ( strcmp( argPtr, "nearesteven" ) == 0 ) 2553 || ( strcmp( argPtr, "nearest_even" ) == 0 ) ) { 2554 roundingMode = ROUND_NEAREST_EVEN; 2555 } 2556 else if ( ( strcmp( argPtr, "tozero" ) == 0 ) 2557 || ( strcmp( argPtr, "to_zero" ) == 0 ) ) { 2558 roundingMode = ROUND_TO_ZERO; 2559 } 2560 else if ( strcmp( argPtr, "down" ) == 0 ) { 2561 roundingMode = ROUND_DOWN; 2562 } 2563 else if ( strcmp( argPtr, "up" ) == 0 ) { 2564 roundingMode = ROUND_UP; 2565 } 2566 else if ( strcmp( argPtr, "tininessbefore" ) == 0 ) { 2567 tininessMode = TININESS_BEFORE_ROUNDING; 2568 } 2569 else if ( strcmp( argPtr, "tininessafter" ) == 0 ) { 2570 tininessMode = TININESS_AFTER_ROUNDING; 2571 } 2572 else if ( strcmp( argPtr, "all1" ) == 0 ) { 2573 functionArgument = TRUE; 2574 functionCode = 0; 2575 operands = 1; 2576 } 2577 else if ( strcmp( argPtr, "all2" ) == 0 ) { 2578 functionArgument = TRUE; 2579 functionCode = 0; 2580 operands = 2; 2581 } 2582 else if ( strcmp( argPtr, "all" ) == 0 ) { 2583 functionArgument = TRUE; 2584 functionCode = 0; 2585 operands = 0; 2586 } 2587 else { 2588 for ( functionCode = 1; 2589 functionCode < NUM_FUNCTIONS; 2590 ++functionCode 2591 ) { 2592 if ( strcmp( argPtr, functions[ functionCode ].name ) == 0 ) { 2593 break; 2594 } 2595 } 2596 if ( functionCode == NUM_FUNCTIONS ) { 2597 fail( "Invalid option or function `%s'", argv[ 0 ] ); 2598 } 2599 functionArgument = TRUE; 2600 } 2601 --argc; 2602 ++argv; 2603 } 2604 if ( ! functionArgument ) fail( "Function argument required" ); 2605 if ( functionCode ) { 2606 timeFunction( 2607 functionCode, roundingPrecision, roundingMode, tininessMode ); 2608 } 2609 else if ( operands == 1 ) { 2610 for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode 2611 ) { 2612 if ( functions[ functionCode ].numInputs == 1 ) { 2613 timeFunction( 2614 functionCode, roundingPrecision, roundingMode, tininessMode 2615 ); 2616 } 2617 } 2618 } 2619 else if ( operands == 2 ) { 2620 for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode 2621 ) { 2622 if ( functions[ functionCode ].numInputs == 2 ) { 2623 timeFunction( 2624 functionCode, roundingPrecision, roundingMode, tininessMode 2625 ); 2626 } 2627 } 2628 } 2629 else { 2630 for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode 2631 ) { 2632 timeFunction( 2633 functionCode, roundingPrecision, roundingMode, tininessMode ); 2634 } 2635 } 2636 return EXIT_SUCCESS; 2637 2638 } 2639 2640