/*
 * Current Path : /compat/linux/proc/self/root/usr/src/lib/libc/softfloat/ |
 * FreeBSD hs32.drive.ne.jp 9.1-RELEASE FreeBSD 9.1-RELEASE #1: Wed Jan 14 12:18:08 JST 2015 root@hs32.drive.ne.jp:/sys/amd64/compile/hs32 amd64 |
 * Current File : //compat/linux/proc/self/root/usr/src/lib/libc/softfloat/timesoftfloat.c |
 */
/* $NetBSD: timesoftfloat.c,v 1.1 2000/06/06 08:15:11 bjh21 Exp $ */ /* =============================================================================== This C source file is part of the SoftFloat IEC/IEEE Floating-point Arithmetic Package, Release 2a. Written by John R. Hauser. This work was made possible in part by the International Computer Science Institute, located at Suite 600, 1947 Center Street, Berkeley, California 94704. Funding was partially provided by the National Science Foundation under grant MIP-9311980. The original version of this code was written as part of a project to build a fixed-point vector processor in collaboration with the University of California at Berkeley, overseen by Profs. Nelson Morgan and John Wawrzynek. More information is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/ arithmetic/SoftFloat.html'. THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE. Although reasonable effort has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT TIMES RESULT IN INCORRECT BEHAVIOR. USE OF THIS SOFTWARE IS RESTRICTED TO PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE. Derivative works are acceptable, even for commercial purposes, so long as (1) they include prominent notice that the work is derivative, and (2) they include prominent notice akin to these four paragraphs for those parts of this code that are retained. =============================================================================== */ #include <sys/cdefs.h> __FBSDID("$FreeBSD: release/9.1.0/lib/libc/softfloat/timesoftfloat.c 129203 2004-05-14 12:13:06Z cognet $"); #include <stdlib.h> #include <stdarg.h> #include <string.h> #include <stdio.h> #include <time.h> #include "milieu.h" #include "softfloat.h" enum { minIterations = 1000 }; static void fail( const char *message, ... 
) { va_list varArgs; fputs( "timesoftfloat: ", stderr ); va_start( varArgs, message ); vfprintf( stderr, message, varArgs ); va_end( varArgs ); fputs( ".\n", stderr ); exit( EXIT_FAILURE ); } static char *functionName; static char *roundingPrecisionName, *roundingModeName, *tininessModeName; static void reportTime( int32 count, long clocks ) { printf( "%8.1f kops/s: %s", ( count / ( ( (float) clocks ) / CLOCKS_PER_SEC ) ) / 1000, functionName ); if ( roundingModeName ) { if ( roundingPrecisionName ) { fputs( ", precision ", stdout ); fputs( roundingPrecisionName, stdout ); } fputs( ", rounding ", stdout ); fputs( roundingModeName, stdout ); if ( tininessModeName ) { fputs( ", tininess ", stdout ); fputs( tininessModeName, stdout ); fputs( " rounding", stdout ); } } fputc( '\n', stdout ); } enum { numInputs_int32 = 32 }; static const int32 inputs_int32[ numInputs_int32 ] = { 0xFFFFBB79, 0x405CF80F, 0x00000000, 0xFFFFFD04, 0xFFF20002, 0x0C8EF795, 0xF00011FF, 0x000006CA, 0x00009BFE, 0xFF4862E3, 0x9FFFEFFE, 0xFFFFFFB7, 0x0BFF7FFF, 0x0000F37A, 0x0011DFFE, 0x00000006, 0xFFF02006, 0xFFFFF7D1, 0x10200003, 0xDE8DF765, 0x00003E02, 0x000019E8, 0x0008FFFE, 0xFFFFFB5C, 0xFFDF7FFE, 0x07C42FBF, 0x0FFFE3FF, 0x040B9F13, 0xBFFFFFF8, 0x0001BF56, 0x000017F6, 0x000A908A }; static void time_a_int32_z_float32( float32 function( int32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_int32_z_float64( float64 function( int32 ) ) { clock_t startClock, endClock; int32 count, i; int8 
inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #ifdef FLOATX80 static void time_a_int32_z_floatx80( floatx80 function( int32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif #ifdef FLOAT128 static void time_a_int32_z_float128( float128 function( int32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif enum { numInputs_int64 = 32 }; static const int64 inputs_int64[ numInputs_int64 ] = { LIT64( 0xFBFFC3FFFFFFFFFF ), LIT64( 0x0000000003C589BC ), LIT64( 0x00000000400013FE ), LIT64( 0x0000000000186171 ), LIT64( 0xFFFFFFFFFFFEFBFA ), 
LIT64( 0xFFFFFD79E6DFFC73 ), LIT64( 0x0000000010001DFF ), LIT64( 0xDD1A0F0C78513710 ), LIT64( 0xFFFF83FFFFFEFFFE ), LIT64( 0x00756EBD1AD0C1C7 ), LIT64( 0x0003FDFFFFFFFFBE ), LIT64( 0x0007D0FB2C2CA951 ), LIT64( 0x0007FC0007FFFFFE ), LIT64( 0x0000001F942B18BB ), LIT64( 0x0000080101FFFFFE ), LIT64( 0xFFFFFFFFFFFF0978 ), LIT64( 0x000000000008BFFF ), LIT64( 0x0000000006F5AF08 ), LIT64( 0xFFDEFF7FFFFFFFFE ), LIT64( 0x0000000000000003 ), LIT64( 0x3FFFFFFFFF80007D ), LIT64( 0x0000000000000078 ), LIT64( 0xFFF80000007FDFFD ), LIT64( 0x1BBC775B78016AB0 ), LIT64( 0xFFF9001FFFFFFFFE ), LIT64( 0xFFFD4767AB98E43F ), LIT64( 0xFFFFFEFFFE00001E ), LIT64( 0xFFFFFFFFFFF04EFD ), LIT64( 0x07FFFFFFFFFFF7FF ), LIT64( 0xFFFC9EAA38F89050 ), LIT64( 0x00000020FBFFFFFE ), LIT64( 0x0000099AE6455357 ) }; static void time_a_int64_z_float32( float32 function( int64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_int64_z_float64( float64 function( int64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock 
); } #ifdef FLOATX80 static void time_a_int64_z_floatx80( floatx80 function( int64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif #ifdef FLOAT128 static void time_a_int64_z_float128( float128 function( int64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_int64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_int64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif enum { numInputs_float32 = 32 }; static const float32 inputs_float32[ numInputs_float32 ] = { 0x4EFA0000, 0xC1D0B328, 0x80000000, 0x3E69A31E, 0xAF803EFF, 0x3F800000, 0x17BF8000, 0xE74A301A, 0x4E010003, 0x7EE3C75D, 0xBD803FE0, 0xBFFEFF00, 0x7981F800, 0x431FFFFC, 0xC100C000, 0x3D87EFFF, 0x4103FEFE, 0xBC000007, 0xBF01F7FF, 0x4E6C6B5C, 0xC187FFFE, 0xC58B9F13, 0x4F88007F, 0xDF004007, 0xB7FFD7FE, 0x7E8001FB, 0x46EFFBFF, 0x31C10000, 0xDB428661, 0x33F89B1F, 0xA3BFEFFF, 0x537BFFBE }; static void time_a_float32_z_int32( int32 function( float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ 
inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_float32_z_int64( int64 function( float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_float32_z_float64( float64 function( float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #ifdef FLOATX80 static void time_a_float32_z_floatx80( floatx80 function( float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - 
startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif #ifdef FLOAT128 static void time_a_float32_z_float128( float128 function( float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif static void time_az_float32( float32 function( float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_ab_float32_z_flag( flag function( float32, float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNumA, inputNumB; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 
); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_abz_float32( float32 function( float32, float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNumA, inputNumB; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32[ inputNumA ], inputs_float32[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float32 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static const float32 inputs_float32_pos[ numInputs_float32 ] = { 0x4EFA0000, 0x41D0B328, 0x00000000, 0x3E69A31E, 0x2F803EFF, 0x3F800000, 0x17BF8000, 0x674A301A, 0x4E010003, 0x7EE3C75D, 0x3D803FE0, 0x3FFEFF00, 0x7981F800, 0x431FFFFC, 0x4100C000, 0x3D87EFFF, 0x4103FEFE, 0x3C000007, 0x3F01F7FF, 0x4E6C6B5C, 0x4187FFFE, 0x458B9F13, 0x4F88007F, 0x5F004007, 0x37FFD7FE, 0x7E8001FB, 0x46EFFBFF, 0x31C10000, 0x5B428661, 0x33F89B1F, 0x23BFEFFF, 0x537BFFBE }; static void time_az_float32_pos( float32 function( float32 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { 
for ( i = minIterations; i; --i ) { function( inputs_float32_pos[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float32_pos[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float32 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } enum { numInputs_float64 = 32 }; static const float64 inputs_float64[ numInputs_float64 ] = { LIT64( 0x422FFFC008000000 ), LIT64( 0xB7E0000480000000 ), LIT64( 0xF3FD2546120B7935 ), LIT64( 0x3FF0000000000000 ), LIT64( 0xCE07F766F09588D6 ), LIT64( 0x8000000000000000 ), LIT64( 0x3FCE000400000000 ), LIT64( 0x8313B60F0032BED8 ), LIT64( 0xC1EFFFFFC0002000 ), LIT64( 0x3FB3C75D224F2B0F ), LIT64( 0x7FD00000004000FF ), LIT64( 0xA12FFF8000001FFF ), LIT64( 0x3EE0000000FE0000 ), LIT64( 0x0010000080000004 ), LIT64( 0x41CFFFFE00000020 ), LIT64( 0x40303FFFFFFFFFFD ), LIT64( 0x3FD000003FEFFFFF ), LIT64( 0xBFD0000010000000 ), LIT64( 0xB7FC6B5C16CA55CF ), LIT64( 0x413EEB940B9D1301 ), LIT64( 0xC7E00200001FFFFF ), LIT64( 0x47F00021FFFFFFFE ), LIT64( 0xBFFFFFFFF80000FF ), LIT64( 0xC07FFFFFE00FFFFF ), LIT64( 0x001497A63740C5E8 ), LIT64( 0xC4BFFFE0001FFFFF ), LIT64( 0x96FFDFFEFFFFFFFF ), LIT64( 0x403FC000000001FE ), LIT64( 0xFFD00000000001F6 ), LIT64( 0x0640400002000000 ), LIT64( 0x479CEE1E4F789FE0 ), LIT64( 0xC237FFFFFFFFFDFE ) }; static void time_a_float64_z_int32( int32 function( float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( 
numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_float64_z_int64( int64 function( float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_float64_z_float32( float32 function( float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #ifdef FLOATX80 static void time_a_float64_z_floatx80( floatx80 function( float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif #ifdef FLOAT128 
static void time_a_float64_z_float128( float128 function( float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif static void time_az_float64( float64 function( float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_ab_float64_z_flag( flag function( float64, float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNumA, inputNumB; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 
1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_abz_float64( float64 function( float64, float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNumA, inputNumB; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64[ inputNumA ], inputs_float64[ inputNumB ] ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float64 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static const float64 inputs_float64_pos[ numInputs_float64 ] = { LIT64( 0x422FFFC008000000 ), LIT64( 0x37E0000480000000 ), LIT64( 0x73FD2546120B7935 ), LIT64( 0x3FF0000000000000 ), LIT64( 0x4E07F766F09588D6 ), LIT64( 0x0000000000000000 ), LIT64( 0x3FCE000400000000 ), LIT64( 0x0313B60F0032BED8 ), LIT64( 0x41EFFFFFC0002000 ), LIT64( 0x3FB3C75D224F2B0F ), LIT64( 0x7FD00000004000FF ), LIT64( 0x212FFF8000001FFF ), LIT64( 0x3EE0000000FE0000 ), LIT64( 0x0010000080000004 ), LIT64( 0x41CFFFFE00000020 ), LIT64( 0x40303FFFFFFFFFFD ), LIT64( 0x3FD000003FEFFFFF ), LIT64( 0x3FD0000010000000 ), LIT64( 0x37FC6B5C16CA55CF ), LIT64( 0x413EEB940B9D1301 ), LIT64( 0x47E00200001FFFFF ), LIT64( 0x47F00021FFFFFFFE ), LIT64( 0x3FFFFFFFF80000FF ), LIT64( 0x407FFFFFE00FFFFF ), LIT64( 0x001497A63740C5E8 ), LIT64( 0x44BFFFE0001FFFFF ), LIT64( 0x16FFDFFEFFFFFFFF ), LIT64( 0x403FC000000001FE ), LIT64( 0x7FD00000000001F6 ), LIT64( 
0x0640400002000000 ), LIT64( 0x479CEE1E4F789FE0 ), LIT64( 0x4237FFFFFFFFFDFE ) }; static void time_az_float64_pos( float64 function( float64 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { function( inputs_float64_pos[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { function( inputs_float64_pos[ inputNum ] ); inputNum = ( inputNum + 1 ) & ( numInputs_float64 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #ifdef FLOATX80 enum { numInputs_floatx80 = 32 }; static const struct { bits16 high; bits64 low; } inputs_floatx80[ numInputs_floatx80 ] = { { 0xC03F, LIT64( 0xA9BE15A19C1E8B62 ) }, { 0x8000, LIT64( 0x0000000000000000 ) }, { 0x75A8, LIT64( 0xE59591E4788957A5 ) }, { 0xBFFF, LIT64( 0xFFF0000000000040 ) }, { 0x0CD8, LIT64( 0xFC000000000007FE ) }, { 0x43BA, LIT64( 0x99A4000000000000 ) }, { 0x3FFF, LIT64( 0x8000000000000000 ) }, { 0x4081, LIT64( 0x94FBF1BCEB5545F0 ) }, { 0x403E, LIT64( 0xFFF0000000002000 ) }, { 0x3FFE, LIT64( 0xC860E3C75D224F28 ) }, { 0x407E, LIT64( 0xFC00000FFFFFFFFE ) }, { 0x737A, LIT64( 0x800000007FFDFFFE ) }, { 0x4044, LIT64( 0xFFFFFF80000FFFFF ) }, { 0xBBFE, LIT64( 0x8000040000001FFE ) }, { 0xC002, LIT64( 0xFF80000000000020 ) }, { 0xDE8D, LIT64( 0xFFFFFFFFFFE00004 ) }, { 0xC004, LIT64( 0x8000000000003FFB ) }, { 0x407F, LIT64( 0x800000000003FFFE ) }, { 0xC000, LIT64( 0xA459EE6A5C16CA55 ) }, { 0x8003, LIT64( 0xC42CBF7399AEEB94 ) }, { 0xBF7F, LIT64( 0xF800000000000006 ) }, { 0xC07F, LIT64( 0xBF56BE8871F28FEA ) }, { 0xC07E, LIT64( 0xFFFF77FFFFFFFFFE ) }, { 0xADC9, LIT64( 0x8000000FFFFFFFDE ) }, { 0xC001, LIT64( 0xEFF7FFFFFFFFFFFF ) }, { 0x4001, LIT64( 0xBE84F30125C497A6 ) }, { 0xC06B, LIT64( 0xEFFFFFFFFFFFFFFF ) }, { 0x4080, LIT64( 0xFFFFFFFFBFFFFFFF ) }, { 
0x87E9, LIT64( 0x81FFFFFFFFFFFBFF ) }, { 0xA63F, LIT64( 0x801FFFFFFEFFFFFE ) }, { 0x403C, LIT64( 0x801FFFFFFFF7FFFF ) }, { 0x4018, LIT64( 0x8000000000080003 ) } }; static void time_a_floatx80_z_int32( int32 function( floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; floatx80 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_floatx80_z_int64( int64 function( floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; floatx80 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_floatx80_z_float32( float32 function( floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; floatx80 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); 
inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_floatx80_z_float64( float64 function( floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; floatx80 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #ifdef FLOAT128 static void time_a_floatx80_z_float128( float128 function( floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; floatx80 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif static void time_az_floatx80( floatx80 
function( floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; floatx80 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNum ].low; a.high = inputs_floatx80[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_ab_floatx80_z_flag( flag function( floatx80, floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNumA, inputNumB; floatx80 a, b; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNumA ].low; a.high = inputs_floatx80[ inputNumA ].high; b.low = inputs_floatx80[ inputNumB ].low; b.high = inputs_floatx80[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNumA ].low; a.high = inputs_floatx80[ inputNumA ].high; b.low = inputs_floatx80[ inputNumB ].low; b.high = inputs_floatx80[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_abz_floatx80( floatx80 function( floatx80, floatx80 ) ) { clock_t startClock, endClock; 
int32 count, i; int8 inputNumA, inputNumB; floatx80 a, b; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80[ inputNumA ].low; a.high = inputs_floatx80[ inputNumA ].high; b.low = inputs_floatx80[ inputNumB ].low; b.high = inputs_floatx80[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80[ inputNumA ].low; a.high = inputs_floatx80[ inputNumA ].high; b.low = inputs_floatx80[ inputNumB ].low; b.high = inputs_floatx80[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static const struct { bits16 high; bits64 low; } inputs_floatx80_pos[ numInputs_floatx80 ] = { { 0x403F, LIT64( 0xA9BE15A19C1E8B62 ) }, { 0x0000, LIT64( 0x0000000000000000 ) }, { 0x75A8, LIT64( 0xE59591E4788957A5 ) }, { 0x3FFF, LIT64( 0xFFF0000000000040 ) }, { 0x0CD8, LIT64( 0xFC000000000007FE ) }, { 0x43BA, LIT64( 0x99A4000000000000 ) }, { 0x3FFF, LIT64( 0x8000000000000000 ) }, { 0x4081, LIT64( 0x94FBF1BCEB5545F0 ) }, { 0x403E, LIT64( 0xFFF0000000002000 ) }, { 0x3FFE, LIT64( 0xC860E3C75D224F28 ) }, { 0x407E, LIT64( 0xFC00000FFFFFFFFE ) }, { 0x737A, LIT64( 0x800000007FFDFFFE ) }, { 0x4044, LIT64( 0xFFFFFF80000FFFFF ) }, { 0x3BFE, LIT64( 0x8000040000001FFE ) }, { 0x4002, LIT64( 0xFF80000000000020 ) }, { 0x5E8D, LIT64( 0xFFFFFFFFFFE00004 ) }, { 0x4004, LIT64( 0x8000000000003FFB ) }, { 0x407F, LIT64( 0x800000000003FFFE ) }, { 0x4000, LIT64( 0xA459EE6A5C16CA55 ) }, { 0x0003, LIT64( 0xC42CBF7399AEEB94 ) }, { 
0x3F7F, LIT64( 0xF800000000000006 ) }, { 0x407F, LIT64( 0xBF56BE8871F28FEA ) }, { 0x407E, LIT64( 0xFFFF77FFFFFFFFFE ) }, { 0x2DC9, LIT64( 0x8000000FFFFFFFDE ) }, { 0x4001, LIT64( 0xEFF7FFFFFFFFFFFF ) }, { 0x4001, LIT64( 0xBE84F30125C497A6 ) }, { 0x406B, LIT64( 0xEFFFFFFFFFFFFFFF ) }, { 0x4080, LIT64( 0xFFFFFFFFBFFFFFFF ) }, { 0x07E9, LIT64( 0x81FFFFFFFFFFFBFF ) }, { 0x263F, LIT64( 0x801FFFFFFEFFFFFE ) }, { 0x403C, LIT64( 0x801FFFFFFFF7FFFF ) }, { 0x4018, LIT64( 0x8000000000080003 ) } }; static void time_az_floatx80_pos( floatx80 function( floatx80 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; floatx80 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_floatx80_pos[ inputNum ].low; a.high = inputs_floatx80_pos[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_floatx80_pos[ inputNum ].low; a.high = inputs_floatx80_pos[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif #ifdef FLOAT128 enum { numInputs_float128 = 32 }; static const struct { bits64 high, low; } inputs_float128[ numInputs_float128 ] = { { LIT64( 0x3FDA200000100000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x3FFF000000000000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x85F14776190C8306 ), LIT64( 0xD8715F4E3D54BB92 ) }, { LIT64( 0xF2B00000007FFFFF ), LIT64( 0xFFFFFFFFFFF7FFFF ) }, { LIT64( 0x8000000000000000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0xBFFFFFFFFFE00000 ), LIT64( 0x0000008000000000 ) }, { LIT64( 0x407F1719CE722F3E ), LIT64( 0xDA6B3FE5FF29425B ) }, { LIT64( 0x43FFFF8000000000 ), LIT64( 0x0000000000400000 ) }, { LIT64( 0x401E000000000100 ), LIT64( 0x0000000000002000 ) }, { LIT64( 0x3FFED71DACDA8E47 ), LIT64( 
0x4860E3C75D224F28 ) }, { LIT64( 0xBF7ECFC1E90647D1 ), LIT64( 0x7A124FE55623EE44 ) }, { LIT64( 0x0DF7007FFFFFFFFF ), LIT64( 0xFFFFFFFFEFFFFFFF ) }, { LIT64( 0x3FE5FFEFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFEFFF ) }, { LIT64( 0x403FFFFFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFFBFE ) }, { LIT64( 0xBFFB2FBF7399AFEB ), LIT64( 0xA459EE6A5C16CA55 ) }, { LIT64( 0xBDB8FFFFFFFFFFFC ), LIT64( 0x0000000000000400 ) }, { LIT64( 0x3FC8FFDFFFFFFFFF ), LIT64( 0xFFFFFFFFF0000000 ) }, { LIT64( 0x3FFBFFFFFFDFFFFF ), LIT64( 0xFFF8000000000000 ) }, { LIT64( 0x407043C11737BE84 ), LIT64( 0xDDD58212ADC937F4 ) }, { LIT64( 0x8001000000000000 ), LIT64( 0x0000001000000001 ) }, { LIT64( 0xC036FFFFFFFFFFFF ), LIT64( 0xFE40000000000000 ) }, { LIT64( 0x4002FFFFFE000002 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x4000C3FEDE897773 ), LIT64( 0x326AC4FD8EFBE6DC ) }, { LIT64( 0xBFFF0000000FFFFF ), LIT64( 0xFFFFFE0000000000 ) }, { LIT64( 0x62C3E502146E426D ), LIT64( 0x43F3CAA0DC7DF1A0 ) }, { LIT64( 0xB5CBD32E52BB570E ), LIT64( 0xBCC477CB11C6236C ) }, { LIT64( 0xE228FFFFFFC00000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x3F80000000000000 ), LIT64( 0x0000000080000008 ) }, { LIT64( 0xC1AFFFDFFFFFFFFF ), LIT64( 0xFFFC000000000000 ) }, { LIT64( 0xC96F000000000000 ), LIT64( 0x00000001FFFBFFFF ) }, { LIT64( 0x3DE09BFE7923A338 ), LIT64( 0xBCC8FBBD7CEC1F4F ) }, { LIT64( 0x401CFFFFFFFFFFFF ), LIT64( 0xFFFFFFFEFFFFFF80 ) } }; static void time_a_float128_z_int32( int32 function( float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; float128 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum 
].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_float128_z_int64( int64 function( float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; float128 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_float128_z_float32( float32 function( float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; float128 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_a_float128_z_float64( float64 function( float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; float128 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = 
( inputNum + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #ifdef FLOATX80 static void time_a_float128_z_floatx80( floatx80 function( float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; float128 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif static void time_az_float128( float128 function( float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; float128 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNum ].low; a.high = inputs_float128[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_ab_float128_z_flag( flag function( 
float128, float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNumA, inputNumB; float128 a, b; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNumA ].low; a.high = inputs_float128[ inputNumA ].high; b.low = inputs_float128[ inputNumB ].low; b.high = inputs_float128[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNumA ].low; a.high = inputs_float128[ inputNumA ].high; b.low = inputs_float128[ inputNumB ].low; b.high = inputs_float128[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static void time_abz_float128( float128 function( float128, float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNumA, inputNumB; float128 a, b; count = 0; inputNumA = 0; inputNumB = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128[ inputNumA ].low; a.high = inputs_float128[ inputNumA ].high; b.low = inputs_float128[ inputNumB ].low; b.high = inputs_float128[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNumA = 0; inputNumB = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128[ inputNumA ].low; a.high = inputs_float128[ inputNumA ].high; b.low = 
inputs_float128[ inputNumB ].low; b.high = inputs_float128[ inputNumB ].high; function( a, b ); inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 ); if ( inputNumA == 0 ) ++inputNumB; inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } static const struct { bits64 high, low; } inputs_float128_pos[ numInputs_float128 ] = { { LIT64( 0x3FDA200000100000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x3FFF000000000000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x05F14776190C8306 ), LIT64( 0xD8715F4E3D54BB92 ) }, { LIT64( 0x72B00000007FFFFF ), LIT64( 0xFFFFFFFFFFF7FFFF ) }, { LIT64( 0x0000000000000000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x3FFFFFFFFFE00000 ), LIT64( 0x0000008000000000 ) }, { LIT64( 0x407F1719CE722F3E ), LIT64( 0xDA6B3FE5FF29425B ) }, { LIT64( 0x43FFFF8000000000 ), LIT64( 0x0000000000400000 ) }, { LIT64( 0x401E000000000100 ), LIT64( 0x0000000000002000 ) }, { LIT64( 0x3FFED71DACDA8E47 ), LIT64( 0x4860E3C75D224F28 ) }, { LIT64( 0x3F7ECFC1E90647D1 ), LIT64( 0x7A124FE55623EE44 ) }, { LIT64( 0x0DF7007FFFFFFFFF ), LIT64( 0xFFFFFFFFEFFFFFFF ) }, { LIT64( 0x3FE5FFEFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFEFFF ) }, { LIT64( 0x403FFFFFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFFBFE ) }, { LIT64( 0x3FFB2FBF7399AFEB ), LIT64( 0xA459EE6A5C16CA55 ) }, { LIT64( 0x3DB8FFFFFFFFFFFC ), LIT64( 0x0000000000000400 ) }, { LIT64( 0x3FC8FFDFFFFFFFFF ), LIT64( 0xFFFFFFFFF0000000 ) }, { LIT64( 0x3FFBFFFFFFDFFFFF ), LIT64( 0xFFF8000000000000 ) }, { LIT64( 0x407043C11737BE84 ), LIT64( 0xDDD58212ADC937F4 ) }, { LIT64( 0x0001000000000000 ), LIT64( 0x0000001000000001 ) }, { LIT64( 0x4036FFFFFFFFFFFF ), LIT64( 0xFE40000000000000 ) }, { LIT64( 0x4002FFFFFE000002 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x4000C3FEDE897773 ), LIT64( 0x326AC4FD8EFBE6DC ) }, { LIT64( 0x3FFF0000000FFFFF ), LIT64( 0xFFFFFE0000000000 ) }, { LIT64( 0x62C3E502146E426D ), LIT64( 0x43F3CAA0DC7DF1A0 ) }, { LIT64( 0x35CBD32E52BB570E ), LIT64( 
0xBCC477CB11C6236C ) }, { LIT64( 0x6228FFFFFFC00000 ), LIT64( 0x0000000000000000 ) }, { LIT64( 0x3F80000000000000 ), LIT64( 0x0000000080000008 ) }, { LIT64( 0x41AFFFDFFFFFFFFF ), LIT64( 0xFFFC000000000000 ) }, { LIT64( 0x496F000000000000 ), LIT64( 0x00000001FFFBFFFF ) }, { LIT64( 0x3DE09BFE7923A338 ), LIT64( 0xBCC8FBBD7CEC1F4F ) }, { LIT64( 0x401CFFFFFFFFFFFF ), LIT64( 0xFFFFFFFEFFFFFF80 ) } }; static void time_az_float128_pos( float128 function( float128 ) ) { clock_t startClock, endClock; int32 count, i; int8 inputNum; float128 a; count = 0; inputNum = 0; startClock = clock(); do { for ( i = minIterations; i; --i ) { a.low = inputs_float128_pos[ inputNum ].low; a.high = inputs_float128_pos[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } count += minIterations; } while ( clock() - startClock < CLOCKS_PER_SEC ); inputNum = 0; startClock = clock(); for ( i = count; i; --i ) { a.low = inputs_float128_pos[ inputNum ].low; a.high = inputs_float128_pos[ inputNum ].high; function( a ); inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 ); } endClock = clock(); reportTime( count, endClock - startClock ); } #endif enum { INT32_TO_FLOAT32 = 1, INT32_TO_FLOAT64, #ifdef FLOATX80 INT32_TO_FLOATX80, #endif #ifdef FLOAT128 INT32_TO_FLOAT128, #endif INT64_TO_FLOAT32, INT64_TO_FLOAT64, #ifdef FLOATX80 INT64_TO_FLOATX80, #endif #ifdef FLOAT128 INT64_TO_FLOAT128, #endif FLOAT32_TO_INT32, FLOAT32_TO_INT32_ROUND_TO_ZERO, FLOAT32_TO_INT64, FLOAT32_TO_INT64_ROUND_TO_ZERO, FLOAT32_TO_FLOAT64, #ifdef FLOATX80 FLOAT32_TO_FLOATX80, #endif #ifdef FLOAT128 FLOAT32_TO_FLOAT128, #endif FLOAT32_ROUND_TO_INT, FLOAT32_ADD, FLOAT32_SUB, FLOAT32_MUL, FLOAT32_DIV, FLOAT32_REM, FLOAT32_SQRT, FLOAT32_EQ, FLOAT32_LE, FLOAT32_LT, FLOAT32_EQ_SIGNALING, FLOAT32_LE_QUIET, FLOAT32_LT_QUIET, FLOAT64_TO_INT32, FLOAT64_TO_INT32_ROUND_TO_ZERO, FLOAT64_TO_INT64, FLOAT64_TO_INT64_ROUND_TO_ZERO, FLOAT64_TO_FLOAT32, #ifdef FLOATX80 FLOAT64_TO_FLOATX80, #endif #ifdef 
FLOAT128 FLOAT64_TO_FLOAT128, #endif FLOAT64_ROUND_TO_INT, FLOAT64_ADD, FLOAT64_SUB, FLOAT64_MUL, FLOAT64_DIV, FLOAT64_REM, FLOAT64_SQRT, FLOAT64_EQ, FLOAT64_LE, FLOAT64_LT, FLOAT64_EQ_SIGNALING, FLOAT64_LE_QUIET, FLOAT64_LT_QUIET, #ifdef FLOATX80 FLOATX80_TO_INT32, FLOATX80_TO_INT32_ROUND_TO_ZERO, FLOATX80_TO_INT64, FLOATX80_TO_INT64_ROUND_TO_ZERO, FLOATX80_TO_FLOAT32, FLOATX80_TO_FLOAT64, #ifdef FLOAT128 FLOATX80_TO_FLOAT128, #endif FLOATX80_ROUND_TO_INT, FLOATX80_ADD, FLOATX80_SUB, FLOATX80_MUL, FLOATX80_DIV, FLOATX80_REM, FLOATX80_SQRT, FLOATX80_EQ, FLOATX80_LE, FLOATX80_LT, FLOATX80_EQ_SIGNALING, FLOATX80_LE_QUIET, FLOATX80_LT_QUIET, #endif #ifdef FLOAT128 FLOAT128_TO_INT32, FLOAT128_TO_INT32_ROUND_TO_ZERO, FLOAT128_TO_INT64, FLOAT128_TO_INT64_ROUND_TO_ZERO, FLOAT128_TO_FLOAT32, FLOAT128_TO_FLOAT64, #ifdef FLOATX80 FLOAT128_TO_FLOATX80, #endif FLOAT128_ROUND_TO_INT, FLOAT128_ADD, FLOAT128_SUB, FLOAT128_MUL, FLOAT128_DIV, FLOAT128_REM, FLOAT128_SQRT, FLOAT128_EQ, FLOAT128_LE, FLOAT128_LT, FLOAT128_EQ_SIGNALING, FLOAT128_LE_QUIET, FLOAT128_LT_QUIET, #endif NUM_FUNCTIONS }; static struct { char *name; int8 numInputs; flag roundingPrecision, roundingMode; flag tininessMode, tininessModeAtReducedPrecision; } functions[ NUM_FUNCTIONS ] = { { 0, 0, 0, 0, 0, 0 }, { "int32_to_float32", 1, FALSE, TRUE, FALSE, FALSE }, { "int32_to_float64", 1, FALSE, FALSE, FALSE, FALSE }, #ifdef FLOATX80 { "int32_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, #endif #ifdef FLOAT128 { "int32_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, #endif { "int64_to_float32", 1, FALSE, TRUE, FALSE, FALSE }, { "int64_to_float64", 1, FALSE, TRUE, FALSE, FALSE }, #ifdef FLOATX80 { "int64_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, #endif #ifdef FLOAT128 { "int64_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, #endif { "float32_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, { "float32_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "float32_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, { 
"float32_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "float32_to_float64", 1, FALSE, FALSE, FALSE, FALSE }, #ifdef FLOATX80 { "float32_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, #endif #ifdef FLOAT128 { "float32_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, #endif { "float32_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, { "float32_add", 2, FALSE, TRUE, FALSE, FALSE }, { "float32_sub", 2, FALSE, TRUE, FALSE, FALSE }, { "float32_mul", 2, FALSE, TRUE, TRUE, FALSE }, { "float32_div", 2, FALSE, TRUE, FALSE, FALSE }, { "float32_rem", 2, FALSE, FALSE, FALSE, FALSE }, { "float32_sqrt", 1, FALSE, TRUE, FALSE, FALSE }, { "float32_eq", 2, FALSE, FALSE, FALSE, FALSE }, { "float32_le", 2, FALSE, FALSE, FALSE, FALSE }, { "float32_lt", 2, FALSE, FALSE, FALSE, FALSE }, { "float32_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, { "float32_le_quiet", 2, FALSE, FALSE, FALSE, FALSE }, { "float32_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, { "float64_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, { "float64_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "float64_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, { "float64_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "float64_to_float32", 1, FALSE, TRUE, TRUE, FALSE }, #ifdef FLOATX80 { "float64_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE }, #endif #ifdef FLOAT128 { "float64_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, #endif { "float64_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, { "float64_add", 2, FALSE, TRUE, FALSE, FALSE }, { "float64_sub", 2, FALSE, TRUE, FALSE, FALSE }, { "float64_mul", 2, FALSE, TRUE, TRUE, FALSE }, { "float64_div", 2, FALSE, TRUE, FALSE, FALSE }, { "float64_rem", 2, FALSE, FALSE, FALSE, FALSE }, { "float64_sqrt", 1, FALSE, TRUE, FALSE, FALSE }, { "float64_eq", 2, FALSE, FALSE, FALSE, FALSE }, { "float64_le", 2, FALSE, FALSE, FALSE, FALSE }, { "float64_lt", 2, FALSE, FALSE, FALSE, FALSE }, { "float64_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, { "float64_le_quiet", 
2, FALSE, FALSE, FALSE, FALSE }, { "float64_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, #ifdef FLOATX80 { "floatx80_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, { "floatx80_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "floatx80_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, { "floatx80_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "floatx80_to_float32", 1, FALSE, TRUE, TRUE, FALSE }, { "floatx80_to_float64", 1, FALSE, TRUE, TRUE, FALSE }, #ifdef FLOAT128 { "floatx80_to_float128", 1, FALSE, FALSE, FALSE, FALSE }, #endif { "floatx80_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, { "floatx80_add", 2, TRUE, TRUE, FALSE, TRUE }, { "floatx80_sub", 2, TRUE, TRUE, FALSE, TRUE }, { "floatx80_mul", 2, TRUE, TRUE, TRUE, TRUE }, { "floatx80_div", 2, TRUE, TRUE, FALSE, TRUE }, { "floatx80_rem", 2, FALSE, FALSE, FALSE, FALSE }, { "floatx80_sqrt", 1, TRUE, TRUE, FALSE, FALSE }, { "floatx80_eq", 2, FALSE, FALSE, FALSE, FALSE }, { "floatx80_le", 2, FALSE, FALSE, FALSE, FALSE }, { "floatx80_lt", 2, FALSE, FALSE, FALSE, FALSE }, { "floatx80_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, { "floatx80_le_quiet", 2, FALSE, FALSE, FALSE, FALSE }, { "floatx80_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, #endif #ifdef FLOAT128 { "float128_to_int32", 1, FALSE, TRUE, FALSE, FALSE }, { "float128_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "float128_to_int64", 1, FALSE, TRUE, FALSE, FALSE }, { "float128_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE }, { "float128_to_float32", 1, FALSE, TRUE, TRUE, FALSE }, { "float128_to_float64", 1, FALSE, TRUE, TRUE, FALSE }, #ifdef FLOATX80 { "float128_to_floatx80", 1, FALSE, TRUE, TRUE, FALSE }, #endif { "float128_round_to_int", 1, FALSE, TRUE, FALSE, FALSE }, { "float128_add", 2, FALSE, TRUE, FALSE, FALSE }, { "float128_sub", 2, FALSE, TRUE, FALSE, FALSE }, { "float128_mul", 2, FALSE, TRUE, TRUE, FALSE }, { "float128_div", 2, FALSE, TRUE, FALSE, FALSE }, { "float128_rem", 2, FALSE, FALSE, FALSE, FALSE }, { 
"float128_sqrt", 1, FALSE, TRUE, FALSE, FALSE }, { "float128_eq", 2, FALSE, FALSE, FALSE, FALSE }, { "float128_le", 2, FALSE, FALSE, FALSE, FALSE }, { "float128_lt", 2, FALSE, FALSE, FALSE, FALSE }, { "float128_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE }, { "float128_le_quiet", 2, FALSE, FALSE, FALSE, FALSE }, { "float128_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE }, #endif }; enum { ROUND_NEAREST_EVEN = 1, ROUND_TO_ZERO, ROUND_DOWN, ROUND_UP, NUM_ROUNDINGMODES }; enum { TININESS_BEFORE_ROUNDING = 1, TININESS_AFTER_ROUNDING, NUM_TININESSMODES }; static void timeFunctionVariety( uint8 functionCode, int8 roundingPrecision, int8 roundingMode, int8 tininessMode ) { uint8 roundingCode; int8 tininessCode; functionName = functions[ functionCode ].name; if ( roundingPrecision == 32 ) { roundingPrecisionName = "32"; } else if ( roundingPrecision == 64 ) { roundingPrecisionName = "64"; } else if ( roundingPrecision == 80 ) { roundingPrecisionName = "80"; } else { roundingPrecisionName = 0; } #ifdef FLOATX80 floatx80_rounding_precision = roundingPrecision; #endif switch ( roundingMode ) { case 0: roundingModeName = 0; roundingCode = float_round_nearest_even; break; case ROUND_NEAREST_EVEN: roundingModeName = "nearest_even"; roundingCode = float_round_nearest_even; break; case ROUND_TO_ZERO: roundingModeName = "to_zero"; roundingCode = float_round_to_zero; break; case ROUND_DOWN: roundingModeName = "down"; roundingCode = float_round_down; break; case ROUND_UP: roundingModeName = "up"; roundingCode = float_round_up; break; } float_rounding_mode = roundingCode; switch ( tininessMode ) { case 0: tininessModeName = 0; tininessCode = float_tininess_after_rounding; break; case TININESS_BEFORE_ROUNDING: tininessModeName = "before"; tininessCode = float_tininess_before_rounding; break; case TININESS_AFTER_ROUNDING: tininessModeName = "after"; tininessCode = float_tininess_after_rounding; break; } float_detect_tininess = tininessCode; switch ( functionCode ) { case INT32_TO_FLOAT32: 
time_a_int32_z_float32( int32_to_float32 ); break;
     /*
      * Each case hands the SoftFloat routine matching the function code to
      * the timer whose operand/result signature fits it.
      */
     case INT32_TO_FLOAT64: time_a_int32_z_float64( int32_to_float64 ); break;
#ifdef FLOATX80
     case INT32_TO_FLOATX80: time_a_int32_z_floatx80( int32_to_floatx80 ); break;
#endif
#ifdef FLOAT128
     case INT32_TO_FLOAT128: time_a_int32_z_float128( int32_to_float128 ); break;
#endif
     case INT64_TO_FLOAT32: time_a_int64_z_float32( int64_to_float32 ); break;
     case INT64_TO_FLOAT64: time_a_int64_z_float64( int64_to_float64 ); break;
#ifdef FLOATX80
     case INT64_TO_FLOATX80: time_a_int64_z_floatx80( int64_to_floatx80 ); break;
#endif
#ifdef FLOAT128
     case INT64_TO_FLOAT128: time_a_int64_z_float128( int64_to_float128 ); break;
#endif
     /* float32 operations. */
     case FLOAT32_TO_INT32: time_a_float32_z_int32( float32_to_int32 ); break;
     case FLOAT32_TO_INT32_ROUND_TO_ZERO: time_a_float32_z_int32( float32_to_int32_round_to_zero ); break;
     case FLOAT32_TO_INT64: time_a_float32_z_int64( float32_to_int64 ); break;
     case FLOAT32_TO_INT64_ROUND_TO_ZERO: time_a_float32_z_int64( float32_to_int64_round_to_zero ); break;
     case FLOAT32_TO_FLOAT64: time_a_float32_z_float64( float32_to_float64 ); break;
#ifdef FLOATX80
     case FLOAT32_TO_FLOATX80: time_a_float32_z_floatx80( float32_to_floatx80 ); break;
#endif
#ifdef FLOAT128
     case FLOAT32_TO_FLOAT128: time_a_float32_z_float128( float32_to_float128 ); break;
#endif
     case FLOAT32_ROUND_TO_INT: time_az_float32( float32_round_to_int ); break;
     case FLOAT32_ADD: time_abz_float32( float32_add ); break;
     case FLOAT32_SUB: time_abz_float32( float32_sub ); break;
     case FLOAT32_MUL: time_abz_float32( float32_mul ); break;
     case FLOAT32_DIV: time_abz_float32( float32_div ); break;
     case FLOAT32_REM: time_abz_float32( float32_rem ); break;
     /* Square roots are timed with the *_pos operand tables. */
     case FLOAT32_SQRT: time_az_float32_pos( float32_sqrt ); break;
     case FLOAT32_EQ: time_ab_float32_z_flag( float32_eq ); break;
     case FLOAT32_LE: time_ab_float32_z_flag( float32_le ); break;
     case FLOAT32_LT: time_ab_float32_z_flag( float32_lt ); break;
     case FLOAT32_EQ_SIGNALING: time_ab_float32_z_flag( float32_eq_signaling ); break;
     case FLOAT32_LE_QUIET: time_ab_float32_z_flag( float32_le_quiet ); break;
     case FLOAT32_LT_QUIET: time_ab_float32_z_flag( float32_lt_quiet ); break;
     /* float64 operations. */
     case FLOAT64_TO_INT32: time_a_float64_z_int32( float64_to_int32 ); break;
     case FLOAT64_TO_INT32_ROUND_TO_ZERO: time_a_float64_z_int32( float64_to_int32_round_to_zero ); break;
     case FLOAT64_TO_INT64: time_a_float64_z_int64( float64_to_int64 ); break;
     case FLOAT64_TO_INT64_ROUND_TO_ZERO: time_a_float64_z_int64( float64_to_int64_round_to_zero ); break;
     case FLOAT64_TO_FLOAT32: time_a_float64_z_float32( float64_to_float32 ); break;
#ifdef FLOATX80
     case FLOAT64_TO_FLOATX80: time_a_float64_z_floatx80( float64_to_floatx80 ); break;
#endif
#ifdef FLOAT128
     case FLOAT64_TO_FLOAT128: time_a_float64_z_float128( float64_to_float128 ); break;
#endif
     case FLOAT64_ROUND_TO_INT: time_az_float64( float64_round_to_int ); break;
     case FLOAT64_ADD: time_abz_float64( float64_add ); break;
     case FLOAT64_SUB: time_abz_float64( float64_sub ); break;
     case FLOAT64_MUL: time_abz_float64( float64_mul ); break;
     case FLOAT64_DIV: time_abz_float64( float64_div ); break;
     case FLOAT64_REM: time_abz_float64( float64_rem ); break;
     case FLOAT64_SQRT: time_az_float64_pos( float64_sqrt ); break;
     case FLOAT64_EQ: time_ab_float64_z_flag( float64_eq ); break;
     case FLOAT64_LE: time_ab_float64_z_flag( float64_le ); break;
     case FLOAT64_LT: time_ab_float64_z_flag( float64_lt ); break;
     case FLOAT64_EQ_SIGNALING: time_ab_float64_z_flag( float64_eq_signaling ); break;
     case FLOAT64_LE_QUIET: time_ab_float64_z_flag( float64_le_quiet ); break;
     case FLOAT64_LT_QUIET: time_ab_float64_z_flag( float64_lt_quiet ); break;
#ifdef FLOATX80
     /* floatx80 operations. */
     case FLOATX80_TO_INT32: time_a_floatx80_z_int32( floatx80_to_int32 ); break;
     case FLOATX80_TO_INT32_ROUND_TO_ZERO: time_a_floatx80_z_int32( floatx80_to_int32_round_to_zero ); break;
     case FLOATX80_TO_INT64: time_a_floatx80_z_int64( floatx80_to_int64 ); break;
     case FLOATX80_TO_INT64_ROUND_TO_ZERO: time_a_floatx80_z_int64( floatx80_to_int64_round_to_zero ); break;
     case FLOATX80_TO_FLOAT32: time_a_floatx80_z_float32( floatx80_to_float32 ); break;
     case FLOATX80_TO_FLOAT64: time_a_floatx80_z_float64( floatx80_to_float64 ); break;
#ifdef FLOAT128
     case FLOATX80_TO_FLOAT128: time_a_floatx80_z_float128( floatx80_to_float128 ); break;
#endif
     case FLOATX80_ROUND_TO_INT: time_az_floatx80( floatx80_round_to_int ); break;
     case FLOATX80_ADD: time_abz_floatx80( floatx80_add ); break;
     case FLOATX80_SUB: time_abz_floatx80( floatx80_sub ); break;
     case FLOATX80_MUL: time_abz_floatx80( floatx80_mul ); break;
     case FLOATX80_DIV: time_abz_floatx80( floatx80_div ); break;
     case FLOATX80_REM: time_abz_floatx80( floatx80_rem ); break;
     case FLOATX80_SQRT: time_az_floatx80_pos( floatx80_sqrt ); break;
     case FLOATX80_EQ: time_ab_floatx80_z_flag( floatx80_eq ); break;
     case FLOATX80_LE: time_ab_floatx80_z_flag( floatx80_le ); break;
     case FLOATX80_LT: time_ab_floatx80_z_flag( floatx80_lt ); break;
     case FLOATX80_EQ_SIGNALING: time_ab_floatx80_z_flag( floatx80_eq_signaling ); break;
     case FLOATX80_LE_QUIET: time_ab_floatx80_z_flag( floatx80_le_quiet ); break;
     case FLOATX80_LT_QUIET: time_ab_floatx80_z_flag( floatx80_lt_quiet ); break;
#endif
#ifdef FLOAT128
     /* float128 operations. */
     case FLOAT128_TO_INT32: time_a_float128_z_int32( float128_to_int32 ); break;
     case FLOAT128_TO_INT32_ROUND_TO_ZERO: time_a_float128_z_int32( float128_to_int32_round_to_zero ); break;
     case FLOAT128_TO_INT64: time_a_float128_z_int64( float128_to_int64 ); break;
     case FLOAT128_TO_INT64_ROUND_TO_ZERO: time_a_float128_z_int64( float128_to_int64_round_to_zero ); break;
     case FLOAT128_TO_FLOAT32: time_a_float128_z_float32( float128_to_float32 ); break;
     case FLOAT128_TO_FLOAT64: time_a_float128_z_float64( float128_to_float64 ); break;
#ifdef FLOATX80
     case FLOAT128_TO_FLOATX80: time_a_float128_z_floatx80( float128_to_floatx80 ); break;
#endif
     case FLOAT128_ROUND_TO_INT: time_az_float128( float128_round_to_int ); break;
     case FLOAT128_ADD: time_abz_float128( float128_add ); break;
     case FLOAT128_SUB: time_abz_float128( float128_sub ); break;
     case FLOAT128_MUL: time_abz_float128( float128_mul ); break;
     case FLOAT128_DIV: time_abz_float128( float128_div ); break;
     case FLOAT128_REM: time_abz_float128( float128_rem ); break;
     case FLOAT128_SQRT: time_az_float128_pos( float128_sqrt ); break;
     case FLOAT128_EQ: time_ab_float128_z_flag( float128_eq ); break;
     case FLOAT128_LE: time_ab_float128_z_flag( float128_le ); break;
     case FLOAT128_LT: time_ab_float128_z_flag( float128_lt ); break;
     case FLOAT128_EQ_SIGNALING: time_ab_float128_z_flag( float128_eq_signaling ); break;
     case FLOAT128_LE_QUIET: time_ab_float128_z_flag( float128_le_quiet ); break;
     case FLOAT128_LT_QUIET: time_ab_float128_z_flag( float128_lt_quiet ); break;
#endif
    }

}

/*
 * Times one function under every applicable combination of rounding
 * precision, rounding mode and tininess mode, calling timeFunctionVariety()
 * once per combination.
 *
 * For each of the three settings: if the function's row in functions[] has
 * the matching flag clear, the setting is passed as 0 and its loop runs once;
 * otherwise a non-zero `...In' argument pins the setting to that value, and a
 * zero `...In' argument lets the loop walk all values (precision 32, 64, 80;
 * rounding modes 1..NUM_ROUNDINGMODES-1; tininess modes
 * 1..NUM_TININESSMODES-1).  While the rounding precision is 32 or 64 the
 * tininessModeAtReducedPrecision flag is consulted instead of tininessMode.
 */
static void
 timeFunction(
     uint8 functionCode,
     int8 roundingPrecisionIn,
     int8 roundingModeIn,
     int8 tininessModeIn
 )
{
    int8 roundingPrecision, roundingMode, tininessMode;

    roundingPrecision = 32;
    for (;;) {
        if ( ! functions[ functionCode ].roundingPrecision ) {
            roundingPrecision = 0;
        }
        else if ( roundingPrecisionIn ) {
            roundingPrecision = roundingPrecisionIn;
        }
        for ( roundingMode = 1;
              roundingMode < NUM_ROUNDINGMODES;
              ++roundingMode
            ) {
            if ( ! functions[ functionCode ].roundingMode ) {
                roundingMode = 0;
            }
            else if ( roundingModeIn ) {
                roundingMode = roundingModeIn;
            }
            for ( tininessMode = 1;
                  tininessMode < NUM_TININESSMODES;
                  ++tininessMode
                ) {
                if (    ( roundingPrecision == 32 )
                     || ( roundingPrecision == 64 ) ) {
                    if ( ! functions[ functionCode ] .tininessModeAtReducedPrecision ) {
                        tininessMode = 0;
                    }
                    else if ( tininessModeIn ) {
                        tininessMode = tininessModeIn;
                    }
                }
                else {
                    if ( ! functions[ functionCode ].tininessMode ) {
                        tininessMode = 0;
                    }
                    else if ( tininessModeIn ) {
                        tininessMode = tininessModeIn;
                    }
                }
                timeFunctionVariety(
                    functionCode, roundingPrecision, roundingMode, tininessMode
                );
                /* A pinned or inapplicable setting is timed only once. */
                if ( tininessModeIn || ! tininessMode ) break;
            }
            if ( roundingModeIn || !
roundingMode ) break; } if ( roundingPrecisionIn || ! roundingPrecision ) break; if ( roundingPrecision == 80 ) { break; } else if ( roundingPrecision == 64 ) { roundingPrecision = 80; } else if ( roundingPrecision == 32 ) { roundingPrecision = 64; } } } main( int argc, char **argv ) { char *argPtr; flag functionArgument; uint8 functionCode; int8 operands, roundingPrecision, roundingMode, tininessMode; if ( argc <= 1 ) goto writeHelpMessage; functionArgument = FALSE; functionCode = 0; operands = 0; roundingPrecision = 0; roundingMode = 0; tininessMode = 0; --argc; ++argv; while ( argc && ( argPtr = argv[ 0 ] ) ) { if ( argPtr[ 0 ] == '-' ) ++argPtr; if ( strcmp( argPtr, "help" ) == 0 ) { writeHelpMessage: fputs( "timesoftfloat [<option>...] <function>\n" " <option>: (* is default)\n" " -help --Write this message and exit.\n" #ifdef FLOATX80 " -precision32 --Only time rounding precision equivalent to float32.\n" " -precision64 --Only time rounding precision equivalent to float64.\n" " -precision80 --Only time maximum rounding precision.\n" #endif " -nearesteven --Only time rounding to nearest/even.\n" " -tozero --Only time rounding to zero.\n" " -down --Only time rounding down.\n" " -up --Only time rounding up.\n" " -tininessbefore --Only time underflow tininess before rounding.\n" " -tininessafter --Only time underflow tininess after rounding.\n" " <function>:\n" " int32_to_<float> <float>_add <float>_eq\n" " <float>_to_int32 <float>_sub <float>_le\n" " <float>_to_int32_round_to_zero <float>_mul <float>_lt\n" " int64_to_<float> <float>_div <float>_eq_signaling\n" " <float>_to_int64 <float>_rem <float>_le_quiet\n" " <float>_to_int64_round_to_zero <float>_lt_quiet\n" " <float>_to_<float>\n" " <float>_round_to_int\n" " <float>_sqrt\n" " -all1 --All 1-operand functions.\n" " -all2 --All 2-operand functions.\n" " -all --All functions.\n" " <float>:\n" " float32 --Single precision.\n" " float64 --Double precision.\n" #ifdef FLOATX80 " floatx80 --Extended double 
precision.\n" #endif #ifdef FLOAT128 " float128 --Quadruple precision.\n" #endif , stdout ); return EXIT_SUCCESS; } #ifdef FLOATX80 else if ( strcmp( argPtr, "precision32" ) == 0 ) { roundingPrecision = 32; } else if ( strcmp( argPtr, "precision64" ) == 0 ) { roundingPrecision = 64; } else if ( strcmp( argPtr, "precision80" ) == 0 ) { roundingPrecision = 80; } #endif else if ( ( strcmp( argPtr, "nearesteven" ) == 0 ) || ( strcmp( argPtr, "nearest_even" ) == 0 ) ) { roundingMode = ROUND_NEAREST_EVEN; } else if ( ( strcmp( argPtr, "tozero" ) == 0 ) || ( strcmp( argPtr, "to_zero" ) == 0 ) ) { roundingMode = ROUND_TO_ZERO; } else if ( strcmp( argPtr, "down" ) == 0 ) { roundingMode = ROUND_DOWN; } else if ( strcmp( argPtr, "up" ) == 0 ) { roundingMode = ROUND_UP; } else if ( strcmp( argPtr, "tininessbefore" ) == 0 ) { tininessMode = TININESS_BEFORE_ROUNDING; } else if ( strcmp( argPtr, "tininessafter" ) == 0 ) { tininessMode = TININESS_AFTER_ROUNDING; } else if ( strcmp( argPtr, "all1" ) == 0 ) { functionArgument = TRUE; functionCode = 0; operands = 1; } else if ( strcmp( argPtr, "all2" ) == 0 ) { functionArgument = TRUE; functionCode = 0; operands = 2; } else if ( strcmp( argPtr, "all" ) == 0 ) { functionArgument = TRUE; functionCode = 0; operands = 0; } else { for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode ) { if ( strcmp( argPtr, functions[ functionCode ].name ) == 0 ) { break; } } if ( functionCode == NUM_FUNCTIONS ) { fail( "Invalid option or function `%s'", argv[ 0 ] ); } functionArgument = TRUE; } --argc; ++argv; } if ( ! 
functionArgument ) fail( "Function argument required" ); if ( functionCode ) { timeFunction( functionCode, roundingPrecision, roundingMode, tininessMode ); } else if ( operands == 1 ) { for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode ) { if ( functions[ functionCode ].numInputs == 1 ) { timeFunction( functionCode, roundingPrecision, roundingMode, tininessMode ); } } } else if ( operands == 2 ) { for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode ) { if ( functions[ functionCode ].numInputs == 2 ) { timeFunction( functionCode, roundingPrecision, roundingMode, tininessMode ); } } } else { for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode ) { timeFunction( functionCode, roundingPrecision, roundingMode, tininessMode ); } } return EXIT_SUCCESS; }