2fe8fb192f
There is important information about booting non-ack images in docs/UPDATING. ack/aout-format images can't be built any more, and booting clang/ELF-format ones is a little different. Updating to the new boot monitor is recommended. Changes in this commit: drop boot monitor -> allowing dropping ack support; facility to copy ELF boot files to /boot so that the old boot monitor can still boot fairly easily (see UPDATING); no more ack-format libraries -> single-case libraries; some cleanup of OBJECT_FMT, COMPILER_TYPE, etc. cases; drop several ack toolchain commands, but not all support commands (e.g. aal is gone but acksize is not yet); a few libc files moved to the netbsd libc dir; new /bin/date, as minix date used code in libc/; test compile fix; harmonize includes; /usr/lib is no longer special: without ack, /usr/lib plays no kind of special bootstrapping role any more and bootstrapping is done exclusively through packages, so releases depend even less on the state of the machine making them now; rename nbsd_lib* to lib*; reduce mtree.
2641 lines
81 KiB
C
2641 lines
81 KiB
C
/* $NetBSD: timesoftfloat.c,v 1.1 2000/06/06 08:15:11 bjh21 Exp $ */
|
|
|
|
/*
|
|
===============================================================================
|
|
|
|
This C source file is part of the SoftFloat IEC/IEEE Floating-point
|
|
Arithmetic Package, Release 2a.
|
|
|
|
Written by John R. Hauser. This work was made possible in part by the
|
|
International Computer Science Institute, located at Suite 600, 1947 Center
|
|
Street, Berkeley, California 94704. Funding was partially provided by the
|
|
National Science Foundation under grant MIP-9311980. The original version
|
|
of this code was written as part of a project to build a fixed-point vector
|
|
processor in collaboration with the University of California at Berkeley,
|
|
overseen by Profs. Nelson Morgan and John Wawrzynek. More information
|
|
is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/
|
|
arithmetic/SoftFloat.html'.
|
|
|
|
THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE. Although reasonable effort
|
|
has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT
|
|
TIMES RESULT IN INCORRECT BEHAVIOR. USE OF THIS SOFTWARE IS RESTRICTED TO
|
|
PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY
|
|
AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE.
|
|
|
|
Derivative works are acceptable, even for commercial purposes, so long as
|
|
(1) they include prominent notice that the work is derivative, and (2) they
|
|
include prominent notice akin to these four paragraphs for those parts of
|
|
this code that are retained.
|
|
|
|
===============================================================================
|
|
*/
|
|
|
|
#include <sys/cdefs.h>
|
|
#if defined(LIBC_SCCS) && !defined(lint)
|
|
__RCSID("$NetBSD: timesoftfloat.c,v 1.1 2000/06/06 08:15:11 bjh21 Exp $");
|
|
#endif /* LIBC_SCCS and not lint */
|
|
|
|
#include <stdlib.h>
|
|
#include <stdarg.h>
|
|
#include <string.h>
|
|
#include <stdio.h>
|
|
#include <time.h>
|
|
#include "milieu.h"
|
|
#include "softfloat.h"
|
|
|
|
/* Number of calls made per batch between clock() checks while calibrating. */
enum { minIterations = 1000 };
|
|
|
|
/*
 * Print "timesoftfloat: ", the printf-style formatted message and a trailing
 * ".\n" to stderr, then terminate the program with EXIT_FAILURE.
 */
static void fail( const char *message, ... )
{
    va_list ap;

    va_start( ap, message );
    fputs( "timesoftfloat: ", stderr );
    vfprintf( stderr, message, ap );
    fputs( ".\n", stderr );
    va_end( ap );
    exit( EXIT_FAILURE );
}
|
|
|
|
/* Routine name printed by reportTime() on every result line. */
static char *functionName;
/* Optional labels appended by reportTime(); a null pointer means "omit". */
static char *roundingPrecisionName;
static char *roundingModeName;
static char *tininessModeName;
|
|
|
|
/*
 * Print one result line on stdout: the rate in thousands of calls per second
 * (`count' calls over `clocks' clock() ticks), followed by functionName.
 * When roundingModeName is set, the rounding mode is appended, preceded by
 * the rounding precision and followed by the tininess mode if those labels
 * are set as well.
 */
static void reportTime( int32 count, long clocks )
{
    const int haveMode = ( roundingModeName != NULL );

    printf(
        "%8.1f kops/s: %s",
        ( count / ( ( (float) clocks ) / CLOCKS_PER_SEC ) ) / 1000,
        functionName
    );
    /* Precision and tininess are only reported alongside a rounding mode. */
    if ( haveMode && roundingPrecisionName != NULL ) {
        fputs( ", precision ", stdout );
        fputs( roundingPrecisionName, stdout );
    }
    if ( haveMode ) {
        fputs( ", rounding ", stdout );
        fputs( roundingModeName, stdout );
    }
    if ( haveMode && tininessModeName != NULL ) {
        fputs( ", tininess ", stdout );
        fputs( tininessModeName, stdout );
        fputs( " rounding", stdout );
    }
    fputc( '\n', stdout );
}
|
|
|
|
/* Entry count of inputs_int32; the timing loops use (count - 1) as an index mask. */
enum { numInputs_int32 = 32 };
|
|
|
|
/* Fixed int32 operands cycled through by the int32 timing loops. */
static const int32 inputs_int32[ numInputs_int32 ] = {
    /*  0 */ 0xFFFFBB79, 0x405CF80F,
    /*  2 */ 0x00000000, 0xFFFFFD04,
    /*  4 */ 0xFFF20002, 0x0C8EF795,
    /*  6 */ 0xF00011FF, 0x000006CA,
    /*  8 */ 0x00009BFE, 0xFF4862E3,
    /* 10 */ 0x9FFFEFFE, 0xFFFFFFB7,
    /* 12 */ 0x0BFF7FFF, 0x0000F37A,
    /* 14 */ 0x0011DFFE, 0x00000006,
    /* 16 */ 0xFFF02006, 0xFFFFF7D1,
    /* 18 */ 0x10200003, 0xDE8DF765,
    /* 20 */ 0x00003E02, 0x000019E8,
    /* 22 */ 0x0008FFFE, 0xFFFFFB5C,
    /* 24 */ 0xFFDF7FFE, 0x07C42FBF,
    /* 26 */ 0x0FFFE3FF, 0x040B9F13,
    /* 28 */ 0xBFFFFFF8, 0x0001BF56,
    /* 30 */ 0x000017F6, 0x000A908A
};
|
|
|
|
/*
 * Time a routine mapping int32 to float32.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int32_z_float32( float32 function( int32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine mapping int32 to float64.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int32_z_float64( float64 function( int32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#ifdef FLOATX80
|
|
|
|
/*
 * Time a routine mapping int32 to floatx80.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int32_z_floatx80( floatx80 function( int32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
#ifdef FLOAT128
|
|
|
|
/*
 * Time a routine mapping int32 to float128.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int32_z_float128( float128 function( int32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
/* Entry count of inputs_int64; the timing loops use (count - 1) as an index mask. */
enum { numInputs_int64 = 32 };
|
|
|
|
/* Fixed int64 operands cycled through by the int64 timing loops. */
static const int64 inputs_int64[ numInputs_int64 ] = {
    /*  0 */ LIT64( 0xFBFFC3FFFFFFFFFF ), LIT64( 0x0000000003C589BC ),
    /*  2 */ LIT64( 0x00000000400013FE ), LIT64( 0x0000000000186171 ),
    /*  4 */ LIT64( 0xFFFFFFFFFFFEFBFA ), LIT64( 0xFFFFFD79E6DFFC73 ),
    /*  6 */ LIT64( 0x0000000010001DFF ), LIT64( 0xDD1A0F0C78513710 ),
    /*  8 */ LIT64( 0xFFFF83FFFFFEFFFE ), LIT64( 0x00756EBD1AD0C1C7 ),
    /* 10 */ LIT64( 0x0003FDFFFFFFFFBE ), LIT64( 0x0007D0FB2C2CA951 ),
    /* 12 */ LIT64( 0x0007FC0007FFFFFE ), LIT64( 0x0000001F942B18BB ),
    /* 14 */ LIT64( 0x0000080101FFFFFE ), LIT64( 0xFFFFFFFFFFFF0978 ),
    /* 16 */ LIT64( 0x000000000008BFFF ), LIT64( 0x0000000006F5AF08 ),
    /* 18 */ LIT64( 0xFFDEFF7FFFFFFFFE ), LIT64( 0x0000000000000003 ),
    /* 20 */ LIT64( 0x3FFFFFFFFF80007D ), LIT64( 0x0000000000000078 ),
    /* 22 */ LIT64( 0xFFF80000007FDFFD ), LIT64( 0x1BBC775B78016AB0 ),
    /* 24 */ LIT64( 0xFFF9001FFFFFFFFE ), LIT64( 0xFFFD4767AB98E43F ),
    /* 26 */ LIT64( 0xFFFFFEFFFE00001E ), LIT64( 0xFFFFFFFFFFF04EFD ),
    /* 28 */ LIT64( 0x07FFFFFFFFFFF7FF ), LIT64( 0xFFFC9EAA38F89050 ),
    /* 30 */ LIT64( 0x00000020FBFFFFFE ), LIT64( 0x0000099AE6455357 )
};
|
|
|
|
/*
 * Time a routine mapping int64 to float32.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int64_z_float32( float32 function( int64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine mapping int64 to float64.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int64_z_float64( float64 function( int64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#ifdef FLOATX80
|
|
|
|
/*
 * Time a routine mapping int64 to floatx80.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int64_z_floatx80( floatx80 function( int64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
#ifdef FLOAT128
|
|
|
|
/*
 * Time a routine mapping int64 to float128.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_int64_z_float128( float128 function( int64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_int64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_int64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_int64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
/* Entry count of the float32 input tables; (count - 1) serves as an index mask. */
enum { numInputs_float32 = 32 };
|
|
|
|
/* Fixed float32 operands, given as raw bit patterns, for the float32 timing loops. */
static const float32 inputs_float32[ numInputs_float32 ] = {
    /*  0 */ 0x4EFA0000, 0xC1D0B328,
    /*  2 */ 0x80000000, 0x3E69A31E,
    /*  4 */ 0xAF803EFF, 0x3F800000,
    /*  6 */ 0x17BF8000, 0xE74A301A,
    /*  8 */ 0x4E010003, 0x7EE3C75D,
    /* 10 */ 0xBD803FE0, 0xBFFEFF00,
    /* 12 */ 0x7981F800, 0x431FFFFC,
    /* 14 */ 0xC100C000, 0x3D87EFFF,
    /* 16 */ 0x4103FEFE, 0xBC000007,
    /* 18 */ 0xBF01F7FF, 0x4E6C6B5C,
    /* 20 */ 0xC187FFFE, 0xC58B9F13,
    /* 22 */ 0x4F88007F, 0xDF004007,
    /* 24 */ 0xB7FFD7FE, 0x7E8001FB,
    /* 26 */ 0x46EFFBFF, 0x31C10000,
    /* 28 */ 0xDB428661, 0x33F89B1F,
    /* 30 */ 0xA3BFEFFF, 0x537BFFBE
};
|
|
|
|
/*
 * Time a routine mapping float32 to int32.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float32_z_int32( int32 function( float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine mapping float32 to int64.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float32_z_int64( int64 function( float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine mapping float32 to float64.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float32_z_float64( float64 function( float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#ifdef FLOATX80
|
|
|
|
/*
 * Time a routine mapping float32 to floatx80.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float32_z_floatx80( floatx80 function( float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
#ifdef FLOAT128
|
|
|
|
/*
 * Time a routine mapping float32 to float128.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float32_z_float128( float128 function( float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
/*
 * Time a one-operand routine mapping float32 to float32.  Batches of
 * minIterations calls are repeated until clock() has advanced by at least
 * CLOCKS_PER_SEC; the same number of calls is then replayed from the first
 * table entry and the elapsed ticks are handed to reportTime().
 */
static void time_az_float32( float32 function( float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine taking two float32 operands and returning a flag.  Batches
 * of minIterations calls are repeated until clock() has advanced by at least
 * CLOCKS_PER_SEC; the same number of calls is then replayed from the start
 * of the table and the elapsed ticks are handed to reportTime().
 */
static void time_ab_float32_z_flag( flag function( float32, float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slotA, slotB;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slotA = 0;
    slotB = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slotA ], inputs_float32[ slotB ] );
            slotA = ( slotA + 1 ) & ( numInputs_float32 - 1 );
            /* B steps by one per call, plus one extra whenever A wraps. */
            slotB += ( slotA == 0 ) ? 2 : 1;
            slotB &= numInputs_float32 - 1;
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slotA = 0;
    slotB = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slotA ], inputs_float32[ slotB ] );
        slotA = ( slotA + 1 ) & ( numInputs_float32 - 1 );
        slotB += ( slotA == 0 ) ? 2 : 1;
        slotB &= numInputs_float32 - 1;
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine taking two float32 operands and returning a float32.
 * Batches of minIterations calls are repeated until clock() has advanced by
 * at least CLOCKS_PER_SEC; the same number of calls is then replayed from
 * the start of the table and the elapsed ticks are handed to reportTime().
 */
static void time_abz_float32( float32 function( float32, float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slotA, slotB;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slotA = 0;
    slotB = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32[ slotA ], inputs_float32[ slotB ] );
            slotA = ( slotA + 1 ) & ( numInputs_float32 - 1 );
            /* B steps by one per call, plus one extra whenever A wraps. */
            slotB += ( slotA == 0 ) ? 2 : 1;
            slotB &= numInputs_float32 - 1;
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slotA = 0;
    slotB = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32[ slotA ], inputs_float32[ slotB ] );
        slotA = ( slotA + 1 ) & ( numInputs_float32 - 1 );
        slotB += ( slotA == 0 ) ? 2 : 1;
        slotB &= numInputs_float32 - 1;
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * The inputs_float32 bit patterns with the top (sign) bit cleared, used by
 * time_az_float32_pos().
 */
static const float32 inputs_float32_pos[ numInputs_float32 ] = {
    /*  0 */ 0x4EFA0000, 0x41D0B328,
    /*  2 */ 0x00000000, 0x3E69A31E,
    /*  4 */ 0x2F803EFF, 0x3F800000,
    /*  6 */ 0x17BF8000, 0x674A301A,
    /*  8 */ 0x4E010003, 0x7EE3C75D,
    /* 10 */ 0x3D803FE0, 0x3FFEFF00,
    /* 12 */ 0x7981F800, 0x431FFFFC,
    /* 14 */ 0x4100C000, 0x3D87EFFF,
    /* 16 */ 0x4103FEFE, 0x3C000007,
    /* 18 */ 0x3F01F7FF, 0x4E6C6B5C,
    /* 20 */ 0x4187FFFE, 0x458B9F13,
    /* 22 */ 0x4F88007F, 0x5F004007,
    /* 24 */ 0x37FFD7FE, 0x7E8001FB,
    /* 26 */ 0x46EFFBFF, 0x31C10000,
    /* 28 */ 0x5B428661, 0x33F89B1F,
    /* 30 */ 0x23BFEFFF, 0x537BFFBE
};
|
|
|
|
/*
 * Time a one-operand float32 routine using the inputs_float32_pos table.
 * Batches of minIterations calls are repeated until clock() has advanced by
 * at least CLOCKS_PER_SEC; the same number of calls is then replayed from
 * the first table entry and the elapsed ticks are handed to reportTime().
 */
static void time_az_float32_pos( float32 function( float32 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float32_pos[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float32_pos[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float32 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/* Entry count of the float64 input tables; (count - 1) serves as an index mask. */
enum { numInputs_float64 = 32 };
|
|
|
|
/* Fixed float64 operands, given as raw bit patterns, for the float64 timing loops. */
static const float64 inputs_float64[ numInputs_float64 ] = {
    /*  0 */ LIT64( 0x422FFFC008000000 ), LIT64( 0xB7E0000480000000 ),
    /*  2 */ LIT64( 0xF3FD2546120B7935 ), LIT64( 0x3FF0000000000000 ),
    /*  4 */ LIT64( 0xCE07F766F09588D6 ), LIT64( 0x8000000000000000 ),
    /*  6 */ LIT64( 0x3FCE000400000000 ), LIT64( 0x8313B60F0032BED8 ),
    /*  8 */ LIT64( 0xC1EFFFFFC0002000 ), LIT64( 0x3FB3C75D224F2B0F ),
    /* 10 */ LIT64( 0x7FD00000004000FF ), LIT64( 0xA12FFF8000001FFF ),
    /* 12 */ LIT64( 0x3EE0000000FE0000 ), LIT64( 0x0010000080000004 ),
    /* 14 */ LIT64( 0x41CFFFFE00000020 ), LIT64( 0x40303FFFFFFFFFFD ),
    /* 16 */ LIT64( 0x3FD000003FEFFFFF ), LIT64( 0xBFD0000010000000 ),
    /* 18 */ LIT64( 0xB7FC6B5C16CA55CF ), LIT64( 0x413EEB940B9D1301 ),
    /* 20 */ LIT64( 0xC7E00200001FFFFF ), LIT64( 0x47F00021FFFFFFFE ),
    /* 22 */ LIT64( 0xBFFFFFFFF80000FF ), LIT64( 0xC07FFFFFE00FFFFF ),
    /* 24 */ LIT64( 0x001497A63740C5E8 ), LIT64( 0xC4BFFFE0001FFFFF ),
    /* 26 */ LIT64( 0x96FFDFFEFFFFFFFF ), LIT64( 0x403FC000000001FE ),
    /* 28 */ LIT64( 0xFFD00000000001F6 ), LIT64( 0x0640400002000000 ),
    /* 30 */ LIT64( 0x479CEE1E4F789FE0 ), LIT64( 0xC237FFFFFFFFFDFE )
};
|
|
|
|
/*
 * Time a routine mapping float64 to int32.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float64_z_int32( int32 function( float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine mapping float64 to int64.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float64_z_int64( int64 function( float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine mapping float64 to float32.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float64_z_float32( float32 function( float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#ifdef FLOATX80
|
|
|
|
/*
 * Time a routine mapping float64 to floatx80.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float64_z_floatx80( floatx80 function( float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
#ifdef FLOAT128
|
|
|
|
/*
 * Time a routine mapping float64 to float128.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_float64_z_float128( float128 function( float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#endif
|
|
|
|
/*
 * Time a one-operand routine mapping float64 to float64.  Batches of
 * minIterations calls are repeated until clock() has advanced by at least
 * CLOCKS_PER_SEC; the same number of calls is then replayed from the first
 * table entry and the elapsed ticks are handed to reportTime().
 */
static void time_az_float64( float64 function( float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine taking two float64 operands and returning a flag.  Batches
 * of minIterations calls are repeated until clock() has advanced by at least
 * CLOCKS_PER_SEC; the same number of calls is then replayed from the start
 * of the table and the elapsed ticks are handed to reportTime().
 */
static void time_ab_float64_z_flag( flag function( float64, float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slotA, slotB;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slotA = 0;
    slotB = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slotA ], inputs_float64[ slotB ] );
            slotA = ( slotA + 1 ) & ( numInputs_float64 - 1 );
            /* B steps by one per call, plus one extra whenever A wraps. */
            slotB += ( slotA == 0 ) ? 2 : 1;
            slotB &= numInputs_float64 - 1;
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slotA = 0;
    slotB = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slotA ], inputs_float64[ slotB ] );
        slotA = ( slotA + 1 ) & ( numInputs_float64 - 1 );
        slotB += ( slotA == 0 ) ? 2 : 1;
        slotB &= numInputs_float64 - 1;
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Time a routine taking two float64 operands and returning a float64.
 * Batches of minIterations calls are repeated until clock() has advanced by
 * at least CLOCKS_PER_SEC; the same number of calls is then replayed from
 * the start of the table and the elapsed ticks are handed to reportTime().
 */
static void time_abz_float64( float64 function( float64, float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slotA, slotB;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slotA = 0;
    slotB = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64[ slotA ], inputs_float64[ slotB ] );
            slotA = ( slotA + 1 ) & ( numInputs_float64 - 1 );
            /* B steps by one per call, plus one extra whenever A wraps. */
            slotB += ( slotA == 0 ) ? 2 : 1;
            slotB &= numInputs_float64 - 1;
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slotA = 0;
    slotB = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64[ slotA ], inputs_float64[ slotB ] );
        slotA = ( slotA + 1 ) & ( numInputs_float64 - 1 );
        slotB += ( slotA == 0 ) ? 2 : 1;
        slotB &= numInputs_float64 - 1;
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * The inputs_float64 bit patterns with the top (sign) bit cleared, used by
 * time_az_float64_pos().
 */
static const float64 inputs_float64_pos[ numInputs_float64 ] = {
    /*  0 */ LIT64( 0x422FFFC008000000 ), LIT64( 0x37E0000480000000 ),
    /*  2 */ LIT64( 0x73FD2546120B7935 ), LIT64( 0x3FF0000000000000 ),
    /*  4 */ LIT64( 0x4E07F766F09588D6 ), LIT64( 0x0000000000000000 ),
    /*  6 */ LIT64( 0x3FCE000400000000 ), LIT64( 0x0313B60F0032BED8 ),
    /*  8 */ LIT64( 0x41EFFFFFC0002000 ), LIT64( 0x3FB3C75D224F2B0F ),
    /* 10 */ LIT64( 0x7FD00000004000FF ), LIT64( 0x212FFF8000001FFF ),
    /* 12 */ LIT64( 0x3EE0000000FE0000 ), LIT64( 0x0010000080000004 ),
    /* 14 */ LIT64( 0x41CFFFFE00000020 ), LIT64( 0x40303FFFFFFFFFFD ),
    /* 16 */ LIT64( 0x3FD000003FEFFFFF ), LIT64( 0x3FD0000010000000 ),
    /* 18 */ LIT64( 0x37FC6B5C16CA55CF ), LIT64( 0x413EEB940B9D1301 ),
    /* 20 */ LIT64( 0x47E00200001FFFFF ), LIT64( 0x47F00021FFFFFFFE ),
    /* 22 */ LIT64( 0x3FFFFFFFF80000FF ), LIT64( 0x407FFFFFE00FFFFF ),
    /* 24 */ LIT64( 0x001497A63740C5E8 ), LIT64( 0x44BFFFE0001FFFFF ),
    /* 26 */ LIT64( 0x16FFDFFEFFFFFFFF ), LIT64( 0x403FC000000001FE ),
    /* 28 */ LIT64( 0x7FD00000000001F6 ), LIT64( 0x0640400002000000 ),
    /* 30 */ LIT64( 0x479CEE1E4F789FE0 ), LIT64( 0x4237FFFFFFFFFDFE )
};
|
|
|
|
/*
 * Time a one-operand float64 routine using the inputs_float64_pos table.
 * Batches of minIterations calls are repeated until clock() has advanced by
 * at least CLOCKS_PER_SEC; the same number of calls is then replayed from
 * the first table entry and the elapsed ticks are handed to reportTime().
 */
static void time_az_float64_pos( float64 function( float64 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            function( inputs_float64_pos[ slot ] );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        function( inputs_float64_pos[ slot ] );
        slot = ( slot + 1 ) & ( numInputs_float64 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
#ifdef FLOATX80
|
|
|
|
/* Entry count of inputs_floatx80; the timing loops use (count - 1) as an index mask. */
enum { numInputs_floatx80 = 32 };
|
|
|
|
static const struct {
|
|
bits16 high;
|
|
bits64 low;
|
|
} inputs_floatx80[ numInputs_floatx80 ] = {
|
|
{ 0xC03F, LIT64( 0xA9BE15A19C1E8B62 ) },
|
|
{ 0x8000, LIT64( 0x0000000000000000 ) },
|
|
{ 0x75A8, LIT64( 0xE59591E4788957A5 ) },
|
|
{ 0xBFFF, LIT64( 0xFFF0000000000040 ) },
|
|
{ 0x0CD8, LIT64( 0xFC000000000007FE ) },
|
|
{ 0x43BA, LIT64( 0x99A4000000000000 ) },
|
|
{ 0x3FFF, LIT64( 0x8000000000000000 ) },
|
|
{ 0x4081, LIT64( 0x94FBF1BCEB5545F0 ) },
|
|
{ 0x403E, LIT64( 0xFFF0000000002000 ) },
|
|
{ 0x3FFE, LIT64( 0xC860E3C75D224F28 ) },
|
|
{ 0x407E, LIT64( 0xFC00000FFFFFFFFE ) },
|
|
{ 0x737A, LIT64( 0x800000007FFDFFFE ) },
|
|
{ 0x4044, LIT64( 0xFFFFFF80000FFFFF ) },
|
|
{ 0xBBFE, LIT64( 0x8000040000001FFE ) },
|
|
{ 0xC002, LIT64( 0xFF80000000000020 ) },
|
|
{ 0xDE8D, LIT64( 0xFFFFFFFFFFE00004 ) },
|
|
{ 0xC004, LIT64( 0x8000000000003FFB ) },
|
|
{ 0x407F, LIT64( 0x800000000003FFFE ) },
|
|
{ 0xC000, LIT64( 0xA459EE6A5C16CA55 ) },
|
|
{ 0x8003, LIT64( 0xC42CBF7399AEEB94 ) },
|
|
{ 0xBF7F, LIT64( 0xF800000000000006 ) },
|
|
{ 0xC07F, LIT64( 0xBF56BE8871F28FEA ) },
|
|
{ 0xC07E, LIT64( 0xFFFF77FFFFFFFFFE ) },
|
|
{ 0xADC9, LIT64( 0x8000000FFFFFFFDE ) },
|
|
{ 0xC001, LIT64( 0xEFF7FFFFFFFFFFFF ) },
|
|
{ 0x4001, LIT64( 0xBE84F30125C497A6 ) },
|
|
{ 0xC06B, LIT64( 0xEFFFFFFFFFFFFFFF ) },
|
|
{ 0x4080, LIT64( 0xFFFFFFFFBFFFFFFF ) },
|
|
{ 0x87E9, LIT64( 0x81FFFFFFFFFFFBFF ) },
|
|
{ 0xA63F, LIT64( 0x801FFFFFFEFFFFFE ) },
|
|
{ 0x403C, LIT64( 0x801FFFFFFFF7FFFF ) },
|
|
{ 0x4018, LIT64( 0x8000000000080003 ) }
|
|
};
|
|
|
|
/*
 * Time a routine mapping floatx80 to int32.  Each call's operand is built
 * from the matching inputs_floatx80 entry.  Batches of minIterations calls
 * are repeated until clock() has advanced by at least CLOCKS_PER_SEC; the
 * same number of calls is then replayed from the first table entry and the
 * elapsed ticks are handed to reportTime().
 */
static void time_a_floatx80_z_int32( int32 function( floatx80 ) )
{
    clock_t began, finished;
    int32 total, remaining;
    int8 slot;
    floatx80 operand;

    /* Calibration pass: count how many calls fill the interval. */
    total = 0;
    slot = 0;
    began = clock();
    do {
        remaining = minIterations;
        while ( remaining ) {
            operand.high = inputs_floatx80[ slot ].high;
            operand.low = inputs_floatx80[ slot ].low;
            function( operand );
            /* Mask wraps the index back to 0 after the last entry. */
            slot = ( slot + 1 ) & ( numInputs_floatx80 - 1 );
            --remaining;
        }
        total += minIterations;
    } while ( clock() - began < CLOCKS_PER_SEC );

    /* Timed pass over the calibrated number of calls. */
    slot = 0;
    began = clock();
    remaining = total;
    while ( remaining ) {
        operand.high = inputs_floatx80[ slot ].high;
        operand.low = inputs_floatx80[ slot ].low;
        function( operand );
        slot = ( slot + 1 ) & ( numInputs_floatx80 - 1 );
        --remaining;
    }
    finished = clock();
    reportTime( total, finished - began );
}
|
|
|
|
/*
 * Times `function', a routine that takes one floatx80 operand and returns
 * an int64.  Operands are taken in rotation from the inputs_floatx80 table.
 *
 * The first loop is a calibration pass: it runs batches of minIterations
 * calls until clock() shows at least CLOCKS_PER_SEC ticks elapsed, summing
 * the calls into `count'.  The second loop then performs exactly `count'
 * calls, and `count' plus the elapsed ticks are handed to reportTime.
 */
static void time_a_floatx80_z_int64( int64 function( floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    floatx80 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80[ inputNum ].low;
            a.high = inputs_floatx80[ inputNum ].high;
            function( a );
            /* Step to the next entry; the mask wraps the index provided
               numInputs_floatx80 is a power of two. */
            inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Timed pass starts again from the first table entry. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80[ inputNum ].low;
        a.high = inputs_floatx80[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes one floatx80 operand and returns
 * a float32.  Operands are taken in rotation from the inputs_floatx80 table.
 *
 * A calibration pass runs batches of minIterations calls until clock() has
 * advanced by at least CLOCKS_PER_SEC and records the number of calls in
 * `count'.  A timed pass then makes exactly `count' calls; `count' and the
 * elapsed clock() ticks are passed to reportTime.
 */
static void time_a_floatx80_z_float32( float32 function( floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    floatx80 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80[ inputNum ].low;
            a.high = inputs_floatx80[ inputNum ].high;
            function( a );
            /* Wrap-around by masking; correct only for a power-of-two
               numInputs_floatx80. */
            inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind the input index before the timed pass. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80[ inputNum ].low;
        a.high = inputs_floatx80[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes one floatx80 operand and returns
 * a float64.  Operands are taken in rotation from the inputs_floatx80 table.
 *
 * Calibration pass: repeat batches of minIterations calls until at least
 * CLOCKS_PER_SEC clock() ticks have elapsed, accumulating the call total in
 * `count'.  Timed pass: make exactly `count' calls and pass `count' and the
 * elapsed ticks to reportTime.
 */
static void time_a_floatx80_z_float64( float64 function( floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    floatx80 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80[ inputNum ].low;
            a.high = inputs_floatx80[ inputNum ].high;
            function( a );
            /* Masking wraps the index when numInputs_floatx80 is a power
               of two. */
            inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Begin the timed pass from the first table entry. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80[ inputNum ].low;
        a.high = inputs_floatx80[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
#ifdef FLOAT128

/*
 * Times `function', a routine that takes one floatx80 operand and returns
 * a float128.  Only compiled when FLOAT128 is defined.  Operands are taken
 * in rotation from the inputs_floatx80 table.
 *
 * A calibration pass runs batches of minIterations calls until clock() has
 * advanced by at least CLOCKS_PER_SEC, counting the calls in `count'.  The
 * timed pass repeats exactly `count' calls and passes `count' and the
 * elapsed clock() ticks to reportTime.
 */
static void time_a_floatx80_z_float128( float128 function( floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    floatx80 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80[ inputNum ].low;
            a.high = inputs_floatx80[ inputNum ].high;
            function( a );
            /* The mask wraps the index only if numInputs_floatx80 is a
               power of two. */
            inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Timed pass replays the inputs from the beginning. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80[ inputNum ].low;
        a.high = inputs_floatx80[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}

#endif
|
|
|
|
/*
 * Times `function', a routine that maps one floatx80 operand to a floatx80
 * result.  Operands are taken in rotation from the inputs_floatx80 table.
 *
 * The calibration pass runs batches of minIterations calls until clock()
 * has advanced by at least CLOCKS_PER_SEC and sums the calls in `count'.
 * The timed pass then makes exactly `count' calls, after which `count' and
 * the elapsed clock() ticks are passed to reportTime.
 */
static void time_az_floatx80( floatx80 function( floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    floatx80 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80[ inputNum ].low;
            a.high = inputs_floatx80[ inputNum ].high;
            function( a );
            /* Masking wraps the index when numInputs_floatx80 is a power
               of two. */
            inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind to the first input for the timed pass. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80[ inputNum ].low;
        a.high = inputs_floatx80[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes two floatx80 operands and returns
 * a flag.  Both operands come from the inputs_floatx80 table, addressed by
 * two independent indices.
 *
 * The calibration pass runs batches of minIterations calls until clock()
 * has advanced by at least CLOCKS_PER_SEC and sums the calls in `count'.
 * The timed pass then makes exactly `count' calls starting again from
 * index 0 for both operands; `count' and the elapsed clock() ticks are
 * passed to reportTime.
 */
static void time_ab_floatx80_z_flag( flag function( floatx80, floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNumA, inputNumB;
    floatx80 a, b;

    count = 0;
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80[ inputNumA ].low;
            a.high = inputs_floatx80[ inputNumA ].high;
            b.low = inputs_floatx80[ inputNumB ].low;
            b.high = inputs_floatx80[ inputNumB ].high;
            function( a, b );
            /* Both indices advance on every call.  Whenever index A wraps
               back to 0, index B is bumped one extra step, so each sweep
               of the table pairs `a' with a different `b'.  The masks wrap
               correctly only if numInputs_floatx80 is a power of two. */
            inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 );
            if ( inputNumA == 0 ) ++inputNumB;
            inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind both indices so the timed pass replays the same pairs. */
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80[ inputNumA ].low;
        a.high = inputs_floatx80[ inputNumA ].high;
        b.low = inputs_floatx80[ inputNumB ].low;
        b.high = inputs_floatx80[ inputNumB ].high;
        function( a, b );
        inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 );
        if ( inputNumA == 0 ) ++inputNumB;
        inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes two floatx80 operands and returns
 * a floatx80.  Both operands come from the inputs_floatx80 table, addressed
 * by two independent indices.
 *
 * Calibration pass: batches of minIterations calls run until clock() has
 * advanced by at least CLOCKS_PER_SEC; the calls are summed in `count'.
 * Timed pass: exactly `count' calls are made with both indices reset to 0,
 * then `count' and the elapsed clock() ticks are passed to reportTime.
 */
static void time_abz_floatx80( floatx80 function( floatx80, floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNumA, inputNumB;
    floatx80 a, b;

    count = 0;
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80[ inputNumA ].low;
            a.high = inputs_floatx80[ inputNumA ].high;
            b.low = inputs_floatx80[ inputNumB ].low;
            b.high = inputs_floatx80[ inputNumB ].high;
            function( a, b );
            /* Index B steps once per call plus once more each time index
               A wraps to 0, which shifts the a/b pairing on every sweep
               of the table.  The masks assume a power-of-two
               numInputs_floatx80. */
            inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 );
            if ( inputNumA == 0 ) ++inputNumB;
            inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Start the timed pass from the first pair again. */
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80[ inputNumA ].low;
        a.high = inputs_floatx80[ inputNumA ].high;
        b.low = inputs_floatx80[ inputNumB ].low;
        b.high = inputs_floatx80[ inputNumB ].high;
        function( a, b );
        inputNumA = ( inputNumA + 1 ) & ( numInputs_floatx80 - 1 );
        if ( inputNumA == 0 ) ++inputNumB;
        inputNumB = ( inputNumB + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
static const struct {
|
|
bits16 high;
|
|
bits64 low;
|
|
} inputs_floatx80_pos[ numInputs_floatx80 ] = {
|
|
{ 0x403F, LIT64( 0xA9BE15A19C1E8B62 ) },
|
|
{ 0x0000, LIT64( 0x0000000000000000 ) },
|
|
{ 0x75A8, LIT64( 0xE59591E4788957A5 ) },
|
|
{ 0x3FFF, LIT64( 0xFFF0000000000040 ) },
|
|
{ 0x0CD8, LIT64( 0xFC000000000007FE ) },
|
|
{ 0x43BA, LIT64( 0x99A4000000000000 ) },
|
|
{ 0x3FFF, LIT64( 0x8000000000000000 ) },
|
|
{ 0x4081, LIT64( 0x94FBF1BCEB5545F0 ) },
|
|
{ 0x403E, LIT64( 0xFFF0000000002000 ) },
|
|
{ 0x3FFE, LIT64( 0xC860E3C75D224F28 ) },
|
|
{ 0x407E, LIT64( 0xFC00000FFFFFFFFE ) },
|
|
{ 0x737A, LIT64( 0x800000007FFDFFFE ) },
|
|
{ 0x4044, LIT64( 0xFFFFFF80000FFFFF ) },
|
|
{ 0x3BFE, LIT64( 0x8000040000001FFE ) },
|
|
{ 0x4002, LIT64( 0xFF80000000000020 ) },
|
|
{ 0x5E8D, LIT64( 0xFFFFFFFFFFE00004 ) },
|
|
{ 0x4004, LIT64( 0x8000000000003FFB ) },
|
|
{ 0x407F, LIT64( 0x800000000003FFFE ) },
|
|
{ 0x4000, LIT64( 0xA459EE6A5C16CA55 ) },
|
|
{ 0x0003, LIT64( 0xC42CBF7399AEEB94 ) },
|
|
{ 0x3F7F, LIT64( 0xF800000000000006 ) },
|
|
{ 0x407F, LIT64( 0xBF56BE8871F28FEA ) },
|
|
{ 0x407E, LIT64( 0xFFFF77FFFFFFFFFE ) },
|
|
{ 0x2DC9, LIT64( 0x8000000FFFFFFFDE ) },
|
|
{ 0x4001, LIT64( 0xEFF7FFFFFFFFFFFF ) },
|
|
{ 0x4001, LIT64( 0xBE84F30125C497A6 ) },
|
|
{ 0x406B, LIT64( 0xEFFFFFFFFFFFFFFF ) },
|
|
{ 0x4080, LIT64( 0xFFFFFFFFBFFFFFFF ) },
|
|
{ 0x07E9, LIT64( 0x81FFFFFFFFFFFBFF ) },
|
|
{ 0x263F, LIT64( 0x801FFFFFFEFFFFFE ) },
|
|
{ 0x403C, LIT64( 0x801FFFFFFFF7FFFF ) },
|
|
{ 0x4018, LIT64( 0x8000000000080003 ) }
|
|
};
|
|
|
|
/*
 * Times `function', a routine that maps one floatx80 operand to a floatx80
 * result, using operands from the inputs_floatx80_pos table (whose entries
 * all have the sign bit clear) instead of inputs_floatx80.
 * NOTE(review): presumably intended for routines that should only be timed
 * on non-negative operands (e.g. square root) -- confirm at the call site.
 *
 * A calibration pass runs batches of minIterations calls until clock() has
 * advanced by at least CLOCKS_PER_SEC, counting the calls in `count'.  The
 * timed pass repeats exactly `count' calls and passes `count' and the
 * elapsed clock() ticks to reportTime.
 */
static void time_az_floatx80_pos( floatx80 function( floatx80 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    floatx80 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_floatx80_pos[ inputNum ].low;
            a.high = inputs_floatx80_pos[ inputNum ].high;
            function( a );
            /* The mask wraps the index only if numInputs_floatx80 is a
               power of two. */
            inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind to the first input for the timed pass. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_floatx80_pos[ inputNum ].low;
        a.high = inputs_floatx80_pos[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_floatx80 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
#endif
|
|
|
|
#ifdef FLOAT128
|
|
|
|
/*
 * Number of entries in the float128 operand tables.  The timing loops wrap
 * their table index with `& ( numInputs_float128 - 1 )', so this value must
 * remain a power of two.
 */
enum {
    numInputs_float128 = 32
};
|
|
|
|
static const struct {
|
|
bits64 high, low;
|
|
} inputs_float128[ numInputs_float128 ] = {
|
|
{ LIT64( 0x3FDA200000100000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x3FFF000000000000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x85F14776190C8306 ), LIT64( 0xD8715F4E3D54BB92 ) },
|
|
{ LIT64( 0xF2B00000007FFFFF ), LIT64( 0xFFFFFFFFFFF7FFFF ) },
|
|
{ LIT64( 0x8000000000000000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0xBFFFFFFFFFE00000 ), LIT64( 0x0000008000000000 ) },
|
|
{ LIT64( 0x407F1719CE722F3E ), LIT64( 0xDA6B3FE5FF29425B ) },
|
|
{ LIT64( 0x43FFFF8000000000 ), LIT64( 0x0000000000400000 ) },
|
|
{ LIT64( 0x401E000000000100 ), LIT64( 0x0000000000002000 ) },
|
|
{ LIT64( 0x3FFED71DACDA8E47 ), LIT64( 0x4860E3C75D224F28 ) },
|
|
{ LIT64( 0xBF7ECFC1E90647D1 ), LIT64( 0x7A124FE55623EE44 ) },
|
|
{ LIT64( 0x0DF7007FFFFFFFFF ), LIT64( 0xFFFFFFFFEFFFFFFF ) },
|
|
{ LIT64( 0x3FE5FFEFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFEFFF ) },
|
|
{ LIT64( 0x403FFFFFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFFBFE ) },
|
|
{ LIT64( 0xBFFB2FBF7399AFEB ), LIT64( 0xA459EE6A5C16CA55 ) },
|
|
{ LIT64( 0xBDB8FFFFFFFFFFFC ), LIT64( 0x0000000000000400 ) },
|
|
{ LIT64( 0x3FC8FFDFFFFFFFFF ), LIT64( 0xFFFFFFFFF0000000 ) },
|
|
{ LIT64( 0x3FFBFFFFFFDFFFFF ), LIT64( 0xFFF8000000000000 ) },
|
|
{ LIT64( 0x407043C11737BE84 ), LIT64( 0xDDD58212ADC937F4 ) },
|
|
{ LIT64( 0x8001000000000000 ), LIT64( 0x0000001000000001 ) },
|
|
{ LIT64( 0xC036FFFFFFFFFFFF ), LIT64( 0xFE40000000000000 ) },
|
|
{ LIT64( 0x4002FFFFFE000002 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x4000C3FEDE897773 ), LIT64( 0x326AC4FD8EFBE6DC ) },
|
|
{ LIT64( 0xBFFF0000000FFFFF ), LIT64( 0xFFFFFE0000000000 ) },
|
|
{ LIT64( 0x62C3E502146E426D ), LIT64( 0x43F3CAA0DC7DF1A0 ) },
|
|
{ LIT64( 0xB5CBD32E52BB570E ), LIT64( 0xBCC477CB11C6236C ) },
|
|
{ LIT64( 0xE228FFFFFFC00000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x3F80000000000000 ), LIT64( 0x0000000080000008 ) },
|
|
{ LIT64( 0xC1AFFFDFFFFFFFFF ), LIT64( 0xFFFC000000000000 ) },
|
|
{ LIT64( 0xC96F000000000000 ), LIT64( 0x00000001FFFBFFFF ) },
|
|
{ LIT64( 0x3DE09BFE7923A338 ), LIT64( 0xBCC8FBBD7CEC1F4F ) },
|
|
{ LIT64( 0x401CFFFFFFFFFFFF ), LIT64( 0xFFFFFFFEFFFFFF80 ) }
|
|
};
|
|
|
|
/*
 * Times `function', a routine that takes one float128 operand and returns
 * an int32.  Operands are taken in rotation from the inputs_float128 table.
 *
 * Calibration pass: batches of minIterations calls are executed until
 * clock() has advanced by at least CLOCKS_PER_SEC; `count' accumulates the
 * number of calls made.
 * Timed pass: exactly `count' calls are repeated from the start of the
 * table, and `count' together with the elapsed clock() ticks is passed to
 * reportTime.
 */
static void time_a_float128_z_int32( int32 function( float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    float128 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNum ].low;
            a.high = inputs_float128[ inputNum ].high;
            function( a );
            /* numInputs_float128 is a power of two, so the mask wraps the
               index back to 0 after the last entry. */
            inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Restart at the first input so the timed pass replays the same
       operand sequence. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNum ].low;
        a.high = inputs_float128[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes one float128 operand and returns
 * an int64.  Operands are taken in rotation from the inputs_float128 table.
 *
 * The first loop is a calibration pass: it runs batches of minIterations
 * calls until clock() shows at least CLOCKS_PER_SEC ticks elapsed, summing
 * the calls into `count'.  The second loop then performs exactly `count'
 * calls, and `count' plus the elapsed ticks are handed to reportTime.
 */
static void time_a_float128_z_int64( int64 function( float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    float128 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNum ].low;
            a.high = inputs_float128[ inputNum ].high;
            function( a );
            /* Power-of-two table size lets the mask wrap the index. */
            inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Timed pass starts again from the first table entry. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNum ].low;
        a.high = inputs_float128[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes one float128 operand and returns
 * a float32.  Operands are taken in rotation from the inputs_float128 table.
 *
 * A calibration pass runs batches of minIterations calls until clock() has
 * advanced by at least CLOCKS_PER_SEC and records the number of calls in
 * `count'.  A timed pass then makes exactly `count' calls; `count' and the
 * elapsed clock() ticks are passed to reportTime.
 */
static void time_a_float128_z_float32( float32 function( float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    float128 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNum ].low;
            a.high = inputs_float128[ inputNum ].high;
            function( a );
            /* numInputs_float128 is a power of two, so masking wraps the
               index. */
            inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind the input index before the timed pass. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNum ].low;
        a.high = inputs_float128[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes one float128 operand and returns
 * a float64.  Operands are taken in rotation from the inputs_float128 table.
 *
 * Calibration pass: repeat batches of minIterations calls until at least
 * CLOCKS_PER_SEC clock() ticks have elapsed, accumulating the call total in
 * `count'.  Timed pass: make exactly `count' calls and pass `count' and the
 * elapsed ticks to reportTime.
 */
static void time_a_float128_z_float64( float64 function( float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    float128 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNum ].low;
            a.high = inputs_float128[ inputNum ].high;
            function( a );
            /* Power-of-two table size lets the mask wrap the index. */
            inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Begin the timed pass from the first table entry. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNum ].low;
        a.high = inputs_float128[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
#ifdef FLOATX80

/*
 * Times `function', a routine that takes one float128 operand and returns
 * a floatx80.  Only compiled when FLOATX80 is defined.  Operands are taken
 * in rotation from the inputs_float128 table.
 *
 * A calibration pass runs batches of minIterations calls until clock() has
 * advanced by at least CLOCKS_PER_SEC, counting the calls in `count'.  The
 * timed pass repeats exactly `count' calls and passes `count' and the
 * elapsed clock() ticks to reportTime.
 */
static void time_a_float128_z_floatx80( floatx80 function( float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    float128 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNum ].low;
            a.high = inputs_float128[ inputNum ].high;
            function( a );
            /* numInputs_float128 is a power of two, so masking wraps the
               index. */
            inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Timed pass replays the inputs from the beginning. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNum ].low;
        a.high = inputs_float128[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}

#endif
|
|
|
|
/*
 * Times `function', a routine that maps one float128 operand to a float128
 * result.  Operands are taken in rotation from the inputs_float128 table.
 *
 * The calibration pass runs batches of minIterations calls until clock()
 * has advanced by at least CLOCKS_PER_SEC and sums the calls in `count'.
 * The timed pass then makes exactly `count' calls, after which `count' and
 * the elapsed clock() ticks are passed to reportTime.
 */
static void time_az_float128( float128 function( float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    float128 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNum ].low;
            a.high = inputs_float128[ inputNum ].high;
            function( a );
            /* Power-of-two table size lets the mask wrap the index. */
            inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind to the first input for the timed pass. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNum ].low;
        a.high = inputs_float128[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes two float128 operands and returns
 * a flag.  Both operands come from the inputs_float128 table, addressed by
 * two independent indices.
 *
 * The calibration pass runs batches of minIterations calls until clock()
 * has advanced by at least CLOCKS_PER_SEC and sums the calls in `count'.
 * The timed pass then makes exactly `count' calls starting again from
 * index 0 for both operands; `count' and the elapsed clock() ticks are
 * passed to reportTime.
 */
static void time_ab_float128_z_flag( flag function( float128, float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNumA, inputNumB;
    float128 a, b;

    count = 0;
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNumA ].low;
            a.high = inputs_float128[ inputNumA ].high;
            b.low = inputs_float128[ inputNumB ].low;
            b.high = inputs_float128[ inputNumB ].high;
            function( a, b );
            /* Both indices advance on every call.  Whenever index A wraps
               back to 0, index B is bumped one extra step, so each sweep
               of the table pairs `a' with a different `b'. */
            inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 );
            if ( inputNumA == 0 ) ++inputNumB;
            inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind both indices so the timed pass replays the same pairs. */
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNumA ].low;
        a.high = inputs_float128[ inputNumA ].high;
        b.low = inputs_float128[ inputNumB ].low;
        b.high = inputs_float128[ inputNumB ].high;
        function( a, b );
        inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 );
        if ( inputNumA == 0 ) ++inputNumB;
        inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
/*
 * Times `function', a routine that takes two float128 operands and returns
 * a float128.  Both operands come from the inputs_float128 table, addressed
 * by two independent indices.
 *
 * Calibration pass: batches of minIterations calls run until clock() has
 * advanced by at least CLOCKS_PER_SEC; the calls are summed in `count'.
 * Timed pass: exactly `count' calls are made with both indices reset to 0,
 * then `count' and the elapsed clock() ticks are passed to reportTime.
 */
static void time_abz_float128( float128 function( float128, float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNumA, inputNumB;
    float128 a, b;

    count = 0;
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128[ inputNumA ].low;
            a.high = inputs_float128[ inputNumA ].high;
            b.low = inputs_float128[ inputNumB ].low;
            b.high = inputs_float128[ inputNumB ].high;
            function( a, b );
            /* Index B steps once per call plus once more each time index
               A wraps to 0, which shifts the a/b pairing on every sweep
               of the table. */
            inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 );
            if ( inputNumA == 0 ) ++inputNumB;
            inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Start the timed pass from the first pair again. */
    inputNumA = 0;
    inputNumB = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128[ inputNumA ].low;
        a.high = inputs_float128[ inputNumA ].high;
        b.low = inputs_float128[ inputNumB ].low;
        b.high = inputs_float128[ inputNumB ].high;
        function( a, b );
        inputNumA = ( inputNumA + 1 ) & ( numInputs_float128 - 1 );
        if ( inputNumA == 0 ) ++inputNumB;
        inputNumB = ( inputNumB + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
static const struct {
|
|
bits64 high, low;
|
|
} inputs_float128_pos[ numInputs_float128 ] = {
|
|
{ LIT64( 0x3FDA200000100000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x3FFF000000000000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x05F14776190C8306 ), LIT64( 0xD8715F4E3D54BB92 ) },
|
|
{ LIT64( 0x72B00000007FFFFF ), LIT64( 0xFFFFFFFFFFF7FFFF ) },
|
|
{ LIT64( 0x0000000000000000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x3FFFFFFFFFE00000 ), LIT64( 0x0000008000000000 ) },
|
|
{ LIT64( 0x407F1719CE722F3E ), LIT64( 0xDA6B3FE5FF29425B ) },
|
|
{ LIT64( 0x43FFFF8000000000 ), LIT64( 0x0000000000400000 ) },
|
|
{ LIT64( 0x401E000000000100 ), LIT64( 0x0000000000002000 ) },
|
|
{ LIT64( 0x3FFED71DACDA8E47 ), LIT64( 0x4860E3C75D224F28 ) },
|
|
{ LIT64( 0x3F7ECFC1E90647D1 ), LIT64( 0x7A124FE55623EE44 ) },
|
|
{ LIT64( 0x0DF7007FFFFFFFFF ), LIT64( 0xFFFFFFFFEFFFFFFF ) },
|
|
{ LIT64( 0x3FE5FFEFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFEFFF ) },
|
|
{ LIT64( 0x403FFFFFFFFFFFFF ), LIT64( 0xFFFFFFFFFFFFFBFE ) },
|
|
{ LIT64( 0x3FFB2FBF7399AFEB ), LIT64( 0xA459EE6A5C16CA55 ) },
|
|
{ LIT64( 0x3DB8FFFFFFFFFFFC ), LIT64( 0x0000000000000400 ) },
|
|
{ LIT64( 0x3FC8FFDFFFFFFFFF ), LIT64( 0xFFFFFFFFF0000000 ) },
|
|
{ LIT64( 0x3FFBFFFFFFDFFFFF ), LIT64( 0xFFF8000000000000 ) },
|
|
{ LIT64( 0x407043C11737BE84 ), LIT64( 0xDDD58212ADC937F4 ) },
|
|
{ LIT64( 0x0001000000000000 ), LIT64( 0x0000001000000001 ) },
|
|
{ LIT64( 0x4036FFFFFFFFFFFF ), LIT64( 0xFE40000000000000 ) },
|
|
{ LIT64( 0x4002FFFFFE000002 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x4000C3FEDE897773 ), LIT64( 0x326AC4FD8EFBE6DC ) },
|
|
{ LIT64( 0x3FFF0000000FFFFF ), LIT64( 0xFFFFFE0000000000 ) },
|
|
{ LIT64( 0x62C3E502146E426D ), LIT64( 0x43F3CAA0DC7DF1A0 ) },
|
|
{ LIT64( 0x35CBD32E52BB570E ), LIT64( 0xBCC477CB11C6236C ) },
|
|
{ LIT64( 0x6228FFFFFFC00000 ), LIT64( 0x0000000000000000 ) },
|
|
{ LIT64( 0x3F80000000000000 ), LIT64( 0x0000000080000008 ) },
|
|
{ LIT64( 0x41AFFFDFFFFFFFFF ), LIT64( 0xFFFC000000000000 ) },
|
|
{ LIT64( 0x496F000000000000 ), LIT64( 0x00000001FFFBFFFF ) },
|
|
{ LIT64( 0x3DE09BFE7923A338 ), LIT64( 0xBCC8FBBD7CEC1F4F ) },
|
|
{ LIT64( 0x401CFFFFFFFFFFFF ), LIT64( 0xFFFFFFFEFFFFFF80 ) }
|
|
};
|
|
|
|
/*
 * Times `function', a routine that maps one float128 operand to a float128
 * result, using operands from the inputs_float128_pos table (whose entries
 * all have the sign bit clear) instead of inputs_float128.
 * NOTE(review): presumably intended for routines that should only be timed
 * on non-negative operands (e.g. square root) -- confirm at the call site.
 *
 * A calibration pass runs batches of minIterations calls until clock() has
 * advanced by at least CLOCKS_PER_SEC, counting the calls in `count'.  The
 * timed pass repeats exactly `count' calls and passes `count' and the
 * elapsed clock() ticks to reportTime.
 */
static void time_az_float128_pos( float128 function( float128 ) )
{
    clock_t startClock, endClock;
    int32 count, i;
    int8 inputNum;
    float128 a;

    count = 0;
    inputNum = 0;
    startClock = clock();
    do {
        for ( i = minIterations; i; --i ) {
            a.low = inputs_float128_pos[ inputNum ].low;
            a.high = inputs_float128_pos[ inputNum ].high;
            function( a );
            /* numInputs_float128 is a power of two, so masking wraps the
               index. */
            inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
        }
        count += minIterations;
    } while ( clock() - startClock < CLOCKS_PER_SEC );
    /* Rewind to the first input for the timed pass. */
    inputNum = 0;
    startClock = clock();
    for ( i = count; i; --i ) {
        a.low = inputs_float128_pos[ inputNum ].low;
        a.high = inputs_float128_pos[ inputNum ].high;
        function( a );
        inputNum = ( inputNum + 1 ) & ( numInputs_float128 - 1 );
    }
    endClock = clock();
    reportTime( count, endClock - startClock );

}
|
|
|
|
#endif
|
|
|
|
/*
 * Codes identifying each routine that can be timed.  Codes start at 1, so 0
 * never names a routine.  The floatx80 and float128 codes exist only when
 * FLOATX80 / FLOAT128 are defined, which means the numeric value of the
 * later codes depends on the build configuration.  NUM_FUNCTIONS is one
 * past the last code and is used as the length of the `functions' table,
 * whose entries must be kept in exactly this order.
 */
enum {
    /* Conversions from integers. */
    INT32_TO_FLOAT32 = 1,
    INT32_TO_FLOAT64,
#ifdef FLOATX80
    INT32_TO_FLOATX80,
#endif
#ifdef FLOAT128
    INT32_TO_FLOAT128,
#endif
    INT64_TO_FLOAT32,
    INT64_TO_FLOAT64,
#ifdef FLOATX80
    INT64_TO_FLOATX80,
#endif
#ifdef FLOAT128
    INT64_TO_FLOAT128,
#endif
    /* float32 operations. */
    FLOAT32_TO_INT32,
    FLOAT32_TO_INT32_ROUND_TO_ZERO,
    FLOAT32_TO_INT64,
    FLOAT32_TO_INT64_ROUND_TO_ZERO,
    FLOAT32_TO_FLOAT64,
#ifdef FLOATX80
    FLOAT32_TO_FLOATX80,
#endif
#ifdef FLOAT128
    FLOAT32_TO_FLOAT128,
#endif
    FLOAT32_ROUND_TO_INT,
    FLOAT32_ADD,
    FLOAT32_SUB,
    FLOAT32_MUL,
    FLOAT32_DIV,
    FLOAT32_REM,
    FLOAT32_SQRT,
    FLOAT32_EQ,
    FLOAT32_LE,
    FLOAT32_LT,
    FLOAT32_EQ_SIGNALING,
    FLOAT32_LE_QUIET,
    FLOAT32_LT_QUIET,
    /* float64 operations. */
    FLOAT64_TO_INT32,
    FLOAT64_TO_INT32_ROUND_TO_ZERO,
    FLOAT64_TO_INT64,
    FLOAT64_TO_INT64_ROUND_TO_ZERO,
    FLOAT64_TO_FLOAT32,
#ifdef FLOATX80
    FLOAT64_TO_FLOATX80,
#endif
#ifdef FLOAT128
    FLOAT64_TO_FLOAT128,
#endif
    FLOAT64_ROUND_TO_INT,
    FLOAT64_ADD,
    FLOAT64_SUB,
    FLOAT64_MUL,
    FLOAT64_DIV,
    FLOAT64_REM,
    FLOAT64_SQRT,
    FLOAT64_EQ,
    FLOAT64_LE,
    FLOAT64_LT,
    FLOAT64_EQ_SIGNALING,
    FLOAT64_LE_QUIET,
    FLOAT64_LT_QUIET,
    /* floatx80 operations. */
#ifdef FLOATX80
    FLOATX80_TO_INT32,
    FLOATX80_TO_INT32_ROUND_TO_ZERO,
    FLOATX80_TO_INT64,
    FLOATX80_TO_INT64_ROUND_TO_ZERO,
    FLOATX80_TO_FLOAT32,
    FLOATX80_TO_FLOAT64,
#ifdef FLOAT128
    FLOATX80_TO_FLOAT128,
#endif
    FLOATX80_ROUND_TO_INT,
    FLOATX80_ADD,
    FLOATX80_SUB,
    FLOATX80_MUL,
    FLOATX80_DIV,
    FLOATX80_REM,
    FLOATX80_SQRT,
    FLOATX80_EQ,
    FLOATX80_LE,
    FLOATX80_LT,
    FLOATX80_EQ_SIGNALING,
    FLOATX80_LE_QUIET,
    FLOATX80_LT_QUIET,
#endif
    /* float128 operations. */
#ifdef FLOAT128
    FLOAT128_TO_INT32,
    FLOAT128_TO_INT32_ROUND_TO_ZERO,
    FLOAT128_TO_INT64,
    FLOAT128_TO_INT64_ROUND_TO_ZERO,
    FLOAT128_TO_FLOAT32,
    FLOAT128_TO_FLOAT64,
#ifdef FLOATX80
    FLOAT128_TO_FLOATX80,
#endif
    FLOAT128_ROUND_TO_INT,
    FLOAT128_ADD,
    FLOAT128_SUB,
    FLOAT128_MUL,
    FLOAT128_DIV,
    FLOAT128_REM,
    FLOAT128_SQRT,
    FLOAT128_EQ,
    FLOAT128_LE,
    FLOAT128_LT,
    FLOAT128_EQ_SIGNALING,
    FLOAT128_LE_QUIET,
    FLOAT128_LT_QUIET,
#endif
    NUM_FUNCTIONS
};
|
|
|
|
static struct {
|
|
char *name;
|
|
int8 numInputs;
|
|
flag roundingPrecision, roundingMode;
|
|
flag tininessMode, tininessModeAtReducedPrecision;
|
|
} functions[ NUM_FUNCTIONS ] = {
|
|
{ 0, 0, 0, 0, 0, 0 },
|
|
{ "int32_to_float32", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "int32_to_float64", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#ifdef FLOATX80
|
|
{ "int32_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
#ifdef FLOAT128
|
|
{ "int32_to_float128", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
{ "int64_to_float32", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "int64_to_float64", 1, FALSE, TRUE, FALSE, FALSE },
|
|
#ifdef FLOATX80
|
|
{ "int64_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
#ifdef FLOAT128
|
|
{ "int64_to_float128", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
{ "float32_to_int32", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float32_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_to_int64", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float32_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_to_float64", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#ifdef FLOATX80
|
|
{ "float32_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
#ifdef FLOAT128
|
|
{ "float32_to_float128", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
{ "float32_round_to_int", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float32_add", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float32_sub", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float32_mul", 2, FALSE, TRUE, TRUE, FALSE },
|
|
{ "float32_div", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float32_rem", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_sqrt", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float32_eq", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_le", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_lt", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_le_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float32_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_to_int32", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float64_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_to_int64", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float64_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_to_float32", 1, FALSE, TRUE, TRUE, FALSE },
|
|
#ifdef FLOATX80
|
|
{ "float64_to_floatx80", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
#ifdef FLOAT128
|
|
{ "float64_to_float128", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
{ "float64_round_to_int", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float64_add", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float64_sub", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float64_mul", 2, FALSE, TRUE, TRUE, FALSE },
|
|
{ "float64_div", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float64_rem", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_sqrt", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float64_eq", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_le", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_lt", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_le_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float64_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
#ifdef FLOATX80
|
|
{ "floatx80_to_int32", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "floatx80_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_to_int64", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "floatx80_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_to_float32", 1, FALSE, TRUE, TRUE, FALSE },
|
|
{ "floatx80_to_float64", 1, FALSE, TRUE, TRUE, FALSE },
|
|
#ifdef FLOAT128
|
|
{ "floatx80_to_float128", 1, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
{ "floatx80_round_to_int", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "floatx80_add", 2, TRUE, TRUE, FALSE, TRUE },
|
|
{ "floatx80_sub", 2, TRUE, TRUE, FALSE, TRUE },
|
|
{ "floatx80_mul", 2, TRUE, TRUE, TRUE, TRUE },
|
|
{ "floatx80_div", 2, TRUE, TRUE, FALSE, TRUE },
|
|
{ "floatx80_rem", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_sqrt", 1, TRUE, TRUE, FALSE, FALSE },
|
|
{ "floatx80_eq", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_le", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_lt", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_le_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "floatx80_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
#ifdef FLOAT128
|
|
{ "float128_to_int32", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float128_to_int32_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_to_int64", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float128_to_int64_round_to_zero", 1, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_to_float32", 1, FALSE, TRUE, TRUE, FALSE },
|
|
{ "float128_to_float64", 1, FALSE, TRUE, TRUE, FALSE },
|
|
#ifdef FLOATX80
|
|
{ "float128_to_floatx80", 1, FALSE, TRUE, TRUE, FALSE },
|
|
#endif
|
|
{ "float128_round_to_int", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float128_add", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float128_sub", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float128_mul", 2, FALSE, TRUE, TRUE, FALSE },
|
|
{ "float128_div", 2, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float128_rem", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_sqrt", 1, FALSE, TRUE, FALSE, FALSE },
|
|
{ "float128_eq", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_le", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_lt", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_eq_signaling", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_le_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
{ "float128_lt_quiet", 2, FALSE, FALSE, FALSE, FALSE },
|
|
#endif
|
|
};
|
|
|
|
/*
 * Rounding-mode selectors accepted by timeFunctionVariety, which maps each
 * one to a display name and to the corresponding float_round_* code.  The
 * selectors start at 1; timeFunctionVariety treats 0 as "no mode named"
 * and then uses float_round_nearest_even.  NUM_ROUNDINGMODES is one past
 * the last selector.
 */
enum {
    ROUND_NEAREST_EVEN = 1,
    ROUND_TO_ZERO,
    ROUND_DOWN,
    ROUND_UP,
    NUM_ROUNDINGMODES
};
|
|
/*
 * Tininess-detection selectors accepted by timeFunctionVariety, which maps
 * each one to a display name and to the corresponding float_tininess_*
 * code.  The selectors start at 1; timeFunctionVariety treats 0 as "no mode
 * named" and then uses float_tininess_after_rounding.  NUM_TININESSMODES is
 * one past the last selector.
 */
enum {
    TININESS_BEFORE_ROUNDING = 1,
    TININESS_AFTER_ROUNDING,
    NUM_TININESSMODES
};
|
|
|
|
static void
|
|
timeFunctionVariety(
|
|
uint8 functionCode,
|
|
int8 roundingPrecision,
|
|
int8 roundingMode,
|
|
int8 tininessMode
|
|
)
|
|
{
|
|
uint8 roundingCode;
|
|
int8 tininessCode;
|
|
|
|
functionName = functions[ functionCode ].name;
|
|
if ( roundingPrecision == 32 ) {
|
|
roundingPrecisionName = "32";
|
|
}
|
|
else if ( roundingPrecision == 64 ) {
|
|
roundingPrecisionName = "64";
|
|
}
|
|
else if ( roundingPrecision == 80 ) {
|
|
roundingPrecisionName = "80";
|
|
}
|
|
else {
|
|
roundingPrecisionName = 0;
|
|
}
|
|
#ifdef FLOATX80
|
|
floatx80_rounding_precision = roundingPrecision;
|
|
#endif
|
|
switch ( roundingMode ) {
|
|
case 0:
|
|
roundingModeName = 0;
|
|
roundingCode = float_round_nearest_even;
|
|
break;
|
|
case ROUND_NEAREST_EVEN:
|
|
roundingModeName = "nearest_even";
|
|
roundingCode = float_round_nearest_even;
|
|
break;
|
|
case ROUND_TO_ZERO:
|
|
roundingModeName = "to_zero";
|
|
roundingCode = float_round_to_zero;
|
|
break;
|
|
case ROUND_DOWN:
|
|
roundingModeName = "down";
|
|
roundingCode = float_round_down;
|
|
break;
|
|
case ROUND_UP:
|
|
roundingModeName = "up";
|
|
roundingCode = float_round_up;
|
|
break;
|
|
}
|
|
float_rounding_mode = roundingCode;
|
|
switch ( tininessMode ) {
|
|
case 0:
|
|
tininessModeName = 0;
|
|
tininessCode = float_tininess_after_rounding;
|
|
break;
|
|
case TININESS_BEFORE_ROUNDING:
|
|
tininessModeName = "before";
|
|
tininessCode = float_tininess_before_rounding;
|
|
break;
|
|
case TININESS_AFTER_ROUNDING:
|
|
tininessModeName = "after";
|
|
tininessCode = float_tininess_after_rounding;
|
|
break;
|
|
}
|
|
float_detect_tininess = tininessCode;
|
|
switch ( functionCode ) {
|
|
case INT32_TO_FLOAT32:
|
|
time_a_int32_z_float32( int32_to_float32 );
|
|
break;
|
|
case INT32_TO_FLOAT64:
|
|
time_a_int32_z_float64( int32_to_float64 );
|
|
break;
|
|
#ifdef FLOATX80
|
|
case INT32_TO_FLOATX80:
|
|
time_a_int32_z_floatx80( int32_to_floatx80 );
|
|
break;
|
|
#endif
|
|
#ifdef FLOAT128
|
|
case INT32_TO_FLOAT128:
|
|
time_a_int32_z_float128( int32_to_float128 );
|
|
break;
|
|
#endif
|
|
case INT64_TO_FLOAT32:
|
|
time_a_int64_z_float32( int64_to_float32 );
|
|
break;
|
|
case INT64_TO_FLOAT64:
|
|
time_a_int64_z_float64( int64_to_float64 );
|
|
break;
|
|
#ifdef FLOATX80
|
|
case INT64_TO_FLOATX80:
|
|
time_a_int64_z_floatx80( int64_to_floatx80 );
|
|
break;
|
|
#endif
|
|
#ifdef FLOAT128
|
|
case INT64_TO_FLOAT128:
|
|
time_a_int64_z_float128( int64_to_float128 );
|
|
break;
|
|
#endif
|
|
case FLOAT32_TO_INT32:
|
|
time_a_float32_z_int32( float32_to_int32 );
|
|
break;
|
|
case FLOAT32_TO_INT32_ROUND_TO_ZERO:
|
|
time_a_float32_z_int32( float32_to_int32_round_to_zero );
|
|
break;
|
|
case FLOAT32_TO_INT64:
|
|
time_a_float32_z_int64( float32_to_int64 );
|
|
break;
|
|
case FLOAT32_TO_INT64_ROUND_TO_ZERO:
|
|
time_a_float32_z_int64( float32_to_int64_round_to_zero );
|
|
break;
|
|
case FLOAT32_TO_FLOAT64:
|
|
time_a_float32_z_float64( float32_to_float64 );
|
|
break;
|
|
#ifdef FLOATX80
|
|
case FLOAT32_TO_FLOATX80:
|
|
time_a_float32_z_floatx80( float32_to_floatx80 );
|
|
break;
|
|
#endif
|
|
#ifdef FLOAT128
|
|
case FLOAT32_TO_FLOAT128:
|
|
time_a_float32_z_float128( float32_to_float128 );
|
|
break;
|
|
#endif
|
|
case FLOAT32_ROUND_TO_INT:
|
|
time_az_float32( float32_round_to_int );
|
|
break;
|
|
case FLOAT32_ADD:
|
|
time_abz_float32( float32_add );
|
|
break;
|
|
case FLOAT32_SUB:
|
|
time_abz_float32( float32_sub );
|
|
break;
|
|
case FLOAT32_MUL:
|
|
time_abz_float32( float32_mul );
|
|
break;
|
|
case FLOAT32_DIV:
|
|
time_abz_float32( float32_div );
|
|
break;
|
|
case FLOAT32_REM:
|
|
time_abz_float32( float32_rem );
|
|
break;
|
|
case FLOAT32_SQRT:
|
|
time_az_float32_pos( float32_sqrt );
|
|
break;
|
|
case FLOAT32_EQ:
|
|
time_ab_float32_z_flag( float32_eq );
|
|
break;
|
|
case FLOAT32_LE:
|
|
time_ab_float32_z_flag( float32_le );
|
|
break;
|
|
case FLOAT32_LT:
|
|
time_ab_float32_z_flag( float32_lt );
|
|
break;
|
|
case FLOAT32_EQ_SIGNALING:
|
|
time_ab_float32_z_flag( float32_eq_signaling );
|
|
break;
|
|
case FLOAT32_LE_QUIET:
|
|
time_ab_float32_z_flag( float32_le_quiet );
|
|
break;
|
|
case FLOAT32_LT_QUIET:
|
|
time_ab_float32_z_flag( float32_lt_quiet );
|
|
break;
|
|
case FLOAT64_TO_INT32:
|
|
time_a_float64_z_int32( float64_to_int32 );
|
|
break;
|
|
case FLOAT64_TO_INT32_ROUND_TO_ZERO:
|
|
time_a_float64_z_int32( float64_to_int32_round_to_zero );
|
|
break;
|
|
case FLOAT64_TO_INT64:
|
|
time_a_float64_z_int64( float64_to_int64 );
|
|
break;
|
|
case FLOAT64_TO_INT64_ROUND_TO_ZERO:
|
|
time_a_float64_z_int64( float64_to_int64_round_to_zero );
|
|
break;
|
|
case FLOAT64_TO_FLOAT32:
|
|
time_a_float64_z_float32( float64_to_float32 );
|
|
break;
|
|
#ifdef FLOATX80
|
|
case FLOAT64_TO_FLOATX80:
|
|
time_a_float64_z_floatx80( float64_to_floatx80 );
|
|
break;
|
|
#endif
|
|
#ifdef FLOAT128
|
|
case FLOAT64_TO_FLOAT128:
|
|
time_a_float64_z_float128( float64_to_float128 );
|
|
break;
|
|
#endif
|
|
case FLOAT64_ROUND_TO_INT:
|
|
time_az_float64( float64_round_to_int );
|
|
break;
|
|
case FLOAT64_ADD:
|
|
time_abz_float64( float64_add );
|
|
break;
|
|
case FLOAT64_SUB:
|
|
time_abz_float64( float64_sub );
|
|
break;
|
|
case FLOAT64_MUL:
|
|
time_abz_float64( float64_mul );
|
|
break;
|
|
case FLOAT64_DIV:
|
|
time_abz_float64( float64_div );
|
|
break;
|
|
case FLOAT64_REM:
|
|
time_abz_float64( float64_rem );
|
|
break;
|
|
case FLOAT64_SQRT:
|
|
time_az_float64_pos( float64_sqrt );
|
|
break;
|
|
case FLOAT64_EQ:
|
|
time_ab_float64_z_flag( float64_eq );
|
|
break;
|
|
case FLOAT64_LE:
|
|
time_ab_float64_z_flag( float64_le );
|
|
break;
|
|
case FLOAT64_LT:
|
|
time_ab_float64_z_flag( float64_lt );
|
|
break;
|
|
case FLOAT64_EQ_SIGNALING:
|
|
time_ab_float64_z_flag( float64_eq_signaling );
|
|
break;
|
|
case FLOAT64_LE_QUIET:
|
|
time_ab_float64_z_flag( float64_le_quiet );
|
|
break;
|
|
case FLOAT64_LT_QUIET:
|
|
time_ab_float64_z_flag( float64_lt_quiet );
|
|
break;
|
|
#ifdef FLOATX80
|
|
case FLOATX80_TO_INT32:
|
|
time_a_floatx80_z_int32( floatx80_to_int32 );
|
|
break;
|
|
case FLOATX80_TO_INT32_ROUND_TO_ZERO:
|
|
time_a_floatx80_z_int32( floatx80_to_int32_round_to_zero );
|
|
break;
|
|
case FLOATX80_TO_INT64:
|
|
time_a_floatx80_z_int64( floatx80_to_int64 );
|
|
break;
|
|
case FLOATX80_TO_INT64_ROUND_TO_ZERO:
|
|
time_a_floatx80_z_int64( floatx80_to_int64_round_to_zero );
|
|
break;
|
|
case FLOATX80_TO_FLOAT32:
|
|
time_a_floatx80_z_float32( floatx80_to_float32 );
|
|
break;
|
|
case FLOATX80_TO_FLOAT64:
|
|
time_a_floatx80_z_float64( floatx80_to_float64 );
|
|
break;
|
|
#ifdef FLOAT128
|
|
case FLOATX80_TO_FLOAT128:
|
|
time_a_floatx80_z_float128( floatx80_to_float128 );
|
|
break;
|
|
#endif
|
|
case FLOATX80_ROUND_TO_INT:
|
|
time_az_floatx80( floatx80_round_to_int );
|
|
break;
|
|
case FLOATX80_ADD:
|
|
time_abz_floatx80( floatx80_add );
|
|
break;
|
|
case FLOATX80_SUB:
|
|
time_abz_floatx80( floatx80_sub );
|
|
break;
|
|
case FLOATX80_MUL:
|
|
time_abz_floatx80( floatx80_mul );
|
|
break;
|
|
case FLOATX80_DIV:
|
|
time_abz_floatx80( floatx80_div );
|
|
break;
|
|
case FLOATX80_REM:
|
|
time_abz_floatx80( floatx80_rem );
|
|
break;
|
|
case FLOATX80_SQRT:
|
|
time_az_floatx80_pos( floatx80_sqrt );
|
|
break;
|
|
case FLOATX80_EQ:
|
|
time_ab_floatx80_z_flag( floatx80_eq );
|
|
break;
|
|
case FLOATX80_LE:
|
|
time_ab_floatx80_z_flag( floatx80_le );
|
|
break;
|
|
case FLOATX80_LT:
|
|
time_ab_floatx80_z_flag( floatx80_lt );
|
|
break;
|
|
case FLOATX80_EQ_SIGNALING:
|
|
time_ab_floatx80_z_flag( floatx80_eq_signaling );
|
|
break;
|
|
case FLOATX80_LE_QUIET:
|
|
time_ab_floatx80_z_flag( floatx80_le_quiet );
|
|
break;
|
|
case FLOATX80_LT_QUIET:
|
|
time_ab_floatx80_z_flag( floatx80_lt_quiet );
|
|
break;
|
|
#endif
|
|
#ifdef FLOAT128
|
|
case FLOAT128_TO_INT32:
|
|
time_a_float128_z_int32( float128_to_int32 );
|
|
break;
|
|
case FLOAT128_TO_INT32_ROUND_TO_ZERO:
|
|
time_a_float128_z_int32( float128_to_int32_round_to_zero );
|
|
break;
|
|
case FLOAT128_TO_INT64:
|
|
time_a_float128_z_int64( float128_to_int64 );
|
|
break;
|
|
case FLOAT128_TO_INT64_ROUND_TO_ZERO:
|
|
time_a_float128_z_int64( float128_to_int64_round_to_zero );
|
|
break;
|
|
case FLOAT128_TO_FLOAT32:
|
|
time_a_float128_z_float32( float128_to_float32 );
|
|
break;
|
|
case FLOAT128_TO_FLOAT64:
|
|
time_a_float128_z_float64( float128_to_float64 );
|
|
break;
|
|
#ifdef FLOATX80
|
|
case FLOAT128_TO_FLOATX80:
|
|
time_a_float128_z_floatx80( float128_to_floatx80 );
|
|
break;
|
|
#endif
|
|
case FLOAT128_ROUND_TO_INT:
|
|
time_az_float128( float128_round_to_int );
|
|
break;
|
|
case FLOAT128_ADD:
|
|
time_abz_float128( float128_add );
|
|
break;
|
|
case FLOAT128_SUB:
|
|
time_abz_float128( float128_sub );
|
|
break;
|
|
case FLOAT128_MUL:
|
|
time_abz_float128( float128_mul );
|
|
break;
|
|
case FLOAT128_DIV:
|
|
time_abz_float128( float128_div );
|
|
break;
|
|
case FLOAT128_REM:
|
|
time_abz_float128( float128_rem );
|
|
break;
|
|
case FLOAT128_SQRT:
|
|
time_az_float128_pos( float128_sqrt );
|
|
break;
|
|
case FLOAT128_EQ:
|
|
time_ab_float128_z_flag( float128_eq );
|
|
break;
|
|
case FLOAT128_LE:
|
|
time_ab_float128_z_flag( float128_le );
|
|
break;
|
|
case FLOAT128_LT:
|
|
time_ab_float128_z_flag( float128_lt );
|
|
break;
|
|
case FLOAT128_EQ_SIGNALING:
|
|
time_ab_float128_z_flag( float128_eq_signaling );
|
|
break;
|
|
case FLOAT128_LE_QUIET:
|
|
time_ab_float128_z_flag( float128_le_quiet );
|
|
break;
|
|
case FLOAT128_LT_QUIET:
|
|
time_ab_float128_z_flag( float128_lt_quiet );
|
|
break;
|
|
#endif
|
|
}
|
|
|
|
}
|
|
|
|
static void
|
|
timeFunction(
|
|
uint8 functionCode,
|
|
int8 roundingPrecisionIn,
|
|
int8 roundingModeIn,
|
|
int8 tininessModeIn
|
|
)
|
|
{
|
|
int8 roundingPrecision, roundingMode, tininessMode;
|
|
|
|
roundingPrecision = 32;
|
|
for (;;) {
|
|
if ( ! functions[ functionCode ].roundingPrecision ) {
|
|
roundingPrecision = 0;
|
|
}
|
|
else if ( roundingPrecisionIn ) {
|
|
roundingPrecision = roundingPrecisionIn;
|
|
}
|
|
for ( roundingMode = 1;
|
|
roundingMode < NUM_ROUNDINGMODES;
|
|
++roundingMode
|
|
) {
|
|
if ( ! functions[ functionCode ].roundingMode ) {
|
|
roundingMode = 0;
|
|
}
|
|
else if ( roundingModeIn ) {
|
|
roundingMode = roundingModeIn;
|
|
}
|
|
for ( tininessMode = 1;
|
|
tininessMode < NUM_TININESSMODES;
|
|
++tininessMode
|
|
) {
|
|
if ( ( roundingPrecision == 32 )
|
|
|| ( roundingPrecision == 64 ) ) {
|
|
if ( ! functions[ functionCode ]
|
|
.tininessModeAtReducedPrecision
|
|
) {
|
|
tininessMode = 0;
|
|
}
|
|
else if ( tininessModeIn ) {
|
|
tininessMode = tininessModeIn;
|
|
}
|
|
}
|
|
else {
|
|
if ( ! functions[ functionCode ].tininessMode ) {
|
|
tininessMode = 0;
|
|
}
|
|
else if ( tininessModeIn ) {
|
|
tininessMode = tininessModeIn;
|
|
}
|
|
}
|
|
timeFunctionVariety(
|
|
functionCode, roundingPrecision, roundingMode, tininessMode
|
|
);
|
|
if ( tininessModeIn || ! tininessMode ) break;
|
|
}
|
|
if ( roundingModeIn || ! roundingMode ) break;
|
|
}
|
|
if ( roundingPrecisionIn || ! roundingPrecision ) break;
|
|
if ( roundingPrecision == 80 ) {
|
|
break;
|
|
}
|
|
else if ( roundingPrecision == 64 ) {
|
|
roundingPrecision = 80;
|
|
}
|
|
else if ( roundingPrecision == 32 ) {
|
|
roundingPrecision = 64;
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
main( int argc, char **argv )
|
|
{
|
|
char *argPtr;
|
|
flag functionArgument;
|
|
uint8 functionCode;
|
|
int8 operands, roundingPrecision, roundingMode, tininessMode;
|
|
|
|
if ( argc <= 1 ) goto writeHelpMessage;
|
|
functionArgument = FALSE;
|
|
functionCode = 0;
|
|
operands = 0;
|
|
roundingPrecision = 0;
|
|
roundingMode = 0;
|
|
tininessMode = 0;
|
|
--argc;
|
|
++argv;
|
|
while ( argc && ( argPtr = argv[ 0 ] ) ) {
|
|
if ( argPtr[ 0 ] == '-' ) ++argPtr;
|
|
if ( strcmp( argPtr, "help" ) == 0 ) {
|
|
writeHelpMessage:
|
|
fputs(
|
|
"timesoftfloat [<option>...] <function>\n"
|
|
" <option>: (* is default)\n"
|
|
" -help --Write this message and exit.\n"
|
|
#ifdef FLOATX80
|
|
" -precision32 --Only time rounding precision equivalent to float32.\n"
|
|
" -precision64 --Only time rounding precision equivalent to float64.\n"
|
|
" -precision80 --Only time maximum rounding precision.\n"
|
|
#endif
|
|
" -nearesteven --Only time rounding to nearest/even.\n"
|
|
" -tozero --Only time rounding to zero.\n"
|
|
" -down --Only time rounding down.\n"
|
|
" -up --Only time rounding up.\n"
|
|
" -tininessbefore --Only time underflow tininess before rounding.\n"
|
|
" -tininessafter --Only time underflow tininess after rounding.\n"
|
|
" <function>:\n"
|
|
" int32_to_<float> <float>_add <float>_eq\n"
|
|
" <float>_to_int32 <float>_sub <float>_le\n"
|
|
" <float>_to_int32_round_to_zero <float>_mul <float>_lt\n"
|
|
" int64_to_<float> <float>_div <float>_eq_signaling\n"
|
|
" <float>_to_int64 <float>_rem <float>_le_quiet\n"
|
|
" <float>_to_int64_round_to_zero <float>_lt_quiet\n"
|
|
" <float>_to_<float>\n"
|
|
" <float>_round_to_int\n"
|
|
" <float>_sqrt\n"
|
|
" -all1 --All 1-operand functions.\n"
|
|
" -all2 --All 2-operand functions.\n"
|
|
" -all --All functions.\n"
|
|
" <float>:\n"
|
|
" float32 --Single precision.\n"
|
|
" float64 --Double precision.\n"
|
|
#ifdef FLOATX80
|
|
" floatx80 --Extended double precision.\n"
|
|
#endif
|
|
#ifdef FLOAT128
|
|
" float128 --Quadruple precision.\n"
|
|
#endif
|
|
,
|
|
stdout
|
|
);
|
|
return EXIT_SUCCESS;
|
|
}
|
|
#ifdef FLOATX80
|
|
else if ( strcmp( argPtr, "precision32" ) == 0 ) {
|
|
roundingPrecision = 32;
|
|
}
|
|
else if ( strcmp( argPtr, "precision64" ) == 0 ) {
|
|
roundingPrecision = 64;
|
|
}
|
|
else if ( strcmp( argPtr, "precision80" ) == 0 ) {
|
|
roundingPrecision = 80;
|
|
}
|
|
#endif
|
|
else if ( ( strcmp( argPtr, "nearesteven" ) == 0 )
|
|
|| ( strcmp( argPtr, "nearest_even" ) == 0 ) ) {
|
|
roundingMode = ROUND_NEAREST_EVEN;
|
|
}
|
|
else if ( ( strcmp( argPtr, "tozero" ) == 0 )
|
|
|| ( strcmp( argPtr, "to_zero" ) == 0 ) ) {
|
|
roundingMode = ROUND_TO_ZERO;
|
|
}
|
|
else if ( strcmp( argPtr, "down" ) == 0 ) {
|
|
roundingMode = ROUND_DOWN;
|
|
}
|
|
else if ( strcmp( argPtr, "up" ) == 0 ) {
|
|
roundingMode = ROUND_UP;
|
|
}
|
|
else if ( strcmp( argPtr, "tininessbefore" ) == 0 ) {
|
|
tininessMode = TININESS_BEFORE_ROUNDING;
|
|
}
|
|
else if ( strcmp( argPtr, "tininessafter" ) == 0 ) {
|
|
tininessMode = TININESS_AFTER_ROUNDING;
|
|
}
|
|
else if ( strcmp( argPtr, "all1" ) == 0 ) {
|
|
functionArgument = TRUE;
|
|
functionCode = 0;
|
|
operands = 1;
|
|
}
|
|
else if ( strcmp( argPtr, "all2" ) == 0 ) {
|
|
functionArgument = TRUE;
|
|
functionCode = 0;
|
|
operands = 2;
|
|
}
|
|
else if ( strcmp( argPtr, "all" ) == 0 ) {
|
|
functionArgument = TRUE;
|
|
functionCode = 0;
|
|
operands = 0;
|
|
}
|
|
else {
|
|
for ( functionCode = 1;
|
|
functionCode < NUM_FUNCTIONS;
|
|
++functionCode
|
|
) {
|
|
if ( strcmp( argPtr, functions[ functionCode ].name ) == 0 ) {
|
|
break;
|
|
}
|
|
}
|
|
if ( functionCode == NUM_FUNCTIONS ) {
|
|
fail( "Invalid option or function `%s'", argv[ 0 ] );
|
|
}
|
|
functionArgument = TRUE;
|
|
}
|
|
--argc;
|
|
++argv;
|
|
}
|
|
if ( ! functionArgument ) fail( "Function argument required" );
|
|
if ( functionCode ) {
|
|
timeFunction(
|
|
functionCode, roundingPrecision, roundingMode, tininessMode );
|
|
}
|
|
else if ( operands == 1 ) {
|
|
for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode
|
|
) {
|
|
if ( functions[ functionCode ].numInputs == 1 ) {
|
|
timeFunction(
|
|
functionCode, roundingPrecision, roundingMode, tininessMode
|
|
);
|
|
}
|
|
}
|
|
}
|
|
else if ( operands == 2 ) {
|
|
for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode
|
|
) {
|
|
if ( functions[ functionCode ].numInputs == 2 ) {
|
|
timeFunction(
|
|
functionCode, roundingPrecision, roundingMode, tininessMode
|
|
);
|
|
}
|
|
}
|
|
}
|
|
else {
|
|
for ( functionCode = 1; functionCode < NUM_FUNCTIONS; ++functionCode
|
|
) {
|
|
timeFunction(
|
|
functionCode, roundingPrecision, roundingMode, tininessMode );
|
|
}
|
|
}
|
|
return EXIT_SUCCESS;
|
|
|
|
}
|
|
|