Path: blob/main/lib/libc/softfloat/templates/softfloat.h
39534 views
1/*2===============================================================================34This C header file is part of the SoftFloat IEC/IEEE Floating-point5Arithmetic Package, Release 2a.67Written by John R. Hauser. This work was made possible in part by the8International Computer Science Institute, located at Suite 600, 1947 Center9Street, Berkeley, California 94704. Funding was partially provided by the10National Science Foundation under grant MIP-9311980. The original version11of this code was written as part of a project to build a fixed-point vector12processor in collaboration with the University of California at Berkeley,13overseen by Profs. Nelson Morgan and John Wawrzynek. More information14is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/15arithmetic/SoftFloat.html'.1617THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE. Although reasonable effort18has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT19TIMES RESULT IN INCORRECT BEHAVIOR. USE OF THIS SOFTWARE IS RESTRICTED TO20PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY21AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE.2223Derivative works are acceptable, even for commercial purposes, so long as24(1) they include prominent notice that the work is derivative, and (2) they25include prominent notice akin to these four paragraphs for those parts of26this code that are retained.2728===============================================================================29*/3031/*32-------------------------------------------------------------------------------33The macro `FLOATX80' must be defined to enable the extended double-precision34floating-point format `floatx80'. If this macro is not defined, the35`floatx80' type will not be defined, and none of the functions that either36input or output the `floatx80' type will be defined. The same applies to37the `FLOAT128' macro and the quadruple-precision format `float128'.38-------------------------------------------------------------------------------39*/40#define FLOATX8041#define FLOAT1284243/*44-------------------------------------------------------------------------------45Software IEC/IEEE floating-point types.46-------------------------------------------------------------------------------47*/48typedef !!!bits32 float32;49typedef !!!bits64 float64;50#ifdef FLOATX8051typedef struct {52!!!bits16 high;53!!!bits64 low;54} floatx80;55#endif56#ifdef FLOAT12857typedef struct {58!!!bits64 high, low;59} float128;60#endif6162/*63-------------------------------------------------------------------------------64Software IEC/IEEE floating-point underflow tininess-detection mode.65-------------------------------------------------------------------------------66*/67extern !!!int8 float_detect_tininess;68enum {69float_tininess_after_rounding = 0,70float_tininess_before_rounding = 171};7273/*74-------------------------------------------------------------------------------75Software IEC/IEEE floating-point rounding mode.76-------------------------------------------------------------------------------77*/78extern !!!int8 float_rounding_mode;79enum {80float_round_nearest_even = 0,81float_round_to_zero = 1,82float_round_down = 2,83float_round_up = 384};8586/*87-------------------------------------------------------------------------------88Software IEC/IEEE floating-point exception flags.89-------------------------------------------------------------------------------90*/91extern !!!int8 float_exception_flags;92enum {93float_flag_inexact = 1,94float_flag_underflow = 2,95float_flag_overflow = 4,96float_flag_divbyzero = 8,97float_flag_invalid = 1698};99100/*101-------------------------------------------------------------------------------102Routine to raise any or all of the software IEC/IEEE floating-point103exception flags.104-------------------------------------------------------------------------------105*/106void float_raise( !!!int8 );107108/*109-------------------------------------------------------------------------------110Software IEC/IEEE integer-to-floating-point conversion routines.111-------------------------------------------------------------------------------112*/113float32 int32_to_float32( !!!int32 );114float64 int32_to_float64( !!!int32 );115#ifdef FLOATX80116floatx80 int32_to_floatx80( !!!int32 );117#endif118#ifdef FLOAT128119float128 int32_to_float128( !!!int32 );120#endif121float32 int64_to_float32( !!!int64 );122float64 int64_to_float64( !!!int64 );123#ifdef FLOATX80124floatx80 int64_to_floatx80( !!!int64 );125#endif126#ifdef FLOAT128127float128 int64_to_float128( !!!int64 );128#endif129130/*131-------------------------------------------------------------------------------132Software IEC/IEEE single-precision conversion routines.133-------------------------------------------------------------------------------134*/135!!!int32 float32_to_int32( float32 );136!!!int32 float32_to_int32_round_to_zero( float32 );137!!!int64 float32_to_int64( float32 );138!!!int64 float32_to_int64_round_to_zero( float32 );139float64 float32_to_float64( float32 );140#ifdef FLOATX80141floatx80 float32_to_floatx80( float32 );142#endif143#ifdef FLOAT128144float128 float32_to_float128( float32 );145#endif146147/*148-------------------------------------------------------------------------------149Software IEC/IEEE single-precision operations.150-------------------------------------------------------------------------------151*/152float32 float32_round_to_int( float32 );153float32 float32_add( float32, float32 );154float32 float32_sub( float32, float32 );155float32 float32_mul( float32, float32 );156float32 float32_div( float32, float32 );157float32 float32_rem( float32, float32 );158float32 float32_sqrt( float32 );159!!!flag float32_eq( float32, float32 );160!!!flag float32_le( float32, float32 );161!!!flag float32_lt( float32, float32 );162!!!flag float32_eq_signaling( float32, float32 );163!!!flag float32_le_quiet( float32, float32 );164!!!flag float32_lt_quiet( float32, float32 );165!!!flag float32_is_signaling_nan( float32 );166167/*168-------------------------------------------------------------------------------169Software IEC/IEEE double-precision conversion routines.170-------------------------------------------------------------------------------171*/172!!!int32 float64_to_int32( float64 );173!!!int32 float64_to_int32_round_to_zero( float64 );174!!!int64 float64_to_int64( float64 );175!!!int64 float64_to_int64_round_to_zero( float64 );176float32 float64_to_float32( float64 );177#ifdef FLOATX80178floatx80 float64_to_floatx80( float64 );179#endif180#ifdef FLOAT128181float128 float64_to_float128( float64 );182#endif183184/*185-------------------------------------------------------------------------------186Software IEC/IEEE double-precision operations.187-------------------------------------------------------------------------------188*/189float64 float64_round_to_int( float64 );190float64 float64_add( float64, float64 );191float64 float64_sub( float64, float64 );192float64 float64_mul( float64, float64 );193float64 float64_div( float64, float64 );194float64 float64_rem( float64, float64 );195float64 float64_sqrt( float64 );196!!!flag float64_eq( float64, float64 );197!!!flag float64_le( float64, float64 );198!!!flag float64_lt( float64, float64 );199!!!flag float64_eq_signaling( float64, float64 );200!!!flag float64_le_quiet( float64, float64 );201!!!flag float64_lt_quiet( float64, float64 );202!!!flag float64_is_signaling_nan( float64 );203204#ifdef FLOATX80205206/*207-------------------------------------------------------------------------------208Software IEC/IEEE extended double-precision conversion routines.209-------------------------------------------------------------------------------210*/211!!!int32 floatx80_to_int32( floatx80 );212!!!int32 floatx80_to_int32_round_to_zero( floatx80 );213!!!int64 floatx80_to_int64( floatx80 );214!!!int64 floatx80_to_int64_round_to_zero( floatx80 );215float32 floatx80_to_float32( floatx80 );216float64 floatx80_to_float64( floatx80 );217#ifdef FLOAT128218float128 floatx80_to_float128( floatx80 );219#endif220221/*222-------------------------------------------------------------------------------223Software IEC/IEEE extended double-precision rounding precision. Valid224values are 32, 64, and 80.225-------------------------------------------------------------------------------226*/227extern !!!int8 floatx80_rounding_precision;228229/*230-------------------------------------------------------------------------------231Software IEC/IEEE extended double-precision operations.232-------------------------------------------------------------------------------233*/234floatx80 floatx80_round_to_int( floatx80 );235floatx80 floatx80_add( floatx80, floatx80 );236floatx80 floatx80_sub( floatx80, floatx80 );237floatx80 floatx80_mul( floatx80, floatx80 );238floatx80 floatx80_div( floatx80, floatx80 );239floatx80 floatx80_rem( floatx80, floatx80 );240floatx80 floatx80_sqrt( floatx80 );241!!!flag floatx80_eq( floatx80, floatx80 );242!!!flag floatx80_le( floatx80, floatx80 );243!!!flag floatx80_lt( floatx80, floatx80 );244!!!flag floatx80_eq_signaling( floatx80, floatx80 );245!!!flag floatx80_le_quiet( floatx80, floatx80 );246!!!flag floatx80_lt_quiet( floatx80, floatx80 );247!!!flag floatx80_is_signaling_nan( floatx80 );248249#endif250251#ifdef FLOAT128252253/*254-------------------------------------------------------------------------------255Software IEC/IEEE quadruple-precision conversion routines.256-------------------------------------------------------------------------------257*/258!!!int32 float128_to_int32( float128 );259!!!int32 float128_to_int32_round_to_zero( float128 );260!!!int64 float128_to_int64( float128 );261!!!int64 float128_to_int64_round_to_zero( float128 );262float32 float128_to_float32( float128 );263float64 float128_to_float64( float128 );264#ifdef FLOATX80265floatx80 float128_to_floatx80( float128 );266#endif267268/*269-------------------------------------------------------------------------------270Software IEC/IEEE quadruple-precision operations.271-------------------------------------------------------------------------------272*/273float128 float128_round_to_int( float128 );274float128 float128_add( float128, float128 );275float128 float128_sub( float128, float128 );276float128 float128_mul( float128, float128 );277float128 float128_div( float128, float128 );278float128 float128_rem( float128, float128 );279float128 float128_sqrt( float128 );280!!!flag float128_eq( float128, float128 );281!!!flag float128_le( float128, float128 );282!!!flag float128_lt( float128, float128 );283!!!flag float128_eq_signaling( float128, float128 );284!!!flag float128_le_quiet( float128, float128 );285!!!flag float128_lt_quiet( float128, float128 );286!!!flag float128_is_signaling_nan( float128 );287288#endif289290291292