diff options
Diffstat (limited to 'sysdeps/ia64/fpu/e_log2f.S')
-rw-r--r-- | sysdeps/ia64/fpu/e_log2f.S | 551 |
1 files changed, 0 insertions, 551 deletions
diff --git a/sysdeps/ia64/fpu/e_log2f.S b/sysdeps/ia64/fpu/e_log2f.S deleted file mode 100644 index 17d710a951..0000000000 --- a/sysdeps/ia64/fpu/e_log2f.S +++ /dev/null @@ -1,551 +0,0 @@ -.file "log2f.s" - - -// Copyright (c) 2000 - 2003, Intel Corporation -// All rights reserved. -// -// Contributed 2000 by the Intel Numerics Group, Intel Corporation -// -// Redistribution and use in source and binary forms, with or without -// modification, are permitted provided that the following conditions are -// met: -// -// * Redistributions of source code must retain the above copyright -// notice, this list of conditions and the following disclaimer. -// -// * Redistributions in binary form must reproduce the above copyright -// notice, this list of conditions and the following disclaimer in the -// documentation and/or other materials provided with the distribution. -// -// * The name of Intel Corporation may not be used to endorse or promote -// products derived from this software without specific prior written -// permission. - -// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS -// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT -// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR -// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL INTEL OR ITS -// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, -// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, -// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR -// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY -// OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY OR TORT (INCLUDING -// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS -// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. -// -// Intel Corporation is the author of this code, and requests that all -// problem reports or change requests be submitted to it directly at -// http://www.intel.com/software/products/opensource/libraries/num.htm. -// -// History -//============================================================== -// 09/11/00 Initial version -// 05/20/02 Cleaned up namespace and sf0 syntax -// 02/10/03 Reordered header: .section, .global, .proc, .align -// -// API -//============================================================== -// float log2f(float) -// -// Overview of operation -//============================================================== -// Background -// -// Implementation -// -// Let x = 2^l * m, where m=1.b1 b2 ... b8 b9 ... b52 -// y=frcpa(m), r=m*y-1, f=b1 b2 .. b8 (table index) -// j=0 if f<128; j=1 if f>=128 -// T is a table that stores log2(1/y) (in entries 1..255) rounded to -// double extended precision; f is used as an index; T[255]=0 -// -// If f=0 and b9=0, r is set to 2^{-8}* 0.b9 b10 ... b52 = m-1 (fractional part of m), -// and 0 is used instead of T[0] -// (polynomial evaluation only, for m=1+r, 0<=r<2^{-9}) -// If f=255, r is set to (m-2)/2 (T[255]=0, and only polynomial evaluation is used -// for m=2(1-r'), 0<=r'<2^{-9}) -// -// log2f(x) is approximated as -// (l-j) + T[f] + (c1*r+c2*r^2+...+c6*r^6), if f>0 -// - - -// Special values -//============================================================== -// log2f(0)=-inf, raises Divide by Zero -// log2f(+inf)=inf -// log2f(x)=NaN, raises Invalid if x<0 -// - - -// Registers used -//============================================================== -// f6-f14 -// r2-r3, r23-r30 -// p6,p7,p8,p12 -// - - -GR_SAVE_B0 = r33 -GR_SAVE_PFS = r34 -GR_SAVE_GP = r35 // This reg. can safely be used -GR_SAVE_SP = r36 - -GR_Parameter_X = r37 -GR_Parameter_Y = r38 -GR_Parameter_RESULT = r39 -GR_Parameter_TAG = r40 - -FR_X = f10 -FR_Y = f1 -FR_RESULT = f8 - - - - -// Data tables -//============================================================== - -RODATA - -.align 16 - -LOCAL_OBJECT_START(poly_coeffs) - -data8 0x3fdec709dc3a03fd, 0xbfd71547652b82fe //C_3 and C_4 -data8 0xb8aa3b295c17f0bc, 0x00003fff // C_1 -data8 0xb8aa3b295c17f0bc, 0x0000bffe // C_2 -LOCAL_OBJECT_END(poly_coeffs) - - -LOCAL_OBJECT_START(T_table) - -data8 0x3f671b0ea42e5fda, 0x3f815cfe8eaec830 -data8 0x3f8cfee70c5ce5dc, 0x3f94564a62192834 -data8 0x3f997723ace35766, 0x3f9f5923c69b54a1 -data8 0x3fa2a094a085d693, 0x3fa538941776b01e -data8 0x3fa8324c9b914bc7, 0x3faacf54ce07d7e9 -data8 0x3fadced958dadc12, 0x3fb0387efbca869e -data8 0x3fb18ac6067479c0, 0x3fb30edd3e13530d -data8 0x3fb463c15936464e, 0x3fb5b9e13c3fa21d -data8 0x3fb7113f3259e07a, 0x3fb869dd8d1b2035 -data8 0x3fb9c3bea49d3214, 0x3fbb1ee4d7961701 -data8 0x3fbc7b528b70f1c5, 0x3fbdd90a2c676ed4 -data8 0x3fbf05d4976c2028, 0x3fc032fbbaee6d65 -data8 0x3fc0e3b5a9f3284a, 0x3fc195195c7d125b -data8 0x3fc22dadc2ab3497, 0x3fc2e050231df57d -data8 0x3fc379f79c2b255b, 0x3fc42ddd2ba1b4a9 -data8 0x3fc4c89b9e6807f5, 0x3fc563dc29ffacb2 -data8 0x3fc619a25f5d798d, 0x3fc6b5ffbf367644 -data8 0x3fc752e1f660f8d6, 0x3fc7f049e753e7cf -data8 0x3fc8a8980abfbd32, 0x3fc94724cca657be -data8 0x3fc9e63a24971f46, 0x3fca85d8feb202f7 -data8 0x3fcb2602497d5346, 0x3fcbc6b6f5ee1c9b -data8 0x3fcc67f7f770a67e, 0x3fcceec4b2234fba -data8 0x3fcd91097ad13982, 0x3fce33dd57f3d335 -data8 0x3fced74146bc7b10, 0x3fcf7b3646fef683 -data8 0x3fd00223a943dc19, 0x3fd054a474bf0eb7 -data8 0x3fd0999d9b9259a1, 0x3fd0eca66d3b2581 -data8 0x3fd13ffa2e85b475, 0x3fd185a444fa0a7b -data8 0x3fd1cb8312f27eff, 0x3fd21fa1441ce5e8 -data8 0x3fd265f526e603cb, 0x3fd2baa0c34be1ec -data8 0x3fd3016b45de21ce, 0x3fd3486c38aa29a8 -data8 0x3fd38fa3efaa8262, 0x3fd3e562c0816a02 -data8 0x3fd42d141f53b646, 0x3fd474fd543f222c -data8 0x3fd4bd1eb680e548, 0x3fd505789e234bd1 -data8 0x3fd54e0b64003b70, 0x3fd596d761c3c1f0 -data8 0x3fd5dfdcf1eeae0e, 0x3fd6291c6fd9329c -data8 0x3fd6729637b59418, 0x3fd6bc4aa692e0fd -data8 0x3fd7063a1a5fb4f2, 0x3fd75064f1ed0715 -data8 0x3fd79acb8cf10390, 0x3fd7d67c1e43ae5c -data8 0x3fd8214f4068afa7, 0x3fd86c5f36dea3dc -data8 0x3fd8b7ac64dd7f9d, 0x3fd8f4167a0c6f92 -data8 0x3fd93fd2d5e1bf1d, 0x3fd98bcd84296946 -data8 0x3fd9c8c333e6e9a5, 0x3fda152f142981b4 -data8 0x3fda527fd95fd8ff, 0x3fda9f5e3edeb9e6 -data8 0x3fdadd0b2b5755a7, 0x3fdb2a5d6f51ff83 -data8 0x3fdb686799b00be3, 0x3fdbb62f1b887cd8 -data8 0x3fdbf4979f666668, 0x3fdc332a6e8399d4 -data8 0x3fdc819dc2d45fe4, 0x3fdcc0908e19b7bd -data8 0x3fdcffae611ad12b, 0x3fdd3ef776d43ff4 -data8 0x3fdd8e5002710128, 0x3fddcdfb486cb9a1 -data8 0x3fde0dd294245fe4, 0x3fde4dd622a28840 -data8 0x3fde8e06317114f0, 0x3fdece62fe9a9915 -data8 0x3fdf1f164a15389a, 0x3fdf5fd8a9063e35 -data8 0x3fdfa0c8937e7d5d, 0x3fdfe1e649bb6335 -data8 0x3fe011990641535a, 0x3fe032560e91e59e -data8 0x3fe0532a5ebcd44a, 0x3fe0741617f5fc28 -data8 0x3fe08cd653f38839, 0x3fe0adeb55c1103b -data8 0x3fe0cf181d5d1dd0, 0x3fe0f05ccd0aced7 -data8 0x3fe111b9875788ab, 0x3fe1332e6f1bcf73 -data8 0x3fe154bba77c2088, 0x3fe16df59bfa06c1 -data8 0x3fe18fadb6e2d3c2, 0x3fe1b17e849adc26 -data8 0x3fe1caeb6a0de814, 0x3fe1ece7c830eec9 -data8 0x3fe20efd3dae01df, 0x3fe2289de375d901 -data8 0x3fe24adf9b6a6fe0, 0x3fe26d3ad1aebcfc -data8 0x3fe287100c2771f4, 0x3fe2a9983b3c1b28 -data8 0xbfda78e146f7bef4, 0xbfda33760a7f6051 -data8 0xbfd9ff43476fb5f7, 0xbfd9b97c3c4eec8f -data8 0xbfd98504431717fc, 0xbfd93ee07535f967 -data8 0xbfd90a228d5712b2, 0xbfd8c3a104cb24f5 -data8 0xbfd88e9c72e0b226, 0xbfd847bc33d8618e -data8 0xbfd812703988bb69, 0xbfd7dd0569c04bff -data8 0xbfd7959c202292f1, 0xbfd75fe8d2c5d48f -data8 0xbfd72a1637cbc183, 0xbfd6e221cd9d0cde -data8 0xbfd6ac059985503b, 0xbfd675c99ce81f92 -data8 0xbfd63f6db2590482, 0xbfd5f6c138136489 -data8 0xbfd5c01a39fbd688, 0xbfd58952cf519193 -data8 0xbfd5526ad18493ce, 0xbfd51b6219bfe6ea -data8 0xbfd4d1cdf8b4846f, 0xbfd49a784bcd1b8b -data8 0xbfd4630161832547, 0xbfd42b6911cf5465 -data8 0xbfd3f3af3461e1c4, 0xbfd3bbd3a0a1dcfb -data8 0xbfd383d62dac7ae7, 0xbfd34bb6b2546218 -data8 0xbfd313750520f520, 0xbfd2db10fc4d9aaf -data8 0xbfd2a28a6dc90387, 0xbfd269e12f346e2c -data8 0xbfd2311515e2e855, 0xbfd1f825f6d88e13 -data8 0xbfd1bf13a6c9c69f, 0xbfd185ddfa1a7ed0 -data8 0xbfd14c84c4dd6128, 0xbfd11307dad30b76 -data8 0xbfd0d9670f6941fe, 0xbfd09fa235ba2020 -data8 0xbfd0790adbb03009, 0xbfd03f09858c55fb -data8 0xbfd004e3a7c97cbd, 0xbfcf9532288fcf69 -data8 0xbfcf205339208f27, 0xbfceab2a23a5b83e -data8 0xbfce5ce55fdd37a5, 0xbfcde73fe3b1480f -data8 0xbfcd714f44623927, 0xbfccfb1321b8c400 -data8 0xbfccac163c770dc9, 0xbfcc355b67195dd0 -data8 0xbfcbbe540a3f036f, 0xbfcb6ecf175f95e9 -data8 0xbfcaf74751e1be33, 0xbfca7f71fb7bab9d -data8 0xbfca2f632320b86b, 0xbfc9b70ba539dfae -data8 0xbfc93e6587910444, 0xbfc8edcae8352b6c -data8 0xbfc874a0db01a719, 0xbfc7fb27199df16d -data8 0xbfc7a9fec7d05ddf, 0xbfc72fff456ac70d -data8 0xbfc6de7d66023dbc, 0xbfc663f6fac91316 -data8 0xbfc6121ac74813cf, 0xbfc5970c478fff4a -data8 0xbfc51bab907a5c8a, 0xbfc4c93d33151b24 -data8 0xbfc44d527fdadf55, 0xbfc3fa87be0f3a1b -data8 0xbfc3a797cd35d959, 0xbfc32ae9e278ae1a -data8 0xbfc2d79c6937efdd, 0xbfc25a619370d9dc -data8 0xbfc206b5bde2f8b8, 0xbfc188ecbd1d16be -data8 0xbfc134e1b489062e, 0xbfc0b6894488e95f -data8 0xbfc0621e2f556b5c, 0xbfc00d8c711a12cc -data8 0xbfbf1cd21257e18c, 0xbfbe72ec117fa5b2 -data8 0xbfbdc8b7c49a1ddb, 0xbfbcc8d5e467b710 -data8 0xbfbc1ddc9c39c7a1, 0xbfbb7294093cdd0f -data8 0xbfba7111df348494, 0xbfb9c501cdf75872 -data8 0xbfb918a16e46335b, 0xbfb81579a73e83c6 -data8 0xbfb7684f39f4ff2d, 0xbfb6bad3758efd87 -data8 0xbfb60d060d7e41ac, 0xbfb507b836033bb7 -data8 0xbfb4591d6310d85a, 0xbfb3aa2fdd27f1c3 -data8 0xbfb2faef55ccb372, 0xbfb1f3723b4ae6db -data8 0xbfb14360d6136ffa, 0xbfb092fb594145c1 -data8 0xbfafc482e8b48a7e, 0xbfae6265ace11ae4 -data8 0xbfacff9e5c4341d0, 0xbfaaea3316095f72 -data8 0xbfa985bfc3495194, 0xbfa820a01ac754cb -data8 0xbfa6bad3758efd87, 0xbfa554592bb8cd58 -data8 0xbfa3ed3094685a26, 0xbfa2855905ca70f6 -data8 0xbfa11cd1d5133413, 0xbf9dfd78881399f1 -data8 0xbf9b28f618cc85df, 0xbf98530faa3c087b -data8 0xbf957bc3dddcd7fa, 0xbf92a3115322f9e6 -data8 0xbf8f91ed4eef8370, 0xbf89dae4ec6b8b2e -data8 0xbf842106b1499209, 0xbf7cc89f97d67594 -data8 0xbf71497accf7e11d, 0x0000000000000000 -LOCAL_OBJECT_END(T_table) - - -.section .text -GLOBAL_LIBM_ENTRY(log2f) - -{ .mfi - alloc r32=ar.pfs,1,4,4,0 - // y=frcpa(x) - frcpa.s1 f6,p0=f1,f8 - // will form significand of 1.5 (to test whether the index is 128 or above) - mov r24=0xc -} -{.mfi - nop.m 0 - // normalize x - fma.s1 f7=f8,f1,f0 - // r2 = pointer to C_1...C_6 followed by T_table - addl r2 = @ltoff(poly_coeffs), gp;; -} -{.mfi - // get significand - getf.sig r25=f8 - // f8 denormal ? - fclass.m p8,p10=f8,0x9 - // will form significand of 1.5 (to test whether the index is 128 or above) - shl r24=r24,60 -} -{.mfi - mov r26=0x804 - nop.f 0 - // r23=bias-1 - mov r23=0xfffe;; -} - -{.mmf - getf.exp r29=f8 - // load start address for C_1...C_6 followed by T_table - ld8 r2=[r2] - // will continue only for positive normal/denormal numbers - fclass.nm.unc p12,p7 = f8, 0x19 ;; -} - -.pred.rel "mutex",p8,p10 -{.mfi - // denormal input, repeat get significand (after normalization) - (p8) getf.sig r25=f7 - // x=1 ? - fcmp.eq.s0 p6,p0=f8,f1 - // get T_index - (p10) shr.u r28=r25,63-8 -} -{.mfi - // f12=0.5 - setf.exp f12=r23 - nop.f 0 - // r27=bias - mov r27=0xffff;; -} - -{.mfb - // denormal input, repeat get exponent (after normalization) - (p8) getf.exp r29=f7 - nop.f 0 - (p12) br.cond.spnt SPECIAL_log2f -} -{.mfi - cmp.geu p12,p0=r25,r24 - nop.f 0 - mov r23=0xff;; -} - -{.mfi - add r3=32,r2 - // r=1-x*y - fms.s1 f6=f6,f8,f1 - // r26=0x80400...0 (threshold for using polynomial approximation) - shl r26=r26,64-12 -} -{.mfi - // load C_3, C_4 - ldfpd f10,f11=[r2],16 - nop.f 0 - // r27=bias-1 (if index >=128, will add exponent+1) - (p12) mov r27=0xfffe;; -} - -{.mfi - // load C_1 - ldfe f14=[r2],32 - // x=1, return 0 - (p6) fma.s.s0 f8=f0,f0,f0 - (p8) shr.u r28=r25,63-8 -} -{.mib - // load C_2 - ldfe f13=[r3] - // r29=exponent-bias - sub r29=r29,r27 - // x=1, return - (p6) br.ret.spnt b0;; -} - - -{.mfi - // get T_index - and r28=r28,r23 - fmerge.se f7=f1,f7 - // if first 9 bits after leading 1 are all zero, then p8=1 - cmp.ltu p8,p12=r25,r26;; -} -{.mfi - // f8=expon - bias - setf.sig f8=r29 - nop.f 0 - // get T address - shladd r2=r28,3,r2 -} -{.mfi - // first 8 bits after leading 1 are all ones ? - cmp.eq p10,p0=r23,r28 - // if first 8 bits after leading bit are 0, use polynomial approx. only - (p8) fms.s1 f6=f7,f1,f1 - nop.i 0;; -} -{.mfi - //r26=1 - mov r26=1 - // if first 8 bits after leading 1 are all ones, use polynomial approx. only - (p10) fms.s1 f6=f7,f12,f1 - nop.i 0;; -} - -.pred.rel "mutex",p8,p12 -{.mmf - // load T (unless first 9 bits after leading 1 are 0) - (p12) ldfd f12=[r2] - nop.m 0 - // set T=0 (if first 9 bits after leading 1 are 0) - (p8) fma.s1 f12=f0,f0,f0;; -} - -{.mfi - nop.m 0 - // P34=C_3+C_4*r - fma.s1 f10=f11,f6,f10 - // r26=2^{63} - shl r26=r26,63 -} -{.mfi - nop.m 0 - // r2=r*r - fma.s1 f11=f6,f6,f0 - nop.i 0;; -} -{.mfi - // significand of x is 1 ? - cmp.eq p0,p6=r25,r26 - // P12=C_1+C_2*r - fma.s1 f14=f13,f6,f14 - nop.i 0;; -} -{.mfi - nop.m 0 - // normalize additive term (l=exponent of x) - fcvt.xf f8=f8 - // if significand(x)=1, return exponent (l) - nop.i 0;; -} -{.mfi - nop.m 0 - // add T+l - (p6) fma.s1 f8=f8,f1,f12 - nop.i 0 -} -{.mfi - nop.m 0 - // P14=P12+r2*P34 - (p6) fma.s1 f13=f10,f11,f14 - nop.i 0;; -} - -{.mfb - nop.m 0 - // result=T+l+r*P14 - (p6) fma.s.s0 f8=f13,f6,f8 - // return - br.ret.sptk b0;; -} - - -SPECIAL_log2f: -{.mfi - nop.m 0 - // x=+Infinity ? - fclass.m p7,p0=f8,0x21 - nop.i 0;; -} -{.mfi - nop.m 0 - // x=+/-Zero ? - fclass.m p8,p0=f8,0x7 - nop.i 0;; -} -{.mfi - nop.m 0 - // x=-Infinity, -normal, -denormal ? - fclass.m p6,p0=f8,0x3a - nop.i 0;; -} -{.mfb - nop.m 0 - // log2f(+Infinity)=+Infinity - nop.f 0 - (p7) br.ret.spnt b0;; -} -{.mfi - (p8) mov GR_Parameter_TAG = 172 - // log2f(+/-0)=-infinity, raises Divide by Zero - // set f8=-0 - (p8) fmerge.ns f8=f0,f8 - nop.i 0;; -} -{.mfb - nop.m 0 - (p8) frcpa.s0 f8,p0=f1,f8 - (p8) br.cond.sptk __libm_error_region;; -} -{.mfb - (p6) mov GR_Parameter_TAG = 173 - // x<0: return NaN, raise Invalid - (p6) frcpa.s0 f8,p0=f0,f0 - (p6) br.cond.sptk __libm_error_region;; -} - - -{.mfb - nop.m 0 - // Remaining cases: NaNs - fma.s.s0 f8=f8,f1,f0 - br.ret.sptk b0;; -} - -GLOBAL_LIBM_END(log2f) - - -LOCAL_LIBM_ENTRY(__libm_error_region) -.prologue -{ .mfi - add GR_Parameter_Y=-32,sp // Parameter 2 value - nop.f 0 -.save ar.pfs,GR_SAVE_PFS - mov GR_SAVE_PFS=ar.pfs // Save ar.pfs -} -{ .mfi -.fframe 64 - add sp=-64,sp // Create new stack - nop.f 0 - mov GR_SAVE_GP=gp // Save gp -};; -{ .mmi - stfs [GR_Parameter_Y] = FR_Y,16 // STORE Parameter 2 on stack - add GR_Parameter_X = 16,sp // Parameter 1 address -.save b0, GR_SAVE_B0 - mov GR_SAVE_B0=b0 // Save b0 -};; -.body -{ .mib - stfs [GR_Parameter_X] = FR_X // STORE Parameter 1 on stack - add GR_Parameter_RESULT = 0,GR_Parameter_Y // Parameter 3 address - nop.b 0 -} -{ .mib - stfs [GR_Parameter_Y] = FR_RESULT // STORE Parameter 3 on stack - add GR_Parameter_Y = -16,GR_Parameter_Y - br.call.sptk b0=__libm_error_support# // Call error handling function -};; -{ .mmi - nop.m 0 - nop.m 0 - add GR_Parameter_RESULT = 48,sp -};; -{ .mmi - ldfs f8 = [GR_Parameter_RESULT] // Get return result off stack -.restore sp - add sp = 64,sp // Restore stack pointer - mov b0 = GR_SAVE_B0 // Restore return address -};; -{ .mib - mov gp = GR_SAVE_GP // Restore gp - mov ar.pfs = GR_SAVE_PFS // Restore ar.pfs - br.ret.sptk b0 // Return -};; - -LOCAL_LIBM_END(__libm_error_region) -.type __libm_error_support#,@function -.global __libm_error_support# - - - - |