?? s_nextafterf.s

?? glibc 庫, 不僅可以學習使用庫函數,還可以學習函數的具體實現,是提高功力的好資料
?? S
字號:
.file "nextafterf.s"// Copyright (c) 2000 - 2004, Intel Corporation// All rights reserved.//// Contributed 2000 by the Intel Numerics Group, Intel Corporation//// Redistribution and use in source and binary forms, with or without// modification, are permitted provided that the following conditions are// met://// * Redistributions of source code must retain the above copyright// notice, this list of conditions and the following disclaimer.//// * Redistributions in binary form must reproduce the above copyright// notice, this list of conditions and the following disclaimer in the// documentation and/or other materials provided with the distribution.//// * The name of Intel Corporation may not be used to endorse or promote// products derived from this software without specific prior written// permission.// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL INTEL OR ITS // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY // OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY OR TORT (INCLUDING// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. // // Intel Corporation is the author of this code, and requests that all// problem reports or change requests be submitted to it directly at // http://www.intel.com/software/products/opensource/libraries/num.htm.//// History//==============================================================// 02/02/00 Initial version // 03/03/00 Modified to conform to C9X, and improve speed of main path// 03/14/00 Fixed case where x is a power of 2, and x > y, improved speed// 04/04/00 Unwind support added// 05/12/00 Fixed erroneous denormal flag setting for exponent change cases 1,3// 08/15/00 Bundle added after call to __libm_error_support to properly//          set [the previously overwritten] GR_Parameter_RESULT.// 09/09/00 Updated fcmp so that qnans do not raise invalid// 12/15/00 Corrected behavior when both args are zero to conform to C99, and//          fixed flag settings for several cases// 05/20/02 Cleaned up namespace and sf0 syntax// 02/10/03 Reordered header: .section, .global, .proc, .align// 12/14/04 Added error handling on underflow.//// API//==============================================================// float nextafterf( float x, float y );// input  floating point f8, f9// output floating point f8//// Registers used//==============================================================GR_max_pexp     = r14GR_min_pexp     = r15GR_exp          = r16GR_sig          = r17GR_lnorm_sig    = r18GR_sign_mask    = r19GR_exp_mask     = r20GR_sden_sig     = r21GR_new_sig      = r22GR_new_exp      = r23GR_lden_sig     = r24GR_snorm_sig    = r25GR_exp1         = r26GR_x_exp        = r27GR_min_den_rexp = r28// r36-39 parameters for libm_error_supportGR_SAVE_B0                = r34GR_SAVE_GP                = r35GR_SAVE_PFS               = r32GR_Parameter_X            = r36GR_Parameter_Y            = r37GR_Parameter_RESULT       = r38GR_Parameter_TAG          = r39FR_lnorm_sig       = f10FR_lnorm_exp       = f11FR_lnorm           = f12FR_sden_sig        = f13FR_sden_exp        = f14FR_sden            = f15FR_save_f8         = f33FR_new_exp         = f34FR_new_sig         = f35FR_lden_sig        = f36FR_snorm_sig       = f37FR_exp1            = f38FR_tmp             = f39//// Overview of operation//==============================================================// nextafterf determines the next representable value // after x in the direction of y. .section .textGLOBAL_LIBM_ENTRY(nextafterf)// Extract signexp from x// Form smallest denormal significand = ulp size{ .mlx      getf.exp GR_exp      = f8      movl GR_sden_sig = 0x0000010000000000}// Form largest normal exponent// Is x < y ?  p10 if yes, p11 if no// Form smallest normal exponent{ .mfi      addl GR_max_pexp = 0x1007e, r0      fcmp.lt.s1 p10,p11 = f8, f9      addl GR_min_pexp = 0x0ff81, r0 ;;}// Is x=y?{ .mfi      getf.sig GR_sig      = f8      fcmp.eq.s0 p6,p0 = f8, f9      nop.i 0}// Extract significand from x// Form largest normal significand{ .mlx      nop.m 0       movl GR_lnorm_sig = 0xffffff0000000000 ;;}// Move largest normal significand to fp reg for special cases{ .mfi      setf.sig FR_lnorm_sig = GR_lnorm_sig      nop.f 0       addl GR_sign_mask = 0x20000, r0 ;;}// Move smallest denormal significand and signexp to fp regs// Is x=nan?// Set p12 and p13 based on whether significand increases or decreases// It increases (p12 set) if x<y and x>=0 or if x>y and x<0// It decreases (p13 set) if x<y and x<0  or if x>y and x>=0{ .mfi      setf.sig FR_sden_sig = GR_sden_sig      fclass.m  p8,p0 = f8, 0xc3           (p10) cmp.lt p12,p13 = GR_exp, GR_sign_mask}{ .mfi      setf.exp FR_sden_exp = GR_min_pexp      nop.f 999(p11) cmp.ge p12,p13 = GR_exp, GR_sign_mask ;;}.pred.rel "mutex",p12,p13// Form expected new significand, adding or subtracting 1 ulp increment// If x=y set result to y// Form smallest normal significand and largest denormal significand{ .mfi(p12) add GR_new_sig = GR_sig, GR_sden_sig(p6)  fmerge.s f8=f9,f9      dep.z GR_snorm_sig = 1,63,1 // 0x8000000000000000}{ .mlx(p13) sub GR_new_sig = GR_sig, GR_sden_sig      movl GR_lden_sig = 0x7fffff0000000000 ;;}// Move expected result significand and signexp to fp regs// Is y=nan?// Form new exponent in case result exponent needs incrementing or decrementing{ .mfi      setf.exp FR_new_exp = GR_exp      fclass.m  p9,p0 = f9, 0xc3           (p12) add GR_exp1 = 1, GR_exp}{ .mib      setf.sig FR_new_sig = GR_new_sig(p13) add GR_exp1 = -1, GR_exp(p6)  br.ret.spnt    b0 ;;             // Exit if x=y}// Move largest normal signexp to fp reg for special cases// Is x=zero?{ .mfi      setf.exp FR_lnorm_exp = GR_max_pexp      fclass.m  p7,p0 = f8, 0x7      nop.i 999}{ .mfb      nop.m 999(p8)  fma.s0 f8 = f8,f1,f9                     (p8)  br.ret.spnt    b0 ;;             // Exit if x=nan}// Move exp+-1 and smallest normal significand to fp regs for special cases// Is x=inf?{ .mfi      setf.exp FR_exp1 = GR_exp1      fclass.m  p6,p0 = f8, 0x23                 addl GR_exp_mask = 0x1ffff, r0}{ .mfb      setf.sig FR_snorm_sig = GR_snorm_sig(p9)  fma.s0 f8 = f8,f1,f9                     (p9)  br.ret.spnt    b0 ;;             // Exit if y=nan}// Move largest denormal significand to fp regs for special cases// Save x{ .mfb      setf.sig FR_lden_sig = GR_lden_sig      mov FR_save_f8 = f8(p7)  br.cond.spnt NEXT_ZERO ;;   // Exit if x=0   }// Mask off the sign to get x_exp{ .mfb      and GR_x_exp = GR_exp_mask, GR_exp      nop.f 999(p6)  br.cond.spnt NEXT_INF ;;   // Exit if x=inf   }// Check 6 special cases when significand rolls over://  1 sig size incr, x_sig=max_sig, x_exp < max_exp//     Set p6, result is sig=min_sig, exp++//  2 sig size incr, x_sig=max_sig, x_exp >= max_exp//     Set p7, result is inf, signal overflow//  3 sig size decr, x_sig=min_sig, x_exp > min_exp//     Set p8, result is sig=max_sig, exp--//  4 sig size decr, x_sig=min_sig, x_exp = min_exp//     Set p9, result is sig=max_den_sig, exp same, signal underflow and inexact//  5 sig size decr, x_sig=min_den_sig, x_exp = min_exp//     Set p10, result is zero, sign of x, signal underflow and inexact//  6 sig size decr, x_sig=min_sig, x_exp < min_exp //     Set p14, result is zero, sign of x, signal underflow and inexact//// Form exponent of smallest float denormal (if normalized register format){ .mmi      adds GR_min_den_rexp = -23, GR_min_pexp(p12) cmp.eq.unc p6,p0 = GR_new_sig, r0(p13) cmp.eq.unc p8,p10 = GR_new_sig, GR_lden_sig ;;}{ .mmi(p6)  cmp.lt.unc p6,p7 = GR_x_exp, GR_max_pexp(p8)  cmp.gt.unc p8,p9 = GR_x_exp, GR_min_pexp(p10) cmp.eq.unc p10,p0 = GR_new_sig, r0 ;;}// Create small normal in case need to generate underflow flag{ .mfi(p10) cmp.le.unc p10,p0 = GR_x_exp, GR_min_pexp      fmerge.se FR_tmp = FR_sden_exp, FR_lnorm_sig(p9)  cmp.gt.unc p9,p14 = GR_x_exp, GR_min_den_rexp}// Branch if cases 1, 2, 3{ .bbb(p6)  br.cond.spnt NEXT_EXPUP(p7)  br.cond.spnt NEXT_OVERFLOW(p8)  br.cond.spnt NEXT_EXPDOWN ;;}// Branch if cases 4, 5, 6{ .bbb(p9)  br.cond.spnt NEXT_NORM_TO_DENORM(p10) br.cond.spnt NEXT_UNDERFLOW_TO_ZERO(p14) br.cond.spnt NEXT_UNDERFLOW_TO_ZERO ;;}// Here if no special cases// Set p6 if result will be a denormal, so can force underflow flag//    Case 1:  x_exp=min_exp, x_sig=unnormalized//    Case 2:  x_exp<min_exp{ .mfi      cmp.lt p6,p7 = GR_x_exp, GR_min_pexp      fmerge.se f8 = FR_new_exp, FR_new_sig      nop.i 999 ;;}{ .mfi      nop.m 999      nop.f 999(p7)  tbit.z p6,p0 = GR_new_sig, 63 ;;}NEXT_COMMON_FINISH:// Force underflow and inexact if denormal result{ .mfi      nop.m 999(p6)  fma.s.s0 FR_tmp = FR_tmp,FR_tmp,f0      nop.i 999}{ .mfb      nop.m 999      fnorm.s.s0 f8 = f8 // Final normalization to result precision(p6)  br.cond.spnt NEXT_UNDERFLOW ;;}{ .mfb      nop.m 999      nop.f 999      br.ret.sptk b0;;}//Special casesNEXT_EXPUP:{ .mfb      cmp.lt p6,p7 = GR_x_exp, GR_min_pexp      fmerge.se f8 = FR_exp1, FR_snorm_sig      br.cond.sptk NEXT_COMMON_FINISH ;;}NEXT_EXPDOWN:{ .mfb      cmp.lt p6,p7 = GR_x_exp, GR_min_pexp      fmerge.se f8 = FR_exp1, FR_lnorm_sig      br.cond.sptk NEXT_COMMON_FINISH ;;}NEXT_NORM_TO_DENORM:{ .mfi      nop.m 999      fmerge.se f8 = FR_new_exp, FR_lden_sig      nop.i 999}// Force underflow and inexact{ .mfb      nop.m 999      fma.s.s0 FR_tmp = FR_tmp,FR_tmp,f0      br.cond.sptk NEXT_UNDERFLOW ;;}NEXT_UNDERFLOW_TO_ZERO:{ .mfb      cmp.eq p6,p0 = r0,r0      fmerge.s f8 = FR_save_f8,f0      br.cond.sptk NEXT_COMMON_FINISH ;;}NEXT_INF: // Here if f8 is +- infinity// INF// if f8 is +inf, no matter what y is return  largest float// if f8 is -inf, no matter what y is return -largest float{ .mfi      nop.m 999      fmerge.se FR_lnorm = FR_lnorm_exp,FR_lnorm_sig      nop.i 999 ;;}{ .mfb      nop.m 999      fmerge.s f8 = f8,FR_lnorm                      br.ret.sptk    b0 ;;                        }NEXT_ZERO: // Here if f8 is +- zero// ZERO// if f8 is zero and y is +, return + smallest float denormal // if f8 is zero and y is -, return - smallest float denormal { .mfi      nop.m 999      fmerge.se FR_sden = FR_sden_exp,FR_sden_sig      nop.i 999 ;;}// Create small normal to generate underflow flag{ .mfi      nop.m 999      fmerge.se FR_tmp = FR_sden_exp, FR_lnorm_sig      nop.i 999 ;;}// Add correct sign from direction arg{ .mfi      nop.m 999      fmerge.s f8 = f9,FR_sden                      nop.i 999 ;;}// Force underflow and inexact flags{ .mfb      nop.m 999      fma.s.s0 FR_tmp = FR_tmp,FR_tmp,f0      br.cond.sptk NEXT_UNDERFLOW ;;}NEXT_UNDERFLOW: // Here if result is a denorm, or input is finite and result is zero// Call error support to report possible range error{ .mib      alloc          r32=ar.pfs,2,2,4,0      mov           GR_Parameter_TAG = 269      // Error code      br.cond.sptk  __libm_error_region    // Branch to error call};;NEXT_OVERFLOW: // Here if input is finite, but result will be infinite// Use frcpa to generate infinity of correct sign// Call error support to report possible range error{ .mfi      alloc          r32=ar.pfs,2,2,4,0      frcpa.s1 f8,p6 = FR_save_f8, f0      nop.i 999 ;;}// Create largest double{ .mfi      nop.m 999      fmerge.se FR_lnorm = FR_lnorm_exp,FR_lnorm_sig      nop.i 999 ;;}// Force overflow and inexact flags to be set{ .mfb      mov           GR_Parameter_TAG = 155      // Error code      fma.s.s0 FR_tmp = FR_lnorm,FR_lnorm,f0      br.cond.sptk  __libm_error_region    // Branch to error call};;GLOBAL_LIBM_END(nextafterf)LOCAL_LIBM_ENTRY(__libm_error_region).prologue// (1){ .mfi        add   GR_Parameter_Y=-32,sp             // Parameter 2 value        nop.f 0.save   ar.pfs,GR_SAVE_PFS        mov  GR_SAVE_PFS=ar.pfs                 // Save ar.pfs}{ .mfi.fframe 64        add sp=-64,sp                          // Create new stack        nop.f 0        mov GR_SAVE_GP=gp                      // Save gp};;// (2){ .mmi        stfs [GR_Parameter_Y] = f9,16         // STORE Parameter 2 on stack        add GR_Parameter_X = 16,sp            // Parameter 1 address.save   b0, GR_SAVE_B0        mov GR_SAVE_B0=b0                     // Save b0};;.body// (3){ .mib        stfs [GR_Parameter_X] = FR_save_f8              // STORE Parameter 1 on stack        add   GR_Parameter_RESULT = 0,GR_Parameter_Y           // Parameter 3 address        nop.b 0                                }{ .mib        stfs [GR_Parameter_Y] = f8              // STORE Parameter 3 on stack        add   GR_Parameter_Y = -16,GR_Parameter_Y        br.call.sptk b0=__libm_error_support#   // Call error handling function};;{ .mmi        nop.m 0        nop.m 0        add   GR_Parameter_RESULT = 48,sp};;// (4){ .mmi        ldfs  f8 = [GR_Parameter_RESULT]       // Get return result off stack.restore sp        add   sp = 64,sp                       // Restore stack pointer        mov   b0 = GR_SAVE_B0                  // Restore return address};;{ .mib        mov   gp = GR_SAVE_GP                  // Restore gp        mov   ar.pfs = GR_SAVE_PFS             // Restore ar.pfs        br.ret.sptk     b0                     // Return};;LOCAL_LIBM_END(__libm_error_region).type   __libm_error_support#,@function.global __libm_error_support#
?? 文件大小 20450 K
?? 上傳用戶 hanyuangu
?? 所屬分類 Linux/Unix編程
??? 相關標簽

#glibc #庫函數 #函數
?? 快捷鍵說明

復制代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號 Ctrl + =
減小字號 Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

?? s_nextafterf.s

?? 快捷鍵說明