--- ffcall/avcall/avcall-ia64.s +++ ffcall/avcall/avcall-ia64.s 2006-07-21 16:24:20.000000000 +0200 @@ -1,739 +1,822 @@ .file "avcall-ia64.c" - .version "01.01" - .global __divdi3# -.text + .pred.safe_across_calls p1-p5,p16-p63 + .text .align 16 .global __builtin_avcall# .proc __builtin_avcall# __builtin_avcall: - alloc r37 = ar.pfs, 1, 5, 8, 0 - mov r34 = r32 - adds r12 = -16, r12 - mov r33 = r1 - ;; - adds r15 = 40, r34 - adds r12 = -2048, r12 - mov r36 = b0 + .prologue 12, 34 + .save ar.pfs, r35 + alloc r35 = ar.pfs, 1, 5, 8, 0 + .save ar.lc, r37 + mov r37 = ar.lc + mov r36 = r1 + .save rp, r34 + mov r34 = b0 + .body + adds r18 = -2032, r12 + adds r14 = 48, r32 + adds r15 = 56, r32 ;; - ld8 r14 = [r15] - adds r35 = 16, r12 - addl r39 = 8, r0 + ld8 r14 = [r14] ;; - sub r14 = r14, r34 + sub r14 = r14, r15 ;; - adds r38 = -120, r14 - br.call.sptk.many b0 = __divdi3# ;; - adds r15 = 48, r34 - mov r1 = r33 - addl r39 = 8, r0 + shr.u r17 = r14, 3 + adds r14 = 40, r32 + adds r15 = 120, r32 ;; - ld8 r14 = [r15] - sxt4 r33 = r8 + ld8 r14 = [r14] ;; - sub r14 = r14, r34 + sub r14 = r14, r15 ;; - adds r38 = -56, r14 - br.call.sptk.many b0 = __divdi3# ;; - addl r18 = 8, r0 - sxt4 r17 = r8 - ;; - cmp.gt p6, p7 = r33, r18 - (p7) br.cond.dpnt .L97 - adds r23 = 120, r34 - ;; - mov r19 = r23 -.L6: - shl r14 = r18, 3 - ;; - add r16 = r19, r14 - adds r18 = 1, r18 - add r14 = r35, r14 + extr r14 = r14, 3, 32 ;; - ld8 r15 = [r16] - cmp.gt p6, p7 = r33, r18 - adds r14 = -64, r14 + cmp.ge p6, p7 = 8, r14 + (p6) br.cond.dpnt .L2 + adds r16 = 184, r32 + mov r15 = r18 + sub r14 = 8, r14 ;; - st8 [r14] = r15 - (p6) br.cond.dptk .L6 - br .L96 -.L97: - adds r23 = 120, r34 -.L96: - adds r33 = 24, r34 + andcm r14 = -1, r14 + ;; + mov ar.lc = r14 +.L4: + ld8 r14 = [r16], 8 ;; - ld4 r14 = [r33] + st8 [r15] = r14, 8 + br.cloop.sptk.few .L4 +.L2: + adds r14 = 24, r32 + ;; + ld4 r14 = [r14] ;; cmp4.ne p6, p7 = 16, r14 - (p6) br.cond.dptk .L8 - adds r14 = 16, r34 ;; - ld8 r8 = [r14] -.L8: + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r8 = [r14] cmp4.ge p6, p7 = 0, r17 - (p6) br.cond.dptk .L9 - adds r14 = 56, r34 + (p6) br.cond.dpnt .L7 + adds r14 = 56, r32 ;; - cmp4.ge p6, p7 = 1, r17 ldfd f8 = [r14] - (p6) br.cond.dptk .L9 - adds r14 = 64, r34 + cmp4.ge p6, p7 = 1, r17 + (p6) br.cond.dpnt .L7 + adds r14 = 64, r32 ;; - cmp4.ge p6, p7 = 2, r17 ldfd f9 = [r14] - (p6) br.cond.dptk .L9 - adds r14 = 72, r34 + cmp4.ge p6, p7 = 2, r17 + (p6) br.cond.dptk .L7 + adds r14 = 72, r32 ;; - cmp4.ge p6, p7 = 3, r17 ldfd f10 = [r14] - (p6) br.cond.dptk .L9 - adds r14 = 80, r34 + cmp4.ge p6, p7 = 3, r17 + (p6) br.cond.dptk .L7 + adds r14 = 80, r32 ;; - cmp4.ge p6, p7 = 4, r17 ldfd f11 = [r14] - (p6) br.cond.dptk .L9 - adds r14 = 88, r34 + cmp4.ge p6, p7 = 4, r17 + (p6) br.cond.dptk .L7 + adds r14 = 88, r32 ;; - cmp4.ge p6, p7 = 5, r17 ldfd f12 = [r14] - (p6) br.cond.dptk .L9 - adds r14 = 96, r34 + cmp4.ge p6, p7 = 5, r17 + (p6) br.cond.dptk .L7 + adds r14 = 96, r32 ;; - cmp4.ge p6, p7 = 6, r17 ldfd f13 = [r14] - (p6) br.cond.dptk .L9 - adds r14 = 104, r34 + cmp4.ge p6, p7 = 6, r17 + (p6) br.cond.dptk .L7 + adds r14 = 104, r32 ;; - cmp4.ge p6, p7 = 7, r17 ldfd f14 = [r14] - (p6) br.cond.dptk .L9 - adds r14 = 112, r34 + cmp4.ge p6, p7 = 7, r17 ;; - ldfd f15 = [r14] -.L9: - ld4 r14 = [r33] + (p7) adds r14 = 112, r32 ;; - cmp4.ne p6, p7 = 13, r14 - (p6) br.cond.dptk .L17 - ld8 r21 = [r34] - adds r14 = 144, r34 - adds r15 = 152, r34 - ;; - ld8 r22 = [r21], 8 - adds r19 = 128, r34 - adds r20 = 136, r34 - adds r16 = 160, r34 - adds r17 = 168, r34 - adds r18 = 176, r34 - ld8 r41 = [r14] - ld8 r42 = [r15] - ld8 r38 = [r23] - ;; - ld8 r39 = [r19] - ld8 r40 = [r20] - ld8 r43 = [r16] - ld8 r44 = [r17] - ld8 r45 = [r18] - ld8 r1 = [r21] - mov b6 = r22 + (p7) ldfd f15 = [r14] +.L7: + adds r14 = 24, r32 ;; - br.call.sptk.many b0 = b6 ;; - adds r14 = 16, r34 + ld4 r14 = [r14] ;; - ld8 r15 = [r14] + cmp4.ne p6, p7 = 13, r14 + (p6) br.cond.dptk .L16 + adds r14 = 16, r32 ;; - stfs [r15] = f8 + ld8 r33 = [r14] + adds r14 = 120, r32 + adds r15 = 128, r32 + adds r16 = 136, r32 + adds r17 = 144, r32 + adds r18 = 152, r32 + adds r19 = 160, r32 + adds r20 = 168, r32 + adds r21 = 176, r32 + ld8 r22 = [r32] + ;; + ld8 r38 = [r14] + ld8 r39 = [r15] + ld8 r40 = [r16] + ld8 r41 = [r17] + ld8 r42 = [r18] + ld8 r43 = [r19] + ld8 r44 = [r20] + ld8 r45 = [r21] + ld8 r14 = [r22], 8 + ;; + mov b6 = r14 + ld8 r1 = [r22] + br.call.sptk.many b0 = b6 + ;; + mov r1 = r36 + stfs [r33] = f8 br .L18 -.L17: + ;; +.L16: cmp4.ne p6, p7 = 14, r14 (p6) br.cond.dptk .L19 - ld8 r21 = [r34] - adds r14 = 144, r34 - adds r15 = 152, r34 - ;; - ld8 r22 = [r21], 8 - adds r19 = 128, r34 - adds r20 = 136, r34 - adds r16 = 160, r34 - adds r17 = 168, r34 - adds r18 = 176, r34 - ld8 r41 = [r14] - ld8 r42 = [r15] - ld8 r38 = [r23] - ;; - ld8 r39 = [r19] - ld8 r40 = [r20] - ld8 r43 = [r16] - ld8 r44 = [r17] - ld8 r45 = [r18] - ld8 r1 = [r21] - mov b6 = r22 - ;; - br.call.sptk.many b0 = b6 ;; - adds r14 = 16, r34 + adds r14 = 16, r32 ;; - ld8 r15 = [r14] + ld8 r33 = [r14] + adds r14 = 120, r32 + adds r15 = 128, r32 + adds r16 = 136, r32 + adds r17 = 144, r32 + adds r18 = 152, r32 + adds r19 = 160, r32 + adds r20 = 168, r32 + adds r21 = 176, r32 + ld8 r22 = [r32] + ;; + ld8 r38 = [r14] + ld8 r39 = [r15] + ld8 r40 = [r16] + ld8 r41 = [r17] + ld8 r42 = [r18] + ld8 r43 = [r19] + ld8 r44 = [r20] + ld8 r45 = [r21] + ld8 r14 = [r22], 8 + ;; + mov b6 = r14 + ld8 r1 = [r22] + br.call.sptk.many b0 = b6 ;; - stfd [r15] = f8 + mov r1 = r36 + stfd [r33] = f8 br .L18 + ;; .L19: - ld8 r21 = [r34] - adds r14 = 144, r34 - adds r18 = 176, r34 - ;; - ld8 r22 = [r21], 8 - adds r19 = 128, r34 - adds r20 = 136, r34 - adds r15 = 152, r34 - adds r16 = 160, r34 - adds r17 = 168, r34 - ld8 r41 = [r14] - ld8 r45 = [r18] - ld8 r38 = [r23] - ;; - ld8 r39 = [r19] - ld8 r40 = [r20] - ld8 r42 = [r15] - ld8 r43 = [r16] - ld8 r44 = [r17] - ld8 r1 = [r21] - mov b6 = r22 - ;; - br.call.sptk.many b0 = b6 ;; - ld4 r14 = [r33] - mov r18 = r8 + adds r14 = 120, r32 + adds r15 = 128, r32 + adds r16 = 136, r32 + adds r17 = 144, r32 + adds r18 = 152, r32 + adds r19 = 160, r32 + adds r20 = 168, r32 + adds r21 = 176, r32 + ld8 r22 = [r32] + ;; + ld8 r38 = [r14] + ld8 r39 = [r15] + ld8 r40 = [r16] + ld8 r41 = [r17] + ld8 r42 = [r18] + ld8 r43 = [r19] + ld8 r44 = [r20] + ld8 r45 = [r21] + ld8 r14 = [r22], 8 + ;; + mov b6 = r14 + ld8 r1 = [r22] + br.call.sptk.many b0 = b6 + ;; + mov r1 = r36 + mov r23 = r8 + adds r14 = 24, r32 ;; - cmp4.ne p6, p7 = 1, r14 - (p7) br.cond.dpnt .L18 + ld4 r14 = [r14] + ;; + cmp4.eq p6, p7 = 1, r14 + (p6) br.cond.dpnt .L18 ;; cmp4.ne p6, p7 = 0, r14 - (p7) br.cond.dpnt .L98 ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) st8 [r14] = r8 + (p7) br.cond.dptk .L18 cmp4.ne p6, p7 = 2, r14 - (p7) br.cond.dpnt .L99 ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) st1 [r14] = r8 + (p7) br.cond.dpnt .L18 cmp4.ne p6, p7 = 3, r14 - (p7) br.cond.dpnt .L99 ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) st1 [r14] = r8 + (p7) br.cond.dpnt .L18 cmp4.ne p6, p7 = 4, r14 - (p6) br.cond.dptk .L29 -.L99: - adds r14 = 16, r34 ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - st1 [r15] = r18 - br .L18 -.L29: + (p7) ld8 r14 = [r14] + ;; + (p7) st1 [r14] = r8 + (p7) br.cond.dpnt .L18 cmp4.ne p6, p7 = 5, r14 - (p7) br.cond.dpnt .L100 ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) st2 [r14] = r8 + (p7) br.cond.dpnt .L18 cmp4.ne p6, p7 = 6, r14 - (p6) br.cond.dptk .L33 -.L100: - adds r14 = 16, r34 ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - st2 [r15] = r18 - br .L18 -.L33: + (p7) ld8 r14 = [r14] + ;; + (p7) st2 [r14] = r8 + (p7) br.cond.dpnt .L18 cmp4.ne p6, p7 = 7, r14 - (p7) br.cond.dpnt .L101 ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) st4 [r14] = r8 + (p7) br.cond.dpnt .L18 cmp4.ne p6, p7 = 8, r14 - (p6) br.cond.dptk .L37 -.L101: - adds r14 = 16, r34 ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - st4 [r15] = r18 - br .L18 -.L37: - mov r15 = r14 + (p7) ld8 r14 = [r14] ;; - cmp4.eq p6, p7 = 9, r15 - (p6) br.cond.dptk .L98 + (p7) st4 [r14] = r8 + (p7) br.cond.dpnt .L18 + cmp4.ne p6, p7 = 9, r14 ;; - cmp4.eq p6, p7 = 11, r15 - (p6) br.cond.dptk .L98 + cmp4.ne.and.orcm p6, p7 = 11, r14 ;; - cmp4.eq p6, p7 = 10, r15 - (p6) br.cond.dptk .L98 + (p7) adds r14 = 16, r32 ;; - cmp4.eq p6, p7 = 12, r15 - (p6) br.cond.dptk .L98 + (p7) ld8 r14 = [r14] ;; - cmp4.ne p6, p7 = 15, r15 - (p6) br.cond.dptk .L45 -.L98: - adds r14 = 16, r34 + (p7) st8 [r14] = r8 + (p7) br.cond.dptk .L18 + cmp4.ne p6, p7 = 10, r14 ;; - ld8 r15 = [r14] + cmp4.ne.and.orcm p6, p7 = 12, r14 ;; - st8 [r15] = r18 - br .L18 -.L45: + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) st8 [r14] = r8 + (p7) br.cond.dptk .L18 + cmp4.ne p6, p7 = 15, r14 + ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) st8 [r14] = r8 + (p7) br.cond.dpnt .L18 cmp4.ne p6, p7 = 16, r14 (p6) br.cond.dptk .L18 - adds r15 = 8, r34 - ;; - ld4 r14 = [r15] + adds r14 = 8, r32 ;; - and r14 = 1, r14 + ld4 r14 = [r14] ;; - cmp4.eq p6, p7 = 0, r14 - (p6) br.cond.dptk .L48 - adds r14 = 32, r34 + tbit.z p6, p7 = r14, 0 + (p6) br.cond.dptk .L45 + adds r14 = 32, r32 ;; ld8 r14 = [r14] ;; cmp.ne p6, p7 = 1, r14 - (p6) br.cond.dptk .L49 - adds r14 = 16, r34 - ld1 r16 = [r18] ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - st1 [r15] = r16 - br .L18 -.L49: + (p7) ld8 r15 = [r14] + (p7) ld1 r14 = [r8] + ;; + (p7) st1 [r15] = r14 + (p7) br.cond.dpnt .L18 cmp.ne p6, p7 = 2, r14 - (p6) br.cond.dptk .L51 - adds r14 = 16, r34 - ld2 r16 = [r18] ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - st2 [r15] = r16 - br .L18 -.L51: + (p7) ld8 r15 = [r14] + (p7) ld2 r14 = [r8] + ;; + (p7) st2 [r15] = r14 + (p7) br.cond.dpnt .L18 cmp.ne p6, p7 = 4, r14 - (p6) br.cond.dptk .L53 - adds r14 = 16, r34 - ld4 r16 = [r18] ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - st4 [r15] = r16 - br .L18 -.L53: + (p7) ld8 r15 = [r14] + (p7) ld4 r14 = [r8] + ;; + (p7) st4 [r15] = r14 + (p7) br.cond.dpnt .L18 cmp.ne p6, p7 = 8, r14 - (p6) br.cond.dptk .L55 - adds r14 = 16, r34 - ld8 r16 = [r18] ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - st8 [r15] = r16 - br .L18 -.L55: + (p7) ld8 r15 = [r14] + (p7) ld8 r14 = [r8] + ;; + (p7) st8 [r15] = r14 + (p7) br.cond.dpnt .L18 adds r14 = 7, r14 ;; - shr.u r14 = r14, 3 + shr.u r25 = r14, 3 ;; - adds r14 = -1, r14 + adds r15 = -1, r25 ;; - cmp4.le p6, p7 = 0, r14 - sxt4 r17 = r14 - (p7) br.cond.dpnt .L18 - adds r14 = 16, r34 + cmp4.gt p6, p7 = r0, r15 + (p6) br.cond.dpnt .L18 + sxt4 r14 = r15 ;; - ld8 r19 = [r14] -.L59: - shl r14 = r17, 3 - adds r17 = -1, r17 + shladd r24 = r14, 3, r0 ;; - add r16 = r18, r14 - add r14 = r19, r14 - cmp4.le p6, p7 = 0, r17 + add r23 = r8, r24 + adds r16 = 16, r32 + sub r14 = r25, r15 ;; - ld8 r15 = [r16] - sxt4 r17 = r17 + adds r14 = -2, r14 + ;; + sub r14 = r15, r14, 1 + ;; + addp4 r14 = r14, r0 + ;; + mov ar.lc = r14 +.L56: + ld8 r14 = [r16] + ;; + add r14 = r24, r14 + ld8 r15 = [r23], -8 ;; st8 [r14] = r15 - (p6) br.cond.dptk .L59 + adds r24 = -8, r24 + br.cloop.sptk.few .L56 br .L18 -.L48: - ld4 r14 = [r15] - addl r15 = 512, r0 - ;; - and r14 = r15, r14 ;; - cmp4.eq p6, p7 = 0, r14 - (p6) br.cond.dptk .L18 - adds r22 = 32, r34 +.L45: + tbit.z p6, p7 = r14, 9 + (p6) br.cond.dpnt .L18 + adds r16 = 32, r32 ;; - ld8 r15 = [r22] + ld8 r15 = [r16] ;; adds r14 = -1, r15 ;; cmp.ltu p6, p7 = 31, r14 - (p6) br.cond.dptk .L18 + (p6) br.cond.dpnt .L18 ;; cmp.eq p6, p7 = 0, r15 - (p6) br.cond.dptk .L64 - adds r14 = 16, r34 + (p6) br.cond.dptk .L59 + adds r15 = 16, r32 + ;; + ld8 r14 = [r15] + ;; + st1 [r14] = r8 + ld8 r14 = [r16] + ;; + cmp.geu p6, p7 = 1, r14 + ;; + (p7) ld8 r14 = [r15] + ;; + (p7) adds r14 = 1, r14 + (p7) shr r15 = r8, 8 ;; - ld8 r15 = [r14] + (p7) st1 [r14] = r15 + adds r14 = 32, r32 ;; - st1 [r15] = r18 - ld8 r15 = [r22] + ld8 r14 = [r14] ;; -.L64: - cmp.geu p6, p7 = 1, r15 - (p6) br.cond.dptk .L65 - adds r14 = 16, r34 - shr r16 = r18, 8 + cmp.geu p6, p7 = 2, r14 ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - adds r15 = 1, r15 + (p7) ld8 r14 = [r14] ;; - st1 [r15] = r16 - ld8 r15 = [r22] + (p7) adds r14 = 2, r14 + (p7) shr r15 = r8, 16 ;; -.L65: - cmp.geu p6, p7 = 2, r15 - (p6) br.cond.dptk .L66 - adds r14 = 16, r34 - shr r16 = r18, 16 + (p7) st1 [r14] = r15 + adds r14 = 32, r32 ;; - ld8 r15 = [r14] + ld8 r14 = [r14] ;; - adds r15 = 2, r15 + cmp.geu p6, p7 = 3, r14 ;; - st1 [r15] = r16 - ld8 r15 = [r22] + (p7) adds r14 = 16, r32 ;; -.L66: - cmp.geu p6, p7 = 3, r15 - (p6) br.cond.dptk .L67 - adds r14 = 16, r34 - shr r16 = r18, 24 + (p7) ld8 r14 = [r14] ;; - ld8 r15 = [r14] + (p7) adds r14 = 3, r14 + (p7) shr r15 = r8, 24 ;; - adds r15 = 3, r15 + (p7) st1 [r14] = r15 +.L59: + adds r14 = 32, r32 ;; - st1 [r15] = r16 - ld8 r15 = [r22] + ld8 r14 = [r14] ;; -.L67: - cmp.geu p6, p7 = 4, r15 - (p6) br.cond.dptk .L68 - adds r14 = 16, r34 - shr r16 = r18, 32 + cmp.geu p6, p7 = 4, r14 ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - adds r15 = 4, r15 + (p7) ld8 r14 = [r14] ;; - st1 [r15] = r16 - ld8 r15 = [r22] + (p7) adds r14 = 4, r14 + (p7) shr r15 = r23, 32 ;; -.L68: - cmp.geu p6, p7 = 5, r15 - (p6) br.cond.dptk .L69 - adds r14 = 16, r34 - shr r16 = r18, 40 + (p7) st1 [r14] = r15 + adds r14 = 32, r32 ;; - ld8 r15 = [r14] + ld8 r14 = [r14] ;; - adds r15 = 5, r15 + cmp.geu p6, p7 = 5, r14 ;; - st1 [r15] = r16 - ld8 r15 = [r22] + (p7) adds r14 = 16, r32 ;; -.L69: - cmp.geu p6, p7 = 6, r15 - (p6) br.cond.dptk .L70 - adds r14 = 16, r34 - shr r16 = r18, 48 + (p7) ld8 r14 = [r14] ;; - ld8 r15 = [r14] + (p7) adds r14 = 5, r14 + (p7) shr r15 = r23, 40 ;; - adds r15 = 6, r15 + (p7) st1 [r14] = r15 + adds r14 = 32, r32 ;; - st1 [r15] = r16 - ld8 r15 = [r22] + ld8 r14 = [r14] ;; -.L70: - cmp.geu p6, p7 = 7, r15 - (p6) br.cond.dptk .L71 - adds r14 = 16, r34 - shr r16 = r18, 56 + cmp.geu p6, p7 = 6, r14 ;; - ld8 r15 = [r14] + (p7) adds r14 = 16, r32 ;; - adds r15 = 7, r15 + (p7) ld8 r14 = [r14] ;; - st1 [r15] = r16 - ld8 r15 = [r22] + (p7) adds r14 = 6, r14 + (p7) shr r15 = r23, 48 ;; -.L71: - cmp.geu p6, p7 = 8, r15 - (p6) br.cond.dptk .L18 - adds r16 = 16, r34 + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] + ;; + cmp.geu p6, p7 = 7, r14 + ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 7, r14 + (p7) shr r15 = r23, 56 + ;; + (p7) st1 [r14] = r15 + adds r15 = 32, r32 + ;; + ld8 r14 = [r15] + ;; + cmp.geu p6, p7 = 8, r14 + (p6) br.cond.dpnt .L18 + adds r16 = 16, r32 ;; ld8 r14 = [r16] ;; adds r14 = 8, r14 ;; st1 [r14] = r9 - ld8 r15 = [r22] + ld8 r14 = [r15] ;; - cmp.geu p6, p7 = 9, r15 - (p6) br.cond.dptk .L73 - ld8 r14 = [r16] - shr r15 = r9, 8 + cmp.geu p6, p7 = 9, r14 ;; - adds r14 = 9, r14 + (p7) ld8 r14 = [r16] ;; - st1 [r14] = r15 - ld8 r15 = [r22] + (p7) adds r14 = 9, r14 + (p7) shr r15 = r9, 8 ;; -.L73: - cmp.geu p6, p7 = 10, r15 - (p6) br.cond.dptk .L74 - ld8 r14 = [r16] - shr r15 = r9, 16 + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] + ;; + cmp.geu p6, p7 = 10, r14 + ;; + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] ;; - adds r14 = 10, r14 + (p7) adds r14 = 10, r14 + (p7) shr r15 = r9, 16 ;; - st1 [r14] = r15 -.L74: - ld8 r14 = [r22] + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; cmp.geu p6, p7 = 11, r14 - (p6) br.cond.dptk .L75 - ld8 r14 = [r16] - shr r15 = r9, 24 ;; - adds r14 = 11, r14 + (p7) adds r14 = 16, r32 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 11, r14 + (p7) shr r15 = r9, 24 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L75: cmp.geu p6, p7 = 12, r14 - (p6) br.cond.dptk .L76 - ld8 r14 = [r16] - shr r15 = r9, 32 ;; - adds r14 = 12, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 12, r14 + (p7) shr r15 = r9, 32 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L76: cmp.geu p6, p7 = 13, r14 - (p6) br.cond.dptk .L77 - ld8 r14 = [r16] - shr r15 = r9, 40 ;; - adds r14 = 13, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 13, r14 + (p7) shr r15 = r9, 40 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L77: cmp.geu p6, p7 = 14, r14 - (p6) br.cond.dptk .L78 - ld8 r14 = [r16] - shr r15 = r9, 48 ;; - adds r14 = 14, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 14, r14 + (p7) shr r15 = r9, 48 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L78: cmp.geu p6, p7 = 15, r14 - (p6) br.cond.dptk .L79 - ld8 r14 = [r16] - shr r15 = r9, 56 ;; - adds r14 = 15, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 15, r14 + (p7) shr r15 = r9, 56 + ;; + (p7) st1 [r14] = r15 + adds r15 = 32, r32 + ;; + ld8 r14 = [r15] ;; -.L79: cmp.geu p6, p7 = 16, r14 - (p6) br.cond.dptk .L18 + (p6) br.cond.dpnt .L18 + adds r16 = 16, r32 + ;; ld8 r14 = [r16] ;; adds r14 = 16, r14 ;; st1 [r14] = r10 - ld8 r14 = [r22] + ld8 r14 = [r15] ;; cmp.geu p6, p7 = 17, r14 - (p6) br.cond.dptk .L81 - ld8 r14 = [r16] - shr r15 = r10, 8 ;; - adds r14 = 17, r14 + (p7) ld8 r14 = [r16] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 17, r14 + (p7) shr r15 = r10, 8 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L81: cmp.geu p6, p7 = 18, r14 - (p6) br.cond.dptk .L82 - ld8 r14 = [r16] - shr r15 = r10, 16 ;; - adds r14 = 18, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 18, r14 + (p7) shr r15 = r10, 16 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + ld8 r14 = [r14] ;; -.L82: cmp.geu p6, p7 = 19, r14 - (p6) br.cond.dptk .L83 - ld8 r14 = [r16] - shr r15 = r10, 24 ;; - adds r14 = 19, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 19, r14 + (p7) shr r15 = r10, 24 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L83: cmp.geu p6, p7 = 20, r14 - (p6) br.cond.dptk .L84 - ld8 r14 = [r16] - shr r15 = r10, 32 ;; - adds r14 = 20, r14 + (p7) adds r14 = 16, r32 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 20, r14 + (p7) shr r15 = r10, 32 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L84: cmp.geu p6, p7 = 21, r14 - (p6) br.cond.dptk .L85 - ld8 r14 = [r16] - shr r15 = r10, 40 ;; - adds r14 = 21, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 21, r14 + (p7) shr r15 = r10, 40 ;; - st1 [r14] = r15 -.L85: - ld8 r14 = [r22] + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; cmp.geu p6, p7 = 22, r14 - (p6) br.cond.dptk .L86 - ld8 r14 = [r16] - shr r15 = r10, 48 ;; - adds r14 = 22, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 22, r14 + (p7) shr r15 = r10, 48 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L86: cmp.geu p6, p7 = 23, r14 - (p6) br.cond.dptk .L87 - ld8 r14 = [r16] - shr r15 = r10, 56 ;; - adds r14 = 23, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 23, r14 + (p7) shr r15 = r10, 56 + ;; + (p7) st1 [r14] = r15 + adds r15 = 32, r32 + ;; + ld8 r14 = [r15] ;; -.L87: cmp.geu p6, p7 = 24, r14 - (p6) br.cond.dptk .L18 + (p6) br.cond.dpnt .L18 + adds r16 = 16, r32 + ;; ld8 r14 = [r16] ;; adds r14 = 24, r14 ;; st1 [r14] = r11 - ld8 r14 = [r22] + ld8 r14 = [r15] ;; cmp.geu p6, p7 = 25, r14 - (p6) br.cond.dptk .L89 - ld8 r14 = [r16] - shr r15 = r11, 8 ;; - adds r14 = 25, r14 + (p7) ld8 r14 = [r16] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 25, r14 + (p7) shr r15 = r11, 8 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L89: cmp.geu p6, p7 = 26, r14 - (p6) br.cond.dptk .L90 - ld8 r14 = [r16] - shr r15 = r11, 16 ;; - adds r14 = 26, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) adds r14 = 26, r14 + (p7) shr r15 = r11, 16 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L90: cmp.geu p6, p7 = 27, r14 - (p6) br.cond.dptk .L91 - ld8 r14 = [r16] - shr r15 = r11, 24 ;; - adds r14 = 27, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 27, r14 + (p7) shr r15 = r11, 24 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + ld8 r14 = [r14] ;; -.L91: cmp.geu p6, p7 = 28, r14 - (p6) br.cond.dptk .L92 - ld8 r14 = [r16] - shr r15 = r11, 32 ;; - adds r14 = 28, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 28, r14 + (p7) shr r15 = r11, 32 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L92: cmp.geu p6, p7 = 29, r14 - (p6) br.cond.dptk .L93 - ld8 r14 = [r16] - shr r15 = r11, 40 ;; - adds r14 = 29, r14 + (p7) adds r14 = 16, r32 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 29, r14 + (p7) shr r15 = r11, 40 + ;; + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L93: cmp.geu p6, p7 = 30, r14 - (p6) br.cond.dptk .L94 - ld8 r14 = [r16] - shr r15 = r11, 48 ;; - adds r14 = 30, r14 + (p7) adds r14 = 16, r32 + ;; + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 30, r14 + (p7) shr r15 = r11, 48 ;; - st1 [r14] = r15 - ld8 r14 = [r22] + (p7) st1 [r14] = r15 + adds r14 = 32, r32 + ;; + ld8 r14 = [r14] ;; -.L94: cmp.geu p6, p7 = 31, r14 - (p6) br.cond.dptk .L18 - ld8 r14 = [r16] - shr r15 = r11, 56 ;; - adds r14 = 31, r14 + (p7) adds r14 = 16, r32 ;; - st1 [r14] = r15 + (p7) ld8 r14 = [r14] + ;; + (p7) adds r14 = 31, r14 + (p7) shr r15 = r11, 56 + ;; + (p7) st1 [r14] = r15 .L18: - addl r8 = 0, r0 - adds r12 = 16, r12 - mov ar.pfs = r37 - mov b0 = r36 + mov r8 = r0 + mov ar.pfs = r35 + mov ar.lc = r37 + mov b0 = r34 br.ret.sptk.many b0 + ;; .endp __builtin_avcall# - .ident "GCC: (GNU) 2.9-ia64-000216 snap-000324" + .ident "GCC: (GNU) 4.1.0 (SUSE Linux)" --- ffcall/avcall/avcall.h.in +++ ffcall/avcall/avcall.h.in 2006-07-19 17:19:49.000000000 +0200 @@ -1112,7 +1112,7 @@ typedef struct * different alignment. */ /* little endian -> small structures < 1 word are adjusted to the left */ -#if defined(__i386__) || defined(__alpha__) || defined(__x86_64__) +#if defined(__i386__) || defined(__alpha__) || defined(__x86_64__) || (defined(__ia64__) && defined(__GNUC__) && (__GNUC__ >= 3)) #define __av_struct(LIST,TYPE,TYPE_SIZE,TYPE_ALIGN,ASSIGN,VAL) \ (((LIST).aptr = \ (__avword*)(((__avword)(LIST).aptr+(TYPE_SIZE)+__av_struct_alignment(TYPE_ALIGN)-1) & -(long)__av_struct_alignment(TYPE_ALIGN)))\ @@ -1121,7 +1121,7 @@ typedef struct (LIST).aptr = (__avword*)(((__avword)(LIST).aptr+sizeof(__avword)-1) & -(long)sizeof(__avword)),\ 0)) #endif -#if defined(__ia64__) +#if defined(__ia64__) && (!defined(__GNUC__) || (__GNUC__ < 3)) /* Types larger than a word have 2-word alignment. */ #define __av_struct(LIST,TYPE,TYPE_SIZE,TYPE_ALIGN,ASSIGN,VAL) \ ((LIST).aptr = (__avword*)(((__avword)(LIST).aptr+(TYPE_SIZE)+__av_struct_alignment(TYPE_ALIGN)-1) & -(long)__av_struct_alignment(TYPE_ALIGN)), \ --- ffcall/callback/vacall_r/vacall_r.h.in +++ ffcall/callback/vacall_r/vacall_r.h.in 2006-07-19 17:23:49.000000000 +0200 @@ -1059,7 +1059,7 @@ typedef __va_alist* va_alist; #endif #define __va_align_struct(LIST,TYPE_SIZE,TYPE_ALIGN) \ (LIST)->aptr = ((LIST)->aptr + __va_struct_alignment(TYPE_ALIGN)-1) & -(long)__va_struct_alignment(TYPE_ALIGN), -#if defined(__i386__) || defined(__m68k__) || defined(__alpha__) || defined(__arm__) || defined(__powerpc64__) || defined(__m88k__) || defined(__convex__) || defined(__x86_64__) +#if defined(__i386__) || defined(__m68k__) || defined(__alpha__) || defined(__arm__) || defined(__powerpc64__) || defined(__m88k__) || defined(__convex__) || defined(__x86_64__) || (defined(__ia64__) && defined(__GNUC__) && (__GNUC__ >= 3)) #define __va_arg_struct(LIST,TYPE_SIZE,TYPE_ALIGN) \ (__va_align_struct(LIST,TYPE_SIZE,TYPE_ALIGN) \ __va_arg_adjusted(LIST,TYPE_SIZE,TYPE_ALIGN) \ @@ -1144,7 +1144,7 @@ typedef __va_alist* va_alist; (void*)__va_arg_rightadjusted(LIST,TYPE_SIZE,TYPE_ALIGN) \ ) #endif -#if defined(__ia64__) +#if defined(__ia64__) && (!defined(__GNUC__) || (__GNUC__ < 3)) /* Types larger than a word have 2-word alignment. */ #define __va_arg_struct(LIST,TYPE_SIZE,TYPE_ALIGN) \ (__va_align_struct(LIST,TYPE_SIZE,TYPE_ALIGN) \