1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 1.2 +++ b/security/nss/lib/freebl/mpi/montmulf.s Wed Dec 31 06:09:35 2014 +0100 1.3 @@ -0,0 +1,1938 @@ 1.4 +! 1.5 +! This Source Code Form is subject to the terms of the Mozilla Public 1.6 +! License, v. 2.0. If a copy of the MPL was not distributed with this 1.7 +! file, You can obtain one at http://mozilla.org/MPL/2.0/. 1.8 + 1.9 + .section ".text",#alloc,#execinstr 1.10 + .file "montmulf.c" 1.11 + 1.12 + .section ".data",#alloc,#write 1.13 + .align 8 1.14 +TwoTo16: /* frequency 1.0 confidence 0.0 */ 1.15 + .word 1089470464 1.16 + .word 0 1.17 + .type TwoTo16,#object 1.18 + .size TwoTo16,8 1.19 +TwoToMinus16: /* frequency 1.0 confidence 0.0 */ 1.20 + .word 1055916032 1.21 + .word 0 1.22 + .type TwoToMinus16,#object 1.23 + .size TwoToMinus16,8 1.24 +Zero: /* frequency 1.0 confidence 0.0 */ 1.25 + .word 0 1.26 + .word 0 1.27 + .type Zero,#object 1.28 + .size Zero,8 1.29 +TwoTo32: /* frequency 1.0 confidence 0.0 */ 1.30 + .word 1106247680 1.31 + .word 0 1.32 + .type TwoTo32,#object 1.33 + .size TwoTo32,8 1.34 +TwoToMinus32: /* frequency 1.0 confidence 0.0 */ 1.35 + .word 1039138816 1.36 + .word 0 1.37 + .type TwoToMinus32,#object 1.38 + .size TwoToMinus32,8 1.39 + 1.40 + .section ".text",#alloc,#execinstr 1.41 +/* 000000 0 ( 0 0) */ .align 4 1.42 +! 1.43 +! SUBROUTINE cleanup 1.44 +! 1.45 +! OFFSET SOURCE LINE LABEL INSTRUCTION (ISSUE TIME) (COMPLETION TIME) 1.46 + 1.47 + .global cleanup 1.48 + cleanup: /* frequency 1.0 confidence 0.0 */ 1.49 +! FILE montmulf.c 1.50 + 1.51 +! 1 !#define RF_INLINE_MACROS 1.52 +! 3 !static double TwoTo16=65536.0; 1.53 +! 4 !static double TwoToMinus16=1.0/65536.0; 1.54 +! 5 !static double Zero=0.0; 1.55 +! 6 !static double TwoTo32=65536.0*65536.0; 1.56 +! 7 !static double TwoToMinus32=1.0/(65536.0*65536.0); 1.57 +! 9 !#ifdef RF_INLINE_MACROS 1.58 +! 11 !double upper32(double); 1.59 +! 12 !double lower32(double, double); 1.60 +! 13 !double mod(double, double, double); 1.61 +! 
15 !#else 1.62 +! 17 !static double upper32(double x) 1.63 +! 18 !{ 1.64 +! 19 ! return floor(x*TwoToMinus32); 1.65 +! 20 !} 1.66 +! 22 !static double lower32(double x, double y) 1.67 +! 23 !{ 1.68 +! 24 ! return x-TwoTo32*floor(x*TwoToMinus32); 1.69 +! 25 !} 1.70 +! 27 !static double mod(double x, double oneoverm, double m) 1.71 +! 28 !{ 1.72 +! 29 ! return x-m*floor(x*oneoverm); 1.73 +! 30 !} 1.74 +! 32 !#endif 1.75 +! 35 !void cleanup(double *dt, int from, int tlen) 1.76 +! 36 !{ 1.77 +! 37 ! int i; 1.78 +! 38 ! double tmp,tmp1,x,x1; 1.79 +! 40 ! tmp=tmp1=Zero; 1.80 + 1.81 +/* 000000 40 ( 0 1) */ sethi %hi(Zero),%g2 1.82 + 1.83 +! 41 ! /* original code ** 1.84 +! 42 ! for(i=2*from;i<2*tlen-2;i++) 1.85 +! 43 ! { 1.86 +! 44 ! x=dt[i]; 1.87 +! 45 ! dt[i]=lower32(x,Zero)+tmp1; 1.88 +! 46 ! tmp1=tmp; 1.89 +! 47 ! tmp=upper32(x); 1.90 +! 48 ! } 1.91 +! 49 ! dt[tlen-2]+=tmp1; 1.92 +! 50 ! dt[tlen-1]+=tmp; 1.93 +! 51 ! **end original code ***/ 1.94 +! 52 ! /* new code ***/ 1.95 +! 53 ! for(i=2*from;i<2*tlen;i+=2) 1.96 + 1.97 +/* 0x0004 53 ( 1 2) */ sll %o2,1,%g3 1.98 +/* 0x0008 40 ( 1 4) */ ldd [%g2+%lo(Zero)],%f0 1.99 +/* 0x000c ( 1 2) */ add %g2,%lo(Zero),%g2 1.100 +/* 0x0010 53 ( 2 3) */ sll %o1,1,%g4 1.101 +/* 0x0014 36 ( 3 4) */ sll %o1,4,%g1 1.102 +/* 0x0018 40 ( 3 4) */ fmovd %f0,%f4 1.103 +/* 0x001c 53 ( 3 4) */ cmp %g4,%g3 1.104 +/* 0x0020 ( 3 4) */ bge,pt %icc,.L77000116 ! tprob=0.56 1.105 +/* 0x0024 ( 4 5) */ fmovd %f0,%f2 1.106 +/* 0x0028 36 ( 4 5) */ add %o0,%g1,%g1 1.107 +/* 0x002c ( 4 5) */ sub %g3,1,%g3 1.108 + 1.109 +! 54 ! { 1.110 +! 55 ! x=dt[i]; 1.111 + 1.112 +/* 0x0030 55 ( 5 8) */ ldd [%g1],%f8 1.113 + .L900000114: /* frequency 6.4 confidence 0.0 */ 1.114 +/* 0x0034 ( 0 3) */ fdtox %f8,%f6 1.115 + 1.116 +! 56 ! x1=dt[i+1]; 1.117 + 1.118 +/* 0x0038 56 ( 0 3) */ ldd [%g1+8],%f10 1.119 + 1.120 +! 57 ! dt[i]=lower32(x,Zero)+tmp; 1.121 +! 58 ! dt[i+1]=lower32(x1,Zero)+tmp1; 1.122 +! 59 ! tmp=upper32(x); 1.123 +! 60 ! 
tmp1=upper32(x1); 1.124 + 1.125 +/* 0x003c 60 ( 0 1) */ add %g4,2,%g4 1.126 +/* 0x0040 ( 1 4) */ fdtox %f8,%f8 1.127 +/* 0x0044 ( 1 2) */ cmp %g4,%g3 1.128 +/* 0x0048 ( 5 6) */ fmovs %f0,%f6 1.129 +/* 0x004c ( 7 10) */ fxtod %f6,%f6 1.130 +/* 0x0050 ( 8 11) */ fdtox %f10,%f0 1.131 +/* 0x0054 57 (10 13) */ faddd %f6,%f2,%f2 1.132 +/* 0x0058 (10 11) */ std %f2,[%g1] 1.133 +/* 0x005c (12 15) */ ldd [%g2],%f2 1.134 +/* 0x0060 (14 15) */ fmovs %f2,%f0 1.135 +/* 0x0064 (16 19) */ fxtod %f0,%f6 1.136 +/* 0x0068 (17 20) */ fdtox %f10,%f0 1.137 +/* 0x006c (18 21) */ fitod %f8,%f2 1.138 +/* 0x0070 58 (19 22) */ faddd %f6,%f4,%f4 1.139 +/* 0x0074 (19 20) */ std %f4,[%g1+8] 1.140 +/* 0x0078 60 (19 20) */ add %g1,16,%g1 1.141 +/* 0x007c (20 23) */ fitod %f0,%f4 1.142 +/* 0x0080 (20 23) */ ldd [%g2],%f0 1.143 +/* 0x0084 (20 21) */ ble,a,pt %icc,.L900000114 ! tprob=0.86 1.144 +/* 0x0088 (21 24) */ ldd [%g1],%f8 1.145 + .L77000116: /* frequency 1.0 confidence 0.0 */ 1.146 +/* 0x008c ( 0 2) */ retl ! Result = 1.147 +/* 0x0090 ( 1 2) */ nop 1.148 +/* 0x0094 0 ( 0 0) */ .type cleanup,2 1.149 +/* 0x0094 ( 0 0) */ .size cleanup,(.-cleanup) 1.150 + 1.151 + .section ".text",#alloc,#execinstr 1.152 +/* 000000 0 ( 0 0) */ .align 4 1.153 +! 1.154 +! SUBROUTINE conv_d16_to_i32 1.155 +! 1.156 +! OFFSET SOURCE LINE LABEL INSTRUCTION (ISSUE TIME) (COMPLETION TIME) 1.157 + 1.158 + .global conv_d16_to_i32 1.159 + conv_d16_to_i32: /* frequency 1.0 confidence 0.0 */ 1.160 +/* 000000 ( 0 1) */ save %sp,-136,%sp 1.161 + 1.162 +! 61 ! } 1.163 +! 62 ! /** end new code **/ 1.164 +! 63 !} 1.165 +! 66 !void conv_d16_to_i32(unsigned int *i32, double *d16, long long *tmp, int ilen) 1.166 +! 67 !{ 1.167 +! 68 !int i; 1.168 +! 69 !long long t, t1, a, b, c, d; 1.169 +! 71 ! t1=0; 1.170 +! 72 ! a=(long long)d16[0]; 1.171 + 1.172 +/* 0x0004 72 ( 1 4) */ ldd [%i1],%f0 1.173 + 1.174 +! 73 ! b=(long long)d16[1]; 1.175 +! 74 ! 
for(i=0; i<ilen-1; i++) 1.176 + 1.177 +/* 0x0008 74 ( 1 2) */ sub %i3,1,%g2 1.178 +/* 0x000c 67 ( 1 2) */ or %g0,%i0,%g5 1.179 +/* 0x0010 74 ( 2 3) */ cmp %g2,0 1.180 +/* 0x0014 71 ( 2 3) */ or %g0,0,%o4 1.181 +/* 0x0018 72 ( 3 6) */ fdtox %f0,%f0 1.182 +/* 0x001c ( 3 4) */ std %f0,[%sp+120] 1.183 +/* 0x0020 74 ( 3 4) */ or %g0,0,%o7 1.184 +/* 0x0024 67 ( 4 5) */ or %g0,%i3,%o0 1.185 +/* 0x0028 ( 4 5) */ sub %i3,2,%o2 1.186 +/* 0x002c 73 ( 5 8) */ ldd [%i1+8],%f0 1.187 +/* 0x0030 67 ( 5 6) */ sethi %hi(0xfc00),%o0 1.188 +/* 0x0034 ( 5 6) */ add %o2,1,%g3 1.189 +/* 0x0038 ( 6 7) */ add %o0,1023,%o1 1.190 +/* 0x003c ( 6 7) */ or %g0,%g5,%o5 1.191 +/* 0x0040 73 ( 7 10) */ fdtox %f0,%f0 1.192 +/* 0x0044 ( 7 8) */ std %f0,[%sp+112] 1.193 +/* 0x0048 72 (11 13) */ ldx [%sp+120],%g4 1.194 +/* 0x004c 73 (12 14) */ ldx [%sp+112],%g1 1.195 +/* 0x0050 74 (12 13) */ ble,pt %icc,.L900000214 ! tprob=0.56 1.196 +/* 0x0054 (12 13) */ sethi %hi(0xfc00),%g2 1.197 +/* 0x0058 67 (13 14) */ or %g0,-1,%g2 1.198 +/* 0x005c 74 (13 14) */ cmp %g3,3 1.199 +/* 0x0060 67 (14 15) */ srl %g2,0,%o3 1.200 +/* 0x0064 (14 15) */ or %g0,%i1,%g2 1.201 +/* 0x0068 74 (14 15) */ bl,pn %icc,.L77000134 ! tprob=0.44 1.202 +/* 0x006c (15 18) */ ldd [%g2+16],%f0 1.203 + 1.204 +! 75 ! { 1.205 +! 76 ! c=(long long)d16[2*i+2]; 1.206 +! 77 ! t1+=a&0xffffffff; 1.207 +! 78 ! t=(a>>32); 1.208 +! 79 ! d=(long long)d16[2*i+3]; 1.209 +! 80 ! t1+=(b&0xffff)<<16; 1.210 + 1.211 +/* 0x0070 80 (15 16) */ and %g1,%o1,%o0 1.212 + 1.213 +! 81 ! t+=(b>>16)+(t1>>32); 1.214 +! 82 ! i32[i]=t1&0xffffffff; 1.215 +! 83 ! t1=t; 1.216 +! 84 ! a=c; 1.217 +! 85 ! 
b=d; 1.218 + 1.219 +/* 0x0074 85 (15 16) */ add %g2,16,%g2 1.220 +/* 0x0078 80 (16 17) */ sllx %o0,16,%g3 1.221 +/* 0x007c 77 (16 17) */ and %g4,%o3,%o0 1.222 +/* 0x0080 76 (17 20) */ fdtox %f0,%f0 1.223 +/* 0x0084 (17 18) */ std %f0,[%sp+104] 1.224 +/* 0x0088 74 (17 18) */ add %o0,%g3,%o4 1.225 +/* 0x008c 79 (18 21) */ ldd [%g2+8],%f2 1.226 +/* 0x0090 81 (18 19) */ srax %g1,16,%o0 1.227 +/* 0x0094 82 (18 19) */ and %o4,%o3,%o7 1.228 +/* 0x0098 81 (19 20) */ stx %o0,[%sp+112] 1.229 +/* 0x009c (19 20) */ srax %o4,32,%o0 1.230 +/* 0x00a0 85 (19 20) */ add %g5,4,%o5 1.231 +/* 0x00a4 81 (20 21) */ stx %o0,[%sp+120] 1.232 +/* 0x00a8 78 (20 21) */ srax %g4,32,%o4 1.233 +/* 0x00ac 79 (20 23) */ fdtox %f2,%f0 1.234 +/* 0x00b0 (21 22) */ std %f0,[%sp+96] 1.235 +/* 0x00b4 81 (22 24) */ ldx [%sp+112],%o0 1.236 +/* 0x00b8 (23 25) */ ldx [%sp+120],%g4 1.237 +/* 0x00bc 76 (25 27) */ ldx [%sp+104],%g3 1.238 +/* 0x00c0 81 (25 26) */ add %o0,%g4,%g4 1.239 +/* 0x00c4 79 (26 28) */ ldx [%sp+96],%g1 1.240 +/* 0x00c8 81 (26 27) */ add %o4,%g4,%o4 1.241 +/* 0x00cc 82 (27 28) */ st %o7,[%g5] 1.242 +/* 0x00d0 (27 28) */ or %g0,1,%o7 1.243 +/* 0x00d4 84 (27 28) */ or %g0,%g3,%g4 1.244 + .L900000209: /* frequency 64.0 confidence 0.0 */ 1.245 +/* 0x00d8 76 (17 19) */ ldd [%g2+16],%f0 1.246 +/* 0x00dc 85 (17 18) */ add %o7,1,%o7 1.247 +/* 0x00e0 (17 18) */ add %o5,4,%o5 1.248 +/* 0x00e4 (18 18) */ cmp %o7,%o2 1.249 +/* 0x00e8 (18 19) */ add %g2,16,%g2 1.250 +/* 0x00ec 76 (19 22) */ fdtox %f0,%f0 1.251 +/* 0x00f0 (20 21) */ std %f0,[%sp+104] 1.252 +/* 0x00f4 79 (21 23) */ ldd [%g2+8],%f0 1.253 +/* 0x00f8 (23 26) */ fdtox %f0,%f0 1.254 +/* 0x00fc (24 25) */ std %f0,[%sp+96] 1.255 +/* 0x0100 80 (25 26) */ and %g1,%o1,%g3 1.256 +/* 0x0104 (26 27) */ sllx %g3,16,%g3 1.257 +/* 0x0108 ( 0 0) */ stx %g3,[%sp+120] 1.258 +/* 0x010c 77 (26 27) */ and %g4,%o3,%g3 1.259 +/* 0x0110 74 ( 0 0) */ stx %o7,[%sp+128] 1.260 +/* 0x0114 ( 0 0) */ ldx [%sp+120],%o7 1.261 +/* 0x0118 (27 27) */ add %g3,%o7,%g3 1.262 
+/* 0x011c ( 0 0) */ ldx [%sp+128],%o7 1.263 +/* 0x0120 81 (28 29) */ srax %g1,16,%g1 1.264 +/* 0x0124 74 (28 28) */ add %g3,%o4,%g3 1.265 +/* 0x0128 81 (29 30) */ srax %g3,32,%o4 1.266 +/* 0x012c ( 0 0) */ stx %o4,[%sp+112] 1.267 +/* 0x0130 78 (30 31) */ srax %g4,32,%o4 1.268 +/* 0x0134 81 ( 0 0) */ ldx [%sp+112],%g4 1.269 +/* 0x0138 (30 31) */ add %g1,%g4,%g4 1.270 +/* 0x013c 79 (31 33) */ ldx [%sp+96],%g1 1.271 +/* 0x0140 81 (31 32) */ add %o4,%g4,%o4 1.272 +/* 0x0144 82 (32 33) */ and %g3,%o3,%g3 1.273 +/* 0x0148 84 ( 0 0) */ ldx [%sp+104],%g4 1.274 +/* 0x014c 85 (33 34) */ ble,pt %icc,.L900000209 ! tprob=0.50 1.275 +/* 0x0150 (33 34) */ st %g3,[%o5-4] 1.276 + .L900000212: /* frequency 8.0 confidence 0.0 */ 1.277 +/* 0x0154 85 ( 0 1) */ ba .L900000214 ! tprob=1.00 1.278 +/* 0x0158 ( 0 1) */ sethi %hi(0xfc00),%g2 1.279 + .L77000134: /* frequency 0.7 confidence 0.0 */ 1.280 + .L900000213: /* frequency 6.4 confidence 0.0 */ 1.281 +/* 0x015c 77 ( 0 1) */ and %g4,%o3,%o0 1.282 +/* 0x0160 80 ( 0 1) */ and %g1,%o1,%g3 1.283 +/* 0x0164 76 ( 0 3) */ fdtox %f0,%f0 1.284 +/* 0x0168 77 ( 1 2) */ add %o4,%o0,%o0 1.285 +/* 0x016c 76 ( 1 2) */ std %f0,[%sp+104] 1.286 +/* 0x0170 85 ( 1 2) */ add %o7,1,%o7 1.287 +/* 0x0174 80 ( 2 3) */ sllx %g3,16,%o4 1.288 +/* 0x0178 79 ( 2 5) */ ldd [%g2+24],%f2 1.289 +/* 0x017c 85 ( 2 3) */ add %g2,16,%g2 1.290 +/* 0x0180 80 ( 3 4) */ add %o0,%o4,%o4 1.291 +/* 0x0184 81 ( 3 4) */ stx %o7,[%sp+128] 1.292 +/* 0x0188 ( 4 5) */ srax %g1,16,%o0 1.293 +/* 0x018c ( 4 5) */ stx %o0,[%sp+112] 1.294 +/* 0x0190 82 ( 4 5) */ and %o4,%o3,%g3 1.295 +/* 0x0194 81 ( 5 6) */ srax %o4,32,%o0 1.296 +/* 0x0198 ( 5 6) */ stx %o0,[%sp+120] 1.297 +/* 0x019c 79 ( 5 8) */ fdtox %f2,%f0 1.298 +/* 0x01a0 ( 6 7) */ std %f0,[%sp+96] 1.299 +/* 0x01a4 78 ( 6 7) */ srax %g4,32,%o4 1.300 +/* 0x01a8 81 ( 7 9) */ ldx [%sp+120],%o7 1.301 +/* 0x01ac ( 8 10) */ ldx [%sp+112],%g4 1.302 +/* 0x01b0 76 (10 12) */ ldx [%sp+104],%g1 1.303 +/* 0x01b4 81 (10 11) */ add %g4,%o7,%g4 1.304 
+/* 0x01b8 (11 13) */ ldx [%sp+128],%o7 1.305 +/* 0x01bc (11 12) */ add %o4,%g4,%o4 1.306 +/* 0x01c0 79 (12 14) */ ldx [%sp+96],%o0 1.307 +/* 0x01c4 84 (12 13) */ or %g0,%g1,%g4 1.308 +/* 0x01c8 82 (13 14) */ st %g3,[%o5] 1.309 +/* 0x01cc 85 (13 14) */ add %o5,4,%o5 1.310 +/* 0x01d0 (13 14) */ cmp %o7,%o2 1.311 +/* 0x01d4 (14 15) */ or %g0,%o0,%g1 1.312 +/* 0x01d8 (14 15) */ ble,a,pt %icc,.L900000213 ! tprob=0.86 1.313 +/* 0x01dc (14 17) */ ldd [%g2+16],%f0 1.314 + .L77000127: /* frequency 1.0 confidence 0.0 */ 1.315 + 1.316 +! 86 ! } 1.317 +! 87 ! t1+=a&0xffffffff; 1.318 +! 88 ! t=(a>>32); 1.319 +! 89 ! t1+=(b&0xffff)<<16; 1.320 +! 90 ! i32[i]=t1&0xffffffff; 1.321 + 1.322 +/* 0x01e0 90 ( 0 1) */ sethi %hi(0xfc00),%g2 1.323 + .L900000214: /* frequency 1.0 confidence 0.0 */ 1.324 +/* 0x01e4 90 ( 0 1) */ or %g0,-1,%g3 1.325 +/* 0x01e8 ( 0 1) */ add %g2,1023,%g2 1.326 +/* 0x01ec ( 1 2) */ srl %g3,0,%g3 1.327 +/* 0x01f0 ( 1 2) */ and %g1,%g2,%g2 1.328 +/* 0x01f4 ( 2 3) */ and %g4,%g3,%g4 1.329 +/* 0x01f8 ( 3 4) */ sllx %g2,16,%g2 1.330 +/* 0x01fc ( 3 4) */ add %o4,%g4,%g4 1.331 +/* 0x0200 ( 4 5) */ add %g4,%g2,%g2 1.332 +/* 0x0204 ( 5 6) */ sll %o7,2,%g4 1.333 +/* 0x0208 ( 5 6) */ and %g2,%g3,%g2 1.334 +/* 0x020c ( 6 7) */ st %g2,[%g5+%g4] 1.335 +/* 0x0210 ( 7 9) */ ret ! Result = 1.336 +/* 0x0214 ( 9 10) */ restore %g0,%g0,%g0 1.337 +/* 0x0218 0 ( 0 0) */ .type conv_d16_to_i32,2 1.338 +/* 0x0218 ( 0 0) */ .size conv_d16_to_i32,(.-conv_d16_to_i32) 1.339 + 1.340 + .section ".text",#alloc,#execinstr 1.341 +/* 000000 0 ( 0 0) */ .align 8 1.342 +! 1.343 +! CONSTANT POOL 1.344 +! 1.345 + .L_const_seg_900000301: /* frequency 1.0 confidence 0.0 */ 1.346 +/* 000000 0 ( 0 0) */ .word 1127219200,0 1.347 +/* 0x0008 0 ( 0 0) */ .align 4 1.348 +! 1.349 +! SUBROUTINE conv_i32_to_d32 1.350 +! 1.351 +! 
OFFSET SOURCE LINE LABEL INSTRUCTION (ISSUE TIME) (COMPLETION TIME) 1.352 + 1.353 + .global conv_i32_to_d32 1.354 + conv_i32_to_d32: /* frequency 1.0 confidence 0.0 */ 1.355 +/* 000000 ( 0 1) */ orcc %g0,%o2,%g1 1.356 + 1.357 +! 92 !} 1.358 +! 94 !void conv_i32_to_d32(double *d32, unsigned int *i32, int len) 1.359 +! 95 !{ 1.360 +! 96 !int i; 1.361 +! 98 !#pragma pipeloop(0) 1.362 +! 99 ! for(i=0;i<len;i++) d32[i]=(double)(i32[i]); 1.363 + 1.364 +/* 0x0004 99 ( 0 1) */ ble,pt %icc,.L77000140 ! tprob=0.56 1.365 +/* 0x0008 ( 0 1) */ nop 1.366 +/* 0x000c ( 1 2) */ sethi %hi(.L_const_seg_900000301),%g2 1.367 +/* 0x0010 95 ( 1 2) */ or %g0,%o1,%g4 1.368 +/* 0x0014 99 ( 2 3) */ add %g2,%lo(.L_const_seg_900000301),%g2 1.369 +/* 0x0018 ( 2 3) */ or %g0,0,%o5 1.370 +/* 0x001c 95 ( 3 4) */ or %g0,%o0,%g5 1.371 +/* 0x0020 99 ( 3 4) */ sub %o2,1,%g3 1.372 +/* 0x0024 ( 4 5) */ cmp %o2,9 1.373 +/* 0x0028 ( 4 5) */ bl,pn %icc,.L77000144 ! tprob=0.44 1.374 +/* 0x002c ( 4 7) */ ldd [%g2],%f8 1.375 +/* 0x0030 ( 5 8) */ ld [%o1],%f7 1.376 +/* 0x0034 ( 5 6) */ add %o1,16,%g4 1.377 +/* 0x0038 ( 5 6) */ sub %o2,5,%g1 1.378 +/* 0x003c ( 6 9) */ ld [%o1+4],%f5 1.379 +/* 0x0040 ( 6 7) */ or %g0,4,%o5 1.380 +/* 0x0044 ( 7 10) */ ld [%o1+8],%f3 1.381 +/* 0x0048 ( 7 8) */ fmovs %f8,%f6 1.382 +/* 0x004c ( 8 11) */ ld [%o1+12],%f1 1.383 + .L900000305: /* frequency 64.0 confidence 0.0 */ 1.384 +/* 0x0050 ( 8 16) */ ld [%g4],%f11 1.385 +/* 0x0054 ( 8 9) */ add %o5,5,%o5 1.386 +/* 0x0058 ( 8 9) */ add %g4,20,%g4 1.387 +/* 0x005c ( 8 11) */ fsubd %f6,%f8,%f6 1.388 +/* 0x0060 ( 9 10) */ std %f6,[%g5] 1.389 +/* 0x0064 ( 9 9) */ cmp %o5,%g1 1.390 +/* 0x0068 ( 9 10) */ add %g5,40,%g5 1.391 +/* 0x006c ( 0 0) */ fmovs %f8,%f4 1.392 +/* 0x0070 (10 18) */ ld [%g4-16],%f7 1.393 +/* 0x0074 (10 13) */ fsubd %f4,%f8,%f12 1.394 +/* 0x0078 ( 0 0) */ fmovs %f8,%f2 1.395 +/* 0x007c (11 12) */ std %f12,[%g5-32] 1.396 +/* 0x0080 (12 20) */ ld [%g4-12],%f5 1.397 +/* 0x0084 (12 15) */ fsubd %f2,%f8,%f12 1.398 +/* 
0x0088 ( 0 0) */ fmovs %f8,%f0 1.399 +/* 0x008c (13 14) */ std %f12,[%g5-24] 1.400 +/* 0x0090 (14 22) */ ld [%g4-8],%f3 1.401 +/* 0x0094 (14 17) */ fsubd %f0,%f8,%f12 1.402 +/* 0x0098 ( 0 0) */ fmovs %f8,%f10 1.403 +/* 0x009c (15 16) */ std %f12,[%g5-16] 1.404 +/* 0x00a0 (16 24) */ ld [%g4-4],%f1 1.405 +/* 0x00a4 (16 19) */ fsubd %f10,%f8,%f10 1.406 +/* 0x00a8 ( 0 0) */ fmovs %f8,%f6 1.407 +/* 0x00ac (17 18) */ ble,pt %icc,.L900000305 ! tprob=0.50 1.408 +/* 0x00b0 (17 18) */ std %f10,[%g5-8] 1.409 + .L900000308: /* frequency 8.0 confidence 0.0 */ 1.410 +/* 0x00b4 ( 0 1) */ fmovs %f8,%f4 1.411 +/* 0x00b8 ( 0 1) */ add %g5,32,%g5 1.412 +/* 0x00bc ( 0 1) */ cmp %o5,%g3 1.413 +/* 0x00c0 ( 1 2) */ fmovs %f8,%f2 1.414 +/* 0x00c4 ( 2 3) */ fmovs %f8,%f0 1.415 +/* 0x00c8 ( 4 7) */ fsubd %f6,%f8,%f6 1.416 +/* 0x00cc ( 4 5) */ std %f6,[%g5-32] 1.417 +/* 0x00d0 ( 5 8) */ fsubd %f4,%f8,%f4 1.418 +/* 0x00d4 ( 5 6) */ std %f4,[%g5-24] 1.419 +/* 0x00d8 ( 6 9) */ fsubd %f2,%f8,%f2 1.420 +/* 0x00dc ( 6 7) */ std %f2,[%g5-16] 1.421 +/* 0x00e0 ( 7 10) */ fsubd %f0,%f8,%f0 1.422 +/* 0x00e4 ( 7 8) */ bg,pn %icc,.L77000140 ! tprob=0.14 1.423 +/* 0x00e8 ( 7 8) */ std %f0,[%g5-8] 1.424 + .L77000144: /* frequency 0.7 confidence 0.0 */ 1.425 +/* 0x00ec ( 0 3) */ ld [%g4],%f1 1.426 + .L900000309: /* frequency 6.4 confidence 0.0 */ 1.427 +/* 0x00f0 ( 0 3) */ ldd [%g2],%f8 1.428 +/* 0x00f4 ( 0 1) */ add %o5,1,%o5 1.429 +/* 0x00f8 ( 0 1) */ add %g4,4,%g4 1.430 +/* 0x00fc ( 1 2) */ cmp %o5,%g3 1.431 +/* 0x0100 ( 2 3) */ fmovs %f8,%f0 1.432 +/* 0x0104 ( 4 7) */ fsubd %f0,%f8,%f0 1.433 +/* 0x0108 ( 4 5) */ std %f0,[%g5] 1.434 +/* 0x010c ( 4 5) */ add %g5,8,%g5 1.435 +/* 0x0110 ( 4 5) */ ble,a,pt %icc,.L900000309 ! tprob=0.86 1.436 +/* 0x0114 ( 6 9) */ ld [%g4],%f1 1.437 + .L77000140: /* frequency 1.0 confidence 0.0 */ 1.438 +/* 0x0118 ( 0 2) */ retl ! 
Result = 1.439 +/* 0x011c ( 1 2) */ nop 1.440 +/* 0x0120 0 ( 0 0) */ .type conv_i32_to_d32,2 1.441 +/* 0x0120 ( 0 0) */ .size conv_i32_to_d32,(.-conv_i32_to_d32) 1.442 + 1.443 + .section ".text",#alloc,#execinstr 1.444 +/* 000000 0 ( 0 0) */ .align 8 1.445 +! 1.446 +! CONSTANT POOL 1.447 +! 1.448 + .L_const_seg_900000401: /* frequency 1.0 confidence 0.0 */ 1.449 +/* 000000 0 ( 0 0) */ .word 1127219200,0 1.450 +/* 0x0008 0 ( 0 0) */ .align 4 1.451 +! 1.452 +! SUBROUTINE conv_i32_to_d16 1.453 +! 1.454 +! OFFSET SOURCE LINE LABEL INSTRUCTION (ISSUE TIME) (COMPLETION TIME) 1.455 + 1.456 + .global conv_i32_to_d16 1.457 + conv_i32_to_d16: /* frequency 1.0 confidence 0.0 */ 1.458 +/* 000000 ( 0 1) */ save %sp,-104,%sp 1.459 +/* 0x0004 ( 1 2) */ orcc %g0,%i2,%o0 1.460 + 1.461 +! 100 !} 1.462 +! 103 !void conv_i32_to_d16(double *d16, unsigned int *i32, int len) 1.463 +! 104 !{ 1.464 +! 105 !int i; 1.465 +! 106 !unsigned int a; 1.466 +! 108 !#pragma pipeloop(0) 1.467 +! 109 ! for(i=0;i<len;i++) 1.468 + 1.469 +/* 0x0008 109 ( 1 2) */ ble,pt %icc,.L77000150 ! tprob=0.56 1.470 +/* 0x000c ( 1 2) */ nop 1.471 +/* 0x0010 ( 2 3) */ sub %o0,1,%o5 1.472 +/* 0x0014 ( 2 3) */ sethi %hi(0xfc00),%g2 1.473 + 1.474 +! 110 ! { 1.475 +! 111 ! a=i32[i]; 1.476 +! 112 ! d16[2*i]=(double)(a&0xffff); 1.477 +! 113 ! d16[2*i+1]=(double)(a>>16); 1.478 + 1.479 +/* 0x0018 113 ( 3 4) */ sethi %hi(.L_const_seg_900000401),%o0 1.480 +/* 0x001c ( 3 4) */ add %o5,1,%g3 1.481 +/* 0x0020 ( 4 5) */ add %g2,1023,%o4 1.482 +/* 0x0024 109 ( 4 5) */ or %g0,0,%g1 1.483 +/* 0x0028 ( 5 6) */ cmp %g3,3 1.484 +/* 0x002c ( 5 6) */ or %g0,%i1,%o7 1.485 +/* 0x0030 ( 6 7) */ add %o0,%lo(.L_const_seg_900000401),%o3 1.486 +/* 0x0034 ( 6 7) */ or %g0,%i0,%g2 1.487 +/* 0x0038 ( 6 7) */ bl,pn %icc,.L77000154 ! 
tprob=0.44 1.488 +/* 0x003c ( 7 8) */ add %o7,4,%o0 1.489 +/* 0x0040 112 ( 7 10) */ ldd [%o3],%f0 1.490 +/* 0x0044 113 ( 7 8) */ or %g0,1,%g1 1.491 +/* 0x0048 111 ( 8 11) */ ld [%o0-4],%o1 1.492 +/* 0x004c 0 ( 8 9) */ or %g0,%o0,%o7 1.493 +/* 0x0050 112 (10 11) */ and %o1,%o4,%o0 1.494 + .L900000406: /* frequency 64.0 confidence 0.0 */ 1.495 +/* 0x0054 112 (22 23) */ st %o0,[%sp+96] 1.496 +/* 0x0058 113 (22 23) */ add %g1,1,%g1 1.497 +/* 0x005c (22 23) */ add %g2,16,%g2 1.498 +/* 0x0060 (23 23) */ cmp %g1,%o5 1.499 +/* 0x0064 (23 24) */ add %o7,4,%o7 1.500 +/* 0x0068 112 (29 31) */ ld [%sp+96],%f3 1.501 +/* 0x006c ( 0 0) */ fmovs %f0,%f2 1.502 +/* 0x0070 (31 34) */ fsubd %f2,%f0,%f2 1.503 +/* 0x0074 113 (32 33) */ srl %o1,16,%o0 1.504 +/* 0x0078 112 (32 33) */ std %f2,[%g2-16] 1.505 +/* 0x007c 113 (33 34) */ st %o0,[%sp+92] 1.506 +/* 0x0080 (40 42) */ ld [%sp+92],%f3 1.507 +/* 0x0084 111 (41 43) */ ld [%o7-4],%o1 1.508 +/* 0x0088 113 ( 0 0) */ fmovs %f0,%f2 1.509 +/* 0x008c (42 45) */ fsubd %f2,%f0,%f2 1.510 +/* 0x0090 112 (43 44) */ and %o1,%o4,%o0 1.511 +/* 0x0094 113 (43 44) */ ble,pt %icc,.L900000406 ! tprob=0.50 1.512 +/* 0x0098 (43 44) */ std %f2,[%g2-8] 1.513 + .L900000409: /* frequency 8.0 confidence 0.0 */ 1.514 +/* 0x009c 112 ( 0 1) */ st %o0,[%sp+96] 1.515 +/* 0x00a0 ( 0 1) */ fmovs %f0,%f2 1.516 +/* 0x00a4 113 ( 0 1) */ add %g2,16,%g2 1.517 +/* 0x00a8 ( 1 2) */ srl %o1,16,%o0 1.518 +/* 0x00ac 112 ( 4 7) */ ld [%sp+96],%f3 1.519 +/* 0x00b0 ( 6 9) */ fsubd %f2,%f0,%f2 1.520 +/* 0x00b4 ( 6 7) */ std %f2,[%g2-16] 1.521 +/* 0x00b8 113 ( 7 8) */ st %o0,[%sp+92] 1.522 +/* 0x00bc (10 11) */ fmovs %f0,%f2 1.523 +/* 0x00c0 (11 14) */ ld [%sp+92],%f3 1.524 +/* 0x00c4 (13 16) */ fsubd %f2,%f0,%f0 1.525 +/* 0x00c8 (13 14) */ std %f0,[%g2-8] 1.526 +/* 0x00cc (14 16) */ ret ! 
Result = 1.527 +/* 0x00d0 (16 17) */ restore %g0,%g0,%g0 1.528 + .L77000154: /* frequency 0.7 confidence 0.0 */ 1.529 +/* 0x00d4 111 ( 0 3) */ ld [%o7],%o0 1.530 + .L900000410: /* frequency 6.4 confidence 0.0 */ 1.531 +/* 0x00d8 112 ( 0 1) */ and %o0,%o4,%o1 1.532 +/* 0x00dc ( 0 1) */ st %o1,[%sp+96] 1.533 +/* 0x00e0 113 ( 0 1) */ add %g1,1,%g1 1.534 +/* 0x00e4 112 ( 1 4) */ ldd [%o3],%f0 1.535 +/* 0x00e8 113 ( 1 2) */ srl %o0,16,%o0 1.536 +/* 0x00ec ( 1 2) */ add %o7,4,%o7 1.537 +/* 0x00f0 ( 2 3) */ cmp %g1,%o5 1.538 +/* 0x00f4 112 ( 3 4) */ fmovs %f0,%f2 1.539 +/* 0x00f8 ( 4 7) */ ld [%sp+96],%f3 1.540 +/* 0x00fc ( 6 9) */ fsubd %f2,%f0,%f2 1.541 +/* 0x0100 ( 6 7) */ std %f2,[%g2] 1.542 +/* 0x0104 113 ( 7 8) */ st %o0,[%sp+92] 1.543 +/* 0x0108 (10 11) */ fmovs %f0,%f2 1.544 +/* 0x010c (11 14) */ ld [%sp+92],%f3 1.545 +/* 0x0110 (13 16) */ fsubd %f2,%f0,%f0 1.546 +/* 0x0114 (13 14) */ std %f0,[%g2+8] 1.547 +/* 0x0118 (13 14) */ add %g2,16,%g2 1.548 +/* 0x011c (13 14) */ ble,a,pt %icc,.L900000410 ! tprob=0.86 1.549 +/* 0x0120 (14 17) */ ld [%o7],%o0 1.550 + .L77000150: /* frequency 1.0 confidence 0.0 */ 1.551 +/* 0x0124 ( 0 2) */ ret ! Result = 1.552 +/* 0x0128 ( 2 3) */ restore %g0,%g0,%g0 1.553 +/* 0x012c 0 ( 0 0) */ .type conv_i32_to_d16,2 1.554 +/* 0x012c ( 0 0) */ .size conv_i32_to_d16,(.-conv_i32_to_d16) 1.555 + 1.556 + .section ".text",#alloc,#execinstr 1.557 +/* 000000 0 ( 0 0) */ .align 8 1.558 +! 1.559 +! CONSTANT POOL 1.560 +! 1.561 + .L_const_seg_900000501: /* frequency 1.0 confidence 0.0 */ 1.562 +/* 000000 0 ( 0 0) */ .word 1127219200,0 1.563 +/* 0x0008 0 ( 0 0) */ .align 4 1.564 +! 1.565 +! SUBROUTINE conv_i32_to_d32_and_d16 1.566 +! 1.567 +! 
OFFSET SOURCE LINE LABEL INSTRUCTION (ISSUE TIME) (COMPLETION TIME) 1.568 + 1.569 + .global conv_i32_to_d32_and_d16 1.570 + conv_i32_to_d32_and_d16: /* frequency 1.0 confidence 0.0 */ 1.571 +/* 000000 ( 0 1) */ save %sp,-104,%sp 1.572 +/* 0x0004 ( 1 2) */ or %g0,%i3,%i4 1.573 +/* 0x0008 ( 1 2) */ or %g0,%i2,%g1 1.574 + 1.575 +! 114 ! } 1.576 +! 115 !} 1.577 +! 118 !void i16_to_d16_and_d32x4(double * /*1/(2^16)*/, double * /* 2^16*/, 1.578 +! 119 ! double * /* 0 */, 1.579 +! 120 ! double * /*result16*/, double * /* result32 */, 1.580 +! 121 ! float * /*source - should be unsigned int* 1.581 +! 122 ! converted to float* */); 1.582 +! 126 !void conv_i32_to_d32_and_d16(double *d32, double *d16, 1.583 +! 127 ! unsigned int *i32, int len) 1.584 +! 128 !{ 1.585 +! 129 !int i; 1.586 +! 130 !unsigned int a; 1.587 +! 132 !#pragma pipeloop(0) 1.588 +! 133 ! for(i=0;i<len-3;i+=4) 1.589 + 1.590 +/* 0x000c 133 ( 2 3) */ sub %i4,3,%g2 1.591 +/* 0x0010 ( 2 3) */ or %g0,0,%o7 1.592 +/* 0x0014 ( 3 4) */ cmp %g2,0 1.593 +/* 0x0018 128 ( 3 4) */ or %g0,%i0,%i3 1.594 +/* 0x001c 133 ( 3 4) */ ble,pt %icc,.L900000515 ! tprob=0.56 1.595 +/* 0x0020 ( 4 5) */ cmp %o7,%i4 1.596 + 1.597 +! 134 ! { 1.598 +! 135 ! i16_to_d16_and_d32x4(&TwoToMinus16, &TwoTo16, &Zero, 1.599 +! 136 ! 
&(d16[2*i]), &(d32[i]), (float *)(&(i32[i]))); 1.600 + 1.601 +/* 0x0024 136 ( 4 5) */ sethi %hi(Zero),%g2 1.602 +/* 0x0028 133 ( 5 6) */ or %g0,%g1,%o3 1.603 +/* 0x002c ( 5 6) */ sub %i4,4,%o2 1.604 +/* 0x0030 136 ( 6 7) */ add %g2,%lo(Zero),%o1 1.605 +/* 0x0034 133 ( 6 7) */ or %g0,0,%o5 1.606 +/* 0x0038 ( 7 8) */ or %g0,0,%o4 1.607 +/* 0x003c 136 ( 7 8) */ or %g0,%o3,%g4 1.608 + .L900000514: /* frequency 6.4 confidence 0.0 */ 1.609 +/* 0x0040 ( 0 3) */ ldd [%o1],%f2 1.610 +/* 0x0044 136 ( 0 1) */ add %i3,%o5,%g2 1.611 +/* 0x0048 ( 0 1) */ add %i1,%o4,%g3 1.612 +/* 0x004c ( 1 4) */ ldd [%o1-8],%f0 1.613 +/* 0x0050 ( 1 2) */ add %o7,4,%o7 1.614 +/* 0x0054 ( 1 2) */ add %o3,16,%o3 1.615 +/* 0x0058 ( 2 3) */ fmovd %f2,%f14 1.616 +/* 0x005c ( 2 5) */ ld [%g4],%f15 1.617 +/* 0x0060 ( 2 3) */ cmp %o7,%o2 1.618 +/* 0x0064 ( 3 4) */ fmovd %f2,%f10 1.619 +/* 0x0068 ( 3 6) */ ld [%g4+4],%f11 1.620 +/* 0x006c ( 4 5) */ fmovd %f2,%f6 1.621 +/* 0x0070 ( 4 7) */ ld [%g4+8],%f7 1.622 +/* 0x0074 ( 5 8) */ ld [%g4+12],%f3 1.623 +/* 0x0078 ( 5 8) */ fxtod %f14,%f14 1.624 +/* 0x007c ( 6 9) */ fxtod %f10,%f10 1.625 +/* 0x0080 ( 6 9) */ ldd [%o1-16],%f16 1.626 +/* 0x0084 ( 7 10) */ fxtod %f6,%f6 1.627 +/* 0x0088 ( 7 8) */ std %f14,[%i3+%o5] 1.628 +/* 0x008c ( 7 8) */ add %o5,32,%o5 1.629 +/* 0x0090 ( 8 11) */ fxtod %f2,%f2 1.630 +/* 0x0094 ( 8 11) */ fmuld %f0,%f14,%f12 1.631 +/* 0x0098 ( 8 9) */ std %f10,[%g2+8] 1.632 +/* 0x009c ( 9 12) */ fmuld %f0,%f10,%f8 1.633 +/* 0x00a0 ( 9 10) */ std %f6,[%g2+16] 1.634 +/* 0x00a4 (10 13) */ fmuld %f0,%f6,%f4 1.635 +/* 0x00a8 (10 11) */ std %f2,[%g2+24] 1.636 +/* 0x00ac (11 14) */ fmuld %f0,%f2,%f0 1.637 +/* 0x00b0 (11 14) */ fdtox %f12,%f12 1.638 +/* 0x00b4 (12 15) */ fdtox %f8,%f8 1.639 +/* 0x00b8 (13 16) */ fdtox %f4,%f4 1.640 +/* 0x00bc (14 17) */ fdtox %f0,%f0 1.641 +/* 0x00c0 (15 18) */ fxtod %f12,%f12 1.642 +/* 0x00c4 (15 16) */ std %f12,[%g3+8] 1.643 +/* 0x00c8 (16 19) */ fxtod %f8,%f8 1.644 +/* 0x00cc (16 17) */ std %f8,[%g3+24] 1.645 
+/* 0x00d0 (17 20) */ fxtod %f4,%f4 1.646 +/* 0x00d4 (17 18) */ std %f4,[%g3+40] 1.647 +/* 0x00d8 (18 21) */ fxtod %f0,%f0 1.648 +/* 0x00dc (18 21) */ fmuld %f12,%f16,%f12 1.649 +/* 0x00e0 (18 19) */ std %f0,[%g3+56] 1.650 +/* 0x00e4 (19 22) */ fmuld %f8,%f16,%f8 1.651 +/* 0x00e8 (20 23) */ fmuld %f4,%f16,%f4 1.652 +/* 0x00ec (21 24) */ fmuld %f0,%f16,%f0 1.653 +/* 0x00f0 (21 24) */ fsubd %f14,%f12,%f12 1.654 +/* 0x00f4 (21 22) */ std %f12,[%i1+%o4] 1.655 +/* 0x00f8 (22 25) */ fsubd %f10,%f8,%f8 1.656 +/* 0x00fc (22 23) */ std %f8,[%g3+16] 1.657 +/* 0x0100 (22 23) */ add %o4,64,%o4 1.658 +/* 0x0104 (23 26) */ fsubd %f6,%f4,%f4 1.659 +/* 0x0108 (23 24) */ std %f4,[%g3+32] 1.660 +/* 0x010c (24 27) */ fsubd %f2,%f0,%f0 1.661 +/* 0x0110 (24 25) */ std %f0,[%g3+48] 1.662 +/* 0x0114 (24 25) */ ble,pt %icc,.L900000514 ! tprob=0.86 1.663 +/* 0x0118 (25 26) */ or %g0,%o3,%g4 1.664 + .L77000159: /* frequency 1.0 confidence 0.0 */ 1.665 + 1.666 +! 137 ! } 1.667 +! 138 ! for(;i<len;i++) 1.668 + 1.669 +/* 0x011c 138 ( 0 1) */ cmp %o7,%i4 1.670 + .L900000515: /* frequency 1.0 confidence 0.0 */ 1.671 +/* 0x0120 138 ( 0 1) */ bge,pt %icc,.L77000164 ! tprob=0.56 1.672 +/* 0x0124 ( 0 1) */ nop 1.673 + 1.674 +! 139 ! { 1.675 +! 140 ! a=i32[i]; 1.676 +! 141 ! d32[i]=(double)(i32[i]); 1.677 +! 142 ! d16[2*i]=(double)(a&0xffff); 1.678 +! 143 ! 
d16[2*i+1]=(double)(a>>16); 1.679 + 1.680 +/* 0x0128 143 ( 0 1) */ sethi %hi(.L_const_seg_900000501),%o1 1.681 +/* 0x012c 138 ( 1 2) */ sethi %hi(0xfc00),%o0 1.682 +/* 0x0130 141 ( 1 4) */ ldd [%o1+%lo(.L_const_seg_900000501)],%f0 1.683 +/* 0x0134 138 ( 1 2) */ sub %i4,%o7,%g3 1.684 +/* 0x0138 ( 2 3) */ sll %o7,2,%g2 1.685 +/* 0x013c ( 2 3) */ add %o0,1023,%o3 1.686 +/* 0x0140 ( 3 4) */ sll %o7,3,%g4 1.687 +/* 0x0144 ( 3 4) */ cmp %g3,3 1.688 +/* 0x0148 ( 4 5) */ add %g1,%g2,%o0 1.689 +/* 0x014c ( 4 5) */ add %o1,%lo(.L_const_seg_900000501),%o2 1.690 +/* 0x0150 ( 5 6) */ add %i3,%g4,%o4 1.691 +/* 0x0154 ( 5 6) */ sub %i4,1,%o1 1.692 +/* 0x0158 ( 6 7) */ sll %o7,4,%g5 1.693 +/* 0x015c ( 6 7) */ bl,pn %icc,.L77000161 ! tprob=0.44 1.694 +/* 0x0160 ( 7 8) */ add %i1,%g5,%o5 1.695 +/* 0x0164 141 ( 7 10) */ ld [%g1+%g2],%f3 1.696 +/* 0x0168 143 ( 7 8) */ add %o4,8,%o4 1.697 +/* 0x016c 140 ( 8 11) */ ld [%g1+%g2],%g1 1.698 +/* 0x0170 143 ( 8 9) */ add %o5,16,%o5 1.699 +/* 0x0174 ( 8 9) */ add %o7,1,%o7 1.700 +/* 0x0178 141 ( 9 10) */ fmovs %f0,%f2 1.701 +/* 0x017c 143 ( 9 10) */ add %o0,4,%o0 1.702 +/* 0x0180 142 (10 11) */ and %g1,%o3,%g2 1.703 +/* 0x0184 141 (11 14) */ fsubd %f2,%f0,%f2 1.704 +/* 0x0188 (11 12) */ std %f2,[%o4-8] 1.705 +/* 0x018c 143 (11 12) */ srl %g1,16,%g1 1.706 +/* 0x0190 142 (12 13) */ st %g2,[%sp+96] 1.707 +/* 0x0194 (15 16) */ fmovs %f0,%f2 1.708 +/* 0x0198 (16 19) */ ld [%sp+96],%f3 1.709 +/* 0x019c (18 21) */ fsubd %f2,%f0,%f2 1.710 +/* 0x01a0 (18 19) */ std %f2,[%o5-16] 1.711 +/* 0x01a4 143 (19 20) */ st %g1,[%sp+92] 1.712 +/* 0x01a8 (22 23) */ fmovs %f0,%f2 1.713 +/* 0x01ac (23 26) */ ld [%sp+92],%f3 1.714 +/* 0x01b0 (25 28) */ fsubd %f2,%f0,%f2 1.715 +/* 0x01b4 (25 26) */ std %f2,[%o5-8] 1.716 + .L900000509: /* frequency 64.0 confidence 0.0 */ 1.717 +/* 0x01b8 141 (26 28) */ ld [%o0],%f3 1.718 +/* 0x01bc 143 (26 27) */ add %o7,2,%o7 1.719 +/* 0x01c0 (26 27) */ add %o5,32,%o5 1.720 +/* 0x01c4 140 (27 29) */ ld [%o0],%g1 1.721 +/* 0x01c8 143 
(27 27) */ cmp %o7,%o1 1.722 +/* 0x01cc (27 28) */ add %o4,16,%o4 1.723 +/* 0x01d0 141 ( 0 0) */ fmovs %f0,%f2 1.724 +/* 0x01d4 (28 31) */ fsubd %f2,%f0,%f2 1.725 +/* 0x01d8 (29 30) */ std %f2,[%o4-16] 1.726 +/* 0x01dc 142 (29 30) */ and %g1,%o3,%g2 1.727 +/* 0x01e0 (30 31) */ st %g2,[%sp+96] 1.728 +/* 0x01e4 (37 39) */ ld [%sp+96],%f3 1.729 +/* 0x01e8 ( 0 0) */ fmovs %f0,%f2 1.730 +/* 0x01ec (39 42) */ fsubd %f2,%f0,%f2 1.731 +/* 0x01f0 143 (40 41) */ srl %g1,16,%g1 1.732 +/* 0x01f4 142 (40 41) */ std %f2,[%o5-32] 1.733 +/* 0x01f8 143 (41 42) */ st %g1,[%sp+92] 1.734 +/* 0x01fc (48 50) */ ld [%sp+92],%f3 1.735 +/* 0x0200 ( 0 0) */ fmovs %f0,%f2 1.736 +/* 0x0204 (50 53) */ fsubd %f2,%f0,%f2 1.737 +/* 0x0208 (51 52) */ std %f2,[%o5-24] 1.738 +/* 0x020c (51 52) */ add %o0,4,%o0 1.739 +/* 0x0210 141 (52 54) */ ld [%o0],%f3 1.740 +/* 0x0214 140 (53 55) */ ld [%o0],%g1 1.741 +/* 0x0218 141 ( 0 0) */ fmovs %f0,%f2 1.742 +/* 0x021c (54 57) */ fsubd %f2,%f0,%f2 1.743 +/* 0x0220 (55 56) */ std %f2,[%o4-8] 1.744 +/* 0x0224 142 (55 56) */ and %g1,%o3,%g2 1.745 +/* 0x0228 (56 57) */ st %g2,[%sp+96] 1.746 +/* 0x022c (63 65) */ ld [%sp+96],%f3 1.747 +/* 0x0230 ( 0 0) */ fmovs %f0,%f2 1.748 +/* 0x0234 (65 68) */ fsubd %f2,%f0,%f2 1.749 +/* 0x0238 143 (66 67) */ srl %g1,16,%g1 1.750 +/* 0x023c 142 (66 67) */ std %f2,[%o5-16] 1.751 +/* 0x0240 143 (67 68) */ st %g1,[%sp+92] 1.752 +/* 0x0244 (74 76) */ ld [%sp+92],%f3 1.753 +/* 0x0248 ( 0 0) */ fmovs %f0,%f2 1.754 +/* 0x024c (76 79) */ fsubd %f2,%f0,%f2 1.755 +/* 0x0250 (77 78) */ std %f2,[%o5-8] 1.756 +/* 0x0254 (77 78) */ bl,pt %icc,.L900000509 ! tprob=0.50 1.757 +/* 0x0258 (77 78) */ add %o0,4,%o0 1.758 + .L900000512: /* frequency 8.0 confidence 0.0 */ 1.759 +/* 0x025c 143 ( 0 1) */ cmp %o7,%i4 1.760 +/* 0x0260 ( 0 1) */ bge,pn %icc,.L77000164 ! 
tprob=0.14 1.761 +/* 0x0264 ( 0 1) */ nop 1.762 + .L77000161: /* frequency 0.7 confidence 0.0 */ 1.763 +/* 0x0268 141 ( 0 3) */ ld [%o0],%f3 1.764 + .L900000513: /* frequency 6.4 confidence 0.0 */ 1.765 +/* 0x026c 141 ( 0 3) */ ldd [%o2],%f0 1.766 +/* 0x0270 143 ( 0 1) */ add %o7,1,%o7 1.767 +/* 0x0274 140 ( 1 4) */ ld [%o0],%o1 1.768 +/* 0x0278 143 ( 1 2) */ add %o0,4,%o0 1.769 +/* 0x027c ( 1 2) */ cmp %o7,%i4 1.770 +/* 0x0280 141 ( 2 3) */ fmovs %f0,%f2 1.771 +/* 0x0284 142 ( 3 4) */ and %o1,%o3,%g1 1.772 +/* 0x0288 141 ( 4 7) */ fsubd %f2,%f0,%f2 1.773 +/* 0x028c ( 4 5) */ std %f2,[%o4] 1.774 +/* 0x0290 143 ( 4 5) */ srl %o1,16,%o1 1.775 +/* 0x0294 142 ( 5 6) */ st %g1,[%sp+96] 1.776 +/* 0x0298 143 ( 5 6) */ add %o4,8,%o4 1.777 +/* 0x029c 142 ( 8 9) */ fmovs %f0,%f2 1.778 +/* 0x02a0 ( 9 12) */ ld [%sp+96],%f3 1.779 +/* 0x02a4 (11 14) */ fsubd %f2,%f0,%f2 1.780 +/* 0x02a8 (11 12) */ std %f2,[%o5] 1.781 +/* 0x02ac 143 (12 13) */ st %o1,[%sp+92] 1.782 +/* 0x02b0 (15 16) */ fmovs %f0,%f2 1.783 +/* 0x02b4 (16 19) */ ld [%sp+92],%f3 1.784 +/* 0x02b8 (18 21) */ fsubd %f2,%f0,%f0 1.785 +/* 0x02bc (18 19) */ std %f0,[%o5+8] 1.786 +/* 0x02c0 (18 19) */ add %o5,16,%o5 1.787 +/* 0x02c4 (18 19) */ bl,a,pt %icc,.L900000513 ! tprob=0.86 1.788 +/* 0x02c8 (19 22) */ ld [%o0],%f3 1.789 + .L77000164: /* frequency 1.0 confidence 0.0 */ 1.790 +/* 0x02cc ( 0 2) */ ret ! Result = 1.791 +/* 0x02d0 ( 2 3) */ restore %g0,%g0,%g0 1.792 +/* 0x02d4 0 ( 0 0) */ .type conv_i32_to_d32_and_d16,2 1.793 +/* 0x02d4 ( 0 0) */ .size conv_i32_to_d32_and_d16,(.-conv_i32_to_d32_and_d16) 1.794 + 1.795 + .section ".text",#alloc,#execinstr 1.796 +/* 000000 0 ( 0 0) */ .align 4 1.797 +! 1.798 +! SUBROUTINE adjust_montf_result 1.799 +! 1.800 +! OFFSET SOURCE LINE LABEL INSTRUCTION (ISSUE TIME) (COMPLETION TIME) 1.801 + 1.802 + .global adjust_montf_result 1.803 + adjust_montf_result: /* frequency 1.0 confidence 0.0 */ 1.804 + 1.805 +! 144 ! } 1.806 +! 145 !} 1.807 +! 
148 !void adjust_montf_result(unsigned int *i32, unsigned int *nint, int len) 1.808 +! 149 !{ 1.809 +! 150 !long long acc; 1.810 +! 151 !int i; 1.811 +! 153 ! if(i32[len]>0) i=-1; 1.812 + 1.813 +/* 000000 153 ( 0 1) */ sll %o2,2,%g1 1.814 +/* 0x0004 ( 0 1) */ or %g0,-1,%g3 1.815 +/* 0x0008 ( 1 4) */ ld [%o0+%g1],%g1 1.816 +/* 0x000c ( 3 4) */ cmp %g1,0 1.817 +/* 0x0010 ( 3 4) */ bleu,pn %icc,.L77000175 ! tprob=0.50 1.818 +/* 0x0014 ( 3 4) */ or %g0,%o1,%o3 1.819 +/* 0x0018 ( 4 5) */ ba .L900000611 ! tprob=1.00 1.820 +/* 0x001c ( 4 5) */ cmp %g3,0 1.821 + .L77000175: /* frequency 0.8 confidence 0.0 */ 1.822 + 1.823 +! 154 ! else 1.824 +! 155 ! { 1.825 +! 156 ! for(i=len-1; i>=0; i--) 1.826 + 1.827 +/* 0x0020 156 ( 0 1) */ subcc %o2,1,%g3 1.828 +/* 0x0024 ( 0 1) */ bneg,pt %icc,.L900000611 ! tprob=0.60 1.829 +/* 0x0028 ( 1 2) */ cmp %g3,0 1.830 +/* 0x002c ( 1 2) */ sll %g3,2,%g1 1.831 +/* 0x0030 ( 2 3) */ add %o0,%g1,%g2 1.832 +/* 0x0034 ( 2 3) */ add %o1,%g1,%g1 1.833 + 1.834 +! 157 ! { 1.835 +! 158 ! if(i32[i]!=nint[i]) break; 1.836 + 1.837 +/* 0x0038 158 ( 3 6) */ ld [%g1],%g5 1.838 + .L900000610: /* frequency 5.3 confidence 0.0 */ 1.839 +/* 0x003c 158 ( 0 3) */ ld [%g2],%o5 1.840 +/* 0x0040 ( 0 1) */ sub %g1,4,%g1 ! step &nint[i] down one word (scan from most significant word) 1.841 +/* 0x0044 ( 0 1) */ sub %g2,4,%g2 ! step &i32[i] down one word 1.842 +/* 0x0048 ( 2 3) */ cmp %o5,%g5 1.843 +/* 0x004c ( 2 3) */ bne,pn %icc,.L77000182 ! tprob=0.16 1.844 +/* 0x0050 ( 2 3) */ nop 1.845 +/* 0x0054 ( 3 4) */ subcc %g3,1,%g3 ! i--; loop while i>=0 so the scan stays inside [0,len-1] 1.846 +/* 0x0058 ( 3 4) */ bpos,a,pt %icc,.L900000610 ! tprob=0.84 1.847 +/* 0x005c ( 3 6) */ ld [%g1],%g5 1.848 + .L77000182: /* frequency 1.0 confidence 0.0 */ 1.849 + 1.850 +! 159 ! } 1.851 +! 160 ! } 1.852 +! 161 ! if((i<0)||(i32[i]>nint[i])) 1.853 + 1.854 +/* 0x0060 161 ( 0 1) */ cmp %g3,0 1.855 + .L900000611: /* frequency 1.0 confidence 0.0 */ 1.856 +/* 0x0064 161 ( 0 1) */ bl,pn %icc,.L77000198 !
tprob=0.50 1.857 +/* 0x0068 ( 0 1) */ sll %g3,2,%g2 1.858 +/* 0x006c ( 1 4) */ ld [%o1+%g2],%g1 1.859 +/* 0x0070 ( 2 5) */ ld [%o0+%g2],%g2 1.860 +/* 0x0074 ( 4 5) */ cmp %g2,%g1 1.861 +/* 0x0078 ( 4 5) */ bleu,pt %icc,.L77000191 ! tprob=0.56 1.862 +/* 0x007c ( 4 5) */ nop 1.863 + .L77000198: /* frequency 0.8 confidence 0.0 */ 1.864 + 1.865 +! 162 ! { 1.866 +! 163 ! acc=0; 1.867 +! 164 ! for(i=0;i<len;i++) 1.868 + 1.869 +/* 0x0080 164 ( 0 1) */ cmp %o2,0 1.870 +/* 0x0084 ( 0 1) */ ble,pt %icc,.L77000191 ! tprob=0.60 1.871 +/* 0x0088 ( 0 1) */ nop 1.872 +/* 0x008c 161 ( 1 2) */ or %g0,-1,%g2 1.873 +/* 0x0090 ( 1 2) */ sub %o2,1,%g4 1.874 +/* 0x0094 ( 2 3) */ srl %g2,0,%g3 1.875 +/* 0x0098 163 ( 2 3) */ or %g0,0,%g5 1.876 +/* 0x009c 164 ( 3 4) */ or %g0,0,%o5 1.877 +/* 0x00a0 161 ( 3 4) */ or %g0,%o0,%o4 1.878 +/* 0x00a4 ( 4 5) */ cmp %o2,3 1.879 +/* 0x00a8 ( 4 5) */ add %o1,4,%g2 1.880 +/* 0x00ac 164 ( 4 5) */ bl,pn %icc,.L77000199 ! tprob=0.40 1.881 +/* 0x00b0 ( 5 6) */ add %o0,8,%g1 1.882 + 1.883 +! 165 ! { 1.884 +! 166 ! acc=acc+(unsigned long long)(i32[i])-(unsigned long long)(nint[i]); 1.885 + 1.886 +/* 0x00b4 166 ( 5 8) */ ld [%o0],%o2 1.887 +/* 0x00b8 0 ( 5 6) */ or %g0,%g2,%o3 1.888 +/* 0x00bc 166 ( 6 9) */ ld [%o1],%o1 1.889 +/* 0x00c0 0 ( 6 7) */ or %g0,%g1,%o4 1.890 + 1.891 +! 167 ! i32[i]=acc&0xffffffff; 1.892 +! 168 ! 
acc=acc>>32; 1.893 + 1.894 +/* 0x00c4 168 ( 6 7) */ or %g0,2,%o5 1.895 +/* 0x00c8 166 ( 7 10) */ ld [%o0+4],%g1 1.896 +/* 0x00cc 164 ( 8 9) */ sub %o2,%o1,%o2 1.897 +/* 0x00d0 ( 9 10) */ or %g0,%o2,%g5 1.898 +/* 0x00d4 167 ( 9 10) */ and %o2,%g3,%o2 1.899 +/* 0x00d8 ( 9 10) */ st %o2,[%o0] 1.900 +/* 0x00dc 168 (10 11) */ srax %g5,32,%g5 1.901 + .L900000605: /* frequency 64.0 confidence 0.0 */ 1.902 +/* 0x00e0 166 (12 20) */ ld [%o3],%o2 1.903 +/* 0x00e4 168 (12 13) */ add %o5,1,%o5 1.904 +/* 0x00e8 (12 13) */ add %o3,4,%o3 1.905 +/* 0x00ec (13 13) */ cmp %o5,%g4 1.906 +/* 0x00f0 (13 14) */ add %o4,4,%o4 1.907 +/* 0x00f4 164 (14 14) */ sub %g1,%o2,%g1 1.908 +/* 0x00f8 (15 15) */ add %g1,%g5,%g5 1.909 +/* 0x00fc 167 (16 17) */ and %g5,%g3,%o2 1.910 +/* 0x0100 166 (16 24) */ ld [%o4-4],%g1 1.911 +/* 0x0104 167 (17 18) */ st %o2,[%o4-8] 1.912 +/* 0x0108 168 (17 18) */ ble,pt %icc,.L900000605 ! tprob=0.50 1.913 +/* 0x010c (17 18) */ srax %g5,32,%g5 1.914 + .L900000608: /* frequency 8.0 confidence 0.0 */ 1.915 +/* 0x0110 166 ( 0 3) */ ld [%o3],%g2 1.916 +/* 0x0114 164 ( 2 3) */ sub %g1,%g2,%g1 1.917 +/* 0x0118 ( 3 4) */ add %g1,%g5,%g1 1.918 +/* 0x011c 167 ( 4 5) */ and %g1,%g3,%g2 1.919 +/* 0x0120 ( 5 7) */ retl ! Result = 1.920 +/* 0x0124 ( 6 7) */ st %g2,[%o4-4] 1.921 + .L77000199: /* frequency 0.6 confidence 0.0 */ 1.922 +/* 0x0128 166 ( 0 3) */ ld [%o4],%g1 1.923 + .L900000609: /* frequency 5.3 confidence 0.0 */ 1.924 +/* 0x012c 166 ( 0 3) */ ld [%o3],%g2 1.925 +/* 0x0130 ( 0 1) */ add %g5,%g1,%g1 1.926 +/* 0x0134 168 ( 0 1) */ add %o5,1,%o5 1.927 +/* 0x0138 ( 1 2) */ add %o3,4,%o3 1.928 +/* 0x013c ( 1 2) */ cmp %o5,%g4 1.929 +/* 0x0140 166 ( 2 3) */ sub %g1,%g2,%g1 1.930 +/* 0x0144 167 ( 3 4) */ and %g1,%g3,%g2 1.931 +/* 0x0148 ( 3 4) */ st %g2,[%o4] 1.932 +/* 0x014c 168 ( 3 4) */ add %o4,4,%o4 1.933 +/* 0x0150 ( 4 5) */ srax %g1,32,%g5 1.934 +/* 0x0154 ( 4 5) */ ble,a,pt %icc,.L900000609 ! 
tprob=0.84 1.935 +/* 0x0158 ( 4 7) */ ld [%o4],%g1 1.936 + .L77000191: /* frequency 1.0 confidence 0.0 */ 1.937 +/* 0x015c ( 0 2) */ retl ! Result = 1.938 +/* 0x0160 ( 1 2) */ nop 1.939 +/* 0x0164 0 ( 0 0) */ .type adjust_montf_result,2 1.940 +/* 0x0164 ( 0 0) */ .size adjust_montf_result,(.-adjust_montf_result) 1.941 + 1.942 + .section ".text",#alloc,#execinstr 1.943 +/* 000000 0 ( 0 0) */ .align 32 1.944 +! 1.945 +! SUBROUTINE mont_mulf_noconv 1.946 +! 1.947 +! OFFSET SOURCE LINE LABEL INSTRUCTION (ISSUE TIME) (COMPLETION TIME) 1.948 + 1.949 + .global mont_mulf_noconv 1.950 + mont_mulf_noconv: /* frequency 1.0 confidence 0.0 */ 1.951 +/* 000000 ( 0 1) */ save %sp,-144,%sp 1.952 +/* 0x0004 ( 1 2) */ st %i0,[%fp+68] 1.953 + 1.954 +! 169 ! } 1.955 +! 170 ! } 1.956 +! 171 !} 1.957 +! 175 !void cleanup(double *dt, int from, int tlen); 1.958 +! 177 !/* 1.959 +! 178 !** the lengths of the input arrays should be at least the following: 1.960 +! 179 !** result[nlen+1], dm1[nlen], dm2[2*nlen+1], dt[4*nlen+2], dn[nlen], nint[nlen] 1.961 +! 180 !** all of them should be different from one another 1.962 +! 181 !** 1.963 +! 182 !*/ 1.964 +! 183 !void mont_mulf_noconv(unsigned int *result, 1.965 +! 184 ! double *dm1, double *dm2, double *dt, 1.966 +! 185 ! double *dn, unsigned int *nint, 1.967 +! 186 ! int nlen, double dn0) 1.968 +! 187 !{ 1.969 +! 188 ! int i, j, jj; 1.970 +! 189 ! int tmp; 1.971 +! 190 ! double digit, m2j, nextm2j, a, b; 1.972 +! 191 ! double *dptmp, *pdm1, *pdm2, *pdn, *pdtj, pdn_0, pdm1_0; 1.973 +! 193 ! pdm1=&(dm1[0]); 1.974 +! 194 ! pdm2=&(dm2[0]); 1.975 +! 195 ! pdn=&(dn[0]); 1.976 +! 196 ! 
pdm2[2*nlen]=Zero; 1.977 + 1.978 +/* 0x0008 196 ( 1 2) */ sethi %hi(Zero),%g2 1.979 +/* 0x000c 187 ( 1 2) */ or %g0,%i2,%o1 1.980 +/* 0x0010 ( 2 3) */ st %i5,[%fp+88] 1.981 +/* 0x0014 ( 2 3) */ or %g0,%i3,%o2 1.982 +/* 0x0018 196 ( 2 3) */ add %g2,%lo(Zero),%g4 1.983 +/* 0x001c ( 3 6) */ ldd [%g2+%lo(Zero)],%f2 1.984 +/* 0x0020 187 ( 3 4) */ or %g0,%o2,%g5 1.985 +/* 0x0024 196 ( 3 4) */ or %g0,%o1,%i0 1.986 +/* 0x0028 187 ( 4 5) */ or %g0,%i4,%i2 1.987 + 1.988 +! 198 ! if (nlen!=16) 1.989 +! 199 ! { 1.990 +! 200 ! for(i=0;i<4*nlen+2;i++) dt[i]=Zero; 1.991 +! 202 ! a=dt[0]=pdm1[0]*pdm2[0]; 1.992 +! 203 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16); 1.993 +! 205 ! pdtj=&(dt[0]); 1.994 +! 206 ! for(j=jj=0;j<2*nlen;j++,jj++,pdtj++) 1.995 +! 207 ! { 1.996 +! 208 ! m2j=pdm2[j]; 1.997 +! 209 ! a=pdtj[0]+pdn[0]*digit; 1.998 +! 210 ! b=pdtj[1]+pdm1[0]*pdm2[j+1]+a*TwoToMinus16; 1.999 +! 211 ! pdtj[1]=b; 1.1000 +! 213 !#pragma pipeloop(0) 1.1001 +! 214 ! for(i=1;i<nlen;i++) 1.1002 +! 215 ! { 1.1003 +! 216 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit; 1.1004 +! 217 ! } 1.1005 +! 218 ! if((jj==30)) {cleanup(dt,j/2+1,2*nlen+1); jj=0;} 1.1006 +! 219 ! 1.1007 +! 220 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16); 1.1008 +! 221 ! } 1.1009 +! 222 ! } 1.1010 +! 223 ! else 1.1011 +! 224 ! { 1.1012 +! 225 ! a=dt[0]=pdm1[0]*pdm2[0]; 1.1013 +! 227 ! dt[65]= dt[64]= dt[63]= dt[62]= dt[61]= dt[60]= 1.1014 +! 228 ! dt[59]= dt[58]= dt[57]= dt[56]= dt[55]= dt[54]= 1.1015 +! 229 ! dt[53]= dt[52]= dt[51]= dt[50]= dt[49]= dt[48]= 1.1016 +! 230 ! dt[47]= dt[46]= dt[45]= dt[44]= dt[43]= dt[42]= 1.1017 +! 231 ! dt[41]= dt[40]= dt[39]= dt[38]= dt[37]= dt[36]= 1.1018 +! 232 ! dt[35]= dt[34]= dt[33]= dt[32]= dt[31]= dt[30]= 1.1019 +! 233 ! dt[29]= dt[28]= dt[27]= dt[26]= dt[25]= dt[24]= 1.1020 +! 234 ! dt[23]= dt[22]= dt[21]= dt[20]= dt[19]= dt[18]= 1.1021 +! 235 ! dt[17]= dt[16]= dt[15]= dt[14]= dt[13]= dt[12]= 1.1022 +! 236 ! dt[11]= dt[10]= dt[ 9]= dt[ 8]= dt[ 7]= dt[ 6]= 1.1023 +! 237 ! 
dt[ 5]= dt[ 4]= dt[ 3]= dt[ 2]= dt[ 1]=Zero; 1.1024 +! 239 ! pdn_0=pdn[0]; 1.1025 +! 240 ! pdm1_0=pdm1[0]; 1.1026 +! 242 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16); 1.1027 +! 243 ! pdtj=&(dt[0]); 1.1028 +! 245 ! for(j=0;j<32;j++,pdtj++) 1.1029 +! 246 ! { 1.1030 +! 248 ! m2j=pdm2[j]; 1.1031 +! 249 ! a=pdtj[0]+pdn_0*digit; 1.1032 +! 250 ! b=pdtj[1]+pdm1_0*pdm2[j+1]+a*TwoToMinus16; 1.1033 +! 251 ! pdtj[1]=b; 1.1034 +! 253 ! /**** this loop will be fully unrolled: 1.1035 +! 254 ! for(i=1;i<16;i++) 1.1036 +! 255 ! { 1.1037 +! 256 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit; 1.1038 +! 257 ! } 1.1039 +! 258 ! *************************************/ 1.1040 +! 259 ! pdtj[2]+=pdm1[1]*m2j+pdn[1]*digit; 1.1041 +! 260 ! pdtj[4]+=pdm1[2]*m2j+pdn[2]*digit; 1.1042 +! 261 ! pdtj[6]+=pdm1[3]*m2j+pdn[3]*digit; 1.1043 +! 262 ! pdtj[8]+=pdm1[4]*m2j+pdn[4]*digit; 1.1044 +! 263 ! pdtj[10]+=pdm1[5]*m2j+pdn[5]*digit; 1.1045 +! 264 ! pdtj[12]+=pdm1[6]*m2j+pdn[6]*digit; 1.1046 +! 265 ! pdtj[14]+=pdm1[7]*m2j+pdn[7]*digit; 1.1047 +! 266 ! pdtj[16]+=pdm1[8]*m2j+pdn[8]*digit; 1.1048 +! 267 ! pdtj[18]+=pdm1[9]*m2j+pdn[9]*digit; 1.1049 +! 268 ! pdtj[20]+=pdm1[10]*m2j+pdn[10]*digit; 1.1050 +! 269 ! pdtj[22]+=pdm1[11]*m2j+pdn[11]*digit; 1.1051 +! 270 ! pdtj[24]+=pdm1[12]*m2j+pdn[12]*digit; 1.1052 +! 271 ! pdtj[26]+=pdm1[13]*m2j+pdn[13]*digit; 1.1053 +! 272 ! pdtj[28]+=pdm1[14]*m2j+pdn[14]*digit; 1.1054 +! 273 ! pdtj[30]+=pdm1[15]*m2j+pdn[15]*digit; 1.1055 +! 274 ! /* no need for cleenup, cannot overflow */ 1.1056 +! 275 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16); 1.1057 +! 276 ! } 1.1058 +! 277 ! } 1.1059 +! 279 ! conv_d16_to_i32(result,dt+2*nlen,(long long *)dt,nlen+1); 1.1060 +! 281 ! 
adjust_montf_result(result,nint,nlen); 1.1061 + 1.1062 +/* 0x002c 281 ( 4 5) */ or %g0,1,%o4 1.1063 +/* 0x0030 187 ( 6 9) */ ldd [%fp+96],%f0 1.1064 +/* 0x0034 196 ( 7 10) */ ld [%fp+92],%o0 1.1065 +/* 0x0038 187 ( 8 9) */ fmovd %f0,%f16 1.1066 +/* 0x003c 196 ( 9 10) */ sll %o0,4,%g2 1.1067 +/* 0x0040 ( 9 10) */ or %g0,%o0,%g1 1.1068 +/* 0x0044 198 (10 11) */ cmp %o0,16 1.1069 +/* 0x0048 (10 11) */ be,pn %icc,.L77000289 ! tprob=0.50 1.1070 +/* 0x004c (10 11) */ std %f2,[%o1+%g2] 1.1071 +/* 0x0050 200 (11 12) */ sll %o0,2,%g2 1.1072 +/* 0x0054 (11 14) */ ldd [%g4],%f2 1.1073 +/* 0x0058 (12 13) */ add %g2,2,%o1 1.1074 +/* 0x005c (12 13) */ add %g2,1,%o3 1.1075 +/* 0x0060 196 (13 14) */ sll %o0,1,%o7 1.1076 +/* 0x0064 200 (13 14) */ cmp %o1,0 1.1077 +/* 0x0068 (13 14) */ ble,a,pt %icc,.L900000755 ! tprob=0.55 1.1078 +/* 0x006c (14 17) */ ldd [%i1],%f0 1.1079 +/* 0x0070 (14 15) */ cmp %o1,3 1.1080 +/* 0x0074 281 (14 15) */ or %g0,1,%o1 1.1081 +/* 0x0078 (14 15) */ bl,pn %icc,.L77000279 ! tprob=0.40 1.1082 +/* 0x007c (15 16) */ add %o2,8,%o0 1.1083 +/* 0x0080 (15 16) */ std %f2,[%g5] 1.1084 +/* 0x0084 0 (16 17) */ or %g0,%o0,%o2 1.1085 + .L900000726: /* frequency 64.0 confidence 0.0 */ 1.1086 +/* 0x0088 ( 3 5) */ ldd [%g4],%f0 1.1087 +/* 0x008c ( 3 4) */ add %o4,1,%o4 1.1088 +/* 0x0090 ( 3 4) */ add %o2,8,%o2 1.1089 +/* 0x0094 ( 4 4) */ cmp %o4,%o3 1.1090 +/* 0x0098 ( 5 6) */ ble,pt %icc,.L900000726 ! tprob=0.50 1.1091 +/* 0x009c ( 5 6) */ std %f0,[%o2-8] 1.1092 + .L900000729: /* frequency 8.0 confidence 0.0 */ 1.1093 +/* 0x00a0 ( 0 1) */ ba .L900000755 ! 
tprob=1.00 1.1094 +/* 0x00a4 ( 0 3) */ ldd [%i1],%f0 1.1095 + .L77000279: /* frequency 0.6 confidence 0.0 */ 1.1096 +/* 0x00a8 ( 0 1) */ std %f2,[%o2] 1.1097 + .L900000754: /* frequency 5.3 confidence 0.0 */ 1.1098 +/* 0x00ac ( 0 3) */ ldd [%g4],%f2 1.1099 +/* 0x00b0 ( 0 1) */ cmp %o1,%o3 1.1100 +/* 0x00b4 ( 0 1) */ add %o2,8,%o2 1.1101 +/* 0x00b8 ( 1 2) */ add %o1,1,%o1 1.1102 +/* 0x00bc ( 1 2) */ ble,a,pt %icc,.L900000754 ! tprob=0.87 1.1103 +/* 0x00c0 ( 3 4) */ std %f2,[%o2] 1.1104 + .L77000284: /* frequency 0.8 confidence 0.0 */ 1.1105 +/* 0x00c4 202 ( 0 3) */ ldd [%i1],%f0 1.1106 + .L900000755: /* frequency 0.8 confidence 0.0 */ 1.1107 +/* 0x00c8 202 ( 0 3) */ ldd [%i0],%f2 1.1108 +/* 0x00cc ( 0 1) */ add %o7,1,%o2 1.1109 +/* 0x00d0 206 ( 0 1) */ cmp %o7,0 1.1110 +/* 0x00d4 ( 1 2) */ sll %o2,1,%o0 1.1111 +/* 0x00d8 ( 1 2) */ sub %o7,1,%o1 1.1112 +/* 0x00dc 202 ( 2 5) */ fmuld %f0,%f2,%f0 1.1113 +/* 0x00e0 ( 2 3) */ std %f0,[%g5] 1.1114 +/* 0x00e4 ( 2 3) */ sub %g1,1,%o7 1.1115 +/* 0x00e8 ( 3 6) */ ldd [%g4],%f6 1.1116 +/* 0x00ec 0 ( 3 4) */ or %g0,%o7,%g3 1.1117 +/* 0x00f0 ( 3 4) */ or %g0,0,%l0 1.1118 +/* 0x00f4 ( 4 7) */ ldd [%g4-8],%f2 1.1119 +/* 0x00f8 ( 4 5) */ or %g0,0,%i5 1.1120 +/* 0x00fc ( 4 5) */ or %g0,%o1,%o5 1.1121 +/* 0x0100 ( 5 8) */ fdtox %f0,%f0 1.1122 +/* 0x0104 ( 5 8) */ ldd [%g4-16],%f4 1.1123 +/* 0x0108 ( 5 6) */ or %g0,%o0,%o3 1.1124 +/* 0x010c 210 ( 6 7) */ add %i0,8,%o4 1.1125 +/* 0x0110 ( 6 7) */ or %g0,0,%i4 1.1126 +/* 0x0114 ( 9 10) */ fmovs %f6,%f0 1.1127 +/* 0x0118 (11 14) */ fxtod %f0,%f0 1.1128 +/* 0x011c 203 (14 17) */ fmuld %f0,%f16,%f0 1.1129 +/* 0x0120 (17 20) */ fmuld %f0,%f2,%f2 1.1130 +/* 0x0124 (20 23) */ fdtox %f2,%f2 1.1131 +/* 0x0128 (23 26) */ fxtod %f2,%f2 1.1132 +/* 0x012c (26 29) */ fmuld %f2,%f4,%f2 1.1133 +/* 0x0130 (29 32) */ fsubd %f0,%f2,%f22 1.1134 +/* 0x0134 206 (29 30) */ ble,pt %icc,.L900000748 ! 
tprob=0.60 1.1135 +/* 0x0138 (29 30) */ sll %g1,4,%g2 1.1136 +/* 0x013c 210 (30 33) */ ldd [%i2],%f0 1.1137 + .L900000749: /* frequency 5.3 confidence 0.0 */ 1.1138 +/* 0x0140 210 ( 0 3) */ fmuld %f0,%f22,%f8 1.1139 +/* 0x0144 ( 0 3) */ ldd [%i1],%f0 1.1140 +/* 0x0148 214 ( 0 1) */ cmp %g1,1 1.1141 +/* 0x014c 210 ( 1 4) */ ldd [%o4+%i4],%f6 1.1142 +/* 0x0150 ( 1 2) */ add %i1,8,%o0 1.1143 +/* 0x0154 214 ( 1 2) */ or %g0,1,%o1 1.1144 +/* 0x0158 210 ( 2 5) */ ldd [%i3],%f2 1.1145 +/* 0x015c ( 2 3) */ add %i3,16,%l1 1.1146 +/* 0x0160 ( 3 6) */ fmuld %f0,%f6,%f6 1.1147 +/* 0x0164 ( 3 6) */ ldd [%g4-8],%f4 1.1148 +/* 0x0168 ( 4 7) */ faddd %f2,%f8,%f2 1.1149 +/* 0x016c ( 4 7) */ ldd [%i3+8],%f0 1.1150 +/* 0x0170 208 ( 5 8) */ ldd [%i0+%i4],%f20 1.1151 +/* 0x0174 210 ( 6 9) */ faddd %f0,%f6,%f0 1.1152 +/* 0x0178 ( 7 10) */ fmuld %f2,%f4,%f2 1.1153 +/* 0x017c (10 13) */ faddd %f0,%f2,%f18 1.1154 +/* 0x0180 211 (10 11) */ std %f18,[%i3+8] 1.1155 +/* 0x0184 214 (10 11) */ ble,pt %icc,.L900000753 ! tprob=0.54 1.1156 +/* 0x0188 (11 12) */ srl %i5,31,%g2 1.1157 +/* 0x018c (11 12) */ cmp %g3,7 1.1158 +/* 0x0190 210 (12 13) */ add %i2,8,%g2 1.1159 +/* 0x0194 214 (12 13) */ bl,pn %icc,.L77000281 ! 
tprob=0.36 1.1160 +/* 0x0198 (13 14) */ add %g2,24,%o2 1.1161 +/* 0x019c 216 (13 16) */ ldd [%o0+16],%f14 1.1162 +/* 0x01a0 (13 14) */ add %i3,48,%l1 1.1163 +/* 0x01a4 (14 17) */ ldd [%o0+24],%f12 1.1164 +/* 0x01a8 0 (14 15) */ or %g0,%o2,%g2 1.1165 +/* 0x01ac 214 (14 15) */ sub %g1,3,%o2 1.1166 +/* 0x01b0 216 (15 18) */ ldd [%o0],%f2 1.1167 +/* 0x01b4 (15 16) */ or %g0,5,%o1 1.1168 +/* 0x01b8 (16 19) */ ldd [%g2-24],%f0 1.1169 +/* 0x01bc (17 20) */ ldd [%o0+8],%f6 1.1170 +/* 0x01c0 (17 20) */ fmuld %f2,%f20,%f2 1.1171 +/* 0x01c4 (17 18) */ add %o0,32,%o0 1.1172 +/* 0x01c8 (18 21) */ ldd [%g2-16],%f8 1.1173 +/* 0x01cc (18 21) */ fmuld %f0,%f22,%f4 1.1174 +/* 0x01d0 (19 22) */ ldd [%i3+16],%f0 1.1175 +/* 0x01d4 (19 22) */ fmuld %f6,%f20,%f10 1.1176 +/* 0x01d8 (20 23) */ ldd [%g2-8],%f6 1.1177 +/* 0x01dc (21 24) */ faddd %f2,%f4,%f4 1.1178 +/* 0x01e0 (21 24) */ ldd [%i3+32],%f2 1.1179 + .L900000738: /* frequency 512.0 confidence 0.0 */ 1.1180 +/* 0x01e4 216 (16 24) */ ldd [%g2],%f24 1.1181 +/* 0x01e8 (16 17) */ add %o1,3,%o1 1.1182 +/* 0x01ec (16 17) */ add %g2,24,%g2 1.1183 +/* 0x01f0 (16 19) */ fmuld %f8,%f22,%f8 1.1184 +/* 0x01f4 (17 25) */ ldd [%l1],%f28 1.1185 +/* 0x01f8 (17 17) */ cmp %o1,%o2 1.1186 +/* 0x01fc (17 18) */ add %o0,24,%o0 1.1187 +/* 0x0200 (18 26) */ ldd [%o0-24],%f26 1.1188 +/* 0x0204 (18 21) */ faddd %f0,%f4,%f0 1.1189 +/* 0x0208 (18 19) */ add %l1,48,%l1 1.1190 +/* 0x020c (19 22) */ faddd %f10,%f8,%f10 1.1191 +/* 0x0210 (19 22) */ fmuld %f14,%f20,%f4 1.1192 +/* 0x0214 (19 20) */ std %f0,[%l1-80] 1.1193 +/* 0x0218 (20 28) */ ldd [%g2-16],%f8 1.1194 +/* 0x021c (20 23) */ fmuld %f6,%f22,%f6 1.1195 +/* 0x0220 (21 29) */ ldd [%l1-32],%f0 1.1196 +/* 0x0224 (22 30) */ ldd [%o0-16],%f14 1.1197 +/* 0x0228 (22 25) */ faddd %f2,%f10,%f2 1.1198 +/* 0x022c (23 26) */ faddd %f4,%f6,%f10 1.1199 +/* 0x0230 (23 26) */ fmuld %f12,%f20,%f4 1.1200 +/* 0x0234 (23 24) */ std %f2,[%l1-64] 1.1201 +/* 0x0238 (24 32) */ ldd [%g2-8],%f6 1.1202 +/* 0x023c (24 27) */ fmuld 
%f24,%f22,%f24 1.1203 +/* 0x0240 (25 33) */ ldd [%l1-16],%f2 1.1204 +/* 0x0244 (26 34) */ ldd [%o0-8],%f12 1.1205 +/* 0x0248 (26 29) */ faddd %f28,%f10,%f10 1.1206 +/* 0x024c (27 28) */ std %f10,[%l1-48] 1.1207 +/* 0x0250 (27 30) */ fmuld %f26,%f20,%f10 1.1208 +/* 0x0254 (27 28) */ ble,pt %icc,.L900000738 ! tprob=0.50 1.1209 +/* 0x0258 (27 30) */ faddd %f4,%f24,%f4 1.1210 + .L900000741: /* frequency 64.0 confidence 0.0 */ 1.1211 +/* 0x025c 216 ( 0 3) */ fmuld %f8,%f22,%f28 1.1212 +/* 0x0260 ( 0 3) */ ldd [%g2],%f24 1.1213 +/* 0x0264 ( 0 3) */ faddd %f0,%f4,%f26 1.1214 +/* 0x0268 ( 1 4) */ fmuld %f12,%f20,%f8 1.1215 +/* 0x026c ( 1 2) */ add %l1,32,%l1 1.1216 +/* 0x0270 ( 1 2) */ cmp %o1,%g3 1.1217 +/* 0x0274 ( 2 5) */ fmuld %f14,%f20,%f14 1.1218 +/* 0x0278 ( 2 5) */ ldd [%l1-32],%f4 1.1219 +/* 0x027c ( 2 3) */ add %g2,8,%g2 1.1220 +/* 0x0280 ( 3 6) */ faddd %f10,%f28,%f12 1.1221 +/* 0x0284 ( 3 6) */ fmuld %f6,%f22,%f6 1.1222 +/* 0x0288 ( 3 6) */ ldd [%l1-16],%f0 1.1223 +/* 0x028c ( 4 7) */ fmuld %f24,%f22,%f10 1.1224 +/* 0x0290 ( 4 5) */ std %f26,[%l1-64] 1.1225 +/* 0x0294 ( 6 9) */ faddd %f2,%f12,%f2 1.1226 +/* 0x0298 ( 6 7) */ std %f2,[%l1-48] 1.1227 +/* 0x029c ( 7 10) */ faddd %f14,%f6,%f6 1.1228 +/* 0x02a0 ( 8 11) */ faddd %f8,%f10,%f2 1.1229 +/* 0x02a4 (10 13) */ faddd %f4,%f6,%f4 1.1230 +/* 0x02a8 (10 11) */ std %f4,[%l1-32] 1.1231 +/* 0x02ac (11 14) */ faddd %f0,%f2,%f0 1.1232 +/* 0x02b0 (11 12) */ bg,pn %icc,.L77000213 ! 
tprob=0.13 1.1233 +/* 0x02b4 (11 12) */ std %f0,[%l1-16] 1.1234 + .L77000281: /* frequency 4.0 confidence 0.0 */ 1.1235 +/* 0x02b8 216 ( 0 3) */ ldd [%o0],%f0 1.1236 + .L900000752: /* frequency 36.6 confidence 0.0 */ 1.1237 +/* 0x02bc 216 ( 0 3) */ ldd [%g2],%f4 1.1238 +/* 0x02c0 ( 0 3) */ fmuld %f0,%f20,%f2 1.1239 +/* 0x02c4 ( 0 1) */ add %o1,1,%o1 1.1240 +/* 0x02c8 ( 1 4) */ ldd [%l1],%f0 1.1241 +/* 0x02cc ( 1 2) */ add %o0,8,%o0 1.1242 +/* 0x02d0 ( 1 2) */ add %g2,8,%g2 1.1243 +/* 0x02d4 ( 2 5) */ fmuld %f4,%f22,%f4 1.1244 +/* 0x02d8 ( 2 3) */ cmp %o1,%g3 1.1245 +/* 0x02dc ( 5 8) */ faddd %f2,%f4,%f2 1.1246 +/* 0x02e0 ( 8 11) */ faddd %f0,%f2,%f0 1.1247 +/* 0x02e4 ( 8 9) */ std %f0,[%l1] 1.1248 +/* 0x02e8 ( 8 9) */ add %l1,16,%l1 1.1249 +/* 0x02ec ( 8 9) */ ble,a,pt %icc,.L900000752 ! tprob=0.87 1.1250 +/* 0x02f0 (10 13) */ ldd [%o0],%f0 1.1251 + .L77000213: /* frequency 5.3 confidence 0.0 */ 1.1252 +/* 0x02f4 ( 0 1) */ srl %i5,31,%g2 1.1253 + .L900000753: /* frequency 5.3 confidence 0.0 */ 1.1254 +/* 0x02f8 218 ( 0 1) */ cmp %l0,30 1.1255 +/* 0x02fc ( 0 1) */ bne,a,pt %icc,.L900000751 ! tprob=0.54 1.1256 +/* 0x0300 ( 0 3) */ fdtox %f18,%f0 1.1257 +/* 0x0304 ( 1 2) */ add %i5,%g2,%g2 1.1258 +/* 0x0308 ( 1 2) */ sub %o3,1,%o2 1.1259 +/* 0x030c ( 2 3) */ sra %g2,1,%o0 1.1260 +/* 0x0310 216 ( 2 5) */ ldd [%g4],%f0 1.1261 +/* 0x0314 ( 3 4) */ add %o0,1,%g2 1.1262 +/* 0x0318 ( 4 5) */ sll %g2,1,%o0 1.1263 +/* 0x031c ( 4 5) */ fmovd %f0,%f2 1.1264 +/* 0x0320 ( 5 6) */ sll %g2,4,%o1 1.1265 +/* 0x0324 ( 5 6) */ cmp %o0,%o3 1.1266 +/* 0x0328 ( 5 6) */ bge,pt %icc,.L77000215 ! 
tprob=0.53 1.1267 +/* 0x032c ( 6 7) */ or %g0,0,%l0 1.1268 +/* 0x0330 218 ( 6 7) */ add %g5,%o1,%o1 1.1269 +/* 0x0334 216 ( 7 10) */ ldd [%o1],%f8 1.1270 + .L900000750: /* frequency 32.0 confidence 0.0 */ 1.1271 +/* 0x0338 ( 0 3) */ fdtox %f8,%f6 1.1272 +/* 0x033c ( 0 3) */ ldd [%g4],%f10 1.1273 +/* 0x0340 ( 0 1) */ add %o0,2,%o0 1.1274 +/* 0x0344 ( 1 4) */ ldd [%o1+8],%f4 1.1275 +/* 0x0348 ( 1 4) */ fdtox %f8,%f8 1.1276 +/* 0x034c ( 1 2) */ cmp %o0,%o2 1.1277 +/* 0x0350 ( 5 6) */ fmovs %f10,%f6 1.1278 +/* 0x0354 ( 7 10) */ fxtod %f6,%f10 1.1279 +/* 0x0358 ( 8 11) */ fdtox %f4,%f6 1.1280 +/* 0x035c ( 9 12) */ fdtox %f4,%f4 1.1281 +/* 0x0360 (10 13) */ faddd %f10,%f2,%f2 1.1282 +/* 0x0364 (10 11) */ std %f2,[%o1] 1.1283 +/* 0x0368 (12 15) */ ldd [%g4],%f2 1.1284 +/* 0x036c (14 15) */ fmovs %f2,%f6 1.1285 +/* 0x0370 (16 19) */ fxtod %f6,%f6 1.1286 +/* 0x0374 (17 20) */ fitod %f8,%f2 1.1287 +/* 0x0378 (19 22) */ faddd %f6,%f0,%f0 1.1288 +/* 0x037c (19 20) */ std %f0,[%o1+8] 1.1289 +/* 0x0380 (19 20) */ add %o1,16,%o1 1.1290 +/* 0x0384 (20 23) */ fitod %f4,%f0 1.1291 +/* 0x0388 (20 21) */ ble,a,pt %icc,.L900000750 ! 
tprob=0.87 1.1292 +/* 0x038c (20 23) */ ldd [%o1],%f8 1.1293 + .L77000233: /* frequency 4.6 confidence 0.0 */ 1.1294 +/* 0x0390 ( 0 0) */ or %g0,0,%l0 1.1295 + .L77000215: /* frequency 5.3 confidence 0.0 */ 1.1296 +/* 0x0394 ( 0 3) */ fdtox %f18,%f0 1.1297 + .L900000751: /* frequency 5.3 confidence 0.0 */ 1.1298 +/* 0x0398 ( 0 3) */ ldd [%g4],%f6 1.1299 +/* 0x039c 220 ( 0 1) */ add %i5,1,%i5 1.1300 +/* 0x03a0 ( 0 1) */ add %i4,8,%i4 1.1301 +/* 0x03a4 ( 1 4) */ ldd [%g4-8],%f2 1.1302 +/* 0x03a8 ( 1 2) */ add %l0,1,%l0 1.1303 +/* 0x03ac ( 1 2) */ add %i3,8,%i3 1.1304 +/* 0x03b0 ( 2 3) */ fmovs %f6,%f0 1.1305 +/* 0x03b4 ( 2 5) */ ldd [%g4-16],%f4 1.1306 +/* 0x03b8 ( 2 3) */ cmp %i5,%o5 1.1307 +/* 0x03bc ( 4 7) */ fxtod %f0,%f0 1.1308 +/* 0x03c0 ( 7 10) */ fmuld %f0,%f16,%f0 1.1309 +/* 0x03c4 (10 13) */ fmuld %f0,%f2,%f2 1.1310 +/* 0x03c8 (13 16) */ fdtox %f2,%f2 1.1311 +/* 0x03cc (16 19) */ fxtod %f2,%f2 1.1312 +/* 0x03d0 (19 22) */ fmuld %f2,%f4,%f2 1.1313 +/* 0x03d4 (22 25) */ fsubd %f0,%f2,%f22 1.1314 +/* 0x03d8 (22 23) */ ble,a,pt %icc,.L900000749 ! tprob=0.89 1.1315 +/* 0x03dc (22 25) */ ldd [%i2],%f0 1.1316 + .L900000725: /* frequency 0.7 confidence 0.0 */ 1.1317 +/* 0x03e0 220 ( 0 1) */ ba .L900000748 ! 
tprob=1.00 1.1318 +/* 0x03e4 ( 0 1) */ sll %g1,4,%g2 1.1319 + 1.1320 + 1.1321 + .L77000289: /* frequency 0.8 confidence 0.0 */ 1.1322 +/* 0x03e8 225 ( 0 3) */ ldd [%o1],%f6 1.1323 +/* 0x03ec 242 ( 0 1) */ add %g4,-8,%g2 1.1324 +/* 0x03f0 ( 0 1) */ add %g4,-16,%g3 1.1325 +/* 0x03f4 225 ( 1 4) */ ldd [%i1],%f2 1.1326 +/* 0x03f8 245 ( 1 2) */ or %g0,0,%o3 1.1327 +/* 0x03fc ( 1 2) */ or %g0,0,%o0 1.1328 +/* 0x0400 225 ( 3 6) */ fmuld %f2,%f6,%f2 1.1329 +/* 0x0404 ( 3 4) */ std %f2,[%o2] 1.1330 +/* 0x0408 ( 4 7) */ ldd [%g4],%f6 1.1331 +/* 0x040c 237 ( 7 8) */ std %f6,[%o2+8] 1.1332 +/* 0x0410 ( 8 9) */ std %f6,[%o2+16] 1.1333 +/* 0x0414 ( 9 10) */ std %f6,[%o2+24] 1.1334 +/* 0x0418 (10 11) */ std %f6,[%o2+32] 1.1335 +/* 0x041c (11 12) */ std %f6,[%o2+40] 1.1336 +/* 0x0420 (12 13) */ std %f6,[%o2+48] 1.1337 +/* 0x0424 (13 14) */ std %f6,[%o2+56] 1.1338 +/* 0x0428 (14 15) */ std %f6,[%o2+64] 1.1339 +/* 0x042c (15 16) */ std %f6,[%o2+72] 1.1340 +! prefetch [%i4],0 1.1341 +! prefetch [%i4+32],0 1.1342 +! prefetch [%i4+64],0 1.1343 +! prefetch [%i4+96],0 1.1344 +! prefetch [%i4+120],0 1.1345 +! prefetch [%i1],0 1.1346 +! prefetch [%i1+32],0 1.1347 +! prefetch [%i1+64],0 1.1348 +! prefetch [%i1+96],0 1.1349 +! 
prefetch [%i1+120],0 1.1350 +/* 0x0430 (16 17) */ std %f6,[%o2+80] 1.1351 +/* 0x0434 (17 18) */ std %f6,[%o2+88] 1.1352 +/* 0x0438 (18 19) */ std %f6,[%o2+96] 1.1353 +/* 0x043c (19 20) */ std %f6,[%o2+104] 1.1354 +/* 0x0440 (20 21) */ std %f6,[%o2+112] 1.1355 +/* 0x0444 (21 22) */ std %f6,[%o2+120] 1.1356 +/* 0x0448 (22 23) */ std %f6,[%o2+128] 1.1357 +/* 0x044c (23 24) */ std %f6,[%o2+136] 1.1358 +/* 0x0450 (24 25) */ std %f6,[%o2+144] 1.1359 +/* 0x0454 (25 26) */ std %f6,[%o2+152] 1.1360 +/* 0x0458 (26 27) */ std %f6,[%o2+160] 1.1361 +/* 0x045c (27 28) */ std %f6,[%o2+168] 1.1362 +/* 0x0460 (27 30) */ fdtox %f2,%f2 1.1363 +/* 0x0464 (28 29) */ std %f6,[%o2+176] 1.1364 +/* 0x0468 (29 30) */ std %f6,[%o2+184] 1.1365 +/* 0x046c (30 31) */ std %f6,[%o2+192] 1.1366 +/* 0x0470 (31 32) */ std %f6,[%o2+200] 1.1367 +/* 0x0474 (32 33) */ std %f6,[%o2+208] 1.1368 +/* 0x0478 (33 34) */ std %f6,[%o2+216] 1.1369 +/* 0x047c (34 35) */ std %f6,[%o2+224] 1.1370 +/* 0x0480 (35 36) */ std %f6,[%o2+232] 1.1371 +/* 0x0484 (36 37) */ std %f6,[%o2+240] 1.1372 +/* 0x0488 (37 38) */ std %f6,[%o2+248] 1.1373 +/* 0x048c (38 39) */ std %f6,[%o2+256] 1.1374 +/* 0x0490 (39 40) */ std %f6,[%o2+264] 1.1375 +/* 0x0494 (40 41) */ std %f6,[%o2+272] 1.1376 +/* 0x0498 (41 42) */ std %f6,[%o2+280] 1.1377 +/* 0x049c (42 43) */ std %f6,[%o2+288] 1.1378 +/* 0x04a0 (43 44) */ std %f6,[%o2+296] 1.1379 +/* 0x04a4 (44 45) */ std %f6,[%o2+304] 1.1380 +/* 0x04a8 (45 46) */ std %f6,[%o2+312] 1.1381 +/* 0x04ac (46 47) */ std %f6,[%o2+320] 1.1382 +/* 0x04b0 (47 48) */ std %f6,[%o2+328] 1.1383 +/* 0x04b4 (48 49) */ std %f6,[%o2+336] 1.1384 +/* 0x04b8 (49 50) */ std %f6,[%o2+344] 1.1385 +/* 0x04bc (50 51) */ std %f6,[%o2+352] 1.1386 +/* 0x04c0 (51 52) */ std %f6,[%o2+360] 1.1387 +/* 0x04c4 (52 53) */ std %f6,[%o2+368] 1.1388 +/* 0x04c8 (53 54) */ std %f6,[%o2+376] 1.1389 +/* 0x04cc (54 55) */ std %f6,[%o2+384] 1.1390 +/* 0x04d0 (55 56) */ std %f6,[%o2+392] 1.1391 +/* 0x04d4 (56 57) */ std %f6,[%o2+400] 1.1392 +/* 
0x04d8 (57 58) */ std %f6,[%o2+408] 1.1393 +/* 0x04dc (58 59) */ std %f6,[%o2+416] 1.1394 +/* 0x04e0 (59 60) */ std %f6,[%o2+424] 1.1395 +/* 0x04e4 (60 61) */ std %f6,[%o2+432] 1.1396 +/* 0x04e8 (61 62) */ std %f6,[%o2+440] 1.1397 +/* 0x04ec (62 63) */ std %f6,[%o2+448] 1.1398 +/* 0x04f0 (63 64) */ std %f6,[%o2+456] 1.1399 +/* 0x04f4 (64 65) */ std %f6,[%o2+464] 1.1400 +/* 0x04f8 (65 66) */ std %f6,[%o2+472] 1.1401 +/* 0x04fc (66 67) */ std %f6,[%o2+480] 1.1402 +/* 0x0500 (67 68) */ std %f6,[%o2+488] 1.1403 +/* 0x0504 (68 69) */ std %f6,[%o2+496] 1.1404 +/* 0x0508 (69 70) */ std %f6,[%o2+504] 1.1405 +/* 0x050c (70 71) */ std %f6,[%o2+512] 1.1406 +/* 0x0510 (71 72) */ std %f6,[%o2+520] 1.1407 +/* 0x0514 242 (72 75) */ ld [%g4],%f2 ! dalign 1.1408 +/* 0x0518 (73 76) */ ld [%g2],%f6 ! dalign 1.1409 +/* 0x051c (74 77) */ fxtod %f2,%f10 1.1410 +/* 0x0520 (74 77) */ ld [%g2+4],%f7 1.1411 +/* 0x0524 (75 78) */ ld [%g3],%f8 ! dalign 1.1412 +/* 0x0528 (76 79) */ ld [%g3+4],%f9 1.1413 +/* 0x052c (77 80) */ fmuld %f10,%f0,%f0 1.1414 +/* 0x0530 239 (77 80) */ ldd [%i4],%f4 1.1415 +/* 0x0534 240 (78 81) */ ldd [%i1],%f2 1.1416 +/* 0x0538 (80 83) */ fmuld %f0,%f6,%f6 1.1417 +/* 0x053c (83 86) */ fdtox %f6,%f6 1.1418 +/* 0x0540 (86 89) */ fxtod %f6,%f6 1.1419 +/* 0x0544 (89 92) */ fmuld %f6,%f8,%f6 1.1420 +/* 0x0548 (92 95) */ fsubd %f0,%f6,%f0 1.1421 +/* 0x054c 250 (95 98) */ fmuld %f4,%f0,%f10 1.1422 + .L900000747: /* frequency 6.4 confidence 0.0 */ 1.1423 + 1.1424 + 1.1425 + fmovd %f0,%f0 1.1426 + fmovd %f16,%f18 1.1427 + ldd [%i4],%f2 1.1428 + ldd [%o2],%f8 1.1429 + ldd [%i1],%f10 1.1430 + ldd [%g4-8],%f14 1.1431 + ldd [%g4-16],%f16 1.1432 + ldd [%o1],%f24 1.1433 + 1.1434 + ldd [%i1+8],%f26 1.1435 + ldd [%i1+16],%f40 1.1436 + ldd [%i1+48],%f46 1.1437 + ldd [%i1+56],%f30 1.1438 + ldd [%i1+64],%f54 1.1439 + ldd [%i1+104],%f34 1.1440 + ldd [%i1+112],%f58 1.1441 + 1.1442 + ldd [%i4+112],%f60 1.1443 + ldd [%i4+8],%f28 1.1444 + ldd [%i4+104],%f38 1.1445 + 1.1446 + nop 1.1447 + nop 
1.1448 +! 1.1449 + .L99999999: 1.1450 +!1 1.1451 +!!! 1.1452 + ldd [%i1+24],%f32 1.1453 + fmuld %f0,%f2,%f4 1.1454 +!2 1.1455 +!!! 1.1456 + ldd [%i4+24],%f36 1.1457 + fmuld %f26,%f24,%f20 1.1458 +!3 1.1459 +!!! 1.1460 + ldd [%i1+40],%f42 1.1461 + fmuld %f28,%f0,%f22 1.1462 +!4 1.1463 +!!! 1.1464 + ldd [%i4+40],%f44 1.1465 + fmuld %f32,%f24,%f32 1.1466 +!5 1.1467 +!!! 1.1468 + ldd [%o1+8],%f6 1.1469 + faddd %f4,%f8,%f4 1.1470 + fmuld %f36,%f0,%f36 1.1471 +!6 1.1472 +!!! 1.1473 + add %o1,8,%o1 1.1474 + ldd [%i4+56],%f50 1.1475 + fmuld %f42,%f24,%f42 1.1476 +!7 1.1477 +!!! 1.1478 + ldd [%i1+72],%f52 1.1479 + faddd %f20,%f22,%f20 1.1480 + fmuld %f44,%f0,%f44 1.1481 +!8 1.1482 +!!! 1.1483 + ldd [%o2+16],%f22 1.1484 + fmuld %f10,%f6,%f12 1.1485 +!9 1.1486 +!!! 1.1487 + ldd [%i4+72],%f56 1.1488 + faddd %f32,%f36,%f32 1.1489 + fmuld %f14,%f4,%f4 1.1490 +!10 1.1491 +!!! 1.1492 + ldd [%o2+48],%f36 1.1493 + fmuld %f30,%f24,%f48 1.1494 +!11 1.1495 +!!! 1.1496 + ldd [%o2+8],%f8 1.1497 + faddd %f20,%f22,%f20 1.1498 + fmuld %f50,%f0,%f50 1.1499 +!12 1.1500 +!!! 1.1501 + std %f20,[%o2+16] 1.1502 + faddd %f42,%f44,%f42 1.1503 + fmuld %f52,%f24,%f52 1.1504 +!13 1.1505 +!!! 1.1506 + ldd [%o2+80],%f44 1.1507 + faddd %f4,%f12,%f4 1.1508 + fmuld %f56,%f0,%f56 1.1509 +!14 1.1510 +!!! 1.1511 + ldd [%i1+88],%f20 1.1512 + faddd %f32,%f36,%f32 1.1513 +!15 1.1514 +!!! 1.1515 + ldd [%i4+88],%f22 1.1516 + faddd %f48,%f50,%f48 1.1517 +!16 1.1518 +!!! 1.1519 + ldd [%o2+112],%f50 1.1520 + faddd %f52,%f56,%f52 1.1521 +!17 1.1522 +!!! 1.1523 + ldd [%o2+144],%f56 1.1524 + faddd %f4,%f8,%f8 1.1525 + fmuld %f20,%f24,%f20 1.1526 +!18 1.1527 +!!! 1.1528 + std %f32,[%o2+48] 1.1529 + faddd %f42,%f44,%f42 1.1530 + fmuld %f22,%f0,%f22 1.1531 +!19 1.1532 +!!! 1.1533 + std %f42,[%o2+80] 1.1534 + faddd %f48,%f50,%f48 1.1535 + fmuld %f34,%f24,%f32 1.1536 +!20 1.1537 +!!! 1.1538 + std %f48,[%o2+112] 1.1539 + faddd %f52,%f56,%f52 1.1540 + fmuld %f38,%f0,%f36 1.1541 +!21 1.1542 +!!! 
1.1543 + ldd [%i1+120],%f42 1.1544 + fdtox %f8,%f4 1.1545 +!22 1.1546 +!!! 1.1547 + std %f52,[%o2+144] 1.1548 + faddd %f20,%f22,%f20 1.1549 +!23 1.1550 +!!! 1.1551 + ldd [%i4+120],%f44 1.1552 +!24 1.1553 +!!! 1.1554 + ldd [%o2+176],%f22 1.1555 + faddd %f32,%f36,%f32 1.1556 + fmuld %f42,%f24,%f42 1.1557 +!25 1.1558 +!!! 1.1559 + ldd [%i4+16],%f50 1.1560 + fmovs %f17,%f4 1.1561 +!26 1.1562 +!!! 1.1563 + ldd [%i1+32],%f52 1.1564 + fmuld %f44,%f0,%f44 1.1565 +!27 1.1566 +!!! 1.1567 + ldd [%i4+32],%f56 1.1568 + fmuld %f40,%f24,%f48 1.1569 +!28 1.1570 +!!! 1.1571 + ldd [%o2+208],%f36 1.1572 + faddd %f20,%f22,%f20 1.1573 + fmuld %f50,%f0,%f50 1.1574 +!29 1.1575 +!!! 1.1576 + std %f20,[%o2+176] 1.1577 + fxtod %f4,%f4 1.1578 + fmuld %f52,%f24,%f52 1.1579 +!30 1.1580 +!!! 1.1581 + ldd [%i4+48],%f22 1.1582 + faddd %f42,%f44,%f42 1.1583 + fmuld %f56,%f0,%f56 1.1584 +!31 1.1585 +!!! 1.1586 + ldd [%o2+240],%f44 1.1587 + faddd %f32,%f36,%f32 1.1588 +!32 1.1589 +!!! 1.1590 + std %f32,[%o2+208] 1.1591 + faddd %f48,%f50,%f48 1.1592 + fmuld %f46,%f24,%f20 1.1593 +!33 1.1594 +!!! 1.1595 + ldd [%o2+32],%f50 1.1596 + fmuld %f4,%f18,%f12 1.1597 +!34 1.1598 +!!! 1.1599 + ldd [%i4+64],%f36 1.1600 + faddd %f52,%f56,%f52 1.1601 + fmuld %f22,%f0,%f22 1.1602 +!35 1.1603 +!!! 1.1604 + ldd [%o2+64],%f56 1.1605 + faddd %f42,%f44,%f42 1.1606 +!36 1.1607 +!!! 1.1608 + std %f42,[%o2+240] 1.1609 + faddd %f48,%f50,%f48 1.1610 + fmuld %f54,%f24,%f32 1.1611 +!37 1.1612 +!!! 1.1613 + std %f48,[%o2+32] 1.1614 + fmuld %f12,%f14,%f4 1.1615 +!38 1.1616 +!!! 1.1617 + ldd [%i1+80],%f42 1.1618 + faddd %f52,%f56,%f56 ! yes, tmp52! 1.1619 + fmuld %f36,%f0,%f36 1.1620 +!39 1.1621 +!!! 1.1622 + ldd [%i4+80],%f44 1.1623 + faddd %f20,%f22,%f20 1.1624 +!40 1.1625 +!!! 1.1626 + ldd [%i1+96],%f48 1.1627 + fmuld %f58,%f24,%f52 1.1628 +!41 1.1629 +!!! 1.1630 + ldd [%i4+96],%f50 1.1631 + fdtox %f4,%f4 1.1632 + fmuld %f42,%f24,%f42 1.1633 +!42 1.1634 +!!! 1.1635 + std %f56,[%o2+64] ! yes, tmp52! 
1.1636 + faddd %f32,%f36,%f32 1.1637 + fmuld %f44,%f0,%f44 1.1638 +!43 1.1639 +!!! 1.1640 + ldd [%o2+96],%f22 1.1641 + fmuld %f48,%f24,%f48 1.1642 +!44 1.1643 +!!! 1.1644 + ldd [%o2+128],%f36 1.1645 + fmovd %f6,%f24 1.1646 + fmuld %f50,%f0,%f50 1.1647 +!45 1.1648 +!!! 1.1649 + fxtod %f4,%f4 1.1650 + fmuld %f60,%f0,%f56 1.1651 +!46 1.1652 +!!! 1.1653 + add %o2,8,%o2 1.1654 + faddd %f42,%f44,%f42 1.1655 +!47 1.1656 +!!! 1.1657 + ldd [%o2+160-8],%f44 1.1658 + faddd %f20,%f22,%f20 1.1659 +!48 1.1660 +!!! 1.1661 + std %f20,[%o2+96-8] 1.1662 + faddd %f48,%f50,%f48 1.1663 +!49 1.1664 +!!! 1.1665 + ldd [%o2+192-8],%f50 1.1666 + faddd %f52,%f56,%f52 1.1667 + fmuld %f4,%f16,%f4 1.1668 +!50 1.1669 +!!! 1.1670 + ldd [%o2+224-8],%f56 1.1671 + faddd %f32,%f36,%f32 1.1672 +!51 1.1673 +!!! 1.1674 + std %f32,[%o2+128-8] 1.1675 + faddd %f42,%f44,%f42 1.1676 +!52 1.1677 + add %o3,1,%o3 1.1678 + std %f42,[%o2+160-8] 1.1679 + faddd %f48,%f50,%f48 1.1680 +!53 1.1681 +!!! 1.1682 + cmp %o3,31 1.1683 + std %f48,[%o2+192-8] 1.1684 + faddd %f52,%f56,%f52 1.1685 +!54 1.1686 + std %f52,[%o2+224-8] 1.1687 + ble,pt %icc,.L99999999 1.1688 + fsubd %f12,%f4,%f0 1.1689 + 1.1690 + 1.1691 + 1.1692 +!55 1.1693 + std %f8,[%o2] 1.1694 + 1.1695 + 1.1696 + 1.1697 + 1.1698 + 1.1699 + 1.1700 + .L77000285: /* frequency 1.0 confidence 0.0 */ 1.1701 +/* 0x07a8 279 ( 0 1) */ sll %g1,4,%g2 1.1702 + .L900000748: /* frequency 1.0 confidence 0.0 */ 1.1703 +/* 0x07ac 279 ( 0 3) */ ldd [%g5+%g2],%f0 1.1704 +/* 0x07b0 ( 0 1) */ add %g5,%g2,%i1 1.1705 +/* 0x07b4 ( 0 1) */ or %g0,0,%o4 1.1706 +/* 0x07b8 206 ( 1 4) */ ld [%fp+68],%o0 1.1707 +/* 0x07bc 279 ( 1 2) */ or %g0,0,%i0 1.1708 +/* 0x07c0 ( 1 2) */ cmp %g1,0 1.1709 +/* 0x07c4 ( 2 5) */ fdtox %f0,%f0 1.1710 +/* 0x07c8 ( 2 3) */ std %f0,[%sp+120] 1.1711 +/* 0x07cc 275 ( 2 3) */ sethi %hi(0xfc00),%o1 1.1712 +/* 0x07d0 206 ( 3 4) */ or %g0,%o0,%o3 1.1713 +/* 0x07d4 275 ( 3 4) */ sub %g1,1,%g4 1.1714 +/* 0x07d8 279 ( 4 7) */ ldd [%i1+8],%f0 1.1715 +/* 0x07dc ( 4 5) */ 
or %g0,%o0,%g5 1.1716 +/* 0x07e0 ( 4 5) */ add %o1,1023,%o1 1.1717 +/* 0x07e4 ( 6 9) */ fdtox %f0,%f0 1.1718 +/* 0x07e8 ( 6 7) */ std %f0,[%sp+112] 1.1719 +/* 0x07ec (10 12) */ ldx [%sp+112],%o5 1.1720 +/* 0x07f0 (11 13) */ ldx [%sp+120],%o7 1.1721 +/* 0x07f4 (11 12) */ ble,pt %icc,.L900000746 ! tprob=0.56 1.1722 +/* 0x07f8 (11 12) */ sethi %hi(0xfc00),%g2 1.1723 +/* 0x07fc 275 (12 13) */ or %g0,-1,%g2 1.1724 +/* 0x0800 279 (12 13) */ cmp %g1,3 1.1725 +/* 0x0804 275 (13 14) */ srl %g2,0,%o2 1.1726 +/* 0x0808 279 (13 14) */ bl,pn %icc,.L77000286 ! tprob=0.44 1.1727 +/* 0x080c (13 14) */ or %g0,%i1,%g2 1.1728 +/* 0x0810 (14 17) */ ldd [%i1+16],%f0 1.1729 +/* 0x0814 (14 15) */ and %o5,%o1,%o0 1.1730 +/* 0x0818 (14 15) */ add %i1,16,%g2 1.1731 +/* 0x081c (15 16) */ sllx %o0,16,%g3 1.1732 +/* 0x0820 (15 16) */ and %o7,%o2,%o0 1.1733 +/* 0x0824 (16 19) */ fdtox %f0,%f0 1.1734 +/* 0x0828 (16 17) */ std %f0,[%sp+104] 1.1735 +/* 0x082c (16 17) */ add %o0,%g3,%o4 1.1736 +/* 0x0830 (17 20) */ ldd [%i1+24],%f2 1.1737 +/* 0x0834 (17 18) */ srax %o5,16,%o0 1.1738 +/* 0x0838 (17 18) */ add %o3,4,%g5 1.1739 +/* 0x083c (18 19) */ stx %o0,[%sp+128] 1.1740 +/* 0x0840 (18 19) */ and %o4,%o2,%o0 1.1741 +/* 0x0844 (18 19) */ or %g0,1,%i0 1.1742 +/* 0x0848 (19 20) */ stx %o0,[%sp+112] 1.1743 +/* 0x084c (19 20) */ srax %o4,32,%o0 1.1744 +/* 0x0850 (19 22) */ fdtox %f2,%f0 1.1745 +/* 0x0854 (20 21) */ stx %o0,[%sp+136] 1.1746 +/* 0x0858 (20 21) */ srax %o7,32,%o4 1.1747 +/* 0x085c (21 22) */ std %f0,[%sp+96] 1.1748 +/* 0x0860 (22 24) */ ldx [%sp+136],%o7 1.1749 +/* 0x0864 (23 25) */ ldx [%sp+128],%o0 1.1750 +/* 0x0868 (25 27) */ ldx [%sp+104],%g3 1.1751 +/* 0x086c (25 26) */ add %o0,%o7,%o0 1.1752 +/* 0x0870 (26 28) */ ldx [%sp+112],%o7 1.1753 +/* 0x0874 (26 27) */ add %o4,%o0,%o4 1.1754 +/* 0x0878 (27 29) */ ldx [%sp+96],%o5 1.1755 +/* 0x087c (28 29) */ st %o7,[%o3] 1.1756 +/* 0x0880 (28 29) */ or %g0,%g3,%o7 1.1757 + .L900000730: /* frequency 64.0 confidence 0.0 */ 1.1758 +/* 0x0884 (17 
19) */ ldd [%g2+16],%f0 1.1759 +/* 0x0888 (17 18) */ add %i0,1,%i0 1.1760 +/* 0x088c (17 18) */ add %g5,4,%g5 1.1761 +/* 0x0890 (18 18) */ cmp %i0,%g4 1.1762 +/* 0x0894 (18 19) */ add %g2,16,%g2 1.1763 +/* 0x0898 (19 22) */ fdtox %f0,%f0 1.1764 +/* 0x089c (20 21) */ std %f0,[%sp+104] 1.1765 +/* 0x08a0 (21 23) */ ldd [%g2+8],%f0 1.1766 +/* 0x08a4 (23 26) */ fdtox %f0,%f0 1.1767 +/* 0x08a8 (24 25) */ std %f0,[%sp+96] 1.1768 +/* 0x08ac (25 26) */ and %o5,%o1,%g3 1.1769 +/* 0x08b0 (26 27) */ sllx %g3,16,%g3 1.1770 +/* 0x08b4 ( 0 0) */ stx %g3,[%sp+120] 1.1771 +/* 0x08b8 (26 27) */ and %o7,%o2,%g3 1.1772 +/* 0x08bc ( 0 0) */ stx %o7,[%sp+128] 1.1773 +/* 0x08c0 ( 0 0) */ ldx [%sp+120],%o7 1.1774 +/* 0x08c4 (27 27) */ add %g3,%o7,%g3 1.1775 +/* 0x08c8 ( 0 0) */ ldx [%sp+128],%o7 1.1776 +/* 0x08cc (28 29) */ srax %o5,16,%o5 1.1777 +/* 0x08d0 (28 28) */ add %g3,%o4,%g3 1.1778 +/* 0x08d4 (29 30) */ srax %g3,32,%o4 1.1779 +/* 0x08d8 ( 0 0) */ stx %o4,[%sp+112] 1.1780 +/* 0x08dc (30 31) */ srax %o7,32,%o4 1.1781 +/* 0x08e0 ( 0 0) */ ldx [%sp+112],%o7 1.1782 +/* 0x08e4 (30 31) */ add %o5,%o7,%o7 1.1783 +/* 0x08e8 (31 33) */ ldx [%sp+96],%o5 1.1784 +/* 0x08ec (31 32) */ add %o4,%o7,%o4 1.1785 +/* 0x08f0 (32 33) */ and %g3,%o2,%g3 1.1786 +/* 0x08f4 ( 0 0) */ ldx [%sp+104],%o7 1.1787 +/* 0x08f8 (33 34) */ ble,pt %icc,.L900000730 ! tprob=0.50 1.1788 +/* 0x08fc (33 34) */ st %g3,[%g5-4] 1.1789 + .L900000733: /* frequency 8.0 confidence 0.0 */ 1.1790 +/* 0x0900 ( 0 1) */ ba .L900000746 ! 
tprob=1.00 1.1791 +/* 0x0904 ( 0 1) */ sethi %hi(0xfc00),%g2 1.1792 + .L77000286: /* frequency 0.7 confidence 0.0 */ 1.1793 +/* 0x0908 ( 0 3) */ ldd [%g2+16],%f0 1.1794 + .L900000745: /* frequency 6.4 confidence 0.0 */ 1.1795 +/* 0x090c ( 0 1) */ and %o7,%o2,%o0 1.1796 +/* 0x0910 ( 0 1) */ and %o5,%o1,%g3 1.1797 +/* 0x0914 ( 0 3) */ fdtox %f0,%f0 1.1798 +/* 0x0918 ( 1 2) */ add %o4,%o0,%o0 1.1799 +/* 0x091c ( 1 2) */ std %f0,[%sp+104] 1.1800 +/* 0x0920 ( 1 2) */ add %i0,1,%i0 1.1801 +/* 0x0924 ( 2 3) */ sllx %g3,16,%o4 1.1802 +/* 0x0928 ( 2 5) */ ldd [%g2+24],%f2 1.1803 +/* 0x092c ( 2 3) */ add %g2,16,%g2 1.1804 +/* 0x0930 ( 3 4) */ add %o0,%o4,%o4 1.1805 +/* 0x0934 ( 3 4) */ cmp %i0,%g4 1.1806 +/* 0x0938 ( 4 5) */ srax %o5,16,%o0 1.1807 +/* 0x093c ( 4 5) */ stx %o0,[%sp+112] 1.1808 +/* 0x0940 ( 4 5) */ and %o4,%o2,%g3 1.1809 +/* 0x0944 ( 5 6) */ srax %o4,32,%o5 1.1810 +/* 0x0948 ( 5 8) */ fdtox %f2,%f0 1.1811 +/* 0x094c ( 5 6) */ std %f0,[%sp+96] 1.1812 +/* 0x0950 ( 6 7) */ srax %o7,32,%o4 1.1813 +/* 0x0954 ( 6 8) */ ldx [%sp+112],%o7 1.1814 +/* 0x0958 ( 8 9) */ add %o7,%o5,%o7 1.1815 +/* 0x095c ( 9 11) */ ldx [%sp+104],%o5 1.1816 +/* 0x0960 ( 9 10) */ add %o4,%o7,%o4 1.1817 +/* 0x0964 (10 12) */ ldx [%sp+96],%o0 1.1818 +/* 0x0968 (11 12) */ st %g3,[%g5] 1.1819 +/* 0x096c (11 12) */ or %g0,%o5,%o7 1.1820 +/* 0x0970 (11 12) */ add %g5,4,%g5 1.1821 +/* 0x0974 (12 13) */ or %g0,%o0,%o5 1.1822 +/* 0x0978 (12 13) */ ble,a,pt %icc,.L900000745 ! 
tprob=0.86 1.1823 +/* 0x097c (12 15) */ ldd [%g2+16],%f0 1.1824 + .L77000236: /* frequency 1.0 confidence 0.0 */ 1.1825 +/* 0x0980 ( 0 1) */ sethi %hi(0xfc00),%g2 1.1826 + .L900000746: /* frequency 1.0 confidence 0.0 */ 1.1827 +/* 0x0984 ( 0 1) */ or %g0,-1,%o0 1.1828 +/* 0x0988 ( 0 1) */ add %g2,1023,%g2 1.1829 +/* 0x098c ( 0 3) */ ld [%fp+88],%o1 1.1830 +/* 0x0990 ( 1 2) */ srl %o0,0,%g3 1.1831 +/* 0x0994 ( 1 2) */ and %o5,%g2,%g2 1.1832 +/* 0x0998 ( 2 3) */ and %o7,%g3,%g4 1.1833 +/* 0x099c 281 ( 2 3) */ or %g0,-1,%o5 1.1834 +/* 0x09a0 275 ( 3 4) */ sllx %g2,16,%g2 1.1835 +/* 0x09a4 ( 3 4) */ add %o4,%g4,%g4 1.1836 +/* 0x09a8 ( 4 5) */ add %g4,%g2,%g2 1.1837 +/* 0x09ac ( 5 6) */ sll %i0,2,%g4 1.1838 +/* 0x09b0 ( 5 6) */ and %g2,%g3,%g2 1.1839 +/* 0x09b4 ( 6 7) */ st %g2,[%o3+%g4] 1.1840 +/* 0x09b8 281 ( 6 7) */ sll %g1,2,%g2 1.1841 +/* 0x09bc ( 7 10) */ ld [%o3+%g2],%g2 1.1842 +/* 0x09c0 ( 9 10) */ cmp %g2,0 1.1843 +/* 0x09c4 ( 9 10) */ bleu,pn %icc,.L77000241 ! tprob=0.50 1.1844 +/* 0x09c8 ( 9 10) */ or %g0,%o1,%o2 1.1845 +/* 0x09cc (10 11) */ ba .L900000744 ! tprob=1.00 1.1846 +/* 0x09d0 (10 11) */ cmp %o5,0 1.1847 + .L77000241: /* frequency 0.8 confidence 0.0 */ 1.1848 +/* 0x09d4 ( 0 1) */ subcc %g1,1,%o5 1.1849 +/* 0x09d8 ( 0 1) */ bneg,pt %icc,.L900000744 ! tprob=0.60 1.1850 +/* 0x09dc ( 1 2) */ cmp %o5,0 1.1851 +/* 0x09e0 ( 1 2) */ sll %o5,2,%g2 1.1852 +/* 0x09e4 ( 2 3) */ add %o1,%g2,%o0 1.1853 +/* 0x09e8 ( 2 3) */ add %o3,%g2,%o4 1.1854 +/* 0x09ec ( 3 6) */ ld [%o0],%g2 1.1855 + .L900000743: /* frequency 5.3 confidence 0.0 */ 1.1856 +/* 0x09f0 ( 0 3) */ ld [%o4],%g3 1.1857 +/* 0x09f4 ( 0 1) */ add %o0,4,%o0 1.1858 +/* 0x09f8 ( 0 1) */ add %o4,4,%o4 1.1859 +/* 0x09fc ( 2 3) */ cmp %g3,%g2 1.1860 +/* 0x0a00 ( 2 3) */ bne,pn %icc,.L77000244 ! tprob=0.16 1.1861 +/* 0x0a04 ( 2 3) */ nop 1.1862 +/* 0x0a08 ( 3 4) */ addcc %o5,1,%o5 1.1863 +/* 0x0a0c ( 3 4) */ bpos,a,pt %icc,.L900000743 ! 
tprob=0.84 1.1864 +/* 0x0a10 ( 3 6) */ ld [%o0],%g2 1.1865 + .L77000244: /* frequency 1.0 confidence 0.0 */ 1.1866 +/* 0x0a14 ( 0 1) */ cmp %o5,0 1.1867 + .L900000744: /* frequency 1.0 confidence 0.0 */ 1.1868 +/* 0x0a18 ( 0 1) */ bl,pn %icc,.L77000287 ! tprob=0.50 1.1869 +/* 0x0a1c ( 0 1) */ sll %o5,2,%g2 1.1870 +/* 0x0a20 ( 1 4) */ ld [%o2+%g2],%g3 1.1871 +/* 0x0a24 ( 2 5) */ ld [%o3+%g2],%g2 1.1872 +/* 0x0a28 ( 4 5) */ cmp %g2,%g3 1.1873 +/* 0x0a2c ( 4 5) */ bleu,pt %icc,.L77000224 ! tprob=0.56 1.1874 +/* 0x0a30 ( 4 5) */ nop 1.1875 + .L77000287: /* frequency 0.8 confidence 0.0 */ 1.1876 +/* 0x0a34 ( 0 1) */ cmp %g1,0 1.1877 +/* 0x0a38 ( 0 1) */ ble,pt %icc,.L77000224 ! tprob=0.60 1.1878 +/* 0x0a3c ( 0 1) */ nop 1.1879 +/* 0x0a40 281 ( 1 2) */ sub %g1,1,%o7 1.1880 +/* 0x0a44 ( 1 2) */ or %g0,-1,%g2 1.1881 +/* 0x0a48 ( 2 3) */ srl %g2,0,%o4 1.1882 +/* 0x0a4c ( 2 3) */ add %o7,1,%o0 1.1883 +/* 0x0a50 279 ( 3 4) */ or %g0,0,%o5 1.1884 +/* 0x0a54 ( 3 4) */ or %g0,0,%g1 1.1885 +/* 0x0a58 ( 4 5) */ cmp %o0,3 1.1886 +/* 0x0a5c ( 4 5) */ bl,pn %icc,.L77000288 ! 
tprob=0.40 1.1887 +/* 0x0a60 ( 4 5) */ add %o3,8,%o1 1.1888 +/* 0x0a64 ( 5 6) */ add %o2,4,%o0 1.1889 +/* 0x0a68 ( 5 8) */ ld [%o1-8],%g2 1.1890 +/* 0x0a6c 0 ( 5 6) */ or %g0,%o1,%o3 1.1891 +/* 0x0a70 279 ( 6 9) */ ld [%o0-4],%g3 1.1892 +/* 0x0a74 0 ( 6 7) */ or %g0,%o0,%o2 1.1893 +/* 0x0a78 279 ( 6 7) */ or %g0,2,%g1 1.1894 +/* 0x0a7c ( 7 10) */ ld [%o3-4],%o0 1.1895 +/* 0x0a80 ( 8 9) */ sub %g2,%g3,%g2 1.1896 +/* 0x0a84 ( 9 10) */ or %g0,%g2,%o5 1.1897 +/* 0x0a88 ( 9 10) */ and %g2,%o4,%g2 1.1898 +/* 0x0a8c ( 9 10) */ st %g2,[%o3-8] 1.1899 +/* 0x0a90 (10 11) */ srax %o5,32,%o5 1.1900 + .L900000734: /* frequency 64.0 confidence 0.0 */ 1.1901 +/* 0x0a94 (12 20) */ ld [%o2],%g2 1.1902 +/* 0x0a98 (12 13) */ add %g1,1,%g1 1.1903 +/* 0x0a9c (12 13) */ add %o2,4,%o2 1.1904 +/* 0x0aa0 (13 13) */ cmp %g1,%o7 1.1905 +/* 0x0aa4 (13 14) */ add %o3,4,%o3 1.1906 +/* 0x0aa8 (14 14) */ sub %o0,%g2,%o0 1.1907 +/* 0x0aac (15 15) */ add %o0,%o5,%o5 1.1908 +/* 0x0ab0 (16 17) */ and %o5,%o4,%g2 1.1909 +/* 0x0ab4 (16 24) */ ld [%o3-4],%o0 1.1910 +/* 0x0ab8 (17 18) */ st %g2,[%o3-8] 1.1911 +/* 0x0abc (17 18) */ ble,pt %icc,.L900000734 ! tprob=0.50 1.1912 +/* 0x0ac0 (17 18) */ srax %o5,32,%o5 1.1913 + .L900000737: /* frequency 8.0 confidence 0.0 */ 1.1914 +/* 0x0ac4 ( 0 3) */ ld [%o2],%o1 1.1915 +/* 0x0ac8 ( 2 3) */ sub %o0,%o1,%o0 1.1916 +/* 0x0acc ( 3 4) */ add %o0,%o5,%o0 1.1917 +/* 0x0ad0 ( 4 5) */ and %o0,%o4,%o1 1.1918 +/* 0x0ad4 ( 4 5) */ st %o1,[%o3-4] 1.1919 +/* 0x0ad8 ( 5 7) */ ret ! 
Result = 1.1920 +/* 0x0adc ( 7 8) */ restore %g0,%g0,%g0 1.1921 + .L77000288: /* frequency 0.6 confidence 0.0 */ 1.1922 +/* 0x0ae0 ( 0 3) */ ld [%o3],%o0 1.1923 + .L900000742: /* frequency 5.3 confidence 0.0 */ 1.1924 +/* 0x0ae4 ( 0 3) */ ld [%o2],%o1 1.1925 +/* 0x0ae8 ( 0 1) */ add %o5,%o0,%o0 1.1926 +/* 0x0aec ( 0 1) */ add %g1,1,%g1 1.1927 +/* 0x0af0 ( 1 2) */ add %o2,4,%o2 1.1928 +/* 0x0af4 ( 1 2) */ cmp %g1,%o7 1.1929 +/* 0x0af8 ( 2 3) */ sub %o0,%o1,%o0 1.1930 +/* 0x0afc ( 3 4) */ and %o0,%o4,%o1 1.1931 +/* 0x0b00 ( 3 4) */ st %o1,[%o3] 1.1932 +/* 0x0b04 ( 3 4) */ add %o3,4,%o3 1.1933 +/* 0x0b08 ( 4 5) */ srax %o0,32,%o5 1.1934 +/* 0x0b0c ( 4 5) */ ble,a,pt %icc,.L900000742 ! tprob=0.84 1.1935 +/* 0x0b10 ( 4 7) */ ld [%o3],%o0 1.1936 + .L77000224: /* frequency 1.0 confidence 0.0 */ 1.1937 +/* 0x0b14 ( 0 2) */ ret ! Result = 1.1938 +/* 0x0b18 ( 2 3) */ restore %g0,%g0,%g0 1.1939 +/* 0x0b1c 0 ( 0 0) */ .type mont_mulf_noconv,2 1.1940 +/* 0x0b1c ( 0 0) */ .size mont_mulf_noconv,(.-mont_mulf_noconv) 1.1941 +