1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 1.2 +++ b/security/nss/lib/freebl/mpi/montmulfv9.s Wed Dec 31 06:09:35 2014 +0100 1.3 @@ -0,0 +1,2346 @@ 1.4 +! 1.5 +! This Source Code Form is subject to the terms of the Mozilla Public 1.6 +! License, v. 2.0. If a copy of the MPL was not distributed with this 1.7 +! file, You can obtain one at http://mozilla.org/MPL/2.0/. 1.8 + 1.9 + .section ".text",#alloc,#execinstr 1.10 + .file "montmulf.c" 1.11 + 1.12 + .section ".rodata",#alloc 1.13 + .global TwoTo16 1.14 + .align 8 1.15 +! 1.16 +! CONSTANT POOL 1.17 +! 1.18 + .global TwoTo16 1.19 +TwoTo16: 1.20 + .word 1089470464 1.21 + .word 0 1.22 + .type TwoTo16,#object 1.23 + .size TwoTo16,8 1.24 + .global TwoToMinus16 1.25 +! 1.26 +! CONSTANT POOL 1.27 +! 1.28 + .global TwoToMinus16 1.29 +TwoToMinus16: 1.30 + .word 1055916032 1.31 + .word 0 1.32 + .type TwoToMinus16,#object 1.33 + .size TwoToMinus16,8 1.34 + .global Zero 1.35 +! 1.36 +! CONSTANT POOL 1.37 +! 1.38 + .global Zero 1.39 +Zero: 1.40 + .word 0 1.41 + .word 0 1.42 + .type Zero,#object 1.43 + .size Zero,8 1.44 + .global TwoTo32 1.45 +! 1.46 +! CONSTANT POOL 1.47 +! 1.48 + .global TwoTo32 1.49 +TwoTo32: 1.50 + .word 1106247680 1.51 + .word 0 1.52 + .type TwoTo32,#object 1.53 + .size TwoTo32,8 1.54 + .global TwoToMinus32 1.55 +! 1.56 +! CONSTANT POOL 1.57 +! 1.58 + .global TwoToMinus32 1.59 +TwoToMinus32: 1.60 + .word 1039138816 1.61 + .word 0 1.62 + .type TwoToMinus32,#object 1.63 + .size TwoToMinus32,8 1.64 + 1.65 + .section ".text",#alloc,#execinstr 1.66 +/* 000000 0 */ .register %g3,#scratch 1.67 +/* 000000 */ .register %g2,#scratch 1.68 +/* 000000 0 */ .align 8 1.69 +! 1.70 +! SUBROUTINE conv_d16_to_i32 1.71 +! 1.72 +! OFFSET SOURCE LINE LABEL INSTRUCTION 1.73 + 1.74 + .global conv_d16_to_i32 1.75 + conv_d16_to_i32: 1.76 +/* 000000 */ save %sp,-208,%sp 1.77 +! FILE montmulf.c 1.78 + 1.79 +! 1 !/* 1.80 +! 2 ! * The contents of this file are subject to the Mozilla Public 1.81 +! 3 ! 
* License Version 1.1 (the "License"); you may not use this file 1.82 +! 4 ! * except in compliance with the License. You may obtain a copy of 1.83 +! 5 ! * the License at http://www.mozilla.org/MPL/ 1.84 +! 6 ! * 1.85 +! 7 ! * Software distributed under the License is distributed on an "AS 1.86 +! 8 ! * IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or 1.87 +! 9 ! * implied. See the License for the specific language governing 1.88 +! 10 ! * rights and limitations under the License. 1.89 +! 11 ! * 1.90 +! 12 ! * The Original Code is SPARC optimized Montgomery multiply functions. 1.91 +! 13 ! * 1.92 +! 14 ! * The Initial Developer of the Original Code is Sun Microsystems Inc. 1.93 +! 15 ! * Portions created by Sun Microsystems Inc. are 1.94 +! 16 ! * Copyright (C) 1999-2000 Sun Microsystems Inc. All Rights Reserved. 1.95 +! 17 ! * 1.96 +! 18 ! * Contributor(s): 1.97 +! 19 ! * Netscape Communications Corporation 1.98 +! 20 ! * 1.99 +! 21 ! * Alternatively, the contents of this file may be used under the 1.100 +! 22 ! * terms of the GNU General Public License Version 2 or later (the 1.101 +! 23 ! * "GPL"), in which case the provisions of the GPL are applicable 1.102 +! 24 ! * instead of those above. If you wish to allow use of your 1.103 +! 25 ! * version of this file only under the terms of the GPL and not to 1.104 +! 26 ! * allow others to use your version of this file under the MPL, 1.105 +! 27 ! * indicate your decision by deleting the provisions above and 1.106 +! 28 ! * replace them with the notice and other provisions required by 1.107 +! 29 ! * the GPL. If you do not delete the provisions above, a recipient 1.108 +! 30 ! * may use your version of this file under either the MPL or the 1.109 +! 31 ! * GPL. 1.110 +! 34 ! */ 1.111 +! 36 !#define RF_INLINE_MACROS 1.112 +! 38 !static const double TwoTo16=65536.0; 1.113 +! 39 !static const double TwoToMinus16=1.0/65536.0; 1.114 +! 40 !static const double Zero=0.0; 1.115 +! 
41 !static const double TwoTo32=65536.0*65536.0; 1.116 +! 42 !static const double TwoToMinus32=1.0/(65536.0*65536.0); 1.117 +! 44 !#ifdef RF_INLINE_MACROS 1.118 +! 46 !double upper32(double); 1.119 +! 47 !double lower32(double, double); 1.120 +! 48 !double mod(double, double, double); 1.121 +! 50 !void i16_to_d16_and_d32x4(const double * /*1/(2^16)*/, 1.122 +! 51 ! const double * /* 2^16*/, 1.123 +! 52 ! const double * /* 0 */, 1.124 +! 53 ! double * /*result16*/, 1.125 +! 54 ! double * /* result32 */, 1.126 +! 55 ! float * /*source - should be unsigned int* 1.127 +! 56 ! converted to float* */); 1.128 +! 58 !#else 1.129 +! 60 !static double upper32(double x) 1.130 +! 61 !{ 1.131 +! 62 ! return floor(x*TwoToMinus32); 1.132 +! 63 !} 1.133 +! 65 !static double lower32(double x, double y) 1.134 +! 66 !{ 1.135 +! 67 ! return x-TwoTo32*floor(x*TwoToMinus32); 1.136 +! 68 !} 1.137 +! 70 !static double mod(double x, double oneoverm, double m) 1.138 +! 71 !{ 1.139 +! 72 ! return x-m*floor(x*oneoverm); 1.140 +! 73 !} 1.141 +! 75 !#endif 1.142 +! 78 !static void cleanup(double *dt, int from, int tlen) 1.143 +! 79 !{ 1.144 +! 80 ! int i; 1.145 +! 81 ! double tmp,tmp1,x,x1; 1.146 +! 83 ! tmp=tmp1=Zero; 1.147 +! 84 ! /* original code ** 1.148 +! 85 ! for(i=2*from;i<2*tlen-2;i++) 1.149 +! 86 ! { 1.150 +! 87 ! x=dt[i]; 1.151 +! 88 ! dt[i]=lower32(x,Zero)+tmp1; 1.152 +! 89 ! tmp1=tmp; 1.153 +! 90 ! tmp=upper32(x); 1.154 +! 91 ! } 1.155 +! 92 ! dt[tlen-2]+=tmp1; 1.156 +! 93 ! dt[tlen-1]+=tmp; 1.157 +! 94 ! **end original code ***/ 1.158 +! 95 ! /* new code ***/ 1.159 +! 96 ! for(i=2*from;i<2*tlen;i+=2) 1.160 +! 97 ! { 1.161 +! 98 ! x=dt[i]; 1.162 +! 99 ! x1=dt[i+1]; 1.163 +! 100 ! dt[i]=lower32(x,Zero)+tmp; 1.164 +! 101 ! dt[i+1]=lower32(x1,Zero)+tmp1; 1.165 +! 102 ! tmp=upper32(x); 1.166 +! 103 ! tmp1=upper32(x1); 1.167 +! 104 ! } 1.168 +! 105 ! /** end new code **/ 1.169 +! 106 !} 1.170 +! 109 !void conv_d16_to_i32(unsigned int *i32, double *d16, long long *tmp, int ilen) 1.171 +! 
110 !{ 1.172 +! 111 !int i; 1.173 +! 112 !long long t, t1, a, b, c, d; 1.174 +! 114 ! t1=0; 1.175 +! 115 ! a=(long long)d16[0]; 1.176 + 1.177 +/* 0x0004 115 */ ldd [%i1],%f2 1.178 + 1.179 +! 116 ! b=(long long)d16[1]; 1.180 +! 117 ! for(i=0; i<ilen-1; i++) 1.181 + 1.182 +/* 0x0008 117 */ sub %i3,1,%o1 1.183 +/* 0x000c 110 */ or %g0,%i0,%g1 1.184 +/* 0x0010 116 */ ldd [%i1+8],%f4 1.185 +/* 0x0014 117 */ cmp %o1,0 1.186 +/* 0x0018 114 */ or %g0,0,%g5 1.187 +/* 0x001c 115 */ fdtox %f2,%f2 1.188 +/* 0x0020 */ std %f2,[%sp+2247] 1.189 +/* 0x0024 117 */ or %g0,0,%o0 1.190 +/* 0x0028 116 */ fdtox %f4,%f2 1.191 +/* 0x002c */ std %f2,[%sp+2239] 1.192 +/* 0x0030 110 */ sub %o1,1,%o7 1.193 +/* 0x0034 */ or %g0,%i1,%o4 1.194 +/* 0x0038 */ sethi %hi(0xfc00),%o3 1.195 +/* 0x003c */ or %g0,-1,%o1 1.196 +/* 0x0040 */ or %g0,2,%i1 1.197 +/* 0x0044 */ srl %o1,0,%g3 1.198 +/* 0x0048 */ or %g0,%o4,%g4 1.199 +/* 0x004c 116 */ ldx [%sp+2239],%i2 1.200 +/* 0x0050 */ add %o3,1023,%o5 1.201 +/* 0x0054 117 */ sub %o7,1,%o2 1.202 +/* 0x0058 115 */ ldx [%sp+2247],%i3 1.203 +/* 0x005c 117 */ ble,pt %icc,.L900000113 1.204 +/* 0x0060 */ sethi %hi(0xfc00),%g2 1.205 +/* 0x0064 */ add %o7,1,%g2 1.206 + 1.207 +! 118 ! { 1.208 +! 119 ! c=(long long)d16[2*i+2]; 1.209 +! 120 ! t1+=a&0xffffffff; 1.210 +! 121 ! t=(a>>32); 1.211 +! 122 ! d=(long long)d16[2*i+3]; 1.212 +! 123 ! t1+=(b&0xffff)<<16; 1.213 + 1.214 +/* 0x0068 123 */ and %i2,%o5,%i4 1.215 +/* 0x006c */ sllx %i4,16,%o1 1.216 +/* 0x0070 117 */ cmp %g2,6 1.217 +/* 0x0074 */ bl,pn %icc,.L77000134 1.218 +/* 0x0078 */ or %g0,3,%i0 1.219 +/* 0x007c 119 */ ldd [%o4+16],%f0 1.220 +/* 0x0080 120 */ and %i3,%g3,%o3 1.221 + 1.222 +! 124 ! t+=(b>>16)+(t1>>32); 1.223 + 1.224 +/* 0x0084 124 */ srax %i2,16,%i5 1.225 +/* 0x0088 117 */ add %o3,%o1,%i4 1.226 +/* 0x008c 121 */ srax %i3,32,%i3 1.227 +/* 0x0090 119 */ fdtox %f0,%f0 1.228 +/* 0x0094 */ std %f0,[%sp+2231] 1.229 + 1.230 +! 125 ! 
i32[i]=t1&0xffffffff; 1.231 + 1.232 +/* 0x0098 125 */ and %i4,%g3,%l0 1.233 +/* 0x009c 117 */ or %g0,72,%o3 1.234 +/* 0x00a0 122 */ ldd [%g4+24],%f0 1.235 +/* 0x00a4 117 */ or %g0,64,%o4 1.236 +/* 0x00a8 */ or %g0,4,%o1 1.237 + 1.238 +! 126 ! t1=t; 1.239 +! 127 ! a=c; 1.240 +! 128 ! b=d; 1.241 + 1.242 +/* 0x00ac 128 */ or %g0,5,%i0 1.243 +/* 0x00b0 */ or %g0,4,%i1 1.244 +/* 0x00b4 119 */ ldx [%sp+2231],%g2 1.245 +/* 0x00b8 122 */ fdtox %f0,%f0 1.246 +/* 0x00bc 128 */ or %g0,4,%o0 1.247 +/* 0x00c0 122 */ std %f0,[%sp+2223] 1.248 +/* 0x00c4 */ ldd [%g4+40],%f2 1.249 +/* 0x00c8 120 */ and %g2,%g3,%i2 1.250 +/* 0x00cc 119 */ ldd [%g4+32],%f0 1.251 +/* 0x00d0 121 */ srax %g2,32,%g2 1.252 +/* 0x00d4 122 */ ldd [%g4+56],%f4 1.253 +/* 0x00d8 */ fdtox %f2,%f2 1.254 +/* 0x00dc */ ldx [%sp+2223],%g5 1.255 +/* 0x00e0 119 */ fdtox %f0,%f0 1.256 +/* 0x00e4 125 */ st %l0,[%g1] 1.257 +/* 0x00e8 124 */ srax %i4,32,%l0 1.258 +/* 0x00ec 122 */ fdtox %f4,%f4 1.259 +/* 0x00f0 */ std %f2,[%sp+2223] 1.260 +/* 0x00f4 123 */ and %g5,%o5,%i4 1.261 +/* 0x00f8 124 */ add %i5,%l0,%i5 1.262 +/* 0x00fc 119 */ std %f0,[%sp+2231] 1.263 +/* 0x0100 123 */ sllx %i4,16,%i4 1.264 +/* 0x0104 124 */ add %i3,%i5,%i3 1.265 +/* 0x0108 119 */ ldd [%g4+48],%f2 1.266 +/* 0x010c 124 */ srax %g5,16,%g5 1.267 +/* 0x0110 117 */ add %i2,%i4,%i2 1.268 +/* 0x0114 122 */ ldd [%g4+72],%f0 1.269 +/* 0x0118 117 */ add %i2,%i3,%i4 1.270 +/* 0x011c 124 */ srax %i4,32,%i5 1.271 +/* 0x0120 119 */ fdtox %f2,%f2 1.272 +/* 0x0124 125 */ and %i4,%g3,%i4 1.273 +/* 0x0128 122 */ ldx [%sp+2223],%i2 1.274 +/* 0x012c 124 */ add %g5,%i5,%g5 1.275 +/* 0x0130 119 */ ldx [%sp+2231],%i3 1.276 +/* 0x0134 124 */ add %g2,%g5,%g5 1.277 +/* 0x0138 119 */ std %f2,[%sp+2231] 1.278 +/* 0x013c 122 */ std %f4,[%sp+2223] 1.279 +/* 0x0140 119 */ ldd [%g4+64],%f2 1.280 +/* 0x0144 125 */ st %i4,[%g1+4] 1.281 + .L900000108: 1.282 +/* 0x0148 122 */ ldx [%sp+2223],%i4 1.283 +/* 0x014c 128 */ add %o0,2,%o0 1.284 +/* 0x0150 */ add %i0,4,%i0 1.285 +/* 0x0154 
119 */ ldx [%sp+2231],%l0 1.286 +/* 0x0158 117 */ add %o3,16,%o3 1.287 +/* 0x015c 123 */ and %i2,%o5,%g2 1.288 +/* 0x0160 */ sllx %g2,16,%i5 1.289 +/* 0x0164 120 */ and %i3,%g3,%g2 1.290 +/* 0x0168 122 */ ldd [%g4+%o3],%f4 1.291 +/* 0x016c */ fdtox %f0,%f0 1.292 +/* 0x0170 */ std %f0,[%sp+2223] 1.293 +/* 0x0174 124 */ srax %i2,16,%i2 1.294 +/* 0x0178 117 */ add %g2,%i5,%g2 1.295 +/* 0x017c 119 */ fdtox %f2,%f0 1.296 +/* 0x0180 117 */ add %o4,16,%o4 1.297 +/* 0x0184 119 */ std %f0,[%sp+2231] 1.298 +/* 0x0188 117 */ add %g2,%g5,%g2 1.299 +/* 0x018c 119 */ ldd [%g4+%o4],%f2 1.300 +/* 0x0190 124 */ srax %g2,32,%i5 1.301 +/* 0x0194 128 */ cmp %o0,%o2 1.302 +/* 0x0198 121 */ srax %i3,32,%g5 1.303 +/* 0x019c 124 */ add %i2,%i5,%i2 1.304 +/* 0x01a0 */ add %g5,%i2,%i5 1.305 +/* 0x01a4 117 */ add %o1,4,%o1 1.306 +/* 0x01a8 125 */ and %g2,%g3,%g2 1.307 +/* 0x01ac 127 */ or %g0,%l0,%g5 1.308 +/* 0x01b0 125 */ st %g2,[%g1+%o1] 1.309 +/* 0x01b4 128 */ add %i1,4,%i1 1.310 +/* 0x01b8 122 */ ldx [%sp+2223],%i2 1.311 +/* 0x01bc 119 */ ldx [%sp+2231],%i3 1.312 +/* 0x01c0 117 */ add %o3,16,%o3 1.313 +/* 0x01c4 123 */ and %i4,%o5,%g2 1.314 +/* 0x01c8 */ sllx %g2,16,%l0 1.315 +/* 0x01cc 120 */ and %g5,%g3,%g2 1.316 +/* 0x01d0 122 */ ldd [%g4+%o3],%f0 1.317 +/* 0x01d4 */ fdtox %f4,%f4 1.318 +/* 0x01d8 */ std %f4,[%sp+2223] 1.319 +/* 0x01dc 124 */ srax %i4,16,%i4 1.320 +/* 0x01e0 117 */ add %g2,%l0,%g2 1.321 +/* 0x01e4 119 */ fdtox %f2,%f2 1.322 +/* 0x01e8 117 */ add %o4,16,%o4 1.323 +/* 0x01ec 119 */ std %f2,[%sp+2231] 1.324 +/* 0x01f0 117 */ add %g2,%i5,%g2 1.325 +/* 0x01f4 119 */ ldd [%g4+%o4],%f2 1.326 +/* 0x01f8 124 */ srax %g2,32,%i5 1.327 +/* 0x01fc 121 */ srax %g5,32,%g5 1.328 +/* 0x0200 124 */ add %i4,%i5,%i4 1.329 +/* 0x0204 */ add %g5,%i4,%g5 1.330 +/* 0x0208 117 */ add %o1,4,%o1 1.331 +/* 0x020c 125 */ and %g2,%g3,%g2 1.332 +/* 0x0210 128 */ ble,pt %icc,.L900000108 1.333 +/* 0x0214 */ st %g2,[%g1+%o1] 1.334 + .L900000111: 1.335 +/* 0x0218 122 */ ldx [%sp+2223],%o2 1.336 +/* 
0x021c 123 */ and %i2,%o5,%i4 1.337 +/* 0x0220 120 */ and %i3,%g3,%g2 1.338 +/* 0x0224 123 */ sllx %i4,16,%i4 1.339 +/* 0x0228 119 */ ldx [%sp+2231],%i5 1.340 +/* 0x022c 128 */ cmp %o0,%o7 1.341 +/* 0x0230 124 */ srax %i2,16,%i2 1.342 +/* 0x0234 117 */ add %g2,%i4,%g2 1.343 +/* 0x0238 122 */ fdtox %f0,%f4 1.344 +/* 0x023c */ std %f4,[%sp+2223] 1.345 +/* 0x0240 117 */ add %g2,%g5,%g5 1.346 +/* 0x0244 123 */ and %o2,%o5,%l0 1.347 +/* 0x0248 124 */ srax %g5,32,%l1 1.348 +/* 0x024c 120 */ and %i5,%g3,%i4 1.349 +/* 0x0250 119 */ fdtox %f2,%f0 1.350 +/* 0x0254 121 */ srax %i3,32,%g2 1.351 +/* 0x0258 119 */ std %f0,[%sp+2231] 1.352 +/* 0x025c 124 */ add %i2,%l1,%i2 1.353 +/* 0x0260 123 */ sllx %l0,16,%i3 1.354 +/* 0x0264 124 */ add %g2,%i2,%i2 1.355 +/* 0x0268 */ srax %o2,16,%o2 1.356 +/* 0x026c 117 */ add %o1,4,%g2 1.357 +/* 0x0270 */ add %i4,%i3,%o1 1.358 +/* 0x0274 125 */ and %g5,%g3,%g5 1.359 +/* 0x0278 */ st %g5,[%g1+%g2] 1.360 +/* 0x027c 119 */ ldx [%sp+2231],%i3 1.361 +/* 0x0280 117 */ add %o1,%i2,%o1 1.362 +/* 0x0284 */ add %g2,4,%g2 1.363 +/* 0x0288 124 */ srax %o1,32,%i4 1.364 +/* 0x028c 122 */ ldx [%sp+2223],%i2 1.365 +/* 0x0290 125 */ and %o1,%g3,%g5 1.366 +/* 0x0294 121 */ srax %i5,32,%o1 1.367 +/* 0x0298 124 */ add %o2,%i4,%o2 1.368 +/* 0x029c 125 */ st %g5,[%g1+%g2] 1.369 +/* 0x02a0 128 */ bg,pn %icc,.L77000127 1.370 +/* 0x02a4 */ add %o1,%o2,%g5 1.371 +/* 0x02a8 */ add %i0,6,%i0 1.372 +/* 0x02ac */ add %i1,6,%i1 1.373 + .L77000134: 1.374 +/* 0x02b0 119 */ sra %i1,0,%o2 1.375 + .L900000112: 1.376 +/* 0x02b4 119 */ sllx %o2,3,%o3 1.377 +/* 0x02b8 120 */ and %i3,%g3,%o1 1.378 +/* 0x02bc 119 */ ldd [%g4+%o3],%f0 1.379 +/* 0x02c0 122 */ sra %i0,0,%o3 1.380 +/* 0x02c4 123 */ and %i2,%o5,%o2 1.381 +/* 0x02c8 122 */ sllx %o3,3,%o3 1.382 +/* 0x02cc 120 */ add %g5,%o1,%o1 1.383 +/* 0x02d0 119 */ fdtox %f0,%f0 1.384 +/* 0x02d4 */ std %f0,[%sp+2231] 1.385 +/* 0x02d8 123 */ sllx %o2,16,%o2 1.386 +/* 0x02dc */ add %o1,%o2,%o2 1.387 +/* 0x02e0 128 */ add %i1,2,%i1 1.388 
+/* 0x02e4 122 */ ldd [%g4+%o3],%f0 1.389 +/* 0x02e8 124 */ srax %o2,32,%g2 1.390 +/* 0x02ec 125 */ and %o2,%g3,%o3 1.391 +/* 0x02f0 124 */ srax %i2,16,%o1 1.392 +/* 0x02f4 128 */ add %i0,2,%i0 1.393 +/* 0x02f8 122 */ fdtox %f0,%f0 1.394 +/* 0x02fc */ std %f0,[%sp+2223] 1.395 +/* 0x0300 125 */ sra %o0,0,%o2 1.396 +/* 0x0304 */ sllx %o2,2,%o2 1.397 +/* 0x0308 124 */ add %o1,%g2,%g5 1.398 +/* 0x030c 121 */ srax %i3,32,%g2 1.399 +/* 0x0310 128 */ add %o0,1,%o0 1.400 +/* 0x0314 124 */ add %g2,%g5,%g5 1.401 +/* 0x0318 128 */ cmp %o0,%o7 1.402 +/* 0x031c 119 */ ldx [%sp+2231],%o4 1.403 +/* 0x0320 122 */ ldx [%sp+2223],%i2 1.404 +/* 0x0324 125 */ st %o3,[%g1+%o2] 1.405 +/* 0x0328 127 */ or %g0,%o4,%i3 1.406 +/* 0x032c 128 */ ble,pt %icc,.L900000112 1.407 +/* 0x0330 */ sra %i1,0,%o2 1.408 + .L77000127: 1.409 + 1.410 +! 129 ! } 1.411 +! 130 ! t1+=a&0xffffffff; 1.412 +! 131 ! t=(a>>32); 1.413 +! 132 ! t1+=(b&0xffff)<<16; 1.414 +! 133 ! i32[i]=t1&0xffffffff; 1.415 + 1.416 +/* 0x0334 133 */ sethi %hi(0xfc00),%g2 1.417 + .L900000113: 1.418 +/* 0x0338 133 */ or %g0,-1,%g3 1.419 +/* 0x033c */ add %g2,1023,%g2 1.420 +/* 0x0340 */ srl %g3,0,%g3 1.421 +/* 0x0344 */ and %i2,%g2,%g2 1.422 +/* 0x0348 */ and %i3,%g3,%g4 1.423 +/* 0x034c */ sllx %g2,16,%g2 1.424 +/* 0x0350 */ add %g5,%g4,%g4 1.425 +/* 0x0354 */ sra %o0,0,%g5 1.426 +/* 0x0358 */ add %g4,%g2,%g4 1.427 +/* 0x035c */ sllx %g5,2,%g2 1.428 +/* 0x0360 */ and %g4,%g3,%g3 1.429 +/* 0x0364 */ st %g3,[%g1+%g2] 1.430 +/* 0x0368 */ ret ! Result = 1.431 +/* 0x036c */ restore %g0,%g0,%g0 1.432 +/* 0x0370 0 */ .type conv_d16_to_i32,2 1.433 +/* 0x0370 */ .size conv_d16_to_i32,(.-conv_d16_to_i32) 1.434 + 1.435 + .section ".text",#alloc,#execinstr 1.436 +/* 000000 0 */ .align 8 1.437 +! 1.438 +! CONSTANT POOL 1.439 +! 1.440 + .L_const_seg_900000201: 1.441 +/* 000000 0 */ .word 1127219200,0 1.442 +/* 0x0008 0 */ .align 8 1.443 +/* 0x0008 */ .skip 24 1.444 +! 1.445 +! SUBROUTINE conv_i32_to_d32 1.446 +! 1.447 +! 
OFFSET SOURCE LINE LABEL INSTRUCTION 1.448 + 1.449 + .global conv_i32_to_d32 1.450 + conv_i32_to_d32: 1.451 +/* 000000 */ or %g0,%o7,%g3 1.452 + 1.453 +! 135 !} 1.454 +! 137 !void conv_i32_to_d32(double *d32, unsigned int *i32, int len) 1.455 +! 138 !{ 1.456 +! 139 !int i; 1.457 +! 141 !#pragma pipeloop(0) 1.458 +! 142 ! for(i=0;i<len;i++) d32[i]=(double)(i32[i]); 1.459 + 1.460 +/* 0x0004 142 */ cmp %o2,0 1.461 + .L900000210: 1.462 +/* 0x0008 */ call .+8 1.463 +/* 0x000c */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000210-.)),%g4 1.464 +/* 0x0010 142 */ or %g0,0,%o3 1.465 +/* 0x0014 138 */ add %g4,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000210-.)),%g4 1.466 +/* 0x0018 142 */ sub %o2,1,%o4 1.467 +/* 0x001c 138 */ add %g4,%o7,%g1 1.468 +/* 0x0020 142 */ ble,pt %icc,.L77000140 1.469 +/* 0x0024 */ or %g0,%g3,%o7 1.470 +/* 0x0028 */ sethi %hi(.L_const_seg_900000201),%g3 1.471 +/* 0x002c */ cmp %o2,12 1.472 +/* 0x0030 */ add %g3,%lo(.L_const_seg_900000201),%g2 1.473 +/* 0x0034 */ or %g0,%o1,%g5 1.474 +/* 0x0038 */ ldx [%g1+%g2],%g4 1.475 +/* 0x003c */ or %g0,0,%g1 1.476 +/* 0x0040 */ or %g0,24,%g2 1.477 +/* 0x0044 */ bl,pn %icc,.L77000144 1.478 +/* 0x0048 */ or %g0,0,%g3 1.479 +/* 0x004c */ ld [%o1],%f13 1.480 +/* 0x0050 */ or %g0,7,%o3 1.481 +/* 0x0054 */ ldd [%g4],%f8 1.482 +/* 0x0058 */ sub %o2,5,%g3 1.483 +/* 0x005c */ or %g0,8,%g1 1.484 +/* 0x0060 */ ld [%o1+4],%f11 1.485 +/* 0x0064 */ ld [%o1+8],%f7 1.486 +/* 0x0068 */ fmovs %f8,%f12 1.487 +/* 0x006c */ ld [%o1+12],%f5 1.488 +/* 0x0070 */ fmovs %f8,%f10 1.489 +/* 0x0074 */ ld [%o1+16],%f3 1.490 +/* 0x0078 */ fmovs %f8,%f6 1.491 +/* 0x007c */ ld [%o1+20],%f1 1.492 +/* 0x0080 */ fsubd %f12,%f8,%f12 1.493 +/* 0x0084 */ std %f12,[%o0] 1.494 +/* 0x0088 */ fsubd %f10,%f8,%f10 1.495 +/* 0x008c */ std %f10,[%o0+8] 1.496 + .L900000205: 1.497 +/* 0x0090 */ ld [%o1+%g2],%f11 1.498 +/* 0x0094 */ add %g1,8,%g1 1.499 +/* 0x0098 */ add %o3,5,%o3 1.500 +/* 0x009c */ fsubd %f6,%f8,%f6 1.501 +/* 0x00a0 */ add %g2,4,%g2 1.502 +/* 
0x00a4 */ std %f6,[%o0+%g1] 1.503 +/* 0x00a8 */ cmp %o3,%g3 1.504 +/* 0x00ac */ fmovs %f8,%f4 1.505 +/* 0x00b0 */ ld [%o1+%g2],%f7 1.506 +/* 0x00b4 */ fsubd %f4,%f8,%f12 1.507 +/* 0x00b8 */ add %g1,8,%g1 1.508 +/* 0x00bc */ add %g2,4,%g2 1.509 +/* 0x00c0 */ fmovs %f8,%f2 1.510 +/* 0x00c4 */ std %f12,[%o0+%g1] 1.511 +/* 0x00c8 */ ld [%o1+%g2],%f5 1.512 +/* 0x00cc */ fsubd %f2,%f8,%f12 1.513 +/* 0x00d0 */ add %g1,8,%g1 1.514 +/* 0x00d4 */ add %g2,4,%g2 1.515 +/* 0x00d8 */ fmovs %f8,%f0 1.516 +/* 0x00dc */ std %f12,[%o0+%g1] 1.517 +/* 0x00e0 */ ld [%o1+%g2],%f3 1.518 +/* 0x00e4 */ fsubd %f0,%f8,%f12 1.519 +/* 0x00e8 */ add %g1,8,%g1 1.520 +/* 0x00ec */ add %g2,4,%g2 1.521 +/* 0x00f0 */ fmovs %f8,%f10 1.522 +/* 0x00f4 */ std %f12,[%o0+%g1] 1.523 +/* 0x00f8 */ ld [%o1+%g2],%f1 1.524 +/* 0x00fc */ fsubd %f10,%f8,%f10 1.525 +/* 0x0100 */ add %g1,8,%g1 1.526 +/* 0x0104 */ add %g2,4,%g2 1.527 +/* 0x0108 */ std %f10,[%o0+%g1] 1.528 +/* 0x010c */ ble,pt %icc,.L900000205 1.529 +/* 0x0110 */ fmovs %f8,%f6 1.530 + .L900000208: 1.531 +/* 0x0114 */ fmovs %f8,%f4 1.532 +/* 0x0118 */ ld [%o1+%g2],%f11 1.533 +/* 0x011c */ add %g1,8,%g3 1.534 +/* 0x0120 */ fmovs %f8,%f2 1.535 +/* 0x0124 */ add %g1,16,%g1 1.536 +/* 0x0128 */ cmp %o3,%o4 1.537 +/* 0x012c */ fmovs %f8,%f0 1.538 +/* 0x0130 */ add %g1,8,%o1 1.539 +/* 0x0134 */ add %g1,16,%o2 1.540 +/* 0x0138 */ fmovs %f8,%f10 1.541 +/* 0x013c */ add %g1,24,%g2 1.542 +/* 0x0140 */ fsubd %f6,%f8,%f6 1.543 +/* 0x0144 */ std %f6,[%o0+%g3] 1.544 +/* 0x0148 */ fsubd %f4,%f8,%f4 1.545 +/* 0x014c */ std %f4,[%o0+%g1] 1.546 +/* 0x0150 */ sra %o3,0,%g1 1.547 +/* 0x0154 */ fsubd %f2,%f8,%f2 1.548 +/* 0x0158 */ std %f2,[%o0+%o1] 1.549 +/* 0x015c */ sllx %g1,2,%g3 1.550 +/* 0x0160 */ fsubd %f0,%f8,%f0 1.551 +/* 0x0164 */ std %f0,[%o0+%o2] 1.552 +/* 0x0168 */ fsubd %f10,%f8,%f0 1.553 +/* 0x016c */ bg,pn %icc,.L77000140 1.554 +/* 0x0170 */ std %f0,[%o0+%g2] 1.555 + .L77000144: 1.556 +/* 0x0174 */ ldd [%g4],%f8 1.557 + .L900000211: 1.558 +/* 0x0178 */ ld 
[%g5+%g3],%f13 1.559 +/* 0x017c */ sllx %g1,3,%g2 1.560 +/* 0x0180 */ add %o3,1,%o3 1.561 +/* 0x0184 */ sra %o3,0,%g1 1.562 +/* 0x0188 */ cmp %o3,%o4 1.563 +/* 0x018c */ fmovs %f8,%f12 1.564 +/* 0x0190 */ sllx %g1,2,%g3 1.565 +/* 0x0194 */ fsubd %f12,%f8,%f0 1.566 +/* 0x0198 */ std %f0,[%o0+%g2] 1.567 +/* 0x019c */ ble,a,pt %icc,.L900000211 1.568 +/* 0x01a0 */ ldd [%g4],%f8 1.569 + .L77000140: 1.570 +/* 0x01a4 */ retl ! Result = 1.571 +/* 0x01a8 */ nop 1.572 +/* 0x01ac 0 */ .type conv_i32_to_d32,2 1.573 +/* 0x01ac */ .size conv_i32_to_d32,(.-conv_i32_to_d32) 1.574 + 1.575 + .section ".text",#alloc,#execinstr 1.576 +/* 000000 0 */ .align 8 1.577 +! 1.578 +! CONSTANT POOL 1.579 +! 1.580 + .L_const_seg_900000301: 1.581 +/* 000000 0 */ .word 1127219200,0 1.582 +/* 0x0008 0 */ .align 8 1.583 +/* 0x0008 */ .skip 24 1.584 +! 1.585 +! SUBROUTINE conv_i32_to_d16 1.586 +! 1.587 +! OFFSET SOURCE LINE LABEL INSTRUCTION 1.588 + 1.589 + .global conv_i32_to_d16 1.590 + conv_i32_to_d16: 1.591 +/* 000000 */ save %sp,-192,%sp 1.592 + .L900000310: 1.593 +/* 0x0004 */ call .+8 1.594 +/* 0x0008 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000310-.)),%g3 1.595 + 1.596 +! 143 !} 1.597 +! 146 !void conv_i32_to_d16(double *d16, unsigned int *i32, int len) 1.598 +! 147 !{ 1.599 +! 148 !int i; 1.600 +! 149 !unsigned int a; 1.601 +! 151 !#pragma pipeloop(0) 1.602 +! 152 ! for(i=0;i<len;i++) 1.603 + 1.604 +/* 0x000c 152 */ cmp %i2,0 1.605 +/* 0x0010 147 */ add %g3,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000310-.)),%g3 1.606 +/* 0x0014 152 */ ble,pt %icc,.L77000150 1.607 +/* 0x0018 */ add %g3,%o7,%o0 1.608 + 1.609 +! 153 ! { 1.610 +! 154 ! a=i32[i]; 1.611 +! 155 ! d16[2*i]=(double)(a&0xffff); 1.612 +! 156 ! 
d16[2*i+1]=(double)(a>>16); 1.613 + 1.614 +/* 0x001c 156 */ sethi %hi(.L_const_seg_900000301),%g2 1.615 +/* 0x0020 147 */ or %g0,%i2,%o1 1.616 +/* 0x0024 152 */ sethi %hi(0xfc00),%g3 1.617 +/* 0x0028 156 */ add %g2,%lo(.L_const_seg_900000301),%g2 1.618 +/* 0x002c 152 */ or %g0,%o1,%g4 1.619 +/* 0x0030 156 */ ldx [%o0+%g2],%o5 1.620 +/* 0x0034 152 */ add %g3,1023,%g1 1.621 +/* 0x0038 147 */ or %g0,%i1,%o7 1.622 +/* 0x003c 152 */ or %g0,0,%i2 1.623 +/* 0x0040 */ sub %o1,1,%g5 1.624 +/* 0x0044 */ or %g0,0,%g3 1.625 +/* 0x0048 */ or %g0,1,%g2 1.626 +/* 0x004c 154 */ or %g0,0,%o2 1.627 +/* 0x0050 */ cmp %g4,6 1.628 +/* 0x0054 152 */ bl,pn %icc,.L77000154 1.629 +/* 0x0058 */ ldd [%o5],%f0 1.630 +/* 0x005c */ sub %o1,2,%o3 1.631 +/* 0x0060 */ or %g0,16,%o2 1.632 +/* 0x0064 154 */ ld [%i1],%o4 1.633 +/* 0x0068 156 */ or %g0,3,%g2 1.634 +/* 0x006c */ or %g0,2,%g3 1.635 +/* 0x0070 155 */ fmovs %f0,%f2 1.636 +/* 0x0074 156 */ or %g0,4,%i2 1.637 +/* 0x0078 155 */ and %o4,%g1,%o0 1.638 +/* 0x007c */ st %o0,[%sp+2227] 1.639 +/* 0x0080 */ fmovs %f0,%f4 1.640 +/* 0x0084 156 */ srl %o4,16,%i4 1.641 +/* 0x0088 152 */ or %g0,12,%o4 1.642 +/* 0x008c */ or %g0,24,%o0 1.643 +/* 0x0090 155 */ ld [%sp+2227],%f3 1.644 +/* 0x0094 */ fsubd %f2,%f0,%f2 1.645 +/* 0x0098 */ std %f2,[%i0] 1.646 +/* 0x009c 156 */ st %i4,[%sp+2223] 1.647 +/* 0x00a0 154 */ ld [%o7+4],%o1 1.648 +/* 0x00a4 156 */ fmovs %f0,%f2 1.649 +/* 0x00a8 155 */ and %o1,%g1,%i1 1.650 +/* 0x00ac 156 */ ld [%sp+2223],%f3 1.651 +/* 0x00b0 */ srl %o1,16,%o1 1.652 +/* 0x00b4 */ fsubd %f2,%f0,%f2 1.653 +/* 0x00b8 */ std %f2,[%i0+8] 1.654 +/* 0x00bc */ st %o1,[%sp+2223] 1.655 +/* 0x00c0 155 */ st %i1,[%sp+2227] 1.656 +/* 0x00c4 154 */ ld [%o7+8],%o1 1.657 +/* 0x00c8 156 */ fmovs %f0,%f2 1.658 +/* 0x00cc 155 */ and %o1,%g1,%g4 1.659 +/* 0x00d0 */ ld [%sp+2227],%f5 1.660 +/* 0x00d4 156 */ srl %o1,16,%o1 1.661 +/* 0x00d8 */ ld [%sp+2223],%f3 1.662 +/* 0x00dc */ st %o1,[%sp+2223] 1.663 +/* 0x00e0 155 */ fsubd %f4,%f0,%f4 1.664 +/* 0x00e4 
*/ st %g4,[%sp+2227] 1.665 +/* 0x00e8 156 */ fsubd %f2,%f0,%f2 1.666 +/* 0x00ec 154 */ ld [%o7+12],%o1 1.667 +/* 0x00f0 155 */ std %f4,[%i0+16] 1.668 +/* 0x00f4 156 */ std %f2,[%i0+24] 1.669 + .L900000306: 1.670 +/* 0x00f8 155 */ ld [%sp+2227],%f5 1.671 +/* 0x00fc 156 */ add %i2,2,%i2 1.672 +/* 0x0100 */ add %g2,4,%g2 1.673 +/* 0x0104 */ ld [%sp+2223],%f3 1.674 +/* 0x0108 */ cmp %i2,%o3 1.675 +/* 0x010c */ add %g3,4,%g3 1.676 +/* 0x0110 155 */ and %o1,%g1,%g4 1.677 +/* 0x0114 156 */ srl %o1,16,%o1 1.678 +/* 0x0118 155 */ st %g4,[%sp+2227] 1.679 +/* 0x011c 156 */ st %o1,[%sp+2223] 1.680 +/* 0x0120 152 */ add %o4,4,%o1 1.681 +/* 0x0124 154 */ ld [%o7+%o1],%o4 1.682 +/* 0x0128 156 */ fmovs %f0,%f2 1.683 +/* 0x012c 155 */ fmovs %f0,%f4 1.684 +/* 0x0130 */ fsubd %f4,%f0,%f4 1.685 +/* 0x0134 152 */ add %o2,16,%o2 1.686 +/* 0x0138 156 */ fsubd %f2,%f0,%f2 1.687 +/* 0x013c 155 */ std %f4,[%i0+%o2] 1.688 +/* 0x0140 152 */ add %o0,16,%o0 1.689 +/* 0x0144 156 */ std %f2,[%i0+%o0] 1.690 +/* 0x0148 155 */ ld [%sp+2227],%f5 1.691 +/* 0x014c 156 */ ld [%sp+2223],%f3 1.692 +/* 0x0150 155 */ and %o4,%g1,%g4 1.693 +/* 0x0154 156 */ srl %o4,16,%o4 1.694 +/* 0x0158 155 */ st %g4,[%sp+2227] 1.695 +/* 0x015c 156 */ st %o4,[%sp+2223] 1.696 +/* 0x0160 152 */ add %o1,4,%o4 1.697 +/* 0x0164 154 */ ld [%o7+%o4],%o1 1.698 +/* 0x0168 156 */ fmovs %f0,%f2 1.699 +/* 0x016c 155 */ fmovs %f0,%f4 1.700 +/* 0x0170 */ fsubd %f4,%f0,%f4 1.701 +/* 0x0174 152 */ add %o2,16,%o2 1.702 +/* 0x0178 156 */ fsubd %f2,%f0,%f2 1.703 +/* 0x017c 155 */ std %f4,[%i0+%o2] 1.704 +/* 0x0180 152 */ add %o0,16,%o0 1.705 +/* 0x0184 156 */ ble,pt %icc,.L900000306 1.706 +/* 0x0188 */ std %f2,[%i0+%o0] 1.707 + .L900000309: 1.708 +/* 0x018c 155 */ ld [%sp+2227],%f5 1.709 +/* 0x0190 156 */ fmovs %f0,%f2 1.710 +/* 0x0194 */ srl %o1,16,%o3 1.711 +/* 0x0198 */ ld [%sp+2223],%f3 1.712 +/* 0x019c 155 */ and %o1,%g1,%i1 1.713 +/* 0x01a0 152 */ add %o2,16,%g4 1.714 +/* 0x01a4 155 */ fmovs %f0,%f4 1.715 +/* 0x01a8 */ st 
%i1,[%sp+2227] 1.716 +/* 0x01ac 152 */ add %o0,16,%o2 1.717 +/* 0x01b0 156 */ st %o3,[%sp+2223] 1.718 +/* 0x01b4 154 */ sra %i2,0,%o3 1.719 +/* 0x01b8 152 */ add %g4,16,%o1 1.720 +/* 0x01bc 155 */ fsubd %f4,%f0,%f4 1.721 +/* 0x01c0 */ std %f4,[%i0+%g4] 1.722 +/* 0x01c4 152 */ add %o0,32,%o0 1.723 +/* 0x01c8 156 */ fsubd %f2,%f0,%f2 1.724 +/* 0x01cc */ std %f2,[%i0+%o2] 1.725 +/* 0x01d0 */ sllx %o3,2,%o2 1.726 +/* 0x01d4 155 */ ld [%sp+2227],%f5 1.727 +/* 0x01d8 156 */ cmp %i2,%g5 1.728 +/* 0x01dc */ add %g2,6,%g2 1.729 +/* 0x01e0 */ ld [%sp+2223],%f3 1.730 +/* 0x01e4 */ add %g3,6,%g3 1.731 +/* 0x01e8 155 */ fmovs %f0,%f4 1.732 +/* 0x01ec 156 */ fmovs %f0,%f2 1.733 +/* 0x01f0 155 */ fsubd %f4,%f0,%f4 1.734 +/* 0x01f4 */ std %f4,[%i0+%o1] 1.735 +/* 0x01f8 156 */ fsubd %f2,%f0,%f0 1.736 +/* 0x01fc */ bg,pn %icc,.L77000150 1.737 +/* 0x0200 */ std %f0,[%i0+%o0] 1.738 + .L77000154: 1.739 +/* 0x0204 155 */ ldd [%o5],%f0 1.740 + .L900000311: 1.741 +/* 0x0208 154 */ ld [%o7+%o2],%o0 1.742 +/* 0x020c 155 */ sra %g3,0,%o1 1.743 +/* 0x0210 */ fmovs %f0,%f2 1.744 +/* 0x0214 */ sllx %o1,3,%o2 1.745 +/* 0x0218 156 */ add %i2,1,%i2 1.746 +/* 0x021c 155 */ and %o0,%g1,%o1 1.747 +/* 0x0220 */ st %o1,[%sp+2227] 1.748 +/* 0x0224 156 */ add %g3,2,%g3 1.749 +/* 0x0228 */ srl %o0,16,%o1 1.750 +/* 0x022c */ cmp %i2,%g5 1.751 +/* 0x0230 */ sra %g2,0,%o0 1.752 +/* 0x0234 */ add %g2,2,%g2 1.753 +/* 0x0238 */ sllx %o0,3,%o0 1.754 +/* 0x023c 155 */ ld [%sp+2227],%f3 1.755 +/* 0x0240 154 */ sra %i2,0,%o3 1.756 +/* 0x0244 155 */ fsubd %f2,%f0,%f2 1.757 +/* 0x0248 */ std %f2,[%i0+%o2] 1.758 +/* 0x024c */ sllx %o3,2,%o2 1.759 +/* 0x0250 156 */ st %o1,[%sp+2223] 1.760 +/* 0x0254 */ fmovs %f0,%f2 1.761 +/* 0x0258 */ ld [%sp+2223],%f3 1.762 +/* 0x025c */ fsubd %f2,%f0,%f0 1.763 +/* 0x0260 */ std %f0,[%i0+%o0] 1.764 +/* 0x0264 */ ble,a,pt %icc,.L900000311 1.765 +/* 0x0268 */ ldd [%o5],%f0 1.766 + .L77000150: 1.767 +/* 0x026c */ ret ! 
Result = 1.768 +/* 0x0270 */ restore %g0,%g0,%g0 1.769 +/* 0x0274 0 */ .type conv_i32_to_d16,2 1.770 +/* 0x0274 */ .size conv_i32_to_d16,(.-conv_i32_to_d16) 1.771 + 1.772 + .section ".text",#alloc,#execinstr 1.773 +/* 000000 0 */ .align 8 1.774 +! 1.775 +! CONSTANT POOL 1.776 +! 1.777 + .L_const_seg_900000401: 1.778 +/* 000000 0 */ .word 1127219200,0 1.779 +/* 0x0008 0 */ .align 8 1.780 +/* 0x0008 */ .skip 24 1.781 +! 1.782 +! SUBROUTINE conv_i32_to_d32_and_d16 1.783 +! 1.784 +! OFFSET SOURCE LINE LABEL INSTRUCTION 1.785 + 1.786 + .global conv_i32_to_d32_and_d16 1.787 + conv_i32_to_d32_and_d16: 1.788 +/* 000000 */ save %sp,-192,%sp 1.789 + .L900000415: 1.790 +/* 0x0004 */ call .+8 1.791 +/* 0x0008 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000415-.)),%g3 1.792 + 1.793 +! 157 ! } 1.794 +! 158 !} 1.795 +! 161 !void conv_i32_to_d32_and_d16(double *d32, double *d16, 1.796 +! 162 ! unsigned int *i32, int len) 1.797 +! 163 !{ 1.798 +! 164 !int i = 0; 1.799 +! 165 !unsigned int a; 1.800 +! 167 !#pragma pipeloop(0) 1.801 +! 168 !#ifdef RF_INLINE_MACROS 1.802 +! 169 ! for(;i<len-3;i+=4) 1.803 +! 170 ! { 1.804 +! 171 ! i16_to_d16_and_d32x4(&TwoToMinus16, &TwoTo16, &Zero, 1.805 +! 172 ! 
&(d16[2*i]), &(d32[i]), (float *)(&(i32[i]))); 1.806 + 1.807 +/* 0x000c 172 */ sethi %hi(Zero),%g2 1.808 +/* 0x0010 163 */ add %g3,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000415-.)),%g3 1.809 +/* 0x0014 */ or %g0,%i3,%g5 1.810 +/* 0x0018 */ add %g3,%o7,%o3 1.811 +/* 0x001c 172 */ add %g2,%lo(Zero),%g2 1.812 +/* 0x0020 */ ldx [%o3+%g2],%o0 1.813 +/* 0x0024 */ sethi %hi(TwoToMinus16),%g3 1.814 +/* 0x0028 163 */ or %g0,%i0,%i3 1.815 +/* 0x002c 169 */ sub %g5,3,%o1 1.816 +/* 0x0030 172 */ sethi %hi(TwoTo16),%g4 1.817 +/* 0x0034 163 */ or %g0,%i2,%i0 1.818 +/* 0x0038 172 */ add %g3,%lo(TwoToMinus16),%g2 1.819 +/* 0x003c */ ldx [%o3+%g2],%o2 1.820 +/* 0x0040 169 */ cmp %o1,0 1.821 +/* 0x0044 164 */ or %g0,0,%i2 1.822 +/* 0x0048 169 */ ble,pt %icc,.L900000418 1.823 +/* 0x004c */ cmp %i2,%g5 1.824 +/* 0x0050 */ ldd [%o0],%f2 1.825 +/* 0x0054 172 */ add %g4,%lo(TwoTo16),%g3 1.826 +/* 0x0058 */ ldx [%o3+%g3],%o1 1.827 +/* 0x005c 169 */ sub %g5,4,%o4 1.828 +/* 0x0060 */ or %g0,0,%o5 1.829 + .L900000417: 1.830 +/* 0x0064 172 */ sra %i2,0,%g2 1.831 +/* 0x0068 */ fmovd %f2,%f14 1.832 +/* 0x006c */ ldd [%o2],%f0 1.833 +/* 0x0070 */ sllx %g2,2,%g3 1.834 +/* 0x0074 */ fmovd %f2,%f10 1.835 +/* 0x0078 */ ldd [%o1],%f16 1.836 +/* 0x007c */ ld [%g3+%i0],%f15 1.837 +/* 0x0080 */ add %i0,%g3,%g3 1.838 +/* 0x0084 */ fmovd %f2,%f6 1.839 +/* 0x0088 */ ld [%g3+4],%f11 1.840 +/* 0x008c */ sra %o5,0,%g4 1.841 +/* 0x0090 */ add %i2,4,%i2 1.842 +/* 0x0094 */ ld [%g3+8],%f7 1.843 +/* 0x0098 */ fxtod %f14,%f14 1.844 +/* 0x009c */ sllx %g2,3,%g2 1.845 +/* 0x00a0 */ ld [%g3+12],%f3 1.846 +/* 0x00a4 */ fxtod %f10,%f10 1.847 +/* 0x00a8 */ sllx %g4,3,%g3 1.848 +/* 0x00ac */ fxtod %f6,%f6 1.849 +/* 0x00b0 */ std %f14,[%g2+%i3] 1.850 +/* 0x00b4 */ add %i3,%g2,%g4 1.851 +/* 0x00b8 */ fxtod %f2,%f2 1.852 +/* 0x00bc */ fmuld %f0,%f14,%f12 1.853 +/* 0x00c0 */ std %f2,[%g4+24] 1.854 +/* 0x00c4 */ fmuld %f0,%f10,%f8 1.855 +/* 0x00c8 */ std %f10,[%g4+8] 1.856 +/* 0x00cc */ add %i1,%g3,%g2 1.857 +/* 0x00d0 */ fmuld 
%f0,%f6,%f4 1.858 +/* 0x00d4 */ std %f6,[%g4+16] 1.859 +/* 0x00d8 */ cmp %i2,%o4 1.860 +/* 0x00dc */ fmuld %f0,%f2,%f0 1.861 +/* 0x00e0 */ fdtox %f12,%f12 1.862 +/* 0x00e4 */ add %o5,8,%o5 1.863 +/* 0x00e8 */ fdtox %f8,%f8 1.864 +/* 0x00ec */ fdtox %f4,%f4 1.865 +/* 0x00f0 */ fdtox %f0,%f0 1.866 +/* 0x00f4 */ fxtod %f12,%f12 1.867 +/* 0x00f8 */ std %f12,[%g2+8] 1.868 +/* 0x00fc */ fxtod %f8,%f8 1.869 +/* 0x0100 */ std %f8,[%g2+24] 1.870 +/* 0x0104 */ fxtod %f4,%f4 1.871 +/* 0x0108 */ std %f4,[%g2+40] 1.872 +/* 0x010c */ fxtod %f0,%f0 1.873 +/* 0x0110 */ std %f0,[%g2+56] 1.874 +/* 0x0114 */ fmuld %f12,%f16,%f12 1.875 +/* 0x0118 */ fmuld %f8,%f16,%f8 1.876 +/* 0x011c */ fmuld %f4,%f16,%f4 1.877 +/* 0x0120 */ fsubd %f14,%f12,%f12 1.878 +/* 0x0124 */ std %f12,[%g3+%i1] 1.879 +/* 0x0128 */ fmuld %f0,%f16,%f0 1.880 +/* 0x012c */ fsubd %f10,%f8,%f8 1.881 +/* 0x0130 */ std %f8,[%g2+16] 1.882 +/* 0x0134 */ fsubd %f6,%f4,%f4 1.883 +/* 0x0138 */ std %f4,[%g2+32] 1.884 +/* 0x013c */ fsubd %f2,%f0,%f0 1.885 +/* 0x0140 */ std %f0,[%g2+48] 1.886 +/* 0x0144 */ ble,a,pt %icc,.L900000417 1.887 +/* 0x0148 */ ldd [%o0],%f2 1.888 + .L77000159: 1.889 + 1.890 +! 173 ! } 1.891 +! 174 !#endif 1.892 +! 175 ! for(;i<len;i++) 1.893 + 1.894 +/* 0x014c 175 */ cmp %i2,%g5 1.895 + .L900000418: 1.896 +/* 0x0150 175 */ bge,pt %icc,.L77000164 1.897 +/* 0x0154 */ nop 1.898 + 1.899 +! 176 ! { 1.900 +! 177 ! a=i32[i]; 1.901 +! 178 ! d32[i]=(double)(i32[i]); 1.902 +! 179 ! d16[2*i]=(double)(a&0xffff); 1.903 +! 180 ! 
d16[2*i+1]=(double)(a>>16); 1.904 + 1.905 +/* 0x0158 180 */ sethi %hi(.L_const_seg_900000401),%g2 1.906 +/* 0x015c */ add %g2,%lo(.L_const_seg_900000401),%g2 1.907 +/* 0x0160 175 */ sethi %hi(0xfc00),%g3 1.908 +/* 0x0164 180 */ ldx [%o3+%g2],%g1 1.909 +/* 0x0168 175 */ sll %i2,1,%i4 1.910 +/* 0x016c */ sub %g5,%i2,%g4 1.911 +/* 0x0170 177 */ sra %i2,0,%o3 1.912 +/* 0x0174 175 */ add %g3,1023,%g3 1.913 +/* 0x0178 178 */ ldd [%g1],%f2 1.914 +/* 0x017c */ sllx %o3,2,%o2 1.915 +/* 0x0180 175 */ add %i4,1,%g2 1.916 +/* 0x0184 177 */ or %g0,%o3,%o1 1.917 +/* 0x0188 */ cmp %g4,6 1.918 +/* 0x018c 175 */ bl,pn %icc,.L77000161 1.919 +/* 0x0190 */ sra %i2,0,%o3 1.920 +/* 0x0194 177 */ or %g0,%o2,%o0 1.921 +/* 0x0198 178 */ ld [%i0+%o2],%f5 1.922 +/* 0x019c 179 */ fmovs %f2,%f8 1.923 +/* 0x01a0 175 */ add %o0,4,%o3 1.924 +/* 0x01a4 177 */ ld [%i0+%o0],%o7 1.925 +/* 0x01a8 180 */ fmovs %f2,%f6 1.926 +/* 0x01ac 178 */ fmovs %f2,%f4 1.927 +/* 0x01b0 */ sllx %o1,3,%o2 1.928 +/* 0x01b4 175 */ add %o3,4,%o5 1.929 +/* 0x01b8 179 */ sra %i4,0,%o0 1.930 +/* 0x01bc 175 */ add %o3,8,%o4 1.931 +/* 0x01c0 178 */ fsubd %f4,%f2,%f4 1.932 +/* 0x01c4 */ std %f4,[%i3+%o2] 1.933 +/* 0x01c8 179 */ sllx %o0,3,%i5 1.934 +/* 0x01cc */ and %o7,%g3,%o0 1.935 +/* 0x01d0 */ st %o0,[%sp+2227] 1.936 +/* 0x01d4 175 */ add %i5,16,%o1 1.937 +/* 0x01d8 180 */ srl %o7,16,%g4 1.938 +/* 0x01dc */ add %i2,1,%i2 1.939 +/* 0x01e0 */ sra %g2,0,%o0 1.940 +/* 0x01e4 175 */ add %o2,8,%o2 1.941 +/* 0x01e8 179 */ fmovs %f2,%f4 1.942 +/* 0x01ec 180 */ sllx %o0,3,%l0 1.943 +/* 0x01f0 */ add %i4,3,%g2 1.944 +/* 0x01f4 179 */ ld [%sp+2227],%f5 1.945 +/* 0x01f8 175 */ add %l0,16,%o0 1.946 +/* 0x01fc 180 */ add %i4,2,%i4 1.947 +/* 0x0200 175 */ sub %g5,1,%o7 1.948 +/* 0x0204 180 */ add %i2,3,%i2 1.949 +/* 0x0208 179 */ fsubd %f4,%f2,%f4 1.950 +/* 0x020c */ std %f4,[%i1+%i5] 1.951 +/* 0x0210 180 */ st %g4,[%sp+2223] 1.952 +/* 0x0214 177 */ ld [%i0+%o3],%i5 1.953 +/* 0x0218 180 */ fmovs %f2,%f4 1.954 +/* 0x021c */ srl %i5,16,%g4 
1.955 +/* 0x0220 179 */ and %i5,%g3,%i5 1.956 +/* 0x0224 180 */ ld [%sp+2223],%f5 1.957 +/* 0x0228 */ fsubd %f4,%f2,%f4 1.958 +/* 0x022c */ std %f4,[%i1+%l0] 1.959 +/* 0x0230 */ st %g4,[%sp+2223] 1.960 +/* 0x0234 177 */ ld [%i0+%o5],%g4 1.961 +/* 0x0238 179 */ st %i5,[%sp+2227] 1.962 +/* 0x023c 178 */ fmovs %f2,%f4 1.963 +/* 0x0240 180 */ srl %g4,16,%i5 1.964 +/* 0x0244 179 */ and %g4,%g3,%g4 1.965 +/* 0x0248 180 */ ld [%sp+2223],%f7 1.966 +/* 0x024c */ st %i5,[%sp+2223] 1.967 +/* 0x0250 178 */ ld [%i0+%o3],%f5 1.968 +/* 0x0254 180 */ fsubd %f6,%f2,%f6 1.969 +/* 0x0258 177 */ ld [%i0+%o4],%o3 1.970 +/* 0x025c 178 */ fsubd %f4,%f2,%f4 1.971 +/* 0x0260 179 */ ld [%sp+2227],%f9 1.972 +/* 0x0264 180 */ ld [%sp+2223],%f1 1.973 +/* 0x0268 179 */ st %g4,[%sp+2227] 1.974 +/* 0x026c */ fsubd %f8,%f2,%f8 1.975 +/* 0x0270 */ std %f8,[%i1+%o1] 1.976 +/* 0x0274 180 */ std %f6,[%i1+%o0] 1.977 +/* 0x0278 178 */ std %f4,[%i3+%o2] 1.978 + .L900000411: 1.979 +/* 0x027c 179 */ ld [%sp+2227],%f13 1.980 +/* 0x0280 180 */ srl %o3,16,%g4 1.981 +/* 0x0284 */ add %i2,2,%i2 1.982 +/* 0x0288 */ st %g4,[%sp+2223] 1.983 +/* 0x028c */ cmp %i2,%o7 1.984 +/* 0x0290 */ add %g2,4,%g2 1.985 +/* 0x0294 178 */ ld [%i0+%o5],%f11 1.986 +/* 0x0298 180 */ add %i4,4,%i4 1.987 +/* 0x029c 175 */ add %o4,4,%o5 1.988 +/* 0x02a0 177 */ ld [%i0+%o5],%g4 1.989 +/* 0x02a4 179 */ and %o3,%g3,%o3 1.990 +/* 0x02a8 */ st %o3,[%sp+2227] 1.991 +/* 0x02ac 180 */ fmovs %f2,%f0 1.992 +/* 0x02b0 179 */ fmovs %f2,%f12 1.993 +/* 0x02b4 180 */ fsubd %f0,%f2,%f8 1.994 +/* 0x02b8 179 */ fsubd %f12,%f2,%f4 1.995 +/* 0x02bc 175 */ add %o1,16,%o1 1.996 +/* 0x02c0 180 */ ld [%sp+2223],%f7 1.997 +/* 0x02c4 178 */ fmovs %f2,%f10 1.998 +/* 0x02c8 179 */ std %f4,[%i1+%o1] 1.999 +/* 0x02cc 175 */ add %o0,16,%o0 1.1000 +/* 0x02d0 178 */ fsubd %f10,%f2,%f4 1.1001 +/* 0x02d4 175 */ add %o2,8,%o2 1.1002 +/* 0x02d8 180 */ std %f8,[%i1+%o0] 1.1003 +/* 0x02dc 178 */ std %f4,[%i3+%o2] 1.1004 +/* 0x02e0 179 */ ld [%sp+2227],%f9 1.1005 +/* 0x02e4 
180 */ srl %g4,16,%o3 1.1006 +/* 0x02e8 */ st %o3,[%sp+2223] 1.1007 +/* 0x02ec 178 */ ld [%i0+%o4],%f5 1.1008 +/* 0x02f0 175 */ add %o4,8,%o4 1.1009 +/* 0x02f4 177 */ ld [%i0+%o4],%o3 1.1010 +/* 0x02f8 179 */ and %g4,%g3,%g4 1.1011 +/* 0x02fc */ st %g4,[%sp+2227] 1.1012 +/* 0x0300 180 */ fmovs %f2,%f6 1.1013 +/* 0x0304 179 */ fmovs %f2,%f8 1.1014 +/* 0x0308 180 */ fsubd %f6,%f2,%f6 1.1015 +/* 0x030c 179 */ fsubd %f8,%f2,%f8 1.1016 +/* 0x0310 175 */ add %o1,16,%o1 1.1017 +/* 0x0314 180 */ ld [%sp+2223],%f1 1.1018 +/* 0x0318 178 */ fmovs %f2,%f4 1.1019 +/* 0x031c 179 */ std %f8,[%i1+%o1] 1.1020 +/* 0x0320 175 */ add %o0,16,%o0 1.1021 +/* 0x0324 178 */ fsubd %f4,%f2,%f4 1.1022 +/* 0x0328 175 */ add %o2,8,%o2 1.1023 +/* 0x032c 180 */ std %f6,[%i1+%o0] 1.1024 +/* 0x0330 */ bl,pt %icc,.L900000411 1.1025 +/* 0x0334 */ std %f4,[%i3+%o2] 1.1026 + .L900000414: 1.1027 +/* 0x0338 180 */ srl %o3,16,%o7 1.1028 +/* 0x033c */ st %o7,[%sp+2223] 1.1029 +/* 0x0340 179 */ fmovs %f2,%f12 1.1030 +/* 0x0344 178 */ ld [%i0+%o5],%f11 1.1031 +/* 0x0348 180 */ fmovs %f2,%f0 1.1032 +/* 0x034c 179 */ and %o3,%g3,%g4 1.1033 +/* 0x0350 180 */ fmovs %f2,%f6 1.1034 +/* 0x0354 175 */ add %o1,16,%o3 1.1035 +/* 0x0358 */ add %o0,16,%o7 1.1036 +/* 0x035c 178 */ fmovs %f2,%f10 1.1037 +/* 0x0360 175 */ add %o2,8,%o2 1.1038 +/* 0x0364 */ add %o1,32,%o5 1.1039 +/* 0x0368 179 */ ld [%sp+2227],%f13 1.1040 +/* 0x036c 178 */ fmovs %f2,%f4 1.1041 +/* 0x0370 175 */ add %o0,32,%o1 1.1042 +/* 0x0374 180 */ ld [%sp+2223],%f7 1.1043 +/* 0x0378 175 */ add %o2,8,%o0 1.1044 +/* 0x037c 180 */ cmp %i2,%g5 1.1045 +/* 0x0380 179 */ st %g4,[%sp+2227] 1.1046 +/* 0x0384 */ fsubd %f12,%f2,%f8 1.1047 +/* 0x0388 180 */ add %g2,6,%g2 1.1048 +/* 0x038c 179 */ std %f8,[%i1+%o3] 1.1049 +/* 0x0390 180 */ fsubd %f0,%f2,%f0 1.1050 +/* 0x0394 177 */ sra %i2,0,%o3 1.1051 +/* 0x0398 180 */ std %f0,[%i1+%o7] 1.1052 +/* 0x039c 178 */ fsubd %f10,%f2,%f0 1.1053 +/* 0x03a0 180 */ add %i4,6,%i4 1.1054 +/* 0x03a4 178 */ std %f0,[%i3+%o2] 1.1055 
+/* 0x03a8 */ sllx %o3,2,%o2 1.1056 +/* 0x03ac 179 */ ld [%sp+2227],%f9 1.1057 +/* 0x03b0 178 */ ld [%i0+%o4],%f5 1.1058 +/* 0x03b4 179 */ fmovs %f2,%f8 1.1059 +/* 0x03b8 */ fsubd %f8,%f2,%f0 1.1060 +/* 0x03bc */ std %f0,[%i1+%o5] 1.1061 +/* 0x03c0 180 */ fsubd %f6,%f2,%f0 1.1062 +/* 0x03c4 */ std %f0,[%i1+%o1] 1.1063 +/* 0x03c8 178 */ fsubd %f4,%f2,%f0 1.1064 +/* 0x03cc 180 */ bge,pn %icc,.L77000164 1.1065 +/* 0x03d0 */ std %f0,[%i3+%o0] 1.1066 + .L77000161: 1.1067 +/* 0x03d4 178 */ ldd [%g1],%f2 1.1068 + .L900000416: 1.1069 +/* 0x03d8 178 */ ld [%i0+%o2],%f5 1.1070 +/* 0x03dc 179 */ sra %i4,0,%o0 1.1071 +/* 0x03e0 180 */ add %i2,1,%i2 1.1072 +/* 0x03e4 177 */ ld [%i0+%o2],%o1 1.1073 +/* 0x03e8 178 */ sllx %o3,3,%o3 1.1074 +/* 0x03ec 180 */ add %i4,2,%i4 1.1075 +/* 0x03f0 178 */ fmovs %f2,%f4 1.1076 +/* 0x03f4 179 */ sllx %o0,3,%o4 1.1077 +/* 0x03f8 180 */ cmp %i2,%g5 1.1078 +/* 0x03fc 179 */ and %o1,%g3,%o0 1.1079 +/* 0x0400 178 */ fsubd %f4,%f2,%f0 1.1080 +/* 0x0404 */ std %f0,[%i3+%o3] 1.1081 +/* 0x0408 180 */ srl %o1,16,%o1 1.1082 +/* 0x040c 179 */ st %o0,[%sp+2227] 1.1083 +/* 0x0410 180 */ sra %g2,0,%o0 1.1084 +/* 0x0414 */ add %g2,2,%g2 1.1085 +/* 0x0418 177 */ sra %i2,0,%o3 1.1086 +/* 0x041c 180 */ sllx %o0,3,%o0 1.1087 +/* 0x0420 179 */ fmovs %f2,%f4 1.1088 +/* 0x0424 */ sllx %o3,2,%o2 1.1089 +/* 0x0428 */ ld [%sp+2227],%f5 1.1090 +/* 0x042c */ fsubd %f4,%f2,%f0 1.1091 +/* 0x0430 */ std %f0,[%i1+%o4] 1.1092 +/* 0x0434 180 */ st %o1,[%sp+2223] 1.1093 +/* 0x0438 */ fmovs %f2,%f4 1.1094 +/* 0x043c */ ld [%sp+2223],%f5 1.1095 +/* 0x0440 */ fsubd %f4,%f2,%f0 1.1096 +/* 0x0444 */ std %f0,[%i1+%o0] 1.1097 +/* 0x0448 */ bl,a,pt %icc,.L900000416 1.1098 +/* 0x044c */ ldd [%g1],%f2 1.1099 + .L77000164: 1.1100 +/* 0x0450 */ ret ! 
Result = 1.1101 +/* 0x0454 */ restore %g0,%g0,%g0 1.1102 +/* 0x0458 0 */ .type conv_i32_to_d32_and_d16,2 1.1103 +/* 0x0458 */ .size conv_i32_to_d32_and_d16,(.-conv_i32_to_d32_and_d16) 1.1104 + 1.1105 + .section ".text",#alloc,#execinstr 1.1106 +/* 000000 0 */ .align 8 1.1107 +! 1.1108 +! SUBROUTINE adjust_montf_result 1.1109 +! 1.1110 +! OFFSET SOURCE LINE LABEL INSTRUCTION 1.1111 + 1.1112 + /* adjust_montf_result(i32, nint, len): compiler-generated code for the C function quoted in the "!" source-listing comments that follow. nint is subtracted from i32 in place when i32[len] is non-zero, or when a scan from index len-1 down to 0 finds no differing word, or when the first differing word has i32[i] > nint[i]; otherwise i32 is left unchanged. The subtraction works 32 bits at a time with a 64-bit accumulator whose arithmetic right shift by 32 carries the borrow into the next word. Register use after the prologue: %i2 = i32, %o1 = len, %o2 = i, %i1 = nint (also copied to %i0). */ .global adjust_montf_result 1.1113 + adjust_montf_result: 1.1114 +/* 000000 */ save %sp,-176,%sp 1.1115 +/* 0x0004 */ /* len (incoming %i2) is moved to %o1 so that %i2 can hold the i32 pointer */ or %g0,%i2,%o1 1.1116 +/* 0x0008 */ or %g0,%i0,%i2 1.1117 + 1.1118 +! 181 ! } 1.1119 +! 182 !} 1.1120 +! 185 !void adjust_montf_result(unsigned int *i32, unsigned int *nint, int len) 1.1121 +! 186 !{ 1.1122 +! 187 !long long acc; 1.1123 +! 188 !int i; 1.1124 +! 190 ! if(i32[len]>0) i=-1; 1.1125 + 1.1126 +/* 0x000c 190 */ sra %o1,0,%g2 1.1127 +/* 0x0010 */ /* %o2 = i, preset to -1 for the i32[len] > 0 case */ or %g0,-1,%o2 1.1128 +/* 0x0014 */ sllx %g2,2,%g2 1.1129 +/* 0x0018 */ ld [%i2+%g2],%g2 1.1130 +/* 0x001c */ cmp %g2,0 1.1131 +/* 0x0020 */ /* unsigned "<= 0" means i32[len] == 0: go scan the words at .L77000175 */ bleu,pn %icc,.L77000175 1.1132 +/* 0x0024 */ /* delay slot: %i0 = nint; %i1 keeps nint until it is reused as the index of the subtraction loop */ or %g0,%i1,%i0 1.1133 +/* 0x0028 */ ba .L900000511 1.1134 +/* 0x002c */ cmp %o2,0 1.1135 + .L77000175: 1.1136 + 1.1137 +! 191 ! else 1.1138 +! 192 ! { 1.1139 +! 193 ! for(i=len-1; i>=0; i--) 1.1140 + 1.1141 +/* 0x0030 193 */ sub %o1,1,%o2 1.1142 +/* 0x0034 */ cmp %o2,0 1.1143 +/* 0x0038 */ bl,pn %icc,.L77000182 1.1144 +/* 0x003c */ sra %o2,0,%g2 1.1145 + .L900000510: 1.1146 + 1.1147 +! 194 ! { 1.1148 +! 195 ! if(i32[i]!=nint[i]) break; 1.1149 + 1.1150 +/* 0x0040 195 */ sllx %g2,2,%g2 1.1151 +/* 0x0044 */ sub %o2,1,%o0 1.1152 +/* 0x0048 */ ld [%i1+%g2],%g3 1.1153 +/* 0x004c */ ld [%i2+%g2],%g2 1.1154 +/* 0x0050 */ cmp %g2,%g3 1.1155 +/* 0x0054 */ bne,pn %icc,.L77000182 1.1156 +/* 0x0058 */ nop 1.1157 +/* 0x005c 0 */ or %g0,%o0,%o2 1.1158 +/* 0x0060 195 */ cmp %o0,0 1.1159 +/* 0x0064 */ bge,pt %icc,.L900000510 1.1160 +/* 0x0068 */ sra %o2,0,%g2 1.1161 + .L77000182: 1.1162 + 1.1163 +! 196 ! } 1.1164 +! 197 ! } 1.1165 +! 198 !
if((i<0)||(i32[i]>nint[i])) 1.1166 + 1.1167 +/* 0x006c 198 */ cmp %o2,0 1.1168 + .L900000511: 1.1169 +/* 0x0070 198 */ /* i < 0 goes straight to the subtraction at .L77000198 */ bl,pn %icc,.L77000198 1.1170 +/* 0x0074 */ sra %o2,0,%g2 1.1171 +/* 0x0078 */ sllx %g2,2,%g2 1.1172 +/* 0x007c */ ld [%i1+%g2],%g3 1.1173 +/* 0x0080 */ ld [%i2+%g2],%g2 1.1174 +/* 0x0084 */ cmp %g2,%g3 1.1175 +/* 0x0088 */ /* unsigned i32[i] <= nint[i]: nothing to subtract, return */ bleu,pt %icc,.L77000191 1.1176 +/* 0x008c */ nop 1.1177 + .L77000198: 1.1178 + 1.1179 +! 199 ! { 1.1180 +! 200 ! acc=0; 1.1181 +! 201 ! for(i=0;i<len;i++) 1.1182 + 1.1183 +/* 0x0090 201 */ cmp %o1,0 1.1184 +/* 0x0094 */ ble,pt %icc,.L77000191 1.1185 +/* 0x0098 */ nop 1.1186 +/* 0x009c 198 */ /* together with the srl below: %g2 = 0xffffffff, the mask for acc&0xffffffff */ or %g0,-1,%g2 1.1187 +/* 0x00a0 201 */ or %g0,%o1,%g3 1.1188 +/* 0x00a4 198 */ srl %g2,0,%g2 1.1189 +/* 0x00a8 */ /* %g4 = len-1, the last index, used by the loop-exit compares */ sub %o1,1,%g4 1.1190 +/* 0x00ac */ /* len < 9 takes the one-word-per-iteration loop (branch at 0x00bc) */ cmp %o1,9 1.1191 +/* 0x00b0 201 */ /* %i1 is reused as the index i from here on; nint is addressed through %i0 */ or %g0,0,%i1 1.1192 +/* 0x00b4 200 */ /* %g5 = acc = 0 */ or %g0,0,%g5 1.1193 + 1.1194 +! 202 ! { 1.1195 +! 203 ! acc=acc+(unsigned long long)(i32[i])-(unsigned long long)(nint[i]); 1.1196 + 1.1197 +/* 0x00b8 203 */ or %g0,0,%o1 1.1198 +/* 0x00bc 201 */ bl,pn %icc,.L77000199 1.1199 +/* 0x00c0 */ sub %g3,4,%o7 1.1200 +/* 0x00c4 203 */ ld [%i2],%o1 1.1201 + 1.1202 +! 204 ! i32[i]=acc&0xffffffff; 1.1203 +! 205 !
acc=acc>>32; 1.1204 + 1.1205 +/* 0x00c8 205 */ /* unrolled path: words 0 and 1 are stored before the loop; %o5/%o4/%g1 hold byte offsets 8/12/16 */ or %g0,5,%i1 1.1206 +/* 0x00cc 203 */ ld [%i0],%o2 1.1207 +/* 0x00d0 201 */ or %g0,8,%o5 1.1208 +/* 0x00d4 */ or %g0,12,%o4 1.1209 +/* 0x00d8 203 */ ld [%i0+4],%o3 1.1210 +/* 0x00dc 201 */ or %g0,16,%g1 1.1211 +/* 0x00e0 203 */ ld [%i2+4],%o0 1.1212 +/* 0x00e4 201 */ sub %o1,%o2,%o1 1.1213 +/* 0x00e8 203 */ ld [%i0+8],%i3 1.1214 +/* 0x00ec 204 */ and %o1,%g2,%g5 1.1215 +/* 0x00f0 */ st %g5,[%i2] 1.1216 +/* 0x00f4 205 */ srax %o1,32,%g5 1.1217 +/* 0x00f8 201 */ sub %o0,%o3,%o0 1.1218 +/* 0x00fc 203 */ ld [%i0+12],%o2 1.1219 +/* 0x0100 201 */ add %o0,%g5,%o0 1.1220 +/* 0x0104 204 */ and %o0,%g2,%g5 1.1221 +/* 0x0108 */ st %g5,[%i2+4] 1.1222 +/* 0x010c 205 */ srax %o0,32,%o0 1.1223 +/* 0x0110 203 */ ld [%i2+8],%o1 1.1224 +/* 0x0114 */ ld [%i2+12],%o3 1.1225 +/* 0x0118 201 */ sub %o1,%i3,%o1 1.1226 + /* unrolled loop: four words per iteration (%i1 += 4, %g1 += 16); repeats while %i1 <= %o7 (len-4) */ .L900000505: 1.1227 +/* 0x011c */ add %g1,4,%g3 1.1228 +/* 0x0120 203 */ ld [%g1+%i2],%g5 1.1229 +/* 0x0124 201 */ add %o1,%o0,%o0 1.1230 +/* 0x0128 203 */ ld [%i0+%g1],%i3 1.1231 +/* 0x012c 201 */ sub %o3,%o2,%o1 1.1232 +/* 0x0130 204 */ and %o0,%g2,%o2 1.1233 +/* 0x0134 */ st %o2,[%o5+%i2] 1.1234 +/* 0x0138 205 */ srax %o0,32,%o2 1.1235 +/* 0x013c */ add %i1,4,%i1 1.1236 +/* 0x0140 201 */ add %g1,8,%o5 1.1237 +/* 0x0144 203 */ ld [%g3+%i2],%o0 1.1238 +/* 0x0148 201 */ add %o1,%o2,%o1 1.1239 +/* 0x014c 203 */ ld [%i0+%g3],%o3 1.1240 +/* 0x0150 201 */ sub %g5,%i3,%o2 1.1241 +/* 0x0154 204 */ and %o1,%g2,%g5 1.1242 +/* 0x0158 */ st %g5,[%o4+%i2] 1.1243 +/* 0x015c 205 */ srax %o1,32,%g5 1.1244 +/* 0x0160 */ cmp %i1,%o7 1.1245 +/* 0x0164 201 */ add %g1,12,%o4 1.1246 +/* 0x0168 203 */ ld [%o5+%i2],%o1 1.1247 +/* 0x016c 201 */ add %o2,%g5,%o2 1.1248 +/* 0x0170 203 */ ld [%i0+%o5],%i3 1.1249 +/* 0x0174 201 */ sub %o0,%o3,%o0 1.1250 +/* 0x0178 204 */ and %o2,%g2,%o3 1.1251 +/* 0x017c */ st %o3,[%g1+%i2] 1.1252 +/* 0x0180 205 */ srax %o2,32,%g5 1.1253 +/* 0x0184 203 */ ld [%o4+%i2],%o3 1.1254 +/* 0x0188 201 */ add %g1,16,%g1 1.1255
+/* 0x018c */ add %o0,%g5,%o0 1.1256 +/* 0x0190 203 */ ld [%i0+%o4],%o2 1.1257 +/* 0x0194 201 */ sub %o1,%i3,%o1 1.1258 +/* 0x0198 204 */ and %o0,%g2,%g5 1.1259 +/* 0x019c */ st %g5,[%g3+%i2] 1.1260 +/* 0x01a0 205 */ ble,pt %icc,.L900000505 1.1261 +/* 0x01a4 */ srax %o0,32,%o0 1.1262 + /* loop exit: completes the words whose loads were already issued (stores at offsets %o5, %o4 and %g1) and leaves the carry in %g5; returns if %i1 > %g4 (len-1), otherwise continues in the single-word loop with %o1 = 4*i */ .L900000508: 1.1263 +/* 0x01a8 */ add %o1,%o0,%g3 1.1264 +/* 0x01ac */ sub %o3,%o2,%o1 1.1265 +/* 0x01b0 203 */ ld [%g1+%i2],%o0 1.1266 +/* 0x01b4 */ ld [%i0+%g1],%o2 1.1267 +/* 0x01b8 205 */ srax %g3,32,%o7 1.1268 +/* 0x01bc 204 */ and %g3,%g2,%o3 1.1269 +/* 0x01c0 201 */ add %o1,%o7,%o1 1.1270 +/* 0x01c4 204 */ st %o3,[%o5+%i2] 1.1271 +/* 0x01c8 205 */ cmp %i1,%g4 1.1272 +/* 0x01cc 201 */ sub %o0,%o2,%o0 1.1273 +/* 0x01d0 204 */ and %o1,%g2,%o2 1.1274 +/* 0x01d4 */ st %o2,[%o4+%i2] 1.1275 +/* 0x01d8 205 */ srax %o1,32,%o1 1.1276 +/* 0x01dc 203 */ sra %i1,0,%o2 1.1277 +/* 0x01e0 201 */ add %o0,%o1,%o0 1.1278 +/* 0x01e4 205 */ srax %o0,32,%g5 1.1279 +/* 0x01e8 204 */ and %o0,%g2,%o1 1.1280 +/* 0x01ec */ st %o1,[%g1+%i2] 1.1281 +/* 0x01f0 205 */ bg,pn %icc,.L77000191 1.1282 +/* 0x01f4 */ sllx %o2,2,%o1 1.1283 + .L77000199: 1.1284 +/* 0x01f8 0 */ or %g0,%o1,%g1 1.1285 + /* single-word loop: acc = %g5 + i32[i] - nint[i]; the low 32 bits are stored back to i32[i] and %g5 = acc >> 32 (srax); repeats while %i1 <= %g4 (len-1) */ .L900000509: 1.1286 +/* 0x01fc 203 */ ld [%o1+%i2],%o0 1.1287 +/* 0x0200 205 */ add %i1,1,%i1 1.1288 +/* 0x0204 203 */ ld [%i0+%o1],%o1 1.1289 +/* 0x0208 */ sra %i1,0,%o2 1.1290 +/* 0x020c 205 */ cmp %i1,%g4 1.1291 +/* 0x0210 203 */ add %g5,%o0,%o0 1.1292 +/* 0x0214 */ sub %o0,%o1,%o0 1.1293 +/* 0x0218 205 */ srax %o0,32,%g5 1.1294 +/* 0x021c 204 */ and %o0,%g2,%o1 1.1295 +/* 0x0220 */ st %o1,[%g1+%i2] 1.1296 +/* 0x0224 */ sllx %o2,2,%o1 1.1297 +/* 0x0228 205 */ ble,pt %icc,.L900000509 1.1298 +/* 0x022c */ or %g0,%o1,%g1 1.1299 + .L77000191: 1.1300 +/* 0x0230 */ ret !
Result = 1.1301 +/* 0x0234 */ /* restore undoes the register window opened by save at entry; the C function is void, so no result is produced */ restore %g0,%g0,%g0 1.1302 +/* 0x0238 0 */ .type adjust_montf_result,2 1.1303 +/* 0x0238 */ .size adjust_montf_result,(.-adjust_montf_result) 1.1304 + 1.1305 + .section ".text",#alloc,#execinstr 1.1306 +/* 000000 0 */ .align 8 1.1307 +/* 000000 */ .skip 24 1.1308 +! 1.1309 +! SUBROUTINE mont_mulf_noconv 1.1310 +! 1.1311 +! OFFSET SOURCE LINE LABEL INSTRUCTION 1.1312 + 1.1313 + .global mont_mulf_noconv 1.1314 + mont_mulf_noconv: 1.1315 +/* 000000 */ save %sp,-224,%sp 1.1316 + .L900000643: 1.1317 +/* 0x0004 */ call .+8 1.1318 +/* 0x0008 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000643-.)),%g5 1.1319 +/* 0x000c */ ldx [%fp+2223],%l0 1.1320 + 1.1321 +! 206 ! } 1.1322 +! 207 ! } 1.1323 +! 208 !} 1.1324 +! 213 !/* 1.1325 +! 214 !** the lengths of the input arrays should be at least the following: 1.1326 +! 215 !** result[nlen+1], dm1[nlen], dm2[2*nlen+1], dt[4*nlen+2], dn[nlen], nint[nlen] 1.1327 +! 216 !** all of them should be different from one another 1.1328 +! 217 !** 1.1329 +! 218 !*/ 1.1330 +! 219 !void mont_mulf_noconv(unsigned int *result, 1.1331 +! 220 ! double *dm1, double *dm2, double *dt, 1.1332 +! 221 ! double *dn, unsigned int *nint, 1.1333 +! 222 ! int nlen, double dn0) 1.1334 +! 223 !{ 1.1335 +! 224 ! int i, j, jj; 1.1336 +! 225 ! int tmp; 1.1337 +! 226 ! double digit, m2j, nextm2j, a, b; 1.1338 +! 227 ! double *dptmp, *pdm1, *pdm2, *pdn, *pdtj, pdn_0, pdm1_0; 1.1339 +! 229 ! pdm1=&(dm1[0]); 1.1340 +! 230 ! pdm2=&(dm2[0]); 1.1341 +! 231 ! pdn=&(dn[0]); 1.1342 +! 232 ! pdm2[2*nlen]=Zero; 1.1343 + 1.1344 +/* 0x0010 232 */ sethi %hi(Zero),%g2 1.1345 +/* 0x0014 223 */ fmovd %f14,%f30 1.1346 +/* 0x0018 */ add %g5,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000643-.)),%g5 1.1347 +/* 0x001c 232 */ add %g2,%lo(Zero),%g2 1.1348 +/* 0x0020 */ sll %l0,1,%o3 1.1349 +/* 0x0024 223 */ add %g5,%o7,%o4 1.1350 +/* 0x0028 232 */ sra %o3,0,%g5 1.1351 +/* 0x002c */ ldx [%o4+%g2],%o7 1.1352 + 1.1353 +! 234 ! if (nlen!=16) 1.1354 +! 235 !
{ 1.1355 +! 236 ! for(i=0;i<4*nlen+2;i++) dt[i]=Zero; 1.1356 +! 238 ! a=dt[0]=pdm1[0]*pdm2[0]; 1.1357 +! 239 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16); 1.1358 + 1.1359 +/* 0x0030 239 */ sethi %hi(TwoToMinus16),%g3 1.1360 +/* 0x0034 */ sethi %hi(TwoTo16),%g4 1.1361 +/* 0x0038 */ add %g3,%lo(TwoToMinus16),%g2 1.1362 +/* 0x003c 232 */ ldd [%o7],%f0 1.1363 +/* 0x0040 239 */ add %g4,%lo(TwoTo16),%g3 1.1364 +/* 0x0044 223 */ or %g0,%i4,%o0 1.1365 +/* 0x0048 232 */ sllx %g5,3,%g4 1.1366 +/* 0x004c 239 */ ldx [%o4+%g2],%o5 1.1367 +/* 0x0050 223 */ or %g0,%i5,%l3 1.1368 +/* 0x0054 */ or %g0,%i0,%l2 1.1369 +/* 0x0058 239 */ ldx [%o4+%g3],%o4 1.1370 +/* 0x005c 234 */ cmp %l0,16 1.1371 +/* 0x0060 232 */ std %f0,[%i2+%g4] 1.1372 +/* 0x0064 234 */ be,pn %icc,.L77000279 1.1373 +/* 0x0068 */ or %g0,%i3,%l4 1.1374 +/* 0x006c 236 */ sll %l0,2,%g2 1.1375 +/* 0x0070 223 */ or %g0,%o0,%i5 1.1376 +/* 0x0074 236 */ add %g2,2,%o0 1.1377 +/* 0x0078 223 */ or %g0,%i1,%i4 1.1378 +/* 0x007c 236 */ cmp %o0,0 1.1379 +/* 0x0080 223 */ or %g0,%i2,%l1 1.1380 +/* 0x0084 236 */ ble,a,pt %icc,.L900000657 1.1381 +/* 0x0088 */ ldd [%i1],%f6 1.1382 + 1.1383 +! 241 ! pdtj=&(dt[0]); 1.1384 +! 242 ! for(j=jj=0;j<2*nlen;j++,jj++,pdtj++) 1.1385 +! 243 ! { 1.1386 +! 244 ! m2j=pdm2[j]; 1.1387 +! 245 ! a=pdtj[0]+pdn[0]*digit; 1.1388 +! 246 ! b=pdtj[1]+pdm1[0]*pdm2[j+1]+a*TwoToMinus16; 1.1389 +! 247 ! pdtj[1]=b; 1.1390 +! 249 !#pragma pipeloop(0) 1.1391 +! 250 ! for(i=1;i<nlen;i++) 1.1392 +! 251 ! { 1.1393 +! 252 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit; 1.1394 +! 253 ! } 1.1395 +! 254 ! if((jj==30)) {cleanup(dt,j/2+1,2*nlen+1); jj=0;} 1.1396 +! 255 ! 1.1397 +! 256 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16); 1.1398 +! 257 ! } 1.1399 +! 258 ! } 1.1400 +! 259 ! else 1.1401 +! 260 ! { 1.1402 +! 261 ! a=dt[0]=pdm1[0]*pdm2[0]; 1.1403 +! 263 ! dt[65]= dt[64]= dt[63]= dt[62]= dt[61]= dt[60]= 1.1404 +! 264 ! dt[59]= dt[58]= dt[57]= dt[56]= dt[55]= dt[54]= 1.1405 +! 265 ! 
dt[53]= dt[52]= dt[51]= dt[50]= dt[49]= dt[48]= 1.1406 +! 266 ! dt[47]= dt[46]= dt[45]= dt[44]= dt[43]= dt[42]= 1.1407 +! 267 ! dt[41]= dt[40]= dt[39]= dt[38]= dt[37]= dt[36]= 1.1408 +! 268 ! dt[35]= dt[34]= dt[33]= dt[32]= dt[31]= dt[30]= 1.1409 +! 269 ! dt[29]= dt[28]= dt[27]= dt[26]= dt[25]= dt[24]= 1.1410 +! 270 ! dt[23]= dt[22]= dt[21]= dt[20]= dt[19]= dt[18]= 1.1411 +! 271 ! dt[17]= dt[16]= dt[15]= dt[14]= dt[13]= dt[12]= 1.1412 +! 272 ! dt[11]= dt[10]= dt[ 9]= dt[ 8]= dt[ 7]= dt[ 6]= 1.1413 +! 273 ! dt[ 5]= dt[ 4]= dt[ 3]= dt[ 2]= dt[ 1]=Zero; 1.1414 +! 275 ! pdn_0=pdn[0]; 1.1415 +! 276 ! pdm1_0=pdm1[0]; 1.1416 +! 278 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16); 1.1417 +! 279 ! pdtj=&(dt[0]); 1.1418 +! 281 ! for(j=0;j<32;j++,pdtj++) 1.1419 + 1.1420 +/* 0x008c 281 */ or %g0,%o0,%o1 1.1421 +/* 0x0090 236 */ sub %o0,1,%g1 1.1422 +/* 0x0094 */ or %g0,0,%g2 1.1423 +/* 0x0098 281 */ cmp %o1,5 1.1424 +/* 0x009c */ bl,pn %icc,.L77000280 1.1425 +/* 0x00a0 */ or %g0,8,%o0 1.1426 +/* 0x00a4 */ std %f0,[%i3] 1.1427 +/* 0x00a8 */ or %g0,2,%g2 1.1428 +/* 0x00ac */ sub %g1,2,%o1 1.1429 + .L900000627: 1.1430 +/* 0x00b0 */ add %o0,8,%g3 1.1431 +/* 0x00b4 */ std %f0,[%i3+%o0] 1.1432 +/* 0x00b8 */ add %g2,3,%g2 1.1433 +/* 0x00bc */ add %o0,16,%o2 1.1434 +/* 0x00c0 */ std %f0,[%i3+%g3] 1.1435 +/* 0x00c4 */ cmp %g2,%o1 1.1436 +/* 0x00c8 */ add %o0,24,%o0 1.1437 +/* 0x00cc */ ble,pt %icc,.L900000627 1.1438 +/* 0x00d0 */ std %f0,[%i3+%o2] 1.1439 + .L900000630: 1.1440 +/* 0x00d4 */ cmp %g2,%g1 1.1441 +/* 0x00d8 */ bg,pn %icc,.L77000285 1.1442 +/* 0x00dc */ std %f0,[%i3+%o0] 1.1443 + .L77000280: 1.1444 +/* 0x00e0 */ ldd [%o7],%f0 1.1445 + .L900000656: 1.1446 +/* 0x00e4 */ sra %g2,0,%o0 1.1447 +/* 0x00e8 */ add %g2,1,%g2 1.1448 +/* 0x00ec */ sllx %o0,3,%o0 1.1449 +/* 0x00f0 */ cmp %g2,%g1 1.1450 +/* 0x00f4 */ std %f0,[%i3+%o0] 1.1451 +/* 0x00f8 */ ble,a,pt %icc,.L900000656 1.1452 +/* 0x00fc */ ldd [%o7],%f0 1.1453 + .L77000285: 1.1454 +/* 0x0100 238 */ ldd [%i1],%f6 1.1455 
+ .L900000657: 1.1456 +/* 0x0104 238 */ ldd [%i2],%f8 1.1457 +/* 0x0108 242 */ cmp %o3,0 1.1458 +/* 0x010c */ sub %o3,1,%o1 1.1459 +/* 0x0110 239 */ ldd [%o7],%f10 1.1460 +/* 0x0114 */ add %o3,1,%o2 1.1461 +/* 0x0118 0 */ or %g0,0,%i2 1.1462 +/* 0x011c 238 */ fmuld %f6,%f8,%f6 1.1463 +/* 0x0120 */ std %f6,[%i3] 1.1464 +/* 0x0124 0 */ or %g0,0,%g3 1.1465 +/* 0x0128 239 */ ldd [%o5],%f8 1.1466 +/* 0x012c 0 */ or %g0,%o2,%g1 1.1467 +/* 0x0130 236 */ sub %l0,1,%i1 1.1468 +/* 0x0134 239 */ ldd [%o4],%f12 1.1469 +/* 0x0138 236 */ or %g0,1,%g4 1.1470 +/* 0x013c */ fdtox %f6,%f0 1.1471 +/* 0x0140 */ fmovs %f10,%f0 1.1472 +/* 0x0144 */ fxtod %f0,%f6 1.1473 +/* 0x0148 239 */ fmuld %f6,%f14,%f6 1.1474 +/* 0x014c */ fmuld %f6,%f8,%f8 1.1475 +/* 0x0150 */ fdtox %f8,%f8 1.1476 +/* 0x0154 */ fxtod %f8,%f8 1.1477 +/* 0x0158 */ fmuld %f8,%f12,%f8 1.1478 +/* 0x015c */ fsubd %f6,%f8,%f20 1.1479 +/* 0x0160 242 */ ble,pt %icc,.L900000650 1.1480 +/* 0x0164 */ sllx %g5,3,%g2 1.1481 +/* 0x0168 0 */ st %o1,[%sp+2223] 1.1482 +/* 0x016c 246 */ ldd [%i5],%f6 1.1483 + .L900000651: 1.1484 +/* 0x0170 246 */ sra %g4,0,%g2 1.1485 +/* 0x0174 */ fmuld %f6,%f20,%f6 1.1486 +/* 0x0178 */ ldd [%i3],%f12 1.1487 +/* 0x017c */ sllx %g2,3,%g2 1.1488 +/* 0x0180 */ ldd [%i4],%f8 1.1489 +/* 0x0184 250 */ cmp %l0,1 1.1490 +/* 0x0188 246 */ ldd [%l1+%g2],%f10 1.1491 +/* 0x018c 244 */ sra %i2,0,%g2 1.1492 +/* 0x0190 */ add %i2,1,%i0 1.1493 +/* 0x0194 246 */ faddd %f12,%f6,%f6 1.1494 +/* 0x0198 */ ldd [%o5],%f12 1.1495 +/* 0x019c 244 */ sllx %g2,3,%g2 1.1496 +/* 0x01a0 246 */ fmuld %f8,%f10,%f8 1.1497 +/* 0x01a4 */ ldd [%i3+8],%f10 1.1498 +/* 0x01a8 */ srl %i2,31,%o3 1.1499 +/* 0x01ac 244 */ ldd [%l1+%g2],%f18 1.1500 +/* 0x01b0 0 */ or %g0,1,%l5 1.1501 +/* 0x01b4 236 */ or %g0,2,%g2 1.1502 +/* 0x01b8 246 */ fmuld %f6,%f12,%f6 1.1503 +/* 0x01bc 250 */ or %g0,32,%o1 1.1504 +/* 0x01c0 */ or %g0,48,%o2 1.1505 +/* 0x01c4 246 */ faddd %f10,%f8,%f8 1.1506 +/* 0x01c8 */ faddd %f8,%f6,%f16 1.1507 +/* 0x01cc 250 */ ble,pn 
%icc,.L77000213 1.1508 +/* 0x01d0 */ std %f16,[%i3+8] 1.1509 +/* 0x01d4 */ cmp %i1,8 1.1510 +/* 0x01d8 */ sub %l0,3,%o3 1.1511 +/* 0x01dc */ bl,pn %icc,.L77000284 1.1512 +/* 0x01e0 */ or %g0,8,%o0 1.1513 +/* 0x01e4 252 */ ldd [%i5+8],%f0 1.1514 +/* 0x01e8 */ or %g0,6,%l5 1.1515 +/* 0x01ec */ ldd [%i4+8],%f2 1.1516 +/* 0x01f0 */ or %g0,4,%g2 1.1517 +/* 0x01f4 250 */ or %g0,40,%o0 1.1518 +/* 0x01f8 252 */ ldd [%i5+16],%f8 1.1519 +/* 0x01fc */ fmuld %f0,%f20,%f10 1.1520 +/* 0x0200 */ ldd [%i4+16],%f4 1.1521 +/* 0x0204 */ fmuld %f2,%f18,%f2 1.1522 +/* 0x0208 */ ldd [%i3+16],%f0 1.1523 +/* 0x020c */ fmuld %f8,%f20,%f12 1.1524 +/* 0x0210 */ ldd [%i4+24],%f6 1.1525 +/* 0x0214 */ fmuld %f4,%f18,%f4 1.1526 +/* 0x0218 */ ldd [%i5+24],%f8 1.1527 +/* 0x021c */ faddd %f2,%f10,%f2 1.1528 +/* 0x0220 */ ldd [%i4+32],%f14 1.1529 +/* 0x0224 */ fmuld %f6,%f18,%f10 1.1530 +/* 0x0228 */ ldd [%i5+32],%f6 1.1531 +/* 0x022c */ faddd %f4,%f12,%f4 1.1532 +/* 0x0230 */ ldd [%i4+40],%f12 1.1533 +/* 0x0234 */ faddd %f0,%f2,%f0 1.1534 +/* 0x0238 */ std %f0,[%i3+16] 1.1535 +/* 0x023c */ ldd [%i3+32],%f0 1.1536 +/* 0x0240 */ ldd [%i3+48],%f2 1.1537 + .L900000639: 1.1538 +/* 0x0244 */ add %o2,16,%l6 1.1539 +/* 0x0248 252 */ ldd [%i5+%o0],%f22 1.1540 +/* 0x024c */ add %l5,3,%l5 1.1541 +/* 0x0250 */ fmuld %f8,%f20,%f8 1.1542 +/* 0x0254 250 */ add %o0,8,%o0 1.1543 +/* 0x0258 252 */ ldd [%l6+%i3],%f26 1.1544 +/* 0x025c */ cmp %l5,%o3 1.1545 +/* 0x0260 */ ldd [%i4+%o0],%f24 1.1546 +/* 0x0264 */ faddd %f0,%f4,%f0 1.1547 +/* 0x0268 */ add %g2,6,%g2 1.1548 +/* 0x026c */ faddd %f10,%f8,%f10 1.1549 +/* 0x0270 */ fmuld %f14,%f18,%f4 1.1550 +/* 0x0274 */ std %f0,[%o1+%i3] 1.1551 +/* 0x0278 250 */ add %o2,32,%o1 1.1552 +/* 0x027c 252 */ ldd [%i5+%o0],%f8 1.1553 +/* 0x0280 */ fmuld %f6,%f20,%f6 1.1554 +/* 0x0284 250 */ add %o0,8,%o0 1.1555 +/* 0x0288 252 */ ldd [%o1+%i3],%f0 1.1556 +/* 0x028c */ ldd [%i4+%o0],%f14 1.1557 +/* 0x0290 */ faddd %f2,%f10,%f2 1.1558 +/* 0x0294 */ faddd %f4,%f6,%f10 1.1559 +/* 0x0298 
*/ fmuld %f12,%f18,%f4 1.1560 +/* 0x029c */ std %f2,[%o2+%i3] 1.1561 +/* 0x02a0 250 */ add %o2,48,%o2 1.1562 +/* 0x02a4 252 */ ldd [%i5+%o0],%f6 1.1563 +/* 0x02a8 */ fmuld %f22,%f20,%f22 1.1564 +/* 0x02ac 250 */ add %o0,8,%o0 1.1565 +/* 0x02b0 252 */ ldd [%o2+%i3],%f2 1.1566 +/* 0x02b4 */ ldd [%i4+%o0],%f12 1.1567 +/* 0x02b8 */ faddd %f26,%f10,%f10 1.1568 +/* 0x02bc */ std %f10,[%l6+%i3] 1.1569 +/* 0x02c0 */ fmuld %f24,%f18,%f10 1.1570 +/* 0x02c4 */ ble,pt %icc,.L900000639 1.1571 +/* 0x02c8 */ faddd %f4,%f22,%f4 1.1572 + .L900000642: 1.1573 +/* 0x02cc 252 */ fmuld %f8,%f20,%f24 1.1574 +/* 0x02d0 */ faddd %f0,%f4,%f8 1.1575 +/* 0x02d4 250 */ add %o2,16,%o3 1.1576 +/* 0x02d8 252 */ ldd [%o3+%i3],%f4 1.1577 +/* 0x02dc */ fmuld %f14,%f18,%f0 1.1578 +/* 0x02e0 */ cmp %l5,%i1 1.1579 +/* 0x02e4 */ std %f8,[%o1+%i3] 1.1580 +/* 0x02e8 */ fmuld %f12,%f18,%f8 1.1581 +/* 0x02ec 250 */ add %o2,32,%o1 1.1582 +/* 0x02f0 252 */ faddd %f10,%f24,%f12 1.1583 +/* 0x02f4 */ ldd [%i5+%o0],%f22 1.1584 +/* 0x02f8 */ fmuld %f6,%f20,%f6 1.1585 +/* 0x02fc */ add %g2,8,%g2 1.1586 +/* 0x0300 */ fmuld %f22,%f20,%f10 1.1587 +/* 0x0304 */ faddd %f2,%f12,%f2 1.1588 +/* 0x0308 */ faddd %f0,%f6,%f6 1.1589 +/* 0x030c */ ldd [%o1+%i3],%f0 1.1590 +/* 0x0310 */ std %f2,[%o2+%i3] 1.1591 +/* 0x0314 */ faddd %f8,%f10,%f2 1.1592 +/* 0x0318 */ sra %l5,0,%o2 1.1593 +/* 0x031c */ sllx %o2,3,%o0 1.1594 +/* 0x0320 */ faddd %f4,%f6,%f4 1.1595 +/* 0x0324 */ std %f4,[%o3+%i3] 1.1596 +/* 0x0328 */ faddd %f0,%f2,%f0 1.1597 +/* 0x032c */ std %f0,[%o1+%i3] 1.1598 +/* 0x0330 */ bg,a,pn %icc,.L77000213 1.1599 +/* 0x0334 */ srl %i2,31,%o3 1.1600 + .L77000284: 1.1601 +/* 0x0338 252 */ ldd [%i4+%o0],%f2 1.1602 + .L900000655: 1.1603 +/* 0x033c 252 */ ldd [%i5+%o0],%f0 1.1604 +/* 0x0340 */ fmuld %f2,%f18,%f2 1.1605 +/* 0x0344 */ sra %g2,0,%o0 1.1606 +/* 0x0348 */ sllx %o0,3,%o1 1.1607 +/* 0x034c */ add %l5,1,%l5 1.1608 +/* 0x0350 */ fmuld %f0,%f20,%f4 1.1609 +/* 0x0354 */ ldd [%o1+%i3],%f0 1.1610 +/* 0x0358 */ sra %l5,0,%o2 
1.1611 +/* 0x035c */ sllx %o2,3,%o0 1.1612 +/* 0x0360 */ add %g2,2,%g2 1.1613 +/* 0x0364 */ cmp %l5,%i1 1.1614 +/* 0x0368 */ faddd %f2,%f4,%f2 1.1615 +/* 0x036c */ faddd %f0,%f2,%f0 1.1616 +/* 0x0370 */ std %f0,[%o1+%i3] 1.1617 +/* 0x0374 */ ble,a,pt %icc,.L900000655 1.1618 +/* 0x0378 */ ldd [%i4+%o0],%f2 1.1619 + .L900000626: 1.1620 +/* 0x037c */ srl %i2,31,%o3 1.1621 +/* 0x0380 252 */ ba .L900000654 1.1622 +/* 0x0384 */ cmp %g3,30 1.1623 + .L77000213: 1.1624 +/* 0x0388 254 */ cmp %g3,30 1.1625 + .L900000654: 1.1626 +/* 0x038c */ add %i2,%o3,%o0 1.1627 +/* 0x0390 254 */ bne,a,pt %icc,.L900000653 1.1628 +/* 0x0394 */ fdtox %f16,%f0 1.1629 +/* 0x0398 281 */ sra %o0,1,%g2 1.1630 +/* 0x039c */ add %g2,1,%g2 1.1631 +/* 0x03a0 */ ldd [%o7],%f0 1.1632 +/* 0x03a4 */ sll %g2,1,%o1 1.1633 +/* 0x03a8 */ sll %g1,1,%g2 1.1634 +/* 0x03ac */ or %g0,%o1,%o2 1.1635 +/* 0x03b0 */ fmovd %f0,%f2 1.1636 +/* 0x03b4 */ or %g0,%g2,%o0 1.1637 +/* 0x03b8 */ cmp %o1,%o0 1.1638 +/* 0x03bc */ sub %g2,1,%o0 1.1639 +/* 0x03c0 */ bge,pt %icc,.L77000215 1.1640 +/* 0x03c4 */ or %g0,0,%g3 1.1641 +/* 0x03c8 254 */ add %o1,1,%o1 1.1642 +/* 0x03cc 281 */ sra %o2,0,%g2 1.1643 + .L900000652: 1.1644 +/* 0x03d0 */ sllx %g2,3,%g2 1.1645 +/* 0x03d4 */ ldd [%o7],%f6 1.1646 +/* 0x03d8 */ add %o2,2,%o2 1.1647 +/* 0x03dc */ sra %o1,0,%g3 1.1648 +/* 0x03e0 */ ldd [%g2+%l4],%f8 1.1649 +/* 0x03e4 */ cmp %o2,%o0 1.1650 +/* 0x03e8 */ sllx %g3,3,%g3 1.1651 +/* 0x03ec */ add %o1,2,%o1 1.1652 +/* 0x03f0 */ ldd [%l4+%g3],%f10 1.1653 +/* 0x03f4 */ fdtox %f8,%f12 1.1654 +/* 0x03f8 */ fdtox %f10,%f4 1.1655 +/* 0x03fc */ fmovd %f12,%f8 1.1656 +/* 0x0400 */ fmovs %f6,%f12 1.1657 +/* 0x0404 */ fmovs %f6,%f4 1.1658 +/* 0x0408 */ fxtod %f12,%f6 1.1659 +/* 0x040c */ fxtod %f4,%f12 1.1660 +/* 0x0410 */ fdtox %f10,%f4 1.1661 +/* 0x0414 */ faddd %f6,%f2,%f6 1.1662 +/* 0x0418 */ std %f6,[%g2+%l4] 1.1663 +/* 0x041c */ faddd %f12,%f0,%f6 1.1664 +/* 0x0420 */ std %f6,[%l4+%g3] 1.1665 +/* 0x0424 */ fitod %f8,%f2 1.1666 +/* 0x0428 */ 
fitod %f4,%f0 1.1667 +/* 0x042c */ ble,pt %icc,.L900000652 1.1668 +/* 0x0430 */ sra %o2,0,%g2 1.1669 + .L77000233: 1.1670 +/* 0x0434 */ or %g0,0,%g3 1.1671 + .L77000215: 1.1672 +/* 0x0438 */ fdtox %f16,%f0 1.1673 + .L900000653: 1.1674 +/* 0x043c 256 */ ldd [%o7],%f6 1.1675 +/* 0x0440 */ add %g4,1,%g4 1.1676 +/* 0x0444 */ or %g0,%i0,%i2 1.1677 +/* 0x0448 */ ldd [%o5],%f8 1.1678 +/* 0x044c */ add %g3,1,%g3 1.1679 +/* 0x0450 */ add %i3,8,%i3 1.1680 +/* 0x0454 */ fmovs %f6,%f0 1.1681 +/* 0x0458 */ ldd [%o4],%f10 1.1682 +/* 0x045c */ ld [%sp+2223],%o0 1.1683 +/* 0x0460 */ fxtod %f0,%f6 1.1684 +/* 0x0464 */ cmp %i0,%o0 1.1685 +/* 0x0468 */ fmuld %f6,%f30,%f6 1.1686 +/* 0x046c */ fmuld %f6,%f8,%f8 1.1687 +/* 0x0470 */ fdtox %f8,%f8 1.1688 +/* 0x0474 */ fxtod %f8,%f8 1.1689 +/* 0x0478 */ fmuld %f8,%f10,%f8 1.1690 +/* 0x047c */ fsubd %f6,%f8,%f20 1.1691 +/* 0x0480 */ ble,a,pt %icc,.L900000651 1.1692 +/* 0x0484 */ ldd [%i5],%f6 1.1693 + .L900000625: 1.1694 +/* 0x0488 256 */ ba .L900000650 1.1695 +/* 0x048c */ sllx %g5,3,%g2 1.1696 + .L77000279: 1.1697 +/* 0x0490 261 */ ldd [%i1],%f4 1.1698 +/* 0x0494 */ ldd [%i2],%f6 1.1699 +/* 0x0498 273 */ std %f0,[%i3+8] 1.1700 +/* 0x049c */ std %f0,[%i3+16] 1.1701 +/* 0x04a0 261 */ fmuld %f4,%f6,%f6 1.1702 +/* 0x04a4 */ std %f6,[%i3] 1.1703 +/* 0x04a8 273 */ std %f0,[%i3+24] 1.1704 +/* 0x04ac */ std %f0,[%i3+32] 1.1705 +/* 0x04b0 */ fdtox %f6,%f2 1.1706 +/* 0x04b4 */ std %f0,[%i3+40] 1.1707 +/* 0x04b8 */ std %f0,[%i3+48] 1.1708 +/* 0x04bc */ std %f0,[%i3+56] 1.1709 +/* 0x04c0 */ std %f0,[%i3+64] 1.1710 +/* 0x04c4 */ fmovs %f0,%f2 1.1711 +/* 0x04c8 */ std %f0,[%i3+72] 1.1712 +/* 0x04cc */ std %f0,[%i3+80] 1.1713 +/* 0x04d0 */ std %f0,[%i3+88] 1.1714 +/* 0x04d4 */ std %f0,[%i3+96] 1.1715 +/* 0x04d8 */ std %f0,[%i3+104] 1.1716 +/* 0x04dc */ std %f0,[%i3+112] 1.1717 +/* 0x04e0 */ std %f0,[%i3+120] 1.1718 +/* 0x04e4 */ std %f0,[%i3+128] 1.1719 +/* 0x04e8 */ std %f0,[%i3+136] 1.1720 +/* 0x04ec */ std %f0,[%i3+144] 1.1721 +/* 0x04f0 */ std 
%f0,[%i3+152] 1.1722 +/* 0x04f4 */ std %f0,[%i3+160] 1.1723 +/* 0x04f8 */ std %f0,[%i3+168] 1.1724 +/* 0x04fc */ fxtod %f2,%f6 1.1725 +/* 0x0500 */ std %f0,[%i3+176] 1.1726 +/* 0x0504 281 */ or %g0,1,%o2 1.1727 +/* 0x0508 273 */ std %f0,[%i3+184] 1.1728 + 1.1729 +! 282 ! { 1.1730 +! 284 ! m2j=pdm2[j]; 1.1731 +! 285 ! a=pdtj[0]+pdn_0*digit; 1.1732 +! 286 ! b=pdtj[1]+pdm1_0*pdm2[j+1]+a*TwoToMinus16; 1.1733 + 1.1734 +/* 0x050c 286 */ sra %o2,0,%g2 1.1735 +/* 0x0510 279 */ or %g0,%i3,%o3 1.1736 +/* 0x0514 273 */ std %f0,[%i3+192] 1.1737 +/* 0x0518 278 */ fmuld %f6,%f14,%f6 1.1738 +/* 0x051c 281 */ or %g0,0,%g1 1.1739 +/* 0x0520 273 */ std %f0,[%i3+200] 1.1740 +/* 0x0524 */ std %f0,[%i3+208] 1.1741 +/* 0x0528 */ std %f0,[%i3+216] 1.1742 +/* 0x052c */ std %f0,[%i3+224] 1.1743 +/* 0x0530 */ std %f0,[%i3+232] 1.1744 +/* 0x0534 */ std %f0,[%i3+240] 1.1745 +/* 0x0538 */ std %f0,[%i3+248] 1.1746 +/* 0x053c */ std %f0,[%i3+256] 1.1747 +/* 0x0540 */ std %f0,[%i3+264] 1.1748 +/* 0x0544 */ std %f0,[%i3+272] 1.1749 +/* 0x0548 */ std %f0,[%i3+280] 1.1750 +/* 0x054c */ std %f0,[%i3+288] 1.1751 +/* 0x0550 */ std %f0,[%i3+296] 1.1752 +/* 0x0554 */ std %f0,[%i3+304] 1.1753 +/* 0x0558 */ std %f0,[%i3+312] 1.1754 +/* 0x055c */ std %f0,[%i3+320] 1.1755 +/* 0x0560 */ std %f0,[%i3+328] 1.1756 +/* 0x0564 */ std %f0,[%i3+336] 1.1757 +/* 0x0568 */ std %f0,[%i3+344] 1.1758 +/* 0x056c */ std %f0,[%i3+352] 1.1759 +/* 0x0570 */ std %f0,[%i3+360] 1.1760 +/* 0x0574 */ std %f0,[%i3+368] 1.1761 +/* 0x0578 */ std %f0,[%i3+376] 1.1762 +/* 0x057c */ std %f0,[%i3+384] 1.1763 +/* 0x0580 */ std %f0,[%i3+392] 1.1764 +/* 0x0584 */ std %f0,[%i3+400] 1.1765 +/* 0x0588 */ std %f0,[%i3+408] 1.1766 +/* 0x058c */ std %f0,[%i3+416] 1.1767 +/* 0x0590 */ std %f0,[%i3+424] 1.1768 +/* 0x0594 */ std %f0,[%i3+432] 1.1769 +/* 0x0598 */ std %f0,[%i3+440] 1.1770 +/* 0x059c */ std %f0,[%i3+448] 1.1771 +/* 0x05a0 */ std %f0,[%i3+456] 1.1772 +/* 0x05a4 */ std %f0,[%i3+464] 1.1773 +/* 0x05a8 */ std %f0,[%i3+472] 1.1774 +/* 
0x05ac */ std %f0,[%i3+480] 1.1775 +/* 0x05b0 */ std %f0,[%i3+488] 1.1776 +/* 0x05b4 */ std %f0,[%i3+496] 1.1777 +/* 0x05b8 278 */ ldd [%o5],%f8 1.1778 +/* 0x05bc */ ldd [%o4],%f10 1.1779 +/* 0x05c0 */ fmuld %f6,%f8,%f8 1.1780 +/* 0x05c4 273 */ std %f0,[%i3+504] 1.1781 +/* 0x05c8 */ std %f0,[%i3+512] 1.1782 +/* 0x05cc */ std %f0,[%i3+520] 1.1783 +/* 0x05d0 */ fdtox %f8,%f8 1.1784 +/* 0x05d4 275 */ ldd [%o0],%f0 1.1785 +/* 0x05d8 */ fxtod %f8,%f8 1.1786 +/* 0x05dc */ fmuld %f8,%f10,%f8 1.1787 +/* 0x05e0 */ fsubd %f6,%f8,%f2 1.1788 + 1.1789 +! 287 ! pdtj[1]=b; 1.1790 +! 289 ! /**** this loop will be fully unrolled: 1.1791 +! 290 ! for(i=1;i<16;i++) 1.1792 +! 291 ! { 1.1793 +! 292 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit; 1.1794 +! 293 ! } 1.1795 +! 294 ! *************************************/ 1.1796 +! 295 ! pdtj[2]+=pdm1[1]*m2j+pdn[1]*digit; 1.1797 +! 296 ! pdtj[4]+=pdm1[2]*m2j+pdn[2]*digit; 1.1798 +! 297 ! pdtj[6]+=pdm1[3]*m2j+pdn[3]*digit; 1.1799 +! 298 ! pdtj[8]+=pdm1[4]*m2j+pdn[4]*digit; 1.1800 +! 299 ! pdtj[10]+=pdm1[5]*m2j+pdn[5]*digit; 1.1801 +! 300 ! pdtj[12]+=pdm1[6]*m2j+pdn[6]*digit; 1.1802 +! 301 ! pdtj[14]+=pdm1[7]*m2j+pdn[7]*digit; 1.1803 +! 302 ! pdtj[16]+=pdm1[8]*m2j+pdn[8]*digit; 1.1804 +! 303 ! pdtj[18]+=pdm1[9]*m2j+pdn[9]*digit; 1.1805 +! 304 ! pdtj[20]+=pdm1[10]*m2j+pdn[10]*digit; 1.1806 +! 305 ! pdtj[22]+=pdm1[11]*m2j+pdn[11]*digit; 1.1807 +! 306 ! pdtj[24]+=pdm1[12]*m2j+pdn[12]*digit; 1.1808 +! 307 ! pdtj[26]+=pdm1[13]*m2j+pdn[13]*digit; 1.1809 +! 308 ! pdtj[28]+=pdm1[14]*m2j+pdn[14]*digit; 1.1810 +! 309 ! pdtj[30]+=pdm1[15]*m2j+pdn[15]*digit; 1.1811 +! 310 ! /* no need for cleenup, cannot overflow */ 1.1812 +! 311 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16); 1.1813 + 1.1814 + 1.1815 + fmovd %f2,%f0 ! hand modified 1.1816 + fmovd %f30,%f18 ! hand modified 1.1817 + ldd [%o0],%f2 1.1818 + ldd [%o3],%f8 1.1819 + ldd [%i1],%f10 1.1820 + ldd [%o5],%f14 ! hand modified 1.1821 + ldd [%o4],%f16 ! 
hand modified 1.1822 + ldd [%i2],%f24 1.1823 + 1.1824 + ldd [%i1+8],%f26 1.1825 + ldd [%i1+16],%f40 1.1826 + ldd [%i1+48],%f46 1.1827 + ldd [%i1+56],%f30 1.1828 + ldd [%i1+64],%f54 1.1829 + ldd [%i1+104],%f34 1.1830 + ldd [%i1+112],%f58 1.1831 + 1.1832 + ldd [%o0+8],%f28 1.1833 + ldd [%o0+104],%f38 1.1834 + ldd [%o0+112],%f60 1.1835 + 1.1836 + .L99999999: !1 1.1837 + ldd [%i1+24],%f32 1.1838 + fmuld %f0,%f2,%f4 !2 1.1839 + ldd [%o0+24],%f36 1.1840 + fmuld %f26,%f24,%f20 !3 1.1841 + ldd [%i1+40],%f42 1.1842 + fmuld %f28,%f0,%f22 !4 1.1843 + ldd [%o0+40],%f44 1.1844 + fmuld %f32,%f24,%f32 !5 1.1845 + ldd [%i2+8],%f6 1.1846 + faddd %f4,%f8,%f4 1.1847 + fmuld %f36,%f0,%f36 !6 1.1848 + add %i2,8,%i2 1.1849 + ldd [%o0+56],%f50 1.1850 + fmuld %f42,%f24,%f42 !7 1.1851 + ldd [%i1+72],%f52 1.1852 + faddd %f20,%f22,%f20 1.1853 + fmuld %f44,%f0,%f44 !8 1.1854 + ldd [%o3+16],%f22 1.1855 + fmuld %f10,%f6,%f12 !9 1.1856 + ldd [%o0+72],%f56 1.1857 + faddd %f32,%f36,%f32 1.1858 + fmuld %f14,%f4,%f4 !10 1.1859 + ldd [%o3+48],%f36 1.1860 + fmuld %f30,%f24,%f48 !11 1.1861 + ldd [%o3+8],%f8 1.1862 + faddd %f20,%f22,%f20 1.1863 + fmuld %f50,%f0,%f50 !12 1.1864 + std %f20,[%o3+16] 1.1865 + faddd %f42,%f44,%f42 1.1866 + fmuld %f52,%f24,%f52 !13 1.1867 + ldd [%o3+80],%f44 1.1868 + faddd %f4,%f12,%f4 1.1869 + fmuld %f56,%f0,%f56 !14 1.1870 + ldd [%i1+88],%f20 1.1871 + faddd %f32,%f36,%f32 !15 1.1872 + ldd [%o0+88],%f22 1.1873 + faddd %f48,%f50,%f48 !16 1.1874 + ldd [%o3+112],%f50 1.1875 + faddd %f52,%f56,%f52 !17 1.1876 + ldd [%o3+144],%f56 1.1877 + faddd %f4,%f8,%f8 1.1878 + fmuld %f20,%f24,%f20 !18 1.1879 + std %f32,[%o3+48] 1.1880 + faddd %f42,%f44,%f42 1.1881 + fmuld %f22,%f0,%f22 !19 1.1882 + std %f42,[%o3+80] 1.1883 + faddd %f48,%f50,%f48 1.1884 + fmuld %f34,%f24,%f32 !20 1.1885 + std %f48,[%o3+112] 1.1886 + faddd %f52,%f56,%f52 1.1887 + fmuld %f38,%f0,%f36 !21 1.1888 + ldd [%i1+120],%f42 1.1889 + fdtox %f8,%f4 !22 1.1890 + std %f52,[%o3+144] 1.1891 + faddd %f20,%f22,%f20 !23 1.1892 + 
ldd [%o0+120],%f44 !24 1.1893 + ldd [%o3+176],%f22 1.1894 + faddd %f32,%f36,%f32 1.1895 + fmuld %f42,%f24,%f42 !25 1.1896 + ldd [%o0+16],%f50 1.1897 + fmovs %f17,%f4 !26 1.1898 + ldd [%i1+32],%f52 1.1899 + fmuld %f44,%f0,%f44 !27 1.1900 + ldd [%o0+32],%f56 1.1901 + fmuld %f40,%f24,%f48 !28 1.1902 + ldd [%o3+208],%f36 1.1903 + faddd %f20,%f22,%f20 1.1904 + fmuld %f50,%f0,%f50 !29 1.1905 + std %f20,[%o3+176] 1.1906 + fxtod %f4,%f4 1.1907 + fmuld %f52,%f24,%f52 !30 1.1908 + ldd [%o0+48],%f22 1.1909 + faddd %f42,%f44,%f42 1.1910 + fmuld %f56,%f0,%f56 !31 1.1911 + ldd [%o3+240],%f44 1.1912 + faddd %f32,%f36,%f32 !32 1.1913 + std %f32,[%o3+208] 1.1914 + faddd %f48,%f50,%f48 1.1915 + fmuld %f46,%f24,%f20 !33 1.1916 + ldd [%o3+32],%f50 1.1917 + fmuld %f4,%f18,%f12 !34 1.1918 + ldd [%o0+64],%f36 1.1919 + faddd %f52,%f56,%f52 1.1920 + fmuld %f22,%f0,%f22 !35 1.1921 + ldd [%o3+64],%f56 1.1922 + faddd %f42,%f44,%f42 !36 1.1923 + std %f42,[%o3+240] 1.1924 + faddd %f48,%f50,%f48 1.1925 + fmuld %f54,%f24,%f32 !37 1.1926 + std %f48,[%o3+32] 1.1927 + fmuld %f12,%f14,%f4 !38 1.1928 + ldd [%i1+80],%f42 1.1929 + faddd %f52,%f56,%f56 ! yes, tmp52! 1.1930 + fmuld %f36,%f0,%f36 !39 1.1931 + ldd [%o0+80],%f44 1.1932 + faddd %f20,%f22,%f20 !40 1.1933 + ldd [%i1+96],%f48 1.1934 + fmuld %f58,%f24,%f52 !41 1.1935 + ldd [%o0+96],%f50 1.1936 + fdtox %f4,%f4 1.1937 + fmuld %f42,%f24,%f42 !42 1.1938 + std %f56,[%o3+64] ! yes, tmp52! 
1.1939 + faddd %f32,%f36,%f32 1.1940 + fmuld %f44,%f0,%f44 !43 1.1941 + ldd [%o3+96],%f22 1.1942 + fmuld %f48,%f24,%f48 !44 1.1943 + ldd [%o3+128],%f36 1.1944 + fmovd %f6,%f24 1.1945 + fmuld %f50,%f0,%f50 !45 1.1946 + fxtod %f4,%f4 1.1947 + fmuld %f60,%f0,%f56 !46 1.1948 + add %o3,8,%o3 1.1949 + faddd %f42,%f44,%f42 !47 1.1950 + ldd [%o3+160-8],%f44 1.1951 + faddd %f20,%f22,%f20 !48 1.1952 + std %f20,[%o3+96-8] 1.1953 + faddd %f48,%f50,%f48 !49 1.1954 + ldd [%o3+192-8],%f50 1.1955 + faddd %f52,%f56,%f52 1.1956 + fmuld %f4,%f16,%f4 !50 1.1957 + ldd [%o3+224-8],%f56 1.1958 + faddd %f32,%f36,%f32 !51 1.1959 + std %f32,[%o3+128-8] 1.1960 + faddd %f42,%f44,%f42 !52 1.1961 + add %g1,1,%g1 1.1962 + std %f42,[%o3+160-8] 1.1963 + faddd %f48,%f50,%f48 !53 1.1964 + cmp %g1,31 1.1965 + std %f48,[%o3+192-8] 1.1966 + fsubd %f12,%f4,%f0 !54 1.1967 + faddd %f52,%f56,%f52 1.1968 + ble,pt %icc,.L99999999 1.1969 + std %f52,[%o3+224-8] !55 1.1970 + std %f8,[%o3] 1.1971 +! 312 ! } 1.1972 +! 313 ! } 1.1973 +! 315 ! 
conv_d16_to_i32(result,dt+2*nlen,(long long *)dt,nlen+1); 1.1974 + 1.1975 +/* 0x0844 315 */ sllx %g5,3,%g2 1.1976 + .L900000650: 1.1977 +/* 0x0848 315 */ ldd [%g2+%l4],%f2 1.1978 +/* 0x084c */ add %l4,%g2,%o0 1.1979 +/* 0x0850 */ or %g0,0,%g1 1.1980 +/* 0x0854 */ ldd [%o0+8],%f4 1.1981 +/* 0x0858 */ or %g0,0,%i2 1.1982 +/* 0x085c */ cmp %l0,0 1.1983 +/* 0x0860 */ fdtox %f2,%f2 1.1984 +/* 0x0864 */ std %f2,[%sp+2255] 1.1985 +/* 0x0868 311 */ sethi %hi(0xfc00),%o3 1.1986 +/* 0x086c 315 */ fdtox %f4,%f2 1.1987 +/* 0x0870 */ std %f2,[%sp+2247] 1.1988 +/* 0x0874 311 */ or %g0,-1,%o2 1.1989 +/* 0x0878 */ srl %o2,0,%o5 1.1990 +/* 0x087c */ or %g0,2,%g5 1.1991 +/* 0x0880 */ sub %l0,1,%g3 1.1992 +/* 0x0884 */ or %g0,%o0,%o7 1.1993 +/* 0x0888 */ add %o3,1023,%o4 1.1994 +/* 0x088c 315 */ or %g0,64,%o3 1.1995 +/* 0x0890 */ ldx [%sp+2255],%i0 1.1996 +/* 0x0894 */ sub %l0,2,%o1 1.1997 +/* 0x0898 */ ldx [%sp+2247],%i1 1.1998 +/* 0x089c */ ble,pt %icc,.L900000648 1.1999 +/* 0x08a0 */ sethi %hi(0xfc00),%g2 1.2000 +/* 0x08a4 */ cmp %l0,6 1.2001 +/* 0x08a8 */ and %i0,%o5,%o2 1.2002 +/* 0x08ac */ bl,pn %icc,.L77000287 1.2003 +/* 0x08b0 */ or %g0,3,%g4 1.2004 +/* 0x08b4 */ ldd [%o7+16],%f0 1.2005 +/* 0x08b8 */ and %i1,%o4,%i3 1.2006 +/* 0x08bc */ sllx %i3,16,%o0 1.2007 +/* 0x08c0 */ or %g0,5,%g4 1.2008 +/* 0x08c4 */ srax %i1,16,%i4 1.2009 +/* 0x08c8 */ fdtox %f0,%f0 1.2010 +/* 0x08cc */ std %f0,[%sp+2239] 1.2011 +/* 0x08d0 */ srax %i0,32,%i1 1.2012 +/* 0x08d4 */ add %o2,%o0,%i5 1.2013 +/* 0x08d8 */ ldd [%o7+24],%f0 1.2014 +/* 0x08dc */ and %i5,%o5,%l1 1.2015 +/* 0x08e0 */ or %g0,72,%o2 1.2016 +/* 0x08e4 */ or %g0,4,%o0 1.2017 +/* 0x08e8 */ or %g0,4,%g5 1.2018 +/* 0x08ec */ ldx [%sp+2239],%g1 1.2019 +/* 0x08f0 */ fdtox %f0,%f0 1.2020 +/* 0x08f4 */ or %g0,4,%i2 1.2021 +/* 0x08f8 */ std %f0,[%sp+2231] 1.2022 +/* 0x08fc */ ldd [%o7+40],%f2 1.2023 +/* 0x0900 */ and %g1,%o5,%i3 1.2024 +/* 0x0904 */ ldd [%o7+32],%f0 1.2025 +/* 0x0908 */ srax %g1,32,%g1 1.2026 +/* 0x090c */ ldd [%o7+56],%f4 
1.2027 +/* 0x0910 */ fdtox %f2,%f2 1.2028 +/* 0x0914 */ ldx [%sp+2231],%g2 1.2029 +/* 0x0918 */ fdtox %f0,%f0 1.2030 +/* 0x091c */ st %l1,[%l2] 1.2031 +/* 0x0920 */ srax %i5,32,%l1 1.2032 +/* 0x0924 */ fdtox %f4,%f4 1.2033 +/* 0x0928 */ std %f2,[%sp+2231] 1.2034 +/* 0x092c */ and %g2,%o4,%i5 1.2035 +/* 0x0930 */ add %i4,%l1,%i4 1.2036 +/* 0x0934 */ std %f0,[%sp+2239] 1.2037 +/* 0x0938 */ sllx %i5,16,%i0 1.2038 +/* 0x093c */ add %i1,%i4,%i1 1.2039 +/* 0x0940 */ ldd [%o7+48],%f2 1.2040 +/* 0x0944 */ srax %g2,16,%g2 1.2041 +/* 0x0948 */ add %i3,%i0,%i0 1.2042 +/* 0x094c */ ldd [%o7+72],%f0 1.2043 +/* 0x0950 */ add %i0,%i1,%i3 1.2044 +/* 0x0954 */ srax %i3,32,%i4 1.2045 +/* 0x0958 */ fdtox %f2,%f2 1.2046 +/* 0x095c */ and %i3,%o5,%i3 1.2047 +/* 0x0960 */ ldx [%sp+2231],%i1 1.2048 +/* 0x0964 */ add %g2,%i4,%g2 1.2049 +/* 0x0968 */ ldx [%sp+2239],%i0 1.2050 +/* 0x096c */ add %g1,%g2,%g1 1.2051 +/* 0x0970 */ std %f2,[%sp+2239] 1.2052 +/* 0x0974 */ std %f4,[%sp+2231] 1.2053 +/* 0x0978 */ ldd [%o7+64],%f2 1.2054 +/* 0x097c */ st %i3,[%l2+4] 1.2055 + .L900000631: 1.2056 +/* 0x0980 */ ldx [%sp+2231],%i3 1.2057 +/* 0x0984 */ add %i2,2,%i2 1.2058 +/* 0x0988 */ add %g4,4,%g4 1.2059 +/* 0x098c */ ldx [%sp+2239],%i5 1.2060 +/* 0x0990 */ add %o2,16,%o2 1.2061 +/* 0x0994 */ and %i1,%o4,%g2 1.2062 +/* 0x0998 */ sllx %g2,16,%i4 1.2063 +/* 0x099c */ and %i0,%o5,%g2 1.2064 +/* 0x09a0 */ ldd [%o7+%o2],%f4 1.2065 +/* 0x09a4 */ fdtox %f0,%f0 1.2066 +/* 0x09a8 */ std %f0,[%sp+2231] 1.2067 +/* 0x09ac */ srax %i1,16,%i1 1.2068 +/* 0x09b0 */ add %g2,%i4,%g2 1.2069 +/* 0x09b4 */ fdtox %f2,%f0 1.2070 +/* 0x09b8 */ add %o3,16,%o3 1.2071 +/* 0x09bc */ std %f0,[%sp+2239] 1.2072 +/* 0x09c0 */ add %g2,%g1,%g1 1.2073 +/* 0x09c4 */ ldd [%o7+%o3],%f2 1.2074 +/* 0x09c8 */ srax %g1,32,%i4 1.2075 +/* 0x09cc */ cmp %i2,%o1 1.2076 +/* 0x09d0 */ srax %i0,32,%g2 1.2077 +/* 0x09d4 */ add %i1,%i4,%i0 1.2078 +/* 0x09d8 */ add %g2,%i0,%i4 1.2079 +/* 0x09dc */ add %o0,4,%o0 1.2080 +/* 0x09e0 */ and %g1,%o5,%g2 
1.2081 +/* 0x09e4 */ or %g0,%i5,%g1 1.2082 +/* 0x09e8 */ st %g2,[%l2+%o0] 1.2083 +/* 0x09ec */ add %g5,4,%g5 1.2084 +/* 0x09f0 */ ldx [%sp+2231],%i1 1.2085 +/* 0x09f4 */ ldx [%sp+2239],%i0 1.2086 +/* 0x09f8 */ add %o2,16,%o2 1.2087 +/* 0x09fc */ and %i3,%o4,%g2 1.2088 +/* 0x0a00 */ sllx %g2,16,%i5 1.2089 +/* 0x0a04 */ and %g1,%o5,%g2 1.2090 +/* 0x0a08 */ ldd [%o7+%o2],%f0 1.2091 +/* 0x0a0c */ fdtox %f4,%f4 1.2092 +/* 0x0a10 */ std %f4,[%sp+2231] 1.2093 +/* 0x0a14 */ srax %i3,16,%i3 1.2094 +/* 0x0a18 */ add %g2,%i5,%g2 1.2095 +/* 0x0a1c */ fdtox %f2,%f2 1.2096 +/* 0x0a20 */ add %o3,16,%o3 1.2097 +/* 0x0a24 */ std %f2,[%sp+2239] 1.2098 +/* 0x0a28 */ add %g2,%i4,%g2 1.2099 +/* 0x0a2c */ ldd [%o7+%o3],%f2 1.2100 +/* 0x0a30 */ srax %g2,32,%i4 1.2101 +/* 0x0a34 */ srax %g1,32,%g1 1.2102 +/* 0x0a38 */ add %i3,%i4,%i3 1.2103 +/* 0x0a3c */ add %g1,%i3,%g1 1.2104 +/* 0x0a40 */ add %o0,4,%o0 1.2105 +/* 0x0a44 */ and %g2,%o5,%g2 1.2106 +/* 0x0a48 */ ble,pt %icc,.L900000631 1.2107 +/* 0x0a4c */ st %g2,[%l2+%o0] 1.2108 + .L900000634: 1.2109 +/* 0x0a50 */ srax %i1,16,%i5 1.2110 +/* 0x0a54 */ ldx [%sp+2231],%o1 1.2111 +/* 0x0a58 */ and %i1,%o4,%i3 1.2112 +/* 0x0a5c */ sllx %i3,16,%i3 1.2113 +/* 0x0a60 */ ldx [%sp+2239],%i4 1.2114 +/* 0x0a64 */ and %i0,%o5,%g2 1.2115 +/* 0x0a68 */ add %g2,%i3,%g2 1.2116 +/* 0x0a6c */ and %o1,%o4,%i3 1.2117 +/* 0x0a70 */ fdtox %f0,%f4 1.2118 +/* 0x0a74 */ sllx %i3,16,%i3 1.2119 +/* 0x0a78 */ std %f4,[%sp+2231] 1.2120 +/* 0x0a7c */ add %g2,%g1,%g2 1.2121 +/* 0x0a80 */ srax %g2,32,%l1 1.2122 +/* 0x0a84 */ and %i4,%o5,%i1 1.2123 +/* 0x0a88 */ fdtox %f2,%f0 1.2124 +/* 0x0a8c */ srax %i0,32,%g1 1.2125 +/* 0x0a90 */ std %f0,[%sp+2239] 1.2126 +/* 0x0a94 */ add %i5,%l1,%i0 1.2127 +/* 0x0a98 */ srax %o1,16,%o1 1.2128 +/* 0x0a9c */ add %g1,%i0,%i0 1.2129 +/* 0x0aa0 */ add %o0,4,%g1 1.2130 +/* 0x0aa4 */ add %i1,%i3,%o0 1.2131 +/* 0x0aa8 */ and %g2,%o5,%g2 1.2132 +/* 0x0aac */ st %g2,[%l2+%g1] 1.2133 +/* 0x0ab0 */ add %o0,%i0,%o0 1.2134 +/* 0x0ab4 */ srax 
%o0,32,%i3 1.2135 +/* 0x0ab8 */ ldx [%sp+2231],%i1 1.2136 +/* 0x0abc */ add %g1,4,%g1 1.2137 +/* 0x0ac0 */ ldx [%sp+2239],%i0 1.2138 +/* 0x0ac4 */ and %o0,%o5,%g2 1.2139 +/* 0x0ac8 */ add %o1,%i3,%o1 1.2140 +/* 0x0acc */ srax %i4,32,%o0 1.2141 +/* 0x0ad0 */ cmp %i2,%g3 1.2142 +/* 0x0ad4 */ st %g2,[%l2+%g1] 1.2143 +/* 0x0ad8 */ bg,pn %icc,.L77000236 1.2144 +/* 0x0adc */ add %o0,%o1,%g1 1.2145 +/* 0x0ae0 */ add %g4,6,%g4 1.2146 +/* 0x0ae4 */ add %g5,6,%g5 1.2147 + .L77000287: 1.2148 +/* 0x0ae8 */ sra %g5,0,%o1 1.2149 + .L900000647: 1.2150 +/* 0x0aec */ sllx %o1,3,%o2 1.2151 +/* 0x0af0 */ and %i0,%o5,%o0 1.2152 +/* 0x0af4 */ ldd [%o7+%o2],%f0 1.2153 +/* 0x0af8 */ sra %g4,0,%o2 1.2154 +/* 0x0afc */ and %i1,%o4,%o1 1.2155 +/* 0x0b00 */ sllx %o2,3,%o2 1.2156 +/* 0x0b04 */ add %g1,%o0,%o0 1.2157 +/* 0x0b08 */ fdtox %f0,%f0 1.2158 +/* 0x0b0c */ std %f0,[%sp+2239] 1.2159 +/* 0x0b10 */ sllx %o1,16,%o1 1.2160 +/* 0x0b14 */ add %o0,%o1,%o1 1.2161 +/* 0x0b18 */ add %g5,2,%g5 1.2162 +/* 0x0b1c */ ldd [%o7+%o2],%f0 1.2163 +/* 0x0b20 */ srax %o1,32,%g1 1.2164 +/* 0x0b24 */ and %o1,%o5,%o2 1.2165 +/* 0x0b28 */ srax %i1,16,%o0 1.2166 +/* 0x0b2c */ add %g4,2,%g4 1.2167 +/* 0x0b30 */ fdtox %f0,%f0 1.2168 +/* 0x0b34 */ std %f0,[%sp+2231] 1.2169 +/* 0x0b38 */ sra %i2,0,%o1 1.2170 +/* 0x0b3c */ sllx %o1,2,%o1 1.2171 +/* 0x0b40 */ add %o0,%g1,%g2 1.2172 +/* 0x0b44 */ srax %i0,32,%g1 1.2173 +/* 0x0b48 */ add %i2,1,%i2 1.2174 +/* 0x0b4c */ add %g1,%g2,%g1 1.2175 +/* 0x0b50 */ cmp %i2,%g3 1.2176 +/* 0x0b54 */ ldx [%sp+2239],%o3 1.2177 +/* 0x0b58 */ ldx [%sp+2231],%i1 1.2178 +/* 0x0b5c */ st %o2,[%l2+%o1] 1.2179 +/* 0x0b60 */ or %g0,%o3,%i0 1.2180 +/* 0x0b64 */ ble,pt %icc,.L900000647 1.2181 +/* 0x0b68 */ sra %g5,0,%o1 1.2182 + .L77000236: 1.2183 +/* 0x0b6c */ sethi %hi(0xfc00),%g2 1.2184 + .L900000648: 1.2185 +/* 0x0b70 */ or %g0,-1,%o0 1.2186 +/* 0x0b74 */ add %g2,1023,%g2 1.2187 +/* 0x0b78 */ srl %o0,0,%g3 1.2188 +/* 0x0b7c */ and %i1,%g2,%g2 1.2189 +/* 0x0b80 */ and %i0,%g3,%g4 1.2190 +/* 
0x0b84 */ sllx %g2,16,%g2 1.2191 +/* 0x0b88 */ add %g1,%g4,%g4 1.2192 +/* 0x0b8c */ sra %i2,0,%g5 1.2193 +/* 0x0b90 */ add %g4,%g2,%g4 1.2194 +/* 0x0b94 */ sllx %g5,2,%g2 1.2195 +/* 0x0b98 */ and %g4,%g3,%g3 1.2196 +/* 0x0b9c */ st %g3,[%l2+%g2] 1.2197 + 1.2198 +! 317 ! adjust_montf_result(result,nint,nlen); 1.2199 + 1.2200 +/* 0x0ba0 317 */ sra %l0,0,%g4 1.2201 +/* 0x0ba4 */ sllx %g4,2,%g2 1.2202 +/* 0x0ba8 */ ld [%l2+%g2],%g2 1.2203 +/* 0x0bac */ cmp %g2,0 1.2204 +/* 0x0bb0 */ bleu,pn %icc,.L77000241 1.2205 +/* 0x0bb4 */ or %g0,-1,%o1 1.2206 +/* 0x0bb8 */ ba .L900000646 1.2207 +/* 0x0bbc */ cmp %o1,0 1.2208 + .L77000241: 1.2209 +/* 0x0bc0 */ sub %l0,1,%o1 1.2210 +/* 0x0bc4 */ cmp %o1,0 1.2211 +/* 0x0bc8 */ bl,pn %icc,.L77000244 1.2212 +/* 0x0bcc */ sra %o1,0,%g2 1.2213 + .L900000645: 1.2214 +/* 0x0bd0 */ sllx %g2,2,%g2 1.2215 +/* 0x0bd4 */ sub %o1,1,%o0 1.2216 +/* 0x0bd8 */ ld [%l3+%g2],%g3 1.2217 +/* 0x0bdc */ ld [%l2+%g2],%g2 1.2218 +/* 0x0be0 */ cmp %g2,%g3 1.2219 +/* 0x0be4 */ bne,pn %icc,.L77000244 1.2220 +/* 0x0be8 */ nop 1.2221 +/* 0x0bec 0 */ or %g0,%o0,%o1 1.2222 +/* 0x0bf0 317 */ cmp %o0,0 1.2223 +/* 0x0bf4 */ bge,pt %icc,.L900000645 1.2224 +/* 0x0bf8 */ sra %o1,0,%g2 1.2225 + .L77000244: 1.2226 +/* 0x0bfc */ cmp %o1,0 1.2227 + .L900000646: 1.2228 +/* 0x0c00 */ bl,pn %icc,.L77000288 1.2229 +/* 0x0c04 */ sra %o1,0,%g2 1.2230 +/* 0x0c08 */ sllx %g2,2,%g2 1.2231 +/* 0x0c0c */ ld [%l3+%g2],%g3 1.2232 +/* 0x0c10 */ ld [%l2+%g2],%g2 1.2233 +/* 0x0c14 */ cmp %g2,%g3 1.2234 +/* 0x0c18 */ bleu,pt %icc,.L77000224 1.2235 +/* 0x0c1c */ nop 1.2236 + .L77000288: 1.2237 +/* 0x0c20 */ cmp %l0,0 1.2238 +/* 0x0c24 */ ble,pt %icc,.L77000224 1.2239 +/* 0x0c28 */ nop 1.2240 +/* 0x0c2c 317 */ or %g0,-1,%g2 1.2241 +/* 0x0c30 315 */ or %g0,0,%i0 1.2242 +/* 0x0c34 317 */ srl %g2,0,%g2 1.2243 +/* 0x0c38 315 */ or %g0,0,%g4 1.2244 +/* 0x0c3c */ or %g0,0,%o1 1.2245 +/* 0x0c40 317 */ sub %l0,1,%g5 1.2246 +/* 0x0c44 */ cmp %l0,9 1.2247 +/* 0x0c48 315 */ or %g0,8,%o5 1.2248 +/* 
0x0c4c */ bl,pn %icc,.L77000289 1.2249 +/* 0x0c50 */ sub %l0,4,%o7 1.2250 +/* 0x0c54 */ ld [%l2],%o1 1.2251 +/* 0x0c58 */ or %g0,5,%i0 1.2252 +/* 0x0c5c */ ld [%l3],%o2 1.2253 +/* 0x0c60 */ or %g0,12,%o4 1.2254 +/* 0x0c64 */ or %g0,16,%g1 1.2255 +/* 0x0c68 */ ld [%l3+4],%o3 1.2256 +/* 0x0c6c */ ld [%l2+4],%o0 1.2257 +/* 0x0c70 */ sub %o1,%o2,%o1 1.2258 +/* 0x0c74 */ ld [%l3+8],%i1 1.2259 +/* 0x0c78 */ and %o1,%g2,%g4 1.2260 +/* 0x0c7c */ st %g4,[%l2] 1.2261 +/* 0x0c80 */ srax %o1,32,%g4 1.2262 +/* 0x0c84 */ sub %o0,%o3,%o0 1.2263 +/* 0x0c88 */ ld [%l3+12],%o2 1.2264 +/* 0x0c8c */ add %o0,%g4,%o0 1.2265 +/* 0x0c90 */ and %o0,%g2,%g4 1.2266 +/* 0x0c94 */ st %g4,[%l2+4] 1.2267 +/* 0x0c98 */ srax %o0,32,%o0 1.2268 +/* 0x0c9c */ ld [%l2+8],%o1 1.2269 +/* 0x0ca0 */ ld [%l2+12],%o3 1.2270 +/* 0x0ca4 */ sub %o1,%i1,%o1 1.2271 + .L900000635: 1.2272 +/* 0x0ca8 */ add %g1,4,%g3 1.2273 +/* 0x0cac */ ld [%g1+%l2],%g4 1.2274 +/* 0x0cb0 */ add %o1,%o0,%o0 1.2275 +/* 0x0cb4 */ ld [%l3+%g1],%i1 1.2276 +/* 0x0cb8 */ sub %o3,%o2,%o1 1.2277 +/* 0x0cbc */ and %o0,%g2,%o2 1.2278 +/* 0x0cc0 */ st %o2,[%o5+%l2] 1.2279 +/* 0x0cc4 */ srax %o0,32,%o2 1.2280 +/* 0x0cc8 */ add %i0,4,%i0 1.2281 +/* 0x0ccc */ add %g1,8,%o5 1.2282 +/* 0x0cd0 */ ld [%g3+%l2],%o0 1.2283 +/* 0x0cd4 */ add %o1,%o2,%o1 1.2284 +/* 0x0cd8 */ ld [%l3+%g3],%o3 1.2285 +/* 0x0cdc */ sub %g4,%i1,%o2 1.2286 +/* 0x0ce0 */ and %o1,%g2,%g4 1.2287 +/* 0x0ce4 */ st %g4,[%o4+%l2] 1.2288 +/* 0x0ce8 */ srax %o1,32,%g4 1.2289 +/* 0x0cec */ cmp %i0,%o7 1.2290 +/* 0x0cf0 */ add %g1,12,%o4 1.2291 +/* 0x0cf4 */ ld [%o5+%l2],%o1 1.2292 +/* 0x0cf8 */ add %o2,%g4,%o2 1.2293 +/* 0x0cfc */ ld [%l3+%o5],%i1 1.2294 +/* 0x0d00 */ sub %o0,%o3,%o0 1.2295 +/* 0x0d04 */ and %o2,%g2,%o3 1.2296 +/* 0x0d08 */ st %o3,[%g1+%l2] 1.2297 +/* 0x0d0c */ srax %o2,32,%g4 1.2298 +/* 0x0d10 */ ld [%o4+%l2],%o3 1.2299 +/* 0x0d14 */ add %g1,16,%g1 1.2300 +/* 0x0d18 */ add %o0,%g4,%o0 1.2301 +/* 0x0d1c */ ld [%l3+%o4],%o2 1.2302 +/* 0x0d20 */ sub %o1,%i1,%o1 1.2303 
+/* 0x0d24 */ and %o0,%g2,%g4 1.2304 +/* 0x0d28 */ st %g4,[%g3+%l2] 1.2305 +/* 0x0d2c */ ble,pt %icc,.L900000635 1.2306 +/* 0x0d30 */ srax %o0,32,%o0 1.2307 + .L900000638: 1.2308 +/* 0x0d34 */ add %o1,%o0,%g3 1.2309 +/* 0x0d38 */ sub %o3,%o2,%o1 1.2310 +/* 0x0d3c */ ld [%g1+%l2],%o0 1.2311 +/* 0x0d40 */ ld [%l3+%g1],%o2 1.2312 +/* 0x0d44 */ srax %g3,32,%o7 1.2313 +/* 0x0d48 */ and %g3,%g2,%o3 1.2314 +/* 0x0d4c */ add %o1,%o7,%o1 1.2315 +/* 0x0d50 */ st %o3,[%o5+%l2] 1.2316 +/* 0x0d54 */ cmp %i0,%g5 1.2317 +/* 0x0d58 */ sub %o0,%o2,%o0 1.2318 +/* 0x0d5c */ and %o1,%g2,%o2 1.2319 +/* 0x0d60 */ st %o2,[%o4+%l2] 1.2320 +/* 0x0d64 */ srax %o1,32,%o1 1.2321 +/* 0x0d68 */ sra %i0,0,%o2 1.2322 +/* 0x0d6c */ add %o0,%o1,%o0 1.2323 +/* 0x0d70 */ srax %o0,32,%g4 1.2324 +/* 0x0d74 */ and %o0,%g2,%o1 1.2325 +/* 0x0d78 */ st %o1,[%g1+%l2] 1.2326 +/* 0x0d7c */ bg,pn %icc,.L77000224 1.2327 +/* 0x0d80 */ sllx %o2,2,%o1 1.2328 + .L77000289: 1.2329 +/* 0x0d84 0 */ or %g0,%o1,%g1 1.2330 + .L900000644: 1.2331 +/* 0x0d88 */ ld [%o1+%l2],%o0 1.2332 +/* 0x0d8c */ add %i0,1,%i0 1.2333 +/* 0x0d90 */ ld [%l3+%o1],%o1 1.2334 +/* 0x0d94 */ sra %i0,0,%o2 1.2335 +/* 0x0d98 */ cmp %i0,%g5 1.2336 +/* 0x0d9c */ add %g4,%o0,%o0 1.2337 +/* 0x0da0 */ sub %o0,%o1,%o0 1.2338 +/* 0x0da4 */ srax %o0,32,%g4 1.2339 +/* 0x0da8 */ and %o0,%g2,%o1 1.2340 +/* 0x0dac */ st %o1,[%g1+%l2] 1.2341 +/* 0x0db0 */ sllx %o2,2,%o1 1.2342 +/* 0x0db4 */ ble,pt %icc,.L900000644 1.2343 +/* 0x0db8 */ or %g0,%o1,%g1 1.2344 + .L77000224: 1.2345 +/* 0x0dbc */ ret ! Result = 1.2346 +/* 0x0dc0 */ restore %g0,%g0,%g0 1.2347 +/* 0x0dc4 0 */ .type mont_mulf_noconv,2 1.2348 +/* 0x0dc4 */ .size mont_mulf_noconv,(.-mont_mulf_noconv) 1.2349 +