security/nss/lib/freebl/mpi/montmulfv8.s

Thu, 22 Jan 2015 13:21:57 +0100

author
Michael Schloh von Bennewitz <michael@schloh.com>
date
Thu, 22 Jan 2015 13:21:57 +0100
branch
TOR_BUG_9701
changeset 15
b8a032363ba2
permissions
-rw-r--r--

Incorporate requested changes from Mozilla in review:
https://bugzilla.mozilla.org/show_bug.cgi?id=1123480#c6

michael@0 1 !
michael@0 2 ! This Source Code Form is subject to the terms of the Mozilla Public
michael@0 3 ! License, v. 2.0. If a copy of the MPL was not distributed with this
michael@0 4 ! file, You can obtain one at http://mozilla.org/MPL/2.0/.
michael@0 5
/*
 * Read-only double-precision constants shared by the routines in this file.
 * Each constant is emitted as two 32-bit words with the high-order word
 * first.  The C source quoted in the "!" comments further down gives their
 * values as 65536.0, 1.0/65536.0, 0.0, 65536.0*65536.0 and
 * 1.0/(65536.0*65536.0).
 *
 * NOTE(review): every symbol below is declared .global twice, once before
 * and once after its CONSTANT POOL banner.  The repetition looks redundant
 * (presumably harmless compiler output) -- confirm before cleaning it up.
 */
michael@0 6 .section ".text",#alloc,#execinstr
michael@0 7 .file "montmulf.c"
michael@0 8
michael@0 9 .section ".rodata",#alloc
michael@0 10 .global TwoTo16
michael@0 11 .align 8
michael@0 12 !
michael@0 13 ! CONSTANT POOL
michael@0 14 !
michael@0 15 .global TwoTo16
michael@0 16 TwoTo16:
/* 1089470464 = 0x40F00000: high word of the IEEE-754 double 2^16 */
michael@0 17 .word 1089470464
michael@0 18 .word 0
michael@0 19 .type TwoTo16,#object
michael@0 20 .size TwoTo16,8
michael@0 21 .global TwoToMinus16
michael@0 22 !
michael@0 23 ! CONSTANT POOL
michael@0 24 !
michael@0 25 .global TwoToMinus16
michael@0 26 TwoToMinus16:
/* 1055916032 = 0x3EF00000: high word of the IEEE-754 double 2^-16 */
michael@0 27 .word 1055916032
michael@0 28 .word 0
michael@0 29 .type TwoToMinus16,#object
michael@0 30 .size TwoToMinus16,8
michael@0 31 .global Zero
michael@0 32 !
michael@0 33 ! CONSTANT POOL
michael@0 34 !
michael@0 35 .global Zero
michael@0 36 Zero:
/* all-zero bit pattern: the double 0.0 */
michael@0 37 .word 0
michael@0 38 .word 0
michael@0 39 .type Zero,#object
michael@0 40 .size Zero,8
michael@0 41 .global TwoTo32
michael@0 42 !
michael@0 43 ! CONSTANT POOL
michael@0 44 !
michael@0 45 .global TwoTo32
michael@0 46 TwoTo32:
/* 1106247680 = 0x41F00000: high word of the IEEE-754 double 2^32 */
michael@0 47 .word 1106247680
michael@0 48 .word 0
michael@0 49 .type TwoTo32,#object
michael@0 50 .size TwoTo32,8
michael@0 51 .global TwoToMinus32
michael@0 52 !
michael@0 53 ! CONSTANT POOL
michael@0 54 !
michael@0 55 .global TwoToMinus32
michael@0 56 TwoToMinus32:
/* 1039138816 = 0x3DF00000: high word of the IEEE-754 double 2^-32 */
michael@0 57 .word 1039138816
michael@0 58 .word 0
michael@0 59 .type TwoToMinus32,#object
michael@0 60 .size TwoToMinus32,8
michael@0 61
/*
 * conv_d16_to_i32 -- compiled form of the C routine quoted in the "!"
 * comments below (montmulf.c source lines 109-135).
 *
 * Registers after the save: %i0 = i32 (output words), %i1 = d16 (input
 * doubles), %i3 = ilen.  The third argument (%i2, "tmp" in the C prototype)
 * is not referenced anywhere in this routine.
 *
 * Every double is converted with fdtox, written to a stack scratch slot
 * ([%sp+96] .. [%sp+120]) with std and read back with ldx; that store/load
 * pair is how the 64-bit integer result reaches the integer registers here.
 *
 * Working registers in the loops: %g4 = a, %g1 = b, %o4 = running carry (t1),
 * %o7 = i, %o5 = output cursor, %o3 = 0xffffffff mask, %o1 = 0xffff mask.
 */
michael@0 62 .section ".text",#alloc,#execinstr
michael@0 63 /* 000000 0 */ .align 4
michael@0 64 !
michael@0 65 ! SUBROUTINE conv_d16_to_i32
michael@0 66 !
michael@0 67 ! OFFSET SOURCE LINE LABEL INSTRUCTION
michael@0 68
michael@0 69 .global conv_d16_to_i32
michael@0 70 conv_d16_to_i32:
michael@0 71 /* 000000 */ save %sp,-128,%sp
michael@0 72 ! FILE montmulf.c
michael@0 73
michael@0 74 ! 36 !#define RF_INLINE_MACROS
michael@0 75 ! 38 !static const double TwoTo16=65536.0;
michael@0 76 ! 39 !static const double TwoToMinus16=1.0/65536.0;
michael@0 77 ! 40 !static const double Zero=0.0;
michael@0 78 ! 41 !static const double TwoTo32=65536.0*65536.0;
michael@0 79 ! 42 !static const double TwoToMinus32=1.0/(65536.0*65536.0);
michael@0 80 ! 44 !#ifdef RF_INLINE_MACROS
michael@0 81 ! 46 !double upper32(double);
michael@0 82 ! 47 !double lower32(double, double);
michael@0 83 ! 48 !double mod(double, double, double);
michael@0 84 ! 50 !void i16_to_d16_and_d32x4(const double * /*1/(2^16)*/,
michael@0 85 ! 51 ! const double * /* 2^16*/,
michael@0 86 ! 52 ! const double * /* 0 */,
michael@0 87 ! 53 ! double * /*result16*/,
michael@0 88 ! 54 ! double * /* result32 */,
michael@0 89 ! 55 ! float * /*source - should be unsigned int*
michael@0 90 ! 56 ! converted to float* */);
michael@0 91 ! 58 !#else
michael@0 92 ! 60 !static double upper32(double x)
michael@0 93 ! 61 !{
michael@0 94 ! 62 ! return floor(x*TwoToMinus32);
michael@0 95 ! 63 !}
michael@0 96 ! 65 !static double lower32(double x, double y)
michael@0 97 ! 66 !{
michael@0 98 ! 67 ! return x-TwoTo32*floor(x*TwoToMinus32);
michael@0 99 ! 68 !}
michael@0 100 ! 70 !static double mod(double x, double oneoverm, double m)
michael@0 101 ! 71 !{
michael@0 102 ! 72 ! return x-m*floor(x*oneoverm);
michael@0 103 ! 73 !}
michael@0 104 ! 75 !#endif
michael@0 105 ! 78 !static void cleanup(double *dt, int from, int tlen)
michael@0 106 ! 79 !{
michael@0 107 ! 80 ! int i;
michael@0 108 ! 81 ! double tmp,tmp1,x,x1;
michael@0 109 ! 83 ! tmp=tmp1=Zero;
michael@0 110 ! 84 ! /* original code **
michael@0 111 ! 85 ! for(i=2*from;i<2*tlen-2;i++)
michael@0 112 ! 86 ! {
michael@0 113 ! 87 ! x=dt[i];
michael@0 114 ! 88 ! dt[i]=lower32(x,Zero)+tmp1;
michael@0 115 ! 89 ! tmp1=tmp;
michael@0 116 ! 90 ! tmp=upper32(x);
michael@0 117 ! 91 ! }
michael@0 118 ! 92 ! dt[tlen-2]+=tmp1;
michael@0 119 ! 93 ! dt[tlen-1]+=tmp;
michael@0 120 ! 94 ! **end original code ***/
michael@0 121 ! 95 ! /* new code ***/
michael@0 122 ! 96 ! for(i=2*from;i<2*tlen;i+=2)
michael@0 123 ! 97 ! {
michael@0 124 ! 98 ! x=dt[i];
michael@0 125 ! 99 ! x1=dt[i+1];
michael@0 126 ! 100 ! dt[i]=lower32(x,Zero)+tmp;
michael@0 127 ! 101 ! dt[i+1]=lower32(x1,Zero)+tmp1;
michael@0 128 ! 102 ! tmp=upper32(x);
michael@0 129 ! 103 ! tmp1=upper32(x1);
michael@0 130 ! 104 ! }
michael@0 131 ! 105 ! /** end new code **/
michael@0 132 ! 106 !}
michael@0 133 ! 109 !void conv_d16_to_i32(unsigned int *i32, double *d16, long long *tmp, int ilen)
michael@0 134 ! 110 !{
michael@0 135 ! 111 !int i;
michael@0 136 ! 112 !long long t, t1, a, b, c, d;
michael@0 137 ! 114 ! t1=0;
michael@0 138 ! 115 ! a=(long long)d16[0];
michael@0 139
michael@0 140 /* 0x0004 115 */ ldd [%i1],%f0
michael@0 141 /* 0x0008 110 */ or %g0,%i1,%o0
michael@0 142
michael@0 143 ! 116 ! b=(long long)d16[1];
michael@0 144 ! 117 ! for(i=0; i<ilen-1; i++)
michael@0 145
michael@0 146 /* 0x000c 117 */ sub %i3,1,%g2
michael@0 147 /* 0x0010 */ cmp %g2,0
michael@0 148 /* 0x0014 114 */ or %g0,0,%o4
michael@0 149 /* 0x0018 115 */ fdtox %f0,%f0
michael@0 150 /* 0x001c */ std %f0,[%sp+120]
michael@0 151 /* 0x0020 117 */ or %g0,0,%o7
/* NOTE(review): this copy of %i3 into %o1 is overwritten by the sethi three
 * instructions below before %o1 is read, so it has no visible effect. */
michael@0 152 /* 0x0024 110 */ or %g0,%i3,%o1
michael@0 153 /* 0x0028 */ sub %i3,2,%o2
michael@0 154 /* 0x002c 116 */ ldd [%o0+8],%f0
/* %o1 = 0xfc00 + 1023 = 0xffff once the add below completes: mask for b&0xffff */
michael@0 155 /* 0x0030 110 */ sethi %hi(0xfc00),%o1
michael@0 156 /* 0x0034 */ add %o2,1,%g3
michael@0 157 /* 0x0038 */ add %o1,1023,%o1
michael@0 158 /* 0x003c */ or %g0,%i0,%o5
michael@0 159 /* 0x0040 116 */ fdtox %f0,%f0
michael@0 160 /* 0x0044 */ std %f0,[%sp+112]
michael@0 161 /* 0x0048 */ ldx [%sp+112],%g1
michael@0 162 /* 0x004c 115 */ ldx [%sp+120],%g4
/* ilen-1 <= 0: no loop iterations, go straight to the final store.  The
 * delay-slot sethi starts the 0xffff mask that .L900000117 finishes in %g2. */
michael@0 163 /* 0x0050 117 */ ble,pt %icc,.L900000117
michael@0 164 /* 0x0054 */ sethi %hi(0xfc00),%g2
/* -1 followed by srl ...,0 leaves 0x00000000ffffffff in %o3 (mask for &0xffffffff) */
michael@0 165 /* 0x0058 110 */ or %g0,-1,%g2
/* %g3 = ilen-1 is the trip count; fewer than 3 iterations use the simple loop */
michael@0 166 /* 0x005c 117 */ cmp %g3,3
michael@0 167 /* 0x0060 110 */ srl %g2,0,%o3
michael@0 168 /* 0x0064 117 */ bl,pn %icc,.L77000134
michael@0 169 /* 0x0068 */ or %g0,%o0,%g2
michael@0 170
michael@0 171 ! 118 ! {
michael@0 172 ! 119 ! c=(long long)d16[2*i+2];
michael@0 173
/* First iteration, peeled off ahead of the pipelined loop: it stores i32[0]
 * and leaves %o7 = 1. */
michael@0 174 /* 0x006c 119 */ ldd [%o0+16],%f0
michael@0 175
michael@0 176 ! 120 ! t1+=a&0xffffffff;
michael@0 177 ! 121 ! t=(a>>32);
michael@0 178 ! 122 ! d=(long long)d16[2*i+3];
michael@0 179 ! 123 ! t1+=(b&0xffff)<<16;
michael@0 180 ! 124 ! t+=(b>>16)+(t1>>32);
michael@0 181 ! 125 ! i32[i]=t1&0xffffffff;
michael@0 182 ! 126 ! t1=t;
michael@0 183 ! 127 ! a=c;
michael@0 184 ! 128 ! b=d;
michael@0 185
michael@0 186 /* 0x0070 128 */ add %o0,16,%g2
michael@0 187 /* 0x0074 123 */ and %g1,%o1,%o0
michael@0 188 /* 0x0078 */ sllx %o0,16,%g3
michael@0 189 /* 0x007c 120 */ and %g4,%o3,%o0
michael@0 190 /* 0x0080 117 */ add %o0,%g3,%o4
michael@0 191 /* 0x0084 119 */ fdtox %f0,%f0
michael@0 192 /* 0x0088 */ std %f0,[%sp+104]
michael@0 193 /* 0x008c 125 */ and %o4,%o3,%g5
michael@0 194 /* 0x0090 122 */ ldd [%g2+8],%f2
michael@0 195 /* 0x0094 128 */ add %o5,4,%o5
michael@0 196 /* 0x0098 124 */ srax %o4,32,%o4
michael@0 197 /* 0x009c */ stx %o4,[%sp+112]
michael@0 198 /* 0x00a0 122 */ fdtox %f2,%f0
michael@0 199 /* 0x00a4 */ std %f0,[%sp+96]
michael@0 200 /* 0x00a8 124 */ srax %g1,16,%o0
michael@0 201 /* 0x00ac */ ldx [%sp+112],%o7
michael@0 202 /* 0x00b0 121 */ srax %g4,32,%o4
michael@0 203 /* 0x00b4 124 */ add %o0,%o7,%g4
michael@0 204 /* 0x00b8 128 */ or %g0,1,%o7
michael@0 205 /* 0x00bc 119 */ ldx [%sp+104],%g3
michael@0 206 /* 0x00c0 124 */ add %o4,%g4,%o4
michael@0 207 /* 0x00c4 122 */ ldx [%sp+96],%g1
michael@0 208 /* 0x00c8 125 */ st %g5,[%o5-4]
michael@0 209 /* 0x00cc 127 */ or %g0,%g3,%g4
/* Main loop: the conversions of the next pair (c, d) are interleaved with the
 * carry arithmetic on the current a, b.  It repeats while %o7 <= %o2
 * (= ilen-2); the store in the branch delay slot writes the finished word. */
michael@0 210 .L900000112:
michael@0 211 /* 0x00d0 119 */ ldd [%g2+16],%f0
michael@0 212 /* 0x00d4 128 */ add %o7,1,%o7
michael@0 213 /* 0x00d8 */ add %o5,4,%o5
michael@0 214 /* 0x00dc */ cmp %o7,%o2
michael@0 215 /* 0x00e0 */ add %g2,16,%g2
michael@0 216 /* 0x00e4 119 */ fdtox %f0,%f0
michael@0 217 /* 0x00e8 */ std %f0,[%sp+104]
michael@0 218 /* 0x00ec 122 */ ldd [%g2+8],%f0
michael@0 219 /* 0x00f0 */ fdtox %f0,%f0
michael@0 220 /* 0x00f4 */ std %f0,[%sp+96]
michael@0 221 /* 0x00f8 123 */ and %g1,%o1,%g3
michael@0 222 /* 0x00fc */ sllx %g3,16,%g5
michael@0 223 /* 0x0100 120 */ and %g4,%o3,%g3
michael@0 224 /* 0x0104 117 */ add %g3,%g5,%g3
michael@0 225 /* 0x0108 124 */ srax %g1,16,%g1
michael@0 226 /* 0x010c 117 */ add %g3,%o4,%g3
michael@0 227 /* 0x0110 124 */ srax %g3,32,%o4
michael@0 228 /* 0x0114 */ stx %o4,[%sp+112]
michael@0 229 /* 0x0118 119 */ ldx [%sp+104],%g5
michael@0 230 /* 0x011c 121 */ srax %g4,32,%o4
michael@0 231 /* 0x0120 124 */ ldx [%sp+112],%g4
michael@0 232 /* 0x0124 */ add %g1,%g4,%g4
michael@0 233 /* 0x0128 122 */ ldx [%sp+96],%g1
michael@0 234 /* 0x012c 124 */ add %o4,%g4,%o4
michael@0 235 /* 0x0130 125 */ and %g3,%o3,%g3
michael@0 236 /* 0x0134 127 */ or %g0,%g5,%g4
michael@0 237 /* 0x0138 128 */ ble,pt %icc,.L900000112
michael@0 238 /* 0x013c */ st %g3,[%o5-4]
michael@0 239 .L900000115:
michael@0 240 /* 0x0140 128 */ ba .L900000117
michael@0 241 /* 0x0144 */ sethi %hi(0xfc00),%g2
/* Simple loop for short trip counts: one C-loop iteration per pass.  The
 * closing ble,a is annulled, so its delay-slot ldd runs only when the branch
 * is taken. */
michael@0 242 .L77000134:
michael@0 243 /* 0x0148 119 */ ldd [%g2+16],%f0
michael@0 244 .L900000116:
michael@0 245 /* 0x014c 120 */ and %g4,%o3,%o0
michael@0 246 /* 0x0150 123 */ and %g1,%o1,%g3
michael@0 247 /* 0x0154 119 */ fdtox %f0,%f0
michael@0 248 /* 0x0158 120 */ add %o4,%o0,%o0
michael@0 249 /* 0x015c 119 */ std %f0,[%sp+104]
michael@0 250 /* 0x0160 128 */ add %o7,1,%o7
michael@0 251 /* 0x0164 123 */ sllx %g3,16,%o4
michael@0 252 /* 0x0168 122 */ ldd [%g2+24],%f2
michael@0 253 /* 0x016c 128 */ add %g2,16,%g2
michael@0 254 /* 0x0170 123 */ add %o0,%o4,%o0
michael@0 255 /* 0x0174 128 */ cmp %o7,%o2
michael@0 256 /* 0x0178 125 */ and %o0,%o3,%g3
michael@0 257 /* 0x017c 122 */ fdtox %f2,%f0
michael@0 258 /* 0x0180 */ std %f0,[%sp+96]
michael@0 259 /* 0x0184 124 */ srax %o0,32,%o0
michael@0 260 /* 0x0188 */ stx %o0,[%sp+112]
michael@0 261 /* 0x018c 121 */ srax %g4,32,%o4
michael@0 262 /* 0x0190 122 */ ldx [%sp+96],%o0
michael@0 263 /* 0x0194 124 */ srax %g1,16,%g5
michael@0 264 /* 0x0198 */ ldx [%sp+112],%g4
michael@0 265 /* 0x019c 119 */ ldx [%sp+104],%g1
michael@0 266 /* 0x01a0 125 */ st %g3,[%o5]
michael@0 267 /* 0x01a4 124 */ add %g5,%g4,%g4
michael@0 268 /* 0x01a8 128 */ add %o5,4,%o5
michael@0 269 /* 0x01ac 124 */ add %o4,%g4,%o4
michael@0 270 /* 0x01b0 127 */ or %g0,%g1,%g4
michael@0 271 /* 0x01b4 128 */ or %g0,%o0,%g1
michael@0 272 /* 0x01b8 */ ble,a,pt %icc,.L900000116
michael@0 273 /* 0x01bc */ ldd [%g2+16],%f0
michael@0 274 .L77000127:
michael@0 275
michael@0 276 ! 129 ! }
michael@0 277 ! 130 ! t1+=a&0xffffffff;
michael@0 278 ! 131 ! t=(a>>32);
michael@0 279 ! 132 ! t1+=(b&0xffff)<<16;
michael@0 280 ! 133 ! i32[i]=t1&0xffffffff;
michael@0 281
michael@0 282 /* 0x01c0 133 */ sethi %hi(0xfc00),%g2
/* Common tail (C source lines 130-133): rebuild both masks in %g2/%g3, fold
 * the last a (%g4) and b (%g1) into the carry in %o4, and store the low 32
 * bits at byte offset %o7*4 from i32. */
michael@0 283 .L900000117:
michael@0 284 /* 0x01c4 133 */ or %g0,-1,%g3
michael@0 285 /* 0x01c8 */ add %g2,1023,%g2
michael@0 286 /* 0x01cc */ srl %g3,0,%g3
michael@0 287 /* 0x01d0 */ and %g1,%g2,%g2
michael@0 288 /* 0x01d4 */ and %g4,%g3,%g4
michael@0 289 /* 0x01d8 */ sllx %g2,16,%g2
michael@0 290 /* 0x01dc */ add %o4,%g4,%g4
michael@0 291 /* 0x01e0 */ add %g4,%g2,%g2
michael@0 292 /* 0x01e4 */ sll %o7,2,%g4
michael@0 293 /* 0x01e8 */ and %g2,%g3,%g2
michael@0 294 /* 0x01ec */ st %g2,[%i0+%g4]
michael@0 295 /* 0x01f0 */ ret ! Result =
michael@0 296 /* 0x01f4 */ restore %g0,%g0,%g0
michael@0 297 /* 0x01f8 0 */ .type conv_d16_to_i32,2
michael@0 298 /* 0x01f8 */ .size conv_d16_to_i32,(.-conv_d16_to_i32)
michael@0 299
/*
 * conv_i32_to_d32 -- leaf routine (no save; returns with retl) implementing
 * the C loop quoted below: d32[i] = (double) i32[i] for 0 <= i < len.
 * Arguments: %o0 = d32 (output doubles), %o1 = i32 (input words), %o2 = len.
 *
 * No integer-to-double instruction is used.  The local constant
 * 1127219200,0 is the word pair 0x43300000:0x00000000, i.e. the double 2^52.
 * An input word is loaded into the odd (low-order) register of an FP pair,
 * fmovs copies the constant's high word into the even register, and the
 * pair then holds 2^52 + x; the fsubd against the constant leaves x.
 */
michael@0 300 .section ".text",#alloc,#execinstr
michael@0 301 /* 000000 0 */ .align 8
michael@0 302 !
michael@0 303 ! CONSTANT POOL
michael@0 304 !
michael@0 305 .L_const_seg_900000201:
michael@0 306 /* 000000 0 */ .word 1127219200,0
michael@0 307 /* 0x0008 0 */ .align 4
michael@0 308 /* 0x0008 */ .skip 16
michael@0 309 !
michael@0 310 ! SUBROUTINE conv_i32_to_d32
michael@0 311 !
michael@0 312 ! OFFSET SOURCE LINE LABEL INSTRUCTION
michael@0 313
michael@0 314 .global conv_i32_to_d32
michael@0 315 conv_i32_to_d32:
/* keep the return address: the call below overwrites %o7 */
michael@0 316 /* 000000 */ or %g0,%o7,%g2
michael@0 317
michael@0 318 ! 135 !}
michael@0 319 ! 137 !void conv_i32_to_d32(double *d32, unsigned int *i32, int len)
michael@0 320 ! 138 !{
michael@0 321 ! 139 !int i;
michael@0 322 ! 141 !#pragma pipeloop(0)
michael@0 323 ! 142 ! for(i=0;i<len;i++) d32[i]=(double)(i32[i]);
michael@0 324
michael@0 325 /* 0x0004 142 */ cmp %o2,0
/* call .+8 leaves the current PC in %o7; added to the sethi/add offset it
 * yields the _GLOBAL_OFFSET_TABLE_ address in %g1 */
michael@0 326 .L900000210:
michael@0 327 /* 0x0008 */ call .+8
michael@0 328 /* 0x000c */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000210-.)),%g4
michael@0 329 /* 0x0010 142 */ or %g0,0,%o5
michael@0 330 /* 0x0014 138 */ add %g4,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000210-.)),%g4
michael@0 331 /* 0x0018 */ or %g0,%o0,%g5
michael@0 332 /* 0x001c */ add %g4,%o7,%g1
/* len <= 0: nothing to do.  The delay slot restores the saved return address
 * into %o7 on both paths. */
michael@0 333 /* 0x0020 142 */ ble,pt %icc,.L77000140
michael@0 334 /* 0x0024 */ or %g0,%g2,%o7
michael@0 335 /* 0x0028 */ sethi %hi(.L_const_seg_900000201),%g2
michael@0 336 /* 0x002c 138 */ or %g0,%o1,%g4
michael@0 337 /* 0x0030 142 */ add %g2,%lo(.L_const_seg_900000201),%g2
michael@0 338 /* 0x0034 */ sub %o2,1,%g3
/* fetch the constant's address through the table, then (delay slot below)
 * load 2^52 into %f8:%f9 */
michael@0 339 /* 0x0038 */ ld [%g1+%g2],%g2
/* fewer than 9 elements: use the one-at-a-time loop only */
michael@0 340 /* 0x003c */ cmp %o2,9
michael@0 341 /* 0x0040 */ bl,pn %icc,.L77000144
michael@0 342 /* 0x0044 */ ldd [%g2],%f8
michael@0 343 /* 0x0048 */ add %o1,16,%g4
michael@0 344 /* 0x004c */ sub %o2,5,%g1
michael@0 345 /* 0x0050 */ ld [%o1],%f7
michael@0 346 /* 0x0054 */ or %g0,4,%o5
michael@0 347 /* 0x0058 */ ld [%o1+4],%f5
michael@0 348 /* 0x005c */ ld [%o1+8],%f3
michael@0 349 /* 0x0060 */ fmovs %f8,%f6
michael@0 350 /* 0x0064 */ ld [%o1+12],%f1
/* Unrolled loop: five elements per pass (index +5, input +20 bytes, output
 * +40 bytes), repeated while the index in %o5 is <= len-5 (%g1). */
michael@0 351 .L900000205:
michael@0 352 /* 0x0068 */ ld [%g4],%f11
michael@0 353 /* 0x006c */ add %o5,5,%o5
michael@0 354 /* 0x0070 */ add %g4,20,%g4
michael@0 355 /* 0x0074 */ fsubd %f6,%f8,%f6
michael@0 356 /* 0x0078 */ std %f6,[%g5]
michael@0 357 /* 0x007c */ cmp %o5,%g1
michael@0 358 /* 0x0080 */ add %g5,40,%g5
michael@0 359 /* 0x0084 */ fmovs %f8,%f4
michael@0 360 /* 0x0088 */ ld [%g4-16],%f7
michael@0 361 /* 0x008c */ fsubd %f4,%f8,%f12
michael@0 362 /* 0x0090 */ fmovs %f8,%f2
michael@0 363 /* 0x0094 */ std %f12,[%g5-32]
michael@0 364 /* 0x0098 */ ld [%g4-12],%f5
michael@0 365 /* 0x009c */ fsubd %f2,%f8,%f12
michael@0 366 /* 0x00a0 */ fmovs %f8,%f0
michael@0 367 /* 0x00a4 */ std %f12,[%g5-24]
michael@0 368 /* 0x00a8 */ ld [%g4-8],%f3
michael@0 369 /* 0x00ac */ fsubd %f0,%f8,%f12
michael@0 370 /* 0x00b0 */ fmovs %f8,%f10
michael@0 371 /* 0x00b4 */ std %f12,[%g5-16]
michael@0 372 /* 0x00b8 */ ld [%g4-4],%f1
michael@0 373 /* 0x00bc */ fsubd %f10,%f8,%f10
michael@0 374 /* 0x00c0 */ fmovs %f8,%f6
michael@0 375 /* 0x00c4 */ ble,pt %icc,.L900000205
michael@0 376 /* 0x00c8 */ std %f10,[%g5-8]
/* Drain: convert and store the four words already loaded into %f7, %f5, %f3
 * and %f1, then exit if the index has passed len-1 (%g3). */
michael@0 377 .L900000208:
michael@0 378 /* 0x00cc */ fmovs %f8,%f4
michael@0 379 /* 0x00d0 */ add %g5,32,%g5
michael@0 380 /* 0x00d4 */ cmp %o5,%g3
michael@0 381 /* 0x00d8 */ fmovs %f8,%f2
michael@0 382 /* 0x00dc */ fmovs %f8,%f0
michael@0 383 /* 0x00e0 */ fsubd %f6,%f8,%f6
michael@0 384 /* 0x00e4 */ std %f6,[%g5-32]
michael@0 385 /* 0x00e8 */ fsubd %f4,%f8,%f4
michael@0 386 /* 0x00ec */ std %f4,[%g5-24]
michael@0 387 /* 0x00f0 */ fsubd %f2,%f8,%f2
michael@0 388 /* 0x00f4 */ std %f2,[%g5-16]
michael@0 389 /* 0x00f8 */ fsubd %f0,%f8,%f0
michael@0 390 /* 0x00fc */ bg,pn %icc,.L77000140
michael@0 391 /* 0x0100 */ std %f0,[%g5-8]
/* One-at-a-time loop: reloads the constant each pass and converts a single
 * word; the annulled branch's delay slot preloads the next input word. */
michael@0 392 .L77000144:
michael@0 393 /* 0x0104 */ ld [%g4],%f1
michael@0 394 .L900000211:
michael@0 395 /* 0x0108 */ ldd [%g2],%f8
michael@0 396 /* 0x010c */ add %o5,1,%o5
michael@0 397 /* 0x0110 */ add %g4,4,%g4
michael@0 398 /* 0x0114 */ cmp %o5,%g3
michael@0 399 /* 0x0118 */ fmovs %f8,%f0
michael@0 400 /* 0x011c */ fsubd %f0,%f8,%f0
michael@0 401 /* 0x0120 */ std %f0,[%g5]
michael@0 402 /* 0x0124 */ add %g5,8,%g5
michael@0 403 /* 0x0128 */ ble,a,pt %icc,.L900000211
michael@0 404 /* 0x012c */ ld [%g4],%f1
michael@0 405 .L77000140:
michael@0 406 /* 0x0130 */ retl ! Result =
michael@0 407 /* 0x0134 */ nop
michael@0 408 /* 0x0138 0 */ .type conv_i32_to_d32,2
michael@0 409 /* 0x0138 */ .size conv_i32_to_d32,(.-conv_i32_to_d32)
michael@0 410
/*
 * conv_i32_to_d16 -- implements the C loop quoted below: every input word a
 * produces two doubles, d16[2*i] = a & 0xffff and d16[2*i+1] = a >> 16.
 * Registers after the save: %i0 = d16 (output), %i1 = i32 (input),
 * %i2 = len.
 *
 * Each 16-bit half is written to a stack scratch word ([%sp+96] for the low
 * half, [%sp+92] for the high half) and reloaded into %f3, the low-order
 * register of the pair %f2:%f3.  fmovs copies the high word of the local
 * constant (1127219200,0 = 0x43300000:0, the double 2^52) into %f2, and
 * fsubd then subtracts 2^52 to leave the value as a double.
 */
michael@0 411 .section ".text",#alloc,#execinstr
michael@0 412 /* 000000 0 */ .align 8
michael@0 413 !
michael@0 414 ! CONSTANT POOL
michael@0 415 !
michael@0 416 .L_const_seg_900000301:
michael@0 417 /* 000000 0 */ .word 1127219200,0
michael@0 418 /* 0x0008 0 */ .align 4
michael@0 419 !
michael@0 420 ! SUBROUTINE conv_i32_to_d16
michael@0 421 !
michael@0 422 ! OFFSET SOURCE LINE LABEL INSTRUCTION
michael@0 423
michael@0 424 .global conv_i32_to_d16
michael@0 425 conv_i32_to_d16:
michael@0 426 /* 000000 */ save %sp,-104,%sp
michael@0 427 /* 0x0004 */ or %g0,%i2,%o0
michael@0 428
michael@0 429 ! 143 !}
michael@0 430 ! 146 !void conv_i32_to_d16(double *d16, unsigned int *i32, int len)
michael@0 431 ! 147 !{
michael@0 432 ! 148 !int i;
michael@0 433 ! 149 !unsigned int a;
michael@0 434 ! 151 !#pragma pipeloop(0)
michael@0 435 ! 152 ! for(i=0;i<len;i++)
michael@0 436 ! 153 ! {
michael@0 437 ! 154 ! a=i32[i];
michael@0 438 ! 155 ! d16[2*i]=(double)(a&0xffff);
michael@0 439 ! 156 ! d16[2*i+1]=(double)(a>>16);
michael@0 440
michael@0 441 /* 0x0008 156 */ sethi %hi(.L_const_seg_900000301),%g2
/* call .+8 leaves the current PC in %o7; with the sethi/add offset it gives
 * the _GLOBAL_OFFSET_TABLE_ address in %o2 */
michael@0 442 .L900000310:
michael@0 443 /* 0x000c */ call .+8
michael@0 444 /* 0x0010 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000310-.)),%g3
michael@0 445 /* 0x0014 152 */ cmp %o0,0
michael@0 446 /* 0x0018 147 */ add %g3,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000310-.)),%g3
/* len <= 0: return immediately */
michael@0 447 /* 0x001c 152 */ ble,pt %icc,.L77000150
michael@0 448 /* 0x0020 */ add %g3,%o7,%o2
michael@0 449 /* 0x0024 */ sub %i2,1,%o5
michael@0 450 /* 0x0028 156 */ add %g2,%lo(.L_const_seg_900000301),%o1
/* %o4 = 0xfc00 + 1023 = 0xffff once the add further down completes */
michael@0 451 /* 0x002c 152 */ sethi %hi(0xfc00),%o0
/* %o3 = address of the 2^52 constant, fetched through the table */
michael@0 452 /* 0x0030 */ ld [%o2+%o1],%o3
michael@0 453 /* 0x0034 */ add %o5,1,%g2
michael@0 454 /* 0x0038 */ or %g0,0,%g1
/* %g2 = len here; fewer than 3 elements take the simple loop */
michael@0 455 /* 0x003c */ cmp %g2,3
michael@0 456 /* 0x0040 */ or %g0,%i1,%o7
michael@0 457 /* 0x0044 */ add %o0,1023,%o4
michael@0 458 /* 0x0048 */ or %g0,%i0,%g3
michael@0 459 /* 0x004c */ bl,pn %icc,.L77000154
michael@0 460 /* 0x0050 */ add %o7,4,%o0
michael@0 461 /* 0x0054 155 */ ldd [%o3],%f0
michael@0 462 /* 0x0058 156 */ or %g0,1,%g1
michael@0 463 /* 0x005c 154 */ ld [%o0-4],%o1
michael@0 464 /* 0x0060 0 */ or %g0,%o0,%o7
michael@0 465 /* 0x0064 155 */ and %o1,%o4,%o0
/* Pipelined loop: converts the current word's two halves while loading and
 * masking the next word; repeats while %g1 <= len-1 (%o5). */
michael@0 466 .L900000306:
michael@0 467 /* 0x0068 155 */ st %o0,[%sp+96]
michael@0 468 /* 0x006c 156 */ add %g1,1,%g1
michael@0 469 /* 0x0070 */ add %g3,16,%g3
michael@0 470 /* 0x0074 */ cmp %g1,%o5
michael@0 471 /* 0x0078 */ add %o7,4,%o7
michael@0 472 /* 0x007c 155 */ ld [%sp+96],%f3
michael@0 473 /* 0x0080 */ fmovs %f0,%f2
michael@0 474 /* 0x0084 */ fsubd %f2,%f0,%f2
michael@0 475 /* 0x0088 156 */ srl %o1,16,%o0
michael@0 476 /* 0x008c 155 */ std %f2,[%g3-16]
michael@0 477 /* 0x0090 156 */ st %o0,[%sp+92]
michael@0 478 /* 0x0094 */ ld [%sp+92],%f3
michael@0 479 /* 0x0098 154 */ ld [%o7-4],%o1
michael@0 480 /* 0x009c 156 */ fmovs %f0,%f2
michael@0 481 /* 0x00a0 */ fsubd %f2,%f0,%f2
michael@0 482 /* 0x00a4 155 */ and %o1,%o4,%o0
michael@0 483 /* 0x00a8 156 */ ble,pt %icc,.L900000306
michael@0 484 /* 0x00ac */ std %f2,[%g3-8]
/* Drain: convert and store the last word already held in %o1/%o0, then return. */
michael@0 485 .L900000309:
michael@0 486 /* 0x00b0 155 */ st %o0,[%sp+96]
michael@0 487 /* 0x00b4 */ fmovs %f0,%f2
michael@0 488 /* 0x00b8 156 */ add %g3,16,%g3
michael@0 489 /* 0x00bc */ srl %o1,16,%o0
michael@0 490 /* 0x00c0 155 */ ld [%sp+96],%f3
michael@0 491 /* 0x00c4 */ fsubd %f2,%f0,%f2
michael@0 492 /* 0x00c8 */ std %f2,[%g3-16]
michael@0 493 /* 0x00cc 156 */ st %o0,[%sp+92]
michael@0 494 /* 0x00d0 */ fmovs %f0,%f2
michael@0 495 /* 0x00d4 */ ld [%sp+92],%f3
michael@0 496 /* 0x00d8 */ fsubd %f2,%f0,%f0
michael@0 497 /* 0x00dc */ std %f0,[%g3-8]
michael@0 498 /* 0x00e0 */ ret ! Result =
michael@0 499 /* 0x00e4 */ restore %g0,%g0,%g0
/* Simple loop: one word per pass, reloading the constant each time; the
 * annulled branch's delay slot fetches the next word only when looping. */
michael@0 500 .L77000154:
michael@0 501 /* 0x00e8 154 */ ld [%o7],%o0
michael@0 502 .L900000311:
michael@0 503 /* 0x00ec 155 */ and %o0,%o4,%o1
michael@0 504 /* 0x00f0 */ st %o1,[%sp+96]
michael@0 505 /* 0x00f4 156 */ add %g1,1,%g1
michael@0 506 /* 0x00f8 155 */ ldd [%o3],%f0
michael@0 507 /* 0x00fc 156 */ srl %o0,16,%o0
michael@0 508 /* 0x0100 */ add %o7,4,%o7
michael@0 509 /* 0x0104 */ cmp %g1,%o5
michael@0 510 /* 0x0108 155 */ fmovs %f0,%f2
michael@0 511 /* 0x010c */ ld [%sp+96],%f3
michael@0 512 /* 0x0110 */ fsubd %f2,%f0,%f2
michael@0 513 /* 0x0114 */ std %f2,[%g3]
michael@0 514 /* 0x0118 156 */ st %o0,[%sp+92]
michael@0 515 /* 0x011c */ fmovs %f0,%f2
michael@0 516 /* 0x0120 */ ld [%sp+92],%f3
michael@0 517 /* 0x0124 */ fsubd %f2,%f0,%f0
michael@0 518 /* 0x0128 */ std %f0,[%g3+8]
michael@0 519 /* 0x012c */ add %g3,16,%g3
michael@0 520 /* 0x0130 */ ble,a,pt %icc,.L900000311
michael@0 521 /* 0x0134 */ ld [%o7],%o0
michael@0 522 .L77000150:
michael@0 523 /* 0x0138 */ ret ! Result =
michael@0 524 /* 0x013c */ restore %g0,%g0,%g0
michael@0 525 /* 0x0140 0 */ .type conv_i32_to_d16,2
michael@0 526 /* 0x0140 */ .size conv_i32_to_d16,(.-conv_i32_to_d16)
michael@0 527
/*
 * conv_i32_to_d32_and_d16 -- for every input word writes one double to d32
 * (the whole word) and two doubles to d16 (low 16 bits, then high 16 bits),
 * following the C source quoted below.
 * Registers after the save: %i0 = d32, %i1 = d16, %i2 = i32, %i3 = len.
 *
 * Two phases:
 *   1. .L900000417 handles four words per pass while i < len-3.  It appears
 *      to be the inlined body of i16_to_d16_and_d32x4 named in the quoted C
 *      source -- confirm against that macro's definition.
 *   2. The remainder (C source lines 175-181) is handled by .L900000411 (two
 *      words per pass) and .L900000416 (one word per pass), using the 2^52
 *      constant (1127219200,0 = 0x43300000:0) with the fmovs/fsubd
 *      conversion.
 */
michael@0 528 .section ".text",#alloc,#execinstr
michael@0 529 /* 000000 0 */ .align 8
michael@0 530 !
michael@0 531 ! CONSTANT POOL
michael@0 532 !
michael@0 533 .L_const_seg_900000401:
michael@0 534 /* 000000 0 */ .word 1127219200,0
michael@0 535 /* 0x0008 0 */ .align 4
michael@0 536 /* 0x0008 */ .skip 16
michael@0 537 !
michael@0 538 ! SUBROUTINE conv_i32_to_d32_and_d16
michael@0 539 !
michael@0 540 ! OFFSET SOURCE LINE LABEL INSTRUCTION
michael@0 541
michael@0 542 .global conv_i32_to_d32_and_d16
michael@0 543 conv_i32_to_d32_and_d16:
michael@0 544 /* 000000 */ save %sp,-120,%sp
/* call .+8 leaves the current PC in %o7; with the sethi/add offset it gives
 * the _GLOBAL_OFFSET_TABLE_ address, kept in %o4 */
michael@0 545 .L900000415:
michael@0 546 /* 0x0004 */ call .+8
michael@0 547 /* 0x0008 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000415-.)),%g4
michael@0 548
michael@0 549 ! 157 ! }
michael@0 550 ! 158 !}
michael@0 551 ! 161 !void conv_i32_to_d32_and_d16(double *d32, double *d16,
michael@0 552 ! 162 ! unsigned int *i32, int len)
michael@0 553 ! 163 !{
michael@0 554 ! 164 !int i = 0;
michael@0 555 ! 165 !unsigned int a;
michael@0 556 ! 167 !#pragma pipeloop(0)
michael@0 557 ! 168 !#ifdef RF_INLINE_MACROS
michael@0 558 ! 169 ! for(;i<len-3;i+=4)
michael@0 559
michael@0 560 /* 0x000c 169 */ sub %i3,3,%g2
michael@0 561 /* 0x0010 */ cmp %g2,0
michael@0 562 /* 0x0014 163 */ add %g4,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000415-.)),%g4
michael@0 563
michael@0 564 ! 170 ! {
michael@0 565 ! 171 ! i16_to_d16_and_d32x4(&TwoToMinus16, &TwoTo16, &Zero,
michael@0 566 ! 172 ! &(d16[2*i]), &(d32[i]), (float *)(&(i32[i])));
michael@0 567
/* Fetch the addresses of the three global constants through the table:
 * %o1 = &Zero, %o3 = &TwoToMinus16, %o2 = &TwoTo16. */
michael@0 568 /* 0x0018 172 */ sethi %hi(Zero),%g2
michael@0 569 /* 0x001c 163 */ add %g4,%o7,%o4
michael@0 570 /* 0x0020 172 */ add %g2,%lo(Zero),%g2
michael@0 571 /* 0x0024 */ sethi %hi(TwoToMinus16),%g3
michael@0 572 /* 0x0028 */ ld [%o4+%g2],%o1
michael@0 573 /* 0x002c */ sethi %hi(TwoTo16),%g4
michael@0 574 /* 0x0030 */ add %g3,%lo(TwoToMinus16),%g2
michael@0 575 /* 0x0034 */ ld [%o4+%g2],%o3
michael@0 576 /* 0x0038 164 */ or %g0,0,%g5
michael@0 577 /* 0x003c 172 */ add %g4,%lo(TwoTo16),%g3
michael@0 578 /* 0x0040 */ ld [%o4+%g3],%o2
michael@0 579 /* 0x0044 163 */ or %g0,%i0,%i4
michael@0 580 /* 0x0048 169 */ or %g0,%i2,%o7
/* len-3 <= 0: skip the four-at-a-time loop.  The delay-slot cmp sets the
 * condition codes tested by the bge at .L900000418. */
michael@0 581 /* 0x004c */ ble,pt %icc,.L900000418
michael@0 582 /* 0x0050 */ cmp %g5,%i3
michael@0 583 /* 0x0054 172 */ stx %o7,[%sp+104]
michael@0 584 /* 0x0058 169 */ sub %i3,4,%o5
michael@0 585 /* 0x005c */ or %g0,0,%g4
michael@0 586 /* 0x0060 */ or %g0,0,%g1
/*
 * Four words per pass.  For each word x:
 *   - Zero is copied into an FP pair and x is loaded into its low-order
 *     register, forming the 64-bit integer x; fxtod turns it into a double,
 *     which is stored to d32.
 *   - x * TwoToMinus16 goes through fdtox then fxtod, which drops the
 *     fraction and leaves the high 16 bits as a double (stored at the odd
 *     d16 slots: %g3+8, +24, +40, +56).
 *   - That value * TwoTo16 is subtracted from x, leaving the low 16 bits
 *     (stored at the even d16 slots: [%i1+%g1], %g3+16, +32, +48).
 * The input pointer in %o7 is passed through stack slots [%sp+104] and
 * [%sp+112] between passes.
 */
michael@0 587 .L900000417:
michael@0 588 /* 0x0064 */ ldd [%o1],%f2
michael@0 589 /* 0x0068 172 */ add %i4,%g4,%g2
michael@0 590 /* 0x006c */ add %i1,%g1,%g3
michael@0 591 /* 0x0070 */ ldd [%o3],%f0
michael@0 592 /* 0x0074 */ add %g5,4,%g5
michael@0 593 /* 0x0078 */ fmovd %f2,%f14
michael@0 594 /* 0x007c */ ld [%o7],%f15
michael@0 595 /* 0x0080 */ cmp %g5,%o5
michael@0 596 /* 0x0084 */ fmovd %f2,%f10
michael@0 597 /* 0x0088 */ ld [%o7+4],%f11
michael@0 598 /* 0x008c */ add %o7,16,%o7
michael@0 599 /* 0x0090 */ ldx [%sp+104],%o0
michael@0 600 /* 0x0094 */ fmovd %f2,%f6
michael@0 601 /* 0x0098 */ stx %o7,[%sp+112]
michael@0 602 /* 0x009c */ fxtod %f14,%f14
michael@0 603 /* 0x00a0 */ ld [%o0+8],%f7
michael@0 604 /* 0x00a4 */ fxtod %f10,%f10
michael@0 605 /* 0x00a8 */ ld [%o0+12],%f3
michael@0 606 /* 0x00ac */ fxtod %f6,%f6
michael@0 607 /* 0x00b0 */ ldd [%o2],%f16
michael@0 608 /* 0x00b4 */ fmuld %f0,%f14,%f12
michael@0 609 /* 0x00b8 */ fxtod %f2,%f2
michael@0 610 /* 0x00bc */ fmuld %f0,%f10,%f8
michael@0 611 /* 0x00c0 */ std %f14,[%i4+%g4]
michael@0 612 /* 0x00c4 */ ldx [%sp+112],%o7
michael@0 613 /* 0x00c8 */ add %g4,32,%g4
michael@0 614 /* 0x00cc */ fmuld %f0,%f6,%f4
michael@0 615 /* 0x00d0 */ fdtox %f12,%f12
michael@0 616 /* 0x00d4 */ std %f10,[%g2+8]
michael@0 617 /* 0x00d8 */ fmuld %f0,%f2,%f0
michael@0 618 /* 0x00dc */ fdtox %f8,%f8
michael@0 619 /* 0x00e0 */ std %f6,[%g2+16]
michael@0 620 /* 0x00e4 */ std %f2,[%g2+24]
michael@0 621 /* 0x00e8 */ fdtox %f4,%f4
michael@0 622 /* 0x00ec */ fdtox %f0,%f0
michael@0 623 /* 0x00f0 */ fxtod %f12,%f12
michael@0 624 /* 0x00f4 */ std %f12,[%g3+8]
michael@0 625 /* 0x00f8 */ fxtod %f8,%f8
michael@0 626 /* 0x00fc */ std %f8,[%g3+24]
michael@0 627 /* 0x0100 */ fxtod %f4,%f4
michael@0 628 /* 0x0104 */ std %f4,[%g3+40]
michael@0 629 /* 0x0108 */ fxtod %f0,%f0
michael@0 630 /* 0x010c */ std %f0,[%g3+56]
michael@0 631 /* 0x0110 */ fmuld %f12,%f16,%f12
michael@0 632 /* 0x0114 */ fmuld %f8,%f16,%f8
michael@0 633 /* 0x0118 */ fmuld %f4,%f16,%f4
michael@0 634 /* 0x011c */ fsubd %f14,%f12,%f12
michael@0 635 /* 0x0120 */ std %f12,[%i1+%g1]
michael@0 636 /* 0x0124 */ fmuld %f0,%f16,%f0
michael@0 637 /* 0x0128 */ fsubd %f10,%f8,%f8
michael@0 638 /* 0x012c */ std %f8,[%g3+16]
michael@0 639 /* 0x0130 */ add %g1,64,%g1
michael@0 640 /* 0x0134 */ fsubd %f6,%f4,%f4
michael@0 641 /* 0x0138 */ std %f4,[%g3+32]
michael@0 642 /* 0x013c */ fsubd %f2,%f0,%f0
michael@0 643 /* 0x0140 */ std %f0,[%g3+48]
michael@0 644 /* 0x0144 */ ble,a,pt %icc,.L900000417
michael@0 645 /* 0x0148 */ stx %o7,[%sp+104]
michael@0 646 .L77000159:
michael@0 647
michael@0 648 ! 173 ! }
michael@0 649 ! 174 !#endif
michael@0 650 ! 175 ! for(;i<len;i++)
michael@0 651
michael@0 652 /* 0x014c 175 */ cmp %g5,%i3
/* i >= len: nothing left for the remainder loops */
michael@0 653 .L900000418:
michael@0 654 /* 0x0150 175 */ bge,pt %icc,.L77000164
michael@0 655 /* 0x0154 */ nop
michael@0 656
michael@0 657 ! 176 ! {
michael@0 658 ! 177 ! a=i32[i];
michael@0 659 ! 178 ! d32[i]=(double)(i32[i]);
michael@0 660 ! 179 ! d16[2*i]=(double)(a&0xffff);
michael@0 661 ! 180 ! d16[2*i+1]=(double)(a>>16);
michael@0 662
/* Remainder setup: %o2 = address of the 2^52 constant (via the table base in
 * %o4, which is then reused for the 0xffff mask), %o0 = &i32[i],
 * %o3 = &d32[i], %o5 = &d16[2*i], %o1 = len-1, %g3 = len-i. */
michael@0 663 /* 0x0158 180 */ sethi %hi(.L_const_seg_900000401),%g2
michael@0 664 /* 0x015c */ add %g2,%lo(.L_const_seg_900000401),%o1
michael@0 665 /* 0x0160 175 */ sethi %hi(0xfc00),%o0
michael@0 666 /* 0x0164 */ ld [%o4+%o1],%o2
michael@0 667 /* 0x0168 */ sll %g5,2,%o3
michael@0 668 /* 0x016c */ sub %i3,%g5,%g3
michael@0 669 /* 0x0170 */ sll %g5,3,%g2
michael@0 670 /* 0x0174 */ add %o0,1023,%o4
michael@0 671 /* 0x0178 178 */ ldd [%o2],%f0
michael@0 672 /* 0x017c */ add %i2,%o3,%o0
/* fewer than 3 words left: use the one-at-a-time loop */
michael@0 673 /* 0x0180 175 */ cmp %g3,3
michael@0 674 /* 0x0184 */ add %i4,%g2,%o3
michael@0 675 /* 0x0188 */ sub %i3,1,%o1
michael@0 676 /* 0x018c */ sll %g5,4,%g4
michael@0 677 /* 0x0190 */ bl,pn %icc,.L77000161
michael@0 678 /* 0x0194 */ add %i1,%g4,%o5
/* First remaining word, peeled ahead of the two-per-pass loop.  The word is
 * loaded twice: into %f3 for the d32 conversion and into %o7 for the 16-bit
 * split. */
michael@0 679 /* 0x0198 178 */ ld [%o0],%f3
michael@0 680 /* 0x019c 180 */ add %o3,8,%o3
michael@0 681 /* 0x01a0 177 */ ld [%o0],%o7
michael@0 682 /* 0x01a4 180 */ add %o5,16,%o5
michael@0 683 /* 0x01a8 */ add %g5,1,%g5
michael@0 684 /* 0x01ac 178 */ fmovs %f0,%f2
michael@0 685 /* 0x01b0 180 */ add %o0,4,%o0
michael@0 686 /* 0x01b4 179 */ and %o7,%o4,%g1
michael@0 687 /* 0x01b8 178 */ fsubd %f2,%f0,%f2
michael@0 688 /* 0x01bc */ std %f2,[%o3-8]
michael@0 689 /* 0x01c0 180 */ srl %o7,16,%o7
michael@0 690 /* 0x01c4 179 */ st %g1,[%sp+96]
michael@0 691 /* 0x01c8 */ fmovs %f0,%f2
michael@0 692 /* 0x01cc */ ld [%sp+96],%f3
michael@0 693 /* 0x01d0 */ fsubd %f2,%f0,%f2
michael@0 694 /* 0x01d4 */ std %f2,[%o5-16]
michael@0 695 /* 0x01d8 180 */ st %o7,[%sp+92]
michael@0 696 /* 0x01dc */ fmovs %f0,%f2
michael@0 697 /* 0x01e0 */ ld [%sp+92],%f3
michael@0 698 /* 0x01e4 */ fsubd %f2,%f0,%f2
michael@0 699 /* 0x01e8 */ std %f2,[%o5-8]
/* Two words per pass, repeated while the index in %g5 is < len-1 (%o1). */
michael@0 700 .L900000411:
michael@0 701 /* 0x01ec 178 */ ld [%o0],%f3
michael@0 702 /* 0x01f0 180 */ add %g5,2,%g5
michael@0 703 /* 0x01f4 */ add %o5,32,%o5
michael@0 704 /* 0x01f8 177 */ ld [%o0],%o7
michael@0 705 /* 0x01fc 180 */ cmp %g5,%o1
michael@0 706 /* 0x0200 */ add %o3,16,%o3
michael@0 707 /* 0x0204 178 */ fmovs %f0,%f2
michael@0 708 /* 0x0208 */ fsubd %f2,%f0,%f2
michael@0 709 /* 0x020c */ std %f2,[%o3-16]
michael@0 710 /* 0x0210 179 */ and %o7,%o4,%g1
michael@0 711 /* 0x0214 */ st %g1,[%sp+96]
michael@0 712 /* 0x0218 */ ld [%sp+96],%f3
michael@0 713 /* 0x021c */ fmovs %f0,%f2
michael@0 714 /* 0x0220 */ fsubd %f2,%f0,%f2
michael@0 715 /* 0x0224 180 */ srl %o7,16,%o7
michael@0 716 /* 0x0228 179 */ std %f2,[%o5-32]
michael@0 717 /* 0x022c 180 */ st %o7,[%sp+92]
michael@0 718 /* 0x0230 */ ld [%sp+92],%f3
michael@0 719 /* 0x0234 */ fmovs %f0,%f2
michael@0 720 /* 0x0238 */ fsubd %f2,%f0,%f2
michael@0 721 /* 0x023c */ std %f2,[%o5-24]
michael@0 722 /* 0x0240 */ add %o0,4,%o0
michael@0 723 /* 0x0244 178 */ ld [%o0],%f3
michael@0 724 /* 0x0248 177 */ ld [%o0],%o7
michael@0 725 /* 0x024c 178 */ fmovs %f0,%f2
michael@0 726 /* 0x0250 */ fsubd %f2,%f0,%f2
michael@0 727 /* 0x0254 */ std %f2,[%o3-8]
michael@0 728 /* 0x0258 179 */ and %o7,%o4,%g1
michael@0 729 /* 0x025c */ st %g1,[%sp+96]
michael@0 730 /* 0x0260 */ ld [%sp+96],%f3
michael@0 731 /* 0x0264 */ fmovs %f0,%f2
michael@0 732 /* 0x0268 */ fsubd %f2,%f0,%f2
michael@0 733 /* 0x026c 180 */ srl %o7,16,%o7
michael@0 734 /* 0x0270 179 */ std %f2,[%o5-16]
michael@0 735 /* 0x0274 180 */ st %o7,[%sp+92]
michael@0 736 /* 0x0278 */ ld [%sp+92],%f3
michael@0 737 /* 0x027c */ fmovs %f0,%f2
michael@0 738 /* 0x0280 */ fsubd %f2,%f0,%f2
michael@0 739 /* 0x0284 */ std %f2,[%o5-8]
michael@0 740 /* 0x0288 */ bl,pt %icc,.L900000411
michael@0 741 /* 0x028c */ add %o0,4,%o0
/* exit if every word has been handled, otherwise fall into the single-word loop */
michael@0 742 .L900000414:
michael@0 743 /* 0x0290 180 */ cmp %g5,%i3
michael@0 744 /* 0x0294 */ bge,pn %icc,.L77000164
michael@0 745 /* 0x0298 */ nop
/* One word per pass while the index is < len; the annulled branch's delay
 * slot preloads the next word into %f3 only when looping. */
michael@0 746 .L77000161:
michael@0 747 /* 0x029c 178 */ ld [%o0],%f3
michael@0 748 .L900000416:
michael@0 749 /* 0x02a0 178 */ ldd [%o2],%f0
michael@0 750 /* 0x02a4 180 */ add %g5,1,%g5
michael@0 751 /* 0x02a8 177 */ ld [%o0],%o1
michael@0 752 /* 0x02ac 180 */ add %o0,4,%o0
michael@0 753 /* 0x02b0 */ cmp %g5,%i3
michael@0 754 /* 0x02b4 178 */ fmovs %f0,%f2
michael@0 755 /* 0x02b8 179 */ and %o1,%o4,%o7
michael@0 756 /* 0x02bc 178 */ fsubd %f2,%f0,%f2
michael@0 757 /* 0x02c0 */ std %f2,[%o3]
michael@0 758 /* 0x02c4 180 */ srl %o1,16,%o1
michael@0 759 /* 0x02c8 179 */ st %o7,[%sp+96]
michael@0 760 /* 0x02cc 180 */ add %o3,8,%o3
michael@0 761 /* 0x02d0 179 */ fmovs %f0,%f2
michael@0 762 /* 0x02d4 */ ld [%sp+96],%f3
michael@0 763 /* 0x02d8 */ fsubd %f2,%f0,%f2
michael@0 764 /* 0x02dc */ std %f2,[%o5]
michael@0 765 /* 0x02e0 180 */ st %o1,[%sp+92]
michael@0 766 /* 0x02e4 */ fmovs %f0,%f2
michael@0 767 /* 0x02e8 */ ld [%sp+92],%f3
michael@0 768 /* 0x02ec */ fsubd %f2,%f0,%f0
michael@0 769 /* 0x02f0 */ std %f0,[%o5+8]
michael@0 770 /* 0x02f4 */ add %o5,16,%o5
michael@0 771 /* 0x02f8 */ bl,a,pt %icc,.L900000416
michael@0 772 /* 0x02fc */ ld [%o0],%f3
michael@0 773 .L77000164:
michael@0 774 /* 0x0300 */ ret ! Result =
michael@0 775 /* 0x0304 */ restore %g0,%g0,%g0
michael@0 776 /* 0x0308 0 */ .type conv_i32_to_d32_and_d16,2
michael@0 777 /* 0x0308 */ .size conv_i32_to_d32_and_d16,(.-conv_i32_to_d32_and_d16)
michael@0 778
michael@0 779 .section ".text",#alloc,#execinstr
michael@0 780 /* 000000 0 */ .align 4
michael@0 781 !
michael@0 782 ! SUBROUTINE adjust_montf_result
michael@0 783 !
michael@0 784 ! OFFSET SOURCE LINE LABEL INSTRUCTION
michael@0 785
/*
 * adjust_montf_result(i32, nint, len), following the C listing echoed in
 * the comments below (source lines 185-205 of montmulf.c):
 *   - i is set to -1 if i32[len] > 0; otherwise i scans from len-1 down
 *     to 0 and stops at the first index where i32[i] != nint[i].
 *   - if i < 0 or i32[i] > nint[i] (unsigned), nint[0..len-1] is
 *     subtracted from i32[0..len-1] in place, one 32-bit word at a time,
 *     with the borrow carried in a 64-bit accumulator.
 * Registers on entry, as read by the code: %o0 = i32, %o1 = nint,
 * %o2 = len.  The routine never executes save/restore and returns with
 * retl, so it runs in the caller's register window and touches only %g
 * and %o registers.
 * Several instructions sit in branch delay slots.  A ",a" suffix on a
 * branch means its delay-slot instruction is annulled (skipped) when the
 * branch is not taken.
 */
michael@0 786 .global adjust_montf_result
michael@0 787 adjust_montf_result:
michael@0 788 /* 000000 */ or %g0,%o2,%g5 /* %g5 = len (copy kept: %o2 is overwritten in the scan loop) */
michael@0 789
michael@0 790 ! 181 ! }
michael@0 791 ! 182 !}
michael@0 792 ! 185 !void adjust_montf_result(unsigned int *i32, unsigned int *nint, int len)
michael@0 793 ! 186 !{
michael@0 794 ! 187 !long long acc;
michael@0 795 ! 188 !int i;
michael@0 796 ! 190 ! if(i32[len]>0) i=-1;
michael@0 797
michael@0 798 /* 0x0004 190 */ or %g0,-1,%g4 /* %g4 = i = -1 */
michael@0 799 /* 0x0008 */ sll %o2,2,%g1 /* %g1 = len*4, byte offset of i32[len] */
michael@0 800 /* 0x000c */ ld [%o0+%g1],%g1 /* %g1 = i32[len] */
michael@0 801 /* 0x0010 */ cmp %g1,0
michael@0 802 /* 0x0014 */ bleu,pn %icc,.L77000175 /* unsigned <= 0, i.e. i32[len] == 0: go scan */
michael@0 803 /* 0x0018 */ or %g0,%o1,%o3 /* delay slot, always executed: %o3 = nint */
michael@0 804 /* 0x001c */ ba .L900000511 /* i32[len] > 0: keep i = -1 */
michael@0 805 /* 0x0020 */ cmp %g4,0 /* delay slot: set flags for the i<0 test at the target */
michael@0 806 .L77000175:
michael@0 807
michael@0 808 ! 191 ! else
michael@0 809 ! 192 ! {
michael@0 810 ! 193 ! for(i=len-1; i>=0; i--)
michael@0 811
michael@0 812 /* 0x0024 193 */ sub %o2,1,%g4 /* i = len-1 */
michael@0 813 /* 0x0028 */ sll %g4,2,%g1 /* %g1 = i*4 */
michael@0 814 /* 0x002c */ cmp %g4,0
michael@0 815 /* 0x0030 */ bl,pt %icc,.L900000511 /* len-1 < 0: skip the scan */
michael@0 816 /* 0x0034 */ cmp %g4,0 /* delay slot: set flags for the i<0 test at the target */
michael@0 817 /* 0x0038 */ add %o1,%g1,%g2 /* %g2 = &nint[i] */
michael@0 818
michael@0 819 ! 194 ! {
michael@0 820 ! 195 ! if(i32[i]!=nint[i]) break;
michael@0 821
michael@0 822 /* 0x003c 195 */ ld [%g2],%o5 /* %o5 = nint[i] */
michael@0 823 /* 0x0040 193 */ add %o0,%g1,%g3 /* %g3 = &i32[i] */
michael@0 824 .L900000510:
michael@0 825 /* 0x0044 195 */ ld [%g3],%o2 /* %o2 = i32[i] */
michael@0 826 /* 0x0048 */ sub %g4,1,%g1 /* %g1 = i-1 (candidate next index) */
michael@0 827 /* 0x004c */ sub %g2,4,%g2 /* step nint pointer down one word */
michael@0 828 /* 0x0050 */ sub %g3,4,%g3 /* step i32 pointer down one word */
michael@0 829 /* 0x0054 */ cmp %o2,%o5
michael@0 830 /* 0x0058 */ bne,pn %icc,.L77000182 /* words differ: break, %g4 still holds i */
michael@0 831 /* 0x005c */ nop
michael@0 832 /* 0x0060 0 */ or %g0,%g1,%g4 /* i = i-1 */
michael@0 833 /* 0x0064 195 */ cmp %g1,0
michael@0 834 /* 0x0068 */ bge,a,pt %icc,.L900000510 /* i >= 0: next iteration */
michael@0 835 /* 0x006c */ ld [%g2],%o5 /* annulled delay slot (taken path only): %o5 = nint[i] */
michael@0 836 .L77000182:
michael@0 837
michael@0 838 ! 196 ! }
michael@0 839 ! 197 ! }
michael@0 840 ! 198 ! if((i<0)||(i32[i]>nint[i]))
michael@0 841
michael@0 842 /* 0x0070 198 */ cmp %g4,0
michael@0 843 .L900000511:
michael@0 844 /* 0x0074 198 */ bl,pn %icc,.L77000198 /* i < 0: do the subtraction */
michael@0 845 /* 0x0078 */ sll %g4,2,%g2 /* delay slot: %g2 = i*4 */
michael@0 846 /* 0x007c */ ld [%o1+%g2],%g1 /* %g1 = nint[i] */
michael@0 847 /* 0x0080 */ ld [%o0+%g2],%g2 /* %g2 = i32[i] */
michael@0 848 /* 0x0084 */ cmp %g2,%g1
michael@0 849 /* 0x0088 */ bleu,pt %icc,.L77000191 /* i32[i] <= nint[i] (unsigned): return unchanged */
michael@0 850 /* 0x008c */ nop
michael@0 851 .L77000198:
michael@0 852
michael@0 853 ! 199 ! {
michael@0 854 ! 200 ! acc=0;
michael@0 855 ! 201 ! for(i=0;i<len;i++)
michael@0 856
michael@0 857 /* 0x0090 201 */ cmp %g5,0
michael@0 858 /* 0x0094 */ ble,pt %icc,.L77000191 /* len <= 0: loop body never runs, return */
michael@0 859 /* 0x0098 */ nop
michael@0 860 /* 0x009c */ or %g0,%g5,%g1 /* %g1 = len */
michael@0 861 /* 0x00a0 198 */ or %g0,-1,%g2
michael@0 862 /* 0x00a4 */ srl %g2,0,%g3 /* %g3 = 0xffffffff mask (srl by 0 clears the upper 32 bits) */
michael@0 863 /* 0x00a8 */ sub %g5,1,%g4 /* %g4 = len-1, loop bound */
michael@0 864 /* 0x00ac 200 */ or %g0,0,%g5 /* acc = 0 */
michael@0 865 /* 0x00b0 201 */ or %g0,0,%o5 /* i = 0 */
michael@0 866 /* 0x00b4 198 */ or %g0,%o0,%o4 /* %o4 = &i32[0] */
michael@0 867 /* 0x00b8 */ cmp %g1,3
michael@0 868 /* 0x00bc 201 */ bl,pn %icc,.L77000199 /* len < 3: use the simple loop */
michael@0 869 /* 0x00c0 */ add %o0,8,%g1 /* delay slot: %g1 = &i32[2] */
michael@0 870 /* 0x00c4 */ add %o1,4,%g2 /* %g2 = &nint[1] */
michael@0 871
michael@0 872 ! 202 ! {
michael@0 873 ! 203 ! acc=acc+(unsigned long long)(i32[i])-(unsigned long long)(nint[i]);
michael@0 874
michael@0 875 /* 0x00c8 203 */ ld [%o0],%o2 /* %o2 = i32[0] */
michael@0 876 /* 0x00cc */ ld [%o1],%o1 /* %o1 = nint[0]; the nint pointer now lives on in %g2 */
michael@0 877 /* 0x00d0 0 */ or %g0,%g1,%o4 /* %o4 = &i32[2] */
michael@0 878 /* 0x00d4 */ or %g0,%g2,%o3 /* %o3 = &nint[1] */
michael@0 879 /* 0x00d8 203 */ ld [%o0+4],%g1 /* %g1 = i32[1], preloaded for the loop below */
michael@0 880
michael@0 881 ! 204 ! i32[i]=acc&0xffffffff;
michael@0 882 ! 205 ! acc=acc>>32;
michael@0 883
michael@0 884 /* 0x00dc 205 */ or %g0,2,%o5 /* i = 2 */
michael@0 885 /* 0x00e0 201 */ sub %o2,%o1,%o2 /* i32[0] - nint[0] */
michael@0 886 /* 0x00e4 */ or %g0,%o2,%g5 /* acc = that difference */
michael@0 887 /* 0x00e8 204 */ and %o2,%g3,%o2 /* keep the low 32 bits */
michael@0 888 /* 0x00ec */ st %o2,[%o0] /* i32[0] = low word */
michael@0 889 /* 0x00f0 205 */ srax %g5,32,%g5 /* acc >>= 32 (arithmetic shift) */
michael@0 890 .L900000505:
michael@0 891 /* 0x00f4 203 */ ld [%o3],%o2 /* %o2 = nint word matching the i32 word already in %g1 */
michael@0 892 /* 0x00f8 205 */ add %o5,1,%o5 /* i++ */
michael@0 893 /* 0x00fc */ add %o3,4,%o3 /* advance nint pointer */
michael@0 894 /* 0x0100 */ cmp %o5,%g4 /* compare i with len-1 */
michael@0 895 /* 0x0104 */ add %o4,4,%o4 /* advance i32 pointer */
michael@0 896 /* 0x0108 201 */ sub %g1,%o2,%g1 /* i32 word - nint word */
michael@0 897 /* 0x010c */ add %g1,%g5,%g5 /* acc += difference */
michael@0 898 /* 0x0110 204 */ and %g5,%g3,%o2 /* keep the low 32 bits */
michael@0 899 /* 0x0114 203 */ ld [%o4-4],%g1 /* preload the next i32 word */
michael@0 900 /* 0x0118 204 */ st %o2,[%o4-8] /* store the result word just computed */
michael@0 901 /* 0x011c 205 */ ble,pt %icc,.L900000505 /* loop while i <= len-1 */
michael@0 902 /* 0x0120 */ srax %g5,32,%g5 /* delay slot, always executed: acc >>= 32 */
michael@0 903 .L900000508:
michael@0 904 /* 0x0124 203 */ ld [%o3],%g2 /* final word: %g2 = last nint word */
michael@0 905 /* 0x0128 201 */ sub %g1,%g2,%g1 /* last i32 word - last nint word */
michael@0 906 /* 0x012c */ add %g1,%g5,%g1 /* add the carried acc */
michael@0 907 /* 0x0130 204 */ and %g1,%g3,%g2 /* keep the low 32 bits */
michael@0 908 /* 0x0134 */ retl ! Result =
michael@0 909 /* 0x0138 */ st %g2,[%o4-4] /* delay slot: store the last result word */
michael@0 910 .L77000199:
michael@0 911 /* 0x013c 203 */ ld [%o4],%g1 /* simple loop (len < 3): %g1 = i32[0] */
michael@0 912 .L900000509:
michael@0 913 /* 0x0140 203 */ ld [%o3],%g2 /* %g2 = nint[i] (%o3 was set to nint at entry) */
michael@0 914 /* 0x0144 */ add %g5,%g1,%g1 /* acc + i32[i] */
michael@0 915 /* 0x0148 205 */ add %o5,1,%o5 /* i++ */
michael@0 916 /* 0x014c */ add %o3,4,%o3 /* advance nint pointer */
michael@0 917 /* 0x0150 */ cmp %o5,%g4 /* compare i with len-1 */
michael@0 918 /* 0x0154 203 */ sub %g1,%g2,%g1 /* ... - nint[i] */
michael@0 919 /* 0x0158 204 */ and %g1,%g3,%g2 /* keep the low 32 bits */
michael@0 920 /* 0x015c */ st %g2,[%o4] /* store the result word into i32 */
michael@0 921 /* 0x0160 205 */ add %o4,4,%o4 /* advance i32 pointer */
michael@0 922 /* 0x0164 */ srax %g1,32,%g5 /* acc = result >> 32 (arithmetic shift) */
michael@0 923 /* 0x0168 */ ble,a,pt %icc,.L900000509 /* loop while i <= len-1 */
michael@0 924 /* 0x016c */ ld [%o4],%g1 /* annulled delay slot (taken path only): next i32 word */
michael@0 925 .L77000191:
michael@0 926 /* 0x0170 */ retl ! Result =
michael@0 927 /* 0x0174 */ nop
michael@0 928 /* 0x0178 0 */ .type adjust_montf_result,2
michael@0 929 /* 0x0178 */ .size adjust_montf_result,(.-adjust_montf_result)
michael@0 930
michael@0 931 .section ".text",#alloc,#execinstr
michael@0 932 /* 000000 0 */ .align 4
michael@0 933 /* 000000 */ .skip 16
michael@0 934 !
michael@0 935 ! SUBROUTINE mont_mulf_noconv
michael@0 936 !
michael@0 937 ! OFFSET SOURCE LINE LABEL INSTRUCTION
michael@0 938
michael@0 939 .global mont_mulf_noconv
michael@0 940 mont_mulf_noconv:
michael@0 941 /* 000000 */ save %sp,-144,%sp
michael@0 942 .L900000646:
michael@0 943 /* 0x0004 */ call .+8
michael@0 944 /* 0x0008 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000646-.)),%g5
michael@0 945
michael@0 946 ! 206 ! }
michael@0 947 ! 207 ! }
michael@0 948 ! 208 !}
michael@0 949 ! 213 !/*
michael@0 950 ! 214 !** the lengths of the input arrays should be at least the following:
michael@0 951 ! 215 !** result[nlen+1], dm1[nlen], dm2[2*nlen+1], dt[4*nlen+2], dn[nlen], nint[nlen]
michael@0 952 ! 216 !** all of them should be different from one another
michael@0 953 ! 217 !**
michael@0 954 ! 218 !*/
michael@0 955 ! 219 !void mont_mulf_noconv(unsigned int *result,
michael@0 956 ! 220 ! double *dm1, double *dm2, double *dt,
michael@0 957 ! 221 ! double *dn, unsigned int *nint,
michael@0 958 ! 222 ! int nlen, double dn0)
michael@0 959 ! 223 !{
michael@0 960 ! 224 ! int i, j, jj;
michael@0 961 ! 225 ! int tmp;
michael@0 962 ! 226 ! double digit, m2j, nextm2j, a, b;
michael@0 963 ! 227 ! double *dptmp, *pdm1, *pdm2, *pdn, *pdtj, pdn_0, pdm1_0;
michael@0 964 ! 229 ! pdm1=&(dm1[0]);
michael@0 965 ! 230 ! pdm2=&(dm2[0]);
michael@0 966 ! 231 ! pdn=&(dn[0]);
michael@0 967 ! 232 ! pdm2[2*nlen]=Zero;
michael@0 968
michael@0 969 /* 0x000c 232 */ ld [%fp+92],%o1
michael@0 970 /* 0x0010 */ sethi %hi(Zero),%g2
michael@0 971 /* 0x0014 223 */ ldd [%fp+96],%f2
michael@0 972 /* 0x0018 */ add %g5,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000646-.)),%g5
michael@0 973 /* 0x001c 232 */ add %g2,%lo(Zero),%g2
michael@0 974 /* 0x0020 223 */ st %i0,[%fp+68]
michael@0 975 /* 0x0024 */ add %g5,%o7,%o3
michael@0 976
michael@0 977 ! 234 ! if (nlen!=16)
michael@0 978 ! 235 ! {
michael@0 979 ! 236 ! for(i=0;i<4*nlen+2;i++) dt[i]=Zero;
michael@0 980 ! 238 ! a=dt[0]=pdm1[0]*pdm2[0];
michael@0 981 ! 239 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16);
michael@0 982
michael@0 983 /* 0x0028 239 */ sethi %hi(TwoToMinus16),%g3
michael@0 984 /* 0x002c 232 */ ld [%o3+%g2],%l0
michael@0 985 /* 0x0030 239 */ sethi %hi(TwoTo16),%g4
michael@0 986 /* 0x0034 223 */ or %g0,%i2,%o2
michael@0 987 /* 0x0038 */ fmovd %f2,%f16
michael@0 988 /* 0x003c */ st %i5,[%fp+88]
michael@0 989 /* 0x0040 239 */ add %g3,%lo(TwoToMinus16),%g2
michael@0 990 /* 0x0044 223 */ or %g0,%i1,%i2
michael@0 991 /* 0x0048 232 */ ldd [%l0],%f0
michael@0 992 /* 0x004c 239 */ add %g4,%lo(TwoTo16),%g3
michael@0 993 /* 0x0050 223 */ or %g0,%i3,%o0
michael@0 994 /* 0x0054 232 */ sll %o1,4,%g4
michael@0 995 /* 0x0058 239 */ ld [%o3+%g2],%g5
michael@0 996 /* 0x005c 223 */ or %g0,%i3,%i1
michael@0 997 /* 0x0060 239 */ ld [%o3+%g3],%g1
michael@0 998 /* 0x0064 232 */ or %g0,%o1,%i0
michael@0 999 /* 0x0068 */ or %g0,%o2,%i3
michael@0 1000 /* 0x006c 234 */ cmp %o1,16
michael@0 1001 /* 0x0070 */ be,pn %icc,.L77000279
michael@0 1002 /* 0x0074 */ std %f0,[%o2+%g4]
michael@0 1003 /* 0x0078 236 */ sll %o1,2,%g2
michael@0 1004 /* 0x007c */ or %g0,%o0,%o3
michael@0 1005 /* 0x0080 232 */ sll %o1,1,%o1
michael@0 1006 /* 0x0084 236 */ add %g2,2,%o2
michael@0 1007 /* 0x0088 */ cmp %o2,0
michael@0 1008 /* 0x008c */ ble,a,pt %icc,.L900000660
michael@0 1009 /* 0x0090 */ ldd [%i2],%f0
michael@0 1010
michael@0 1011 ! 241 ! pdtj=&(dt[0]);
michael@0 1012 ! 242 ! for(j=jj=0;j<2*nlen;j++,jj++,pdtj++)
michael@0 1013 ! 243 ! {
michael@0 1014 ! 244 ! m2j=pdm2[j];
michael@0 1015 ! 245 ! a=pdtj[0]+pdn[0]*digit;
michael@0 1016 ! 246 ! b=pdtj[1]+pdm1[0]*pdm2[j+1]+a*TwoToMinus16;
michael@0 1017 ! 247 ! pdtj[1]=b;
michael@0 1018 ! 249 !#pragma pipeloop(0)
michael@0 1019 ! 250 ! for(i=1;i<nlen;i++)
michael@0 1020 ! 251 ! {
michael@0 1021 ! 252 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit;
michael@0 1022 ! 253 ! }
michael@0 1023 ! 254 ! if((jj==30)) {cleanup(dt,j/2+1,2*nlen+1); jj=0;}
michael@0 1024 ! 255 !
michael@0 1025 ! 256 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16);
michael@0 1026 ! 257 ! }
michael@0 1027 ! 258 ! }
michael@0 1028 ! 259 ! else
michael@0 1029 ! 260 ! {
michael@0 1030 ! 261 ! a=dt[0]=pdm1[0]*pdm2[0];
michael@0 1031 ! 263 ! dt[65]= dt[64]= dt[63]= dt[62]= dt[61]= dt[60]=
michael@0 1032 ! 264 ! dt[59]= dt[58]= dt[57]= dt[56]= dt[55]= dt[54]=
michael@0 1033 ! 265 ! dt[53]= dt[52]= dt[51]= dt[50]= dt[49]= dt[48]=
michael@0 1034 ! 266 ! dt[47]= dt[46]= dt[45]= dt[44]= dt[43]= dt[42]=
michael@0 1035 ! 267 ! dt[41]= dt[40]= dt[39]= dt[38]= dt[37]= dt[36]=
michael@0 1036 ! 268 ! dt[35]= dt[34]= dt[33]= dt[32]= dt[31]= dt[30]=
michael@0 1037 ! 269 ! dt[29]= dt[28]= dt[27]= dt[26]= dt[25]= dt[24]=
michael@0 1038 ! 270 ! dt[23]= dt[22]= dt[21]= dt[20]= dt[19]= dt[18]=
michael@0 1039 ! 271 ! dt[17]= dt[16]= dt[15]= dt[14]= dt[13]= dt[12]=
michael@0 1040 ! 272 ! dt[11]= dt[10]= dt[ 9]= dt[ 8]= dt[ 7]= dt[ 6]=
michael@0 1041 ! 273 ! dt[ 5]= dt[ 4]= dt[ 3]= dt[ 2]= dt[ 1]=Zero;
michael@0 1042 ! 275 ! pdn_0=pdn[0];
michael@0 1043 ! 276 ! pdm1_0=pdm1[0];
michael@0 1044 ! 278 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16);
michael@0 1045 ! 279 ! pdtj=&(dt[0]);
michael@0 1046 ! 281 ! for(j=0;j<32;j++,pdtj++)
michael@0 1047
michael@0 1048 /* 0x0094 281 */ add %g2,2,%o0
michael@0 1049 /* 0x0098 236 */ add %g2,1,%o2
michael@0 1050 /* 0x009c 281 */ cmp %o0,3
michael@0 1051 /* 0x00a0 */ bl,pn %icc,.L77000280
michael@0 1052 /* 0x00a4 */ or %g0,1,%o0
michael@0 1053 /* 0x00a8 */ add %o3,8,%o3
michael@0 1054 /* 0x00ac */ or %g0,1,%o4
michael@0 1055 /* 0x00b0 */ std %f0,[%o3-8]
michael@0 1056 .L900000630:
michael@0 1057 /* 0x00b4 */ std %f0,[%o3]
michael@0 1058 /* 0x00b8 */ add %o4,2,%o4
michael@0 1059 /* 0x00bc */ add %o3,16,%o3
michael@0 1060 /* 0x00c0 */ cmp %o4,%g2
michael@0 1061 /* 0x00c4 */ ble,pt %icc,.L900000630
michael@0 1062 /* 0x00c8 */ std %f0,[%o3-8]
michael@0 1063 .L900000633:
michael@0 1064 /* 0x00cc */ cmp %o4,%o2
michael@0 1065 /* 0x00d0 */ bg,pn %icc,.L77000285
michael@0 1066 /* 0x00d4 */ add %o4,1,%o0
michael@0 1067 .L77000280:
michael@0 1068 /* 0x00d8 */ std %f0,[%o3]
michael@0 1069 .L900000659:
michael@0 1070 /* 0x00dc */ ldd [%l0],%f0
michael@0 1071 /* 0x00e0 */ cmp %o0,%o2
michael@0 1072 /* 0x00e4 */ add %o3,8,%o3
michael@0 1073 /* 0x00e8 */ add %o0,1,%o0
michael@0 1074 /* 0x00ec */ ble,a,pt %icc,.L900000659
michael@0 1075 /* 0x00f0 */ std %f0,[%o3]
michael@0 1076 .L77000285:
michael@0 1077 /* 0x00f4 238 */ ldd [%i2],%f0
michael@0 1078 .L900000660:
michael@0 1079 /* 0x00f8 238 */ ldd [%i3],%f2
michael@0 1080 /* 0x00fc */ add %o1,1,%o2
michael@0 1081 /* 0x0100 242 */ cmp %o1,0
michael@0 1082 /* 0x0104 */ sll %o2,1,%o0
michael@0 1083 /* 0x0108 */ sub %o1,1,%o1
michael@0 1084 /* 0x010c 238 */ fmuld %f0,%f2,%f0
michael@0 1085 /* 0x0110 */ std %f0,[%i1]
michael@0 1086 /* 0x0114 0 */ or %g0,0,%l1
michael@0 1087 /* 0x0118 */ ldd [%l0],%f6
michael@0 1088 /* 0x011c */ or %g0,0,%g4
michael@0 1089 /* 0x0120 */ or %g0,%o2,%i5
michael@0 1090 /* 0x0124 */ ldd [%g5],%f2
michael@0 1091 /* 0x0128 */ or %g0,%o1,%g3
michael@0 1092 /* 0x012c */ or %g0,%o0,%o3
michael@0 1093 /* 0x0130 */ fdtox %f0,%f0
michael@0 1094 /* 0x0134 */ ldd [%g1],%f4
michael@0 1095 /* 0x0138 246 */ add %i3,8,%o4
michael@0 1096 /* 0x013c */ or %g0,0,%l2
michael@0 1097 /* 0x0140 */ or %g0,%i1,%o5
michael@0 1098 /* 0x0144 */ sub %i0,1,%o7
michael@0 1099 /* 0x0148 */ fmovs %f6,%f0
michael@0 1100 /* 0x014c */ fxtod %f0,%f0
michael@0 1101 /* 0x0150 239 */ fmuld %f0,%f16,%f0
michael@0 1102 /* 0x0154 */ fmuld %f0,%f2,%f2
michael@0 1103 /* 0x0158 */ fdtox %f2,%f2
michael@0 1104 /* 0x015c */ fxtod %f2,%f2
michael@0 1105 /* 0x0160 */ fmuld %f2,%f4,%f2
michael@0 1106 /* 0x0164 */ fsubd %f0,%f2,%f22
michael@0 1107 /* 0x0168 242 */ ble,pt %icc,.L900000653
michael@0 1108 /* 0x016c */ sll %i0,4,%g2
michael@0 1109 /* 0x0170 246 */ ldd [%i4],%f0
michael@0 1110 .L900000654:
michael@0 1111 /* 0x0174 246 */ fmuld %f0,%f22,%f8
michael@0 1112 /* 0x0178 */ ldd [%i2],%f0
michael@0 1113 /* 0x017c 250 */ cmp %i0,1
michael@0 1114 /* 0x0180 246 */ ldd [%o4+%l2],%f6
michael@0 1115 /* 0x0184 */ add %i2,8,%o0
michael@0 1116 /* 0x0188 250 */ or %g0,1,%o1
michael@0 1117 /* 0x018c 246 */ ldd [%o5],%f2
michael@0 1118 /* 0x0190 */ add %o5,16,%l3
michael@0 1119 /* 0x0194 */ fmuld %f0,%f6,%f6
michael@0 1120 /* 0x0198 */ ldd [%g5],%f4
michael@0 1121 /* 0x019c */ faddd %f2,%f8,%f2
michael@0 1122 /* 0x01a0 */ ldd [%o5+8],%f0
michael@0 1123 /* 0x01a4 244 */ ldd [%i3+%l2],%f20
michael@0 1124 /* 0x01a8 246 */ faddd %f0,%f6,%f0
michael@0 1125 /* 0x01ac */ fmuld %f2,%f4,%f2
michael@0 1126 /* 0x01b0 */ faddd %f0,%f2,%f18
michael@0 1127 /* 0x01b4 247 */ std %f18,[%o5+8]
michael@0 1128 /* 0x01b8 250 */ ble,pt %icc,.L900000658
michael@0 1129 /* 0x01bc */ srl %g4,31,%g2
michael@0 1130 /* 0x01c0 */ cmp %o7,7
michael@0 1131 /* 0x01c4 246 */ add %i4,8,%g2
michael@0 1132 /* 0x01c8 250 */ bl,pn %icc,.L77000284
michael@0 1133 /* 0x01cc */ add %g2,24,%o2
michael@0 1134 /* 0x01d0 252 */ ldd [%o0+24],%f12
michael@0 1135 /* 0x01d4 */ add %o5,48,%l3
michael@0 1136 /* 0x01d8 */ ldd [%o0],%f2
michael@0 1137 /* 0x01dc 0 */ or %g0,%o2,%g2
michael@0 1138 /* 0x01e0 250 */ sub %o7,2,%o2
michael@0 1139 /* 0x01e4 252 */ ldd [%g2-24],%f0
michael@0 1140 /* 0x01e8 */ or %g0,5,%o1
michael@0 1141 /* 0x01ec */ ldd [%o0+8],%f6
michael@0 1142 /* 0x01f0 */ fmuld %f2,%f20,%f2
michael@0 1143 /* 0x01f4 */ ldd [%o0+16],%f14
michael@0 1144 /* 0x01f8 */ fmuld %f0,%f22,%f4
michael@0 1145 /* 0x01fc */ add %o0,32,%o0
michael@0 1146 /* 0x0200 */ ldd [%g2-16],%f8
michael@0 1147 /* 0x0204 */ fmuld %f6,%f20,%f10
michael@0 1148 /* 0x0208 */ ldd [%o5+16],%f0
michael@0 1149 /* 0x020c */ ldd [%g2-8],%f6
michael@0 1150 /* 0x0210 */ faddd %f2,%f4,%f4
michael@0 1151 /* 0x0214 */ ldd [%o5+32],%f2
michael@0 1152 .L900000642:
michael@0 1153 /* 0x0218 252 */ ldd [%g2],%f24
michael@0 1154 /* 0x021c */ add %o1,3,%o1
michael@0 1155 /* 0x0220 */ add %g2,24,%g2
michael@0 1156 /* 0x0224 */ fmuld %f8,%f22,%f8
michael@0 1157 /* 0x0228 */ ldd [%l3],%f28
michael@0 1158 /* 0x022c */ cmp %o1,%o2
michael@0 1159 /* 0x0230 */ add %o0,24,%o0
michael@0 1160 /* 0x0234 */ ldd [%o0-24],%f26
michael@0 1161 /* 0x0238 */ faddd %f0,%f4,%f0
michael@0 1162 /* 0x023c */ add %l3,48,%l3
michael@0 1163 /* 0x0240 */ faddd %f10,%f8,%f10
michael@0 1164 /* 0x0244 */ fmuld %f14,%f20,%f4
michael@0 1165 /* 0x0248 */ std %f0,[%l3-80]
michael@0 1166 /* 0x024c */ ldd [%g2-16],%f8
michael@0 1167 /* 0x0250 */ fmuld %f6,%f22,%f6
michael@0 1168 /* 0x0254 */ ldd [%l3-32],%f0
michael@0 1169 /* 0x0258 */ ldd [%o0-16],%f14
michael@0 1170 /* 0x025c */ faddd %f2,%f10,%f2
michael@0 1171 /* 0x0260 */ faddd %f4,%f6,%f10
michael@0 1172 /* 0x0264 */ fmuld %f12,%f20,%f4
michael@0 1173 /* 0x0268 */ std %f2,[%l3-64]
michael@0 1174 /* 0x026c */ ldd [%g2-8],%f6
michael@0 1175 /* 0x0270 */ fmuld %f24,%f22,%f24
michael@0 1176 /* 0x0274 */ ldd [%l3-16],%f2
michael@0 1177 /* 0x0278 */ ldd [%o0-8],%f12
michael@0 1178 /* 0x027c */ faddd %f28,%f10,%f10
michael@0 1179 /* 0x0280 */ std %f10,[%l3-48]
michael@0 1180 /* 0x0284 */ fmuld %f26,%f20,%f10
michael@0 1181 /* 0x0288 */ ble,pt %icc,.L900000642
michael@0 1182 /* 0x028c */ faddd %f4,%f24,%f4
michael@0 1183 .L900000645:
michael@0 1184 /* 0x0290 252 */ fmuld %f8,%f22,%f28
michael@0 1185 /* 0x0294 */ ldd [%g2],%f24
michael@0 1186 /* 0x0298 */ faddd %f0,%f4,%f26
michael@0 1187 /* 0x029c */ fmuld %f12,%f20,%f8
michael@0 1188 /* 0x02a0 */ add %l3,32,%l3
michael@0 1189 /* 0x02a4 */ cmp %o1,%o7
michael@0 1190 /* 0x02a8 */ fmuld %f14,%f20,%f14
michael@0 1191 /* 0x02ac */ ldd [%l3-32],%f4
michael@0 1192 /* 0x02b0 */ add %g2,8,%g2
michael@0 1193 /* 0x02b4 */ faddd %f10,%f28,%f12
michael@0 1194 /* 0x02b8 */ fmuld %f6,%f22,%f6
michael@0 1195 /* 0x02bc */ ldd [%l3-16],%f0
michael@0 1196 /* 0x02c0 */ fmuld %f24,%f22,%f10
michael@0 1197 /* 0x02c4 */ std %f26,[%l3-64]
michael@0 1198 /* 0x02c8 */ faddd %f2,%f12,%f2
michael@0 1199 /* 0x02cc */ std %f2,[%l3-48]
michael@0 1200 /* 0x02d0 */ faddd %f14,%f6,%f6
michael@0 1201 /* 0x02d4 */ faddd %f8,%f10,%f2
michael@0 1202 /* 0x02d8 */ faddd %f4,%f6,%f4
michael@0 1203 /* 0x02dc */ std %f4,[%l3-32]
michael@0 1204 /* 0x02e0 */ faddd %f0,%f2,%f0
michael@0 1205 /* 0x02e4 */ bg,pn %icc,.L77000213
michael@0 1206 /* 0x02e8 */ std %f0,[%l3-16]
michael@0 1207 .L77000284:
michael@0 1208 /* 0x02ec 252 */ ldd [%o0],%f0
michael@0 1209 .L900000657:
michael@0 1210 /* 0x02f0 252 */ ldd [%g2],%f4
michael@0 1211 /* 0x02f4 */ fmuld %f0,%f20,%f2
michael@0 1212 /* 0x02f8 */ add %o1,1,%o1
michael@0 1213 /* 0x02fc */ ldd [%l3],%f0
michael@0 1214 /* 0x0300 */ add %o0,8,%o0
michael@0 1215 /* 0x0304 */ add %g2,8,%g2
michael@0 1216 /* 0x0308 */ fmuld %f4,%f22,%f4
michael@0 1217 /* 0x030c */ cmp %o1,%o7
michael@0 1218 /* 0x0310 */ faddd %f2,%f4,%f2
michael@0 1219 /* 0x0314 */ faddd %f0,%f2,%f0
michael@0 1220 /* 0x0318 */ std %f0,[%l3]
michael@0 1221 /* 0x031c */ add %l3,16,%l3
michael@0 1222 /* 0x0320 */ ble,a,pt %icc,.L900000657
michael@0 1223 /* 0x0324 */ ldd [%o0],%f0
michael@0 1224 .L77000213:
michael@0 1225 /* 0x0328 */ srl %g4,31,%g2
michael@0 1226 .L900000658:
michael@0 1227 /* 0x032c 254 */ cmp %l1,30
michael@0 1228 /* 0x0330 */ bne,a,pt %icc,.L900000656
michael@0 1229 /* 0x0334 */ fdtox %f18,%f0
michael@0 1230 /* 0x0338 */ add %g4,%g2,%g2
michael@0 1231 /* 0x033c */ sra %g2,1,%o0
michael@0 1232 /* 0x0340 281 */ ldd [%l0],%f0
michael@0 1233 /* 0x0344 */ sll %i5,1,%o2
michael@0 1234 /* 0x0348 */ add %o0,1,%g2
michael@0 1235 /* 0x034c */ sll %g2,1,%o0
michael@0 1236 /* 0x0350 254 */ sub %o2,1,%o2
michael@0 1237 /* 0x0354 281 */ fmovd %f0,%f2
michael@0 1238 /* 0x0358 */ sll %g2,4,%o1
michael@0 1239 /* 0x035c */ cmp %o0,%o3
michael@0 1240 /* 0x0360 */ bge,pt %icc,.L77000215
michael@0 1241 /* 0x0364 */ or %g0,0,%l1
michael@0 1242 /* 0x0368 254 */ add %i1,%o1,%o1
michael@0 1243 /* 0x036c 281 */ ldd [%o1],%f6
michael@0 1244 .L900000655:
michael@0 1245 /* 0x0370 */ fdtox %f6,%f10
michael@0 1246 /* 0x0374 */ ldd [%o1+8],%f4
michael@0 1247 /* 0x0378 */ add %o0,2,%o0
michael@0 1248 /* 0x037c */ ldd [%l0],%f12
michael@0 1249 /* 0x0380 */ fdtox %f6,%f6
michael@0 1250 /* 0x0384 */ cmp %o0,%o2
michael@0 1251 /* 0x0388 */ fdtox %f4,%f8
michael@0 1252 /* 0x038c */ fdtox %f4,%f4
michael@0 1253 /* 0x0390 */ fmovs %f12,%f10
michael@0 1254 /* 0x0394 */ fmovs %f12,%f8
michael@0 1255 /* 0x0398 */ fxtod %f10,%f10
michael@0 1256 /* 0x039c */ fxtod %f8,%f8
michael@0 1257 /* 0x03a0 */ faddd %f10,%f2,%f2
michael@0 1258 /* 0x03a4 */ std %f2,[%o1]
michael@0 1259 /* 0x03a8 */ faddd %f8,%f0,%f0
michael@0 1260 /* 0x03ac */ std %f0,[%o1+8]
michael@0 1261 /* 0x03b0 */ add %o1,16,%o1
michael@0 1262 /* 0x03b4 */ fitod %f6,%f2
michael@0 1263 /* 0x03b8 */ fitod %f4,%f0
michael@0 1264 /* 0x03bc */ ble,a,pt %icc,.L900000655
michael@0 1265 /* 0x03c0 */ ldd [%o1],%f6
michael@0 1266 .L77000233:
michael@0 1267 /* 0x03c4 */ or %g0,0,%l1
michael@0 1268 .L77000215:
michael@0 1269 /* 0x03c8 */ fdtox %f18,%f0
michael@0 1270 .L900000656:
michael@0 1271 /* 0x03cc */ ldd [%l0],%f6
michael@0 1272 /* 0x03d0 256 */ add %g4,1,%g4
michael@0 1273 /* 0x03d4 */ add %l2,8,%l2
michael@0 1274 /* 0x03d8 */ ldd [%g5],%f2
michael@0 1275 /* 0x03dc */ add %l1,1,%l1
michael@0 1276 /* 0x03e0 */ add %o5,8,%o5
michael@0 1277 /* 0x03e4 */ fmovs %f6,%f0
michael@0 1278 /* 0x03e8 */ ldd [%g1],%f4
michael@0 1279 /* 0x03ec */ cmp %g4,%g3
michael@0 1280 /* 0x03f0 */ fxtod %f0,%f0
michael@0 1281 /* 0x03f4 */ fmuld %f0,%f16,%f0
michael@0 1282 /* 0x03f8 */ fmuld %f0,%f2,%f2
michael@0 1283 /* 0x03fc */ fdtox %f2,%f2
michael@0 1284 /* 0x0400 */ fxtod %f2,%f2
michael@0 1285 /* 0x0404 */ fmuld %f2,%f4,%f2
michael@0 1286 /* 0x0408 */ fsubd %f0,%f2,%f22
michael@0 1287 /* 0x040c */ ble,a,pt %icc,.L900000654
michael@0 1288 /* 0x0410 */ ldd [%i4],%f0
michael@0 1289 .L900000629:
michael@0 1290 /* 0x0414 256 */ ba .L900000653
michael@0 1291 /* 0x0418 */ sll %i0,4,%g2
michael@0 1292 .L77000279:
michael@0 1293 /* 0x041c 261 */ ldd [%o2],%f6
michael@0 1294 /* 0x0420 279 */ or %g0,%o0,%o4
michael@0 1295 /* 0x0424 281 */ or %g0,0,%o3
michael@0 1296 /* 0x0428 261 */ ldd [%i2],%f4
michael@0 1297 /* 0x042c 273 */ std %f0,[%o0+8]
michael@0 1298 /* 0x0430 */ std %f0,[%o0+16]
michael@0 1299 /* 0x0434 261 */ fmuld %f4,%f6,%f4
michael@0 1300 /* 0x0438 */ std %f4,[%o0]
michael@0 1301 /* 0x043c 273 */ std %f0,[%o0+24]
michael@0 1302 /* 0x0440 */ std %f0,[%o0+32]
michael@0 1303 /* 0x0444 */ fdtox %f4,%f4
michael@0 1304 /* 0x0448 */ std %f0,[%o0+40]
michael@0 1305 /* 0x044c */ std %f0,[%o0+48]
michael@0 1306 /* 0x0450 */ std %f0,[%o0+56]
michael@0 1307 /* 0x0454 */ std %f0,[%o0+64]
michael@0 1308 /* 0x0458 */ std %f0,[%o0+72]
michael@0 1309 /* 0x045c */ std %f0,[%o0+80]
michael@0 1310 /* 0x0460 */ std %f0,[%o0+88]
michael@0 1311 /* 0x0464 */ std %f0,[%o0+96]
michael@0 1312 /* 0x0468 */ std %f0,[%o0+104]
michael@0 1313 /* 0x046c */ std %f0,[%o0+112]
michael@0 1314 /* 0x0470 */ std %f0,[%o0+120]
michael@0 1315 /* 0x0474 */ std %f0,[%o0+128]
michael@0 1316 /* 0x0478 */ std %f0,[%o0+136]
michael@0 1317 /* 0x047c */ std %f0,[%o0+144]
michael@0 1318 /* 0x0480 */ std %f0,[%o0+152]
michael@0 1319 /* 0x0484 */ std %f0,[%o0+160]
michael@0 1320 /* 0x0488 */ std %f0,[%o0+168]
michael@0 1321 /* 0x048c */ fmovs %f0,%f4
michael@0 1322 /* 0x0490 */ std %f0,[%o0+176]
michael@0 1323 /* 0x0494 281 */ or %g0,0,%o1
michael@0 1324 /* 0x0498 273 */ std %f0,[%o0+184]
michael@0 1325 /* 0x049c */ fxtod %f4,%f4
michael@0 1326 /* 0x04a0 */ std %f0,[%o0+192]
michael@0 1327 /* 0x04a4 */ std %f0,[%o0+200]
michael@0 1328 /* 0x04a8 */ std %f0,[%o0+208]
michael@0 1329 /* 0x04ac 278 */ fmuld %f4,%f2,%f2
michael@0 1330 /* 0x04b0 273 */ std %f0,[%o0+216]
michael@0 1331 /* 0x04b4 */ std %f0,[%o0+224]
michael@0 1332 /* 0x04b8 */ std %f0,[%o0+232]
michael@0 1333 /* 0x04bc */ std %f0,[%o0+240]
michael@0 1334 /* 0x04c0 */ std %f0,[%o0+248]
michael@0 1335 /* 0x04c4 */ std %f0,[%o0+256]
michael@0 1336 /* 0x04c8 */ std %f0,[%o0+264]
michael@0 1337 /* 0x04cc */ std %f0,[%o0+272]
michael@0 1338 /* 0x04d0 */ std %f0,[%o0+280]
michael@0 1339 /* 0x04d4 */ std %f0,[%o0+288]
michael@0 1340 /* 0x04d8 */ std %f0,[%o0+296]
michael@0 1341 /* 0x04dc */ std %f0,[%o0+304]
michael@0 1342 /* 0x04e0 */ std %f0,[%o0+312]
michael@0 1343 /* 0x04e4 */ std %f0,[%o0+320]
michael@0 1344 /* 0x04e8 */ std %f0,[%o0+328]
michael@0 1345 /* 0x04ec */ std %f0,[%o0+336]
michael@0 1346 /* 0x04f0 */ std %f0,[%o0+344]
michael@0 1347 /* 0x04f4 */ std %f0,[%o0+352]
michael@0 1348 /* 0x04f8 */ std %f0,[%o0+360]
michael@0 1349 /* 0x04fc */ std %f0,[%o0+368]
michael@0 1350 /* 0x0500 */ std %f0,[%o0+376]
michael@0 1351 /* 0x0504 */ std %f0,[%o0+384]
michael@0 1352 /* 0x0508 */ std %f0,[%o0+392]
michael@0 1353 /* 0x050c */ std %f0,[%o0+400]
michael@0 1354 /* 0x0510 */ std %f0,[%o0+408]
michael@0 1355 /* 0x0514 */ std %f0,[%o0+416]
michael@0 1356 /* 0x0518 */ std %f0,[%o0+424]
michael@0 1357 /* 0x051c */ std %f0,[%o0+432]
michael@0 1358 /* 0x0520 */ std %f0,[%o0+440]
michael@0 1359 /* 0x0524 */ std %f0,[%o0+448]
michael@0 1360 /* 0x0528 */ std %f0,[%o0+456]
michael@0 1361 /* 0x052c */ std %f0,[%o0+464]
michael@0 1362 /* 0x0530 */ std %f0,[%o0+472]
michael@0 1363 /* 0x0534 */ std %f0,[%o0+480]
michael@0 1364 /* 0x0538 */ std %f0,[%o0+488]
michael@0 1365 /* 0x053c */ std %f0,[%o0+496]
michael@0 1366 /* 0x0540 */ std %f0,[%o0+504]
michael@0 1367 /* 0x0544 */ std %f0,[%o0+512]
michael@0 1368 /* 0x0548 */ std %f0,[%o0+520]
michael@0 1369 /* 0x054c */ ldd [%g5],%f0
michael@0 1370 /* 0x0550 */ ldd [%g1],%f8
michael@0 1371 /* 0x0554 */ fmuld %f2,%f0,%f6
michael@0 1372 /* 0x0558 275 */ ldd [%i4],%f4
michael@0 1373 /* 0x055c 276 */ ldd [%i2],%f0
michael@0 1374 /* 0x0560 */ fdtox %f6,%f6
michael@0 1375 /* 0x0564 */ fxtod %f6,%f6
michael@0 1376 /* 0x0568 */ fmuld %f6,%f8,%f6
michael@0 1377 /* 0x056c */ fsubd %f2,%f6,%f2
michael@0 1378 /* 0x0570 286 */ fmuld %f4,%f2,%f12
michael@0 1379
michael@0 1380 ! 282 ! {
michael@0 1381 ! 284 ! m2j=pdm2[j];
michael@0 1382 ! 285 ! a=pdtj[0]+pdn_0*digit;
michael@0 1383 ! 286 ! b=pdtj[1]+pdm1_0*pdm2[j+1]+a*TwoToMinus16;
michael@0 1384
michael@0 1385 ! 287 ! pdtj[1]=b;
michael@0 1386 ! 289 ! /**** this loop will be fully unrolled:
michael@0 1387 ! 290 ! for(i=1;i<16;i++)
michael@0 1388 ! 291 ! {
michael@0 1389 ! 292 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit;
michael@0 1390 ! 293 ! }
michael@0 1391 ! 294 ! *************************************/
michael@0 1392 ! 295 ! pdtj[2]+=pdm1[1]*m2j+pdn[1]*digit;
michael@0 1393 ! 296 ! pdtj[4]+=pdm1[2]*m2j+pdn[2]*digit;
michael@0 1394 ! 297 ! pdtj[6]+=pdm1[3]*m2j+pdn[3]*digit;
michael@0 1395 ! 298 ! pdtj[8]+=pdm1[4]*m2j+pdn[4]*digit;
michael@0 1396 ! 299 ! pdtj[10]+=pdm1[5]*m2j+pdn[5]*digit;
michael@0 1397 ! 300 ! pdtj[12]+=pdm1[6]*m2j+pdn[6]*digit;
michael@0 1398 ! 301 ! pdtj[14]+=pdm1[7]*m2j+pdn[7]*digit;
michael@0 1399 ! 302 ! pdtj[16]+=pdm1[8]*m2j+pdn[8]*digit;
michael@0 1400 ! 303 ! pdtj[18]+=pdm1[9]*m2j+pdn[9]*digit;
michael@0 1401 ! 304 ! pdtj[20]+=pdm1[10]*m2j+pdn[10]*digit;
michael@0 1402 ! 305 ! pdtj[22]+=pdm1[11]*m2j+pdn[11]*digit;
michael@0 1403 ! 306 ! pdtj[24]+=pdm1[12]*m2j+pdn[12]*digit;
michael@0 1404 ! 307 ! pdtj[26]+=pdm1[13]*m2j+pdn[13]*digit;
michael@0 1405 ! 308 ! pdtj[28]+=pdm1[14]*m2j+pdn[14]*digit;
michael@0 1406 ! 309 ! pdtj[30]+=pdm1[15]*m2j+pdn[15]*digit;
michael@0 1407 ! 310 ! /* no need for cleenup, cannot overflow */
michael@0 1408 ! 311 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16);
michael@0 1409
michael@0 1410 fmovd %f2,%f0 ! hand modified
michael@0 1411 fmovd %f16,%f18 ! hand modified
michael@0 1412 ldd [%i4],%f2
michael@0 1413 ldd [%o4],%f8
michael@0 1414 ldd [%i2],%f10
michael@0 1415 ldd [%g5],%f14 ! hand modified
michael@0 1416 ldd [%g1],%f16 ! hand modified
michael@0 1417 ldd [%i3],%f24
michael@0 1418
michael@0 1419 ldd [%i2+8],%f26
michael@0 1420 ldd [%i2+16],%f40
michael@0 1421 ldd [%i2+48],%f46
michael@0 1422 ldd [%i2+56],%f30
michael@0 1423 ldd [%i2+64],%f54
michael@0 1424 ldd [%i2+104],%f34
michael@0 1425 ldd [%i2+112],%f58
michael@0 1426
michael@0 1427 ldd [%i4+8],%f28
michael@0 1428 ldd [%i4+104],%f38
michael@0 1429 ldd [%i4+112],%f60
michael@0 1430
michael@0 1431 .L99999999: !1
michael@0 1432 ldd [%i2+24],%f32
michael@0 1433 fmuld %f0,%f2,%f4 !2
michael@0 1434 ldd [%i4+24],%f36
michael@0 1435 fmuld %f26,%f24,%f20 !3
michael@0 1436 ldd [%i2+40],%f42
michael@0 1437 fmuld %f28,%f0,%f22 !4
michael@0 1438 ldd [%i4+40],%f44
michael@0 1439 fmuld %f32,%f24,%f32 !5
michael@0 1440 ldd [%i3+8],%f6
michael@0 1441 faddd %f4,%f8,%f4
michael@0 1442 fmuld %f36,%f0,%f36 !6
michael@0 1443 add %i3,8,%i3
michael@0 1444 ldd [%i4+56],%f50
michael@0 1445 fmuld %f42,%f24,%f42 !7
michael@0 1446 ldd [%i2+72],%f52
michael@0 1447 faddd %f20,%f22,%f20
michael@0 1448 fmuld %f44,%f0,%f44 !8
michael@0 1449 ldd [%o4+16],%f22
michael@0 1450 fmuld %f10,%f6,%f12 !9
michael@0 1451 ldd [%i4+72],%f56
michael@0 1452 faddd %f32,%f36,%f32
michael@0 1453 fmuld %f14,%f4,%f4 !10
michael@0 1454 ldd [%o4+48],%f36
michael@0 1455 fmuld %f30,%f24,%f48 !11
michael@0 1456 ldd [%o4+8],%f8
michael@0 1457 faddd %f20,%f22,%f20
michael@0 1458 fmuld %f50,%f0,%f50 !12
michael@0 1459 std %f20,[%o4+16]
michael@0 1460 faddd %f42,%f44,%f42
michael@0 1461 fmuld %f52,%f24,%f52 !13
michael@0 1462 ldd [%o4+80],%f44
michael@0 1463 faddd %f4,%f12,%f4
michael@0 1464 fmuld %f56,%f0,%f56 !14
michael@0 1465 ldd [%i2+88],%f20
michael@0 1466 faddd %f32,%f36,%f32 !15
michael@0 1467 ldd [%i4+88],%f22
michael@0 1468 faddd %f48,%f50,%f48 !16
michael@0 1469 ldd [%o4+112],%f50
michael@0 1470 faddd %f52,%f56,%f52 !17
michael@0 1471 ldd [%o4+144],%f56
michael@0 1472 faddd %f4,%f8,%f8
michael@0 1473 fmuld %f20,%f24,%f20 !18
michael@0 1474 std %f32,[%o4+48]
michael@0 1475 faddd %f42,%f44,%f42
michael@0 1476 fmuld %f22,%f0,%f22 !19
michael@0 1477 std %f42,[%o4+80]
michael@0 1478 faddd %f48,%f50,%f48
michael@0 1479 fmuld %f34,%f24,%f32 !20
michael@0 1480 std %f48,[%o4+112]
michael@0 1481 faddd %f52,%f56,%f52
michael@0 1482 fmuld %f38,%f0,%f36 !21
michael@0 1483 ldd [%i2+120],%f42
michael@0 1484 fdtox %f8,%f4 !22
michael@0 1485 std %f52,[%o4+144]
michael@0 1486 faddd %f20,%f22,%f20 !23
michael@0 1487 ldd [%i4+120],%f44 !24
michael@0 1488 ldd [%o4+176],%f22
michael@0 1489 faddd %f32,%f36,%f32
michael@0 1490 fmuld %f42,%f24,%f42 !25
michael@0 1491 ldd [%i4+16],%f50
michael@0 1492 fmovs %f17,%f4 !26
michael@0 1493 ldd [%i2+32],%f52
michael@0 1494 fmuld %f44,%f0,%f44 !27
michael@0 1495 ldd [%i4+32],%f56
michael@0 1496 fmuld %f40,%f24,%f48 !28
michael@0 1497 ldd [%o4+208],%f36
michael@0 1498 faddd %f20,%f22,%f20
michael@0 1499 fmuld %f50,%f0,%f50 !29
michael@0 1500 std %f20,[%o4+176]
michael@0 1501 fxtod %f4,%f4
michael@0 1502 fmuld %f52,%f24,%f52 !30
michael@0 1503 ldd [%i4+48],%f22
michael@0 1504 faddd %f42,%f44,%f42
michael@0 1505 fmuld %f56,%f0,%f56 !31
michael@0 1506 ldd [%o4+240],%f44
michael@0 1507 faddd %f32,%f36,%f32 !32
michael@0 1508 std %f32,[%o4+208]
michael@0 1509 faddd %f48,%f50,%f48
michael@0 1510 fmuld %f46,%f24,%f20 !33
michael@0 1511 ldd [%o4+32],%f50
michael@0 1512 fmuld %f4,%f18,%f12 !34
michael@0 1513 ldd [%i4+64],%f36
michael@0 1514 faddd %f52,%f56,%f52
michael@0 1515 fmuld %f22,%f0,%f22 !35
michael@0 1516 ldd [%o4+64],%f56
michael@0 1517 faddd %f42,%f44,%f42 !36
michael@0 1518 std %f42,[%o4+240]
michael@0 1519 faddd %f48,%f50,%f48
michael@0 1520 fmuld %f54,%f24,%f32 !37
michael@0 1521 std %f48,[%o4+32]
michael@0 1522 fmuld %f12,%f14,%f4 !38
michael@0 1523 ldd [%i2+80],%f42
michael@0 1524 faddd %f52,%f56,%f56 ! yes, tmp52!
michael@0 1525 fmuld %f36,%f0,%f36 !39
michael@0 1526 ldd [%i4+80],%f44
michael@0 1527 faddd %f20,%f22,%f20 !40
michael@0 1528 ldd [%i2+96],%f48
michael@0 1529 fmuld %f58,%f24,%f52 !41
michael@0 1530 ldd [%i4+96],%f50
michael@0 1531 fdtox %f4,%f4
michael@0 1532 fmuld %f42,%f24,%f42 !42
michael@0 1533 std %f56,[%o4+64] ! yes, tmp52!
michael@0 1534 faddd %f32,%f36,%f32
michael@0 1535 fmuld %f44,%f0,%f44 !43
michael@0 1536 ldd [%o4+96],%f22
michael@0 1537 fmuld %f48,%f24,%f48 !44
michael@0 1538 ldd [%o4+128],%f36
michael@0 1539 fmovd %f6,%f24
michael@0 1540 fmuld %f50,%f0,%f50 !45
michael@0 1541 fxtod %f4,%f4
michael@0 1542 fmuld %f60,%f0,%f56 !46
michael@0 1543 add %o4,8,%o4
michael@0 1544 faddd %f42,%f44,%f42 !47
michael@0 1545 ldd [%o4+160-8],%f44
michael@0 1546 faddd %f20,%f22,%f20 !48
michael@0 1547 std %f20,[%o4+96-8]
michael@0 1548 faddd %f48,%f50,%f48 !49
michael@0 1549 ldd [%o4+192-8],%f50
michael@0 1550 faddd %f52,%f56,%f52
michael@0 1551 fmuld %f4,%f16,%f4 !50
michael@0 1552 ldd [%o4+224-8],%f56
michael@0 1553 faddd %f32,%f36,%f32 !51
michael@0 1554 std %f32,[%o4+128-8]
michael@0 1555 faddd %f42,%f44,%f42 !52
michael@0 1556 add %o3,1,%o3
michael@0 1557 std %f42,[%o4+160-8]
michael@0 1558 faddd %f48,%f50,%f48 !53
michael@0 1559 cmp %o3,31
michael@0 1560 std %f48,[%o4+192-8]
michael@0 1561 fsubd %f12,%f4,%f0 !54
michael@0 1562 faddd %f52,%f56,%f52
michael@0 1563 ble,pt %icc,.L99999999
michael@0 1564 std %f52,[%o4+224-8] !55
michael@0 1565 std %f8,[%o4]
michael@0 1566
michael@0 1567 ! 312 ! }
michael@0 1568 ! 313 ! }
michael@0 1569 ! 315 ! conv_d16_to_i32(result,dt+2*nlen,(long long *)dt,nlen+1);
michael@0 1570
michael@0 1571 /* 0x07c8 315 */ sll %i0,4,%g2
michael@0 1572 .L900000653:
michael@0 1573 /* 0x07cc 315 */ add %i1,%g2,%i1
michael@0 1574 /* 0x07d0 242 */ ld [%fp+68],%o0
michael@0 1575 /* 0x07d4 315 */ or %g0,0,%o4
michael@0 1576 /* 0x07d8 */ ldd [%i1],%f0
michael@0 1577 /* 0x07dc */ or %g0,0,%g5
michael@0 1578 /* 0x07e0 */ cmp %i0,0
michael@0 1579 /* 0x07e4 242 */ or %g0,%o0,%o3
michael@0 1580 /* 0x07e8 311 */ sub %i0,1,%g1
michael@0 1581 /* 0x07ec 315 */ fdtox %f0,%f0
michael@0 1582 /* 0x07f0 */ std %f0,[%sp+120]
michael@0 1583 /* 0x07f4 311 */ sethi %hi(0xfc00),%o1
michael@0 1584 /* 0x07f8 */ add %g1,1,%g3
michael@0 1585 /* 0x07fc */ or %g0,%o0,%g4
michael@0 1586 /* 0x0800 315 */ ldd [%i1+8],%f0
michael@0 1587 /* 0x0804 */ add %o1,1023,%o1
michael@0 1588 /* 0x0808 */ fdtox %f0,%f0
michael@0 1589 /* 0x080c */ std %f0,[%sp+112]
michael@0 1590 /* 0x0810 */ ldx [%sp+112],%o5
michael@0 1591 /* 0x0814 */ ldx [%sp+120],%o7
michael@0 1592 /* 0x0818 */ ble,pt %icc,.L900000651
michael@0 1593 /* 0x081c */ sethi %hi(0xfc00),%g2
michael@0 1594 /* 0x0820 311 */ or %g0,-1,%g2
michael@0 1595 /* 0x0824 315 */ cmp %g3,3
michael@0 1596 /* 0x0828 311 */ srl %g2,0,%o2
michael@0 1597 /* 0x082c 315 */ bl,pn %icc,.L77000287
michael@0 1598 /* 0x0830 */ or %g0,%i1,%g2
michael@0 1599 /* 0x0834 */ ldd [%i1+16],%f0
michael@0 1600 /* 0x0838 */ and %o5,%o1,%o0
michael@0 1601 /* 0x083c */ add %i1,16,%g2
michael@0 1602 /* 0x0840 */ sllx %o0,16,%g3
michael@0 1603 /* 0x0844 */ and %o7,%o2,%o0
michael@0 1604 /* 0x0848 */ fdtox %f0,%f0
michael@0 1605 /* 0x084c */ std %f0,[%sp+104]
michael@0 1606 /* 0x0850 */ add %o0,%g3,%o4
michael@0 1607 /* 0x0854 */ ldd [%i1+24],%f2
michael@0 1608 /* 0x0858 */ srax %o5,16,%o0
michael@0 1609 /* 0x085c */ add %o3,4,%g4
michael@0 1610 /* 0x0860 */ stx %o0,[%sp+128]
michael@0 1611 /* 0x0864 */ and %o4,%o2,%o0
michael@0 1612 /* 0x0868 */ stx %o0,[%sp+112]
michael@0 1613 /* 0x086c */ srax %o4,32,%o0
michael@0 1614 /* 0x0870 */ fdtox %f2,%f0
michael@0 1615 /* 0x0874 */ stx %o0,[%sp+136]
michael@0 1616 /* 0x0878 */ srax %o7,32,%o4
michael@0 1617 /* 0x087c */ std %f0,[%sp+96]
michael@0 1618 /* 0x0880 */ ldx [%sp+128],%g5
michael@0 1619 /* 0x0884 */ ldx [%sp+136],%o7
michael@0 1620 /* 0x0888 */ ldx [%sp+104],%g3
michael@0 1621 /* 0x088c */ add %g5,%o7,%o0
michael@0 1622 /* 0x0890 */ or %g0,1,%g5
michael@0 1623 /* 0x0894 */ ldx [%sp+112],%o7
michael@0 1624 /* 0x0898 */ add %o4,%o0,%o4
michael@0 1625 /* 0x089c */ ldx [%sp+96],%o5
michael@0 1626 /* 0x08a0 */ st %o7,[%o3]
michael@0 1627 /* 0x08a4 */ or %g0,%g3,%o7
michael@0 1628 .L900000634:
michael@0 1629 /* 0x08a8 */ ldd [%g2+16],%f0
michael@0 1630 /* 0x08ac */ add %g5,1,%g5
michael@0 1631 /* 0x08b0 */ add %g4,4,%g4
michael@0 1632 /* 0x08b4 */ cmp %g5,%g1
michael@0 1633 /* 0x08b8 */ add %g2,16,%g2
michael@0 1634 /* 0x08bc */ fdtox %f0,%f0
michael@0 1635 /* 0x08c0 */ std %f0,[%sp+104]
michael@0 1636 /* 0x08c4 */ ldd [%g2+8],%f0
michael@0 1637 /* 0x08c8 */ fdtox %f0,%f0
michael@0 1638 /* 0x08cc */ std %f0,[%sp+96]
michael@0 1639 /* 0x08d0 */ and %o5,%o1,%g3
michael@0 1640 /* 0x08d4 */ sllx %g3,16,%g3
michael@0 1641 /* 0x08d8 */ stx %g3,[%sp+120]
michael@0 1642 /* 0x08dc */ and %o7,%o2,%g3
michael@0 1643 /* 0x08e0 */ stx %o7,[%sp+128]
michael@0 1644 /* 0x08e4 */ ldx [%sp+120],%o7
michael@0 1645 /* 0x08e8 */ add %g3,%o7,%g3
michael@0 1646 /* 0x08ec */ ldx [%sp+128],%o7
michael@0 1647 /* 0x08f0 */ srax %o5,16,%o5
michael@0 1648 /* 0x08f4 */ add %g3,%o4,%g3
michael@0 1649 /* 0x08f8 */ srax %g3,32,%o4
michael@0 1650 /* 0x08fc */ stx %o4,[%sp+112]
michael@0 1651 /* 0x0900 */ srax %o7,32,%o4
michael@0 1652 /* 0x0904 */ ldx [%sp+112],%o7
michael@0 1653 /* 0x0908 */ add %o5,%o7,%o7
michael@0 1654 /* 0x090c */ ldx [%sp+96],%o5
michael@0 1655 /* 0x0910 */ add %o4,%o7,%o4
michael@0 1656 /* 0x0914 */ and %g3,%o2,%g3
michael@0 1657 /* 0x0918 */ ldx [%sp+104],%o7
michael@0 1658 /* 0x091c */ ble,pt %icc,.L900000634
michael@0 1659 /* 0x0920 */ st %g3,[%g4-4]
michael@0 1660 .L900000637:
michael@0 1661 /* 0x0924 */ ba .L900000651
michael@0 1662 /* 0x0928 */ sethi %hi(0xfc00),%g2
michael@0 1663 .L77000287:
michael@0 1664 /* 0x092c */ ldd [%g2+16],%f0
michael@0 1665 .L900000650:
michael@0 1666 /* 0x0930 */ and %o7,%o2,%o0
michael@0 1667 /* 0x0934 */ and %o5,%o1,%g3
michael@0 1668 /* 0x0938 */ fdtox %f0,%f0
michael@0 1669 /* 0x093c */ add %o4,%o0,%o0
michael@0 1670 /* 0x0940 */ std %f0,[%sp+104]
michael@0 1671 /* 0x0944 */ add %g5,1,%g5
michael@0 1672 /* 0x0948 */ sllx %g3,16,%o4
michael@0 1673 /* 0x094c */ ldd [%g2+24],%f2
michael@0 1674 /* 0x0950 */ add %g2,16,%g2
michael@0 1675 /* 0x0954 */ add %o0,%o4,%o4
michael@0 1676 /* 0x0958 */ cmp %g5,%g1
michael@0 1677 /* 0x095c */ srax %o5,16,%o0
michael@0 1678 /* 0x0960 */ stx %o0,[%sp+112]
michael@0 1679 /* 0x0964 */ and %o4,%o2,%g3
michael@0 1680 /* 0x0968 */ srax %o4,32,%o5
michael@0 1681 /* 0x096c */ fdtox %f2,%f0
michael@0 1682 /* 0x0970 */ std %f0,[%sp+96]
michael@0 1683 /* 0x0974 */ srax %o7,32,%o4
michael@0 1684 /* 0x0978 */ ldx [%sp+112],%o7
michael@0 1685 /* 0x097c */ add %o7,%o5,%o7
michael@0 1686 /* 0x0980 */ ldx [%sp+104],%o5
michael@0 1687 /* 0x0984 */ add %o4,%o7,%o4
michael@0 1688 /* 0x0988 */ ldx [%sp+96],%o0
michael@0 1689 /* 0x098c */ st %g3,[%g4]
michael@0 1690 /* 0x0990 */ or %g0,%o5,%o7
michael@0 1691 /* 0x0994 */ add %g4,4,%g4
michael@0 1692 /* 0x0998 */ or %g0,%o0,%o5
michael@0 1693 /* 0x099c */ ble,a,pt %icc,.L900000650
michael@0 1694 /* 0x09a0 */ ldd [%g2+16],%f0
michael@0 1695 .L77000236:
michael@0 1696 /* 0x09a4 */ sethi %hi(0xfc00),%g2
michael@0 1697 .L900000651:
michael@0 1698 /* 0x09a8 */ or %g0,-1,%o0
michael@0 1699 /* 0x09ac */ add %g2,1023,%g2
michael@0 1700 /* 0x09b0 */ ld [%fp+88],%o1
michael@0 1701 /* 0x09b4 */ srl %o0,0,%g3
michael@0 1702 /* 0x09b8 */ and %o5,%g2,%g2
michael@0 1703 /* 0x09bc */ and %o7,%g3,%g4
michael@0 1704
michael@0 1705 ! 317 ! adjust_montf_result(result,nint,nlen);
michael@0 1706
michael@0 1707 /* 0x09c0 317 */ or %g0,-1,%o5
michael@0 1708 /* 0x09c4 311 */ sllx %g2,16,%g2
michael@0 1709 /* 0x09c8 */ add %o4,%g4,%g4
michael@0 1710 /* 0x09cc */ add %g4,%g2,%g2
michael@0 1711 /* 0x09d0 */ sll %g5,2,%g4
michael@0 1712 /* 0x09d4 */ and %g2,%g3,%g2
michael@0 1713 /* 0x09d8 */ st %g2,[%o3+%g4]
michael@0 1714 /* 0x09dc 317 */ sll %i0,2,%g2
michael@0 1715 /* 0x09e0 */ ld [%o3+%g2],%g2
michael@0 1716 /* 0x09e4 */ cmp %g2,0
michael@0 1717 /* 0x09e8 */ bleu,pn %icc,.L77000241
michael@0 1718 /* 0x09ec */ or %g0,%o1,%o2
michael@0 1719 /* 0x09f0 */ ba .L900000649
michael@0 1720 /* 0x09f4 */ cmp %o5,0
michael@0 1721 .L77000241:
michael@0 1722 /* 0x09f8 */ sub %i0,1,%o5
michael@0 1723 /* 0x09fc */ sll %o5,2,%g2
michael@0 1724 /* 0x0a00 */ cmp %o5,0
michael@0 1725 /* 0x0a04 */ bl,pt %icc,.L900000649
michael@0 1726 /* 0x0a08 */ cmp %o5,0
michael@0 1727 /* 0x0a0c */ add %o1,%g2,%o1
michael@0 1728 /* 0x0a10 */ add %o3,%g2,%o4
michael@0 1729 /* 0x0a14 */ ld [%o1],%g2
michael@0 1730 .L900000648:
michael@0 1731 /* 0x0a18 */ ld [%o4],%g3
michael@0 1732 /* 0x0a1c */ sub %o5,1,%o0
michael@0 1733 /* 0x0a20 */ sub %o1,4,%o1
michael@0 1734 /* 0x0a24 */ sub %o4,4,%o4
michael@0 1735 /* 0x0a28 */ cmp %g3,%g2
michael@0 1736 /* 0x0a2c */ bne,pn %icc,.L77000244
michael@0 1737 /* 0x0a30 */ nop
michael@0 1738 /* 0x0a34 0 */ or %g0,%o0,%o5
michael@0 1739 /* 0x0a38 317 */ cmp %o0,0
michael@0 1740 /* 0x0a3c */ bge,a,pt %icc,.L900000648
michael@0 1741 /* 0x0a40 */ ld [%o1],%g2
michael@0 1742 .L77000244:
michael@0 1743 /* 0x0a44 */ cmp %o5,0
michael@0 1744 .L900000649:
michael@0 1745 /* 0x0a48 */ bl,pn %icc,.L77000288
michael@0 1746 /* 0x0a4c */ sll %o5,2,%g2
michael@0 1747 /* 0x0a50 */ ld [%o2+%g2],%g3
michael@0 1748 /* 0x0a54 */ ld [%o3+%g2],%g2
michael@0 1749 /* 0x0a58 */ cmp %g2,%g3
michael@0 1750 /* 0x0a5c */ bleu,pt %icc,.L77000224
michael@0 1751 /* 0x0a60 */ nop
michael@0 1752 .L77000288:
michael@0 1753 /* 0x0a64 */ cmp %i0,0
michael@0 1754 /* 0x0a68 */ ble,pt %icc,.L77000224
michael@0 1755 /* 0x0a6c */ nop
michael@0 1756 /* 0x0a70 317 */ sub %i0,1,%o7
michael@0 1757 /* 0x0a74 */ or %g0,-1,%g2
michael@0 1758 /* 0x0a78 */ srl %g2,0,%o4
michael@0 1759 /* 0x0a7c */ add %o7,1,%o0
michael@0 1760 /* 0x0a80 315 */ or %g0,0,%o5
michael@0 1761 /* 0x0a84 */ or %g0,0,%g1
michael@0 1762 /* 0x0a88 */ cmp %o0,3
michael@0 1763 /* 0x0a8c */ bl,pn %icc,.L77000289
michael@0 1764 /* 0x0a90 */ add %o3,8,%o1
michael@0 1765 /* 0x0a94 */ add %o2,4,%o0
michael@0 1766 /* 0x0a98 */ ld [%o1-8],%g2
michael@0 1767 /* 0x0a9c 0 */ or %g0,%o1,%o3
michael@0 1768 /* 0x0aa0 315 */ ld [%o0-4],%g3
michael@0 1769 /* 0x0aa4 0 */ or %g0,%o0,%o2
michael@0 1770 /* 0x0aa8 315 */ or %g0,2,%g1
michael@0 1771 /* 0x0aac */ ld [%o3-4],%o0
michael@0 1772 /* 0x0ab0 */ sub %g2,%g3,%g2
michael@0 1773 /* 0x0ab4 */ or %g0,%g2,%o5
michael@0 1774 /* 0x0ab8 */ and %g2,%o4,%g2
michael@0 1775 /* 0x0abc */ st %g2,[%o3-8]
michael@0 1776 /* 0x0ac0 */ srax %o5,32,%o5
michael@0 1777 .L900000638:
michael@0 1778 /* 0x0ac4 */ ld [%o2],%g2
michael@0 1779 /* 0x0ac8 */ add %g1,1,%g1
michael@0 1780 /* 0x0acc */ add %o2,4,%o2
michael@0 1781 /* 0x0ad0 */ cmp %g1,%o7
michael@0 1782 /* 0x0ad4 */ add %o3,4,%o3
michael@0 1783 /* 0x0ad8 */ sub %o0,%g2,%o0
michael@0 1784 /* 0x0adc */ add %o0,%o5,%o5
michael@0 1785 /* 0x0ae0 */ and %o5,%o4,%g2
michael@0 1786 /* 0x0ae4 */ ld [%o3-4],%o0
michael@0 1787 /* 0x0ae8 */ st %g2,[%o3-8]
michael@0 1788 /* 0x0aec */ ble,pt %icc,.L900000638
michael@0 1789 /* 0x0af0 */ srax %o5,32,%o5
michael@0 1790 .L900000641:
michael@0 1791 /* 0x0af4 */ ld [%o2],%o1
michael@0 1792 /* 0x0af8 */ sub %o0,%o1,%o0
michael@0 1793 /* 0x0afc */ add %o0,%o5,%o0
michael@0 1794 /* 0x0b00 */ and %o0,%o4,%o1
michael@0 1795 /* 0x0b04 */ st %o1,[%o3-4]
michael@0 1796 /* 0x0b08 */ ret ! Result =
michael@0 1797 /* 0x0b0c */ restore %g0,%g0,%g0
michael@0 1798 .L77000289:
michael@0 1799 /* 0x0b10 */ ld [%o3],%o0
michael@0 1800 .L900000647:
michael@0 1801 /* 0x0b14 */ ld [%o2],%o1
michael@0 1802 /* 0x0b18 */ add %o5,%o0,%o0
michael@0 1803 /* 0x0b1c */ add %g1,1,%g1
michael@0 1804 /* 0x0b20 */ add %o2,4,%o2
michael@0 1805 /* 0x0b24 */ cmp %g1,%o7
michael@0 1806 /* 0x0b28 */ sub %o0,%o1,%o0
michael@0 1807 /* 0x0b2c */ and %o0,%o4,%o1
michael@0 1808 /* 0x0b30 */ st %o1,[%o3]
michael@0 1809 /* 0x0b34 */ add %o3,4,%o3
michael@0 1810 /* 0x0b38 */ srax %o0,32,%o5
michael@0 1811 /* 0x0b3c */ ble,a,pt %icc,.L900000647
michael@0 1812 /* 0x0b40 */ ld [%o3],%o0
michael@0 1813 .L77000224:
michael@0 1814 /* 0x0b44 */ ret ! Result =
michael@0 1815 /* 0x0b48 */ restore %g0,%g0,%g0
michael@0 1816 /* 0x0b4c 0 */ .type mont_mulf_noconv,2
michael@0 1817 /* 0x0b4c */ .size mont_mulf_noconv,(.-mont_mulf_noconv)
michael@0 1818

mercurial