Thu, 22 Jan 2015 13:21:57 +0100
Incorporate requested changes from Mozilla in review:
https://bugzilla.mozilla.org/show_bug.cgi?id=1123480#c6
michael@0 | 1 | ! |
michael@0 | 2 | ! This Source Code Form is subject to the terms of the Mozilla Public |
michael@0 | 3 | ! License, v. 2.0. If a copy of the MPL was not distributed with this |
michael@0 | 4 | ! file, You can obtain one at http://mozilla.org/MPL/2.0/. |
michael@0 | 5 | |
michael@0 | 6 | .section ".text",#alloc,#execinstr |
michael@0 | 7 | .file "montmulf.c" |
michael@0 | 8 | |
michael@0 | 9 | .section ".rodata",#alloc |
michael@0 | 10 | .global TwoTo16 |
michael@0 | 11 | .align 8 |
michael@0 | 12 | ! |
michael@0 | 13 | ! CONSTANT POOL: TwoTo16 = 65536.0 stored as an 8-byte double (first word 0x40F00000, second word 0) |
michael@0 | 14 | ! |
michael@0 | 15 | .global TwoTo16 |
michael@0 | 16 | TwoTo16: |
michael@0 | 17 | .word 1089470464 |
michael@0 | 18 | .word 0 |
michael@0 | 19 | .type TwoTo16,#object |
michael@0 | 20 | .size TwoTo16,8 |
michael@0 | 21 | .global TwoToMinus16 |
michael@0 | 22 | ! |
michael@0 | 23 | ! CONSTANT POOL: TwoToMinus16 = 1.0/65536.0 stored as an 8-byte double (first word 0x3EF00000, second word 0) |
michael@0 | 24 | ! |
michael@0 | 25 | .global TwoToMinus16 |
michael@0 | 26 | TwoToMinus16: |
michael@0 | 27 | .word 1055916032 |
michael@0 | 28 | .word 0 |
michael@0 | 29 | .type TwoToMinus16,#object |
michael@0 | 30 | .size TwoToMinus16,8 |
michael@0 | 31 | .global Zero |
michael@0 | 32 | ! |
michael@0 | 33 | ! CONSTANT POOL: Zero = 0.0 stored as an 8-byte double (both words 0) |
michael@0 | 34 | ! |
michael@0 | 35 | .global Zero |
michael@0 | 36 | Zero: |
michael@0 | 37 | .word 0 |
michael@0 | 38 | .word 0 |
michael@0 | 39 | .type Zero,#object |
michael@0 | 40 | .size Zero,8 |
michael@0 | 41 | .global TwoTo32 |
michael@0 | 42 | ! |
michael@0 | 43 | ! CONSTANT POOL: TwoTo32 = 65536.0*65536.0 stored as an 8-byte double (first word 0x41F00000, second word 0) |
michael@0 | 44 | ! |
michael@0 | 45 | .global TwoTo32 |
michael@0 | 46 | TwoTo32: |
michael@0 | 47 | .word 1106247680 |
michael@0 | 48 | .word 0 |
michael@0 | 49 | .type TwoTo32,#object |
michael@0 | 50 | .size TwoTo32,8 |
michael@0 | 51 | .global TwoToMinus32 |
michael@0 | 52 | ! |
michael@0 | 53 | ! CONSTANT POOL: TwoToMinus32 = 1.0/(65536.0*65536.0) stored as an 8-byte double (first word 0x3DF00000, second word 0) |
michael@0 | 54 | ! |
michael@0 | 55 | .global TwoToMinus32 |
michael@0 | 56 | TwoToMinus32: |
michael@0 | 57 | .word 1039138816 |
michael@0 | 58 | .word 0 |
michael@0 | 59 | .type TwoToMinus32,#object |
michael@0 | 60 | .size TwoToMinus32,8 |
michael@0 | 61 | |
michael@0 | 62 | .section ".text",#alloc,#execinstr |
michael@0 | 63 | /* 000000 0 */ .align 4 |
michael@0 | 64 | ! conv_d16_to_i32(i32 = %i0, d16 = %i1, tmp = %i2, ilen = %i3); appears to be compiler output for the C source quoted in the comments below. |
michael@0 | 65 | ! SUBROUTINE conv_d16_to_i32 |
michael@0 | 66 | ! Each d16[2*i], d16[2*i+1] pair is converted to 64-bit integers (fdtox, then spilled to the stack and reloaded with ldx) and folded with carry into i32[i]; %i2 (tmp) is never referenced here. |
michael@0 | 67 | ! OFFSET SOURCE LINE LABEL INSTRUCTION |
michael@0 | 68 | |
michael@0 | 69 | .global conv_d16_to_i32 |
michael@0 | 70 | conv_d16_to_i32: |
michael@0 | 71 | /* 000000 */ save %sp,-128,%sp |
michael@0 | 72 | ! FILE montmulf.c |
michael@0 | 73 | |
michael@0 | 74 | ! 36 !#define RF_INLINE_MACROS |
michael@0 | 75 | ! 38 !static const double TwoTo16=65536.0; |
michael@0 | 76 | ! 39 !static const double TwoToMinus16=1.0/65536.0; |
michael@0 | 77 | ! 40 !static const double Zero=0.0; |
michael@0 | 78 | ! 41 !static const double TwoTo32=65536.0*65536.0; |
michael@0 | 79 | ! 42 !static const double TwoToMinus32=1.0/(65536.0*65536.0); |
michael@0 | 80 | ! 44 !#ifdef RF_INLINE_MACROS |
michael@0 | 81 | ! 46 !double upper32(double); |
michael@0 | 82 | ! 47 !double lower32(double, double); |
michael@0 | 83 | ! 48 !double mod(double, double, double); |
michael@0 | 84 | ! 50 !void i16_to_d16_and_d32x4(const double * /*1/(2^16)*/, |
michael@0 | 85 | ! 51 ! const double * /* 2^16*/, |
michael@0 | 86 | ! 52 ! const double * /* 0 */, |
michael@0 | 87 | ! 53 ! double * /*result16*/, |
michael@0 | 88 | ! 54 ! double * /* result32 */, |
michael@0 | 89 | ! 55 ! float * /*source - should be unsigned int* |
michael@0 | 90 | ! 56 ! converted to float* */); |
michael@0 | 91 | ! 58 !#else |
michael@0 | 92 | ! 60 !static double upper32(double x) |
michael@0 | 93 | ! 61 !{ |
michael@0 | 94 | ! 62 ! return floor(x*TwoToMinus32); |
michael@0 | 95 | ! 63 !} |
michael@0 | 96 | ! 65 !static double lower32(double x, double y) |
michael@0 | 97 | ! 66 !{ |
michael@0 | 98 | ! 67 ! return x-TwoTo32*floor(x*TwoToMinus32); |
michael@0 | 99 | ! 68 !} |
michael@0 | 100 | ! 70 !static double mod(double x, double oneoverm, double m) |
michael@0 | 101 | ! 71 !{ |
michael@0 | 102 | ! 72 ! return x-m*floor(x*oneoverm); |
michael@0 | 103 | ! 73 !} |
michael@0 | 104 | ! 75 !#endif |
michael@0 | 105 | ! 78 !static void cleanup(double *dt, int from, int tlen) |
michael@0 | 106 | ! 79 !{ |
michael@0 | 107 | ! 80 ! int i; |
michael@0 | 108 | ! 81 ! double tmp,tmp1,x,x1; |
michael@0 | 109 | ! 83 ! tmp=tmp1=Zero; |
michael@0 | 110 | ! 84 ! /* original code ** |
michael@0 | 111 | ! 85 ! for(i=2*from;i<2*tlen-2;i++) |
michael@0 | 112 | ! 86 ! { |
michael@0 | 113 | ! 87 ! x=dt[i]; |
michael@0 | 114 | ! 88 ! dt[i]=lower32(x,Zero)+tmp1; |
michael@0 | 115 | ! 89 ! tmp1=tmp; |
michael@0 | 116 | ! 90 ! tmp=upper32(x); |
michael@0 | 117 | ! 91 ! } |
michael@0 | 118 | ! 92 ! dt[tlen-2]+=tmp1; |
michael@0 | 119 | ! 93 ! dt[tlen-1]+=tmp; |
michael@0 | 120 | ! 94 ! **end original code ***/ |
michael@0 | 121 | ! 95 ! /* new code ***/ |
michael@0 | 122 | ! 96 ! for(i=2*from;i<2*tlen;i+=2) |
michael@0 | 123 | ! 97 ! { |
michael@0 | 124 | ! 98 ! x=dt[i]; |
michael@0 | 125 | ! 99 ! x1=dt[i+1]; |
michael@0 | 126 | ! 100 ! dt[i]=lower32(x,Zero)+tmp; |
michael@0 | 127 | ! 101 ! dt[i+1]=lower32(x1,Zero)+tmp1; |
michael@0 | 128 | ! 102 ! tmp=upper32(x); |
michael@0 | 129 | ! 103 ! tmp1=upper32(x1); |
michael@0 | 130 | ! 104 ! } |
michael@0 | 131 | ! 105 ! /** end new code **/ |
michael@0 | 132 | ! 106 !} |
michael@0 | 133 | ! 109 !void conv_d16_to_i32(unsigned int *i32, double *d16, long long *tmp, int ilen) |
michael@0 | 134 | ! 110 !{ |
michael@0 | 135 | ! 111 !int i; |
michael@0 | 136 | ! 112 !long long t, t1, a, b, c, d; |
michael@0 | 137 | ! 114 ! t1=0; |
michael@0 | 138 | ! 115 ! a=(long long)d16[0]; |
michael@0 | 139 | |
michael@0 | 140 | /* 0x0004 115 */ ldd [%i1],%f0 |
michael@0 | 141 | /* 0x0008 110 */ or %g0,%i1,%o0 |
michael@0 | 142 | |
michael@0 | 143 | ! 116 ! b=(long long)d16[1]; |
michael@0 | 144 | ! 117 ! for(i=0; i<ilen-1; i++) |
michael@0 | 145 | |
michael@0 | 146 | /* 0x000c 117 */ sub %i3,1,%g2 |
michael@0 | 147 | /* 0x0010 */ cmp %g2,0 ! flags for ilen-1; consumed by the ble at offset 0x0050 |
michael@0 | 148 | /* 0x0014 114 */ or %g0,0,%o4 |
michael@0 | 149 | /* 0x0018 115 */ fdtox %f0,%f0 |
michael@0 | 150 | /* 0x001c */ std %f0,[%sp+120] ! spill the converted value; reloaded into %g4 by the ldx at offset 0x004c |
michael@0 | 151 | /* 0x0020 117 */ or %g0,0,%o7 |
michael@0 | 152 | /* 0x0024 110 */ or %g0,%i3,%o1 |
michael@0 | 153 | /* 0x0028 */ sub %i3,2,%o2 |
michael@0 | 154 | /* 0x002c 116 */ ldd [%o0+8],%f0 |
michael@0 | 155 | /* 0x0030 110 */ sethi %hi(0xfc00),%o1 ! %o1 = 0xfc00 (overwrites the copy of ilen made at offset 0x0024) |
michael@0 | 156 | /* 0x0034 */ add %o2,1,%g3 |
michael@0 | 157 | /* 0x0038 */ add %o1,1023,%o1 ! %o1 = 0xfc00 + 1023 = 0xffff mask |
michael@0 | 158 | /* 0x003c */ or %g0,%i0,%o5 |
michael@0 | 159 | /* 0x0040 116 */ fdtox %f0,%f0 |
michael@0 | 160 | /* 0x0044 */ std %f0,[%sp+112] |
michael@0 | 161 | /* 0x0048 */ ldx [%sp+112],%g1 |
michael@0 | 162 | /* 0x004c 115 */ ldx [%sp+120],%g4 |
michael@0 | 163 | /* 0x0050 117 */ ble,pt %icc,.L900000117 ! ilen-1 <= 0: skip the loop and go straight to the final store |
michael@0 | 164 | /* 0x0054 */ sethi %hi(0xfc00),%g2 |
michael@0 | 165 | /* 0x0058 110 */ or %g0,-1,%g2 |
michael@0 | 166 | /* 0x005c 117 */ cmp %g3,3 |
michael@0 | 167 | /* 0x0060 110 */ srl %g2,0,%o3 ! %o3 = 0xffffffff mask (used for the "&0xffffffff" of source lines 120 and 125) |
michael@0 | 168 | /* 0x0064 117 */ bl,pn %icc,.L77000134 ! %g3 = ilen-1 < 3: take the simple one-iteration-per-pass loop |
michael@0 | 169 | /* 0x0068 */ or %g0,%o0,%g2 |
michael@0 | 170 | |
michael@0 | 171 | ! 118 ! { |
michael@0 | 172 | ! 119 ! c=(long long)d16[2*i+2]; |
michael@0 | 173 | |
michael@0 | 174 | /* 0x006c 119 */ ldd [%o0+16],%f0 |
michael@0 | 175 | |
michael@0 | 176 | ! 120 ! t1+=a&0xffffffff; |
michael@0 | 177 | ! 121 ! t=(a>>32); |
michael@0 | 178 | ! 122 ! d=(long long)d16[2*i+3]; |
michael@0 | 179 | ! 123 ! t1+=(b&0xffff)<<16; |
michael@0 | 180 | ! 124 ! t+=(b>>16)+(t1>>32); |
michael@0 | 181 | ! 125 ! i32[i]=t1&0xffffffff; |
michael@0 | 182 | ! 126 ! t1=t; |
michael@0 | 183 | ! 127 ! a=c; |
michael@0 | 184 | ! 128 ! b=d; |
michael@0 | 185 | |
michael@0 | 186 | /* 0x0070 128 */ add %o0,16,%g2 |
michael@0 | 187 | /* 0x0074 123 */ and %g1,%o1,%o0 |
michael@0 | 188 | /* 0x0078 */ sllx %o0,16,%g3 |
michael@0 | 189 | /* 0x007c 120 */ and %g4,%o3,%o0 |
michael@0 | 190 | /* 0x0080 117 */ add %o0,%g3,%o4 |
michael@0 | 191 | /* 0x0084 119 */ fdtox %f0,%f0 |
michael@0 | 192 | /* 0x0088 */ std %f0,[%sp+104] |
michael@0 | 193 | /* 0x008c 125 */ and %o4,%o3,%g5 |
michael@0 | 194 | /* 0x0090 122 */ ldd [%g2+8],%f2 |
michael@0 | 195 | /* 0x0094 128 */ add %o5,4,%o5 |
michael@0 | 196 | /* 0x0098 124 */ srax %o4,32,%o4 |
michael@0 | 197 | /* 0x009c */ stx %o4,[%sp+112] |
michael@0 | 198 | /* 0x00a0 122 */ fdtox %f2,%f0 |
michael@0 | 199 | /* 0x00a4 */ std %f0,[%sp+96] |
michael@0 | 200 | /* 0x00a8 124 */ srax %g1,16,%o0 |
michael@0 | 201 | /* 0x00ac */ ldx [%sp+112],%o7 |
michael@0 | 202 | /* 0x00b0 121 */ srax %g4,32,%o4 |
michael@0 | 203 | /* 0x00b4 124 */ add %o0,%o7,%g4 |
michael@0 | 204 | /* 0x00b8 128 */ or %g0,1,%o7 |
michael@0 | 205 | /* 0x00bc 119 */ ldx [%sp+104],%g3 |
michael@0 | 206 | /* 0x00c0 124 */ add %o4,%g4,%o4 |
michael@0 | 207 | /* 0x00c4 122 */ ldx [%sp+96],%g1 |
michael@0 | 208 | /* 0x00c8 125 */ st %g5,[%o5-4] |
michael@0 | 209 | /* 0x00cc 127 */ or %g0,%g3,%g4 |
michael@0 | 210 | .L900000112: |
michael@0 | 211 | /* 0x00d0 119 */ ldd [%g2+16],%f0 |
michael@0 | 212 | /* 0x00d4 128 */ add %o7,1,%o7 |
michael@0 | 213 | /* 0x00d8 */ add %o5,4,%o5 |
michael@0 | 214 | /* 0x00dc */ cmp %o7,%o2 |
michael@0 | 215 | /* 0x00e0 */ add %g2,16,%g2 |
michael@0 | 216 | /* 0x00e4 119 */ fdtox %f0,%f0 |
michael@0 | 217 | /* 0x00e8 */ std %f0,[%sp+104] |
michael@0 | 218 | /* 0x00ec 122 */ ldd [%g2+8],%f0 |
michael@0 | 219 | /* 0x00f0 */ fdtox %f0,%f0 |
michael@0 | 220 | /* 0x00f4 */ std %f0,[%sp+96] |
michael@0 | 221 | /* 0x00f8 123 */ and %g1,%o1,%g3 |
michael@0 | 222 | /* 0x00fc */ sllx %g3,16,%g5 |
michael@0 | 223 | /* 0x0100 120 */ and %g4,%o3,%g3 |
michael@0 | 224 | /* 0x0104 117 */ add %g3,%g5,%g3 |
michael@0 | 225 | /* 0x0108 124 */ srax %g1,16,%g1 |
michael@0 | 226 | /* 0x010c 117 */ add %g3,%o4,%g3 |
michael@0 | 227 | /* 0x0110 124 */ srax %g3,32,%o4 |
michael@0 | 228 | /* 0x0114 */ stx %o4,[%sp+112] |
michael@0 | 229 | /* 0x0118 119 */ ldx [%sp+104],%g5 |
michael@0 | 230 | /* 0x011c 121 */ srax %g4,32,%o4 |
michael@0 | 231 | /* 0x0120 124 */ ldx [%sp+112],%g4 |
michael@0 | 232 | /* 0x0124 */ add %g1,%g4,%g4 |
michael@0 | 233 | /* 0x0128 122 */ ldx [%sp+96],%g1 |
michael@0 | 234 | /* 0x012c 124 */ add %o4,%g4,%o4 |
michael@0 | 235 | /* 0x0130 125 */ and %g3,%o3,%g3 |
michael@0 | 236 | /* 0x0134 127 */ or %g0,%g5,%g4 |
michael@0 | 237 | /* 0x0138 128 */ ble,pt %icc,.L900000112 |
michael@0 | 238 | /* 0x013c */ st %g3,[%o5-4] |
michael@0 | 239 | .L900000115: |
michael@0 | 240 | /* 0x0140 128 */ ba .L900000117 |
michael@0 | 241 | /* 0x0144 */ sethi %hi(0xfc00),%g2 |
michael@0 | 242 | .L77000134: |
michael@0 | 243 | /* 0x0148 119 */ ldd [%g2+16],%f0 |
michael@0 | 244 | .L900000116: |
michael@0 | 245 | /* 0x014c 120 */ and %g4,%o3,%o0 |
michael@0 | 246 | /* 0x0150 123 */ and %g1,%o1,%g3 |
michael@0 | 247 | /* 0x0154 119 */ fdtox %f0,%f0 |
michael@0 | 248 | /* 0x0158 120 */ add %o4,%o0,%o0 |
michael@0 | 249 | /* 0x015c 119 */ std %f0,[%sp+104] |
michael@0 | 250 | /* 0x0160 128 */ add %o7,1,%o7 |
michael@0 | 251 | /* 0x0164 123 */ sllx %g3,16,%o4 |
michael@0 | 252 | /* 0x0168 122 */ ldd [%g2+24],%f2 |
michael@0 | 253 | /* 0x016c 128 */ add %g2,16,%g2 |
michael@0 | 254 | /* 0x0170 123 */ add %o0,%o4,%o0 |
michael@0 | 255 | /* 0x0174 128 */ cmp %o7,%o2 |
michael@0 | 256 | /* 0x0178 125 */ and %o0,%o3,%g3 |
michael@0 | 257 | /* 0x017c 122 */ fdtox %f2,%f0 |
michael@0 | 258 | /* 0x0180 */ std %f0,[%sp+96] |
michael@0 | 259 | /* 0x0184 124 */ srax %o0,32,%o0 |
michael@0 | 260 | /* 0x0188 */ stx %o0,[%sp+112] |
michael@0 | 261 | /* 0x018c 121 */ srax %g4,32,%o4 |
michael@0 | 262 | /* 0x0190 122 */ ldx [%sp+96],%o0 |
michael@0 | 263 | /* 0x0194 124 */ srax %g1,16,%g5 |
michael@0 | 264 | /* 0x0198 */ ldx [%sp+112],%g4 |
michael@0 | 265 | /* 0x019c 119 */ ldx [%sp+104],%g1 |
michael@0 | 266 | /* 0x01a0 125 */ st %g3,[%o5] |
michael@0 | 267 | /* 0x01a4 124 */ add %g5,%g4,%g4 |
michael@0 | 268 | /* 0x01a8 128 */ add %o5,4,%o5 |
michael@0 | 269 | /* 0x01ac 124 */ add %o4,%g4,%o4 |
michael@0 | 270 | /* 0x01b0 127 */ or %g0,%g1,%g4 |
michael@0 | 271 | /* 0x01b4 128 */ or %g0,%o0,%g1 |
michael@0 | 272 | /* 0x01b8 */ ble,a,pt %icc,.L900000116 |
michael@0 | 273 | /* 0x01bc */ ldd [%g2+16],%f0 |
michael@0 | 274 | .L77000127: |
michael@0 | 275 | |
michael@0 | 276 | ! 129 ! } |
michael@0 | 277 | ! 130 ! t1+=a&0xffffffff; |
michael@0 | 278 | ! 131 ! t=(a>>32); |
michael@0 | 279 | ! 132 ! t1+=(b&0xffff)<<16; |
michael@0 | 280 | ! 133 ! i32[i]=t1&0xffffffff; |
michael@0 | 281 | |
michael@0 | 282 | /* 0x01c0 133 */ sethi %hi(0xfc00),%g2 |
michael@0 | 283 | .L900000117: |
michael@0 | 284 | /* 0x01c4 133 */ or %g0,-1,%g3 |
michael@0 | 285 | /* 0x01c8 */ add %g2,1023,%g2 ! %g2 = 0xffff mask (every path here has just done sethi %hi(0xfc00),%g2) |
michael@0 | 286 | /* 0x01cc */ srl %g3,0,%g3 ! %g3 = 0xffffffff mask |
michael@0 | 287 | /* 0x01d0 */ and %g1,%g2,%g2 |
michael@0 | 288 | /* 0x01d4 */ and %g4,%g3,%g4 |
michael@0 | 289 | /* 0x01d8 */ sllx %g2,16,%g2 |
michael@0 | 290 | /* 0x01dc */ add %o4,%g4,%g4 |
michael@0 | 291 | /* 0x01e0 */ add %g4,%g2,%g2 |
michael@0 | 292 | /* 0x01e4 */ sll %o7,2,%g4 ! byte offset of i32[i] (i is in %o7) |
michael@0 | 293 | /* 0x01e8 */ and %g2,%g3,%g2 |
michael@0 | 294 | /* 0x01ec */ st %g2,[%i0+%g4] |
michael@0 | 295 | /* 0x01f0 */ ret ! Result = |
michael@0 | 296 | /* 0x01f4 */ restore %g0,%g0,%g0 |
michael@0 | 297 | /* 0x01f8 0 */ .type conv_d16_to_i32,2 |
michael@0 | 298 | /* 0x01f8 */ .size conv_d16_to_i32,(.-conv_d16_to_i32) |
michael@0 | 299 | |
michael@0 | 300 | .section ".text",#alloc,#execinstr |
michael@0 | 301 | /* 000000 0 */ .align 8 |
michael@0 | 302 | ! |
michael@0 | 303 | ! CONSTANT POOL: 0x43300000 followed by 0 is the double 2^52, the bias used by the uint32 -> double conversion below |
michael@0 | 304 | ! |
michael@0 | 305 | .L_const_seg_900000201: |
michael@0 | 306 | /* 000000 0 */ .word 1127219200,0 |
michael@0 | 307 | /* 0x0008 0 */ .align 4 |
michael@0 | 308 | /* 0x0008 */ .skip 16 |
michael@0 | 309 | ! conv_i32_to_d32(d32 = %o0, i32 = %o1, len = %o2): d32[i] = (double)i32[i] for 0 <= i < len. No register window is allocated (no save; returns with retl). |
michael@0 | 310 | ! SUBROUTINE conv_i32_to_d32 |
michael@0 | 311 | ! Conversion: the 32-bit word is loaded into the odd half of an FP register pair, the even half gets the first word of 2^52, and 2^52 is subtracted. Main loop handles 5 elements per pass when len >= 9. |
michael@0 | 312 | ! OFFSET SOURCE LINE LABEL INSTRUCTION |
michael@0 | 313 | |
michael@0 | 314 | .global conv_i32_to_d32 |
michael@0 | 315 | conv_i32_to_d32: |
michael@0 | 316 | /* 000000 */ or %g0,%o7,%g2 ! save the return address: the call .+8 below overwrites %o7 |
michael@0 | 317 | |
michael@0 | 318 | ! 135 !} |
michael@0 | 319 | ! 137 !void conv_i32_to_d32(double *d32, unsigned int *i32, int len) |
michael@0 | 320 | ! 138 !{ |
michael@0 | 321 | ! 139 !int i; |
michael@0 | 322 | ! 141 !#pragma pipeloop(0) |
michael@0 | 323 | ! 142 ! for(i=0;i<len;i++) d32[i]=(double)(i32[i]); |
michael@0 | 324 | |
michael@0 | 325 | /* 0x0004 142 */ cmp %o2,0 |
michael@0 | 326 | .L900000210: |
michael@0 | 327 | /* 0x0008 */ call .+8 |
michael@0 | 328 | /* 0x000c */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000210-.)),%g4 |
michael@0 | 329 | /* 0x0010 142 */ or %g0,0,%o5 |
michael@0 | 330 | /* 0x0014 138 */ add %g4,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000210-.)),%g4 |
michael@0 | 331 | /* 0x0018 */ or %g0,%o0,%g5 |
michael@0 | 332 | /* 0x001c */ add %g4,%o7,%g1 ! %g1 = GOT-relative offset plus the PC captured by call .+8 |
michael@0 | 333 | /* 0x0020 142 */ ble,pt %icc,.L77000140 ! len <= 0: nothing to do |
michael@0 | 334 | /* 0x0024 */ or %g0,%g2,%o7 ! restore the saved return address (delay slot, not annulled) |
michael@0 | 335 | /* 0x0028 */ sethi %hi(.L_const_seg_900000201),%g2 |
michael@0 | 336 | /* 0x002c 138 */ or %g0,%o1,%g4 |
michael@0 | 337 | /* 0x0030 142 */ add %g2,%lo(.L_const_seg_900000201),%g2 |
michael@0 | 338 | /* 0x0034 */ sub %o2,1,%g3 |
michael@0 | 339 | /* 0x0038 */ ld [%g1+%g2],%g2 ! %g2 = address of the 2^52 constant, fetched through the table at %g1 |
michael@0 | 340 | /* 0x003c */ cmp %o2,9 |
michael@0 | 341 | /* 0x0040 */ bl,pn %icc,.L77000144 ! len < 9: use the one-element-per-pass loop |
michael@0 | 342 | /* 0x0044 */ ldd [%g2],%f8 ! %f8:%f9 = 2^52 |
michael@0 | 343 | /* 0x0048 */ add %o1,16,%g4 |
michael@0 | 344 | /* 0x004c */ sub %o2,5,%g1 |
michael@0 | 345 | /* 0x0050 */ ld [%o1],%f7 |
michael@0 | 346 | /* 0x0054 */ or %g0,4,%o5 |
michael@0 | 347 | /* 0x0058 */ ld [%o1+4],%f5 |
michael@0 | 348 | /* 0x005c */ ld [%o1+8],%f3 |
michael@0 | 349 | /* 0x0060 */ fmovs %f8,%f6 ! %f6:%f7 = first word of 2^52 followed by the loaded integer |
michael@0 | 350 | /* 0x0064 */ ld [%o1+12],%f1 |
michael@0 | 351 | .L900000205: |
michael@0 | 352 | /* 0x0068 */ ld [%g4],%f11 |
michael@0 | 353 | /* 0x006c */ add %o5,5,%o5 |
michael@0 | 354 | /* 0x0070 */ add %g4,20,%g4 |
michael@0 | 355 | /* 0x0074 */ fsubd %f6,%f8,%f6 ! subtract 2^52, leaving the integer's value as a double |
michael@0 | 356 | /* 0x0078 */ std %f6,[%g5] |
michael@0 | 357 | /* 0x007c */ cmp %o5,%g1 |
michael@0 | 358 | /* 0x0080 */ add %g5,40,%g5 |
michael@0 | 359 | /* 0x0084 */ fmovs %f8,%f4 |
michael@0 | 360 | /* 0x0088 */ ld [%g4-16],%f7 |
michael@0 | 361 | /* 0x008c */ fsubd %f4,%f8,%f12 |
michael@0 | 362 | /* 0x0090 */ fmovs %f8,%f2 |
michael@0 | 363 | /* 0x0094 */ std %f12,[%g5-32] |
michael@0 | 364 | /* 0x0098 */ ld [%g4-12],%f5 |
michael@0 | 365 | /* 0x009c */ fsubd %f2,%f8,%f12 |
michael@0 | 366 | /* 0x00a0 */ fmovs %f8,%f0 |
michael@0 | 367 | /* 0x00a4 */ std %f12,[%g5-24] |
michael@0 | 368 | /* 0x00a8 */ ld [%g4-8],%f3 |
michael@0 | 369 | /* 0x00ac */ fsubd %f0,%f8,%f12 |
michael@0 | 370 | /* 0x00b0 */ fmovs %f8,%f10 |
michael@0 | 371 | /* 0x00b4 */ std %f12,[%g5-16] |
michael@0 | 372 | /* 0x00b8 */ ld [%g4-4],%f1 |
michael@0 | 373 | /* 0x00bc */ fsubd %f10,%f8,%f10 |
michael@0 | 374 | /* 0x00c0 */ fmovs %f8,%f6 |
michael@0 | 375 | /* 0x00c4 */ ble,pt %icc,.L900000205 |
michael@0 | 376 | /* 0x00c8 */ std %f10,[%g5-8] |
michael@0 | 377 | .L900000208: |
michael@0 | 378 | /* 0x00cc */ fmovs %f8,%f4 |
michael@0 | 379 | /* 0x00d0 */ add %g5,32,%g5 |
michael@0 | 380 | /* 0x00d4 */ cmp %o5,%g3 |
michael@0 | 381 | /* 0x00d8 */ fmovs %f8,%f2 |
michael@0 | 382 | /* 0x00dc */ fmovs %f8,%f0 |
michael@0 | 383 | /* 0x00e0 */ fsubd %f6,%f8,%f6 |
michael@0 | 384 | /* 0x00e4 */ std %f6,[%g5-32] |
michael@0 | 385 | /* 0x00e8 */ fsubd %f4,%f8,%f4 |
michael@0 | 386 | /* 0x00ec */ std %f4,[%g5-24] |
michael@0 | 387 | /* 0x00f0 */ fsubd %f2,%f8,%f2 |
michael@0 | 388 | /* 0x00f4 */ std %f2,[%g5-16] |
michael@0 | 389 | /* 0x00f8 */ fsubd %f0,%f8,%f0 |
michael@0 | 390 | /* 0x00fc */ bg,pn %icc,.L77000140 |
michael@0 | 391 | /* 0x0100 */ std %f0,[%g5-8] |
michael@0 | 392 | .L77000144: |
michael@0 | 393 | /* 0x0104 */ ld [%g4],%f1 |
michael@0 | 394 | .L900000211: |
michael@0 | 395 | /* 0x0108 */ ldd [%g2],%f8 |
michael@0 | 396 | /* 0x010c */ add %o5,1,%o5 |
michael@0 | 397 | /* 0x0110 */ add %g4,4,%g4 |
michael@0 | 398 | /* 0x0114 */ cmp %o5,%g3 |
michael@0 | 399 | /* 0x0118 */ fmovs %f8,%f0 |
michael@0 | 400 | /* 0x011c */ fsubd %f0,%f8,%f0 |
michael@0 | 401 | /* 0x0120 */ std %f0,[%g5] |
michael@0 | 402 | /* 0x0124 */ add %g5,8,%g5 |
michael@0 | 403 | /* 0x0128 */ ble,a,pt %icc,.L900000211 |
michael@0 | 404 | /* 0x012c */ ld [%g4],%f1 |
michael@0 | 405 | .L77000140: |
michael@0 | 406 | /* 0x0130 */ retl ! Result = |
michael@0 | 407 | /* 0x0134 */ nop |
michael@0 | 408 | /* 0x0138 0 */ .type conv_i32_to_d32,2 |
michael@0 | 409 | /* 0x0138 */ .size conv_i32_to_d32,(.-conv_i32_to_d32) |
michael@0 | 410 | |
michael@0 | 411 | .section ".text",#alloc,#execinstr |
michael@0 | 412 | /* 000000 0 */ .align 8 |
michael@0 | 413 | ! |
michael@0 | 414 | ! CONSTANT POOL: 0x43300000 followed by 0 is the double 2^52, the bias used by the integer -> double conversions below |
michael@0 | 415 | ! |
michael@0 | 416 | .L_const_seg_900000301: |
michael@0 | 417 | /* 000000 0 */ .word 1127219200,0 |
michael@0 | 418 | /* 0x0008 0 */ .align 4 |
michael@0 | 419 | ! conv_i32_to_d16(d16 = %i0, i32 = %i1, len = %i2): for 0 <= i < len, d16[2*i] = (double)(i32[i] & 0xffff) and d16[2*i+1] = (double)(i32[i] >> 16). |
michael@0 | 420 | ! SUBROUTINE conv_i32_to_d16 |
michael@0 | 421 | ! Each 16-bit half is stored to the stack, reloaded into %f3, paired with the first word of 2^52 in %f2, and 2^52 is subtracted to give the double. A pipelined loop is used when len >= 3, a simple loop otherwise. |
michael@0 | 422 | ! OFFSET SOURCE LINE LABEL INSTRUCTION |
michael@0 | 423 | |
michael@0 | 424 | .global conv_i32_to_d16 |
michael@0 | 425 | conv_i32_to_d16: |
michael@0 | 426 | /* 000000 */ save %sp,-104,%sp |
michael@0 | 427 | /* 0x0004 */ or %g0,%i2,%o0 |
michael@0 | 428 | |
michael@0 | 429 | ! 143 !} |
michael@0 | 430 | ! 146 !void conv_i32_to_d16(double *d16, unsigned int *i32, int len) |
michael@0 | 431 | ! 147 !{ |
michael@0 | 432 | ! 148 !int i; |
michael@0 | 433 | ! 149 !unsigned int a; |
michael@0 | 434 | ! 151 !#pragma pipeloop(0) |
michael@0 | 435 | ! 152 ! for(i=0;i<len;i++) |
michael@0 | 436 | ! 153 ! { |
michael@0 | 437 | ! 154 ! a=i32[i]; |
michael@0 | 438 | ! 155 ! d16[2*i]=(double)(a&0xffff); |
michael@0 | 439 | ! 156 ! d16[2*i+1]=(double)(a>>16); |
michael@0 | 440 | |
michael@0 | 441 | /* 0x0008 156 */ sethi %hi(.L_const_seg_900000301),%g2 |
michael@0 | 442 | .L900000310: |
michael@0 | 443 | /* 0x000c */ call .+8 |
michael@0 | 444 | /* 0x0010 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000310-.)),%g3 |
michael@0 | 445 | /* 0x0014 152 */ cmp %o0,0 |
michael@0 | 446 | /* 0x0018 147 */ add %g3,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000310-.)),%g3 |
michael@0 | 447 | /* 0x001c 152 */ ble,pt %icc,.L77000150 ! len <= 0: nothing to do |
michael@0 | 448 | /* 0x0020 */ add %g3,%o7,%o2 ! %o2 = GOT-relative offset plus the PC captured by call .+8 |
michael@0 | 449 | /* 0x0024 */ sub %i2,1,%o5 |
michael@0 | 450 | /* 0x0028 156 */ add %g2,%lo(.L_const_seg_900000301),%o1 |
michael@0 | 451 | /* 0x002c 152 */ sethi %hi(0xfc00),%o0 |
michael@0 | 452 | /* 0x0030 */ ld [%o2+%o1],%o3 ! %o3 = address of the 2^52 constant, fetched through the table at %o2 |
michael@0 | 453 | /* 0x0034 */ add %o5,1,%g2 |
michael@0 | 454 | /* 0x0038 */ or %g0,0,%g1 |
michael@0 | 455 | /* 0x003c */ cmp %g2,3 |
michael@0 | 456 | /* 0x0040 */ or %g0,%i1,%o7 |
michael@0 | 457 | /* 0x0044 */ add %o0,1023,%o4 ! %o4 = 0xfc00 + 1023 = 0xffff mask |
michael@0 | 458 | /* 0x0048 */ or %g0,%i0,%g3 |
michael@0 | 459 | /* 0x004c */ bl,pn %icc,.L77000154 ! %g2 = len < 3: use the simple loop |
michael@0 | 460 | /* 0x0050 */ add %o7,4,%o0 |
michael@0 | 461 | /* 0x0054 155 */ ldd [%o3],%f0 ! %f0:%f1 = 2^52 |
michael@0 | 462 | /* 0x0058 156 */ or %g0,1,%g1 |
michael@0 | 463 | /* 0x005c 154 */ ld [%o0-4],%o1 |
michael@0 | 464 | /* 0x0060 0 */ or %g0,%o0,%o7 |
michael@0 | 465 | /* 0x0064 155 */ and %o1,%o4,%o0 |
michael@0 | 466 | .L900000306: |
michael@0 | 467 | /* 0x0068 155 */ st %o0,[%sp+96] ! a & 0xffff goes through the stack into %f3 |
michael@0 | 468 | /* 0x006c 156 */ add %g1,1,%g1 |
michael@0 | 469 | /* 0x0070 */ add %g3,16,%g3 |
michael@0 | 470 | /* 0x0074 */ cmp %g1,%o5 |
michael@0 | 471 | /* 0x0078 */ add %o7,4,%o7 |
michael@0 | 472 | /* 0x007c 155 */ ld [%sp+96],%f3 |
michael@0 | 473 | /* 0x0080 */ fmovs %f0,%f2 |
michael@0 | 474 | /* 0x0084 */ fsubd %f2,%f0,%f2 ! subtract 2^52, leaving the integer's value as a double |
michael@0 | 475 | /* 0x0088 156 */ srl %o1,16,%o0 |
michael@0 | 476 | /* 0x008c 155 */ std %f2,[%g3-16] |
michael@0 | 477 | /* 0x0090 156 */ st %o0,[%sp+92] ! a >> 16 goes through the stack into %f3 |
michael@0 | 478 | /* 0x0094 */ ld [%sp+92],%f3 |
michael@0 | 479 | /* 0x0098 154 */ ld [%o7-4],%o1 |
michael@0 | 480 | /* 0x009c 156 */ fmovs %f0,%f2 |
michael@0 | 481 | /* 0x00a0 */ fsubd %f2,%f0,%f2 |
michael@0 | 482 | /* 0x00a4 155 */ and %o1,%o4,%o0 |
michael@0 | 483 | /* 0x00a8 156 */ ble,pt %icc,.L900000306 |
michael@0 | 484 | /* 0x00ac */ std %f2,[%g3-8] |
michael@0 | 485 | .L900000309: |
michael@0 | 486 | /* 0x00b0 155 */ st %o0,[%sp+96] |
michael@0 | 487 | /* 0x00b4 */ fmovs %f0,%f2 |
michael@0 | 488 | /* 0x00b8 156 */ add %g3,16,%g3 |
michael@0 | 489 | /* 0x00bc */ srl %o1,16,%o0 |
michael@0 | 490 | /* 0x00c0 155 */ ld [%sp+96],%f3 |
michael@0 | 491 | /* 0x00c4 */ fsubd %f2,%f0,%f2 |
michael@0 | 492 | /* 0x00c8 */ std %f2,[%g3-16] |
michael@0 | 493 | /* 0x00cc 156 */ st %o0,[%sp+92] |
michael@0 | 494 | /* 0x00d0 */ fmovs %f0,%f2 |
michael@0 | 495 | /* 0x00d4 */ ld [%sp+92],%f3 |
michael@0 | 496 | /* 0x00d8 */ fsubd %f2,%f0,%f0 |
michael@0 | 497 | /* 0x00dc */ std %f0,[%g3-8] |
michael@0 | 498 | /* 0x00e0 */ ret ! Result = |
michael@0 | 499 | /* 0x00e4 */ restore %g0,%g0,%g0 |
michael@0 | 500 | .L77000154: |
michael@0 | 501 | /* 0x00e8 154 */ ld [%o7],%o0 |
michael@0 | 502 | .L900000311: |
michael@0 | 503 | /* 0x00ec 155 */ and %o0,%o4,%o1 |
michael@0 | 504 | /* 0x00f0 */ st %o1,[%sp+96] |
michael@0 | 505 | /* 0x00f4 156 */ add %g1,1,%g1 |
michael@0 | 506 | /* 0x00f8 155 */ ldd [%o3],%f0 |
michael@0 | 507 | /* 0x00fc 156 */ srl %o0,16,%o0 |
michael@0 | 508 | /* 0x0100 */ add %o7,4,%o7 |
michael@0 | 509 | /* 0x0104 */ cmp %g1,%o5 |
michael@0 | 510 | /* 0x0108 155 */ fmovs %f0,%f2 |
michael@0 | 511 | /* 0x010c */ ld [%sp+96],%f3 |
michael@0 | 512 | /* 0x0110 */ fsubd %f2,%f0,%f2 |
michael@0 | 513 | /* 0x0114 */ std %f2,[%g3] |
michael@0 | 514 | /* 0x0118 156 */ st %o0,[%sp+92] |
michael@0 | 515 | /* 0x011c */ fmovs %f0,%f2 |
michael@0 | 516 | /* 0x0120 */ ld [%sp+92],%f3 |
michael@0 | 517 | /* 0x0124 */ fsubd %f2,%f0,%f0 |
michael@0 | 518 | /* 0x0128 */ std %f0,[%g3+8] |
michael@0 | 519 | /* 0x012c */ add %g3,16,%g3 |
michael@0 | 520 | /* 0x0130 */ ble,a,pt %icc,.L900000311 |
michael@0 | 521 | /* 0x0134 */ ld [%o7],%o0 |
michael@0 | 522 | .L77000150: |
michael@0 | 523 | /* 0x0138 */ ret ! Result = |
michael@0 | 524 | /* 0x013c */ restore %g0,%g0,%g0 |
michael@0 | 525 | /* 0x0140 0 */ .type conv_i32_to_d16,2 |
michael@0 | 526 | /* 0x0140 */ .size conv_i32_to_d16,(.-conv_i32_to_d16) |
michael@0 | 527 | |
michael@0 | 528 | .section ".text",#alloc,#execinstr |
michael@0 | 529 | /* 000000 0 */ .align 8 |
michael@0 | 530 | ! |
michael@0 | 531 | ! CONSTANT POOL |
michael@0 | 532 | ! |
michael@0 | 533 | .L_const_seg_900000401: |
michael@0 | 534 | /* 000000 0 */ .word 1127219200,0 |
michael@0 | 535 | /* 0x0008 0 */ .align 4 |
michael@0 | 536 | /* 0x0008 */ .skip 16 |
michael@0 | 537 | ! |
michael@0 | 538 | ! SUBROUTINE conv_i32_to_d32_and_d16 |
michael@0 | 539 | ! |
michael@0 | 540 | ! OFFSET SOURCE LINE LABEL INSTRUCTION |
michael@0 | 541 | |
michael@0 | 542 | .global conv_i32_to_d32_and_d16 |
michael@0 | 543 | conv_i32_to_d32_and_d16: |
michael@0 | 544 | /* 000000 */ save %sp,-120,%sp |
michael@0 | 545 | .L900000415: |
michael@0 | 546 | /* 0x0004 */ call .+8 |
michael@0 | 547 | /* 0x0008 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000415-.)),%g4 |
michael@0 | 548 | |
michael@0 | 549 | ! 157 ! } |
michael@0 | 550 | ! 158 !} |
michael@0 | 551 | ! 161 !void conv_i32_to_d32_and_d16(double *d32, double *d16, |
michael@0 | 552 | ! 162 ! unsigned int *i32, int len) |
michael@0 | 553 | ! 163 !{ |
michael@0 | 554 | ! 164 !int i = 0; |
michael@0 | 555 | ! 165 !unsigned int a; |
michael@0 | 556 | ! 167 !#pragma pipeloop(0) |
michael@0 | 557 | ! 168 !#ifdef RF_INLINE_MACROS |
michael@0 | 558 | ! 169 ! for(;i<len-3;i+=4) |
michael@0 | 559 | |
michael@0 | 560 | /* 0x000c 169 */ sub %i3,3,%g2 |
michael@0 | 561 | /* 0x0010 */ cmp %g2,0 |
michael@0 | 562 | /* 0x0014 163 */ add %g4,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000415-.)),%g4 |
michael@0 | 563 | |
michael@0 | 564 | ! 170 ! { |
michael@0 | 565 | ! 171 ! i16_to_d16_and_d32x4(&TwoToMinus16, &TwoTo16, &Zero, |
michael@0 | 566 | ! 172 ! &(d16[2*i]), &(d32[i]), (float *)(&(i32[i]))); |
michael@0 | 567 | |
michael@0 | 568 | /* 0x0018 172 */ sethi %hi(Zero),%g2 |
michael@0 | 569 | /* 0x001c 163 */ add %g4,%o7,%o4 |
michael@0 | 570 | /* 0x0020 172 */ add %g2,%lo(Zero),%g2 |
michael@0 | 571 | /* 0x0024 */ sethi %hi(TwoToMinus16),%g3 |
michael@0 | 572 | /* 0x0028 */ ld [%o4+%g2],%o1 |
michael@0 | 573 | /* 0x002c */ sethi %hi(TwoTo16),%g4 |
michael@0 | 574 | /* 0x0030 */ add %g3,%lo(TwoToMinus16),%g2 |
michael@0 | 575 | /* 0x0034 */ ld [%o4+%g2],%o3 |
michael@0 | 576 | /* 0x0038 164 */ or %g0,0,%g5 |
michael@0 | 577 | /* 0x003c 172 */ add %g4,%lo(TwoTo16),%g3 |
michael@0 | 578 | /* 0x0040 */ ld [%o4+%g3],%o2 |
michael@0 | 579 | /* 0x0044 163 */ or %g0,%i0,%i4 |
michael@0 | 580 | /* 0x0048 169 */ or %g0,%i2,%o7 |
michael@0 | 581 | /* 0x004c */ ble,pt %icc,.L900000418 |
michael@0 | 582 | /* 0x0050 */ cmp %g5,%i3 |
michael@0 | 583 | /* 0x0054 172 */ stx %o7,[%sp+104] |
michael@0 | 584 | /* 0x0058 169 */ sub %i3,4,%o5 |
michael@0 | 585 | /* 0x005c */ or %g0,0,%g4 |
michael@0 | 586 | /* 0x0060 */ or %g0,0,%g1 |
michael@0 | 587 | .L900000417: |
michael@0 | 588 | /* 0x0064 */ ldd [%o1],%f2 |
michael@0 | 589 | /* 0x0068 172 */ add %i4,%g4,%g2 |
michael@0 | 590 | /* 0x006c */ add %i1,%g1,%g3 |
michael@0 | 591 | /* 0x0070 */ ldd [%o3],%f0 |
michael@0 | 592 | /* 0x0074 */ add %g5,4,%g5 |
michael@0 | 593 | /* 0x0078 */ fmovd %f2,%f14 |
michael@0 | 594 | /* 0x007c */ ld [%o7],%f15 |
michael@0 | 595 | /* 0x0080 */ cmp %g5,%o5 |
michael@0 | 596 | /* 0x0084 */ fmovd %f2,%f10 |
michael@0 | 597 | /* 0x0088 */ ld [%o7+4],%f11 |
michael@0 | 598 | /* 0x008c */ add %o7,16,%o7 |
michael@0 | 599 | /* 0x0090 */ ldx [%sp+104],%o0 |
michael@0 | 600 | /* 0x0094 */ fmovd %f2,%f6 |
michael@0 | 601 | /* 0x0098 */ stx %o7,[%sp+112] |
michael@0 | 602 | /* 0x009c */ fxtod %f14,%f14 |
michael@0 | 603 | /* 0x00a0 */ ld [%o0+8],%f7 |
michael@0 | 604 | /* 0x00a4 */ fxtod %f10,%f10 |
michael@0 | 605 | /* 0x00a8 */ ld [%o0+12],%f3 |
michael@0 | 606 | /* 0x00ac */ fxtod %f6,%f6 |
michael@0 | 607 | /* 0x00b0 */ ldd [%o2],%f16 |
michael@0 | 608 | /* 0x00b4 */ fmuld %f0,%f14,%f12 |
michael@0 | 609 | /* 0x00b8 */ fxtod %f2,%f2 |
michael@0 | 610 | /* 0x00bc */ fmuld %f0,%f10,%f8 |
michael@0 | 611 | /* 0x00c0 */ std %f14,[%i4+%g4] |
michael@0 | 612 | /* 0x00c4 */ ldx [%sp+112],%o7 |
michael@0 | 613 | /* 0x00c8 */ add %g4,32,%g4 |
michael@0 | 614 | /* 0x00cc */ fmuld %f0,%f6,%f4 |
michael@0 | 615 | /* 0x00d0 */ fdtox %f12,%f12 |
michael@0 | 616 | /* 0x00d4 */ std %f10,[%g2+8] |
michael@0 | 617 | /* 0x00d8 */ fmuld %f0,%f2,%f0 |
michael@0 | 618 | /* 0x00dc */ fdtox %f8,%f8 |
michael@0 | 619 | /* 0x00e0 */ std %f6,[%g2+16] |
michael@0 | 620 | /* 0x00e4 */ std %f2,[%g2+24] |
michael@0 | 621 | /* 0x00e8 */ fdtox %f4,%f4 |
michael@0 | 622 | /* 0x00ec */ fdtox %f0,%f0 |
michael@0 | 623 | /* 0x00f0 */ fxtod %f12,%f12 |
michael@0 | 624 | /* 0x00f4 */ std %f12,[%g3+8] |
michael@0 | 625 | /* 0x00f8 */ fxtod %f8,%f8 |
michael@0 | 626 | /* 0x00fc */ std %f8,[%g3+24] |
michael@0 | 627 | /* 0x0100 */ fxtod %f4,%f4 |
michael@0 | 628 | /* 0x0104 */ std %f4,[%g3+40] |
michael@0 | 629 | /* 0x0108 */ fxtod %f0,%f0 |
michael@0 | 630 | /* 0x010c */ std %f0,[%g3+56] |
michael@0 | 631 | /* 0x0110 */ fmuld %f12,%f16,%f12 |
michael@0 | 632 | /* 0x0114 */ fmuld %f8,%f16,%f8 |
michael@0 | 633 | /* 0x0118 */ fmuld %f4,%f16,%f4 |
michael@0 | 634 | /* 0x011c */ fsubd %f14,%f12,%f12 |
michael@0 | 635 | /* 0x0120 */ std %f12,[%i1+%g1] |
michael@0 | 636 | /* 0x0124 */ fmuld %f0,%f16,%f0 |
michael@0 | 637 | /* 0x0128 */ fsubd %f10,%f8,%f8 |
michael@0 | 638 | /* 0x012c */ std %f8,[%g3+16] |
michael@0 | 639 | /* 0x0130 */ add %g1,64,%g1 |
michael@0 | 640 | /* 0x0134 */ fsubd %f6,%f4,%f4 |
michael@0 | 641 | /* 0x0138 */ std %f4,[%g3+32] |
michael@0 | 642 | /* 0x013c */ fsubd %f2,%f0,%f0 |
michael@0 | 643 | /* 0x0140 */ std %f0,[%g3+48] |
michael@0 | 644 | /* 0x0144 */ ble,a,pt %icc,.L900000417 |
michael@0 | 645 | /* 0x0148 */ stx %o7,[%sp+104] |
michael@0 | 646 | .L77000159: |
michael@0 | 647 | |
michael@0 | 648 | ! 173 ! } |
michael@0 | 649 | ! 174 !#endif |
michael@0 | 650 | ! 175 ! for(;i<len;i++) |
michael@0 | 651 | |
michael@0 | 652 | /* 0x014c 175 */ cmp %g5,%i3 |
michael@0 | 653 | .L900000418: |
michael@0 | 654 | /* 0x0150 175 */ bge,pt %icc,.L77000164 |
michael@0 | 655 | /* 0x0154 */ nop |
michael@0 | 656 | |
michael@0 | 657 | ! 176 ! { |
michael@0 | 658 | ! 177 ! a=i32[i]; |
michael@0 | 659 | ! 178 ! d32[i]=(double)(i32[i]); |
michael@0 | 660 | ! 179 ! d16[2*i]=(double)(a&0xffff); |
michael@0 | 661 | ! 180 ! d16[2*i+1]=(double)(a>>16); |
michael@0 | 662 | |
michael@0 | 663 | /* 0x0158 180 */ sethi %hi(.L_const_seg_900000401),%g2 |
michael@0 | 664 | /* 0x015c */ add %g2,%lo(.L_const_seg_900000401),%o1 |
michael@0 | 665 | /* 0x0160 175 */ sethi %hi(0xfc00),%o0 |
michael@0 | 666 | /* 0x0164 */ ld [%o4+%o1],%o2 |
michael@0 | 667 | /* 0x0168 */ sll %g5,2,%o3 |
michael@0 | 668 | /* 0x016c */ sub %i3,%g5,%g3 |
michael@0 | 669 | /* 0x0170 */ sll %g5,3,%g2 |
michael@0 | 670 | /* 0x0174 */ add %o0,1023,%o4 |
michael@0 | 671 | /* 0x0178 178 */ ldd [%o2],%f0 |
michael@0 | 672 | /* 0x017c */ add %i2,%o3,%o0 |
michael@0 | 673 | /* 0x0180 175 */ cmp %g3,3 |
michael@0 | 674 | /* 0x0184 */ add %i4,%g2,%o3 |
michael@0 | 675 | /* 0x0188 */ sub %i3,1,%o1 |
michael@0 | 676 | /* 0x018c */ sll %g5,4,%g4 |
michael@0 | 677 | /* 0x0190 */ bl,pn %icc,.L77000161 |
michael@0 | 678 | /* 0x0194 */ add %i1,%g4,%o5 |
michael@0 | 679 | /* 0x0198 178 */ ld [%o0],%f3 |
michael@0 | 680 | /* 0x019c 180 */ add %o3,8,%o3 |
michael@0 | 681 | /* 0x01a0 177 */ ld [%o0],%o7 |
michael@0 | 682 | /* 0x01a4 180 */ add %o5,16,%o5 |
michael@0 | 683 | /* 0x01a8 */ add %g5,1,%g5 |
michael@0 | 684 | /* 0x01ac 178 */ fmovs %f0,%f2 |
michael@0 | 685 | /* 0x01b0 180 */ add %o0,4,%o0 |
michael@0 | 686 | /* 0x01b4 179 */ and %o7,%o4,%g1 |
michael@0 | 687 | /* 0x01b8 178 */ fsubd %f2,%f0,%f2 |
michael@0 | 688 | /* 0x01bc */ std %f2,[%o3-8] |
michael@0 | 689 | /* 0x01c0 180 */ srl %o7,16,%o7 |
michael@0 | 690 | /* 0x01c4 179 */ st %g1,[%sp+96] |
michael@0 | 691 | /* 0x01c8 */ fmovs %f0,%f2 |
michael@0 | 692 | /* 0x01cc */ ld [%sp+96],%f3 |
michael@0 | 693 | /* 0x01d0 */ fsubd %f2,%f0,%f2 |
michael@0 | 694 | /* 0x01d4 */ std %f2,[%o5-16] |
michael@0 | 695 | /* 0x01d8 180 */ st %o7,[%sp+92] |
michael@0 | 696 | /* 0x01dc */ fmovs %f0,%f2 |
michael@0 | 697 | /* 0x01e0 */ ld [%sp+92],%f3 |
michael@0 | 698 | /* 0x01e4 */ fsubd %f2,%f0,%f2 |
michael@0 | 699 | /* 0x01e8 */ std %f2,[%o5-8] |
michael@0 | 700 | .L900000411: |
michael@0 | 701 | /* 0x01ec 178 */ ld [%o0],%f3 |
michael@0 | 702 | /* 0x01f0 180 */ add %g5,2,%g5 |
michael@0 | 703 | /* 0x01f4 */ add %o5,32,%o5 |
michael@0 | 704 | /* 0x01f8 177 */ ld [%o0],%o7 |
michael@0 | 705 | /* 0x01fc 180 */ cmp %g5,%o1 |
michael@0 | 706 | /* 0x0200 */ add %o3,16,%o3 |
michael@0 | 707 | /* 0x0204 178 */ fmovs %f0,%f2 |
michael@0 | 708 | /* 0x0208 */ fsubd %f2,%f0,%f2 |
michael@0 | 709 | /* 0x020c */ std %f2,[%o3-16] |
michael@0 | 710 | /* 0x0210 179 */ and %o7,%o4,%g1 |
michael@0 | 711 | /* 0x0214 */ st %g1,[%sp+96] |
michael@0 | 712 | /* 0x0218 */ ld [%sp+96],%f3 |
michael@0 | 713 | /* 0x021c */ fmovs %f0,%f2 |
michael@0 | 714 | /* 0x0220 */ fsubd %f2,%f0,%f2 |
michael@0 | 715 | /* 0x0224 180 */ srl %o7,16,%o7 |
michael@0 | 716 | /* 0x0228 179 */ std %f2,[%o5-32] |
michael@0 | 717 | /* 0x022c 180 */ st %o7,[%sp+92] |
michael@0 | 718 | /* 0x0230 */ ld [%sp+92],%f3 |
michael@0 | 719 | /* 0x0234 */ fmovs %f0,%f2 |
michael@0 | 720 | /* 0x0238 */ fsubd %f2,%f0,%f2 |
michael@0 | 721 | /* 0x023c */ std %f2,[%o5-24] |
michael@0 | 722 | /* 0x0240 */ add %o0,4,%o0 |
michael@0 | 723 | /* 0x0244 178 */ ld [%o0],%f3 |
michael@0 | 724 | /* 0x0248 177 */ ld [%o0],%o7 |
michael@0 | 725 | /* 0x024c 178 */ fmovs %f0,%f2 |
michael@0 | 726 | /* 0x0250 */ fsubd %f2,%f0,%f2 |
michael@0 | 727 | /* 0x0254 */ std %f2,[%o3-8] |
michael@0 | 728 | /* 0x0258 179 */ and %o7,%o4,%g1 |
michael@0 | 729 | /* 0x025c */ st %g1,[%sp+96] |
michael@0 | 730 | /* 0x0260 */ ld [%sp+96],%f3 |
michael@0 | 731 | /* 0x0264 */ fmovs %f0,%f2 |
michael@0 | 732 | /* 0x0268 */ fsubd %f2,%f0,%f2 |
michael@0 | 733 | /* 0x026c 180 */ srl %o7,16,%o7 |
michael@0 | 734 | /* 0x0270 179 */ std %f2,[%o5-16] |
michael@0 | 735 | /* 0x0274 180 */ st %o7,[%sp+92] |
michael@0 | 736 | /* 0x0278 */ ld [%sp+92],%f3 |
michael@0 | 737 | /* 0x027c */ fmovs %f0,%f2 |
michael@0 | 738 | /* 0x0280 */ fsubd %f2,%f0,%f2 |
michael@0 | 739 | /* 0x0284 */ std %f2,[%o5-8] |
michael@0 | 740 | /* 0x0288 */ bl,pt %icc,.L900000411 |
michael@0 | 741 | /* 0x028c */ add %o0,4,%o0 |
michael@0 | 742 | .L900000414: |
michael@0 | 743 | /* 0x0290 180 */ cmp %g5,%i3 |
michael@0 | 744 | /* 0x0294 */ bge,pn %icc,.L77000164 |
michael@0 | 745 | /* 0x0298 */ nop |
michael@0 | 746 | .L77000161: |
michael@0 | 747 | /* 0x029c 178 */ ld [%o0],%f3 |
michael@0 | 748 | .L900000416: |
michael@0 | 749 | /* 0x02a0 178 */ ldd [%o2],%f0 |
michael@0 | 750 | /* 0x02a4 180 */ add %g5,1,%g5 |
michael@0 | 751 | /* 0x02a8 177 */ ld [%o0],%o1 |
michael@0 | 752 | /* 0x02ac 180 */ add %o0,4,%o0 |
michael@0 | 753 | /* 0x02b0 */ cmp %g5,%i3 |
michael@0 | 754 | /* 0x02b4 178 */ fmovs %f0,%f2 |
michael@0 | 755 | /* 0x02b8 179 */ and %o1,%o4,%o7 |
michael@0 | 756 | /* 0x02bc 178 */ fsubd %f2,%f0,%f2 |
michael@0 | 757 | /* 0x02c0 */ std %f2,[%o3] |
michael@0 | 758 | /* 0x02c4 180 */ srl %o1,16,%o1 |
michael@0 | 759 | /* 0x02c8 179 */ st %o7,[%sp+96] |
michael@0 | 760 | /* 0x02cc 180 */ add %o3,8,%o3 |
michael@0 | 761 | /* 0x02d0 179 */ fmovs %f0,%f2 |
michael@0 | 762 | /* 0x02d4 */ ld [%sp+96],%f3 |
michael@0 | 763 | /* 0x02d8 */ fsubd %f2,%f0,%f2 |
michael@0 | 764 | /* 0x02dc */ std %f2,[%o5] |
michael@0 | 765 | /* 0x02e0 180 */ st %o1,[%sp+92] |
michael@0 | 766 | /* 0x02e4 */ fmovs %f0,%f2 |
michael@0 | 767 | /* 0x02e8 */ ld [%sp+92],%f3 |
michael@0 | 768 | /* 0x02ec */ fsubd %f2,%f0,%f0 |
michael@0 | 769 | /* 0x02f0 */ std %f0,[%o5+8] |
michael@0 | 770 | /* 0x02f4 */ add %o5,16,%o5 |
michael@0 | 771 | /* 0x02f8 */ bl,a,pt %icc,.L900000416 |
michael@0 | 772 | /* 0x02fc */ ld [%o0],%f3 |
michael@0 | 773 | .L77000164: |
michael@0 | 774 | /* 0x0300 */ ret ! Result = |
michael@0 | 775 | /* 0x0304 */ restore %g0,%g0,%g0 |
michael@0 | 776 | /* 0x0308 0 */ .type conv_i32_to_d32_and_d16,2 |
michael@0 | 777 | /* 0x0308 */ .size conv_i32_to_d32_and_d16,(.-conv_i32_to_d32_and_d16) |
michael@0 | 778 | |
michael@0 | 779 | .section ".text",#alloc,#execinstr |
michael@0 | 780 | /* 000000 0 */ .align 4 |
michael@0 | 781 | ! |
michael@0 | 782 | ! SUBROUTINE adjust_montf_result |
michael@0 | 783 | ! |
michael@0 | 784 | ! OFFSET SOURCE LINE LABEL INSTRUCTION |
michael@0 | 785 | |
michael@0 | 786 | .global adjust_montf_result /* Leaf routine: no save, returns with retl. Arguments as used below and per the echoed C prototype: %o0 = i32, %o1 = nint, %o2 = len. */ |
michael@0 | 787 | adjust_montf_result: /* If i32[len] is nonzero, or i32[0..len-1] is not below nint[0..len-1] when compared from the top word down, subtract nint from i32 in place with borrow propagation; otherwise leave i32 untouched. */ |
michael@0 | 788 | /* 000000 */ or %g0,%o2,%g5 /* %g5 = len (copy, since %o2 is reused as scratch later) */ |
michael@0 | 789 | |
michael@0 | 790 | ! 181 ! } |
michael@0 | 791 | ! 182 !} |
michael@0 | 792 | ! 185 !void adjust_montf_result(unsigned int *i32, unsigned int *nint, int len) |
michael@0 | 793 | ! 186 !{ |
michael@0 | 794 | ! 187 !long long acc; |
michael@0 | 795 | ! 188 !int i; |
michael@0 | 796 | ! 190 ! if(i32[len]>0) i=-1; |
michael@0 | 797 | |
michael@0 | 798 | /* 0x0004 190 */ or %g0,-1,%g4 /* %g4 = i, preset to -1 */ |
michael@0 | 799 | /* 0x0008 */ sll %o2,2,%g1 /* %g1 = len*4, byte offset of i32[len] */ |
michael@0 | 800 | /* 0x000c */ ld [%o0+%g1],%g1 /* %g1 = i32[len] */ |
michael@0 | 801 | /* 0x0010 */ cmp %g1,0 |
michael@0 | 802 | /* 0x0014 */ bleu,pn %icc,.L77000175 /* unsigned <= 0, i.e. i32[len] == 0: go scan for the top differing word */ |
michael@0 | 803 | /* 0x0018 */ or %g0,%o1,%o3 /* delay slot, executed on both paths: %o3 = nint (read cursor for the simple subtract loop) */ |
michael@0 | 804 | /* 0x001c */ ba .L900000511 /* i32[len] > 0: keep i = -1 and go straight to the i<0 test */ |
michael@0 | 805 | /* 0x0020 */ cmp %g4,0 /* delay slot: set the flags that the branch at .L900000511 tests */ |
michael@0 | 806 | .L77000175: |
michael@0 | 807 | |
michael@0 | 808 | ! 191 ! else |
michael@0 | 809 | ! 192 ! { |
michael@0 | 810 | ! 193 ! for(i=len-1; i>=0; i--) |
michael@0 | 811 | |
michael@0 | 812 | /* 0x0024 193 */ sub %o2,1,%g4 /* i = len-1 */ |
michael@0 | 813 | /* 0x0028 */ sll %g4,2,%g1 /* %g1 = i*4 */ |
michael@0 | 814 | /* 0x002c */ cmp %g4,0 |
michael@0 | 815 | /* 0x0030 */ bl,pt %icc,.L900000511 /* len-1 < 0: no words to scan */ |
michael@0 | 816 | /* 0x0034 */ cmp %g4,0 /* delay slot: same compare again, flags stay valid at the target */ |
michael@0 | 817 | /* 0x0038 */ add %o1,%g1,%g2 /* %g2 = address of nint[i] */ |
michael@0 | 818 | |
michael@0 | 819 | ! 194 ! { |
michael@0 | 820 | ! 195 ! if(i32[i]!=nint[i]) break; |
michael@0 | 821 | |
michael@0 | 822 | /* 0x003c 195 */ ld [%g2],%o5 /* %o5 = nint[i], preloaded for the first iteration */ |
michael@0 | 823 | /* 0x0040 193 */ add %o0,%g1,%g3 /* %g3 = address of i32[i] */ |
michael@0 | 824 | .L900000510: |
michael@0 | 825 | /* 0x0044 195 */ ld [%g3],%o2 /* %o2 = i32[i] (len is still available in %g5) */ |
michael@0 | 826 | /* 0x0048 */ sub %g4,1,%g1 /* %g1 = i-1, candidate next index */ |
michael@0 | 827 | /* 0x004c */ sub %g2,4,%g2 /* step nint pointer down one word */ |
michael@0 | 828 | /* 0x0050 */ sub %g3,4,%g3 /* step i32 pointer down one word */ |
michael@0 | 829 | /* 0x0054 */ cmp %o2,%o5 |
michael@0 | 830 | /* 0x0058 */ bne,pn %icc,.L77000182 /* words differ: break, %g4 still holds the differing index */ |
michael@0 | 831 | /* 0x005c */ nop |
michael@0 | 832 | /* 0x0060 0 */ or %g0,%g1,%g4 /* words equal: i = i-1 */ |
michael@0 | 833 | /* 0x0064 195 */ cmp %g1,0 |
michael@0 | 834 | /* 0x0068 */ bge,a,pt %icc,.L900000510 /* continue while i >= 0 */ |
michael@0 | 835 | /* 0x006c */ ld [%g2],%o5 /* annulled delay slot: load the next nint word only when the loop repeats */ |
michael@0 | 836 | .L77000182: |
michael@0 | 837 | |
michael@0 | 838 | ! 196 ! } |
michael@0 | 839 | ! 197 ! } |
michael@0 | 840 | ! 198 ! if((i<0)||(i32[i]>nint[i])) |
michael@0 | 841 | |
michael@0 | 842 | /* 0x0070 198 */ cmp %g4,0 |
michael@0 | 843 | .L900000511: |
michael@0 | 844 | /* 0x0074 198 */ bl,pn %icc,.L77000198 /* i < 0: subtraction is required */ |
michael@0 | 845 | /* 0x0078 */ sll %g4,2,%g2 /* delay slot: %g2 = i*4 */ |
michael@0 | 846 | /* 0x007c */ ld [%o1+%g2],%g1 /* %g1 = nint[i] */ |
michael@0 | 847 | /* 0x0080 */ ld [%o0+%g2],%g2 /* %g2 = i32[i] */ |
michael@0 | 848 | /* 0x0084 */ cmp %g2,%g1 |
michael@0 | 849 | /* 0x0088 */ bleu,pt %icc,.L77000191 /* i32[i] <= nint[i] (unsigned): nothing to do, return */ |
michael@0 | 850 | /* 0x008c */ nop |
michael@0 | 851 | .L77000198: |
michael@0 | 852 | |
michael@0 | 853 | ! 199 ! { |
michael@0 | 854 | ! 200 ! acc=0; |
michael@0 | 855 | ! 201 ! for(i=0;i<len;i++) |
michael@0 | 856 | |
michael@0 | 857 | /* 0x0090 201 */ cmp %g5,0 |
michael@0 | 858 | /* 0x0094 */ ble,pt %icc,.L77000191 /* len <= 0: loop body never runs, return */ |
michael@0 | 859 | /* 0x0098 */ nop |
michael@0 | 860 | /* 0x009c */ or %g0,%g5,%g1 /* %g1 = len */ |
michael@0 | 861 | /* 0x00a0 198 */ or %g0,-1,%g2 |
michael@0 | 862 | /* 0x00a4 */ srl %g2,0,%g3 /* %g3 = mask for acc&0xffffffff (srl by 0 zero-extends the low 32 bits on V9) */ |
michael@0 | 863 | /* 0x00a8 */ sub %g5,1,%g4 /* %g4 = len-1, upper bound compared against the loop counter */ |
michael@0 | 864 | /* 0x00ac 200 */ or %g0,0,%g5 /* acc = 0 */ |
michael@0 | 865 | /* 0x00b0 201 */ or %g0,0,%o5 /* loop counter = 0 */ |
michael@0 | 866 | /* 0x00b4 198 */ or %g0,%o0,%o4 /* %o4 = i32 (cursor for the simple loop) */ |
michael@0 | 867 | /* 0x00b8 */ cmp %g1,3 |
michael@0 | 868 | /* 0x00bc 201 */ bl,pn %icc,.L77000199 /* len < 3: use the simple one-word-per-iteration loop */ |
michael@0 | 869 | /* 0x00c0 */ add %o0,8,%g1 /* delay slot: %g1 = i32+8; only used on the fall-through path, the simple loop reloads %g1 */ |
michael@0 | 870 | /* 0x00c4 */ add %o1,4,%g2 /* %g2 = nint+4 */ |
michael@0 | 871 | |
michael@0 | 872 | ! 202 ! { |
michael@0 | 873 | ! 203 ! acc=acc+(unsigned long long)(i32[i])-(unsigned long long)(nint[i]); |
michael@0 | 874 | |
michael@0 | 875 | /* 0x00c8 203 */ ld [%o0],%o2 /* prologue of the pipelined loop: %o2 = i32[0] */ |
michael@0 | 876 | /* 0x00cc */ ld [%o1],%o1 /* %o1 = nint[0] (pointer no longer needed, %g2 holds nint+4) */ |
michael@0 | 877 | /* 0x00d0 0 */ or %g0,%g1,%o4 /* %o4 = i32+8 */ |
michael@0 | 878 | /* 0x00d4 */ or %g0,%g2,%o3 /* %o3 = nint+4 */ |
michael@0 | 879 | /* 0x00d8 203 */ ld [%o0+4],%g1 /* %g1 = i32[1], preloaded for the first loop iteration */ |
michael@0 | 880 | |
michael@0 | 881 | ! 204 ! i32[i]=acc&0xffffffff; |
michael@0 | 882 | ! 205 ! acc=acc>>32; |
michael@0 | 883 | |
michael@0 | 884 | /* 0x00dc 205 */ or %g0,2,%o5 /* loop counter starts at 2: word 0 is handled here, word 1 is already loaded */ |
michael@0 | 885 | /* 0x00e0 201 */ sub %o2,%o1,%o2 /* i32[0] - nint[0] */ |
michael@0 | 886 | /* 0x00e4 */ or %g0,%o2,%g5 /* acc = that difference */ |
michael@0 | 887 | /* 0x00e8 204 */ and %o2,%g3,%o2 /* low 32 bits of acc */ |
michael@0 | 888 | /* 0x00ec */ st %o2,[%o0] /* i32[0] = low word */ |
michael@0 | 889 | /* 0x00f0 205 */ srax %g5,32,%g5 /* acc >>= 32 (arithmetic, keeps the borrow sign) */ |
michael@0 | 890 | .L900000505: |
michael@0 | 891 | /* 0x00f4 203 */ ld [%o3],%o2 /* %o2 = next nint word */ |
michael@0 | 892 | /* 0x00f8 205 */ add %o5,1,%o5 /* counter++ */ |
michael@0 | 893 | /* 0x00fc */ add %o3,4,%o3 /* advance nint pointer */ |
michael@0 | 894 | /* 0x0100 */ cmp %o5,%g4 /* counter vs len-1; flags consumed by the ble below */ |
michael@0 | 895 | /* 0x0104 */ add %o4,4,%o4 /* advance i32 pointer */ |
michael@0 | 896 | /* 0x0108 201 */ sub %g1,%o2,%g1 /* preloaded i32 word minus nint word */ |
michael@0 | 897 | /* 0x010c */ add %g1,%g5,%g5 /* acc = acc + difference */ |
michael@0 | 898 | /* 0x0110 204 */ and %g5,%g3,%o2 /* low 32 bits of acc */ |
michael@0 | 899 | /* 0x0114 203 */ ld [%o4-4],%g1 /* preload the following i32 word */ |
michael@0 | 900 | /* 0x0118 204 */ st %o2,[%o4-8] /* store low word into the i32 word just processed */ |
michael@0 | 901 | /* 0x011c 205 */ ble,pt %icc,.L900000505 /* repeat while counter <= len-1 */ |
michael@0 | 902 | /* 0x0120 */ srax %g5,32,%g5 /* delay slot, always executed: acc >>= 32 */ |
michael@0 | 903 | .L900000508: |
michael@0 | 904 | /* 0x0124 203 */ ld [%o3],%g2 /* epilogue: last nint word */ |
michael@0 | 905 | /* 0x0128 201 */ sub %g1,%g2,%g1 /* last preloaded i32 word minus nint word */ |
michael@0 | 906 | /* 0x012c */ add %g1,%g5,%g1 /* plus carried acc */ |
michael@0 | 907 | /* 0x0130 204 */ and %g1,%g3,%g2 /* low 32 bits */ |
michael@0 | 908 | /* 0x0134 */ retl ! Result = |
michael@0 | 909 | /* 0x0138 */ st %g2,[%o4-4] /* delay slot of retl: store the final word; the remaining acc is discarded */ |
michael@0 | 910 | .L77000199: |
michael@0 | 911 | /* 0x013c 203 */ ld [%o4],%g1 /* simple loop entry: %g1 = i32[0] */ |
michael@0 | 912 | .L900000509: |
michael@0 | 913 | /* 0x0140 203 */ ld [%o3],%g2 /* %g2 = current nint word */ |
michael@0 | 914 | /* 0x0144 */ add %g5,%g1,%g1 /* acc + current i32 word */ |
michael@0 | 915 | /* 0x0148 205 */ add %o5,1,%o5 /* counter++ */ |
michael@0 | 916 | /* 0x014c */ add %o3,4,%o3 /* advance nint pointer */ |
michael@0 | 917 | /* 0x0150 */ cmp %o5,%g4 /* counter vs len-1; flags consumed by the ble,a below */ |
michael@0 | 918 | /* 0x0154 203 */ sub %g1,%g2,%g1 /* minus current nint word */ |
michael@0 | 919 | /* 0x0158 204 */ and %g1,%g3,%g2 /* low 32 bits */ |
michael@0 | 920 | /* 0x015c */ st %g2,[%o4] /* store low word back into the current i32 word */ |
michael@0 | 921 | /* 0x0160 205 */ add %o4,4,%o4 /* advance i32 pointer */ |
michael@0 | 922 | /* 0x0164 */ srax %g1,32,%g5 /* acc = result >> 32 (arithmetic) */ |
michael@0 | 923 | /* 0x0168 */ ble,a,pt %icc,.L900000509 /* repeat while counter <= len-1 */ |
michael@0 | 924 | /* 0x016c */ ld [%o4],%g1 /* annulled delay slot: load the next i32 word only when the loop repeats */ |
michael@0 | 925 | .L77000191: |
michael@0 | 926 | /* 0x0170 */ retl ! Result = |
michael@0 | 927 | /* 0x0174 */ nop |
michael@0 | 928 | /* 0x0178 0 */ .type adjust_montf_result,2 |
michael@0 | 929 | /* 0x0178 */ .size adjust_montf_result,(.-adjust_montf_result) |
michael@0 | 930 | |
michael@0 | 931 | .section ".text",#alloc,#execinstr |
michael@0 | 932 | /* 000000 0 */ .align 4 |
michael@0 | 933 | /* 000000 */ .skip 16 |
michael@0 | 934 | ! |
michael@0 | 935 | ! SUBROUTINE mont_mulf_noconv |
michael@0 | 936 | ! |
michael@0 | 937 | ! OFFSET SOURCE LINE LABEL INSTRUCTION |
michael@0 | 938 | |
michael@0 | 939 | .global mont_mulf_noconv |
michael@0 | 940 | mont_mulf_noconv: |
michael@0 | 941 | /* 000000 */ save %sp,-144,%sp |
michael@0 | 942 | .L900000646: |
michael@0 | 943 | /* 0x0004 */ call .+8 |
michael@0 | 944 | /* 0x0008 */ sethi /*X*/%hi(_GLOBAL_OFFSET_TABLE_-(.L900000646-.)),%g5 |
michael@0 | 945 | |
michael@0 | 946 | ! 206 ! } |
michael@0 | 947 | ! 207 ! } |
michael@0 | 948 | ! 208 !} |
michael@0 | 949 | ! 213 !/* |
michael@0 | 950 | ! 214 !** the lengths of the input arrays should be at least the following: |
michael@0 | 951 | ! 215 !** result[nlen+1], dm1[nlen], dm2[2*nlen+1], dt[4*nlen+2], dn[nlen], nint[nlen] |
michael@0 | 952 | ! 216 !** all of them should be different from one another |
michael@0 | 953 | ! 217 !** |
michael@0 | 954 | ! 218 !*/ |
michael@0 | 955 | ! 219 !void mont_mulf_noconv(unsigned int *result, |
michael@0 | 956 | ! 220 ! double *dm1, double *dm2, double *dt, |
michael@0 | 957 | ! 221 ! double *dn, unsigned int *nint, |
michael@0 | 958 | ! 222 ! int nlen, double dn0) |
michael@0 | 959 | ! 223 !{ |
michael@0 | 960 | ! 224 ! int i, j, jj; |
michael@0 | 961 | ! 225 ! int tmp; |
michael@0 | 962 | ! 226 ! double digit, m2j, nextm2j, a, b; |
michael@0 | 963 | ! 227 ! double *dptmp, *pdm1, *pdm2, *pdn, *pdtj, pdn_0, pdm1_0; |
michael@0 | 964 | ! 229 ! pdm1=&(dm1[0]); |
michael@0 | 965 | ! 230 ! pdm2=&(dm2[0]); |
michael@0 | 966 | ! 231 ! pdn=&(dn[0]); |
michael@0 | 967 | ! 232 ! pdm2[2*nlen]=Zero; |
michael@0 | 968 | |
michael@0 | 969 | /* 0x000c 232 */ ld [%fp+92],%o1 |
michael@0 | 970 | /* 0x0010 */ sethi %hi(Zero),%g2 |
michael@0 | 971 | /* 0x0014 223 */ ldd [%fp+96],%f2 |
michael@0 | 972 | /* 0x0018 */ add %g5,/*X*/%lo(_GLOBAL_OFFSET_TABLE_-(.L900000646-.)),%g5 |
michael@0 | 973 | /* 0x001c 232 */ add %g2,%lo(Zero),%g2 |
michael@0 | 974 | /* 0x0020 223 */ st %i0,[%fp+68] |
michael@0 | 975 | /* 0x0024 */ add %g5,%o7,%o3 |
michael@0 | 976 | |
michael@0 | 977 | ! 234 ! if (nlen!=16) |
michael@0 | 978 | ! 235 ! { |
michael@0 | 979 | ! 236 ! for(i=0;i<4*nlen+2;i++) dt[i]=Zero; |
michael@0 | 980 | ! 238 ! a=dt[0]=pdm1[0]*pdm2[0]; |
michael@0 | 981 | ! 239 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16); |
michael@0 | 982 | |
michael@0 | 983 | /* 0x0028 239 */ sethi %hi(TwoToMinus16),%g3 |
michael@0 | 984 | /* 0x002c 232 */ ld [%o3+%g2],%l0 |
michael@0 | 985 | /* 0x0030 239 */ sethi %hi(TwoTo16),%g4 |
michael@0 | 986 | /* 0x0034 223 */ or %g0,%i2,%o2 |
michael@0 | 987 | /* 0x0038 */ fmovd %f2,%f16 |
michael@0 | 988 | /* 0x003c */ st %i5,[%fp+88] |
michael@0 | 989 | /* 0x0040 239 */ add %g3,%lo(TwoToMinus16),%g2 |
michael@0 | 990 | /* 0x0044 223 */ or %g0,%i1,%i2 |
michael@0 | 991 | /* 0x0048 232 */ ldd [%l0],%f0 |
michael@0 | 992 | /* 0x004c 239 */ add %g4,%lo(TwoTo16),%g3 |
michael@0 | 993 | /* 0x0050 223 */ or %g0,%i3,%o0 |
michael@0 | 994 | /* 0x0054 232 */ sll %o1,4,%g4 |
michael@0 | 995 | /* 0x0058 239 */ ld [%o3+%g2],%g5 |
michael@0 | 996 | /* 0x005c 223 */ or %g0,%i3,%i1 |
michael@0 | 997 | /* 0x0060 239 */ ld [%o3+%g3],%g1 |
michael@0 | 998 | /* 0x0064 232 */ or %g0,%o1,%i0 |
michael@0 | 999 | /* 0x0068 */ or %g0,%o2,%i3 |
michael@0 | 1000 | /* 0x006c 234 */ cmp %o1,16 |
michael@0 | 1001 | /* 0x0070 */ be,pn %icc,.L77000279 |
michael@0 | 1002 | /* 0x0074 */ std %f0,[%o2+%g4] |
michael@0 | 1003 | /* 0x0078 236 */ sll %o1,2,%g2 |
michael@0 | 1004 | /* 0x007c */ or %g0,%o0,%o3 |
michael@0 | 1005 | /* 0x0080 232 */ sll %o1,1,%o1 |
michael@0 | 1006 | /* 0x0084 236 */ add %g2,2,%o2 |
michael@0 | 1007 | /* 0x0088 */ cmp %o2,0 |
michael@0 | 1008 | /* 0x008c */ ble,a,pt %icc,.L900000660 |
michael@0 | 1009 | /* 0x0090 */ ldd [%i2],%f0 |
michael@0 | 1010 | |
michael@0 | 1011 | ! 241 ! pdtj=&(dt[0]); |
michael@0 | 1012 | ! 242 ! for(j=jj=0;j<2*nlen;j++,jj++,pdtj++) |
michael@0 | 1013 | ! 243 ! { |
michael@0 | 1014 | ! 244 ! m2j=pdm2[j]; |
michael@0 | 1015 | ! 245 ! a=pdtj[0]+pdn[0]*digit; |
michael@0 | 1016 | ! 246 ! b=pdtj[1]+pdm1[0]*pdm2[j+1]+a*TwoToMinus16; |
michael@0 | 1017 | ! 247 ! pdtj[1]=b; |
michael@0 | 1018 | ! 249 !#pragma pipeloop(0) |
michael@0 | 1019 | ! 250 ! for(i=1;i<nlen;i++) |
michael@0 | 1020 | ! 251 ! { |
michael@0 | 1021 | ! 252 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit; |
michael@0 | 1022 | ! 253 ! } |
michael@0 | 1023 | ! 254 ! if((jj==30)) {cleanup(dt,j/2+1,2*nlen+1); jj=0;} |
michael@0 | 1024 | ! 255 ! |
michael@0 | 1025 | ! 256 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16); |
michael@0 | 1026 | ! 257 ! } |
michael@0 | 1027 | ! 258 ! } |
michael@0 | 1028 | ! 259 ! else |
michael@0 | 1029 | ! 260 ! { |
michael@0 | 1030 | ! 261 ! a=dt[0]=pdm1[0]*pdm2[0]; |
michael@0 | 1031 | ! 263 ! dt[65]= dt[64]= dt[63]= dt[62]= dt[61]= dt[60]= |
michael@0 | 1032 | ! 264 ! dt[59]= dt[58]= dt[57]= dt[56]= dt[55]= dt[54]= |
michael@0 | 1033 | ! 265 ! dt[53]= dt[52]= dt[51]= dt[50]= dt[49]= dt[48]= |
michael@0 | 1034 | ! 266 ! dt[47]= dt[46]= dt[45]= dt[44]= dt[43]= dt[42]= |
michael@0 | 1035 | ! 267 ! dt[41]= dt[40]= dt[39]= dt[38]= dt[37]= dt[36]= |
michael@0 | 1036 | ! 268 ! dt[35]= dt[34]= dt[33]= dt[32]= dt[31]= dt[30]= |
michael@0 | 1037 | ! 269 ! dt[29]= dt[28]= dt[27]= dt[26]= dt[25]= dt[24]= |
michael@0 | 1038 | ! 270 ! dt[23]= dt[22]= dt[21]= dt[20]= dt[19]= dt[18]= |
michael@0 | 1039 | ! 271 ! dt[17]= dt[16]= dt[15]= dt[14]= dt[13]= dt[12]= |
michael@0 | 1040 | ! 272 ! dt[11]= dt[10]= dt[ 9]= dt[ 8]= dt[ 7]= dt[ 6]= |
michael@0 | 1041 | ! 273 ! dt[ 5]= dt[ 4]= dt[ 3]= dt[ 2]= dt[ 1]=Zero; |
michael@0 | 1042 | ! 275 ! pdn_0=pdn[0]; |
michael@0 | 1043 | ! 276 ! pdm1_0=pdm1[0]; |
michael@0 | 1044 | ! 278 ! digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16); |
michael@0 | 1045 | ! 279 ! pdtj=&(dt[0]); |
michael@0 | 1046 | ! 281 ! for(j=0;j<32;j++,pdtj++) |
michael@0 | 1047 | |
michael@0 | 1048 | /* 0x0094 281 */ add %g2,2,%o0 |
michael@0 | 1049 | /* 0x0098 236 */ add %g2,1,%o2 |
michael@0 | 1050 | /* 0x009c 281 */ cmp %o0,3 |
michael@0 | 1051 | /* 0x00a0 */ bl,pn %icc,.L77000280 |
michael@0 | 1052 | /* 0x00a4 */ or %g0,1,%o0 |
michael@0 | 1053 | /* 0x00a8 */ add %o3,8,%o3 |
michael@0 | 1054 | /* 0x00ac */ or %g0,1,%o4 |
michael@0 | 1055 | /* 0x00b0 */ std %f0,[%o3-8] |
michael@0 | 1056 | .L900000630: |
michael@0 | 1057 | /* 0x00b4 */ std %f0,[%o3] |
michael@0 | 1058 | /* 0x00b8 */ add %o4,2,%o4 |
michael@0 | 1059 | /* 0x00bc */ add %o3,16,%o3 |
michael@0 | 1060 | /* 0x00c0 */ cmp %o4,%g2 |
michael@0 | 1061 | /* 0x00c4 */ ble,pt %icc,.L900000630 |
michael@0 | 1062 | /* 0x00c8 */ std %f0,[%o3-8] |
michael@0 | 1063 | .L900000633: |
michael@0 | 1064 | /* 0x00cc */ cmp %o4,%o2 |
michael@0 | 1065 | /* 0x00d0 */ bg,pn %icc,.L77000285 |
michael@0 | 1066 | /* 0x00d4 */ add %o4,1,%o0 |
michael@0 | 1067 | .L77000280: |
michael@0 | 1068 | /* 0x00d8 */ std %f0,[%o3] |
michael@0 | 1069 | .L900000659: |
michael@0 | 1070 | /* 0x00dc */ ldd [%l0],%f0 |
michael@0 | 1071 | /* 0x00e0 */ cmp %o0,%o2 |
michael@0 | 1072 | /* 0x00e4 */ add %o3,8,%o3 |
michael@0 | 1073 | /* 0x00e8 */ add %o0,1,%o0 |
michael@0 | 1074 | /* 0x00ec */ ble,a,pt %icc,.L900000659 |
michael@0 | 1075 | /* 0x00f0 */ std %f0,[%o3] |
michael@0 | 1076 | .L77000285: |
michael@0 | 1077 | /* 0x00f4 238 */ ldd [%i2],%f0 |
michael@0 | 1078 | .L900000660: |
michael@0 | 1079 | /* 0x00f8 238 */ ldd [%i3],%f2 |
michael@0 | 1080 | /* 0x00fc */ add %o1,1,%o2 |
michael@0 | 1081 | /* 0x0100 242 */ cmp %o1,0 |
michael@0 | 1082 | /* 0x0104 */ sll %o2,1,%o0 |
michael@0 | 1083 | /* 0x0108 */ sub %o1,1,%o1 |
michael@0 | 1084 | /* 0x010c 238 */ fmuld %f0,%f2,%f0 |
michael@0 | 1085 | /* 0x0110 */ std %f0,[%i1] |
michael@0 | 1086 | /* 0x0114 0 */ or %g0,0,%l1 |
michael@0 | 1087 | /* 0x0118 */ ldd [%l0],%f6 |
michael@0 | 1088 | /* 0x011c */ or %g0,0,%g4 |
michael@0 | 1089 | /* 0x0120 */ or %g0,%o2,%i5 |
michael@0 | 1090 | /* 0x0124 */ ldd [%g5],%f2 |
michael@0 | 1091 | /* 0x0128 */ or %g0,%o1,%g3 |
michael@0 | 1092 | /* 0x012c */ or %g0,%o0,%o3 |
michael@0 | 1093 | /* 0x0130 */ fdtox %f0,%f0 |
michael@0 | 1094 | /* 0x0134 */ ldd [%g1],%f4 |
michael@0 | 1095 | /* 0x0138 246 */ add %i3,8,%o4 |
michael@0 | 1096 | /* 0x013c */ or %g0,0,%l2 |
michael@0 | 1097 | /* 0x0140 */ or %g0,%i1,%o5 |
michael@0 | 1098 | /* 0x0144 */ sub %i0,1,%o7 |
michael@0 | 1099 | /* 0x0148 */ fmovs %f6,%f0 |
michael@0 | 1100 | /* 0x014c */ fxtod %f0,%f0 |
michael@0 | 1101 | /* 0x0150 239 */ fmuld %f0,%f16,%f0 |
michael@0 | 1102 | /* 0x0154 */ fmuld %f0,%f2,%f2 |
michael@0 | 1103 | /* 0x0158 */ fdtox %f2,%f2 |
michael@0 | 1104 | /* 0x015c */ fxtod %f2,%f2 |
michael@0 | 1105 | /* 0x0160 */ fmuld %f2,%f4,%f2 |
michael@0 | 1106 | /* 0x0164 */ fsubd %f0,%f2,%f22 |
michael@0 | 1107 | /* 0x0168 242 */ ble,pt %icc,.L900000653 |
michael@0 | 1108 | /* 0x016c */ sll %i0,4,%g2 |
michael@0 | 1109 | /* 0x0170 246 */ ldd [%i4],%f0 |
michael@0 | 1110 | .L900000654: |
michael@0 | 1111 | /* 0x0174 246 */ fmuld %f0,%f22,%f8 |
michael@0 | 1112 | /* 0x0178 */ ldd [%i2],%f0 |
michael@0 | 1113 | /* 0x017c 250 */ cmp %i0,1 |
michael@0 | 1114 | /* 0x0180 246 */ ldd [%o4+%l2],%f6 |
michael@0 | 1115 | /* 0x0184 */ add %i2,8,%o0 |
michael@0 | 1116 | /* 0x0188 250 */ or %g0,1,%o1 |
michael@0 | 1117 | /* 0x018c 246 */ ldd [%o5],%f2 |
michael@0 | 1118 | /* 0x0190 */ add %o5,16,%l3 |
michael@0 | 1119 | /* 0x0194 */ fmuld %f0,%f6,%f6 |
michael@0 | 1120 | /* 0x0198 */ ldd [%g5],%f4 |
michael@0 | 1121 | /* 0x019c */ faddd %f2,%f8,%f2 |
michael@0 | 1122 | /* 0x01a0 */ ldd [%o5+8],%f0 |
michael@0 | 1123 | /* 0x01a4 244 */ ldd [%i3+%l2],%f20 |
michael@0 | 1124 | /* 0x01a8 246 */ faddd %f0,%f6,%f0 |
michael@0 | 1125 | /* 0x01ac */ fmuld %f2,%f4,%f2 |
michael@0 | 1126 | /* 0x01b0 */ faddd %f0,%f2,%f18 |
michael@0 | 1127 | /* 0x01b4 247 */ std %f18,[%o5+8] |
michael@0 | 1128 | /* 0x01b8 250 */ ble,pt %icc,.L900000658 |
michael@0 | 1129 | /* 0x01bc */ srl %g4,31,%g2 |
michael@0 | 1130 | /* 0x01c0 */ cmp %o7,7 |
michael@0 | 1131 | /* 0x01c4 246 */ add %i4,8,%g2 |
michael@0 | 1132 | /* 0x01c8 250 */ bl,pn %icc,.L77000284 |
michael@0 | 1133 | /* 0x01cc */ add %g2,24,%o2 |
michael@0 | 1134 | /* 0x01d0 252 */ ldd [%o0+24],%f12 |
michael@0 | 1135 | /* 0x01d4 */ add %o5,48,%l3 |
michael@0 | 1136 | /* 0x01d8 */ ldd [%o0],%f2 |
michael@0 | 1137 | /* 0x01dc 0 */ or %g0,%o2,%g2 |
michael@0 | 1138 | /* 0x01e0 250 */ sub %o7,2,%o2 |
michael@0 | 1139 | /* 0x01e4 252 */ ldd [%g2-24],%f0 |
michael@0 | 1140 | /* 0x01e8 */ or %g0,5,%o1 |
michael@0 | 1141 | /* 0x01ec */ ldd [%o0+8],%f6 |
michael@0 | 1142 | /* 0x01f0 */ fmuld %f2,%f20,%f2 |
michael@0 | 1143 | /* 0x01f4 */ ldd [%o0+16],%f14 |
michael@0 | 1144 | /* 0x01f8 */ fmuld %f0,%f22,%f4 |
michael@0 | 1145 | /* 0x01fc */ add %o0,32,%o0 |
michael@0 | 1146 | /* 0x0200 */ ldd [%g2-16],%f8 |
michael@0 | 1147 | /* 0x0204 */ fmuld %f6,%f20,%f10 |
michael@0 | 1148 | /* 0x0208 */ ldd [%o5+16],%f0 |
michael@0 | 1149 | /* 0x020c */ ldd [%g2-8],%f6 |
michael@0 | 1150 | /* 0x0210 */ faddd %f2,%f4,%f4 |
michael@0 | 1151 | /* 0x0214 */ ldd [%o5+32],%f2 |
michael@0 | 1152 | .L900000642: |
michael@0 | 1153 | /* 0x0218 252 */ ldd [%g2],%f24 |
michael@0 | 1154 | /* 0x021c */ add %o1,3,%o1 |
michael@0 | 1155 | /* 0x0220 */ add %g2,24,%g2 |
michael@0 | 1156 | /* 0x0224 */ fmuld %f8,%f22,%f8 |
michael@0 | 1157 | /* 0x0228 */ ldd [%l3],%f28 |
michael@0 | 1158 | /* 0x022c */ cmp %o1,%o2 |
michael@0 | 1159 | /* 0x0230 */ add %o0,24,%o0 |
michael@0 | 1160 | /* 0x0234 */ ldd [%o0-24],%f26 |
michael@0 | 1161 | /* 0x0238 */ faddd %f0,%f4,%f0 |
michael@0 | 1162 | /* 0x023c */ add %l3,48,%l3 |
michael@0 | 1163 | /* 0x0240 */ faddd %f10,%f8,%f10 |
michael@0 | 1164 | /* 0x0244 */ fmuld %f14,%f20,%f4 |
michael@0 | 1165 | /* 0x0248 */ std %f0,[%l3-80] |
michael@0 | 1166 | /* 0x024c */ ldd [%g2-16],%f8 |
michael@0 | 1167 | /* 0x0250 */ fmuld %f6,%f22,%f6 |
michael@0 | 1168 | /* 0x0254 */ ldd [%l3-32],%f0 |
michael@0 | 1169 | /* 0x0258 */ ldd [%o0-16],%f14 |
michael@0 | 1170 | /* 0x025c */ faddd %f2,%f10,%f2 |
michael@0 | 1171 | /* 0x0260 */ faddd %f4,%f6,%f10 |
michael@0 | 1172 | /* 0x0264 */ fmuld %f12,%f20,%f4 |
michael@0 | 1173 | /* 0x0268 */ std %f2,[%l3-64] |
michael@0 | 1174 | /* 0x026c */ ldd [%g2-8],%f6 |
michael@0 | 1175 | /* 0x0270 */ fmuld %f24,%f22,%f24 |
michael@0 | 1176 | /* 0x0274 */ ldd [%l3-16],%f2 |
michael@0 | 1177 | /* 0x0278 */ ldd [%o0-8],%f12 |
michael@0 | 1178 | /* 0x027c */ faddd %f28,%f10,%f10 |
michael@0 | 1179 | /* 0x0280 */ std %f10,[%l3-48] |
michael@0 | 1180 | /* 0x0284 */ fmuld %f26,%f20,%f10 |
michael@0 | 1181 | /* 0x0288 */ ble,pt %icc,.L900000642 |
michael@0 | 1182 | /* 0x028c */ faddd %f4,%f24,%f4 |
michael@0 | 1183 | .L900000645: |
michael@0 | 1184 | /* 0x0290 252 */ fmuld %f8,%f22,%f28 |
michael@0 | 1185 | /* 0x0294 */ ldd [%g2],%f24 |
michael@0 | 1186 | /* 0x0298 */ faddd %f0,%f4,%f26 |
michael@0 | 1187 | /* 0x029c */ fmuld %f12,%f20,%f8 |
michael@0 | 1188 | /* 0x02a0 */ add %l3,32,%l3 |
michael@0 | 1189 | /* 0x02a4 */ cmp %o1,%o7 |
michael@0 | 1190 | /* 0x02a8 */ fmuld %f14,%f20,%f14 |
michael@0 | 1191 | /* 0x02ac */ ldd [%l3-32],%f4 |
michael@0 | 1192 | /* 0x02b0 */ add %g2,8,%g2 |
michael@0 | 1193 | /* 0x02b4 */ faddd %f10,%f28,%f12 |
michael@0 | 1194 | /* 0x02b8 */ fmuld %f6,%f22,%f6 |
michael@0 | 1195 | /* 0x02bc */ ldd [%l3-16],%f0 |
michael@0 | 1196 | /* 0x02c0 */ fmuld %f24,%f22,%f10 |
michael@0 | 1197 | /* 0x02c4 */ std %f26,[%l3-64] |
michael@0 | 1198 | /* 0x02c8 */ faddd %f2,%f12,%f2 |
michael@0 | 1199 | /* 0x02cc */ std %f2,[%l3-48] |
michael@0 | 1200 | /* 0x02d0 */ faddd %f14,%f6,%f6 |
michael@0 | 1201 | /* 0x02d4 */ faddd %f8,%f10,%f2 |
michael@0 | 1202 | /* 0x02d8 */ faddd %f4,%f6,%f4 |
michael@0 | 1203 | /* 0x02dc */ std %f4,[%l3-32] |
michael@0 | 1204 | /* 0x02e0 */ faddd %f0,%f2,%f0 |
michael@0 | 1205 | /* 0x02e4 */ bg,pn %icc,.L77000213 |
michael@0 | 1206 | /* 0x02e8 */ std %f0,[%l3-16] |
michael@0 | 1207 | .L77000284: |
michael@0 | 1208 | /* 0x02ec 252 */ ldd [%o0],%f0 |
michael@0 | 1209 | .L900000657: |
michael@0 | 1210 | /* 0x02f0 252 */ ldd [%g2],%f4 |
michael@0 | 1211 | /* 0x02f4 */ fmuld %f0,%f20,%f2 |
michael@0 | 1212 | /* 0x02f8 */ add %o1,1,%o1 |
michael@0 | 1213 | /* 0x02fc */ ldd [%l3],%f0 |
michael@0 | 1214 | /* 0x0300 */ add %o0,8,%o0 |
michael@0 | 1215 | /* 0x0304 */ add %g2,8,%g2 |
michael@0 | 1216 | /* 0x0308 */ fmuld %f4,%f22,%f4 |
michael@0 | 1217 | /* 0x030c */ cmp %o1,%o7 |
michael@0 | 1218 | /* 0x0310 */ faddd %f2,%f4,%f2 |
michael@0 | 1219 | /* 0x0314 */ faddd %f0,%f2,%f0 |
michael@0 | 1220 | /* 0x0318 */ std %f0,[%l3] |
michael@0 | 1221 | /* 0x031c */ add %l3,16,%l3 |
michael@0 | 1222 | /* 0x0320 */ ble,a,pt %icc,.L900000657 |
michael@0 | 1223 | /* 0x0324 */ ldd [%o0],%f0 |
michael@0 | 1224 | .L77000213: |
michael@0 | 1225 | /* 0x0328 */ srl %g4,31,%g2 |
michael@0 | 1226 | .L900000658: |
michael@0 | 1227 | /* 0x032c 254 */ cmp %l1,30 |
michael@0 | 1228 | /* 0x0330 */ bne,a,pt %icc,.L900000656 |
michael@0 | 1229 | /* 0x0334 */ fdtox %f18,%f0 |
michael@0 | 1230 | /* 0x0338 */ add %g4,%g2,%g2 |
michael@0 | 1231 | /* 0x033c */ sra %g2,1,%o0 |
michael@0 | 1232 | /* 0x0340 281 */ ldd [%l0],%f0 |
michael@0 | 1233 | /* 0x0344 */ sll %i5,1,%o2 |
michael@0 | 1234 | /* 0x0348 */ add %o0,1,%g2 |
michael@0 | 1235 | /* 0x034c */ sll %g2,1,%o0 |
michael@0 | 1236 | /* 0x0350 254 */ sub %o2,1,%o2 |
michael@0 | 1237 | /* 0x0354 281 */ fmovd %f0,%f2 |
michael@0 | 1238 | /* 0x0358 */ sll %g2,4,%o1 |
michael@0 | 1239 | /* 0x035c */ cmp %o0,%o3 |
michael@0 | 1240 | /* 0x0360 */ bge,pt %icc,.L77000215 |
michael@0 | 1241 | /* 0x0364 */ or %g0,0,%l1 |
michael@0 | 1242 | /* 0x0368 254 */ add %i1,%o1,%o1 |
michael@0 | 1243 | /* 0x036c 281 */ ldd [%o1],%f6 |
michael@0 | 1244 | .L900000655: |
michael@0 | 1245 | /* 0x0370 */ fdtox %f6,%f10 |
michael@0 | 1246 | /* 0x0374 */ ldd [%o1+8],%f4 |
michael@0 | 1247 | /* 0x0378 */ add %o0,2,%o0 |
michael@0 | 1248 | /* 0x037c */ ldd [%l0],%f12 |
michael@0 | 1249 | /* 0x0380 */ fdtox %f6,%f6 |
michael@0 | 1250 | /* 0x0384 */ cmp %o0,%o2 |
michael@0 | 1251 | /* 0x0388 */ fdtox %f4,%f8 |
michael@0 | 1252 | /* 0x038c */ fdtox %f4,%f4 |
michael@0 | 1253 | /* 0x0390 */ fmovs %f12,%f10 |
michael@0 | 1254 | /* 0x0394 */ fmovs %f12,%f8 |
michael@0 | 1255 | /* 0x0398 */ fxtod %f10,%f10 |
michael@0 | 1256 | /* 0x039c */ fxtod %f8,%f8 |
michael@0 | 1257 | /* 0x03a0 */ faddd %f10,%f2,%f2 |
michael@0 | 1258 | /* 0x03a4 */ std %f2,[%o1] |
michael@0 | 1259 | /* 0x03a8 */ faddd %f8,%f0,%f0 |
michael@0 | 1260 | /* 0x03ac */ std %f0,[%o1+8] |
michael@0 | 1261 | /* 0x03b0 */ add %o1,16,%o1 |
michael@0 | 1262 | /* 0x03b4 */ fitod %f6,%f2 |
michael@0 | 1263 | /* 0x03b8 */ fitod %f4,%f0 |
michael@0 | 1264 | /* 0x03bc */ ble,a,pt %icc,.L900000655 |
michael@0 | 1265 | /* 0x03c0 */ ldd [%o1],%f6 |
michael@0 | 1266 | .L77000233: |
michael@0 | 1267 | /* 0x03c4 */ or %g0,0,%l1 |
michael@0 | 1268 | .L77000215: |
michael@0 | 1269 | /* 0x03c8 */ fdtox %f18,%f0 |
michael@0 | 1270 | .L900000656: |
michael@0 | 1271 | /* 0x03cc */ ldd [%l0],%f6 |
michael@0 | 1272 | /* 0x03d0 256 */ add %g4,1,%g4 |
michael@0 | 1273 | /* 0x03d4 */ add %l2,8,%l2 |
michael@0 | 1274 | /* 0x03d8 */ ldd [%g5],%f2 |
michael@0 | 1275 | /* 0x03dc */ add %l1,1,%l1 |
michael@0 | 1276 | /* 0x03e0 */ add %o5,8,%o5 |
michael@0 | 1277 | /* 0x03e4 */ fmovs %f6,%f0 |
michael@0 | 1278 | /* 0x03e8 */ ldd [%g1],%f4 |
michael@0 | 1279 | /* 0x03ec */ cmp %g4,%g3 |
michael@0 | 1280 | /* 0x03f0 */ fxtod %f0,%f0 |
michael@0 | 1281 | /* 0x03f4 */ fmuld %f0,%f16,%f0 |
michael@0 | 1282 | /* 0x03f8 */ fmuld %f0,%f2,%f2 |
michael@0 | 1283 | /* 0x03fc */ fdtox %f2,%f2 |
michael@0 | 1284 | /* 0x0400 */ fxtod %f2,%f2 |
michael@0 | 1285 | /* 0x0404 */ fmuld %f2,%f4,%f2 |
michael@0 | 1286 | /* 0x0408 */ fsubd %f0,%f2,%f22 |
michael@0 | 1287 | /* 0x040c */ ble,a,pt %icc,.L900000654 |
michael@0 | 1288 | /* 0x0410 */ ldd [%i4],%f0 |
michael@0 | 1289 | .L900000629: |
michael@0 | 1290 | /* 0x0414 256 */ ba .L900000653 |
michael@0 | 1291 | /* 0x0418 */ sll %i0,4,%g2 |
michael@0 | 1292 | .L77000279: |
michael@0 | 1293 | /* 0x041c 261 */ ldd [%o2],%f6 |
michael@0 | 1294 | /* 0x0420 279 */ or %g0,%o0,%o4 |
michael@0 | 1295 | /* 0x0424 281 */ or %g0,0,%o3 |
michael@0 | 1296 | /* 0x0428 261 */ ldd [%i2],%f4 |
michael@0 | 1297 | /* 0x042c 273 */ std %f0,[%o0+8] |
michael@0 | 1298 | /* 0x0430 */ std %f0,[%o0+16] |
michael@0 | 1299 | /* 0x0434 261 */ fmuld %f4,%f6,%f4 |
michael@0 | 1300 | /* 0x0438 */ std %f4,[%o0] |
michael@0 | 1301 | /* 0x043c 273 */ std %f0,[%o0+24] |
michael@0 | 1302 | /* 0x0440 */ std %f0,[%o0+32] |
michael@0 | 1303 | /* 0x0444 */ fdtox %f4,%f4 |
michael@0 | 1304 | /* 0x0448 */ std %f0,[%o0+40] |
michael@0 | 1305 | /* 0x044c */ std %f0,[%o0+48] |
michael@0 | 1306 | /* 0x0450 */ std %f0,[%o0+56] |
michael@0 | 1307 | /* 0x0454 */ std %f0,[%o0+64] |
michael@0 | 1308 | /* 0x0458 */ std %f0,[%o0+72] |
michael@0 | 1309 | /* 0x045c */ std %f0,[%o0+80] |
michael@0 | 1310 | /* 0x0460 */ std %f0,[%o0+88] |
michael@0 | 1311 | /* 0x0464 */ std %f0,[%o0+96] |
michael@0 | 1312 | /* 0x0468 */ std %f0,[%o0+104] |
michael@0 | 1313 | /* 0x046c */ std %f0,[%o0+112] |
michael@0 | 1314 | /* 0x0470 */ std %f0,[%o0+120] |
michael@0 | 1315 | /* 0x0474 */ std %f0,[%o0+128] |
michael@0 | 1316 | /* 0x0478 */ std %f0,[%o0+136] |
michael@0 | 1317 | /* 0x047c */ std %f0,[%o0+144] |
michael@0 | 1318 | /* 0x0480 */ std %f0,[%o0+152] |
michael@0 | 1319 | /* 0x0484 */ std %f0,[%o0+160] |
michael@0 | 1320 | /* 0x0488 */ std %f0,[%o0+168] |
michael@0 | 1321 | /* 0x048c */ fmovs %f0,%f4 |
michael@0 | 1322 | /* 0x0490 */ std %f0,[%o0+176] |
michael@0 | 1323 | /* 0x0494 281 */ or %g0,0,%o1 |
michael@0 | 1324 | /* 0x0498 273 */ std %f0,[%o0+184] |
michael@0 | 1325 | /* 0x049c */ fxtod %f4,%f4 |
michael@0 | 1326 | /* 0x04a0 */ std %f0,[%o0+192] |
michael@0 | 1327 | /* 0x04a4 */ std %f0,[%o0+200] |
michael@0 | 1328 | /* 0x04a8 */ std %f0,[%o0+208] |
michael@0 | 1329 | /* 0x04ac 278 */ fmuld %f4,%f2,%f2 |
michael@0 | 1330 | /* 0x04b0 273 */ std %f0,[%o0+216] |
michael@0 | 1331 | /* 0x04b4 */ std %f0,[%o0+224] |
michael@0 | 1332 | /* 0x04b8 */ std %f0,[%o0+232] |
michael@0 | 1333 | /* 0x04bc */ std %f0,[%o0+240] |
michael@0 | 1334 | /* 0x04c0 */ std %f0,[%o0+248] |
michael@0 | 1335 | /* 0x04c4 */ std %f0,[%o0+256] |
michael@0 | 1336 | /* 0x04c8 */ std %f0,[%o0+264] |
michael@0 | 1337 | /* 0x04cc */ std %f0,[%o0+272] |
michael@0 | 1338 | /* 0x04d0 */ std %f0,[%o0+280] |
michael@0 | 1339 | /* 0x04d4 */ std %f0,[%o0+288] |
michael@0 | 1340 | /* 0x04d8 */ std %f0,[%o0+296] |
michael@0 | 1341 | /* 0x04dc */ std %f0,[%o0+304] |
michael@0 | 1342 | /* 0x04e0 */ std %f0,[%o0+312] |
michael@0 | 1343 | /* 0x04e4 */ std %f0,[%o0+320] |
michael@0 | 1344 | /* 0x04e8 */ std %f0,[%o0+328] |
michael@0 | 1345 | /* 0x04ec */ std %f0,[%o0+336] |
michael@0 | 1346 | /* 0x04f0 */ std %f0,[%o0+344] |
michael@0 | 1347 | /* 0x04f4 */ std %f0,[%o0+352] |
michael@0 | 1348 | /* 0x04f8 */ std %f0,[%o0+360] |
michael@0 | 1349 | /* 0x04fc */ std %f0,[%o0+368] |
michael@0 | 1350 | /* 0x0500 */ std %f0,[%o0+376] |
michael@0 | 1351 | /* 0x0504 */ std %f0,[%o0+384] |
michael@0 | 1352 | /* 0x0508 */ std %f0,[%o0+392] |
michael@0 | 1353 | /* 0x050c */ std %f0,[%o0+400] |
michael@0 | 1354 | /* 0x0510 */ std %f0,[%o0+408] |
michael@0 | 1355 | /* 0x0514 */ std %f0,[%o0+416] |
michael@0 | 1356 | /* 0x0518 */ std %f0,[%o0+424] |
michael@0 | 1357 | /* 0x051c */ std %f0,[%o0+432] |
michael@0 | 1358 | /* 0x0520 */ std %f0,[%o0+440] |
michael@0 | 1359 | /* 0x0524 */ std %f0,[%o0+448] |
michael@0 | 1360 | /* 0x0528 */ std %f0,[%o0+456] |
michael@0 | 1361 | /* 0x052c */ std %f0,[%o0+464] |
michael@0 | 1362 | /* 0x0530 */ std %f0,[%o0+472] |
michael@0 | 1363 | /* 0x0534 */ std %f0,[%o0+480] |
michael@0 | 1364 | /* 0x0538 */ std %f0,[%o0+488] |
michael@0 | 1365 | /* 0x053c */ std %f0,[%o0+496] |
michael@0 | 1366 | /* 0x0540 */ std %f0,[%o0+504] |
michael@0 | 1367 | /* 0x0544 */ std %f0,[%o0+512] |
michael@0 | 1368 | /* 0x0548 */ std %f0,[%o0+520] |
michael@0 | 1369 | /* 0x054c */ ldd [%g5],%f0 |
michael@0 | 1370 | /* 0x0550 */ ldd [%g1],%f8 |
michael@0 | 1371 | /* 0x0554 */ fmuld %f2,%f0,%f6 |
michael@0 | 1372 | /* 0x0558 275 */ ldd [%i4],%f4 |
michael@0 | 1373 | /* 0x055c 276 */ ldd [%i2],%f0 |
michael@0 | 1374 | /* 0x0560 */ fdtox %f6,%f6 |
michael@0 | 1375 | /* 0x0564 */ fxtod %f6,%f6 |
michael@0 | 1376 | /* 0x0568 */ fmuld %f6,%f8,%f6 |
michael@0 | 1377 | /* 0x056c */ fsubd %f2,%f6,%f2 |
michael@0 | 1378 | /* 0x0570 286 */ fmuld %f4,%f2,%f12 |
michael@0 | 1379 | |
michael@0 | 1380 | ! 282 ! { |
michael@0 | 1381 | ! 284 ! m2j=pdm2[j]; |
michael@0 | 1382 | ! 285 ! a=pdtj[0]+pdn_0*digit; |
michael@0 | 1383 | ! 286 ! b=pdtj[1]+pdm1_0*pdm2[j+1]+a*TwoToMinus16; |
michael@0 | 1384 | |
michael@0 | 1385 | ! 287 ! pdtj[1]=b; |
michael@0 | 1386 | ! 289 ! /**** this loop will be fully unrolled: |
michael@0 | 1387 | ! 290 ! for(i=1;i<16;i++) |
michael@0 | 1388 | ! 291 ! { |
michael@0 | 1389 | ! 292 ! pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit; |
michael@0 | 1390 | ! 293 ! } |
michael@0 | 1391 | ! 294 ! *************************************/ |
michael@0 | 1392 | ! 295 ! pdtj[2]+=pdm1[1]*m2j+pdn[1]*digit; |
michael@0 | 1393 | ! 296 ! pdtj[4]+=pdm1[2]*m2j+pdn[2]*digit; |
michael@0 | 1394 | ! 297 ! pdtj[6]+=pdm1[3]*m2j+pdn[3]*digit; |
michael@0 | 1395 | ! 298 ! pdtj[8]+=pdm1[4]*m2j+pdn[4]*digit; |
michael@0 | 1396 | ! 299 ! pdtj[10]+=pdm1[5]*m2j+pdn[5]*digit; |
michael@0 | 1397 | ! 300 ! pdtj[12]+=pdm1[6]*m2j+pdn[6]*digit; |
michael@0 | 1398 | ! 301 ! pdtj[14]+=pdm1[7]*m2j+pdn[7]*digit; |
michael@0 | 1399 | ! 302 ! pdtj[16]+=pdm1[8]*m2j+pdn[8]*digit; |
michael@0 | 1400 | ! 303 ! pdtj[18]+=pdm1[9]*m2j+pdn[9]*digit; |
michael@0 | 1401 | ! 304 ! pdtj[20]+=pdm1[10]*m2j+pdn[10]*digit; |
michael@0 | 1402 | ! 305 ! pdtj[22]+=pdm1[11]*m2j+pdn[11]*digit; |
michael@0 | 1403 | ! 306 ! pdtj[24]+=pdm1[12]*m2j+pdn[12]*digit; |
michael@0 | 1404 | ! 307 ! pdtj[26]+=pdm1[13]*m2j+pdn[13]*digit; |
michael@0 | 1405 | ! 308 ! pdtj[28]+=pdm1[14]*m2j+pdn[14]*digit; |
michael@0 | 1406 | ! 309 ! pdtj[30]+=pdm1[15]*m2j+pdn[15]*digit; |
michael@0 | 1407 | ! 310 ! /* no need for cleanup, cannot overflow */ |
michael@0 | 1408 | ! 311 ! digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16); |
michael@0 | 1409 | |
michael@0 | 1410 | fmovd %f2,%f0 ! hand modified |
michael@0 | 1411 | fmovd %f16,%f18 ! hand modified |
michael@0 | 1412 | ldd [%i4],%f2 |
michael@0 | 1413 | ldd [%o4],%f8 |
michael@0 | 1414 | ldd [%i2],%f10 |
michael@0 | 1415 | ldd [%g5],%f14 ! hand modified |
michael@0 | 1416 | ldd [%g1],%f16 ! hand modified |
michael@0 | 1417 | ldd [%i3],%f24 |
michael@0 | 1418 | |
michael@0 | 1419 | ldd [%i2+8],%f26 |
michael@0 | 1420 | ldd [%i2+16],%f40 |
michael@0 | 1421 | ldd [%i2+48],%f46 |
michael@0 | 1422 | ldd [%i2+56],%f30 |
michael@0 | 1423 | ldd [%i2+64],%f54 |
michael@0 | 1424 | ldd [%i2+104],%f34 |
michael@0 | 1425 | ldd [%i2+112],%f58 |
michael@0 | 1426 | |
michael@0 | 1427 | ldd [%i4+8],%f28 |
michael@0 | 1428 | ldd [%i4+104],%f38 |
michael@0 | 1429 | ldd [%i4+112],%f60 |
michael@0 | 1430 | |
michael@0 | 1431 | .L99999999: !1 |
michael@0 | 1432 | ldd [%i2+24],%f32 |
michael@0 | 1433 | fmuld %f0,%f2,%f4 !2 |
michael@0 | 1434 | ldd [%i4+24],%f36 |
michael@0 | 1435 | fmuld %f26,%f24,%f20 !3 |
michael@0 | 1436 | ldd [%i2+40],%f42 |
michael@0 | 1437 | fmuld %f28,%f0,%f22 !4 |
michael@0 | 1438 | ldd [%i4+40],%f44 |
michael@0 | 1439 | fmuld %f32,%f24,%f32 !5 |
michael@0 | 1440 | ldd [%i3+8],%f6 |
michael@0 | 1441 | faddd %f4,%f8,%f4 |
michael@0 | 1442 | fmuld %f36,%f0,%f36 !6 |
michael@0 | 1443 | add %i3,8,%i3 |
michael@0 | 1444 | ldd [%i4+56],%f50 |
michael@0 | 1445 | fmuld %f42,%f24,%f42 !7 |
michael@0 | 1446 | ldd [%i2+72],%f52 |
michael@0 | 1447 | faddd %f20,%f22,%f20 |
michael@0 | 1448 | fmuld %f44,%f0,%f44 !8 |
michael@0 | 1449 | ldd [%o4+16],%f22 |
michael@0 | 1450 | fmuld %f10,%f6,%f12 !9 |
michael@0 | 1451 | ldd [%i4+72],%f56 |
michael@0 | 1452 | faddd %f32,%f36,%f32 |
michael@0 | 1453 | fmuld %f14,%f4,%f4 !10 |
michael@0 | 1454 | ldd [%o4+48],%f36 |
michael@0 | 1455 | fmuld %f30,%f24,%f48 !11 |
michael@0 | 1456 | ldd [%o4+8],%f8 |
michael@0 | 1457 | faddd %f20,%f22,%f20 |
michael@0 | 1458 | fmuld %f50,%f0,%f50 !12 |
michael@0 | 1459 | std %f20,[%o4+16] |
michael@0 | 1460 | faddd %f42,%f44,%f42 |
michael@0 | 1461 | fmuld %f52,%f24,%f52 !13 |
michael@0 | 1462 | ldd [%o4+80],%f44 |
michael@0 | 1463 | faddd %f4,%f12,%f4 |
michael@0 | 1464 | fmuld %f56,%f0,%f56 !14 |
michael@0 | 1465 | ldd [%i2+88],%f20 |
michael@0 | 1466 | faddd %f32,%f36,%f32 !15 |
michael@0 | 1467 | ldd [%i4+88],%f22 |
michael@0 | 1468 | faddd %f48,%f50,%f48 !16 |
michael@0 | 1469 | ldd [%o4+112],%f50 |
michael@0 | 1470 | faddd %f52,%f56,%f52 !17 |
michael@0 | 1471 | ldd [%o4+144],%f56 |
michael@0 | 1472 | faddd %f4,%f8,%f8 |
michael@0 | 1473 | fmuld %f20,%f24,%f20 !18 |
michael@0 | 1474 | std %f32,[%o4+48] |
michael@0 | 1475 | faddd %f42,%f44,%f42 |
michael@0 | 1476 | fmuld %f22,%f0,%f22 !19 |
michael@0 | 1477 | std %f42,[%o4+80] |
michael@0 | 1478 | faddd %f48,%f50,%f48 |
michael@0 | 1479 | fmuld %f34,%f24,%f32 !20 |
michael@0 | 1480 | std %f48,[%o4+112] |
michael@0 | 1481 | faddd %f52,%f56,%f52 |
michael@0 | 1482 | fmuld %f38,%f0,%f36 !21 |
michael@0 | 1483 | ldd [%i2+120],%f42 |
michael@0 | 1484 | fdtox %f8,%f4 !22 |
michael@0 | 1485 | std %f52,[%o4+144] |
michael@0 | 1486 | faddd %f20,%f22,%f20 !23 |
michael@0 | 1487 | ldd [%i4+120],%f44 !24 |
michael@0 | 1488 | ldd [%o4+176],%f22 |
michael@0 | 1489 | faddd %f32,%f36,%f32 |
michael@0 | 1490 | fmuld %f42,%f24,%f42 !25 |
michael@0 | 1491 | ldd [%i4+16],%f50 |
michael@0 | 1492 | fmovs %f17,%f4 !26 |
michael@0 | 1493 | ldd [%i2+32],%f52 |
michael@0 | 1494 | fmuld %f44,%f0,%f44 !27 |
michael@0 | 1495 | ldd [%i4+32],%f56 |
michael@0 | 1496 | fmuld %f40,%f24,%f48 !28 |
michael@0 | 1497 | ldd [%o4+208],%f36 |
michael@0 | 1498 | faddd %f20,%f22,%f20 |
michael@0 | 1499 | fmuld %f50,%f0,%f50 !29 |
michael@0 | 1500 | std %f20,[%o4+176] |
michael@0 | 1501 | fxtod %f4,%f4 |
michael@0 | 1502 | fmuld %f52,%f24,%f52 !30 |
michael@0 | 1503 | ldd [%i4+48],%f22 |
michael@0 | 1504 | faddd %f42,%f44,%f42 |
michael@0 | 1505 | fmuld %f56,%f0,%f56 !31 |
michael@0 | 1506 | ldd [%o4+240],%f44 |
michael@0 | 1507 | faddd %f32,%f36,%f32 !32 |
michael@0 | 1508 | std %f32,[%o4+208] |
michael@0 | 1509 | faddd %f48,%f50,%f48 |
michael@0 | 1510 | fmuld %f46,%f24,%f20 !33 |
michael@0 | 1511 | ldd [%o4+32],%f50 |
michael@0 | 1512 | fmuld %f4,%f18,%f12 !34 |
michael@0 | 1513 | ldd [%i4+64],%f36 |
michael@0 | 1514 | faddd %f52,%f56,%f52 |
michael@0 | 1515 | fmuld %f22,%f0,%f22 !35 |
michael@0 | 1516 | ldd [%o4+64],%f56 |
michael@0 | 1517 | faddd %f42,%f44,%f42 !36 |
michael@0 | 1518 | std %f42,[%o4+240] |
michael@0 | 1519 | faddd %f48,%f50,%f48 |
michael@0 | 1520 | fmuld %f54,%f24,%f32 !37 |
michael@0 | 1521 | std %f48,[%o4+32] |
michael@0 | 1522 | fmuld %f12,%f14,%f4 !38 |
michael@0 | 1523 | ldd [%i2+80],%f42 |
michael@0 | 1524 | faddd %f52,%f56,%f56 ! yes, tmp52! |
michael@0 | 1525 | fmuld %f36,%f0,%f36 !39 |
michael@0 | 1526 | ldd [%i4+80],%f44 |
michael@0 | 1527 | faddd %f20,%f22,%f20 !40 |
michael@0 | 1528 | ldd [%i2+96],%f48 |
michael@0 | 1529 | fmuld %f58,%f24,%f52 !41 |
michael@0 | 1530 | ldd [%i4+96],%f50 |
michael@0 | 1531 | fdtox %f4,%f4 |
michael@0 | 1532 | fmuld %f42,%f24,%f42 !42 |
michael@0 | 1533 | std %f56,[%o4+64] ! yes, tmp52! |
michael@0 | 1534 | faddd %f32,%f36,%f32 |
michael@0 | 1535 | fmuld %f44,%f0,%f44 !43 |
michael@0 | 1536 | ldd [%o4+96],%f22 |
michael@0 | 1537 | fmuld %f48,%f24,%f48 !44 |
michael@0 | 1538 | ldd [%o4+128],%f36 |
michael@0 | 1539 | fmovd %f6,%f24 |
michael@0 | 1540 | fmuld %f50,%f0,%f50 !45 |
michael@0 | 1541 | fxtod %f4,%f4 |
michael@0 | 1542 | fmuld %f60,%f0,%f56 !46 |
michael@0 | 1543 | add %o4,8,%o4 |
michael@0 | 1544 | faddd %f42,%f44,%f42 !47 |
michael@0 | 1545 | ldd [%o4+160-8],%f44 |
michael@0 | 1546 | faddd %f20,%f22,%f20 !48 |
michael@0 | 1547 | std %f20,[%o4+96-8] |
michael@0 | 1548 | faddd %f48,%f50,%f48 !49 |
michael@0 | 1549 | ldd [%o4+192-8],%f50 |
michael@0 | 1550 | faddd %f52,%f56,%f52 |
michael@0 | 1551 | fmuld %f4,%f16,%f4 !50 |
michael@0 | 1552 | ldd [%o4+224-8],%f56 |
michael@0 | 1553 | faddd %f32,%f36,%f32 !51 |
michael@0 | 1554 | std %f32,[%o4+128-8] |
michael@0 | 1555 | faddd %f42,%f44,%f42 !52 |
michael@0 | 1556 | add %o3,1,%o3 |
michael@0 | 1557 | std %f42,[%o4+160-8] |
michael@0 | 1558 | faddd %f48,%f50,%f48 !53 |
michael@0 | 1559 | cmp %o3,31 |
michael@0 | 1560 | std %f48,[%o4+192-8] |
michael@0 | 1561 | fsubd %f12,%f4,%f0 !54 |
michael@0 | 1562 | faddd %f52,%f56,%f52 |
michael@0 | 1563 | ble,pt %icc,.L99999999 |
michael@0 | 1564 | std %f52,[%o4+224-8] !55 |
michael@0 | 1565 | std %f8,[%o4] |
michael@0 | 1566 | |
michael@0 | 1567 | ! 312 ! } |
michael@0 | 1568 | ! 313 ! } |
michael@0 | 1569 | ! 315 ! conv_d16_to_i32(result,dt+2*nlen,(long long *)dt,nlen+1); |
michael@0 | 1570 | |
michael@0 | 1571 | /* 0x07c8 315 */ sll %i0,4,%g2 |
michael@0 | 1572 | .L900000653: |
michael@0 | 1573 | /* 0x07cc 315 */ add %i1,%g2,%i1 |
michael@0 | 1574 | /* 0x07d0 242 */ ld [%fp+68],%o0 |
michael@0 | 1575 | /* 0x07d4 315 */ or %g0,0,%o4 |
michael@0 | 1576 | /* 0x07d8 */ ldd [%i1],%f0 |
michael@0 | 1577 | /* 0x07dc */ or %g0,0,%g5 |
michael@0 | 1578 | /* 0x07e0 */ cmp %i0,0 |
michael@0 | 1579 | /* 0x07e4 242 */ or %g0,%o0,%o3 |
michael@0 | 1580 | /* 0x07e8 311 */ sub %i0,1,%g1 |
michael@0 | 1581 | /* 0x07ec 315 */ fdtox %f0,%f0 |
michael@0 | 1582 | /* 0x07f0 */ std %f0,[%sp+120] |
michael@0 | 1583 | /* 0x07f4 311 */ sethi %hi(0xfc00),%o1 |
michael@0 | 1584 | /* 0x07f8 */ add %g1,1,%g3 |
michael@0 | 1585 | /* 0x07fc */ or %g0,%o0,%g4 |
michael@0 | 1586 | /* 0x0800 315 */ ldd [%i1+8],%f0 |
michael@0 | 1587 | /* 0x0804 */ add %o1,1023,%o1 |
michael@0 | 1588 | /* 0x0808 */ fdtox %f0,%f0 |
michael@0 | 1589 | /* 0x080c */ std %f0,[%sp+112] |
michael@0 | 1590 | /* 0x0810 */ ldx [%sp+112],%o5 |
michael@0 | 1591 | /* 0x0814 */ ldx [%sp+120],%o7 |
michael@0 | 1592 | /* 0x0818 */ ble,pt %icc,.L900000651 |
michael@0 | 1593 | /* 0x081c */ sethi %hi(0xfc00),%g2 |
michael@0 | 1594 | /* 0x0820 311 */ or %g0,-1,%g2 |
michael@0 | 1595 | /* 0x0824 315 */ cmp %g3,3 |
michael@0 | 1596 | /* 0x0828 311 */ srl %g2,0,%o2 |
michael@0 | 1597 | /* 0x082c 315 */ bl,pn %icc,.L77000287 |
michael@0 | 1598 | /* 0x0830 */ or %g0,%i1,%g2 |
michael@0 | 1599 | /* 0x0834 */ ldd [%i1+16],%f0 |
michael@0 | 1600 | /* 0x0838 */ and %o5,%o1,%o0 |
michael@0 | 1601 | /* 0x083c */ add %i1,16,%g2 |
michael@0 | 1602 | /* 0x0840 */ sllx %o0,16,%g3 |
michael@0 | 1603 | /* 0x0844 */ and %o7,%o2,%o0 |
michael@0 | 1604 | /* 0x0848 */ fdtox %f0,%f0 |
michael@0 | 1605 | /* 0x084c */ std %f0,[%sp+104] |
michael@0 | 1606 | /* 0x0850 */ add %o0,%g3,%o4 |
michael@0 | 1607 | /* 0x0854 */ ldd [%i1+24],%f2 |
michael@0 | 1608 | /* 0x0858 */ srax %o5,16,%o0 |
michael@0 | 1609 | /* 0x085c */ add %o3,4,%g4 |
michael@0 | 1610 | /* 0x0860 */ stx %o0,[%sp+128] |
michael@0 | 1611 | /* 0x0864 */ and %o4,%o2,%o0 |
michael@0 | 1612 | /* 0x0868 */ stx %o0,[%sp+112] |
michael@0 | 1613 | /* 0x086c */ srax %o4,32,%o0 |
michael@0 | 1614 | /* 0x0870 */ fdtox %f2,%f0 |
michael@0 | 1615 | /* 0x0874 */ stx %o0,[%sp+136] |
michael@0 | 1616 | /* 0x0878 */ srax %o7,32,%o4 |
michael@0 | 1617 | /* 0x087c */ std %f0,[%sp+96] |
michael@0 | 1618 | /* 0x0880 */ ldx [%sp+128],%g5 |
michael@0 | 1619 | /* 0x0884 */ ldx [%sp+136],%o7 |
michael@0 | 1620 | /* 0x0888 */ ldx [%sp+104],%g3 |
michael@0 | 1621 | /* 0x088c */ add %g5,%o7,%o0 |
michael@0 | 1622 | /* 0x0890 */ or %g0,1,%g5 |
michael@0 | 1623 | /* 0x0894 */ ldx [%sp+112],%o7 |
michael@0 | 1624 | /* 0x0898 */ add %o4,%o0,%o4 |
michael@0 | 1625 | /* 0x089c */ ldx [%sp+96],%o5 |
michael@0 | 1626 | /* 0x08a0 */ st %o7,[%o3] |
michael@0 | 1627 | /* 0x08a4 */ or %g0,%g3,%o7 |
michael@0 | 1628 | .L900000634: |
michael@0 | 1629 | /* 0x08a8 */ ldd [%g2+16],%f0 |
michael@0 | 1630 | /* 0x08ac */ add %g5,1,%g5 |
michael@0 | 1631 | /* 0x08b0 */ add %g4,4,%g4 |
michael@0 | 1632 | /* 0x08b4 */ cmp %g5,%g1 |
michael@0 | 1633 | /* 0x08b8 */ add %g2,16,%g2 |
michael@0 | 1634 | /* 0x08bc */ fdtox %f0,%f0 |
michael@0 | 1635 | /* 0x08c0 */ std %f0,[%sp+104] |
michael@0 | 1636 | /* 0x08c4 */ ldd [%g2+8],%f0 |
michael@0 | 1637 | /* 0x08c8 */ fdtox %f0,%f0 |
michael@0 | 1638 | /* 0x08cc */ std %f0,[%sp+96] |
michael@0 | 1639 | /* 0x08d0 */ and %o5,%o1,%g3 |
michael@0 | 1640 | /* 0x08d4 */ sllx %g3,16,%g3 |
michael@0 | 1641 | /* 0x08d8 */ stx %g3,[%sp+120] |
michael@0 | 1642 | /* 0x08dc */ and %o7,%o2,%g3 |
michael@0 | 1643 | /* 0x08e0 */ stx %o7,[%sp+128] |
michael@0 | 1644 | /* 0x08e4 */ ldx [%sp+120],%o7 |
michael@0 | 1645 | /* 0x08e8 */ add %g3,%o7,%g3 |
michael@0 | 1646 | /* 0x08ec */ ldx [%sp+128],%o7 |
michael@0 | 1647 | /* 0x08f0 */ srax %o5,16,%o5 |
michael@0 | 1648 | /* 0x08f4 */ add %g3,%o4,%g3 |
michael@0 | 1649 | /* 0x08f8 */ srax %g3,32,%o4 |
michael@0 | 1650 | /* 0x08fc */ stx %o4,[%sp+112] |
michael@0 | 1651 | /* 0x0900 */ srax %o7,32,%o4 |
michael@0 | 1652 | /* 0x0904 */ ldx [%sp+112],%o7 |
michael@0 | 1653 | /* 0x0908 */ add %o5,%o7,%o7 |
michael@0 | 1654 | /* 0x090c */ ldx [%sp+96],%o5 |
michael@0 | 1655 | /* 0x0910 */ add %o4,%o7,%o4 |
michael@0 | 1656 | /* 0x0914 */ and %g3,%o2,%g3 |
michael@0 | 1657 | /* 0x0918 */ ldx [%sp+104],%o7 |
michael@0 | 1658 | /* 0x091c */ ble,pt %icc,.L900000634 |
michael@0 | 1659 | /* 0x0920 */ st %g3,[%g4-4] |
michael@0 | 1660 | .L900000637: |
michael@0 | 1661 | /* 0x0924 */ ba .L900000651 |
michael@0 | 1662 | /* 0x0928 */ sethi %hi(0xfc00),%g2 |
michael@0 | 1663 | .L77000287: |
michael@0 | 1664 | /* 0x092c */ ldd [%g2+16],%f0 |
michael@0 | 1665 | .L900000650: |
michael@0 | 1666 | /* 0x0930 */ and %o7,%o2,%o0 |
michael@0 | 1667 | /* 0x0934 */ and %o5,%o1,%g3 |
michael@0 | 1668 | /* 0x0938 */ fdtox %f0,%f0 |
michael@0 | 1669 | /* 0x093c */ add %o4,%o0,%o0 |
michael@0 | 1670 | /* 0x0940 */ std %f0,[%sp+104] |
michael@0 | 1671 | /* 0x0944 */ add %g5,1,%g5 |
michael@0 | 1672 | /* 0x0948 */ sllx %g3,16,%o4 |
michael@0 | 1673 | /* 0x094c */ ldd [%g2+24],%f2 |
michael@0 | 1674 | /* 0x0950 */ add %g2,16,%g2 |
michael@0 | 1675 | /* 0x0954 */ add %o0,%o4,%o4 |
michael@0 | 1676 | /* 0x0958 */ cmp %g5,%g1 |
michael@0 | 1677 | /* 0x095c */ srax %o5,16,%o0 |
michael@0 | 1678 | /* 0x0960 */ stx %o0,[%sp+112] |
michael@0 | 1679 | /* 0x0964 */ and %o4,%o2,%g3 |
michael@0 | 1680 | /* 0x0968 */ srax %o4,32,%o5 |
michael@0 | 1681 | /* 0x096c */ fdtox %f2,%f0 |
michael@0 | 1682 | /* 0x0970 */ std %f0,[%sp+96] |
michael@0 | 1683 | /* 0x0974 */ srax %o7,32,%o4 |
michael@0 | 1684 | /* 0x0978 */ ldx [%sp+112],%o7 |
michael@0 | 1685 | /* 0x097c */ add %o7,%o5,%o7 |
michael@0 | 1686 | /* 0x0980 */ ldx [%sp+104],%o5 |
michael@0 | 1687 | /* 0x0984 */ add %o4,%o7,%o4 |
michael@0 | 1688 | /* 0x0988 */ ldx [%sp+96],%o0 |
michael@0 | 1689 | /* 0x098c */ st %g3,[%g4] |
michael@0 | 1690 | /* 0x0990 */ or %g0,%o5,%o7 |
michael@0 | 1691 | /* 0x0994 */ add %g4,4,%g4 |
michael@0 | 1692 | /* 0x0998 */ or %g0,%o0,%o5 |
michael@0 | 1693 | /* 0x099c */ ble,a,pt %icc,.L900000650 |
michael@0 | 1694 | /* 0x09a0 */ ldd [%g2+16],%f0 |
michael@0 | 1695 | .L77000236: |
michael@0 | 1696 | /* 0x09a4 */ sethi %hi(0xfc00),%g2 |
michael@0 | 1697 | .L900000651: |
michael@0 | 1698 | /* 0x09a8 */ or %g0,-1,%o0 |
michael@0 | 1699 | /* 0x09ac */ add %g2,1023,%g2 |
michael@0 | 1700 | /* 0x09b0 */ ld [%fp+88],%o1 |
michael@0 | 1701 | /* 0x09b4 */ srl %o0,0,%g3 |
michael@0 | 1702 | /* 0x09b8 */ and %o5,%g2,%g2 |
michael@0 | 1703 | /* 0x09bc */ and %o7,%g3,%g4 |
michael@0 | 1704 | |
michael@0 | 1705 | ! 317 ! adjust_montf_result(result,nint,nlen); |
michael@0 | 1706 | |
michael@0 | 1707 | /* 0x09c0 317 */ or %g0,-1,%o5 |
michael@0 | 1708 | /* 0x09c4 311 */ sllx %g2,16,%g2 |
michael@0 | 1709 | /* 0x09c8 */ add %o4,%g4,%g4 |
michael@0 | 1710 | /* 0x09cc */ add %g4,%g2,%g2 |
michael@0 | 1711 | /* 0x09d0 */ sll %g5,2,%g4 |
michael@0 | 1712 | /* 0x09d4 */ and %g2,%g3,%g2 |
michael@0 | 1713 | /* 0x09d8 */ st %g2,[%o3+%g4] |
michael@0 | 1714 | /* 0x09dc 317 */ sll %i0,2,%g2 |
michael@0 | 1715 | /* 0x09e0 */ ld [%o3+%g2],%g2 |
michael@0 | 1716 | /* 0x09e4 */ cmp %g2,0 |
michael@0 | 1717 | /* 0x09e8 */ bleu,pn %icc,.L77000241 |
michael@0 | 1718 | /* 0x09ec */ or %g0,%o1,%o2 |
michael@0 | 1719 | /* 0x09f0 */ ba .L900000649 |
michael@0 | 1720 | /* 0x09f4 */ cmp %o5,0 |
michael@0 | 1721 | .L77000241: |
michael@0 | 1722 | /* 0x09f8 */ sub %i0,1,%o5 |
michael@0 | 1723 | /* 0x09fc */ sll %o5,2,%g2 |
michael@0 | 1724 | /* 0x0a00 */ cmp %o5,0 |
michael@0 | 1725 | /* 0x0a04 */ bl,pt %icc,.L900000649 |
michael@0 | 1726 | /* 0x0a08 */ cmp %o5,0 |
michael@0 | 1727 | /* 0x0a0c */ add %o1,%g2,%o1 |
michael@0 | 1728 | /* 0x0a10 */ add %o3,%g2,%o4 |
michael@0 | 1729 | /* 0x0a14 */ ld [%o1],%g2 |
michael@0 | 1730 | .L900000648: |
michael@0 | 1731 | /* 0x0a18 */ ld [%o4],%g3 |
michael@0 | 1732 | /* 0x0a1c */ sub %o5,1,%o0 |
michael@0 | 1733 | /* 0x0a20 */ sub %o1,4,%o1 |
michael@0 | 1734 | /* 0x0a24 */ sub %o4,4,%o4 |
michael@0 | 1735 | /* 0x0a28 */ cmp %g3,%g2 |
michael@0 | 1736 | /* 0x0a2c */ bne,pn %icc,.L77000244 |
michael@0 | 1737 | /* 0x0a30 */ nop |
michael@0 | 1738 | /* 0x0a34 0 */ or %g0,%o0,%o5 |
michael@0 | 1739 | /* 0x0a38 317 */ cmp %o0,0 |
michael@0 | 1740 | /* 0x0a3c */ bge,a,pt %icc,.L900000648 |
michael@0 | 1741 | /* 0x0a40 */ ld [%o1],%g2 |
michael@0 | 1742 | .L77000244: |
michael@0 | 1743 | /* 0x0a44 */ cmp %o5,0 |
michael@0 | 1744 | .L900000649: |
michael@0 | 1745 | /* 0x0a48 */ bl,pn %icc,.L77000288 |
michael@0 | 1746 | /* 0x0a4c */ sll %o5,2,%g2 |
michael@0 | 1747 | /* 0x0a50 */ ld [%o2+%g2],%g3 |
michael@0 | 1748 | /* 0x0a54 */ ld [%o3+%g2],%g2 |
michael@0 | 1749 | /* 0x0a58 */ cmp %g2,%g3 |
michael@0 | 1750 | /* 0x0a5c */ bleu,pt %icc,.L77000224 |
michael@0 | 1751 | /* 0x0a60 */ nop |
michael@0 | 1752 | .L77000288: |
michael@0 | 1753 | /* 0x0a64 */ cmp %i0,0 |
michael@0 | 1754 | /* 0x0a68 */ ble,pt %icc,.L77000224 |
michael@0 | 1755 | /* 0x0a6c */ nop |
michael@0 | 1756 | /* 0x0a70 317 */ sub %i0,1,%o7 |
michael@0 | 1757 | /* 0x0a74 */ or %g0,-1,%g2 |
michael@0 | 1758 | /* 0x0a78 */ srl %g2,0,%o4 |
michael@0 | 1759 | /* 0x0a7c */ add %o7,1,%o0 |
michael@0 | 1760 | /* 0x0a80 315 */ or %g0,0,%o5 |
michael@0 | 1761 | /* 0x0a84 */ or %g0,0,%g1 |
michael@0 | 1762 | /* 0x0a88 */ cmp %o0,3 |
michael@0 | 1763 | /* 0x0a8c */ bl,pn %icc,.L77000289 |
michael@0 | 1764 | /* 0x0a90 */ add %o3,8,%o1 |
michael@0 | 1765 | /* 0x0a94 */ add %o2,4,%o0 |
michael@0 | 1766 | /* 0x0a98 */ ld [%o1-8],%g2 |
michael@0 | 1767 | /* 0x0a9c 0 */ or %g0,%o1,%o3 |
michael@0 | 1768 | /* 0x0aa0 315 */ ld [%o0-4],%g3 |
michael@0 | 1769 | /* 0x0aa4 0 */ or %g0,%o0,%o2 |
michael@0 | 1770 | /* 0x0aa8 315 */ or %g0,2,%g1 |
michael@0 | 1771 | /* 0x0aac */ ld [%o3-4],%o0 |
michael@0 | 1772 | /* 0x0ab0 */ sub %g2,%g3,%g2 |
michael@0 | 1773 | /* 0x0ab4 */ or %g0,%g2,%o5 |
michael@0 | 1774 | /* 0x0ab8 */ and %g2,%o4,%g2 |
michael@0 | 1775 | /* 0x0abc */ st %g2,[%o3-8] |
michael@0 | 1776 | /* 0x0ac0 */ srax %o5,32,%o5 |
michael@0 | 1777 | .L900000638: |
michael@0 | 1778 | /* 0x0ac4 */ ld [%o2],%g2 |
michael@0 | 1779 | /* 0x0ac8 */ add %g1,1,%g1 |
michael@0 | 1780 | /* 0x0acc */ add %o2,4,%o2 |
michael@0 | 1781 | /* 0x0ad0 */ cmp %g1,%o7 |
michael@0 | 1782 | /* 0x0ad4 */ add %o3,4,%o3 |
michael@0 | 1783 | /* 0x0ad8 */ sub %o0,%g2,%o0 |
michael@0 | 1784 | /* 0x0adc */ add %o0,%o5,%o5 |
michael@0 | 1785 | /* 0x0ae0 */ and %o5,%o4,%g2 |
michael@0 | 1786 | /* 0x0ae4 */ ld [%o3-4],%o0 |
michael@0 | 1787 | /* 0x0ae8 */ st %g2,[%o3-8] |
michael@0 | 1788 | /* 0x0aec */ ble,pt %icc,.L900000638 |
michael@0 | 1789 | /* 0x0af0 */ srax %o5,32,%o5 |
michael@0 | 1790 | .L900000641: |
michael@0 | 1791 | /* 0x0af4 */ ld [%o2],%o1 |
michael@0 | 1792 | /* 0x0af8 */ sub %o0,%o1,%o0 |
michael@0 | 1793 | /* 0x0afc */ add %o0,%o5,%o0 |
michael@0 | 1794 | /* 0x0b00 */ and %o0,%o4,%o1 |
michael@0 | 1795 | /* 0x0b04 */ st %o1,[%o3-4] |
michael@0 | 1796 | /* 0x0b08 */ ret ! Result = |
michael@0 | 1797 | /* 0x0b0c */ restore %g0,%g0,%g0 |
michael@0 | 1798 | .L77000289: |
michael@0 | 1799 | /* 0x0b10 */ ld [%o3],%o0 |
michael@0 | 1800 | .L900000647: |
michael@0 | 1801 | /* 0x0b14 */ ld [%o2],%o1 |
michael@0 | 1802 | /* 0x0b18 */ add %o5,%o0,%o0 |
michael@0 | 1803 | /* 0x0b1c */ add %g1,1,%g1 |
michael@0 | 1804 | /* 0x0b20 */ add %o2,4,%o2 |
michael@0 | 1805 | /* 0x0b24 */ cmp %g1,%o7 |
michael@0 | 1806 | /* 0x0b28 */ sub %o0,%o1,%o0 |
michael@0 | 1807 | /* 0x0b2c */ and %o0,%o4,%o1 |
michael@0 | 1808 | /* 0x0b30 */ st %o1,[%o3] |
michael@0 | 1809 | /* 0x0b34 */ add %o3,4,%o3 |
michael@0 | 1810 | /* 0x0b38 */ srax %o0,32,%o5 |
michael@0 | 1811 | /* 0x0b3c */ ble,a,pt %icc,.L900000647 |
michael@0 | 1812 | /* 0x0b40 */ ld [%o3],%o0 |
michael@0 | 1813 | .L77000224: |
michael@0 | 1814 | /* 0x0b44 */ ret ! Result = |
michael@0 | 1815 | /* 0x0b48 */ restore %g0,%g0,%g0 |
michael@0 | 1816 | /* 0x0b4c 0 */ .type mont_mulf_noconv,2 |
michael@0 | 1817 | /* 0x0b4c */ .size mont_mulf_noconv,(.-mont_mulf_noconv) |
michael@0 | 1818 |