security/nss/lib/freebl/mpi/montmulf.s

changeset 0
6474c204b198
     1.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     1.2 +++ b/security/nss/lib/freebl/mpi/montmulf.s	Wed Dec 31 06:09:35 2014 +0100
     1.3 @@ -0,0 +1,1938 @@
     1.4 +!  
     1.5 +! This Source Code Form is subject to the terms of the Mozilla Public
     1.6 +! License, v. 2.0. If a copy of the MPL was not distributed with this
     1.7 +! file, You can obtain one at http://mozilla.org/MPL/2.0/.
     1.8 +
     1.9 +	.section	".text",#alloc,#execinstr
    1.10 +	.file	"montmulf.c"
    1.11 +
    1.12 +	.section	".data",#alloc,#write
    1.13 +	.align	8
    1.14 +TwoTo16:		/* frequency 1.0 confidence 0.0 */
    1.15 +	.word	1089470464	! 0x40F00000: high word of the double 65536.0 (2^16)
    1.16 +	.word	0	! low word
    1.17 +	.type	TwoTo16,#object
    1.18 +	.size	TwoTo16,8
    1.19 +TwoToMinus16:		/* frequency 1.0 confidence 0.0 */
    1.20 +	.word	1055916032	! 0x3EF00000: high word of the double 1.0/65536.0 (2^-16)
    1.21 +	.word	0	! low word
    1.22 +	.type	TwoToMinus16,#object
    1.23 +	.size	TwoToMinus16,8
    1.24 +Zero:		/* frequency 1.0 confidence 0.0 */	! conv_i32_to_d32_and_d16 loads [&Zero-8] and [&Zero-16], so the two objects above must stay directly in front of Zero
    1.25 +	.word	0	! high word of the double 0.0
    1.26 +	.word	0	! low word
    1.27 +	.type	Zero,#object
    1.28 +	.size	Zero,8
    1.29 +TwoTo32:		/* frequency 1.0 confidence 0.0 */
    1.30 +	.word	1106247680	! 0x41F00000: high word of the double 65536.0*65536.0 (2^32)
    1.31 +	.word	0	! low word
    1.32 +	.type	TwoTo32,#object
    1.33 +	.size	TwoTo32,8
    1.34 +TwoToMinus32:		/* frequency 1.0 confidence 0.0 */
    1.35 +	.word	1039138816	! 0x3DF00000: high word of the double 1.0/(65536.0*65536.0) (2^-32)
    1.36 +	.word	0	! low word
    1.37 +	.type	TwoToMinus32,#object
    1.38 +	.size	TwoToMinus32,8
    1.39 +
    1.40 +	.section	".text",#alloc,#execinstr
    1.41 +/* 000000	   0 ( 0  0) */		.align	4
    1.42 +! void cleanup(double *dt, int from, int tlen) -- leaf routine (no save/restore): %o0 = dt, %o1 = from, %o2 = tlen
    1.43 +! SUBROUTINE cleanup
    1.44 +! For i = 2*from, 2*from+2, ... < 2*tlen: dt[i] and dt[i+1] each keep the low 32 bits of their integer value plus the carry from the previous pair; the high 32 bits become the next carry. The carries left after the last pair are not stored.
    1.45 +! OFFSET    SOURCE LINE	LABEL	INSTRUCTION	(ISSUE TIME)	(COMPLETION TIME)
    1.46 +
    1.47 +                                   	.global cleanup
    1.48 +                                   cleanup:		/* frequency 1.0 confidence 0.0 */
    1.49 +! FILE montmulf.c
    1.50 +
    1.51 +!    1		                    !#define RF_INLINE_MACROS
    1.52 +!    3		                    !static double TwoTo16=65536.0;
    1.53 +!    4		                    !static double TwoToMinus16=1.0/65536.0;
    1.54 +!    5		                    !static double Zero=0.0;
    1.55 +!    6		                    !static double TwoTo32=65536.0*65536.0;
    1.56 +!    7		                    !static double TwoToMinus32=1.0/(65536.0*65536.0);
    1.57 +!    9		                    !#ifdef RF_INLINE_MACROS
    1.58 +!   11		                    !double upper32(double);
    1.59 +!   12		                    !double lower32(double, double);
    1.60 +!   13		                    !double mod(double, double, double);
    1.61 +!   15		                    !#else
    1.62 +!   17		                    !static double upper32(double x)
    1.63 +!   18		                    !{
    1.64 +!   19		                    !  return floor(x*TwoToMinus32);
    1.65 +!   20		                    !}
    1.66 +!   22		                    !static double lower32(double x, double y)
    1.67 +!   23		                    !{
    1.68 +!   24		                    !  return x-TwoTo32*floor(x*TwoToMinus32);
    1.69 +!   25		                    !}
    1.70 +!   27		                    !static double mod(double x, double oneoverm, double m)
    1.71 +!   28		                    !{
    1.72 +!   29		                    !  return x-m*floor(x*oneoverm);
    1.73 +!   30		                    !}
    1.74 +!   32		                    !#endif
    1.75 +!   35		                    !void cleanup(double *dt, int from, int tlen)
    1.76 +!   36		                    !{
    1.77 +!   37		                    ! int i;
    1.78 +!   38		                    ! double tmp,tmp1,x,x1;
    1.79 +!   40		                    ! tmp=tmp1=Zero;
    1.80 +
    1.81 +/* 000000	  40 ( 0  1) */		sethi	%hi(Zero),%g2	! %g2 = upper bits of &Zero
    1.82 +
    1.83 +!   41		                    ! /* original code **
    1.84 +!   42		                    ! for(i=2*from;i<2*tlen-2;i++)
    1.85 +!   43		                    !   {
    1.86 +!   44		                    !     x=dt[i];
    1.87 +!   45		                    !     dt[i]=lower32(x,Zero)+tmp1;
    1.88 +!   46		                    !     tmp1=tmp;
    1.89 +!   47		                    !     tmp=upper32(x);
    1.90 +!   48		                    !   }
    1.91 +!   49		                    ! dt[tlen-2]+=tmp1;
    1.92 +!   50		                    ! dt[tlen-1]+=tmp;
    1.93 +!   51		                    ! **end original code ***/
    1.94 +!   52		                    ! /* new code ***/
    1.95 +!   53		                    ! for(i=2*from;i<2*tlen;i+=2)
    1.96 +
    1.97 +/* 0x0004	  53 ( 1  2) */		sll	%o2,1,%g3	! %g3 = 2*tlen
    1.98 +/* 0x0008	  40 ( 1  4) */		ldd	[%g2+%lo(Zero)],%f0	! %f0:%f1 = Zero (0.0)
    1.99 +/* 0x000c	     ( 1  2) */		add	%g2,%lo(Zero),%g2	! %g2 = &Zero, kept so the loop can reload it
   1.100 +/* 0x0010	  53 ( 2  3) */		sll	%o1,1,%g4	! %g4 = i = 2*from
   1.101 +/* 0x0014	  36 ( 3  4) */		sll	%o1,4,%g1	! %g1 = from*16 = byte offset of dt[2*from]
   1.102 +/* 0x0018	  40 ( 3  4) */		fmovd	%f0,%f4	! %f4 = tmp1 = 0.0
   1.103 +/* 0x001c	  53 ( 3  4) */		cmp	%g4,%g3	! 2*from vs 2*tlen
   1.104 +/* 0x0020	     ( 3  4) */		bge,pt	%icc,.L77000116	! tprob=0.56; empty range: return without touching dt
   1.105 +/* 0x0024	     ( 4  5) */		fmovd	%f0,%f2	! (delay slot, always executed) %f2 = tmp = 0.0
   1.106 +/* 0x0028	  36 ( 4  5) */		add	%o0,%g1,%g1	! %g1 = &dt[i]
   1.107 +/* 0x002c	     ( 4  5) */		sub	%g3,1,%g3	! %g3 = 2*tlen-1 so the loop test can be i <= %g3
   1.108 +
   1.109 +!   54		                    !   {
   1.110 +!   55		                    !     x=dt[i];
   1.111 +
   1.112 +/* 0x0030	  55 ( 5  8) */		ldd	[%g1],%f8	! %f8 = x = dt[i] for the first iteration
   1.113 +                                   .L900000114:		/* frequency 6.4 confidence 0.0 */
   1.114 +/* 0x0034	     ( 0  3) */		fdtox	%f8,%f6	! %f6:%f7 = x converted to a 64-bit integer
   1.115 +
   1.116 +!   56		                    !     x1=dt[i+1];
   1.117 +
   1.118 +/* 0x0038	  56 ( 0  3) */		ldd	[%g1+8],%f10	! %f10 = x1 = dt[i+1]
   1.119 +
   1.120 +!   57		                    !     dt[i]=lower32(x,Zero)+tmp;
   1.121 +!   58		                    !     dt[i+1]=lower32(x1,Zero)+tmp1;
   1.122 +!   59		                    !     tmp=upper32(x);
   1.123 +!   60		                    !     tmp1=upper32(x1);
   1.124 +
   1.125 +/* 0x003c	  60 ( 0  1) */		add	%g4,2,%g4	! i += 2
   1.126 +/* 0x0040	     ( 1  4) */		fdtox	%f8,%f8	! second copy of (int64)x; its high word (%f8) feeds upper32(x) below
   1.127 +/* 0x0044	     ( 1  2) */		cmp	%g4,%g3	! loop test, consumed by the ble at the bottom
   1.128 +/* 0x0048	     ( 5  6) */		fmovs	%f0,%f6	! replace the high word of (int64)x with Zero's high word: only the low 32 bits remain
   1.129 +/* 0x004c	     ( 7 10) */		fxtod	%f6,%f6	! %f6 = lower32(x) as a double
   1.130 +/* 0x0050	     ( 8 11) */		fdtox	%f10,%f0	! %f0:%f1 = (int64)x1
   1.131 +/* 0x0054	  57 (10 13) */		faddd	%f6,%f2,%f2	! lower32(x) + tmp
   1.132 +/* 0x0058	     (10 11) */		std	%f2,[%g1]	! dt[i] = lower32(x) + tmp
   1.133 +/* 0x005c	     (12 15) */		ldd	[%g2],%f2	! reload Zero into %f2:%f3
   1.134 +/* 0x0060	     (14 15) */		fmovs	%f2,%f0	! clear the high word of (int64)x1
   1.135 +/* 0x0064	     (16 19) */		fxtod	%f0,%f6	! %f6 = lower32(x1) as a double
   1.136 +/* 0x0068	     (17 20) */		fdtox	%f10,%f0	! recompute (int64)x1; its high word (%f0) feeds upper32(x1)
   1.137 +/* 0x006c	     (18 21) */		fitod	%f8,%f2	! tmp = upper32(x): high 32 bits of (int64)x as a double
   1.138 +/* 0x0070	  58 (19 22) */		faddd	%f6,%f4,%f4	! lower32(x1) + tmp1
   1.139 +/* 0x0074	     (19 20) */		std	%f4,[%g1+8]	! dt[i+1] = lower32(x1) + tmp1
   1.140 +/* 0x0078	  60 (19 20) */		add	%g1,16,%g1	! advance to the next pair
   1.141 +/* 0x007c	     (20 23) */		fitod	%f0,%f4	! tmp1 = upper32(x1)
   1.142 +/* 0x0080	     (20 23) */		ldd	[%g2],%f0	! restore %f0 = Zero for the next iteration
   1.143 +/* 0x0084	     (20 21) */		ble,a,pt	%icc,.L900000114	! tprob=0.86; continue while i <= 2*tlen-1
   1.144 +/* 0x0088	     (21 24) */		ldd	[%g1],%f8	! (annulled delay slot: only when looping) x = dt[i]
   1.145 +                                   .L77000116:		/* frequency 1.0 confidence 0.0 */
   1.146 +/* 0x008c	     ( 0  2) */		retl	! Result = 
   1.147 +/* 0x0090	     ( 1  2) */		nop
   1.148 +/* 0x0094	   0 ( 0  0) */		.type	cleanup,2
   1.149 +/* 0x0094	     ( 0  0) */		.size	cleanup,(.-cleanup)
   1.150 +
   1.151 +	.section	".text",#alloc,#execinstr
   1.152 +/* 000000	   0 ( 0  0) */		.align	4
   1.153 +! void conv_d16_to_i32(unsigned int *i32, double *d16, long long *tmp, int ilen) -- after the save: %i0 = i32, %i1 = d16, %i3 = ilen; %i2 (tmp) is never referenced in this routine
   1.154 +! SUBROUTINE conv_d16_to_i32
   1.155 +! Converts d16[2*i], d16[2*i+1] to 64-bit integers a, b and emits the low 32 bits of the running sum a + (b<<16) + carry as i32[i]. Registers: %g4 = a, %g1 = b, %o4 = t1 (carry), %o7 = i, %o5 = output cursor, %g2 = d16 cursor.
   1.156 +! OFFSET    SOURCE LINE	LABEL	INSTRUCTION	(ISSUE TIME)	(COMPLETION TIME)
   1.157 +
   1.158 +                                   	.global conv_d16_to_i32
   1.159 +                                   conv_d16_to_i32:		/* frequency 1.0 confidence 0.0 */
   1.160 +/* 000000	     ( 0  1) */		save	%sp,-136,%sp	! new register window and 136-byte frame; [%sp+96 .. %sp+135] is used as scratch below
   1.161 +
   1.162 +!   61		                    !   }
   1.163 +!   62		                    !  /** end new code **/
   1.164 +!   63		                    !}
   1.165 +!   66		                    !void conv_d16_to_i32(unsigned int *i32, double *d16, long long *tmp, int ilen)
   1.166 +!   67		                    !{
   1.167 +!   68		                    !int i;
   1.168 +!   69		                    !long long t, t1, a, b, c, d;
   1.169 +!   71		                    ! t1=0;
   1.170 +!   72		                    ! a=(long long)d16[0];
   1.171 +
   1.172 +/* 0x0004	  72 ( 1  4) */		ldd	[%i1],%f0	! %f0 = d16[0]
   1.173 +
   1.174 +!   73		                    ! b=(long long)d16[1];
   1.175 +!   74		                    ! for(i=0; i<ilen-1; i++)
   1.176 +
   1.177 +/* 0x0008	  74 ( 1  2) */		sub	%i3,1,%g2	! %g2 = ilen-1
   1.178 +/* 0x000c	  67 ( 1  2) */		or	%g0,%i0,%g5	! %g5 = i32 (output base)
   1.179 +/* 0x0010	  74 ( 2  3) */		cmp	%g2,0	! ilen-1 vs 0, consumed by the ble below
   1.180 +/* 0x0014	  71 ( 2  3) */		or	%g0,0,%o4	! t1 = 0
   1.181 +/* 0x0018	  72 ( 3  6) */		fdtox	%f0,%f0	! (long long)d16[0]
   1.182 +/* 0x001c	     ( 3  4) */		std	%f0,[%sp+120]	! FP -> integer transfers go through the stack
   1.183 +/* 0x0020	  74 ( 3  4) */		or	%g0,0,%o7	! i = 0
   1.184 +/* 0x0024	  67 ( 4  5) */		or	%g0,%i3,%o0	! %o0 = ilen (overwritten by the sethi below before any use)
   1.185 +/* 0x0028	     ( 4  5) */		sub	%i3,2,%o2	! %o2 = ilen-2, the last i processed by the loops
   1.186 +/* 0x002c	  73 ( 5  8) */		ldd	[%i1+8],%f0	! %f0 = d16[1]
   1.187 +/* 0x0030	  67 ( 5  6) */		sethi	%hi(0xfc00),%o0	! %o0 = 0xfc00
   1.188 +/* 0x0034	     ( 5  6) */		add	%o2,1,%g3	! %g3 = ilen-1 = number of loop iterations
   1.189 +/* 0x0038	     ( 6  7) */		add	%o0,1023,%o1	! %o1 = 0xffff, mask for (b & 0xffff)
   1.190 +/* 0x003c	     ( 6  7) */		or	%g0,%g5,%o5	! %o5 = output cursor = &i32[0]
   1.191 +/* 0x0040	  73 ( 7 10) */		fdtox	%f0,%f0	! (long long)d16[1]
   1.192 +/* 0x0044	     ( 7  8) */		std	%f0,[%sp+112]
   1.193 +/* 0x0048	  72 (11 13) */		ldx	[%sp+120],%g4	! %g4 = a
   1.194 +/* 0x004c	  73 (12 14) */		ldx	[%sp+112],%g1	! %g1 = b
   1.195 +/* 0x0050	  74 (12 13) */		ble,pt	%icc,.L900000214	! tprob=0.56; ilen-1 <= 0: no loop iterations, go straight to the final word
   1.196 +/* 0x0054	     (12 13) */		sethi	%hi(0xfc00),%g2	! (delay slot) %g2 = 0xfc00, completed to 0xffff at .L900000214
   1.197 +/* 0x0058	  67 (13 14) */		or	%g0,-1,%g2	! %g2 = all ones
   1.198 +/* 0x005c	  74 (13 14) */		cmp	%g3,3	! fewer than 3 iterations? then use the simple loop
   1.199 +/* 0x0060	  67 (14 15) */		srl	%g2,0,%o3	! %o3 = 0xffffffff (srl by 0 clears the upper 32 bits)
   1.200 +/* 0x0064	     (14 15) */		or	%g0,%i1,%g2	! %g2 = d16 cursor
   1.201 +/* 0x0068	  74 (14 15) */		bl,pn	%icc,.L77000134	! tprob=0.44; short trip count -> simple loop
   1.202 +/* 0x006c	     (15 18) */		ldd	[%g2+16],%f0	! (delay slot) %f0 = d16[2], needed on both paths
   1.203 +
   1.204 +!   75		                    !   {
   1.205 +!   76		                    !     c=(long long)d16[2*i+2];
   1.206 +!   77		                    !     t1+=a&0xffffffff;
   1.207 +!   78		                    !     t=(a>>32);
   1.208 +!   79		                    !     d=(long long)d16[2*i+3];
   1.209 +!   80		                    !     t1+=(b&0xffff)<<16;
   1.210 +
   1.211 +/* 0x0070	  80 (15 16) */		and	%g1,%o1,%o0	! peeled iteration i = 0 starts here: b & 0xffff
   1.212 +
   1.213 +!   81		                    !     t+=(b>>16)+(t1>>32);
   1.214 +!   82		                    !     i32[i]=t1&0xffffffff;
   1.215 +!   83		                    !     t1=t;
   1.216 +!   84		                    !     a=c;
   1.217 +!   85		                    !     b=d;
   1.218 +
   1.219 +/* 0x0074	  85 (15 16) */		add	%g2,16,%g2	! advance the d16 cursor by two doubles
   1.220 +/* 0x0078	  80 (16 17) */		sllx	%o0,16,%g3	! (b & 0xffff) << 16
   1.221 +/* 0x007c	  77 (16 17) */		and	%g4,%o3,%o0	! a & 0xffffffff
   1.222 +/* 0x0080	  76 (17 20) */		fdtox	%f0,%f0	! c = (long long)d16[2]
   1.223 +/* 0x0084	     (17 18) */		std	%f0,[%sp+104]	! spill c
   1.224 +/* 0x0088	  74 (17 18) */		add	%o0,%g3,%o4	! t1 = (a & 0xffffffff) + ((b & 0xffff) << 16)   (t1 was 0)
   1.225 +/* 0x008c	  79 (18 21) */		ldd	[%g2+8],%f2	! %f2 = d16[3]
   1.226 +/* 0x0090	  81 (18 19) */		srax	%g1,16,%o0	! b >> 16
   1.227 +/* 0x0094	  82 (18 19) */		and	%o4,%o3,%o7	! %o7 = t1 & 0xffffffff, the word to be stored
   1.228 +/* 0x0098	  81 (19 20) */		stx	%o0,[%sp+112]	! park b>>16 on the stack
   1.229 +/* 0x009c	     (19 20) */		srax	%o4,32,%o0	! t1 >> 32
   1.230 +/* 0x00a0	  85 (19 20) */		add	%g5,4,%o5	! output cursor = &i32[1]
   1.231 +/* 0x00a4	  81 (20 21) */		stx	%o0,[%sp+120]	! park t1>>32 on the stack
   1.232 +/* 0x00a8	  78 (20 21) */		srax	%g4,32,%o4	! t = a >> 32
   1.233 +/* 0x00ac	  79 (20 23) */		fdtox	%f2,%f0	! d = (long long)d16[3]
   1.234 +/* 0x00b0	     (21 22) */		std	%f0,[%sp+96]	! spill d
   1.235 +/* 0x00b4	  81 (22 24) */		ldx	[%sp+112],%o0	! reload b>>16
   1.236 +/* 0x00b8	     (23 25) */		ldx	[%sp+120],%g4	! reload t1>>32
   1.237 +/* 0x00bc	  76 (25 27) */		ldx	[%sp+104],%g3	! %g3 = c
   1.238 +/* 0x00c0	  81 (25 26) */		add	%o0,%g4,%g4	! (b>>16) + (t1>>32)
   1.239 +/* 0x00c4	  79 (26 28) */		ldx	[%sp+96],%g1	! b = d
   1.240 +/* 0x00c8	  81 (26 27) */		add	%o4,%g4,%o4	! t1 = t + (b>>16) + (t1>>32)
   1.241 +/* 0x00cc	  82 (27 28) */		st	%o7,[%g5]	! i32[0] = t1 & 0xffffffff
   1.242 +/* 0x00d0	     (27 28) */		or	%g0,1,%o7	! i = 1
   1.243 +/* 0x00d4	  84 (27 28) */		or	%g0,%g3,%g4	! a = c
   1.244 +                                   .L900000209:		/* frequency 64.0 confidence 0.0 */
   1.245 +/* 0x00d8	  76 (17 19) */		ldd	[%g2+16],%f0	! main loop: %f0 = d16[2*i+2]
   1.246 +/* 0x00dc	  85 (17 18) */		add	%o7,1,%o7	! i++
   1.247 +/* 0x00e0	     (17 18) */		add	%o5,4,%o5	! advance output cursor early; the store below uses [%o5-4]
   1.248 +/* 0x00e4	     (18 18) */		cmp	%o7,%o2	! loop test, consumed by the ble at the bottom
   1.249 +/* 0x00e8	     (18 19) */		add	%g2,16,%g2	! advance the d16 cursor
   1.250 +/* 0x00ec	  76 (19 22) */		fdtox	%f0,%f0	! c
   1.251 +/* 0x00f0	     (20 21) */		std	%f0,[%sp+104]	! spill c
   1.252 +/* 0x00f4	  79 (21 23) */		ldd	[%g2+8],%f0	! d16[2*i+3]
   1.253 +/* 0x00f8	     (23 26) */		fdtox	%f0,%f0	! d
   1.254 +/* 0x00fc	     (24 25) */		std	%f0,[%sp+96]	! spill d
   1.255 +/* 0x0100	  80 (25 26) */		and	%g1,%o1,%g3	! b & 0xffff
   1.256 +/* 0x0104	     (26 27) */		sllx	%g3,16,%g3	! (b & 0xffff) << 16
   1.257 +/* 0x0108	     ( 0  0) */		stx	%g3,[%sp+120]	! park it on the stack
   1.258 +/* 0x010c	  77 (26 27) */		and	%g4,%o3,%g3	! a & 0xffffffff
   1.259 +/* 0x0110	  74 ( 0  0) */		stx	%o7,[%sp+128]	! save i: %o7 is borrowed as a temporary
   1.260 +/* 0x0114	     ( 0  0) */		ldx	[%sp+120],%o7	! %o7 = (b & 0xffff) << 16
   1.261 +/* 0x0118	     (27 27) */		add	%g3,%o7,%g3	! (a & 0xffffffff) + ((b & 0xffff) << 16)
   1.262 +/* 0x011c	     ( 0  0) */		ldx	[%sp+128],%o7	! restore i
   1.263 +/* 0x0120	  81 (28 29) */		srax	%g1,16,%g1	! b >> 16
   1.264 +/* 0x0124	  74 (28 28) */		add	%g3,%o4,%g3	! %g3 = updated t1 (previous t1 added in)
   1.265 +/* 0x0128	  81 (29 30) */		srax	%g3,32,%o4	! t1 >> 32
   1.266 +/* 0x012c	     ( 0  0) */		stx	%o4,[%sp+112]	! park t1>>32
   1.267 +/* 0x0130	  78 (30 31) */		srax	%g4,32,%o4	! t = a >> 32
   1.268 +/* 0x0134	  81 ( 0  0) */		ldx	[%sp+112],%g4	! reload t1>>32
   1.269 +/* 0x0138	     (30 31) */		add	%g1,%g4,%g4	! (b>>16) + (t1>>32)
   1.270 +/* 0x013c	  79 (31 33) */		ldx	[%sp+96],%g1	! b = d
   1.271 +/* 0x0140	  81 (31 32) */		add	%o4,%g4,%o4	! t1 = t + (b>>16) + (t1>>32)
   1.272 +/* 0x0144	  82 (32 33) */		and	%g3,%o3,%g3	! low 32 bits of the sum
   1.273 +/* 0x0148	  84 ( 0  0) */		ldx	[%sp+104],%g4	! a = c
   1.274 +/* 0x014c	  85 (33 34) */		ble,pt	%icc,.L900000209	! tprob=0.50; continue while i <= ilen-2
   1.275 +/* 0x0150	     (33 34) */		st	%g3,[%o5-4]	! (delay slot, always executed) store this iteration's output word
   1.276 +                                   .L900000212:		/* frequency 8.0 confidence 0.0 */
   1.277 +/* 0x0154	  85 ( 0  1) */		ba	.L900000214	! tprob=1.00; main loop done, emit the final word
   1.278 +/* 0x0158	     ( 0  1) */		sethi	%hi(0xfc00),%g2	! (delay slot) %g2 = 0xfc00 for the tail code
   1.279 +                                   .L77000134:		/* frequency 0.7 confidence 0.0 */
   1.280 +                                   .L900000213:		/* frequency 6.4 confidence 0.0 */
   1.281 +/* 0x015c	  77 ( 0  1) */		and	%g4,%o3,%o0	! simple loop: a & 0xffffffff
   1.282 +/* 0x0160	  80 ( 0  1) */		and	%g1,%o1,%g3	! b & 0xffff
   1.283 +/* 0x0164	  76 ( 0  3) */		fdtox	%f0,%f0	! c = (long long)d16[2*i+2]
   1.284 +/* 0x0168	  77 ( 1  2) */		add	%o4,%o0,%o0	! t1 += a & 0xffffffff
   1.285 +/* 0x016c	  76 ( 1  2) */		std	%f0,[%sp+104]	! spill c
   1.286 +/* 0x0170	  85 ( 1  2) */		add	%o7,1,%o7	! i++
   1.287 +/* 0x0174	  80 ( 2  3) */		sllx	%g3,16,%o4	! (b & 0xffff) << 16
   1.288 +/* 0x0178	  79 ( 2  5) */		ldd	[%g2+24],%f2	! %f2 = d16[2*i+3]
   1.289 +/* 0x017c	  85 ( 2  3) */		add	%g2,16,%g2	! advance the d16 cursor
   1.290 +/* 0x0180	  80 ( 3  4) */		add	%o0,%o4,%o4	! t1 += (b & 0xffff) << 16
   1.291 +/* 0x0184	  81 ( 3  4) */		stx	%o7,[%sp+128]	! save i: %o7 is borrowed as a temporary
   1.292 +/* 0x0188	     ( 4  5) */		srax	%g1,16,%o0	! b >> 16
   1.293 +/* 0x018c	     ( 4  5) */		stx	%o0,[%sp+112]	! park b>>16
   1.294 +/* 0x0190	  82 ( 4  5) */		and	%o4,%o3,%g3	! %g3 = t1 & 0xffffffff, the word to be stored
   1.295 +/* 0x0194	  81 ( 5  6) */		srax	%o4,32,%o0	! t1 >> 32
   1.296 +/* 0x0198	     ( 5  6) */		stx	%o0,[%sp+120]	! park t1>>32
   1.297 +/* 0x019c	  79 ( 5  8) */		fdtox	%f2,%f0	! d
   1.298 +/* 0x01a0	     ( 6  7) */		std	%f0,[%sp+96]	! spill d
   1.299 +/* 0x01a4	  78 ( 6  7) */		srax	%g4,32,%o4	! t = a >> 32
   1.300 +/* 0x01a8	  81 ( 7  9) */		ldx	[%sp+120],%o7	! %o7 = t1>>32
   1.301 +/* 0x01ac	     ( 8 10) */		ldx	[%sp+112],%g4	! %g4 = b>>16
   1.302 +/* 0x01b0	  76 (10 12) */		ldx	[%sp+104],%g1	! %g1 = c
   1.303 +/* 0x01b4	  81 (10 11) */		add	%g4,%o7,%g4	! (b>>16) + (t1>>32)
   1.304 +/* 0x01b8	     (11 13) */		ldx	[%sp+128],%o7	! restore i
   1.305 +/* 0x01bc	     (11 12) */		add	%o4,%g4,%o4	! t1 = t + (b>>16) + (t1>>32)
   1.306 +/* 0x01c0	  79 (12 14) */		ldx	[%sp+96],%o0	! %o0 = d
   1.307 +/* 0x01c4	  84 (12 13) */		or	%g0,%g1,%g4	! a = c
   1.308 +/* 0x01c8	  82 (13 14) */		st	%g3,[%o5]	! store this iteration's output word
   1.309 +/* 0x01cc	  85 (13 14) */		add	%o5,4,%o5	! advance output cursor
   1.310 +/* 0x01d0	     (13 14) */		cmp	%o7,%o2	! i vs ilen-2
   1.311 +/* 0x01d4	     (14 15) */		or	%g0,%o0,%g1	! b = d
   1.312 +/* 0x01d8	     (14 15) */		ble,a,pt	%icc,.L900000213	! tprob=0.86; continue while i <= ilen-2
   1.313 +/* 0x01dc	     (14 17) */		ldd	[%g2+16],%f0	! (annulled delay slot: only when looping) next d16[2*i+2]
   1.314 +                                   .L77000127:		/* frequency 1.0 confidence 0.0 */
   1.315 +
   1.316 +!   86		                    !   }
   1.317 +!   87		                    !     t1+=a&0xffffffff;
   1.318 +!   88		                    !     t=(a>>32);
   1.319 +!   89		                    !     t1+=(b&0xffff)<<16;
   1.320 +!   90		                    !     i32[i]=t1&0xffffffff;
   1.321 +
   1.322 +/* 0x01e0	  90 ( 0  1) */		sethi	%hi(0xfc00),%g2	! %g2 = 0xfc00
   1.323 +                                   .L900000214:		/* frequency 1.0 confidence 0.0 */
   1.324 +/* 0x01e4	  90 ( 0  1) */		or	%g0,-1,%g3	! tail: every path arrives with %g2 = 0xfc00; %g3 = all ones
   1.325 +/* 0x01e8	     ( 0  1) */		add	%g2,1023,%g2	! %g2 = 0xffff
   1.326 +/* 0x01ec	     ( 1  2) */		srl	%g3,0,%g3	! %g3 = 0xffffffff
   1.327 +/* 0x01f0	     ( 1  2) */		and	%g1,%g2,%g2	! b & 0xffff
   1.328 +/* 0x01f4	     ( 2  3) */		and	%g4,%g3,%g4	! a & 0xffffffff
   1.329 +/* 0x01f8	     ( 3  4) */		sllx	%g2,16,%g2	! (b & 0xffff) << 16
   1.330 +/* 0x01fc	     ( 3  4) */		add	%o4,%g4,%g4	! t1 + (a & 0xffffffff)
   1.331 +/* 0x0200	     ( 4  5) */		add	%g4,%g2,%g2	! ... + ((b & 0xffff) << 16)
   1.332 +/* 0x0204	     ( 5  6) */		sll	%o7,2,%g4	! byte offset of i32[i]
   1.333 +/* 0x0208	     ( 5  6) */		and	%g2,%g3,%g2	! keep the low 32 bits
   1.334 +/* 0x020c	     ( 6  7) */		st	%g2,[%g5+%g4]	! i32[i] = t1 & 0xffffffff
   1.335 +/* 0x0210	     ( 7  9) */		ret	! Result = 
   1.336 +/* 0x0214	     ( 9 10) */		restore	%g0,%g0,%g0
   1.337 +/* 0x0218	   0 ( 0  0) */		.type	conv_d16_to_i32,2
   1.338 +/* 0x0218	     ( 0  0) */		.size	conv_d16_to_i32,(.-conv_d16_to_i32)
   1.339 +
   1.340 +	.section	".text",#alloc,#execinstr
   1.341 +/* 000000	   0 ( 0  0) */		.align	8
   1.342 +! The one constant below is the double 2^52; conv_i32_to_d32 uses it to turn 32-bit integers into doubles without an integer-to-FP convert instruction.
   1.343 +! CONSTANT POOL
   1.344 +!
   1.345 +                                   .L_const_seg_900000301:		/* frequency 1.0 confidence 0.0 */
   1.346 +/* 000000	   0 ( 0  0) */		.word	1127219200,0	! 0x43300000,0x00000000 = 2^52 as an IEEE-754 double
   1.347 +/* 0x0008	   0 ( 0  0) */		.align	4
   1.348 +! void conv_i32_to_d32(double *d32, unsigned int *i32, int len) -- leaf routine: %o0 = d32, %o1 = i32, %o2 = len
   1.349 +! SUBROUTINE conv_i32_to_d32
   1.350 +! Each i32[i] is loaded into the low word of a register pair whose high word is that of 2^52, giving the double 2^52 + i32[i]; subtracting 2^52 leaves (double)i32[i]. len >= 9 takes a loop unrolled five times, otherwise a one-element loop.
   1.351 +! OFFSET    SOURCE LINE	LABEL	INSTRUCTION	(ISSUE TIME)	(COMPLETION TIME)
   1.352 +
   1.353 +                                   	.global conv_i32_to_d32
   1.354 +                                   conv_i32_to_d32:		/* frequency 1.0 confidence 0.0 */
   1.355 +/* 000000	     ( 0  1) */		orcc	%g0,%o2,%g1	! %g1 = len, and set condition codes on len
   1.356 +
   1.357 +!   92		                    !}
   1.358 +!   94		                    !void conv_i32_to_d32(double *d32, unsigned int *i32, int len)
   1.359 +!   95		                    !{
   1.360 +!   96		                    !int i;
   1.361 +!   98		                    !#pragma pipeloop(0)
   1.362 +!   99		                    ! for(i=0;i<len;i++) d32[i]=(double)(i32[i]);
   1.363 +
   1.364 +/* 0x0004	  99 ( 0  1) */		ble,pt	%icc,.L77000140	! tprob=0.56; len <= 0: nothing to do
   1.365 +/* 0x0008	     ( 0  1) */		nop
   1.366 +/* 0x000c	     ( 1  2) */		sethi	%hi(.L_const_seg_900000301),%g2	! %g2 = upper bits of the constant's address
   1.367 +/* 0x0010	  95 ( 1  2) */		or	%g0,%o1,%g4	! %g4 = input cursor = i32
   1.368 +/* 0x0014	  99 ( 2  3) */		add	%g2,%lo(.L_const_seg_900000301),%g2	! %g2 = address of the 2^52 constant
   1.369 +/* 0x0018	     ( 2  3) */		or	%g0,0,%o5	! i = 0
   1.370 +/* 0x001c	  95 ( 3  4) */		or	%g0,%o0,%g5	! %g5 = output cursor = d32
   1.371 +/* 0x0020	  99 ( 3  4) */		sub	%o2,1,%g3	! %g3 = len-1, the last valid index
   1.372 +/* 0x0024	     ( 4  5) */		cmp	%o2,9	! fewer than 9 elements? then use the one-element loop
   1.373 +/* 0x0028	     ( 4  5) */		bl,pn	%icc,.L77000144	! tprob=0.44
   1.374 +/* 0x002c	     ( 4  7) */		ldd	[%g2],%f8	! (delay slot, always executed) %f8:%f9 = 2^52
   1.375 +/* 0x0030	     ( 5  8) */		ld	[%o1],%f7	! preload i32[0] into the low word of %f6:%f7
   1.376 +/* 0x0034	     ( 5  6) */		add	%o1,16,%g4	! input cursor = &i32[4]
   1.377 +/* 0x0038	     ( 5  6) */		sub	%o2,5,%g1	! %g1 = len-5, bound for the unrolled loop
   1.378 +/* 0x003c	     ( 6  9) */		ld	[%o1+4],%f5	! preload i32[1] into the low word of %f4:%f5
   1.379 +/* 0x0040	     ( 6  7) */		or	%g0,4,%o5	! i = 4: four elements are already loaded
   1.380 +/* 0x0044	     ( 7 10) */		ld	[%o1+8],%f3	! preload i32[2] into the low word of %f2:%f3
   1.381 +/* 0x0048	     ( 7  8) */		fmovs	%f8,%f6	! high word of %f6:%f7 = high word of 2^52
   1.382 +/* 0x004c	     ( 8 11) */		ld	[%o1+12],%f1	! preload i32[3] into the low word of %f0:%f1
   1.383 +                                   .L900000305:		/* frequency 64.0 confidence 0.0 */
   1.384 +/* 0x0050	     ( 8 16) */		ld	[%g4],%f11	! fifth element of this group -> low word of %f10:%f11
   1.385 +/* 0x0054	     ( 8  9) */		add	%o5,5,%o5	! i += 5
   1.386 +/* 0x0058	     ( 8  9) */		add	%g4,20,%g4	! input cursor += 5 words; the loads below use negative offsets
   1.387 +/* 0x005c	     ( 8 11) */		fsubd	%f6,%f8,%f6	! (2^52 + u) - 2^52 = (double)u, first element
   1.388 +/* 0x0060	     ( 9 10) */		std	%f6,[%g5]	! store first result
   1.389 +/* 0x0064	     ( 9  9) */		cmp	%o5,%g1	! loop test, consumed by the ble at the bottom
   1.390 +/* 0x0068	     ( 9 10) */		add	%g5,40,%g5	! output cursor += 5 doubles; the stores below use negative offsets
   1.391 +/* 0x006c	     ( 0  0) */		fmovs	%f8,%f4	! complete %f4:%f5 = 2^52 + second element
   1.392 +/* 0x0070	     (10 18) */		ld	[%g4-16],%f7	! preload the next group's first element
   1.393 +/* 0x0074	     (10 13) */		fsubd	%f4,%f8,%f12	! second element as a double
   1.394 +/* 0x0078	     ( 0  0) */		fmovs	%f8,%f2	! complete %f2:%f3 = 2^52 + third element
   1.395 +/* 0x007c	     (11 12) */		std	%f12,[%g5-32]	! store second result
   1.396 +/* 0x0080	     (12 20) */		ld	[%g4-12],%f5	! preload the next group's second element
   1.397 +/* 0x0084	     (12 15) */		fsubd	%f2,%f8,%f12	! third element as a double
   1.398 +/* 0x0088	     ( 0  0) */		fmovs	%f8,%f0	! complete %f0:%f1 = 2^52 + fourth element
   1.399 +/* 0x008c	     (13 14) */		std	%f12,[%g5-24]	! store third result
   1.400 +/* 0x0090	     (14 22) */		ld	[%g4-8],%f3	! preload the next group's third element
   1.401 +/* 0x0094	     (14 17) */		fsubd	%f0,%f8,%f12	! fourth element as a double
   1.402 +/* 0x0098	     ( 0  0) */		fmovs	%f8,%f10	! complete %f10:%f11 = 2^52 + fifth element
   1.403 +/* 0x009c	     (15 16) */		std	%f12,[%g5-16]	! store fourth result
   1.404 +/* 0x00a0	     (16 24) */		ld	[%g4-4],%f1	! preload the next group's fourth element
   1.405 +/* 0x00a4	     (16 19) */		fsubd	%f10,%f8,%f10	! fifth element as a double
   1.406 +/* 0x00a8	     ( 0  0) */		fmovs	%f8,%f6	! complete %f6:%f7 for the next group's first element
   1.407 +/* 0x00ac	     (17 18) */		ble,pt	%icc,.L900000305	! tprob=0.50; continue while i <= len-5
   1.408 +/* 0x00b0	     (17 18) */		std	%f10,[%g5-8]	! (delay slot, always executed) store fifth result
   1.409 +                                   .L900000308:		/* frequency 8.0 confidence 0.0 */
   1.410 +/* 0x00b4	     ( 0  1) */		fmovs	%f8,%f4	! drain: convert and store the four elements still held in registers
   1.411 +/* 0x00b8	     ( 0  1) */		add	%g5,32,%g5	! output cursor += 4 doubles
   1.412 +/* 0x00bc	     ( 0  1) */		cmp	%o5,%g3	! i vs len-1: any elements left for the one-element loop?
   1.413 +/* 0x00c0	     ( 1  2) */		fmovs	%f8,%f2
   1.414 +/* 0x00c4	     ( 2  3) */		fmovs	%f8,%f0
   1.415 +/* 0x00c8	     ( 4  7) */		fsubd	%f6,%f8,%f6
   1.416 +/* 0x00cc	     ( 4  5) */		std	%f6,[%g5-32]
   1.417 +/* 0x00d0	     ( 5  8) */		fsubd	%f4,%f8,%f4
   1.418 +/* 0x00d4	     ( 5  6) */		std	%f4,[%g5-24]
   1.419 +/* 0x00d8	     ( 6  9) */		fsubd	%f2,%f8,%f2
   1.420 +/* 0x00dc	     ( 6  7) */		std	%f2,[%g5-16]
   1.421 +/* 0x00e0	     ( 7 10) */		fsubd	%f0,%f8,%f0
   1.422 +/* 0x00e4	     ( 7  8) */		bg,pn	%icc,.L77000140	! tprob=0.14; i > len-1: all elements done
   1.423 +/* 0x00e8	     ( 7  8) */		std	%f0,[%g5-8]	! (delay slot, always executed) store the last drained result
   1.424 +                                   .L77000144:		/* frequency 0.7 confidence 0.0 */
   1.425 +/* 0x00ec	     ( 0  3) */		ld	[%g4],%f1	! one-element loop: i32[i] -> low word of %f0:%f1
   1.426 +                                   .L900000309:		/* frequency 6.4 confidence 0.0 */
   1.427 +/* 0x00f0	     ( 0  3) */		ldd	[%g2],%f8	! %f8:%f9 = 2^52 (reloaded every iteration)
   1.428 +/* 0x00f4	     ( 0  1) */		add	%o5,1,%o5	! i++
   1.429 +/* 0x00f8	     ( 0  1) */		add	%g4,4,%g4	! advance input cursor
   1.430 +/* 0x00fc	     ( 1  2) */		cmp	%o5,%g3	! i vs len-1
   1.431 +/* 0x0100	     ( 2  3) */		fmovs	%f8,%f0	! %f0:%f1 = 2^52 + i32[i]
   1.432 +/* 0x0104	     ( 4  7) */		fsubd	%f0,%f8,%f0	! (double)i32[i]
   1.433 +/* 0x0108	     ( 4  5) */		std	%f0,[%g5]	! d32[i] = result
   1.434 +/* 0x010c	     ( 4  5) */		add	%g5,8,%g5	! advance output cursor
   1.435 +/* 0x0110	     ( 4  5) */		ble,a,pt	%icc,.L900000309	! tprob=0.86; continue while i <= len-1
   1.436 +/* 0x0114	     ( 6  9) */		ld	[%g4],%f1	! (annulled delay slot: only when looping) next i32[i]
   1.437 +                                   .L77000140:		/* frequency 1.0 confidence 0.0 */
   1.438 +/* 0x0118	     ( 0  2) */		retl	! Result = 
   1.439 +/* 0x011c	     ( 1  2) */		nop
   1.440 +/* 0x0120	   0 ( 0  0) */		.type	conv_i32_to_d32,2
   1.441 +/* 0x0120	     ( 0  0) */		.size	conv_i32_to_d32,(.-conv_i32_to_d32)
   1.442 +
   1.443 +	.section	".text",#alloc,#execinstr
   1.444 +/* 000000	   0 ( 0  0) */		.align	8
   1.445 +! The one constant below is the double 2^52; conv_i32_to_d16 uses it to turn 16-bit halves of each input word into doubles.
   1.446 +! CONSTANT POOL
   1.447 +!
   1.448 +                                   .L_const_seg_900000401:		/* frequency 1.0 confidence 0.0 */
   1.449 +/* 000000	   0 ( 0  0) */		.word	1127219200,0	! 0x43300000,0x00000000 = 2^52 as an IEEE-754 double
   1.450 +/* 0x0008	   0 ( 0  0) */		.align	4
   1.451 +! void conv_i32_to_d16(double *d16, unsigned int *i32, int len) -- after the save: %i0 = d16, %i1 = i32, %i2 = len
   1.452 +! SUBROUTINE conv_i32_to_d16
   1.453 +! For each a = i32[i]: d16[2*i] = (double)(a & 0xffff), d16[2*i+1] = (double)(a >> 16). Each half is written to a stack word, reloaded as the low word of a pair whose high word is that of 2^52, and 2^52 is subtracted.
   1.454 +! OFFSET    SOURCE LINE	LABEL	INSTRUCTION	(ISSUE TIME)	(COMPLETION TIME)
   1.455 +
   1.456 +                                   	.global conv_i32_to_d16
   1.457 +                                   conv_i32_to_d16:		/* frequency 1.0 confidence 0.0 */
   1.458 +/* 000000	     ( 0  1) */		save	%sp,-104,%sp	! new register window and 104-byte frame; [%sp+92] and [%sp+96] are the scratch words used below
   1.459 +/* 0x0004	     ( 1  2) */		orcc	%g0,%i2,%o0	! %o0 = len, and set condition codes on len
   1.460 +
   1.461 +!  100		                    !}
   1.462 +!  103		                    !void conv_i32_to_d16(double *d16, unsigned int *i32, int len)
   1.463 +!  104		                    !{
   1.464 +!  105		                    !int i;
   1.465 +!  106		                    !unsigned int a;
   1.466 +!  108		                    !#pragma pipeloop(0)
   1.467 +!  109		                    ! for(i=0;i<len;i++)
   1.468 +
   1.469 +/* 0x0008	 109 ( 1  2) */		ble,pt	%icc,.L77000150	! tprob=0.56; len <= 0: nothing to do
   1.470 +/* 0x000c	     ( 1  2) */		nop
   1.471 +/* 0x0010	     ( 2  3) */		sub	%o0,1,%o5	! %o5 = len-1, the last valid index
   1.472 +/* 0x0014	     ( 2  3) */		sethi	%hi(0xfc00),%g2	! %g2 = 0xfc00
   1.473 +
   1.474 +!  110		                    !   {
   1.475 +!  111		                    !     a=i32[i];
   1.476 +!  112		                    !     d16[2*i]=(double)(a&0xffff);
   1.477 +!  113		                    !     d16[2*i+1]=(double)(a>>16);
   1.478 +
   1.479 +/* 0x0018	 113 ( 3  4) */		sethi	%hi(.L_const_seg_900000401),%o0	! upper bits of the constant's address
   1.480 +/* 0x001c	     ( 3  4) */		add	%o5,1,%g3	! %g3 = len
   1.481 +/* 0x0020	     ( 4  5) */		add	%g2,1023,%o4	! %o4 = 0xffff, mask for (a & 0xffff)
   1.482 +/* 0x0024	 109 ( 4  5) */		or	%g0,0,%g1	! i = 0
   1.483 +/* 0x0028	     ( 5  6) */		cmp	%g3,3	! fewer than 3 elements? then use the simple loop
   1.484 +/* 0x002c	     ( 5  6) */		or	%g0,%i1,%o7	! %o7 = input cursor = i32
   1.485 +/* 0x0030	     ( 6  7) */		add	%o0,%lo(.L_const_seg_900000401),%o3	! %o3 = address of the 2^52 constant
   1.486 +/* 0x0034	     ( 6  7) */		or	%g0,%i0,%g2	! %g2 = output cursor = d16
   1.487 +/* 0x0038	     ( 6  7) */		bl,pn	%icc,.L77000154	! tprob=0.44
   1.488 +/* 0x003c	     ( 7  8) */		add	%o7,4,%o0	! (delay slot, always executed) %o0 = &i32[1]; the simple loop overwrites %o0 immediately
   1.489 +/* 0x0040	 112 ( 7 10) */		ldd	[%o3],%f0	! %f0:%f1 = 2^52, kept for the whole pipelined loop
   1.490 +/* 0x0044	 113 ( 7  8) */		or	%g0,1,%g1	! i = 1: element 0 is loaded just below
   1.491 +/* 0x0048	 111 ( 8 11) */		ld	[%o0-4],%o1	! a = i32[0]
   1.492 +/* 0x004c	   0 ( 8  9) */		or	%g0,%o0,%o7	! input cursor = &i32[1]
   1.493 +/* 0x0050	 112 (10 11) */		and	%o1,%o4,%o0	! a & 0xffff
   1.494 +                                   .L900000406:		/* frequency 64.0 confidence 0.0 */
   1.495 +/* 0x0054	 112 (22 23) */		st	%o0,[%sp+96]	! a & 0xffff -> stack, to move it to the FP registers
   1.496 +/* 0x0058	 113 (22 23) */		add	%g1,1,%g1	! i++
   1.497 +/* 0x005c	     (22 23) */		add	%g2,16,%g2	! output cursor += 2 doubles; the stores below use negative offsets
   1.498 +/* 0x0060	     (23 23) */		cmp	%g1,%o5	! loop test, consumed by the ble at the bottom
   1.499 +/* 0x0064	     (23 24) */		add	%o7,4,%o7	! advance input cursor; the load below uses [%o7-4]
   1.500 +/* 0x0068	 112 (29 31) */		ld	[%sp+96],%f3	! low word of %f2:%f3 = a & 0xffff
   1.501 +/* 0x006c	     ( 0  0) */		fmovs	%f0,%f2	! high word of %f2:%f3 = high word of 2^52
   1.502 +/* 0x0070	     (31 34) */		fsubd	%f2,%f0,%f2	! (double)(a & 0xffff)
   1.503 +/* 0x0074	 113 (32 33) */		srl	%o1,16,%o0	! a >> 16
   1.504 +/* 0x0078	 112 (32 33) */		std	%f2,[%g2-16]	! d16[2*i] = (double)(a & 0xffff)
   1.505 +/* 0x007c	 113 (33 34) */		st	%o0,[%sp+92]	! a >> 16 -> stack
   1.506 +/* 0x0080	     (40 42) */		ld	[%sp+92],%f3	! low word of %f2:%f3 = a >> 16
   1.507 +/* 0x0084	 111 (41 43) */		ld	[%o7-4],%o1	! next a = i32[i]
   1.508 +/* 0x0088	 113 ( 0  0) */		fmovs	%f0,%f2	! high word = high word of 2^52
   1.509 +/* 0x008c	     (42 45) */		fsubd	%f2,%f0,%f2	! (double)(a >> 16)
   1.510 +/* 0x0090	 112 (43 44) */		and	%o1,%o4,%o0	! next a & 0xffff
   1.511 +/* 0x0094	 113 (43 44) */		ble,pt	%icc,.L900000406	! tprob=0.50; continue while i <= len-1
   1.512 +/* 0x0098	     (43 44) */		std	%f2,[%g2-8]	! (delay slot, always executed) d16[2*i+1] = (double)(a >> 16)
   1.513 +                                   .L900000409:		/* frequency 8.0 confidence 0.0 */
   1.514 +/* 0x009c	 112 ( 0  1) */		st	%o0,[%sp+96]	! drain: convert the last element, already loaded into %o1 / %o0
   1.515 +/* 0x00a0	     ( 0  1) */		fmovs	%f0,%f2
   1.516 +/* 0x00a4	 113 ( 0  1) */		add	%g2,16,%g2
   1.517 +/* 0x00a8	     ( 1  2) */		srl	%o1,16,%o0	! a >> 16
   1.518 +/* 0x00ac	 112 ( 4  7) */		ld	[%sp+96],%f3
   1.519 +/* 0x00b0	     ( 6  9) */		fsubd	%f2,%f0,%f2	! (double)(a & 0xffff)
   1.520 +/* 0x00b4	     ( 6  7) */		std	%f2,[%g2-16]
   1.521 +/* 0x00b8	 113 ( 7  8) */		st	%o0,[%sp+92]
   1.522 +/* 0x00bc	     (10 11) */		fmovs	%f0,%f2
   1.523 +/* 0x00c0	     (11 14) */		ld	[%sp+92],%f3
   1.524 +/* 0x00c4	     (13 16) */		fsubd	%f2,%f0,%f0	! (double)(a >> 16); %f0 may be overwritten because the routine returns next
   1.525 +/* 0x00c8	     (13 14) */		std	%f0,[%g2-8]
   1.526 +/* 0x00cc	     (14 16) */		ret	! Result = 
   1.527 +/* 0x00d0	     (16 17) */		restore	%g0,%g0,%g0
   1.528 +                                   .L77000154:		/* frequency 0.7 confidence 0.0 */
   1.529 +/* 0x00d4	 111 ( 0  3) */		ld	[%o7],%o0	! simple loop: a = i32[i]
   1.530 +                                   .L900000410:		/* frequency 6.4 confidence 0.0 */
   1.531 +/* 0x00d8	 112 ( 0  1) */		and	%o0,%o4,%o1	! a & 0xffff
   1.532 +/* 0x00dc	     ( 0  1) */		st	%o1,[%sp+96]	! -> stack, to move it to the FP registers
   1.533 +/* 0x00e0	 113 ( 0  1) */		add	%g1,1,%g1	! i++
   1.534 +/* 0x00e4	 112 ( 1  4) */		ldd	[%o3],%f0	! %f0:%f1 = 2^52 (reloaded every iteration; %f0 is clobbered below)
   1.535 +/* 0x00e8	 113 ( 1  2) */		srl	%o0,16,%o0	! a >> 16
   1.536 +/* 0x00ec	     ( 1  2) */		add	%o7,4,%o7	! advance input cursor
   1.537 +/* 0x00f0	     ( 2  3) */		cmp	%g1,%o5	! i vs len-1
   1.538 +/* 0x00f4	 112 ( 3  4) */		fmovs	%f0,%f2	! high word = high word of 2^52
   1.539 +/* 0x00f8	     ( 4  7) */		ld	[%sp+96],%f3	! low word = a & 0xffff
   1.540 +/* 0x00fc	     ( 6  9) */		fsubd	%f2,%f0,%f2	! (double)(a & 0xffff)
   1.541 +/* 0x0100	     ( 6  7) */		std	%f2,[%g2]	! d16[2*i]
   1.542 +/* 0x0104	 113 ( 7  8) */		st	%o0,[%sp+92]	! a >> 16 -> stack
   1.543 +/* 0x0108	     (10 11) */		fmovs	%f0,%f2
   1.544 +/* 0x010c	     (11 14) */		ld	[%sp+92],%f3	! low word = a >> 16
   1.545 +/* 0x0110	     (13 16) */		fsubd	%f2,%f0,%f0	! (double)(a >> 16)
   1.546 +/* 0x0114	     (13 14) */		std	%f0,[%g2+8]	! d16[2*i+1]
   1.547 +/* 0x0118	     (13 14) */		add	%g2,16,%g2	! advance output cursor
   1.548 +/* 0x011c	     (13 14) */		ble,a,pt	%icc,.L900000410	! tprob=0.86; continue while i <= len-1
   1.549 +/* 0x0120	     (14 17) */		ld	[%o7],%o0	! (annulled delay slot: only when looping) next a = i32[i]
   1.550 +                                   .L77000150:		/* frequency 1.0 confidence 0.0 */
   1.551 +/* 0x0124	     ( 0  2) */		ret	! Result = 
   1.552 +/* 0x0128	     ( 2  3) */		restore	%g0,%g0,%g0
   1.553 +/* 0x012c	   0 ( 0  0) */		.type	conv_i32_to_d16,2
   1.554 +/* 0x012c	     ( 0  0) */		.size	conv_i32_to_d16,(.-conv_i32_to_d16)
   1.555 +
   1.556 +	.section	".text",#alloc,#execinstr
   1.557 +/* 000000	   0 ( 0  0) */		.align	8
   1.558 +!
   1.559 +! CONSTANT POOL
   1.560 +!
   1.561 +                                   .L_const_seg_900000501:		/* frequency 1.0 confidence 0.0 */
   1.562 +/* 000000	   0 ( 0  0) */		.word	1127219200,0
   1.563 +/* 0x0008	   0 ( 0  0) */		.align	4
   1.564 +!
   1.565 +! SUBROUTINE conv_i32_to_d32_and_d16
   1.566 +!
   1.567 +! OFFSET    SOURCE LINE	LABEL	INSTRUCTION	(ISSUE TIME)	(COMPLETION TIME)
   1.568 +
   1.569 +                                   	.global conv_i32_to_d32_and_d16
   1.570 +                                   conv_i32_to_d32_and_d16:		/* frequency 1.0 confidence 0.0 */
   1.571 +/* 000000	     ( 0  1) */		save	%sp,-104,%sp
   1.572 +/* 0x0004	     ( 1  2) */		or	%g0,%i3,%i4
   1.573 +/* 0x0008	     ( 1  2) */		or	%g0,%i2,%g1
   1.574 +
   1.575 +!  114		                    !   }
   1.576 +!  115		                    !}
   1.577 +!  118		                    !void i16_to_d16_and_d32x4(double * /*1/(2^16)*/, double * /* 2^16*/,
   1.578 +!  119		                    !			  double * /* 0 */,
   1.579 +!  120		                    !			  double * /*result16*/, double * /* result32 */,
   1.580 +!  121		                    !			  float *  /*source - should be unsigned int*
   1.581 +!  122		                    !		          	       converted to float* */);
   1.582 +!  126		                    !void conv_i32_to_d32_and_d16(double *d32, double *d16, 
   1.583 +!  127		                    !			     unsigned int *i32, int len)
   1.584 +!  128		                    !{
   1.585 +!  129		                    !int i;
   1.586 +!  130		                    !unsigned int a;
   1.587 +!  132		                    !#pragma pipeloop(0)
   1.588 +!  133		                    ! for(i=0;i<len-3;i+=4)
   1.589 +
   1.590 +/* 0x000c	 133 ( 2  3) */		sub	%i4,3,%g2
   1.591 +/* 0x0010	     ( 2  3) */		or	%g0,0,%o7
   1.592 +/* 0x0014	     ( 3  4) */		cmp	%g2,0
   1.593 +/* 0x0018	 128 ( 3  4) */		or	%g0,%i0,%i3
   1.594 +/* 0x001c	 133 ( 3  4) */		ble,pt	%icc,.L900000515	! tprob=0.56
   1.595 +/* 0x0020	     ( 4  5) */		cmp	%o7,%i4
   1.596 +
   1.597 +!  134		                    !   {
   1.598 +!  135		                    !     i16_to_d16_and_d32x4(&TwoToMinus16, &TwoTo16, &Zero,
   1.599 +!  136		                    !			  &(d16[2*i]), &(d32[i]), (float *)(&(i32[i])));
   1.600 +
   1.601 +/* 0x0024	 136 ( 4  5) */		sethi	%hi(Zero),%g2
   1.602 +/* 0x0028	 133 ( 5  6) */		or	%g0,%g1,%o3
   1.603 +/* 0x002c	     ( 5  6) */		sub	%i4,4,%o2
   1.604 +/* 0x0030	 136 ( 6  7) */		add	%g2,%lo(Zero),%o1
   1.605 +/* 0x0034	 133 ( 6  7) */		or	%g0,0,%o5
   1.606 +/* 0x0038	     ( 7  8) */		or	%g0,0,%o4
   1.607 +/* 0x003c	 136 ( 7  8) */		or	%g0,%o3,%g4
   1.608 +                                   .L900000514:		/* frequency 6.4 confidence 0.0 */
   1.609 +/* 0x0040	     ( 0  3) */		ldd	[%o1],%f2
   1.610 +/* 0x0044	 136 ( 0  1) */		add	%i3,%o5,%g2
   1.611 +/* 0x0048	     ( 0  1) */		add	%i1,%o4,%g3
   1.612 +/* 0x004c	     ( 1  4) */		ldd	[%o1-8],%f0
   1.613 +/* 0x0050	     ( 1  2) */		add	%o7,4,%o7
   1.614 +/* 0x0054	     ( 1  2) */		add	%o3,16,%o3
   1.615 +/* 0x0058	     ( 2  3) */		fmovd	%f2,%f14
   1.616 +/* 0x005c	     ( 2  5) */		ld	[%g4],%f15
   1.617 +/* 0x0060	     ( 2  3) */		cmp	%o7,%o2
   1.618 +/* 0x0064	     ( 3  4) */		fmovd	%f2,%f10
   1.619 +/* 0x0068	     ( 3  6) */		ld	[%g4+4],%f11
   1.620 +/* 0x006c	     ( 4  5) */		fmovd	%f2,%f6
   1.621 +/* 0x0070	     ( 4  7) */		ld	[%g4+8],%f7
   1.622 +/* 0x0074	     ( 5  8) */		ld	[%g4+12],%f3
   1.623 +/* 0x0078	     ( 5  8) */		fxtod	%f14,%f14
   1.624 +/* 0x007c	     ( 6  9) */		fxtod	%f10,%f10
   1.625 +/* 0x0080	     ( 6  9) */		ldd	[%o1-16],%f16
   1.626 +/* 0x0084	     ( 7 10) */		fxtod	%f6,%f6
   1.627 +/* 0x0088	     ( 7  8) */		std	%f14,[%i3+%o5]
   1.628 +/* 0x008c	     ( 7  8) */		add	%o5,32,%o5
   1.629 +/* 0x0090	     ( 8 11) */		fxtod	%f2,%f2
   1.630 +/* 0x0094	     ( 8 11) */		fmuld	%f0,%f14,%f12
   1.631 +/* 0x0098	     ( 8  9) */		std	%f10,[%g2+8]
   1.632 +/* 0x009c	     ( 9 12) */		fmuld	%f0,%f10,%f8
   1.633 +/* 0x00a0	     ( 9 10) */		std	%f6,[%g2+16]
   1.634 +/* 0x00a4	     (10 13) */		fmuld	%f0,%f6,%f4
   1.635 +/* 0x00a8	     (10 11) */		std	%f2,[%g2+24]
   1.636 +/* 0x00ac	     (11 14) */		fmuld	%f0,%f2,%f0
   1.637 +/* 0x00b0	     (11 14) */		fdtox	%f12,%f12
   1.638 +/* 0x00b4	     (12 15) */		fdtox	%f8,%f8
   1.639 +/* 0x00b8	     (13 16) */		fdtox	%f4,%f4
   1.640 +/* 0x00bc	     (14 17) */		fdtox	%f0,%f0
   1.641 +/* 0x00c0	     (15 18) */		fxtod	%f12,%f12
   1.642 +/* 0x00c4	     (15 16) */		std	%f12,[%g3+8]
   1.643 +/* 0x00c8	     (16 19) */		fxtod	%f8,%f8
   1.644 +/* 0x00cc	     (16 17) */		std	%f8,[%g3+24]
   1.645 +/* 0x00d0	     (17 20) */		fxtod	%f4,%f4
   1.646 +/* 0x00d4	     (17 18) */		std	%f4,[%g3+40]
   1.647 +/* 0x00d8	     (18 21) */		fxtod	%f0,%f0
   1.648 +/* 0x00dc	     (18 21) */		fmuld	%f12,%f16,%f12
   1.649 +/* 0x00e0	     (18 19) */		std	%f0,[%g3+56]
   1.650 +/* 0x00e4	     (19 22) */		fmuld	%f8,%f16,%f8
   1.651 +/* 0x00e8	     (20 23) */		fmuld	%f4,%f16,%f4
   1.652 +/* 0x00ec	     (21 24) */		fmuld	%f0,%f16,%f0
   1.653 +/* 0x00f0	     (21 24) */		fsubd	%f14,%f12,%f12
   1.654 +/* 0x00f4	     (21 22) */		std	%f12,[%i1+%o4]
   1.655 +/* 0x00f8	     (22 25) */		fsubd	%f10,%f8,%f8
   1.656 +/* 0x00fc	     (22 23) */		std	%f8,[%g3+16]
   1.657 +/* 0x0100	     (22 23) */		add	%o4,64,%o4
   1.658 +/* 0x0104	     (23 26) */		fsubd	%f6,%f4,%f4
   1.659 +/* 0x0108	     (23 24) */		std	%f4,[%g3+32]
   1.660 +/* 0x010c	     (24 27) */		fsubd	%f2,%f0,%f0
   1.661 +/* 0x0110	     (24 25) */		std	%f0,[%g3+48]
   1.662 +/* 0x0114	     (24 25) */		ble,pt	%icc,.L900000514	! tprob=0.86
   1.663 +/* 0x0118	     (25 26) */		or	%g0,%o3,%g4
   1.664 +                                   .L77000159:		/* frequency 1.0 confidence 0.0 */
   1.665 +
   1.666 +!  137		                    !   }
   1.667 +!  138		                    ! for(;i<len;i++)
   1.668 +
   1.669 +/* 0x011c	 138 ( 0  1) */		cmp	%o7,%i4
   1.670 +                                   .L900000515:		/* frequency 1.0 confidence 0.0 */
   1.671 +/* 0x0120	 138 ( 0  1) */		bge,pt	%icc,.L77000164	! tprob=0.56
   1.672 +/* 0x0124	     ( 0  1) */		nop
   1.673 +
   1.674 +!  139		                    !   {
   1.675 +!  140		                    !     a=i32[i];
   1.676 +!  141		                    !     d32[i]=(double)(i32[i]);
   1.677 +!  142		                    !     d16[2*i]=(double)(a&0xffff);
   1.678 +!  143		                    !     d16[2*i+1]=(double)(a>>16);
   1.679 +
   1.680 +/* 0x0128	 143 ( 0  1) */		sethi	%hi(.L_const_seg_900000501),%o1
   1.681 +/* 0x012c	 138 ( 1  2) */		sethi	%hi(0xfc00),%o0
   1.682 +/* 0x0130	 141 ( 1  4) */		ldd	[%o1+%lo(.L_const_seg_900000501)],%f0
   1.683 +/* 0x0134	 138 ( 1  2) */		sub	%i4,%o7,%g3
   1.684 +/* 0x0138	     ( 2  3) */		sll	%o7,2,%g2
   1.685 +/* 0x013c	     ( 2  3) */		add	%o0,1023,%o3
   1.686 +/* 0x0140	     ( 3  4) */		sll	%o7,3,%g4
   1.687 +/* 0x0144	     ( 3  4) */		cmp	%g3,3
   1.688 +/* 0x0148	     ( 4  5) */		add	%g1,%g2,%o0
   1.689 +/* 0x014c	     ( 4  5) */		add	%o1,%lo(.L_const_seg_900000501),%o2
   1.690 +/* 0x0150	     ( 5  6) */		add	%i3,%g4,%o4
   1.691 +/* 0x0154	     ( 5  6) */		sub	%i4,1,%o1
   1.692 +/* 0x0158	     ( 6  7) */		sll	%o7,4,%g5
   1.693 +/* 0x015c	     ( 6  7) */		bl,pn	%icc,.L77000161	! tprob=0.44
   1.694 +/* 0x0160	     ( 7  8) */		add	%i1,%g5,%o5
   1.695 +/* 0x0164	 141 ( 7 10) */		ld	[%g1+%g2],%f3
   1.696 +/* 0x0168	 143 ( 7  8) */		add	%o4,8,%o4
   1.697 +/* 0x016c	 140 ( 8 11) */		ld	[%g1+%g2],%g1
   1.698 +/* 0x0170	 143 ( 8  9) */		add	%o5,16,%o5
   1.699 +/* 0x0174	     ( 8  9) */		add	%o7,1,%o7
   1.700 +/* 0x0178	 141 ( 9 10) */		fmovs	%f0,%f2
   1.701 +/* 0x017c	 143 ( 9 10) */		add	%o0,4,%o0
   1.702 +/* 0x0180	 142 (10 11) */		and	%g1,%o3,%g2
   1.703 +/* 0x0184	 141 (11 14) */		fsubd	%f2,%f0,%f2
   1.704 +/* 0x0188	     (11 12) */		std	%f2,[%o4-8]
   1.705 +/* 0x018c	 143 (11 12) */		srl	%g1,16,%g1
   1.706 +/* 0x0190	 142 (12 13) */		st	%g2,[%sp+96]
   1.707 +/* 0x0194	     (15 16) */		fmovs	%f0,%f2
   1.708 +/* 0x0198	     (16 19) */		ld	[%sp+96],%f3
   1.709 +/* 0x019c	     (18 21) */		fsubd	%f2,%f0,%f2
   1.710 +/* 0x01a0	     (18 19) */		std	%f2,[%o5-16]
   1.711 +/* 0x01a4	 143 (19 20) */		st	%g1,[%sp+92]
   1.712 +/* 0x01a8	     (22 23) */		fmovs	%f0,%f2
   1.713 +/* 0x01ac	     (23 26) */		ld	[%sp+92],%f3
   1.714 +/* 0x01b0	     (25 28) */		fsubd	%f2,%f0,%f2
   1.715 +/* 0x01b4	     (25 26) */		std	%f2,[%o5-8]
   1.716 +                                   .L900000509:		/* frequency 64.0 confidence 0.0 */
   1.717 +/* 0x01b8	 141 (26 28) */		ld	[%o0],%f3
   1.718 +/* 0x01bc	 143 (26 27) */		add	%o7,2,%o7
   1.719 +/* 0x01c0	     (26 27) */		add	%o5,32,%o5
   1.720 +/* 0x01c4	 140 (27 29) */		ld	[%o0],%g1
   1.721 +/* 0x01c8	 143 (27 27) */		cmp	%o7,%o1
   1.722 +/* 0x01cc	     (27 28) */		add	%o4,16,%o4
   1.723 +/* 0x01d0	 141 ( 0  0) */		fmovs	%f0,%f2
   1.724 +/* 0x01d4	     (28 31) */		fsubd	%f2,%f0,%f2
   1.725 +/* 0x01d8	     (29 30) */		std	%f2,[%o4-16]
   1.726 +/* 0x01dc	 142 (29 30) */		and	%g1,%o3,%g2
   1.727 +/* 0x01e0	     (30 31) */		st	%g2,[%sp+96]
   1.728 +/* 0x01e4	     (37 39) */		ld	[%sp+96],%f3
   1.729 +/* 0x01e8	     ( 0  0) */		fmovs	%f0,%f2
   1.730 +/* 0x01ec	     (39 42) */		fsubd	%f2,%f0,%f2
   1.731 +/* 0x01f0	 143 (40 41) */		srl	%g1,16,%g1
   1.732 +/* 0x01f4	 142 (40 41) */		std	%f2,[%o5-32]
   1.733 +/* 0x01f8	 143 (41 42) */		st	%g1,[%sp+92]
   1.734 +/* 0x01fc	     (48 50) */		ld	[%sp+92],%f3
   1.735 +/* 0x0200	     ( 0  0) */		fmovs	%f0,%f2
   1.736 +/* 0x0204	     (50 53) */		fsubd	%f2,%f0,%f2
   1.737 +/* 0x0208	     (51 52) */		std	%f2,[%o5-24]
   1.738 +/* 0x020c	     (51 52) */		add	%o0,4,%o0
   1.739 +/* 0x0210	 141 (52 54) */		ld	[%o0],%f3
   1.740 +/* 0x0214	 140 (53 55) */		ld	[%o0],%g1
   1.741 +/* 0x0218	 141 ( 0  0) */		fmovs	%f0,%f2
   1.742 +/* 0x021c	     (54 57) */		fsubd	%f2,%f0,%f2
   1.743 +/* 0x0220	     (55 56) */		std	%f2,[%o4-8]
   1.744 +/* 0x0224	 142 (55 56) */		and	%g1,%o3,%g2
   1.745 +/* 0x0228	     (56 57) */		st	%g2,[%sp+96]
   1.746 +/* 0x022c	     (63 65) */		ld	[%sp+96],%f3
   1.747 +/* 0x0230	     ( 0  0) */		fmovs	%f0,%f2
   1.748 +/* 0x0234	     (65 68) */		fsubd	%f2,%f0,%f2
   1.749 +/* 0x0238	 143 (66 67) */		srl	%g1,16,%g1
   1.750 +/* 0x023c	 142 (66 67) */		std	%f2,[%o5-16]
   1.751 +/* 0x0240	 143 (67 68) */		st	%g1,[%sp+92]
   1.752 +/* 0x0244	     (74 76) */		ld	[%sp+92],%f3
   1.753 +/* 0x0248	     ( 0  0) */		fmovs	%f0,%f2
   1.754 +/* 0x024c	     (76 79) */		fsubd	%f2,%f0,%f2
   1.755 +/* 0x0250	     (77 78) */		std	%f2,[%o5-8]
   1.756 +/* 0x0254	     (77 78) */		bl,pt	%icc,.L900000509	! tprob=0.50
   1.757 +/* 0x0258	     (77 78) */		add	%o0,4,%o0
   1.758 +                                   .L900000512:		/* frequency 8.0 confidence 0.0 */
   1.759 +/* 0x025c	 143 ( 0  1) */		cmp	%o7,%i4
   1.760 +/* 0x0260	     ( 0  1) */		bge,pn	%icc,.L77000164	! tprob=0.14
   1.761 +/* 0x0264	     ( 0  1) */		nop
   1.762 +                                   .L77000161:		/* frequency 0.7 confidence 0.0 */
   1.763 +/* 0x0268	 141 ( 0  3) */		ld	[%o0],%f3
   1.764 +                                   .L900000513:		/* frequency 6.4 confidence 0.0 */
   1.765 +/* 0x026c	 141 ( 0  3) */		ldd	[%o2],%f0
   1.766 +/* 0x0270	 143 ( 0  1) */		add	%o7,1,%o7
   1.767 +/* 0x0274	 140 ( 1  4) */		ld	[%o0],%o1
   1.768 +/* 0x0278	 143 ( 1  2) */		add	%o0,4,%o0
   1.769 +/* 0x027c	     ( 1  2) */		cmp	%o7,%i4
   1.770 +/* 0x0280	 141 ( 2  3) */		fmovs	%f0,%f2
   1.771 +/* 0x0284	 142 ( 3  4) */		and	%o1,%o3,%g1
   1.772 +/* 0x0288	 141 ( 4  7) */		fsubd	%f2,%f0,%f2
   1.773 +/* 0x028c	     ( 4  5) */		std	%f2,[%o4]
   1.774 +/* 0x0290	 143 ( 4  5) */		srl	%o1,16,%o1
   1.775 +/* 0x0294	 142 ( 5  6) */		st	%g1,[%sp+96]
   1.776 +/* 0x0298	 143 ( 5  6) */		add	%o4,8,%o4
   1.777 +/* 0x029c	 142 ( 8  9) */		fmovs	%f0,%f2
   1.778 +/* 0x02a0	     ( 9 12) */		ld	[%sp+96],%f3
   1.779 +/* 0x02a4	     (11 14) */		fsubd	%f2,%f0,%f2
   1.780 +/* 0x02a8	     (11 12) */		std	%f2,[%o5]
   1.781 +/* 0x02ac	 143 (12 13) */		st	%o1,[%sp+92]
   1.782 +/* 0x02b0	     (15 16) */		fmovs	%f0,%f2
   1.783 +/* 0x02b4	     (16 19) */		ld	[%sp+92],%f3
   1.784 +/* 0x02b8	     (18 21) */		fsubd	%f2,%f0,%f0
   1.785 +/* 0x02bc	     (18 19) */		std	%f0,[%o5+8]
   1.786 +/* 0x02c0	     (18 19) */		add	%o5,16,%o5
   1.787 +/* 0x02c4	     (18 19) */		bl,a,pt	%icc,.L900000513	! tprob=0.86
   1.788 +/* 0x02c8	     (19 22) */		ld	[%o0],%f3
   1.789 +                                   .L77000164:		/* frequency 1.0 confidence 0.0 */
   1.790 +/* 0x02cc	     ( 0  2) */		ret	! Result = 
   1.791 +/* 0x02d0	     ( 2  3) */		restore	%g0,%g0,%g0
   1.792 +/* 0x02d4	   0 ( 0  0) */		.type	conv_i32_to_d32_and_d16,2
   1.793 +/* 0x02d4	     ( 0  0) */		.size	conv_i32_to_d32_and_d16,(.-conv_i32_to_d32_and_d16)
   1.794 +
   1.795 +	.section	".text",#alloc,#execinstr
   1.796 +/* 000000	   0 ( 0  0) */		.align	4
   1.797 +!
   1.798 +! SUBROUTINE adjust_montf_result
   1.799 +! If i32[len] != 0, or i32[0..len-1] >= nint[0..len-1] (word 0 least significant), subtracts nint from i32 in place.
   1.800 +! OFFSET    SOURCE LINE	LABEL	INSTRUCTION	(ISSUE TIME)	(COMPLETION TIME)
   1.801 +
   1.802 +                                   	.global adjust_montf_result
   1.803 +                                   adjust_montf_result:		/* frequency 1.0 confidence 0.0 */
   1.804 +! In: %o0 = i32 (reads i32[len]), %o1 = nint, %o2 = len.  Leaf routine: no save/restore, returns via retl, no result.
   1.805 +!  144		                    !   }
   1.806 +!  145		                    !}
   1.807 +!  148		                    !void adjust_montf_result(unsigned int *i32, unsigned int *nint, int len)
   1.808 +!  149		                    !{
   1.809 +!  150		                    !long long acc;
   1.810 +!  151		                    !int i;
   1.811 +!  153		                    ! if(i32[len]>0) i=-1;
   1.812 +
   1.813 +/* 000000	 153 ( 0  1) */		sll	%o2,2,%g1	! %g1 = len*4, byte offset of i32[len]
   1.814 +/* 0x0004	     ( 0  1) */		or	%g0,-1,%g3	! %g3 = i = -1, kept if i32[len] != 0
   1.815 +/* 0x0008	     ( 1  4) */		ld	[%o0+%g1],%g1	! %g1 = i32[len]
   1.816 +/* 0x000c	     ( 3  4) */		cmp	%g1,0
   1.817 +/* 0x0010	     ( 3  4) */		bleu,pn	%icc,.L77000175	! tprob=0.50; taken when i32[len] == 0
   1.818 +/* 0x0014	     ( 3  4) */		or	%g0,%o1,%o3	! delay slot: %o3 = nint, used by the short subtract loop
   1.819 +/* 0x0018	     ( 4  5) */		ba	.L900000611	! tprob=1.00
   1.820 +/* 0x001c	     ( 4  5) */		cmp	%g3,0	! delay slot: set flags for i = -1
   1.821 +                                   .L77000175:		/* frequency 0.8 confidence 0.0 */
   1.822 +
   1.823 +!  154		                    ! else
   1.824 +!  155		                    !   {
   1.825 +!  156		                    !     for(i=len-1; i>=0; i--)
   1.826 +
   1.827 +/* 0x0020	 156 ( 0  1) */		subcc	%o2,1,%g3	! i = len-1; scan runs from the most significant word down
   1.828 +/* 0x0024	     ( 0  1) */		bneg,pt	%icc,.L900000611	! tprob=0.60; len <= 0: nothing to compare
   1.829 +/* 0x0028	     ( 1  2) */		cmp	%g3,0	! delay slot: flags for the i<0 test at .L900000611
   1.830 +/* 0x002c	     ( 1  2) */		sll	%g3,2,%g1	! %g1 = i*4
   1.831 +/* 0x0030	     ( 2  3) */		add	%o0,%g1,%g2	! %g2 = &i32[len-1]
   1.832 +/* 0x0034	     ( 2  3) */		add	%o1,%g1,%g1	! %g1 = &nint[len-1]
   1.833 +
   1.834 +!  157		                    !       {
   1.835 +!  158		                    !	 if(i32[i]!=nint[i]) break;
   1.836 +
   1.837 +/* 0x0038	 158 ( 3  6) */		ld	[%g1],%g5	! %g5 = nint[i]
   1.838 +                                   .L900000610:		/* frequency 5.3 confidence 0.0 */
   1.839 +/* 0x003c	 158 ( 0  3) */		ld	[%g2],%o5	! %o5 = i32[i]
   1.840 +/* 0x0040	     ( 0  1) */		sub	%g1,4,%g1	! step nint pointer down to word i-1
   1.841 +/* 0x0044	     ( 0  1) */		sub	%g2,4,%g2	! step i32 pointer down to word i-1
   1.842 +/* 0x0048	     ( 2  3) */		cmp	%o5,%g5
   1.843 +/* 0x004c	     ( 2  3) */		bne,pn	%icc,.L77000182	! tprob=0.16; break, %g3 still holds the differing index
   1.844 +/* 0x0050	     ( 2  3) */		nop
   1.845 +/* 0x0054	     ( 3  4) */		subcc	%g3,1,%g3	! i--; N is set only when i becomes -1
   1.846 +/* 0x0058	     ( 3  4) */		bpos,a,pt	%icc,.L900000610	! tprob=0.84; loop while i >= 0
   1.847 +/* 0x005c	     ( 3  6) */		ld	[%g1],%g5	! delay slot (annulled on exit): next nint[i]
   1.848 +                                   .L77000182:		/* frequency 1.0 confidence 0.0 */
   1.849 +
   1.850 +!  159		                    !       }
   1.851 +!  160		                    !   }
   1.852 +!  161		                    ! if((i<0)||(i32[i]>nint[i]))
   1.853 +
   1.854 +/* 0x0060	 161 ( 0  1) */		cmp	%g3,0
   1.855 +                                   .L900000611:		/* frequency 1.0 confidence 0.0 */
   1.856 +/* 0x0064	 161 ( 0  1) */		bl,pn	%icc,.L77000198	! tprob=0.50; i < 0: subtract unconditionally
   1.857 +/* 0x0068	     ( 0  1) */		sll	%g3,2,%g2	! delay slot: %g2 = i*4
   1.858 +/* 0x006c	     ( 1  4) */		ld	[%o1+%g2],%g1	! %g1 = nint[i]
   1.859 +/* 0x0070	     ( 2  5) */		ld	[%o0+%g2],%g2	! %g2 = i32[i]
   1.860 +/* 0x0074	     ( 4  5) */		cmp	%g2,%g1
   1.861 +/* 0x0078	     ( 4  5) */		bleu,pt	%icc,.L77000191	! tprob=0.56; i32[i] <= nint[i] (unsigned): return unchanged
   1.862 +/* 0x007c	     ( 4  5) */		nop
   1.863 +                                   .L77000198:		/* frequency 0.8 confidence 0.0 */
   1.864 +
   1.865 +!  162		                    !   {
   1.866 +!  163		                    !     acc=0;
   1.867 +!  164		                    !     for(i=0;i<len;i++)
   1.868 +
   1.869 +/* 0x0080	 164 ( 0  1) */		cmp	%o2,0
   1.870 +/* 0x0084	     ( 0  1) */		ble,pt	%icc,.L77000191	! tprob=0.60; len <= 0: nothing to subtract
   1.871 +/* 0x0088	     ( 0  1) */		nop
   1.872 +/* 0x008c	 161 ( 1  2) */		or	%g0,-1,%g2
   1.873 +/* 0x0090	     ( 1  2) */		sub	%o2,1,%g4	! %g4 = len-1, loop bound for both subtract loops
   1.874 +/* 0x0094	     ( 2  3) */		srl	%g2,0,%g3	! %g3 = 0xffffffff mask (srl by 0 clears the upper 32 bits)
   1.875 +/* 0x0098	 163 ( 2  3) */		or	%g0,0,%g5	! acc = 0
   1.876 +/* 0x009c	 164 ( 3  4) */		or	%g0,0,%o5	! i = 0
   1.877 +/* 0x00a0	 161 ( 3  4) */		or	%g0,%o0,%o4	! %o4 = &i32[0]
   1.878 +/* 0x00a4	     ( 4  5) */		cmp	%o2,3
   1.879 +/* 0x00a8	     ( 4  5) */		add	%o1,4,%g2	! %g2 = &nint[1]
   1.880 +/* 0x00ac	 164 ( 4  5) */		bl,pn	%icc,.L77000199	! tprob=0.40; len < 3: use the simple loop
   1.881 +/* 0x00b0	     ( 5  6) */		add	%o0,8,%g1	! delay slot: %g1 = &i32[2]
   1.882 +
   1.883 +!  165		                    !       {
   1.884 +!  166		                    !	 acc=acc+(unsigned long long)(i32[i])-(unsigned long long)(nint[i]);
   1.885 +
   1.886 +/* 0x00b4	 166 ( 5  8) */		ld	[%o0],%o2	! pipelined loop prologue: %o2 = i32[0]
   1.887 +/* 0x00b8	   0 ( 5  6) */		or	%g0,%g2,%o3	! %o3 = &nint[1]
   1.888 +/* 0x00bc	 166 ( 6  9) */		ld	[%o1],%o1	! %o1 = nint[0]
   1.889 +/* 0x00c0	   0 ( 6  7) */		or	%g0,%g1,%o4	! %o4 = &i32[2]
   1.890 +
   1.891 +!  167		                    !	 i32[i]=acc&0xffffffff;
   1.892 +!  168		                    !	 acc=acc>>32;
   1.893 +
   1.894 +/* 0x00c4	 168 ( 6  7) */		or	%g0,2,%o5	! loop counter starts at 2 (word 0 done here, word 1 preloaded)
   1.895 +/* 0x00c8	 166 ( 7 10) */		ld	[%o0+4],%g1	! %g1 = i32[1]
   1.896 +/* 0x00cc	 164 ( 8  9) */		sub	%o2,%o1,%o2	! 64-bit difference i32[0]-nint[0]
   1.897 +/* 0x00d0	     ( 9 10) */		or	%g0,%o2,%g5	! acc = difference
   1.898 +/* 0x00d4	 167 ( 9 10) */		and	%o2,%g3,%o2
   1.899 +/* 0x00d8	     ( 9 10) */		st	%o2,[%o0]	! i32[0] = low 32 bits
   1.900 +/* 0x00dc	 168 (10 11) */		srax	%g5,32,%g5	! acc >>= 32 (arithmetic), carries the borrow forward
   1.901 +                                   .L900000605:		/* frequency 64.0 confidence 0.0 */
   1.902 +/* 0x00e0	 166 (12 20) */		ld	[%o3],%o2	! %o2 = nint[i]
   1.903 +/* 0x00e4	 168 (12 13) */		add	%o5,1,%o5
   1.904 +/* 0x00e8	     (12 13) */		add	%o3,4,%o3
   1.905 +/* 0x00ec	     (13 13) */		cmp	%o5,%g4
   1.906 +/* 0x00f0	     (13 14) */		add	%o4,4,%o4
   1.907 +/* 0x00f4	 164 (14 14) */		sub	%g1,%o2,%g1	! i32[i] - nint[i]
   1.908 +/* 0x00f8	     (15 15) */		add	%g1,%g5,%g5	! acc += difference
   1.909 +/* 0x00fc	 167 (16 17) */		and	%g5,%g3,%o2
   1.910 +/* 0x0100	 166 (16 24) */		ld	[%o4-4],%g1	! preload i32[i+1] for the next iteration
   1.911 +/* 0x0104	 167 (17 18) */		st	%o2,[%o4-8]	! i32[i] = low 32 bits of acc
   1.912 +/* 0x0108	 168 (17 18) */		ble,pt	%icc,.L900000605	! tprob=0.50
   1.913 +/* 0x010c	     (17 18) */		srax	%g5,32,%g5	! delay slot: acc >>= 32
   1.914 +                                   .L900000608:		/* frequency 8.0 confidence 0.0 */
   1.915 +/* 0x0110	 166 ( 0  3) */		ld	[%o3],%g2	! epilogue: last word, %g2 = nint[len-1]
   1.916 +/* 0x0114	 164 ( 2  3) */		sub	%g1,%g2,%g1
   1.917 +/* 0x0118	     ( 3  4) */		add	%g1,%g5,%g1
   1.918 +/* 0x011c	 167 ( 4  5) */		and	%g1,%g3,%g2
   1.919 +/* 0x0120	     ( 5  7) */		retl	! Result = 
   1.920 +/* 0x0124	     ( 6  7) */		st	%g2,[%o4-4]	! delay slot: i32[len-1] = low 32 bits
   1.921 +                                   .L77000199:		/* frequency 0.6 confidence 0.0 */
   1.922 +/* 0x0128	 166 ( 0  3) */		ld	[%o4],%g1	! simple loop: %g1 = i32[0]
   1.923 +                                   .L900000609:		/* frequency 5.3 confidence 0.0 */
   1.924 +/* 0x012c	 166 ( 0  3) */		ld	[%o3],%g2	! %g2 = nint[i]
   1.925 +/* 0x0130	     ( 0  1) */		add	%g5,%g1,%g1	! acc + i32[i]
   1.926 +/* 0x0134	 168 ( 0  1) */		add	%o5,1,%o5
   1.927 +/* 0x0138	     ( 1  2) */		add	%o3,4,%o3
   1.928 +/* 0x013c	     ( 1  2) */		cmp	%o5,%g4
   1.929 +/* 0x0140	 166 ( 2  3) */		sub	%g1,%g2,%g1	! ... - nint[i]
   1.930 +/* 0x0144	 167 ( 3  4) */		and	%g1,%g3,%g2
   1.931 +/* 0x0148	     ( 3  4) */		st	%g2,[%o4]	! i32[i] = low 32 bits
   1.932 +/* 0x014c	 168 ( 3  4) */		add	%o4,4,%o4
   1.933 +/* 0x0150	     ( 4  5) */		srax	%g1,32,%g5	! acc >>= 32
   1.934 +/* 0x0154	     ( 4  5) */		ble,a,pt	%icc,.L900000609	! tprob=0.84
   1.935 +/* 0x0158	     ( 4  7) */		ld	[%o4],%g1	! delay slot (annulled on exit): next i32[i]
   1.936 +                                   .L77000191:		/* frequency 1.0 confidence 0.0 */
   1.937 +/* 0x015c	     ( 0  2) */		retl	! Result = 
   1.938 +/* 0x0160	     ( 1  2) */		nop
   1.939 +/* 0x0164	   0 ( 0  0) */		.type	adjust_montf_result,2
   1.940 +/* 0x0164	     ( 0  0) */		.size	adjust_montf_result,(.-adjust_montf_result)
   1.941 +
   1.942 +	.section	".text",#alloc,#execinstr
   1.943 +/* 000000	   0 ( 0  0) */		.align	32
   1.944 +!
   1.945 +! SUBROUTINE mont_mulf_noconv
   1.946 +!
   1.947 +! OFFSET    SOURCE LINE	LABEL	INSTRUCTION	(ISSUE TIME)	(COMPLETION TIME)
   1.948 +
   1.949 +                                   	.global mont_mulf_noconv
   1.950 +                                   mont_mulf_noconv:		/* frequency 1.0 confidence 0.0 */
   1.951 +/* 000000	     ( 0  1) */		save	%sp,-144,%sp
   1.952 +/* 0x0004	     ( 1  2) */		st	%i0,[%fp+68]
   1.953 +
   1.954 +!  169		                    !       }
   1.955 +!  170		                    !   }
   1.956 +!  171		                    !}
   1.957 +!  175		                    !void cleanup(double *dt, int from, int tlen);
   1.958 +!  177		                    !/*
   1.959 +!  178		                    !** the lengths of the input arrays should be at least the following:
   1.960 +!  179		                    !** result[nlen+1], dm1[nlen], dm2[2*nlen+1], dt[4*nlen+2], dn[nlen], nint[nlen]
   1.961 +!  180		                    !** all of them should be different from one another
   1.962 +!  181		                    !**
   1.963 +!  182		                    !*/
   1.964 +!  183		                    !void mont_mulf_noconv(unsigned int *result,
   1.965 +!  184		                    !		     double *dm1, double *dm2, double *dt,
   1.966 +!  185		                    !		     double *dn, unsigned int *nint,
   1.967 +!  186		                    !		     int nlen, double dn0)
   1.968 +!  187		                    !{
   1.969 +!  188		                    ! int i, j, jj;
   1.970 +!  189		                    ! int tmp;
   1.971 +!  190		                    ! double digit, m2j, nextm2j, a, b;
   1.972 +!  191		                    ! double *dptmp, *pdm1, *pdm2, *pdn, *pdtj, pdn_0, pdm1_0;
   1.973 +!  193		                    ! pdm1=&(dm1[0]);
   1.974 +!  194		                    ! pdm2=&(dm2[0]);
   1.975 +!  195		                    ! pdn=&(dn[0]);
   1.976 +!  196		                    ! pdm2[2*nlen]=Zero;
   1.977 +
   1.978 +/* 0x0008	 196 ( 1  2) */		sethi	%hi(Zero),%g2
   1.979 +/* 0x000c	 187 ( 1  2) */		or	%g0,%i2,%o1
   1.980 +/* 0x0010	     ( 2  3) */		st	%i5,[%fp+88]
   1.981 +/* 0x0014	     ( 2  3) */		or	%g0,%i3,%o2
   1.982 +/* 0x0018	 196 ( 2  3) */		add	%g2,%lo(Zero),%g4
   1.983 +/* 0x001c	     ( 3  6) */		ldd	[%g2+%lo(Zero)],%f2
   1.984 +/* 0x0020	 187 ( 3  4) */		or	%g0,%o2,%g5
   1.985 +/* 0x0024	 196 ( 3  4) */		or	%g0,%o1,%i0
   1.986 +/* 0x0028	 187 ( 4  5) */		or	%g0,%i4,%i2
   1.987 +
   1.988 +!  198		                    ! if (nlen!=16)
   1.989 +!  199		                    !   {
   1.990 +!  200		                    !     for(i=0;i<4*nlen+2;i++) dt[i]=Zero;
   1.991 +!  202		                    !     a=dt[0]=pdm1[0]*pdm2[0];
   1.992 +!  203		                    !     digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16);
   1.993 +!  205		                    !     pdtj=&(dt[0]);
   1.994 +!  206		                    !     for(j=jj=0;j<2*nlen;j++,jj++,pdtj++)
   1.995 +!  207		                    !       {
   1.996 +!  208		                    !	 m2j=pdm2[j];
   1.997 +!  209		                    !	 a=pdtj[0]+pdn[0]*digit;
   1.998 +!  210		                    !	 b=pdtj[1]+pdm1[0]*pdm2[j+1]+a*TwoToMinus16;
   1.999 +!  211		                    !	 pdtj[1]=b;
  1.1000 +!  213		                    !#pragma pipeloop(0)
  1.1001 +!  214		                    !	 for(i=1;i<nlen;i++)
  1.1002 +!  215		                    !	   {
  1.1003 +!  216		                    !	     pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit;
  1.1004 +!  217		                    !	   }
  1.1005 +!  218		                    ! 	 if((jj==30)) {cleanup(dt,j/2+1,2*nlen+1); jj=0;}
  1.1006 +!  219		                    !	 
  1.1007 +!  220		                    !	 digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16);
  1.1008 +!  221		                    !       }
  1.1009 +!  222		                    !   }
  1.1010 +!  223		                    ! else
  1.1011 +!  224		                    !   {
  1.1012 +!  225		                    !     a=dt[0]=pdm1[0]*pdm2[0];
  1.1013 +!  227		                    !     dt[65]=     dt[64]=     dt[63]=     dt[62]=     dt[61]=     dt[60]=
  1.1014 +!  228		                    !     dt[59]=     dt[58]=     dt[57]=     dt[56]=     dt[55]=     dt[54]=
  1.1015 +!  229		                    !     dt[53]=     dt[52]=     dt[51]=     dt[50]=     dt[49]=     dt[48]=
  1.1016 +!  230		                    !     dt[47]=     dt[46]=     dt[45]=     dt[44]=     dt[43]=     dt[42]=
  1.1017 +!  231		                    !     dt[41]=     dt[40]=     dt[39]=     dt[38]=     dt[37]=     dt[36]=
  1.1018 +!  232		                    !     dt[35]=     dt[34]=     dt[33]=     dt[32]=     dt[31]=     dt[30]=
  1.1019 +!  233		                    !     dt[29]=     dt[28]=     dt[27]=     dt[26]=     dt[25]=     dt[24]=
  1.1020 +!  234		                    !     dt[23]=     dt[22]=     dt[21]=     dt[20]=     dt[19]=     dt[18]=
  1.1021 +!  235		                    !     dt[17]=     dt[16]=     dt[15]=     dt[14]=     dt[13]=     dt[12]=
  1.1022 +!  236		                    !     dt[11]=     dt[10]=     dt[ 9]=     dt[ 8]=     dt[ 7]=     dt[ 6]=
  1.1023 +!  237		                    !     dt[ 5]=     dt[ 4]=     dt[ 3]=     dt[ 2]=     dt[ 1]=Zero;
  1.1024 +!  239		                    !     pdn_0=pdn[0];
  1.1025 +!  240		                    !     pdm1_0=pdm1[0];
  1.1026 +!  242		                    !     digit=mod(lower32(a,Zero)*dn0,TwoToMinus16,TwoTo16);
  1.1027 +!  243		                    !     pdtj=&(dt[0]);
  1.1028 +!  245		                    !     for(j=0;j<32;j++,pdtj++)
  1.1029 +!  246		                    !       {
  1.1030 +!  248		                    !	 m2j=pdm2[j];
  1.1031 +!  249		                    !	 a=pdtj[0]+pdn_0*digit;
  1.1032 +!  250		                    !	 b=pdtj[1]+pdm1_0*pdm2[j+1]+a*TwoToMinus16;
  1.1033 +!  251		                    !	 pdtj[1]=b;
  1.1034 +!  253		                    !	 /**** this loop will be fully unrolled:
  1.1035 +!  254		                    !	 for(i=1;i<16;i++)
  1.1036 +!  255		                    !	   {
  1.1037 +!  256		                    !	     pdtj[2*i]+=pdm1[i]*m2j+pdn[i]*digit;
  1.1038 +!  257		                    !	   }
  1.1039 +!  258		                    !	 *************************************/
  1.1040 +!  259		                    !	     pdtj[2]+=pdm1[1]*m2j+pdn[1]*digit;
  1.1041 +!  260		                    !	     pdtj[4]+=pdm1[2]*m2j+pdn[2]*digit;
  1.1042 +!  261		                    !	     pdtj[6]+=pdm1[3]*m2j+pdn[3]*digit;
  1.1043 +!  262		                    !	     pdtj[8]+=pdm1[4]*m2j+pdn[4]*digit;
  1.1044 +!  263		                    !	     pdtj[10]+=pdm1[5]*m2j+pdn[5]*digit;
  1.1045 +!  264		                    !	     pdtj[12]+=pdm1[6]*m2j+pdn[6]*digit;
  1.1046 +!  265		                    !	     pdtj[14]+=pdm1[7]*m2j+pdn[7]*digit;
  1.1047 +!  266		                    !	     pdtj[16]+=pdm1[8]*m2j+pdn[8]*digit;
  1.1048 +!  267		                    !	     pdtj[18]+=pdm1[9]*m2j+pdn[9]*digit;
  1.1049 +!  268		                    !	     pdtj[20]+=pdm1[10]*m2j+pdn[10]*digit;
  1.1050 +!  269		                    !	     pdtj[22]+=pdm1[11]*m2j+pdn[11]*digit;
  1.1051 +!  270		                    !	     pdtj[24]+=pdm1[12]*m2j+pdn[12]*digit;
  1.1052 +!  271		                    !	     pdtj[26]+=pdm1[13]*m2j+pdn[13]*digit;
  1.1053 +!  272		                    !	     pdtj[28]+=pdm1[14]*m2j+pdn[14]*digit;
  1.1054 +!  273		                    !	     pdtj[30]+=pdm1[15]*m2j+pdn[15]*digit;
  1.1055 +!  274		                    !	 /* no need for cleanup, cannot overflow */
  1.1056 +!  275		                    !	 digit=mod(lower32(b,Zero)*dn0,TwoToMinus16,TwoTo16);
  1.1057 +!  276		                    !       }
  1.1058 +!  277		                    !   }
  1.1059 +!  279		                    ! conv_d16_to_i32(result,dt+2*nlen,(long long *)dt,nlen+1);
  1.1060 +!  281		                    ! adjust_montf_result(result,nint,nlen); 
  1.1061 +
  1.1062 +/* 0x002c	 281 ( 4  5) */		or	%g0,1,%o4
  1.1063 +/* 0x0030	 187 ( 6  9) */		ldd	[%fp+96],%f0
  1.1064 +/* 0x0034	 196 ( 7 10) */		ld	[%fp+92],%o0
  1.1065 +/* 0x0038	 187 ( 8  9) */		fmovd	%f0,%f16
  1.1066 +/* 0x003c	 196 ( 9 10) */		sll	%o0,4,%g2
  1.1067 +/* 0x0040	     ( 9 10) */		or	%g0,%o0,%g1
  1.1068 +/* 0x0044	 198 (10 11) */		cmp	%o0,16
  1.1069 +/* 0x0048	     (10 11) */		be,pn	%icc,.L77000289	! tprob=0.50
  1.1070 +/* 0x004c	     (10 11) */		std	%f2,[%o1+%g2]
  1.1071 +/* 0x0050	 200 (11 12) */		sll	%o0,2,%g2
  1.1072 +/* 0x0054	     (11 14) */		ldd	[%g4],%f2
  1.1073 +/* 0x0058	     (12 13) */		add	%g2,2,%o1
  1.1074 +/* 0x005c	     (12 13) */		add	%g2,1,%o3
  1.1075 +/* 0x0060	 196 (13 14) */		sll	%o0,1,%o7
  1.1076 +/* 0x0064	 200 (13 14) */		cmp	%o1,0
  1.1077 +/* 0x0068	     (13 14) */		ble,a,pt	%icc,.L900000755	! tprob=0.55
  1.1078 +/* 0x006c	     (14 17) */		ldd	[%i1],%f0
  1.1079 +/* 0x0070	     (14 15) */		cmp	%o1,3
  1.1080 +/* 0x0074	 281 (14 15) */		or	%g0,1,%o1
  1.1081 +/* 0x0078	     (14 15) */		bl,pn	%icc,.L77000279	! tprob=0.40
  1.1082 +/* 0x007c	     (15 16) */		add	%o2,8,%o0
  1.1083 +/* 0x0080	     (15 16) */		std	%f2,[%g5]
  1.1084 +/* 0x0084	   0 (16 17) */		or	%g0,%o0,%o2
  1.1085 +                                   .L900000726:		/* frequency 64.0 confidence 0.0 */
  1.1086 +/* 0x0088	     ( 3  5) */		ldd	[%g4],%f0
  1.1087 +/* 0x008c	     ( 3  4) */		add	%o4,1,%o4
  1.1088 +/* 0x0090	     ( 3  4) */		add	%o2,8,%o2
  1.1089 +/* 0x0094	     ( 4  4) */		cmp	%o4,%o3
  1.1090 +/* 0x0098	     ( 5  6) */		ble,pt	%icc,.L900000726	! tprob=0.50
  1.1091 +/* 0x009c	     ( 5  6) */		std	%f0,[%o2-8]
  1.1092 +                                   .L900000729:		/* frequency 8.0 confidence 0.0 */
  1.1093 +/* 0x00a0	     ( 0  1) */		ba	.L900000755	! tprob=1.00
  1.1094 +/* 0x00a4	     ( 0  3) */		ldd	[%i1],%f0
  1.1095 +                                   .L77000279:		/* frequency 0.6 confidence 0.0 */
  1.1096 +/* 0x00a8	     ( 0  1) */		std	%f2,[%o2]
  1.1097 +                                   .L900000754:		/* frequency 5.3 confidence 0.0 */
  1.1098 +/* 0x00ac	     ( 0  3) */		ldd	[%g4],%f2
  1.1099 +/* 0x00b0	     ( 0  1) */		cmp	%o1,%o3
  1.1100 +/* 0x00b4	     ( 0  1) */		add	%o2,8,%o2
  1.1101 +/* 0x00b8	     ( 1  2) */		add	%o1,1,%o1
  1.1102 +/* 0x00bc	     ( 1  2) */		ble,a,pt	%icc,.L900000754	! tprob=0.87
  1.1103 +/* 0x00c0	     ( 3  4) */		std	%f2,[%o2]
  1.1104 +                                   .L77000284:		/* frequency 0.8 confidence 0.0 */
  1.1105 +/* 0x00c4	 202 ( 0  3) */		ldd	[%i1],%f0
  1.1106 +                                   .L900000755:		/* frequency 0.8 confidence 0.0 */
  1.1107 +/* 0x00c8	 202 ( 0  3) */		ldd	[%i0],%f2
  1.1108 +/* 0x00cc	     ( 0  1) */		add	%o7,1,%o2
  1.1109 +/* 0x00d0	 206 ( 0  1) */		cmp	%o7,0
  1.1110 +/* 0x00d4	     ( 1  2) */		sll	%o2,1,%o0
  1.1111 +/* 0x00d8	     ( 1  2) */		sub	%o7,1,%o1
  1.1112 +/* 0x00dc	 202 ( 2  5) */		fmuld	%f0,%f2,%f0
  1.1113 +/* 0x00e0	     ( 2  3) */		std	%f0,[%g5]
  1.1114 +/* 0x00e4	     ( 2  3) */		sub	%g1,1,%o7
  1.1115 +/* 0x00e8	     ( 3  6) */		ldd	[%g4],%f6
  1.1116 +/* 0x00ec	   0 ( 3  4) */		or	%g0,%o7,%g3
  1.1117 +/* 0x00f0	     ( 3  4) */		or	%g0,0,%l0
  1.1118 +/* 0x00f4	     ( 4  7) */		ldd	[%g4-8],%f2
  1.1119 +/* 0x00f8	     ( 4  5) */		or	%g0,0,%i5
  1.1120 +/* 0x00fc	     ( 4  5) */		or	%g0,%o1,%o5
  1.1121 +/* 0x0100	     ( 5  8) */		fdtox	%f0,%f0
  1.1122 +/* 0x0104	     ( 5  8) */		ldd	[%g4-16],%f4
  1.1123 +/* 0x0108	     ( 5  6) */		or	%g0,%o0,%o3
  1.1124 +/* 0x010c	 210 ( 6  7) */		add	%i0,8,%o4
  1.1125 +/* 0x0110	     ( 6  7) */		or	%g0,0,%i4
  1.1126 +/* 0x0114	     ( 9 10) */		fmovs	%f6,%f0
  1.1127 +/* 0x0118	     (11 14) */		fxtod	%f0,%f0
  1.1128 +/* 0x011c	 203 (14 17) */		fmuld	%f0,%f16,%f0
  1.1129 +/* 0x0120	     (17 20) */		fmuld	%f0,%f2,%f2
  1.1130 +/* 0x0124	     (20 23) */		fdtox	%f2,%f2
  1.1131 +/* 0x0128	     (23 26) */		fxtod	%f2,%f2
  1.1132 +/* 0x012c	     (26 29) */		fmuld	%f2,%f4,%f2
  1.1133 +/* 0x0130	     (29 32) */		fsubd	%f0,%f2,%f22
  1.1134 +/* 0x0134	 206 (29 30) */		ble,pt	%icc,.L900000748	! tprob=0.60
  1.1135 +/* 0x0138	     (29 30) */		sll	%g1,4,%g2
  1.1136 +/* 0x013c	 210 (30 33) */		ldd	[%i2],%f0
  1.1137 +                                   .L900000749:		/* frequency 5.3 confidence 0.0 */
  1.1138 +/* 0x0140	 210 ( 0  3) */		fmuld	%f0,%f22,%f8
  1.1139 +/* 0x0144	     ( 0  3) */		ldd	[%i1],%f0
  1.1140 +/* 0x0148	 214 ( 0  1) */		cmp	%g1,1
  1.1141 +/* 0x014c	 210 ( 1  4) */		ldd	[%o4+%i4],%f6
  1.1142 +/* 0x0150	     ( 1  2) */		add	%i1,8,%o0
  1.1143 +/* 0x0154	 214 ( 1  2) */		or	%g0,1,%o1
  1.1144 +/* 0x0158	 210 ( 2  5) */		ldd	[%i3],%f2
  1.1145 +/* 0x015c	     ( 2  3) */		add	%i3,16,%l1
  1.1146 +/* 0x0160	     ( 3  6) */		fmuld	%f0,%f6,%f6
  1.1147 +/* 0x0164	     ( 3  6) */		ldd	[%g4-8],%f4
  1.1148 +/* 0x0168	     ( 4  7) */		faddd	%f2,%f8,%f2
  1.1149 +/* 0x016c	     ( 4  7) */		ldd	[%i3+8],%f0
  1.1150 +/* 0x0170	 208 ( 5  8) */		ldd	[%i0+%i4],%f20
  1.1151 +/* 0x0174	 210 ( 6  9) */		faddd	%f0,%f6,%f0
  1.1152 +/* 0x0178	     ( 7 10) */		fmuld	%f2,%f4,%f2
  1.1153 +/* 0x017c	     (10 13) */		faddd	%f0,%f2,%f18
  1.1154 +/* 0x0180	 211 (10 11) */		std	%f18,[%i3+8]
  1.1155 +/* 0x0184	 214 (10 11) */		ble,pt	%icc,.L900000753	! tprob=0.54
  1.1156 +/* 0x0188	     (11 12) */		srl	%i5,31,%g2
  1.1157 +/* 0x018c	     (11 12) */		cmp	%g3,7
  1.1158 +/* 0x0190	 210 (12 13) */		add	%i2,8,%g2
  1.1159 +/* 0x0194	 214 (12 13) */		bl,pn	%icc,.L77000281	! tprob=0.36
  1.1160 +/* 0x0198	     (13 14) */		add	%g2,24,%o2
  1.1161 +/* 0x019c	 216 (13 16) */		ldd	[%o0+16],%f14
  1.1162 +/* 0x01a0	     (13 14) */		add	%i3,48,%l1
  1.1163 +/* 0x01a4	     (14 17) */		ldd	[%o0+24],%f12
  1.1164 +/* 0x01a8	   0 (14 15) */		or	%g0,%o2,%g2
  1.1165 +/* 0x01ac	 214 (14 15) */		sub	%g1,3,%o2
  1.1166 +/* 0x01b0	 216 (15 18) */		ldd	[%o0],%f2
  1.1167 +/* 0x01b4	     (15 16) */		or	%g0,5,%o1
  1.1168 +/* 0x01b8	     (16 19) */		ldd	[%g2-24],%f0
  1.1169 +/* 0x01bc	     (17 20) */		ldd	[%o0+8],%f6
  1.1170 +/* 0x01c0	     (17 20) */		fmuld	%f2,%f20,%f2
  1.1171 +/* 0x01c4	     (17 18) */		add	%o0,32,%o0
  1.1172 +/* 0x01c8	     (18 21) */		ldd	[%g2-16],%f8
  1.1173 +/* 0x01cc	     (18 21) */		fmuld	%f0,%f22,%f4
  1.1174 +/* 0x01d0	     (19 22) */		ldd	[%i3+16],%f0
  1.1175 +/* 0x01d4	     (19 22) */		fmuld	%f6,%f20,%f10
  1.1176 +/* 0x01d8	     (20 23) */		ldd	[%g2-8],%f6
  1.1177 +/* 0x01dc	     (21 24) */		faddd	%f2,%f4,%f4
  1.1178 +/* 0x01e0	     (21 24) */		ldd	[%i3+32],%f2
  1.1179 +                                   .L900000738:		/* frequency 512.0 confidence 0.0 */
  1.1180 +/* 0x01e4	 216 (16 24) */		ldd	[%g2],%f24
  1.1181 +/* 0x01e8	     (16 17) */		add	%o1,3,%o1
  1.1182 +/* 0x01ec	     (16 17) */		add	%g2,24,%g2
  1.1183 +/* 0x01f0	     (16 19) */		fmuld	%f8,%f22,%f8
  1.1184 +/* 0x01f4	     (17 25) */		ldd	[%l1],%f28
  1.1185 +/* 0x01f8	     (17 17) */		cmp	%o1,%o2
  1.1186 +/* 0x01fc	     (17 18) */		add	%o0,24,%o0
  1.1187 +/* 0x0200	     (18 26) */		ldd	[%o0-24],%f26
  1.1188 +/* 0x0204	     (18 21) */		faddd	%f0,%f4,%f0
  1.1189 +/* 0x0208	     (18 19) */		add	%l1,48,%l1
  1.1190 +/* 0x020c	     (19 22) */		faddd	%f10,%f8,%f10
  1.1191 +/* 0x0210	     (19 22) */		fmuld	%f14,%f20,%f4
  1.1192 +/* 0x0214	     (19 20) */		std	%f0,[%l1-80]
  1.1193 +/* 0x0218	     (20 28) */		ldd	[%g2-16],%f8
  1.1194 +/* 0x021c	     (20 23) */		fmuld	%f6,%f22,%f6
  1.1195 +/* 0x0220	     (21 29) */		ldd	[%l1-32],%f0
  1.1196 +/* 0x0224	     (22 30) */		ldd	[%o0-16],%f14
  1.1197 +/* 0x0228	     (22 25) */		faddd	%f2,%f10,%f2
  1.1198 +/* 0x022c	     (23 26) */		faddd	%f4,%f6,%f10
  1.1199 +/* 0x0230	     (23 26) */		fmuld	%f12,%f20,%f4
  1.1200 +/* 0x0234	     (23 24) */		std	%f2,[%l1-64]
  1.1201 +/* 0x0238	     (24 32) */		ldd	[%g2-8],%f6
  1.1202 +/* 0x023c	     (24 27) */		fmuld	%f24,%f22,%f24
  1.1203 +/* 0x0240	     (25 33) */		ldd	[%l1-16],%f2
  1.1204 +/* 0x0244	     (26 34) */		ldd	[%o0-8],%f12
  1.1205 +/* 0x0248	     (26 29) */		faddd	%f28,%f10,%f10
  1.1206 +/* 0x024c	     (27 28) */		std	%f10,[%l1-48]
  1.1207 +/* 0x0250	     (27 30) */		fmuld	%f26,%f20,%f10
  1.1208 +/* 0x0254	     (27 28) */		ble,pt	%icc,.L900000738	! tprob=0.50
  1.1209 +/* 0x0258	     (27 30) */		faddd	%f4,%f24,%f4
  1.1210 +                                   .L900000741:		/* frequency 64.0 confidence 0.0 */
  1.1211 +/* 0x025c	 216 ( 0  3) */		fmuld	%f8,%f22,%f28
  1.1212 +/* 0x0260	     ( 0  3) */		ldd	[%g2],%f24
  1.1213 +/* 0x0264	     ( 0  3) */		faddd	%f0,%f4,%f26
  1.1214 +/* 0x0268	     ( 1  4) */		fmuld	%f12,%f20,%f8
  1.1215 +/* 0x026c	     ( 1  2) */		add	%l1,32,%l1
  1.1216 +/* 0x0270	     ( 1  2) */		cmp	%o1,%g3
  1.1217 +/* 0x0274	     ( 2  5) */		fmuld	%f14,%f20,%f14
  1.1218 +/* 0x0278	     ( 2  5) */		ldd	[%l1-32],%f4
  1.1219 +/* 0x027c	     ( 2  3) */		add	%g2,8,%g2
  1.1220 +/* 0x0280	     ( 3  6) */		faddd	%f10,%f28,%f12
  1.1221 +/* 0x0284	     ( 3  6) */		fmuld	%f6,%f22,%f6
  1.1222 +/* 0x0288	     ( 3  6) */		ldd	[%l1-16],%f0
  1.1223 +/* 0x028c	     ( 4  7) */		fmuld	%f24,%f22,%f10
  1.1224 +/* 0x0290	     ( 4  5) */		std	%f26,[%l1-64]
  1.1225 +/* 0x0294	     ( 6  9) */		faddd	%f2,%f12,%f2
  1.1226 +/* 0x0298	     ( 6  7) */		std	%f2,[%l1-48]
  1.1227 +/* 0x029c	     ( 7 10) */		faddd	%f14,%f6,%f6
  1.1228 +/* 0x02a0	     ( 8 11) */		faddd	%f8,%f10,%f2
  1.1229 +/* 0x02a4	     (10 13) */		faddd	%f4,%f6,%f4
  1.1230 +/* 0x02a8	     (10 11) */		std	%f4,[%l1-32]
  1.1231 +/* 0x02ac	     (11 14) */		faddd	%f0,%f2,%f0
  1.1232 +/* 0x02b0	     (11 12) */		bg,pn	%icc,.L77000213	! tprob=0.13
  1.1233 +/* 0x02b4	     (11 12) */		std	%f0,[%l1-16]
  1.1234 +                                   .L77000281:		/* frequency 4.0 confidence 0.0 */
  1.1235 +/* 0x02b8	 216 ( 0  3) */		ldd	[%o0],%f0
  1.1236 +                                   .L900000752:		/* frequency 36.6 confidence 0.0 */
  1.1237 +/* 0x02bc	 216 ( 0  3) */		ldd	[%g2],%f4
  1.1238 +/* 0x02c0	     ( 0  3) */		fmuld	%f0,%f20,%f2
  1.1239 +/* 0x02c4	     ( 0  1) */		add	%o1,1,%o1
  1.1240 +/* 0x02c8	     ( 1  4) */		ldd	[%l1],%f0
  1.1241 +/* 0x02cc	     ( 1  2) */		add	%o0,8,%o0
  1.1242 +/* 0x02d0	     ( 1  2) */		add	%g2,8,%g2
  1.1243 +/* 0x02d4	     ( 2  5) */		fmuld	%f4,%f22,%f4
  1.1244 +/* 0x02d8	     ( 2  3) */		cmp	%o1,%g3
  1.1245 +/* 0x02dc	     ( 5  8) */		faddd	%f2,%f4,%f2
  1.1246 +/* 0x02e0	     ( 8 11) */		faddd	%f0,%f2,%f0
  1.1247 +/* 0x02e4	     ( 8  9) */		std	%f0,[%l1]
  1.1248 +/* 0x02e8	     ( 8  9) */		add	%l1,16,%l1
  1.1249 +/* 0x02ec	     ( 8  9) */		ble,a,pt	%icc,.L900000752	! tprob=0.87
  1.1250 +/* 0x02f0	     (10 13) */		ldd	[%o0],%f0
  1.1251 +                                   .L77000213:		/* frequency 5.3 confidence 0.0 */
  1.1252 +/* 0x02f4	     ( 0  1) */		srl	%i5,31,%g2
  1.1253 +                                   .L900000753:		/* frequency 5.3 confidence 0.0 */
  1.1254 +/* 0x02f8	 218 ( 0  1) */		cmp	%l0,30
  1.1255 +/* 0x02fc	     ( 0  1) */		bne,a,pt	%icc,.L900000751	! tprob=0.54
  1.1256 +/* 0x0300	     ( 0  3) */		fdtox	%f18,%f0
  1.1257 +/* 0x0304	     ( 1  2) */		add	%i5,%g2,%g2
  1.1258 +/* 0x0308	     ( 1  2) */		sub	%o3,1,%o2
  1.1259 +/* 0x030c	     ( 2  3) */		sra	%g2,1,%o0
  1.1260 +/* 0x0310	 216 ( 2  5) */		ldd	[%g4],%f0
  1.1261 +/* 0x0314	     ( 3  4) */		add	%o0,1,%g2
  1.1262 +/* 0x0318	     ( 4  5) */		sll	%g2,1,%o0
  1.1263 +/* 0x031c	     ( 4  5) */		fmovd	%f0,%f2
  1.1264 +/* 0x0320	     ( 5  6) */		sll	%g2,4,%o1
  1.1265 +/* 0x0324	     ( 5  6) */		cmp	%o0,%o3
  1.1266 +/* 0x0328	     ( 5  6) */		bge,pt	%icc,.L77000215	! tprob=0.53
  1.1267 +/* 0x032c	     ( 6  7) */		or	%g0,0,%l0
  1.1268 +/* 0x0330	 218 ( 6  7) */		add	%g5,%o1,%o1
  1.1269 +/* 0x0334	 216 ( 7 10) */		ldd	[%o1],%f8
  1.1270 +                                   .L900000750:		/* frequency 32.0 confidence 0.0 */
  1.1271 +/* 0x0338	     ( 0  3) */		fdtox	%f8,%f6
  1.1272 +/* 0x033c	     ( 0  3) */		ldd	[%g4],%f10
  1.1273 +/* 0x0340	     ( 0  1) */		add	%o0,2,%o0
  1.1274 +/* 0x0344	     ( 1  4) */		ldd	[%o1+8],%f4
  1.1275 +/* 0x0348	     ( 1  4) */		fdtox	%f8,%f8
  1.1276 +/* 0x034c	     ( 1  2) */		cmp	%o0,%o2
  1.1277 +/* 0x0350	     ( 5  6) */		fmovs	%f10,%f6
  1.1278 +/* 0x0354	     ( 7 10) */		fxtod	%f6,%f10
  1.1279 +/* 0x0358	     ( 8 11) */		fdtox	%f4,%f6
  1.1280 +/* 0x035c	     ( 9 12) */		fdtox	%f4,%f4
  1.1281 +/* 0x0360	     (10 13) */		faddd	%f10,%f2,%f2
  1.1282 +/* 0x0364	     (10 11) */		std	%f2,[%o1]
  1.1283 +/* 0x0368	     (12 15) */		ldd	[%g4],%f2
  1.1284 +/* 0x036c	     (14 15) */		fmovs	%f2,%f6
  1.1285 +/* 0x0370	     (16 19) */		fxtod	%f6,%f6
  1.1286 +/* 0x0374	     (17 20) */		fitod	%f8,%f2
  1.1287 +/* 0x0378	     (19 22) */		faddd	%f6,%f0,%f0
  1.1288 +/* 0x037c	     (19 20) */		std	%f0,[%o1+8]
  1.1289 +/* 0x0380	     (19 20) */		add	%o1,16,%o1
  1.1290 +/* 0x0384	     (20 23) */		fitod	%f4,%f0
  1.1291 +/* 0x0388	     (20 21) */		ble,a,pt	%icc,.L900000750	! tprob=0.87
  1.1292 +/* 0x038c	     (20 23) */		ldd	[%o1],%f8
  1.1293 +                                   .L77000233:		/* frequency 4.6 confidence 0.0 */
  1.1294 +/* 0x0390	     ( 0  0) */		or	%g0,0,%l0
  1.1295 +                                   .L77000215:		/* frequency 5.3 confidence 0.0 */
  1.1296 +/* 0x0394	     ( 0  3) */		fdtox	%f18,%f0
  1.1297 +                                   .L900000751:		/* frequency 5.3 confidence 0.0 */
  1.1298 +/* 0x0398	     ( 0  3) */		ldd	[%g4],%f6
  1.1299 +/* 0x039c	 220 ( 0  1) */		add	%i5,1,%i5
  1.1300 +/* 0x03a0	     ( 0  1) */		add	%i4,8,%i4
  1.1301 +/* 0x03a4	     ( 1  4) */		ldd	[%g4-8],%f2
  1.1302 +/* 0x03a8	     ( 1  2) */		add	%l0,1,%l0
  1.1303 +/* 0x03ac	     ( 1  2) */		add	%i3,8,%i3
  1.1304 +/* 0x03b0	     ( 2  3) */		fmovs	%f6,%f0
  1.1305 +/* 0x03b4	     ( 2  5) */		ldd	[%g4-16],%f4
  1.1306 +/* 0x03b8	     ( 2  3) */		cmp	%i5,%o5
  1.1307 +/* 0x03bc	     ( 4  7) */		fxtod	%f0,%f0
  1.1308 +/* 0x03c0	     ( 7 10) */		fmuld	%f0,%f16,%f0
  1.1309 +/* 0x03c4	     (10 13) */		fmuld	%f0,%f2,%f2
  1.1310 +/* 0x03c8	     (13 16) */		fdtox	%f2,%f2
  1.1311 +/* 0x03cc	     (16 19) */		fxtod	%f2,%f2
  1.1312 +/* 0x03d0	     (19 22) */		fmuld	%f2,%f4,%f2
  1.1313 +/* 0x03d4	     (22 25) */		fsubd	%f0,%f2,%f22
  1.1314 +/* 0x03d8	     (22 23) */		ble,a,pt	%icc,.L900000749	! tprob=0.89
  1.1315 +/* 0x03dc	     (22 25) */		ldd	[%i2],%f0
  1.1316 +                                   .L900000725:		/* frequency 0.7 confidence 0.0 */
  1.1317 +/* 0x03e0	 220 ( 0  1) */		ba	.L900000748	! tprob=1.00
  1.1318 +/* 0x03e4	     ( 0  1) */		sll	%g1,4,%g2
  1.1319 +
  1.1320 +	
  1.1321 +                                   .L77000289:		/* frequency 0.8 confidence 0.0 */
  1.1322 +/* 0x03e8	 225 ( 0  3) */		ldd	[%o1],%f6
  1.1323 +/* 0x03ec	 242 ( 0  1) */		add	%g4,-8,%g2
  1.1324 +/* 0x03f0	     ( 0  1) */		add	%g4,-16,%g3
  1.1325 +/* 0x03f4	 225 ( 1  4) */		ldd	[%i1],%f2
  1.1326 +/* 0x03f8	 245 ( 1  2) */		or	%g0,0,%o3
  1.1327 +/* 0x03fc	     ( 1  2) */		or	%g0,0,%o0
  1.1328 +/* 0x0400	 225 ( 3  6) */		fmuld	%f2,%f6,%f2
  1.1329 +/* 0x0404	     ( 3  4) */		std	%f2,[%o2]
  1.1330 +/* 0x0408	     ( 4  7) */		ldd	[%g4],%f6
  1.1331 +/* 0x040c	 237 ( 7  8) */		std	%f6,[%o2+8]
  1.1332 +/* 0x0410	     ( 8  9) */		std	%f6,[%o2+16]
  1.1333 +/* 0x0414	     ( 9 10) */		std	%f6,[%o2+24]
  1.1334 +/* 0x0418	     (10 11) */		std	%f6,[%o2+32]
  1.1335 +/* 0x041c	     (11 12) */		std	%f6,[%o2+40]
  1.1336 +/* 0x0420	     (12 13) */		std	%f6,[%o2+48]
  1.1337 +/* 0x0424	     (13 14) */		std	%f6,[%o2+56]
  1.1338 +/* 0x0428	     (14 15) */		std	%f6,[%o2+64]
  1.1339 +/* 0x042c	     (15 16) */		std	%f6,[%o2+72]
  1.1340 +!	prefetch	[%i4],0
  1.1341 +!	prefetch	[%i4+32],0
  1.1342 +!	prefetch	[%i4+64],0
  1.1343 +!	prefetch	[%i4+96],0
  1.1344 +!	prefetch	[%i4+120],0
  1.1345 +!	prefetch	[%i1],0
  1.1346 +!	prefetch	[%i1+32],0
  1.1347 +!	prefetch	[%i1+64],0
  1.1348 +!	prefetch	[%i1+96],0
  1.1349 +!	prefetch	[%i1+120],0
  1.1350 +/* 0x0430	     (16 17) */		std	%f6,[%o2+80]
  1.1351 +/* 0x0434	     (17 18) */		std	%f6,[%o2+88]
  1.1352 +/* 0x0438	     (18 19) */		std	%f6,[%o2+96]
  1.1353 +/* 0x043c	     (19 20) */		std	%f6,[%o2+104]
  1.1354 +/* 0x0440	     (20 21) */		std	%f6,[%o2+112]
  1.1355 +/* 0x0444	     (21 22) */		std	%f6,[%o2+120]
  1.1356 +/* 0x0448	     (22 23) */		std	%f6,[%o2+128]
  1.1357 +/* 0x044c	     (23 24) */		std	%f6,[%o2+136]
  1.1358 +/* 0x0450	     (24 25) */		std	%f6,[%o2+144]
  1.1359 +/* 0x0454	     (25 26) */		std	%f6,[%o2+152]
  1.1360 +/* 0x0458	     (26 27) */		std	%f6,[%o2+160]
  1.1361 +/* 0x045c	     (27 28) */		std	%f6,[%o2+168]
  1.1362 +/* 0x0460	     (27 30) */		fdtox	%f2,%f2
  1.1363 +/* 0x0464	     (28 29) */		std	%f6,[%o2+176]
  1.1364 +/* 0x0468	     (29 30) */		std	%f6,[%o2+184]
  1.1365 +/* 0x046c	     (30 31) */		std	%f6,[%o2+192]
  1.1366 +/* 0x0470	     (31 32) */		std	%f6,[%o2+200]
  1.1367 +/* 0x0474	     (32 33) */		std	%f6,[%o2+208]
  1.1368 +/* 0x0478	     (33 34) */		std	%f6,[%o2+216]
  1.1369 +/* 0x047c	     (34 35) */		std	%f6,[%o2+224]
  1.1370 +/* 0x0480	     (35 36) */		std	%f6,[%o2+232]
  1.1371 +/* 0x0484	     (36 37) */		std	%f6,[%o2+240]
  1.1372 +/* 0x0488	     (37 38) */		std	%f6,[%o2+248]
  1.1373 +/* 0x048c	     (38 39) */		std	%f6,[%o2+256]
  1.1374 +/* 0x0490	     (39 40) */		std	%f6,[%o2+264]
  1.1375 +/* 0x0494	     (40 41) */		std	%f6,[%o2+272]
  1.1376 +/* 0x0498	     (41 42) */		std	%f6,[%o2+280]
  1.1377 +/* 0x049c	     (42 43) */		std	%f6,[%o2+288]
  1.1378 +/* 0x04a0	     (43 44) */		std	%f6,[%o2+296]
  1.1379 +/* 0x04a4	     (44 45) */		std	%f6,[%o2+304]
  1.1380 +/* 0x04a8	     (45 46) */		std	%f6,[%o2+312]
  1.1381 +/* 0x04ac	     (46 47) */		std	%f6,[%o2+320]
  1.1382 +/* 0x04b0	     (47 48) */		std	%f6,[%o2+328]
  1.1383 +/* 0x04b4	     (48 49) */		std	%f6,[%o2+336]
  1.1384 +/* 0x04b8	     (49 50) */		std	%f6,[%o2+344]
  1.1385 +/* 0x04bc	     (50 51) */		std	%f6,[%o2+352]
  1.1386 +/* 0x04c0	     (51 52) */		std	%f6,[%o2+360]
  1.1387 +/* 0x04c4	     (52 53) */		std	%f6,[%o2+368]
  1.1388 +/* 0x04c8	     (53 54) */		std	%f6,[%o2+376]
  1.1389 +/* 0x04cc	     (54 55) */		std	%f6,[%o2+384]
  1.1390 +/* 0x04d0	     (55 56) */		std	%f6,[%o2+392]
  1.1391 +/* 0x04d4	     (56 57) */		std	%f6,[%o2+400]
  1.1392 +/* 0x04d8	     (57 58) */		std	%f6,[%o2+408]
  1.1393 +/* 0x04dc	     (58 59) */		std	%f6,[%o2+416]
  1.1394 +/* 0x04e0	     (59 60) */		std	%f6,[%o2+424]
  1.1395 +/* 0x04e4	     (60 61) */		std	%f6,[%o2+432]
  1.1396 +/* 0x04e8	     (61 62) */		std	%f6,[%o2+440]
  1.1397 +/* 0x04ec	     (62 63) */		std	%f6,[%o2+448]
  1.1398 +/* 0x04f0	     (63 64) */		std	%f6,[%o2+456]
  1.1399 +/* 0x04f4	     (64 65) */		std	%f6,[%o2+464]
  1.1400 +/* 0x04f8	     (65 66) */		std	%f6,[%o2+472]
  1.1401 +/* 0x04fc	     (66 67) */		std	%f6,[%o2+480]
  1.1402 +/* 0x0500	     (67 68) */		std	%f6,[%o2+488]
  1.1403 +/* 0x0504	     (68 69) */		std	%f6,[%o2+496]
  1.1404 +/* 0x0508	     (69 70) */		std	%f6,[%o2+504]
  1.1405 +/* 0x050c	     (70 71) */		std	%f6,[%o2+512]
  1.1406 +/* 0x0510	     (71 72) */		std	%f6,[%o2+520]
  1.1407 +/* 0x0514	 242 (72 75) */		ld	[%g4],%f2 ! dalign
  1.1408 +/* 0x0518	     (73 76) */		ld	[%g2],%f6 ! dalign
  1.1409 +/* 0x051c	     (74 77) */		fxtod	%f2,%f10
  1.1410 +/* 0x0520	     (74 77) */		ld	[%g2+4],%f7
  1.1411 +/* 0x0524	     (75 78) */		ld	[%g3],%f8 ! dalign
  1.1412 +/* 0x0528	     (76 79) */		ld	[%g3+4],%f9
  1.1413 +/* 0x052c	     (77 80) */		fmuld	%f10,%f0,%f0
  1.1414 +/* 0x0530	 239 (77 80) */		ldd	[%i4],%f4
  1.1415 +/* 0x0534	 240 (78 81) */		ldd	[%i1],%f2
  1.1416 +/* 0x0538	     (80 83) */		fmuld	%f0,%f6,%f6
  1.1417 +/* 0x053c	     (83 86) */		fdtox	%f6,%f6
  1.1418 +/* 0x0540	     (86 89) */		fxtod	%f6,%f6
  1.1419 +/* 0x0544	     (89 92) */		fmuld	%f6,%f8,%f6
  1.1420 +/* 0x0548	     (92 95) */		fsubd	%f0,%f6,%f0
  1.1421 +/* 0x054c	 250 (95 98) */		fmuld	%f4,%f0,%f10
  1.1422 +                                   .L900000747:		/* frequency 6.4 confidence 0.0 */
  1.1423 +
  1.1424 +
  1.1425 +	fmovd %f0,%f0
  1.1426 +	fmovd %f16,%f18
  1.1427 +	ldd [%i4],%f2
  1.1428 +	ldd [%o2],%f8
  1.1429 +	ldd [%i1],%f10
  1.1430 +	ldd [%g4-8],%f14
  1.1431 +	ldd [%g4-16],%f16
  1.1432 +	ldd [%o1],%f24
  1.1433 +
  1.1434 +	ldd [%i1+8],%f26
  1.1435 +	ldd [%i1+16],%f40
  1.1436 +	ldd [%i1+48],%f46
  1.1437 +	ldd [%i1+56],%f30
  1.1438 +	ldd [%i1+64],%f54
  1.1439 +	ldd [%i1+104],%f34
  1.1440 +	ldd [%i1+112],%f58
  1.1441 +
  1.1442 +	ldd [%i4+112],%f60
  1.1443 +	ldd [%i4+8],%f28	
  1.1444 +	ldd [%i4+104],%f38
  1.1445 +
  1.1446 +	nop
  1.1447 +	nop
  1.1448 +!
  1.1449 +	.L99999999:
  1.1450 +!1
  1.1451 +!!!
  1.1452 +	ldd	[%i1+24],%f32
  1.1453 +	fmuld	%f0,%f2,%f4
  1.1454 +!2
  1.1455 +!!!
  1.1456 +	ldd	[%i4+24],%f36
  1.1457 +	fmuld	%f26,%f24,%f20
  1.1458 +!3
  1.1459 +!!!
  1.1460 +	ldd	[%i1+40],%f42
  1.1461 +	fmuld	%f28,%f0,%f22
  1.1462 +!4
  1.1463 +!!!
  1.1464 +	ldd	[%i4+40],%f44
  1.1465 +	fmuld	%f32,%f24,%f32
  1.1466 +!5
  1.1467 +!!!
  1.1468 +	ldd	[%o1+8],%f6
  1.1469 +	faddd	%f4,%f8,%f4
  1.1470 +	fmuld	%f36,%f0,%f36
  1.1471 +!6
  1.1472 +!!!
  1.1473 +	add	%o1,8,%o1
  1.1474 +	ldd	[%i4+56],%f50
  1.1475 +	fmuld	%f42,%f24,%f42
  1.1476 +!7
  1.1477 +!!!
  1.1478 +	ldd	[%i1+72],%f52
  1.1479 +	faddd	%f20,%f22,%f20
  1.1480 +	fmuld	%f44,%f0,%f44
  1.1481 +!8
  1.1482 +!!!
  1.1483 +	ldd	[%o2+16],%f22
  1.1484 +	fmuld	%f10,%f6,%f12
  1.1485 +!9
  1.1486 +!!!
  1.1487 +	ldd	[%i4+72],%f56
  1.1488 +	faddd	%f32,%f36,%f32
  1.1489 +	fmuld	%f14,%f4,%f4
  1.1490 +!10
  1.1491 +!!!
  1.1492 +	ldd	[%o2+48],%f36
  1.1493 +	fmuld	%f30,%f24,%f48
  1.1494 +!11
  1.1495 +!!!
  1.1496 +	ldd	[%o2+8],%f8
  1.1497 +	faddd	%f20,%f22,%f20
  1.1498 +	fmuld	%f50,%f0,%f50	
  1.1499 +!12
  1.1500 +!!!
  1.1501 +	std	%f20,[%o2+16]
  1.1502 +	faddd	%f42,%f44,%f42
  1.1503 +	fmuld	%f52,%f24,%f52
  1.1504 +!13
  1.1505 +!!!
  1.1506 +	ldd	[%o2+80],%f44
  1.1507 +	faddd	%f4,%f12,%f4
  1.1508 +	fmuld	%f56,%f0,%f56
  1.1509 +!14
  1.1510 +!!!
  1.1511 +	ldd	[%i1+88],%f20
  1.1512 +	faddd	%f32,%f36,%f32
  1.1513 +!15
  1.1514 +!!!
  1.1515 +	ldd	[%i4+88],%f22
  1.1516 +	faddd	%f48,%f50,%f48
  1.1517 +!16
  1.1518 +!!!
  1.1519 +	ldd	[%o2+112],%f50
  1.1520 +	faddd	%f52,%f56,%f52
  1.1521 +!17
  1.1522 +!!!
  1.1523 +	ldd	[%o2+144],%f56
  1.1524 +	faddd	%f4,%f8,%f8
  1.1525 +	fmuld	%f20,%f24,%f20
  1.1526 +!18
  1.1527 +!!!
  1.1528 +	std	%f32,[%o2+48]
  1.1529 +	faddd	%f42,%f44,%f42
  1.1530 +	fmuld	%f22,%f0,%f22
  1.1531 +!19
  1.1532 +!!!
  1.1533 +	std	%f42,[%o2+80]
  1.1534 +	faddd	%f48,%f50,%f48
  1.1535 +	fmuld	%f34,%f24,%f32
  1.1536 +!20
  1.1537 +!!!
  1.1538 +	std	%f48,[%o2+112]
  1.1539 +	faddd	%f52,%f56,%f52
  1.1540 +	fmuld	%f38,%f0,%f36
  1.1541 +!21
  1.1542 +!!!
  1.1543 +	ldd	[%i1+120],%f42
  1.1544 +	fdtox	%f8,%f4
  1.1545 +!22
  1.1546 +!!!
  1.1547 +	std	%f52,[%o2+144]
  1.1548 +	faddd	%f20,%f22,%f20
  1.1549 +!23
  1.1550 +!!!
  1.1551 +	ldd	[%i4+120],%f44
  1.1552 +!24
  1.1553 +!!!
  1.1554 +	ldd	[%o2+176],%f22
  1.1555 +	faddd	%f32,%f36,%f32
  1.1556 +	fmuld	%f42,%f24,%f42
  1.1557 +!25
  1.1558 +!!!
  1.1559 +	ldd	[%i4+16],%f50
  1.1560 +	fmovs	%f17,%f4
  1.1561 +!26
  1.1562 +!!!
  1.1563 +	ldd	[%i1+32],%f52
  1.1564 +	fmuld	%f44,%f0,%f44
  1.1565 +!27
  1.1566 +!!!
  1.1567 +	ldd	[%i4+32],%f56
  1.1568 +	fmuld	%f40,%f24,%f48
  1.1569 +!28
  1.1570 +!!!
  1.1571 +	ldd	[%o2+208],%f36
  1.1572 +	faddd	%f20,%f22,%f20
  1.1573 +	fmuld	%f50,%f0,%f50
  1.1574 +!29
  1.1575 +!!!
  1.1576 +	std	%f20,[%o2+176]
  1.1577 +	fxtod	%f4,%f4
  1.1578 +	fmuld	%f52,%f24,%f52
  1.1579 +!30
  1.1580 +!!!
  1.1581 +	ldd	[%i4+48],%f22
  1.1582 +	faddd	%f42,%f44,%f42
  1.1583 +	fmuld	%f56,%f0,%f56
  1.1584 +!31
  1.1585 +!!!
  1.1586 +	ldd	[%o2+240],%f44
  1.1587 +	faddd	%f32,%f36,%f32
  1.1588 +!32
  1.1589 +!!!
  1.1590 +	std	%f32,[%o2+208]
  1.1591 +	faddd	%f48,%f50,%f48
  1.1592 +	fmuld	%f46,%f24,%f20
  1.1593 +!33
  1.1594 +!!!
  1.1595 +	ldd	[%o2+32],%f50
  1.1596 +	fmuld	%f4,%f18,%f12
  1.1597 +!34
  1.1598 +!!!
  1.1599 +	ldd	[%i4+64],%f36
  1.1600 +	faddd	%f52,%f56,%f52
  1.1601 +	fmuld	%f22,%f0,%f22
  1.1602 +!35
  1.1603 +!!!
  1.1604 +	ldd	[%o2+64],%f56
  1.1605 +	faddd	%f42,%f44,%f42
  1.1606 +!36
  1.1607 +!!!
  1.1608 +	std	%f42,[%o2+240]
  1.1609 +	faddd	%f48,%f50,%f48
  1.1610 +	fmuld	%f54,%f24,%f32
  1.1611 +!37
  1.1612 +!!!
  1.1613 +	std	%f48,[%o2+32]
  1.1614 +	fmuld	%f12,%f14,%f4
  1.1615 +!38
  1.1616 +!!!
  1.1617 +	ldd	[%i1+80],%f42
  1.1618 +	faddd	%f52,%f56,%f56	! yes, tmp52!
  1.1619 +	fmuld	%f36,%f0,%f36
  1.1620 +!39
  1.1621 +!!!
  1.1622 +	ldd	[%i4+80],%f44
  1.1623 +	faddd	%f20,%f22,%f20
  1.1624 +!40
  1.1625 +!!!
  1.1626 +	ldd	[%i1+96],%f48
  1.1627 +	fmuld	%f58,%f24,%f52
  1.1628 +!41
  1.1629 +!!!
  1.1630 +	ldd	[%i4+96],%f50
  1.1631 +	fdtox	%f4,%f4
  1.1632 +	fmuld	%f42,%f24,%f42
  1.1633 +!42
  1.1634 +!!!
  1.1635 +	std	%f56,[%o2+64]	! yes, tmp52!
  1.1636 +	faddd	%f32,%f36,%f32
  1.1637 +	fmuld	%f44,%f0,%f44
  1.1638 +!43
  1.1639 +!!!
  1.1640 +	ldd	[%o2+96],%f22
  1.1641 +	fmuld	%f48,%f24,%f48
  1.1642 +!44
  1.1643 +!!!
  1.1644 +	ldd	[%o2+128],%f36
  1.1645 +	fmovd	%f6,%f24
  1.1646 +	fmuld	%f50,%f0,%f50
  1.1647 +!45
  1.1648 +!!!
  1.1649 +	fxtod	%f4,%f4
  1.1650 +	fmuld	%f60,%f0,%f56
  1.1651 +!46
  1.1652 +!!!
  1.1653 +	add	%o2,8,%o2
  1.1654 +	faddd	%f42,%f44,%f42
  1.1655 +!47
  1.1656 +!!!
  1.1657 +	ldd	[%o2+160-8],%f44
  1.1658 +	faddd	%f20,%f22,%f20
  1.1659 +!48
  1.1660 +!!!
  1.1661 +	std	%f20,[%o2+96-8]
  1.1662 +	faddd	%f48,%f50,%f48
  1.1663 +!49
  1.1664 +!!!
  1.1665 +	ldd	[%o2+192-8],%f50
  1.1666 +	faddd	%f52,%f56,%f52
  1.1667 +	fmuld	%f4,%f16,%f4
  1.1668 +!50
  1.1669 +!!!
  1.1670 +	ldd	[%o2+224-8],%f56
  1.1671 +	faddd	%f32,%f36,%f32
  1.1672 +!51
  1.1673 +!!!
  1.1674 +	std	%f32,[%o2+128-8]
  1.1675 +	faddd	%f42,%f44,%f42
  1.1676 +!52
  1.1677 +	add	%o3,1,%o3
  1.1678 +	std	%f42,[%o2+160-8]
  1.1679 +	faddd	%f48,%f50,%f48
  1.1680 +!53
  1.1681 +!!!
  1.1682 +	cmp	%o3,31
  1.1683 +	std	%f48,[%o2+192-8]
  1.1684 +	faddd	%f52,%f56,%f52
  1.1685 +!54
  1.1686 +	std	%f52,[%o2+224-8]
  1.1687 +	ble,pt	%icc,.L99999999
  1.1688 +	fsubd	%f12,%f4,%f0
  1.1689 +
  1.1690 +
  1.1691 +
  1.1692 +!55
  1.1693 +	std %f8,[%o2]
  1.1694 +
  1.1695 +	
  1.1696 +	
  1.1697 +	
  1.1698 +	
  1.1699 +	
  1.1700 +	                                   .L77000285:		/* frequency 1.0 confidence 0.0 */
  1.1701 +/* 0x07a8	 279 ( 0  1) */		sll	%g1,4,%g2
  1.1702 +                                   .L900000748:		/* frequency 1.0 confidence 0.0 */
  1.1703 +/* 0x07ac	 279 ( 0  3) */		ldd	[%g5+%g2],%f0
  1.1704 +/* 0x07b0	     ( 0  1) */		add	%g5,%g2,%i1
  1.1705 +/* 0x07b4	     ( 0  1) */		or	%g0,0,%o4
  1.1706 +/* 0x07b8	 206 ( 1  4) */		ld	[%fp+68],%o0
  1.1707 +/* 0x07bc	 279 ( 1  2) */		or	%g0,0,%i0
  1.1708 +/* 0x07c0	     ( 1  2) */		cmp	%g1,0
  1.1709 +/* 0x07c4	     ( 2  5) */		fdtox	%f0,%f0
  1.1710 +/* 0x07c8	     ( 2  3) */		std	%f0,[%sp+120]
  1.1711 +/* 0x07cc	 275 ( 2  3) */		sethi	%hi(0xfc00),%o1
  1.1712 +/* 0x07d0	 206 ( 3  4) */		or	%g0,%o0,%o3
  1.1713 +/* 0x07d4	 275 ( 3  4) */		sub	%g1,1,%g4
  1.1714 +/* 0x07d8	 279 ( 4  7) */		ldd	[%i1+8],%f0
  1.1715 +/* 0x07dc	     ( 4  5) */		or	%g0,%o0,%g5
  1.1716 +/* 0x07e0	     ( 4  5) */		add	%o1,1023,%o1
  1.1717 +/* 0x07e4	     ( 6  9) */		fdtox	%f0,%f0
  1.1718 +/* 0x07e8	     ( 6  7) */		std	%f0,[%sp+112]
  1.1719 +/* 0x07ec	     (10 12) */		ldx	[%sp+112],%o5
  1.1720 +/* 0x07f0	     (11 13) */		ldx	[%sp+120],%o7
  1.1721 +/* 0x07f4	     (11 12) */		ble,pt	%icc,.L900000746	! tprob=0.56
  1.1722 +/* 0x07f8	     (11 12) */		sethi	%hi(0xfc00),%g2
  1.1723 +/* 0x07fc	 275 (12 13) */		or	%g0,-1,%g2
  1.1724 +/* 0x0800	 279 (12 13) */		cmp	%g1,3
  1.1725 +/* 0x0804	 275 (13 14) */		srl	%g2,0,%o2
  1.1726 +/* 0x0808	 279 (13 14) */		bl,pn	%icc,.L77000286	! tprob=0.44
  1.1727 +/* 0x080c	     (13 14) */		or	%g0,%i1,%g2
  1.1728 +/* 0x0810	     (14 17) */		ldd	[%i1+16],%f0
  1.1729 +/* 0x0814	     (14 15) */		and	%o5,%o1,%o0
  1.1730 +/* 0x0818	     (14 15) */		add	%i1,16,%g2
  1.1731 +/* 0x081c	     (15 16) */		sllx	%o0,16,%g3
  1.1732 +/* 0x0820	     (15 16) */		and	%o7,%o2,%o0
  1.1733 +/* 0x0824	     (16 19) */		fdtox	%f0,%f0
  1.1734 +/* 0x0828	     (16 17) */		std	%f0,[%sp+104]
  1.1735 +/* 0x082c	     (16 17) */		add	%o0,%g3,%o4
  1.1736 +/* 0x0830	     (17 20) */		ldd	[%i1+24],%f2
  1.1737 +/* 0x0834	     (17 18) */		srax	%o5,16,%o0
  1.1738 +/* 0x0838	     (17 18) */		add	%o3,4,%g5
  1.1739 +/* 0x083c	     (18 19) */		stx	%o0,[%sp+128]
  1.1740 +/* 0x0840	     (18 19) */		and	%o4,%o2,%o0
  1.1741 +/* 0x0844	     (18 19) */		or	%g0,1,%i0
  1.1742 +/* 0x0848	     (19 20) */		stx	%o0,[%sp+112]
  1.1743 +/* 0x084c	     (19 20) */		srax	%o4,32,%o0
  1.1744 +/* 0x0850	     (19 22) */		fdtox	%f2,%f0
  1.1745 +/* 0x0854	     (20 21) */		stx	%o0,[%sp+136]
  1.1746 +/* 0x0858	     (20 21) */		srax	%o7,32,%o4
  1.1747 +/* 0x085c	     (21 22) */		std	%f0,[%sp+96]
  1.1748 +/* 0x0860	     (22 24) */		ldx	[%sp+136],%o7
  1.1749 +/* 0x0864	     (23 25) */		ldx	[%sp+128],%o0
  1.1750 +/* 0x0868	     (25 27) */		ldx	[%sp+104],%g3
  1.1751 +/* 0x086c	     (25 26) */		add	%o0,%o7,%o0
  1.1752 +/* 0x0870	     (26 28) */		ldx	[%sp+112],%o7
  1.1753 +/* 0x0874	     (26 27) */		add	%o4,%o0,%o4
  1.1754 +/* 0x0878	     (27 29) */		ldx	[%sp+96],%o5
  1.1755 +/* 0x087c	     (28 29) */		st	%o7,[%o3]
  1.1756 +/* 0x0880	     (28 29) */		or	%g0,%g3,%o7
  1.1757 +                                   .L900000730:		/* frequency 64.0 confidence 0.0 */
  1.1758 +/* 0x0884	     (17 19) */		ldd	[%g2+16],%f0
  1.1759 +/* 0x0888	     (17 18) */		add	%i0,1,%i0
  1.1760 +/* 0x088c	     (17 18) */		add	%g5,4,%g5
  1.1761 +/* 0x0890	     (18 18) */		cmp	%i0,%g4
  1.1762 +/* 0x0894	     (18 19) */		add	%g2,16,%g2
  1.1763 +/* 0x0898	     (19 22) */		fdtox	%f0,%f0
  1.1764 +/* 0x089c	     (20 21) */		std	%f0,[%sp+104]
  1.1765 +/* 0x08a0	     (21 23) */		ldd	[%g2+8],%f0
  1.1766 +/* 0x08a4	     (23 26) */		fdtox	%f0,%f0
  1.1767 +/* 0x08a8	     (24 25) */		std	%f0,[%sp+96]
  1.1768 +/* 0x08ac	     (25 26) */		and	%o5,%o1,%g3
  1.1769 +/* 0x08b0	     (26 27) */		sllx	%g3,16,%g3
  1.1770 +/* 0x08b4	     ( 0  0) */		stx	%g3,[%sp+120]
  1.1771 +/* 0x08b8	     (26 27) */		and	%o7,%o2,%g3
  1.1772 +/* 0x08bc	     ( 0  0) */		stx	%o7,[%sp+128]
  1.1773 +/* 0x08c0	     ( 0  0) */		ldx	[%sp+120],%o7
  1.1774 +/* 0x08c4	     (27 27) */		add	%g3,%o7,%g3
  1.1775 +/* 0x08c8	     ( 0  0) */		ldx	[%sp+128],%o7
  1.1776 +/* 0x08cc	     (28 29) */		srax	%o5,16,%o5
  1.1777 +/* 0x08d0	     (28 28) */		add	%g3,%o4,%g3
  1.1778 +/* 0x08d4	     (29 30) */		srax	%g3,32,%o4
  1.1779 +/* 0x08d8	     ( 0  0) */		stx	%o4,[%sp+112]
  1.1780 +/* 0x08dc	     (30 31) */		srax	%o7,32,%o4
  1.1781 +/* 0x08e0	     ( 0  0) */		ldx	[%sp+112],%o7
  1.1782 +/* 0x08e4	     (30 31) */		add	%o5,%o7,%o7
  1.1783 +/* 0x08e8	     (31 33) */		ldx	[%sp+96],%o5
  1.1784 +/* 0x08ec	     (31 32) */		add	%o4,%o7,%o4
  1.1785 +/* 0x08f0	     (32 33) */		and	%g3,%o2,%g3
  1.1786 +/* 0x08f4	     ( 0  0) */		ldx	[%sp+104],%o7
  1.1787 +/* 0x08f8	     (33 34) */		ble,pt	%icc,.L900000730	! tprob=0.50
  1.1788 +/* 0x08fc	     (33 34) */		st	%g3,[%g5-4]
  1.1789 +                                   .L900000733:		/* frequency 8.0 confidence 0.0 */
  1.1790 +/* 0x0900	     ( 0  1) */		ba	.L900000746	! tprob=1.00
  1.1791 +/* 0x0904	     ( 0  1) */		sethi	%hi(0xfc00),%g2
  1.1792 +                                   .L77000286:		/* frequency 0.7 confidence 0.0 */
  1.1793 +/* 0x0908	     ( 0  3) */		ldd	[%g2+16],%f0
  1.1794 +                                   .L900000745:		/* frequency 6.4 confidence 0.0 */
  1.1795 +/* 0x090c	     ( 0  1) */		and	%o7,%o2,%o0
  1.1796 +/* 0x0910	     ( 0  1) */		and	%o5,%o1,%g3
  1.1797 +/* 0x0914	     ( 0  3) */		fdtox	%f0,%f0
  1.1798 +/* 0x0918	     ( 1  2) */		add	%o4,%o0,%o0
  1.1799 +/* 0x091c	     ( 1  2) */		std	%f0,[%sp+104]
  1.1800 +/* 0x0920	     ( 1  2) */		add	%i0,1,%i0
  1.1801 +/* 0x0924	     ( 2  3) */		sllx	%g3,16,%o4
  1.1802 +/* 0x0928	     ( 2  5) */		ldd	[%g2+24],%f2
  1.1803 +/* 0x092c	     ( 2  3) */		add	%g2,16,%g2
  1.1804 +/* 0x0930	     ( 3  4) */		add	%o0,%o4,%o4
  1.1805 +/* 0x0934	     ( 3  4) */		cmp	%i0,%g4
  1.1806 +/* 0x0938	     ( 4  5) */		srax	%o5,16,%o0
  1.1807 +/* 0x093c	     ( 4  5) */		stx	%o0,[%sp+112]
  1.1808 +/* 0x0940	     ( 4  5) */		and	%o4,%o2,%g3
  1.1809 +/* 0x0944	     ( 5  6) */		srax	%o4,32,%o5
  1.1810 +/* 0x0948	     ( 5  8) */		fdtox	%f2,%f0
  1.1811 +/* 0x094c	     ( 5  6) */		std	%f0,[%sp+96]
  1.1812 +/* 0x0950	     ( 6  7) */		srax	%o7,32,%o4
  1.1813 +/* 0x0954	     ( 6  8) */		ldx	[%sp+112],%o7
  1.1814 +/* 0x0958	     ( 8  9) */		add	%o7,%o5,%o7
  1.1815 +/* 0x095c	     ( 9 11) */		ldx	[%sp+104],%o5
  1.1816 +/* 0x0960	     ( 9 10) */		add	%o4,%o7,%o4
  1.1817 +/* 0x0964	     (10 12) */		ldx	[%sp+96],%o0
  1.1818 +/* 0x0968	     (11 12) */		st	%g3,[%g5]
  1.1819 +/* 0x096c	     (11 12) */		or	%g0,%o5,%o7
  1.1820 +/* 0x0970	     (11 12) */		add	%g5,4,%g5
  1.1821 +/* 0x0974	     (12 13) */		or	%g0,%o0,%o5
  1.1822 +/* 0x0978	     (12 13) */		ble,a,pt	%icc,.L900000745	! tprob=0.86
  1.1823 +/* 0x097c	     (12 15) */		ldd	[%g2+16],%f0
  1.1824 +                                   .L77000236:		/* frequency 1.0 confidence 0.0 */
  1.1825 +/* 0x0980	     ( 0  1) */		sethi	%hi(0xfc00),%g2
  1.1826 +                                   .L900000746:		/* frequency 1.0 confidence 0.0 */
  1.1827 +/* 0x0984	     ( 0  1) */		or	%g0,-1,%o0
  1.1828 +/* 0x0988	     ( 0  1) */		add	%g2,1023,%g2
  1.1829 +/* 0x098c	     ( 0  3) */		ld	[%fp+88],%o1
  1.1830 +/* 0x0990	     ( 1  2) */		srl	%o0,0,%g3
  1.1831 +/* 0x0994	     ( 1  2) */		and	%o5,%g2,%g2
  1.1832 +/* 0x0998	     ( 2  3) */		and	%o7,%g3,%g4
  1.1833 +/* 0x099c	 281 ( 2  3) */		or	%g0,-1,%o5
  1.1834 +/* 0x09a0	 275 ( 3  4) */		sllx	%g2,16,%g2
  1.1835 +/* 0x09a4	     ( 3  4) */		add	%o4,%g4,%g4
  1.1836 +/* 0x09a8	     ( 4  5) */		add	%g4,%g2,%g2
  1.1837 +/* 0x09ac	     ( 5  6) */		sll	%i0,2,%g4
  1.1838 +/* 0x09b0	     ( 5  6) */		and	%g2,%g3,%g2
  1.1839 +/* 0x09b4	     ( 6  7) */		st	%g2,[%o3+%g4]
  1.1840 +/* 0x09b8	 281 ( 6  7) */		sll	%g1,2,%g2
  1.1841 +/* 0x09bc	     ( 7 10) */		ld	[%o3+%g2],%g2
  1.1842 +/* 0x09c0	     ( 9 10) */		cmp	%g2,0
  1.1843 +/* 0x09c4	     ( 9 10) */		bleu,pn	%icc,.L77000241	! tprob=0.50
  1.1844 +/* 0x09c8	     ( 9 10) */		or	%g0,%o1,%o2
  1.1845 +/* 0x09cc	     (10 11) */		ba	.L900000744	! tprob=1.00
  1.1846 +/* 0x09d0	     (10 11) */		cmp	%o5,0
  1.1847 +                                   .L77000241:		/* frequency 0.8 confidence 0.0 */
  1.1848 +/* 0x09d4	     ( 0  1) */		subcc	%g1,1,%o5
  1.1849 +/* 0x09d8	     ( 0  1) */		bneg,pt	%icc,.L900000744	! tprob=0.60
  1.1850 +/* 0x09dc	     ( 1  2) */		cmp	%o5,0
  1.1851 +/* 0x09e0	     ( 1  2) */		sll	%o5,2,%g2
  1.1852 +/* 0x09e4	     ( 2  3) */		add	%o1,%g2,%o0
  1.1853 +/* 0x09e8	     ( 2  3) */		add	%o3,%g2,%o4
  1.1854 +/* 0x09ec	     ( 3  6) */		ld	[%o0],%g2
  1.1855 +                                   .L900000743:		/* frequency 5.3 confidence 0.0 */
  1.1856 +/* 0x09f0	     ( 0  3) */		ld	[%o4],%g3
  1.1857 +/* 0x09f4	     ( 0  1) */		add	%o0,4,%o0
  1.1858 +/* 0x09f8	     ( 0  1) */		add	%o4,4,%o4
  1.1859 +/* 0x09fc	     ( 2  3) */		cmp	%g3,%g2
  1.1860 +/* 0x0a00	     ( 2  3) */		bne,pn	%icc,.L77000244	! tprob=0.16
  1.1861 +/* 0x0a04	     ( 2  3) */		nop
  1.1862 +/* 0x0a08	     ( 3  4) */		addcc	%o5,1,%o5
  1.1863 +/* 0x0a0c	     ( 3  4) */		bpos,a,pt	%icc,.L900000743	! tprob=0.84
  1.1864 +/* 0x0a10	     ( 3  6) */		ld	[%o0],%g2
  1.1865 +                                   .L77000244:		/* frequency 1.0 confidence 0.0 */
  1.1866 +/* 0x0a14	     ( 0  1) */		cmp	%o5,0
  1.1867 +                                   .L900000744:		/* frequency 1.0 confidence 0.0 */
  1.1868 +/* 0x0a18	     ( 0  1) */		bl,pn	%icc,.L77000287	! tprob=0.50
  1.1869 +/* 0x0a1c	     ( 0  1) */		sll	%o5,2,%g2
  1.1870 +/* 0x0a20	     ( 1  4) */		ld	[%o2+%g2],%g3
  1.1871 +/* 0x0a24	     ( 2  5) */		ld	[%o3+%g2],%g2
  1.1872 +/* 0x0a28	     ( 4  5) */		cmp	%g2,%g3
  1.1873 +/* 0x0a2c	     ( 4  5) */		bleu,pt	%icc,.L77000224	! tprob=0.56
  1.1874 +/* 0x0a30	     ( 4  5) */		nop
  1.1875 +                                   .L77000287:		/* frequency 0.8 confidence 0.0 */
  1.1876 +/* 0x0a34	     ( 0  1) */		cmp	%g1,0
  1.1877 +/* 0x0a38	     ( 0  1) */		ble,pt	%icc,.L77000224	! tprob=0.60
  1.1878 +/* 0x0a3c	     ( 0  1) */		nop
  1.1879 +/* 0x0a40	 281 ( 1  2) */		sub	%g1,1,%o7
  1.1880 +/* 0x0a44	     ( 1  2) */		or	%g0,-1,%g2
  1.1881 +/* 0x0a48	     ( 2  3) */		srl	%g2,0,%o4
  1.1882 +/* 0x0a4c	     ( 2  3) */		add	%o7,1,%o0
  1.1883 +/* 0x0a50	 279 ( 3  4) */		or	%g0,0,%o5
  1.1884 +/* 0x0a54	     ( 3  4) */		or	%g0,0,%g1
  1.1885 +/* 0x0a58	     ( 4  5) */		cmp	%o0,3
  1.1886 +/* 0x0a5c	     ( 4  5) */		bl,pn	%icc,.L77000288	! tprob=0.40
  1.1887 +/* 0x0a60	     ( 4  5) */		add	%o3,8,%o1
  1.1888 +/* 0x0a64	     ( 5  6) */		add	%o2,4,%o0
  1.1889 +/* 0x0a68	     ( 5  8) */		ld	[%o1-8],%g2
  1.1890 +/* 0x0a6c	   0 ( 5  6) */		or	%g0,%o1,%o3
  1.1891 +/* 0x0a70	 279 ( 6  9) */		ld	[%o0-4],%g3
  1.1892 +/* 0x0a74	   0 ( 6  7) */		or	%g0,%o0,%o2
  1.1893 +/* 0x0a78	 279 ( 6  7) */		or	%g0,2,%g1
  1.1894 +/* 0x0a7c	     ( 7 10) */		ld	[%o3-4],%o0
  1.1895 +/* 0x0a80	     ( 8  9) */		sub	%g2,%g3,%g2
  1.1896 +/* 0x0a84	     ( 9 10) */		or	%g0,%g2,%o5
  1.1897 +/* 0x0a88	     ( 9 10) */		and	%g2,%o4,%g2
  1.1898 +/* 0x0a8c	     ( 9 10) */		st	%g2,[%o3-8]
  1.1899 +/* 0x0a90	     (10 11) */		srax	%o5,32,%o5
  1.1900 +                                   .L900000734:		/* frequency 64.0 confidence 0.0 */
  1.1901 +/* 0x0a94	     (12 20) */		ld	[%o2],%g2
  1.1902 +/* 0x0a98	     (12 13) */		add	%g1,1,%g1
  1.1903 +/* 0x0a9c	     (12 13) */		add	%o2,4,%o2
  1.1904 +/* 0x0aa0	     (13 13) */		cmp	%g1,%o7
  1.1905 +/* 0x0aa4	     (13 14) */		add	%o3,4,%o3
  1.1906 +/* 0x0aa8	     (14 14) */		sub	%o0,%g2,%o0
  1.1907 +/* 0x0aac	     (15 15) */		add	%o0,%o5,%o5
  1.1908 +/* 0x0ab0	     (16 17) */		and	%o5,%o4,%g2
  1.1909 +/* 0x0ab4	     (16 24) */		ld	[%o3-4],%o0
  1.1910 +/* 0x0ab8	     (17 18) */		st	%g2,[%o3-8]
  1.1911 +/* 0x0abc	     (17 18) */		ble,pt	%icc,.L900000734	! tprob=0.50
  1.1912 +/* 0x0ac0	     (17 18) */		srax	%o5,32,%o5
  1.1913 +                                   .L900000737:		/* frequency 8.0 confidence 0.0 */
  1.1914 +/* 0x0ac4	     ( 0  3) */		ld	[%o2],%o1
  1.1915 +/* 0x0ac8	     ( 2  3) */		sub	%o0,%o1,%o0
  1.1916 +/* 0x0acc	     ( 3  4) */		add	%o0,%o5,%o0
  1.1917 +/* 0x0ad0	     ( 4  5) */		and	%o0,%o4,%o1
  1.1918 +/* 0x0ad4	     ( 4  5) */		st	%o1,[%o3-4]
  1.1919 +/* 0x0ad8	     ( 5  7) */		ret	! Result = 
  1.1920 +/* 0x0adc	     ( 7  8) */		restore	%g0,%g0,%g0
  1.1921 +                                   .L77000288:		/* frequency 0.6 confidence 0.0 */
  1.1922 +/* 0x0ae0	     ( 0  3) */		ld	[%o3],%o0
  1.1923 +                                   .L900000742:		/* frequency 5.3 confidence 0.0 */
  1.1924 +/* 0x0ae4	     ( 0  3) */		ld	[%o2],%o1
  1.1925 +/* 0x0ae8	     ( 0  1) */		add	%o5,%o0,%o0
  1.1926 +/* 0x0aec	     ( 0  1) */		add	%g1,1,%g1
  1.1927 +/* 0x0af0	     ( 1  2) */		add	%o2,4,%o2
  1.1928 +/* 0x0af4	     ( 1  2) */		cmp	%g1,%o7
  1.1929 +/* 0x0af8	     ( 2  3) */		sub	%o0,%o1,%o0
  1.1930 +/* 0x0afc	     ( 3  4) */		and	%o0,%o4,%o1
  1.1931 +/* 0x0b00	     ( 3  4) */		st	%o1,[%o3]
  1.1932 +/* 0x0b04	     ( 3  4) */		add	%o3,4,%o3
  1.1933 +/* 0x0b08	     ( 4  5) */		srax	%o0,32,%o5
  1.1934 +/* 0x0b0c	     ( 4  5) */		ble,a,pt	%icc,.L900000742	! tprob=0.84
  1.1935 +/* 0x0b10	     ( 4  7) */		ld	[%o3],%o0
  1.1936 +                                   .L77000224:		/* frequency 1.0 confidence 0.0 */
  1.1937 +/* 0x0b14	     ( 0  2) */		ret	! Result = 
  1.1938 +/* 0x0b18	     ( 2  3) */		restore	%g0,%g0,%g0
  1.1939 +/* 0x0b1c	   0 ( 0  0) */		.type	mont_mulf_noconv,2
  1.1940 +/* 0x0b1c	     ( 0  0) */		.size	mont_mulf_noconv,(.-mont_mulf_noconv)
  1.1941 +

mercurial