Lines Matching refs:un

43 C  * Address relative slowness for un<=3 for Pentium M.  The old code is there
49 C un sp + 12
56 mov 12(%esp), %ecx C un
72 L(un2): movd (%eax), %mm0 C un=2 entry, squares limbs a at 0(%eax) and b at 4(%eax) into four words at 0..12(%edx). mm0 = a un=2
73 movd (%eax), %mm2 C mm2 = a again, second copy used for the cross product un=2
74 movd 4(%eax), %mm1 C mm1 = b un=2
75 pmuludq %mm0, %mm0 C mm0 = a*a, 64b weight 0 un=2
76 pmuludq %mm1, %mm2 C mm2 = a*b, 64b weight 32, must still be doubled un=2
77 pmuludq %mm1, %mm1 C mm1 = b*b, 64b weight 64 un=2
78 movd %mm0, (%edx) C store low 32 bits of a*a at 0(%edx) un=2
79 psrlq $32, %mm0 C mm0 = high half of a*a, 32b weight 32 un=2
80 pcmpeqd %mm7, %mm7 C mm7 = all ones un=2
81 psrlq $33, %mm7 C mm7 = 0x000000007FFFFFFF, mask for the low 31 bits un=2
82 pand %mm2, %mm7 C mm7 = low 31 bits of a*b, 31b weight 32 un=2
83 psrlq $31, %mm2 C mm2 = a*b >> 31, 33b weight 65. NOTE(review): this is added to the weight 64 sum in mm1 below, so weight 64 looks intended, confirm un=2
84 psllq $1, %mm7 C mm7 = doubled low part of a*b, 31b weight 33 un=2
85 paddq %mm7, %mm0 C mm0 = high half of a*a + doubled low part of a*b un=2
86 movd %mm0, 4(%edx) C store low 32 bits of that sum at 4(%edx) un=2
87 psrlq $32, %mm0 C mm0 = carry out of the word just stored un=2
88 paddq %mm2, %mm1 C mm1 = b*b + high part of the doubled a*b un=2
89 paddq %mm0, %mm1 C mm1 += carry from the word below un=2
90 movd %mm1, 8(%edx) C store low 32 bits at 8(%edx) un=2
91 psrlq $32, %mm1 C mm1 = remaining high 32 bits un=2
92 movd %mm1, 12(%edx) C store them at 12(%edx). Source lines 93-94 are not in this listing un=2
95 L(un3): movd (%eax), %mm7 C un=3 entry, multiplies limb a at 0(%eax) by limbs b and c and writes words at 4..12(%edx). mm7 = a un=3
96 movd 4(%eax), %mm6 C mm6 = b, limb at 4(%eax) un=3
97 pmuludq %mm7, %mm6 C mm6 = a*b, 64-bit product un=3
98 movd 8(%eax), %mm2 C mm2 = c, limb at 8(%eax) un=3
99 pmuludq %mm7, %mm2 C mm2 = a*c, 64-bit product un=3
100 movd %mm6, 4(%edx) C store low 32 bits of a*b at 4(%edx), 0(%edx) is not written in the lines shown un=3
101 psrlq $32, %mm6 C mm6 = high half of a*b un=3
102 paddq %mm2, %mm6 C mm6 = a*c + high half of a*b un=3
103 movd %mm6, 8(%edx) C store low 32 bits of the sum at 8(%edx) un=3
104 psrlq $32, %mm6 C mm6 = remaining high bits of the sum un=3
105 movd %mm6, 12(%edx) C store them at 12(%edx) un=3
106 lea 4(%edx), %edx C advance %edx by 4 bytes, lea does not change flags un=3
107 lea 4(%eax), %eax C advance %eax by 4 bytes. Source line 108 is not in this listing, so what follows is unknown here un=3
109 L(un4): movd (%eax), %mm7 C un=4 entry, multiplies limb a at 0(%eax) by the limbs at 4, 8, 12(%eax) and writes words at 4..16(%edx). mm7 = a un=4
110 movd 4(%eax), %mm6 C mm6 = b, limb at 4(%eax) un=4
111 pmuludq %mm7, %mm6 C mm6 = a*b, 64-bit product un=4
112 movd 8(%eax), %mm0 C mm0 = c, limb at 8(%eax) un=4
113 pmuludq %mm7, %mm0 C mm0 = a*c, 64-bit product un=4
114 movd 12(%eax), %mm1 C mm1 = d, limb at 12(%eax) un=4
115 pmuludq %mm7, %mm1 C mm1 = a*d, 64-bit product un=4
116 movd %mm6, 4(%edx) C store low 32 bits of a*b at 4(%edx), 0(%edx) is not written in the lines shown un=4
117 psrlq $32, %mm6 C mm6 = high half of a*b un=4
118 paddq %mm0, %mm6 C mm6 = a*c + high half of a*b un=4
119 movd %mm6, 8(%edx) C store low 32 bits of the sum at 8(%edx) un=4
120 psrlq $32, %mm6 C mm6 = carry part of that sum un=4
121 paddq %mm1, %mm6 C mm6 = a*d + carry part un=4
122 movd %mm6, 12(%edx) C store low 32 bits at 12(%edx) un=4
123 psrlq $32, %mm6 C mm6 = remaining high bits un=4
124 movd %mm6, 16(%edx) C store them at 16(%edx) un=4
125 lea 4(%edx), %edx C advance %edx by 4 bytes, lea does not change flags un=4
126 lea 4(%eax), %eax C advance %eax by 4 bytes. The listing jumps to source line 581 after this, the code in between is not shown un=4
581 L(am3): C up[un-1..un-3] x up[un-4]
607 L(am2): C up[un-1..un-2] x up[un-3]
626 L(am1): C up[un-1] x up[un-2]
641 mov 12(%esp), %ecx C un