diff options
author | eb | 2008-06-23 22:49:20 +0000 |
---|---|---|
committer | eb | 2008-06-23 22:49:20 +0000 |
commit | aa4f0cf382ec49c6689896b8ba1d6afb2664f718 (patch) | |
tree | e704181ee8a3413ec857b8c30d0ee7aa2366d2cb /gnuradio-core/src | |
parent | fd2bf069496e39e6be2df18f37e4fec89e09a6a8 (diff) | |
download | gnuradio-aa4f0cf382ec49c6689896b8ba1d6afb2664f718.tar.gz gnuradio-aa4f0cf382ec49c6689896b8ba1d6afb2664f718.tar.bz2 gnuradio-aa4f0cf382ec49c6689896b8ba1d6afb2664f718.zip |
in SIMD assembler, changed .cleanup to a local symbol
git-svn-id: http://gnuradio.org/svn/gnuradio/trunk@8684 221aa14e-8319-0410-a670-987f0aec2ac5
Diffstat (limited to 'gnuradio-core/src')
6 files changed, 12 insertions, 12 deletions
diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_sse.S b/gnuradio-core/src/lib/filter/complex_dotprod_sse.S index 0e1cd337d..f74484864 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_sse.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_sse.S @@ -105,7 +105,7 @@ GLOB_SYMB(complex_dotprod_sse): movaps %xmm5, %xmm7 shrl $2, %ecx # n_2_complex_blocks / 4 - je .cleanup # if zero, take short path + je .Lcleanup # if zero, take short path # finish setup and loop priming @@ -188,7 +188,7 @@ GLOB_SYMB(complex_dotprod_sse): # At this point, xmm4 contains 2x2 partial sums. We need # to compute a "horizontal complex add" across xmm4. -.cleanup: # xmm4 = r1 i2 r3 i4 +.Lcleanup: # xmm4 = r1 i2 r3 i4 movl 20(%ebp), %eax # @result movhlps %xmm4, %xmm0 # xmm0 = ?? ?? r1 r2 addps %xmm4, %xmm0 # xmm0 = ?? ?? r1+r3 i2+i4 diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S b/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S index de258bc7a..3096da20b 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S @@ -103,7 +103,7 @@ GLOB_SYMB(complex_dotprod_sse): shr $2, %rdx # n_2_complex_blocks / 4 movaps %xmm5, %xmm7 - je .cleanup # if zero, take short path + je .Lcleanup # if zero, take short path # finish setup and loop priming @@ -186,7 +186,7 @@ GLOB_SYMB(complex_dotprod_sse): # At this point, xmm4 contains 2x2 partial sums. We need # to compute a "horizontal complex add" across xmm4. -.cleanup: # xmm4 = r1 i2 r3 i4 +.Lcleanup: # xmm4 = r1 i2 r3 i4 movhlps %xmm4, %xmm0 # xmm0 = ?? ?? r1 r2 addps %xmm4, %xmm0 # xmm0 = ?? ?? 
r1+r3 i2+i4 movlps %xmm0, (%rcx) # store low 2x32 bits (complex) to memory diff --git a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S index 54b815abd..98563f905 100644 --- a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S +++ b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S @@ -102,7 +102,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): movaps %xmm5, %xmm7 shrl $2, %ecx # n_2_complex_blocks / 4 - je .cleanup # if zero, take short path + je .Lcleanup # if zero, take short path # finish setup and loop priming @@ -171,7 +171,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): # At this point, xmm4 contains 2x2 partial sums. We need # to compute a "horizontal complex add" across xmm4. -.cleanup: # xmm4 = r1 i2 r3 i4 +.Lcleanup: # xmm4 = r1 i2 r3 i4 movl 20(%ebp), %eax # @result movhlps %xmm4, %xmm0 # xmm0 = ?? ?? r1 r2 addps %xmm4, %xmm0 # xmm0 = ?? ?? r1+r3 i2+i4 diff --git a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S index 31027c6e2..b260bffcd 100644 --- a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S +++ b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S @@ -99,7 +99,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): movaps %xmm5, %xmm7 shr $2, %rdx # n_2_complex_blocks / 4 - je .cleanup # if zero, take short path + je .Lcleanup # if zero, take short path # finish setup and loop priming @@ -168,7 +168,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): # At this point, xmm4 contains 2x2 partial sums. We need # to compute a "horizontal complex add" across xmm4. -.cleanup: # xmm4 = r1 i2 r3 i4 +.Lcleanup: # xmm4 = r1 i2 r3 i4 movhlps %xmm4, %xmm0 # xmm0 = ?? ?? r1 r2 addps %xmm4, %xmm0 # xmm0 = ?? ?? 
r1+r3 i2+i4 movlps %xmm0, (%rcx) # store low 2x32 bits (complex) to memory diff --git a/gnuradio-core/src/lib/filter/float_dotprod_sse.S b/gnuradio-core/src/lib/filter/float_dotprod_sse.S index 5d5359fe7..a8f03b83f 100644 --- a/gnuradio-core/src/lib/filter/float_dotprod_sse.S +++ b/gnuradio-core/src/lib/filter/float_dotprod_sse.S @@ -97,7 +97,7 @@ GLOB_SYMB(float_dotprod_sse): movaps %xmm5, %xmm7 shrl $2, %ecx # n_4_float_blocks / 4 - je .cleanup # if zero, take short path + je .Lcleanup # if zero, take short path # finish setup and loop priming @@ -150,7 +150,7 @@ GLOB_SYMB(float_dotprod_sse): # to compute a "horizontal add" across xmm4. # This is a fairly nasty operation... -.cleanup: # xmm4 = d1 d2 d3 d4 +.Lcleanup: # xmm4 = d1 d2 d3 d4 xorps %xmm0, %xmm0 # xmm0 = 0 0 0 0 (may be unnecessary) movhlps %xmm4, %xmm0 # xmm0 = 0 0 d1 d2 addps %xmm4, %xmm0 # xmm0 = d1 d2 d1+d3 d2+d4 diff --git a/gnuradio-core/src/lib/filter/float_dotprod_sse64.S b/gnuradio-core/src/lib/filter/float_dotprod_sse64.S index c725b69fb..696f2cc0d 100644 --- a/gnuradio-core/src/lib/filter/float_dotprod_sse64.S +++ b/gnuradio-core/src/lib/filter/float_dotprod_sse64.S @@ -94,7 +94,7 @@ GLOB_SYMB(float_dotprod_sse): movaps %xmm5, %xmm7 shr $2, %rdx # n_4_float_blocks / 4 - je .cleanup # if zero, take short path + je .Lcleanup # if zero, take short path # finish setup and loop priming @@ -147,7 +147,7 @@ GLOB_SYMB(float_dotprod_sse): # to compute a "horizontal add" across xmm4. # This is a fairly nasty operation... -.cleanup: # xmm4 = d1 d2 d3 d4 +.Lcleanup: # xmm4 = d1 d2 d3 d4 xorps %xmm0, %xmm0 # xmm0 = 0 0 0 0 (may be unnecessary) movhlps %xmm4, %xmm0 # xmm0 = 0 0 d1 d2 addps %xmm4, %xmm0 # xmm0 = d1 d2 d1+d3 d2+d4 |