diff options
Diffstat (limited to 'gnuradio-core')
22 files changed, 56 insertions, 56 deletions
diff --git a/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S b/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S index 11fc88e3e..b5f435b60 100644 --- a/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S +++ b/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S @@ -72,14 +72,14 @@ sse_float_dotprod: shll $1, %ecx # count * 2 .p2align 4 -.loop1: +.3dnow_float_dotprod_really_simple_loop1: movq (%eax), %mm0 pfmul (%edx), %mm0 pfadd %mm0, %mm4 addl $8, %edx addl $8, %eax decl %ecx - jne .loop1 + jne .3dnow_float_dotprod_really_simple_loop1 # at this point mm4 contains partial sums diff --git a/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S b/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S index 505071bbb..91370bb13 100644 --- a/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S +++ b/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S @@ -72,7 +72,7 @@ sse_float_dotprod: pxor %mm5, %mm5 # mm5 = 0 0 .p2align 4 -.loop1: +.3dnow_float_dotprod_simple_loop1: movq 0(%eax), %mm0 movq 8(%eax), %mm1 @@ -85,7 +85,7 @@ sse_float_dotprod: addl $16, %edx addl $16, %eax decl %ecx - jne .loop1 + jne .3dnow_float_dotprod_simple_loop1 # at this point mm4 and mm5 contain partial sums diff --git a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S index 9c6903cdf..51a09badb 100644 --- a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S +++ b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S @@ -91,7 +91,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnow): # .p2align 4 -.loop1: +.ccomplex_dotprod_3dnow_loop1: # complex prod: C += A * B, w/ temp Z, mmPN=$80000000 # @@ -165,7 +165,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnow): .L1_test: decl %ecx - jge .loop1 + jge .ccomplex_dotprod_3dnow_loop1 # We've handled the bulk of multiplies up to here. # Let's see if original n_2_ccomplex_blocks was odd. diff --git a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S index c18fe2355..bc9859b2c 100644 --- a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S +++ b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S @@ -91,7 +91,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnow): # .p2align 4 -.loop1: +.ccomplex_dotprod_3dnow64_loop1: # complex prod: C += A * B, w/ temp Z, mmPN=$80000000 # @@ -165,7 +165,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnow): .L1_test: dec %rax - jge .loop1 + jge .ccomplex_dotprod_3dnow64_loop1 # We've handled the bulk of multiplies up to here. # Let's see if original n_2_ccomplex_blocks was odd. diff --git a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S index 8a441b7a6..ffe4d597c 100644 --- a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S +++ b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S @@ -89,7 +89,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnowext): # .p2align 4 -.loop1: +.ccomplex_dotprod_3dnowext_loop1: # complex prod: C += A * B, w/ temp Z # @@ -144,7 +144,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnowext): .L1_test: decl %ecx - jge .loop1 + jge .ccomplex_dotprod_3dnowext_loop1 # We've handled the bulk of multiplies up to here. # Let's see if original n_2_ccomplex_blocks was odd. diff --git a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S index 943223725..7fb4c3065 100644 --- a/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S +++ b/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S @@ -89,7 +89,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnowext): # .p2align 4 -.loop1: +.ccomplex_dotprod_3dnowext64_loop1: # complex prod: C += A * B, w/ temp Z # @@ -144,7 +144,7 @@ GLOB_SYMB(ccomplex_dotprod_3dnowext): .L1_test: dec %rax - jge .loop1 + jge .ccomplex_dotprod_3dnowext64_loop1 # We've handled the bulk of multiplies up to here. # Let's see if original n_2_ccomplex_blocks was odd. diff --git a/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S b/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S index 1989a6ac0..5107faecd 100644 --- a/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S +++ b/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S @@ -85,7 +85,7 @@ GLOB_SYMB(ccomplex_dotprod_sse): # .p2align 4 -.loop1: +.ccomplex_dotprod_sse_loop1: # complex prod: C += A * B, w/ temp Z & Y (or B), xmmPN=$0x8000000080000000 # @@ -141,7 +141,7 @@ GLOB_SYMB(ccomplex_dotprod_sse): .L1_test: decl %ecx - jge .loop1 + jge .ccomplex_dotprod_sse_loop1 # We've handled the bulk of multiplies up to here. # Let's sse if original n_2_ccomplex_blocks was odd. diff --git a/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S b/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S index b674e6ff2..b9c3bad09 100644 --- a/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S +++ b/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S @@ -85,7 +85,7 @@ GLOB_SYMB(ccomplex_dotprod_sse): # .p2align 4 -.loop1: +.ccomplex_dotprod_sse64_loop1: # complex prod: C += A * B, w/ temp Z & Y (or B), xmmPN=$0x8000000080000000 # @@ -141,7 +141,7 @@ GLOB_SYMB(ccomplex_dotprod_sse): .L1_test: dec %rax - jge .loop1 + jge .ccomplex_dotprod_sse64_loop1 # We've handled the bulk of multiplies up to here. # Let's sse if original n_2_ccomplex_blocks was odd. diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S b/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S index 55bf5b6c3..a2222f267 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S @@ -100,7 +100,7 @@ GLOB_SYMB(complex_dotprod_3dnow): # .p2align 4 -.loop1: +.complex_dotprod_3dnow_loop1: pfmul 0(%edx), %mm0 pfadd %mm2, %mm6 @@ -145,7 +145,7 @@ GLOB_SYMB(complex_dotprod_3dnow): .L1_test: decl %ecx - jge .loop1 + jge .complex_dotprod_3dnow_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S b/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S index a4b492c76..d67448d86 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S @@ -100,7 +100,7 @@ GLOB_SYMB(complex_dotprod_3dnow): # .p2align 4 -.loop1: +.complex_dotprod_3dnow64_loop1: pfmul 0(%rsi), %mm0 pfadd %mm2, %mm6 @@ -145,7 +145,7 @@ GLOB_SYMB(complex_dotprod_3dnow): .L1_test: dec %rax - jge .loop1 + jge .complex_dotprod_3dnow64_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S b/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S index 30b9a417e..03c931705 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S @@ -93,7 +93,7 @@ GLOB_SYMB(complex_dotprod_3dnowext): # .p2align 4 -.loop1: +.complex_dotprod_3dnowext_loop1: pfmul 0(%edx), %mm0 pfadd %mm2, %mm6 @@ -125,7 +125,7 @@ GLOB_SYMB(complex_dotprod_3dnowext): .L1_test: decl %ecx - jge .loop1 + jge .complex_dotprod_3dnowext_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S b/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S index 162e830ae..1f4da3c59 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S @@ -93,7 +93,7 @@ GLOB_SYMB(complex_dotprod_3dnowext): # .p2align 4 -.loop1: +.complex_dotprod_3dnowext64_loop1: pfmul 0(%rsi), %mm0 pfadd %mm2, %mm6 @@ -125,7 +125,7 @@ GLOB_SYMB(complex_dotprod_3dnowext): .L1_test: dec %rax - jge .loop1 + jge .complex_dotprod_3dnowext64_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_sse.S b/gnuradio-core/src/lib/filter/complex_dotprod_sse.S index 6ac805bce..0e1cd337d 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_sse.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_sse.S @@ -81,7 +81,7 @@ GLOB_SYMB(complex_dotprod_sse): jmp .L1_test .p2align 4 -.loop1: +.complex_dotprod_sse_loop1: pxor %mm0, %mm0 punpcklwd 0(%eax), %mm0 @@ -95,7 +95,7 @@ GLOB_SYMB(complex_dotprod_sse): addps %xmm0, %xmm4 .L1_test: decl %ecx - jge .loop1 + jge .complex_dotprod_sse_loop1 # set up for primary loop which is unrolled 4 times @@ -129,7 +129,7 @@ GLOB_SYMB(complex_dotprod_sse): # hence enter loop at top .p2align 4 -.loop2: +.complex_dotprod_sse_loop2: mulps (%edx), %xmm0 addps %xmm2, %xmm6 @@ -169,7 +169,7 @@ GLOB_SYMB(complex_dotprod_sse): addl $0x40, %edx addl $0x10, %eax decl %ecx - jne .loop2 + jne .complex_dotprod_sse_loop2 # OK, now we've done with all the multiplies, but # we still need to handle the unaccumulated diff --git a/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S b/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S index 4ce2bc4fe..de258bc7a 100644 --- a/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S +++ b/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S @@ -80,7 +80,7 @@ GLOB_SYMB(complex_dotprod_sse): jmp .L1_test .p2align 4 -.loop1: +.complex_dotprod_sse64_loop1: pxor %mm0, %mm0 punpcklwd 0(%rdi), %mm0 @@ -94,7 +94,7 @@ GLOB_SYMB(complex_dotprod_sse): addps %xmm0, %xmm4 .L1_test: dec %rax - jge .loop1 + jge .complex_dotprod_sse64_loop1 # set up for primary loop which is unrolled 4 times @@ -127,7 +127,7 @@ GLOB_SYMB(complex_dotprod_sse): # hence enter loop at top .p2align 4 -.loop2: +.complex_dotprod_sse64_loop2: mulps (%rsi), %xmm0 addps %xmm2, %xmm6 @@ -167,7 +167,7 @@ GLOB_SYMB(complex_dotprod_sse): add $0x40, %rsi add $0x10, %rdi dec %rdx - jne .loop2 + jne .complex_dotprod_sse64_loop2 # OK, now we've done with all the multiplies, but # we still need to handle the unaccumulated diff --git a/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S b/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S index 9acd95a1d..7aa11fe56 100644 --- a/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S +++ b/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S @@ -92,7 +92,7 @@ GLOB_SYMB(fcomplex_dotprod_3dnow): # .p2align 4 -.loop1: +.fcomplex_dotprod_3dnow_loop1: pfmul 0(%edx), %mm0 pfadd %mm2, %mm6 @@ -129,7 +129,7 @@ GLOB_SYMB(fcomplex_dotprod_3dnow): .L1_test: decl %ecx - jge .loop1 + jge .fcomplex_dotprod_3dnow_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S b/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S index 453dc9319..c4566153b 100644 --- a/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S +++ b/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S @@ -91,7 +91,7 @@ GLOB_SYMB(fcomplex_dotprod_3dnow): # .p2align 4 -.loop1: +.fcomplex_dotprod_3dnow64_loop1: pfmul 0(%rsi), %mm0 pfadd %mm2, %mm6 @@ -128,7 +128,7 @@ GLOB_SYMB(fcomplex_dotprod_3dnow): .L1_test: dec %rax - jge .loop1 + jge .fcomplex_dotprod_3dnow64_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S index d67b047b8..54b815abd 100644 --- a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S +++ b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S @@ -81,7 +81,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): jmp .L1_test .p2align 4 -.loop1: +.fcomplex_dotprod_sse_loop1: movlps 0(%eax), %xmm0 shufps $0x50, %xmm0, %xmm0 # b01010000 @@ -92,7 +92,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): addps %xmm0, %xmm4 .L1_test: decl %ecx - jge .loop1 + jge .fcomplex_dotprod_sse_loop1 # set up for primary loop which is unrolled 4 times @@ -120,7 +120,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): # hence enter loop at top .p2align 4 -.loop2: +.fcomplex_dotprod_sse_loop2: addps %xmm2, %xmm6 movlps 0x10(%eax), %xmm2 @@ -152,7 +152,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): addl $0x40, %edx addl $0x20, %eax decl %ecx - jne .loop2 + jne .fcomplex_dotprod_sse_loop2 # OK, now we've done with all the multiplies, but # we still need to handle the unaccumulated diff --git a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S index 10e7372e6..31027c6e2 100644 --- a/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S +++ b/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S @@ -79,7 +79,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): jmp .L1_test .p2align 4 -.loop1: +.fcomplex_dotprod_sse64_loop1: movlps 0(%rdi), %xmm0 shufps $0x50, %xmm0, %xmm0 # b01010000 @@ -90,7 +90,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): addps %xmm0, %xmm4 .L1_test: dec %rax - jge .loop1 + jge .fcomplex_dotprod_sse64_loop1 # set up for primary loop which is unrolled 4 times @@ -117,7 +117,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): # hence enter loop at top .p2align 4 -.loop2: +.fcomplex_dotprod_sse64_loop2: addps %xmm2, %xmm6 movlps 0x10(%rdi), %xmm2 @@ -149,7 +149,7 @@ GLOB_SYMB(fcomplex_dotprod_sse): add $0x40, %rsi add $0x20, %rdi dec %rdx - jne .loop2 + jne .fcomplex_dotprod_sse64_loop2 # OK, now we've done with all the multiplies, but # we still need to handle the unaccumulated diff --git a/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S b/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S index ed625bd6b..a5da9a852 100644 --- a/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S +++ b/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S @@ -86,7 +86,7 @@ GLOB_SYMB(float_dotprod_3dnow): # .p2align 4 -.loop1: +.float_dotprod_3dnow_loop1: pfmul 0(%edx), %mm0 pfadd %mm2, %mm6 movq 16(%eax), %mm2 @@ -107,7 +107,7 @@ GLOB_SYMB(float_dotprod_3dnow): addl $32, %eax .L1_test: decl %ecx - jge .loop1 + jge .float_dotprod_3dnow_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S b/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S index 17ecd9059..a19e007cc 100644 --- a/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S +++ b/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S @@ -85,7 +85,7 @@ GLOB_SYMB(float_dotprod_3dnow): # .p2align 4 -.loop1: +.float_dotprod_3dnow64_loop1: pfmul 0(%rdi), %mm0 pfadd %mm2, %mm6 movq 16(%rsi), %mm2 @@ -106,7 +106,7 @@ GLOB_SYMB(float_dotprod_3dnow): add $32, %rsi .L1_test: dec %rax - jge .loop1 + jge .float_dotprod_3dnow64_loop1 # We've handled the bulk of multiplies up to here. # Now accumulate the final two additions and see if original diff --git a/gnuradio-core/src/lib/filter/float_dotprod_sse.S b/gnuradio-core/src/lib/filter/float_dotprod_sse.S index 9444dd6dd..5d5359fe7 100644 --- a/gnuradio-core/src/lib/filter/float_dotprod_sse.S +++ b/gnuradio-core/src/lib/filter/float_dotprod_sse.S @@ -79,7 +79,7 @@ GLOB_SYMB(float_dotprod_sse): jmp .L1_test .p2align 4 -.loop1: +.float_dotprod_sse_loop1: movaps (%eax), %xmm0 mulps (%edx), %xmm0 addl $0x10, %edx @@ -87,7 +87,7 @@ GLOB_SYMB(float_dotprod_sse): addps %xmm0, %xmm4 .L1_test: decl %ecx - jge .loop1 + jge .float_dotprod_sse_loop1 # set up for primary loop which is unrolled 4 times @@ -110,7 +110,7 @@ GLOB_SYMB(float_dotprod_sse): # hence enter loop at top .p2align 4 -.loop2: +.float_dotprod_sse_loop2: mulps (%edx), %xmm0 addps %xmm2, %xmm6 movaps 0x20(%eax), %xmm2 @@ -130,7 +130,7 @@ GLOB_SYMB(float_dotprod_sse): addl $0x40, %edx addl $0x40, %eax decl %ecx - jne .loop2 + jne .float_dotprod_sse_loop2 # OK, now we've done with all the multiplies, but # we still need to handle the unaccumulated diff --git a/gnuradio-core/src/lib/filter/float_dotprod_sse64.S b/gnuradio-core/src/lib/filter/float_dotprod_sse64.S index 3ba20acab..c725b69fb 100644 --- a/gnuradio-core/src/lib/filter/float_dotprod_sse64.S +++ b/gnuradio-core/src/lib/filter/float_dotprod_sse64.S @@ -77,7 +77,7 @@ GLOB_SYMB(float_dotprod_sse): jmp .L1_test .p2align 4 -.loop1: +.float_dotprod_sse64_loop1: movaps (%rsi), %xmm0 mulps (%rdi), %xmm0 add $0x10, %rdi @@ -85,7 +85,7 @@ GLOB_SYMB(float_dotprod_sse): addps %xmm0, %xmm4 .L1_test: dec %rax - jge .loop1 + jge .float_dotprod_sse64_loop1 # set up for primary loop which is unrolled 4 times @@ -107,7 +107,7 @@ GLOB_SYMB(float_dotprod_sse): # hence enter loop at top .p2align 4 -.loop2: +.float_dotprod_sse64_loop2: mulps (%rdi), %xmm0 addps %xmm2, %xmm6 movaps 0x20(%rsi), %xmm2 @@ -127,7 +127,7 @@ GLOB_SYMB(float_dotprod_sse): add $0x40, %rdi add $0x40, %rsi dec %rdx - jne .loop2 + jne .float_dotprod_sse64_loop2 # OK, now we've done with all the multiplies, but # we still need to handle the unaccumulated |