commit-gnuradio
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

[Commit-gnuradio] r8669 - gnuradio/trunk/gnuradio-core/src/lib/filter


From: eb
Subject: [Commit-gnuradio] r8669 - gnuradio/trunk/gnuradio-core/src/lib/filter
Date: Mon, 23 Jun 2008 13:10:40 -0600 (MDT)

Author: eb
Date: 2008-06-23 13:10:40 -0600 (Mon, 23 Jun 2008)
New Revision: 8669

Modified:
   gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse.S
   gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse64.S
Log:
Renamed labels .loop1 and .loop2 to include name of file they're contained in.



Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S	2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_really_simple.S	2008-06-23 19:10:40 UTC (rev 8669)
@@ -72,14 +72,14 @@
        shll    $1, %ecx                # count * 2
 
        .p2align 4
-.loop1:
+.3dnow_float_dotprod_really_simple_loop1:
        movq    (%eax), %mm0
        pfmul   (%edx), %mm0
        pfadd   %mm0, %mm4
        addl    $8, %edx
        addl    $8, %eax
        decl    %ecx
-       jne     .loop1
+       jne     .3dnow_float_dotprod_really_simple_loop1
        
        # at this point mm4 contains partial sums
 

Modified: 
gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S    
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/3dnow_float_dotprod_simple.S    
2008-06-23 19:10:40 UTC (rev 8669)
@@ -72,7 +72,7 @@
        pxor    %mm5, %mm5              # mm5 = 0 0 
 
        .p2align 4
-.loop1:
+.3dnow_float_dotprod_simple_loop1:
        movq    0(%eax), %mm0
        movq    8(%eax), %mm1
        
@@ -85,7 +85,7 @@
        addl    $16, %edx
        addl    $16, %eax
        decl    %ecx
-       jne     .loop1
+       jne     .3dnow_float_dotprod_simple_loop1
        
        # at this point mm4 and mm5 contain partial sums
 

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S        
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow.S        
2008-06-23 19:10:40 UTC (rev 8669)
@@ -91,7 +91,7 @@
        #
        
        .p2align 4
-.loop1:        
+.ccomplex_dotprod_3dnow_loop1: 
 
 # complex prod: C += A * B,  w/ temp Z, mmPN=$80000000
 #
@@ -165,7 +165,7 @@
 
 .L1_test:
        decl    %ecx
-       jge     .loop1
+       jge     .ccomplex_dotprod_3dnow_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Let's see if original n_2_ccomplex_blocks was odd.

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S      
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnow64.S      
2008-06-23 19:10:40 UTC (rev 8669)
@@ -91,7 +91,7 @@
        #
        
        .p2align 4
-.loop1:        
+.ccomplex_dotprod_3dnow64_loop1:       
 
 # complex prod: C += A * B,  w/ temp Z, mmPN=$80000000
 #
@@ -165,7 +165,7 @@
 
 .L1_test:
        dec     %rax
-       jge     .loop1
+       jge     .ccomplex_dotprod_3dnow64_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Let's see if original n_2_ccomplex_blocks was odd.

Modified: 
gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S     
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext.S     
2008-06-23 19:10:40 UTC (rev 8669)
@@ -89,7 +89,7 @@
        #
        
        .p2align 4
-.loop1:        
+.ccomplex_dotprod_3dnowext_loop1:      
 
 # complex prod: C += A * B,  w/ temp Z
 #
@@ -144,7 +144,7 @@
 
 .L1_test:
        decl    %ecx
-       jge     .loop1
+       jge     .ccomplex_dotprod_3dnowext_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Let's see if original n_2_ccomplex_blocks was odd.

Modified: 
gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S   
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_3dnowext64.S   
2008-06-23 19:10:40 UTC (rev 8669)
@@ -89,7 +89,7 @@
        #
        
        .p2align 4
-.loop1:        
+.ccomplex_dotprod_3dnowext64_loop1:    
 
 # complex prod: C += A * B,  w/ temp Z
 #
@@ -144,7 +144,7 @@
 
 .L1_test:
        dec     %rax
-       jge     .loop1
+       jge     .ccomplex_dotprod_3dnowext64_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Let's see if original n_2_ccomplex_blocks was odd.

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S  
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse.S  
2008-06-23 19:10:40 UTC (rev 8669)
@@ -85,7 +85,7 @@
        #
        
        .p2align 4
-.loop1:        
+.ccomplex_dotprod_sse_loop1:   
 
 # complex prod: C += A * B,  w/ temp Z & Y (or B), xmmPN=$0x8000000080000000
 #
@@ -141,7 +141,7 @@
 
 .L1_test:
        decl    %ecx
-       jge     .loop1
+       jge     .ccomplex_dotprod_sse_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Let's sse if original n_2_ccomplex_blocks was odd.

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S        
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/ccomplex_dotprod_sse64.S        
2008-06-23 19:10:40 UTC (rev 8669)
@@ -85,7 +85,7 @@
        #
        
        .p2align 4
-.loop1:        
+.ccomplex_dotprod_sse64_loop1: 
 
 # complex prod: C += A * B,  w/ temp Z & Y (or B), xmmPN=$0x8000000080000000
 #
@@ -141,7 +141,7 @@
 
 .L1_test:
        dec     %rax
-       jge     .loop1
+       jge     .ccomplex_dotprod_sse64_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Let's sse if original n_2_ccomplex_blocks was odd.

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S 
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow.S 
2008-06-23 19:10:40 UTC (rev 8669)
@@ -100,7 +100,7 @@
        #
        
        .p2align 4
-.loop1:        
+.complex_dotprod_3dnow_loop1:  
        pfmul   0(%edx), %mm0
        pfadd   %mm2, %mm6
 
@@ -145,7 +145,7 @@
 
 .L1_test:
        decl    %ecx
-       jge     .loop1
+       jge     .complex_dotprod_3dnow_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S       
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnow64.S       
2008-06-23 19:10:40 UTC (rev 8669)
@@ -100,7 +100,7 @@
        #
        
        .p2align 4
-.loop1:        
+.complex_dotprod_3dnow64_loop1:        
        pfmul   0(%rsi), %mm0
        pfadd   %mm2, %mm6
 
@@ -145,7 +145,7 @@
 
 .L1_test:
        dec     %rax
-       jge     .loop1
+       jge     .complex_dotprod_3dnow64_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S      
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext.S      
2008-06-23 19:10:40 UTC (rev 8669)
@@ -93,7 +93,7 @@
        #
        
        .p2align 4
-.loop1:        
+.complex_dotprod_3dnowext_loop1:       
        pfmul   0(%edx), %mm0
        pfadd   %mm2, %mm6
 
@@ -125,7 +125,7 @@
 
 .L1_test:
        decl    %ecx
-       jge     .loop1
+       jge     .complex_dotprod_3dnowext_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: 
gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S    
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_3dnowext64.S    
2008-06-23 19:10:40 UTC (rev 8669)
@@ -93,7 +93,7 @@
        #
        
        .p2align 4
-.loop1:        
+.complex_dotprod_3dnowext64_loop1:     
        pfmul   0(%rsi), %mm0
        pfadd   %mm2, %mm6
 
@@ -125,7 +125,7 @@
 
 .L1_test:
        dec     %rax
-       jge     .loop1
+       jge     .complex_dotprod_3dnowext64_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse.S   
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse.S   
2008-06-23 19:10:40 UTC (rev 8669)
@@ -81,7 +81,7 @@
        jmp     .L1_test
 
        .p2align 4
-.loop1:        
+.complex_dotprod_sse_loop1:    
 
        pxor    %mm0, %mm0
        punpcklwd       0(%eax), %mm0
@@ -95,7 +95,7 @@
        addps   %xmm0, %xmm4
 .L1_test:      
        decl    %ecx
-       jge     .loop1
+       jge     .complex_dotprod_sse_loop1
 
        
        # set up for primary loop which is unrolled 4 times
@@ -129,7 +129,7 @@
        # hence enter loop at top
 
        .p2align 4
-.loop2:
+.complex_dotprod_sse_loop2:
        mulps   (%edx), %xmm0
        addps   %xmm2, %xmm6
 
@@ -169,7 +169,7 @@
        addl    $0x40, %edx
        addl    $0x10, %eax
        decl    %ecx
-       jne     .loop2
+       jne     .complex_dotprod_sse_loop2
 
        # OK, now we've done with all the multiplies, but
        # we still need to handle the unaccumulated

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S 
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/complex_dotprod_sse64.S 
2008-06-23 19:10:40 UTC (rev 8669)
@@ -80,7 +80,7 @@
        jmp     .L1_test
 
        .p2align 4
-.loop1:        
+.complex_dotprod_sse64_loop1:  
 
        pxor    %mm0, %mm0
        punpcklwd       0(%rdi), %mm0
@@ -94,7 +94,7 @@
        addps   %xmm0, %xmm4
 .L1_test:      
        dec     %rax
-       jge     .loop1
+       jge     .complex_dotprod_sse64_loop1
 
        
        # set up for primary loop which is unrolled 4 times
@@ -127,7 +127,7 @@
        # hence enter loop at top
 
        .p2align 4
-.loop2:
+.complex_dotprod_sse64_loop2:
        mulps   (%rsi), %xmm0
        addps   %xmm2, %xmm6
 
@@ -167,7 +167,7 @@
        add     $0x40, %rsi
        add     $0x10, %rdi
        dec     %rdx
-       jne     .loop2
+       jne     .complex_dotprod_sse64_loop2
 
        # OK, now we've done with all the multiplies, but
        # we still need to handle the unaccumulated

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S        
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow.S        
2008-06-23 19:10:40 UTC (rev 8669)
@@ -92,7 +92,7 @@
        #
        
        .p2align 4
-.loop1:        
+.fcomplex_dotprod_3dnow_loop1: 
        pfmul   0(%edx), %mm0
        pfadd   %mm2, %mm6
 
@@ -129,7 +129,7 @@
 
 .L1_test:
        decl    %ecx
-       jge     .loop1
+       jge     .fcomplex_dotprod_3dnow_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S      
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_3dnow64.S      
2008-06-23 19:10:40 UTC (rev 8669)
@@ -91,7 +91,7 @@
        #
        
        .p2align 4
-.loop1:        
+.fcomplex_dotprod_3dnow64_loop1:       
        pfmul   0(%rsi), %mm0
        pfadd   %mm2, %mm6
 
@@ -128,7 +128,7 @@
 
 .L1_test:
        dec     %rax
-       jge     .loop1
+       jge     .fcomplex_dotprod_3dnow64_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S  
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse.S  
2008-06-23 19:10:40 UTC (rev 8669)
@@ -81,7 +81,7 @@
        jmp     .L1_test
 
        .p2align 4
-.loop1:        
+.fcomplex_dotprod_sse_loop1:   
 
        movlps  0(%eax), %xmm0
        shufps  $0x50, %xmm0, %xmm0     # b01010000
@@ -92,7 +92,7 @@
        addps   %xmm0, %xmm4
 .L1_test:      
        decl    %ecx
-       jge     .loop1
+       jge     .fcomplex_dotprod_sse_loop1
 
        
        # set up for primary loop which is unrolled 4 times
@@ -120,7 +120,7 @@
        # hence enter loop at top
 
        .p2align 4
-.loop2:
+.fcomplex_dotprod_sse_loop2:
        addps   %xmm2, %xmm6
        movlps  0x10(%eax), %xmm2
 
@@ -152,7 +152,7 @@
        addl    $0x40, %edx
        addl    $0x20, %eax
        decl    %ecx
-       jne     .loop2
+       jne     .fcomplex_dotprod_sse_loop2
 
        # OK, now we've done with all the multiplies, but
        # we still need to handle the unaccumulated

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S        
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/fcomplex_dotprod_sse64.S        
2008-06-23 19:10:40 UTC (rev 8669)
@@ -79,7 +79,7 @@
        jmp     .L1_test
 
        .p2align 4
-.loop1:        
+.fcomplex_dotprod_sse64_loop1: 
 
        movlps  0(%rdi), %xmm0
        shufps  $0x50, %xmm0, %xmm0     # b01010000
@@ -90,7 +90,7 @@
        addps   %xmm0, %xmm4
 .L1_test:      
        dec     %rax
-       jge     .loop1
+       jge     .fcomplex_dotprod_sse64_loop1
 
        
        # set up for primary loop which is unrolled 4 times
@@ -117,7 +117,7 @@
        # hence enter loop at top
 
        .p2align 4
-.loop2:
+.fcomplex_dotprod_sse64_loop2:
        addps   %xmm2, %xmm6
        movlps  0x10(%rdi), %xmm2
 
@@ -149,7 +149,7 @@
        add     $0x40, %rsi
        add     $0x20, %rdi
        dec     %rdx
-       jne     .loop2
+       jne     .fcomplex_dotprod_sse64_loop2
 
        # OK, now we've done with all the multiplies, but
        # we still need to handle the unaccumulated

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S   
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow.S   
2008-06-23 19:10:40 UTC (rev 8669)
@@ -86,7 +86,7 @@
        #
        
        .p2align 4
-.loop1:        
+.float_dotprod_3dnow_loop1:    
        pfmul   0(%edx), %mm0
        pfadd   %mm2, %mm6
        movq    16(%eax), %mm2
@@ -107,7 +107,7 @@
        addl    $32, %eax
 .L1_test:
        decl    %ecx
-       jge     .loop1
+       jge     .float_dotprod_3dnow_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S 
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_3dnow64.S 
2008-06-23 19:10:40 UTC (rev 8669)
@@ -85,7 +85,7 @@
        #
        
        .p2align 4
-.loop1:        
+.float_dotprod_3dnow64_loop1:  
        pfmul   0(%rdi), %mm0
        pfadd   %mm2, %mm6
        movq    16(%rsi), %mm2
@@ -106,7 +106,7 @@
        add     $32, %rsi
 .L1_test:
        dec     %rax
-       jge     .loop1
+       jge     .float_dotprod_3dnow64_loop1
 
        # We've handled the bulk of multiplies up to here.
        # Now accumulate the final two additions and see if original

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse.S     
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse.S     
2008-06-23 19:10:40 UTC (rev 8669)
@@ -79,7 +79,7 @@
        jmp     .L1_test
 
        .p2align 4
-.loop1:        
+.float_dotprod_sse_loop1:      
        movaps  (%eax), %xmm0
        mulps   (%edx), %xmm0
        addl    $0x10, %edx
@@ -87,7 +87,7 @@
        addps   %xmm0, %xmm4
 .L1_test:      
        decl    %ecx
-       jge     .loop1
+       jge     .float_dotprod_sse_loop1
 
        
        # set up for primary loop which is unrolled 4 times
@@ -110,7 +110,7 @@
        # hence enter loop at top
 
        .p2align 4
-.loop2:
+.float_dotprod_sse_loop2:
        mulps   (%edx), %xmm0
        addps   %xmm2, %xmm6
        movaps  0x20(%eax), %xmm2
@@ -130,7 +130,7 @@
        addl    $0x40, %edx
        addl    $0x40, %eax
        decl    %ecx
-       jne     .loop2
+       jne     .float_dotprod_sse_loop2
 
        # OK, now we've done with all the multiplies, but
        # we still need to handle the unaccumulated

Modified: gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse64.S
===================================================================
--- gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse64.S   
2008-06-23 19:06:16 UTC (rev 8668)
+++ gnuradio/trunk/gnuradio-core/src/lib/filter/float_dotprod_sse64.S   
2008-06-23 19:10:40 UTC (rev 8669)
@@ -77,7 +77,7 @@
        jmp     .L1_test
 
        .p2align 4
-.loop1:        
+.float_dotprod_sse64_loop1:    
        movaps  (%rsi), %xmm0
        mulps   (%rdi), %xmm0
        add     $0x10, %rdi
@@ -85,7 +85,7 @@
        addps   %xmm0, %xmm4
 .L1_test:      
        dec     %rax
-       jge     .loop1
+       jge     .float_dotprod_sse64_loop1
 
        
        # set up for primary loop which is unrolled 4 times
@@ -107,7 +107,7 @@
        # hence enter loop at top
 
        .p2align 4
-.loop2:
+.float_dotprod_sse64_loop2:
        mulps   (%rdi), %xmm0
        addps   %xmm2, %xmm6
        movaps  0x20(%rsi), %xmm2
@@ -127,7 +127,7 @@
        add     $0x40, %rdi
        add     $0x40, %rsi
        dec     %rdx
-       jne     .loop2
+       jne     .float_dotprod_sse64_loop2
 
        # OK, now we've done with all the multiplies, but
        # we still need to handle the unaccumulated





reply via email to

[Prev in Thread] Current Thread [Next in Thread]