[llvm-bugs] [Bug 32085] Extra broadcasts in doubly-unrolled avx2 memcpy loop

via llvm-bugs llvm-bugs at lists.llvm.org
Wed Apr 26 10:48:57 PDT 2017


http://bugs.llvm.org/show_bug.cgi?id=32085

Filipe Cabecinhas <filcab at gmail.com> changed:

           What    |Removed                     |Added
----------------------------------------------------------------------------
             Status|NEW                         |RESOLVED
         Resolution|---                         |FIXED

--- Comment #5 from Filipe Cabecinhas <filcab at gmail.com> ---
It's been fixed now (r301395). Current output for the test posted here:

        .section        __TEXT,__text,regular,pure_instructions
        .macosx_version_min 10, 12
        .intel_syntax noprefix
        .globl  __Z3go4i
        .p2align        4, 0x90
## ---------------------------------------------------------------------
## _Z3go4i demangles (Itanium C++ ABI) to go4(int).
## What the listing below does:
##   1. keeps the 32-bit argument (edi) in rbx across the call,
##   2. calls __Znam -- operator new[](unsigned long) -- with size 4096,
##   3. broadcasts the argument into every 32-bit lane of ymm0 once,
##   4. stores ymm0 to the returned buffer at 32-byte steps, offsets
##      0 through 4064 (the middle stores are elided as "..." below).
## rax is not written after the call, so the buffer pointer is still in
## rax at `ret`.
## NOTE(review): register roles assume the SysV AMD64 convention used on
## macOS; the C++ source is not part of this listing -- confirm there.
## ---------------------------------------------------------------------
__Z3go4i:                               ## @_Z3go4i
        .cfi_startproc
## BB#0:
        push    rbp                     ## frame-pointer prologue
Lcfi0:
        .cfi_def_cfa_offset 16
Lcfi1:
        .cfi_offset rbp, -16
        mov     rbp, rsp
Lcfi2:
        .cfi_def_cfa_register rbp
        push    rbx                     ## rbx is reused below, so save it
        push    rax                     ## value unused; 8-byte pad dropped by `add rsp, 8`
                                        ## (presumably keeps rsp 16-byte aligned at the call)
Lcfi3:
        .cfi_offset rbx, -24
        mov     ebx, edi                ## stash the argument; edi is overwritten next
        mov     edi, 4096               ## allocation size in bytes
        call    __Znam                  ## rax = operator new[](4096)
        vmovd   xmm0, ebx               ## low dword of xmm0 = saved argument
        vpbroadcastd    ymm0, xmm0      ## replicate it into all 8 dword lanes (single broadcast)
        ## Straight-line unaligned 32-byte stores of the same ymm0 value.
        vmovdqu ymmword ptr [rax], ymm0
        vmovdqu ymmword ptr [rax + 32], ymm0
        vmovdqu ymmword ptr [rax + 64], ymm0
...
        vmovdqu ymmword ptr [rax + 4032], ymm0
        vmovdqu ymmword ptr [rax + 4064], ymm0 ## last store ends at byte 4095 (4064 + 32 = 4096)
        add     rsp, 8                  ## discard the slot from `push rax`
        pop     rbx
        pop     rbp
        vzeroupper                      ## clear upper ymm halves before returning
        ret
        .cfi_endproc

-- 
You are receiving this mail because:
You are on the CC list for the bug.
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://lists.llvm.org/pipermail/llvm-bugs/attachments/20170426/d4586e11/attachment-0001.html>


More information about the llvm-bugs mailing list