| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc -mtriple=i686-linux-gnu -mattr=-ermsb < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=NOFAST32 |
| ; RUN: llc -mtriple=i686-linux-gnu -mattr=+ermsb < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=FAST32 |
| ; RUN: llc -mtriple=x86_64-linux-gnu -mattr=-ermsb < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=NOFAST |
| ; RUN: llc -mtriple=x86_64-linux-gnu -mattr=+ermsb < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=FAST |
| ; RUN: llc -mtriple=x86_64-linux-gnu -mcpu=generic < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=NOFAST |
| ; RUN: llc -mtriple=x86_64-linux-gnu -mcpu=haswell < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=FAST |
| ; RUN: llc -mtriple=x86_64-linux-gnu -mcpu=skylake < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=FAST |
| ; FIXME: The documentation states that ivybridge has ermsb, but this is not |
| ; enabled right now since I could not confirm by testing. |
| ; RUN: llc -mtriple=x86_64-linux-gnu -mcpu=ivybridge < %s -o - | FileCheck %s --check-prefix=ALL --check-prefix=NOFAST |
| |
| %struct.large = type { [4096 x i8] } |
| |
| declare void @foo(%struct.large* align 8 byval) nounwind |
| |
| define void @test1(%struct.large* nocapture %x) nounwind { |
| ; NOFAST32-LABEL: test1: |
| ; NOFAST32: # %bb.0: |
| ; NOFAST32-NEXT: pushl %edi |
| ; NOFAST32-NEXT: pushl %esi |
| ; NOFAST32-NEXT: subl $4100, %esp # imm = 0x1004 |
| ; NOFAST32-NEXT: movl {{[0-9]+}}(%esp), %esi |
| ; NOFAST32-NEXT: movl $1024, %ecx # imm = 0x400 |
| ; NOFAST32-NEXT: movl %esp, %edi |
| ; NOFAST32-NEXT: rep;movsl (%esi), %es:(%edi) |
| ; NOFAST32-NEXT: calll foo |
| ; NOFAST32-NEXT: addl $4100, %esp # imm = 0x1004 |
| ; NOFAST32-NEXT: popl %esi |
| ; NOFAST32-NEXT: popl %edi |
| ; NOFAST32-NEXT: retl |
| ; |
| ; FAST32-LABEL: test1: |
| ; FAST32: # %bb.0: |
| ; FAST32-NEXT: pushl %edi |
| ; FAST32-NEXT: pushl %esi |
| ; FAST32-NEXT: subl $4100, %esp # imm = 0x1004 |
| ; FAST32-NEXT: movl {{[0-9]+}}(%esp), %esi |
| ; FAST32-NEXT: movl $4096, %ecx # imm = 0x1000 |
| ; FAST32-NEXT: movl %esp, %edi |
| ; FAST32-NEXT: rep;movsb (%esi), %es:(%edi) |
| ; FAST32-NEXT: calll foo |
| ; FAST32-NEXT: addl $4100, %esp # imm = 0x1004 |
| ; FAST32-NEXT: popl %esi |
| ; FAST32-NEXT: popl %edi |
| ; FAST32-NEXT: retl |
| ; |
| ; NOFAST-LABEL: test1: |
| ; NOFAST: # %bb.0: |
| ; NOFAST-NEXT: subq $4104, %rsp # imm = 0x1008 |
| ; NOFAST-NEXT: movq %rdi, %rsi |
| ; NOFAST-NEXT: movl $512, %ecx # imm = 0x200 |
| ; NOFAST-NEXT: movq %rsp, %rdi |
| ; NOFAST-NEXT: rep;movsq (%rsi), %es:(%rdi) |
| ; NOFAST-NEXT: callq foo |
| ; NOFAST-NEXT: addq $4104, %rsp # imm = 0x1008 |
| ; NOFAST-NEXT: retq |
| ; |
| ; FAST-LABEL: test1: |
| ; FAST: # %bb.0: |
| ; FAST-NEXT: subq $4104, %rsp # imm = 0x1008 |
| ; FAST-NEXT: movq %rdi, %rsi |
| ; FAST-NEXT: movl $4096, %ecx # imm = 0x1000 |
| ; FAST-NEXT: movq %rsp, %rdi |
| ; FAST-NEXT: rep;movsb (%rsi), %es:(%rdi) |
| ; FAST-NEXT: callq foo |
| ; FAST-NEXT: addq $4104, %rsp # imm = 0x1008 |
| ; FAST-NEXT: retq |
| call void @foo(%struct.large* align 8 byval %x) |
| ret void |
| |
| } |
| |
| define void @test2(%struct.large* nocapture %x) nounwind minsize { |
| ; NOFAST32-LABEL: test2: |
| ; NOFAST32: # %bb.0: |
| ; NOFAST32-NEXT: pushl %edi |
| ; NOFAST32-NEXT: pushl %esi |
| ; NOFAST32-NEXT: subl $4100, %esp # imm = 0x1004 |
| ; NOFAST32-NEXT: movl {{[0-9]+}}(%esp), %esi |
| ; NOFAST32-NEXT: movl $1024, %ecx # imm = 0x400 |
| ; NOFAST32-NEXT: movl %esp, %edi |
| ; NOFAST32-NEXT: rep;movsl (%esi), %es:(%edi) |
| ; NOFAST32-NEXT: calll foo |
| ; NOFAST32-NEXT: addl $4100, %esp # imm = 0x1004 |
| ; NOFAST32-NEXT: popl %esi |
| ; NOFAST32-NEXT: popl %edi |
| ; NOFAST32-NEXT: retl |
| ; |
| ; FAST32-LABEL: test2: |
| ; FAST32: # %bb.0: |
| ; FAST32-NEXT: pushl %edi |
| ; FAST32-NEXT: pushl %esi |
| ; FAST32-NEXT: subl $4100, %esp # imm = 0x1004 |
| ; FAST32-NEXT: movl {{[0-9]+}}(%esp), %esi |
| ; FAST32-NEXT: movl $4096, %ecx # imm = 0x1000 |
| ; FAST32-NEXT: movl %esp, %edi |
| ; FAST32-NEXT: rep;movsb (%esi), %es:(%edi) |
| ; FAST32-NEXT: calll foo |
| ; FAST32-NEXT: addl $4100, %esp # imm = 0x1004 |
| ; FAST32-NEXT: popl %esi |
| ; FAST32-NEXT: popl %edi |
| ; FAST32-NEXT: retl |
| ; |
| ; NOFAST-LABEL: test2: |
| ; NOFAST: # %bb.0: |
| ; NOFAST-NEXT: subq $4104, %rsp # imm = 0x1008 |
| ; NOFAST-NEXT: movq %rdi, %rsi |
| ; NOFAST-NEXT: movl $512, %ecx # imm = 0x200 |
| ; NOFAST-NEXT: movq %rsp, %rdi |
| ; NOFAST-NEXT: rep;movsq (%rsi), %es:(%rdi) |
| ; NOFAST-NEXT: callq foo |
| ; NOFAST-NEXT: addq $4104, %rsp # imm = 0x1008 |
| ; NOFAST-NEXT: retq |
| ; |
| ; FAST-LABEL: test2: |
| ; FAST: # %bb.0: |
| ; FAST-NEXT: subq $4104, %rsp # imm = 0x1008 |
| ; FAST-NEXT: movq %rdi, %rsi |
| ; FAST-NEXT: movl $4096, %ecx # imm = 0x1000 |
| ; FAST-NEXT: movq %rsp, %rdi |
| ; FAST-NEXT: rep;movsb (%rsi), %es:(%rdi) |
| ; FAST-NEXT: callq foo |
| ; FAST-NEXT: addq $4104, %rsp # imm = 0x1008 |
| ; FAST-NEXT: retq |
| call void @foo(%struct.large* align 8 byval %x) |
| ret void |
| |
| } |
| |
| %struct.large_oddsize = type { [4095 x i8] } |
| |
| declare void @foo_oddsize(%struct.large_oddsize* align 8 byval) nounwind |
| |
| define void @test3(%struct.large_oddsize* nocapture %x) nounwind minsize { |
| ; NOFAST32-LABEL: test3: |
| ; NOFAST32: # %bb.0: |
| ; NOFAST32-NEXT: pushl %edi |
| ; NOFAST32-NEXT: pushl %esi |
| ; NOFAST32-NEXT: subl $4100, %esp # imm = 0x1004 |
| ; NOFAST32-NEXT: movl {{[0-9]+}}(%esp), %esi |
| ; NOFAST32-NEXT: movl $4095, %ecx # imm = 0xFFF |
| ; NOFAST32-NEXT: movl %esp, %edi |
| ; NOFAST32-NEXT: rep;movsb (%esi), %es:(%edi) |
| ; NOFAST32-NEXT: calll foo_oddsize |
| ; NOFAST32-NEXT: addl $4100, %esp # imm = 0x1004 |
| ; NOFAST32-NEXT: popl %esi |
| ; NOFAST32-NEXT: popl %edi |
| ; NOFAST32-NEXT: retl |
| ; |
| ; FAST32-LABEL: test3: |
| ; FAST32: # %bb.0: |
| ; FAST32-NEXT: pushl %edi |
| ; FAST32-NEXT: pushl %esi |
| ; FAST32-NEXT: subl $4100, %esp # imm = 0x1004 |
| ; FAST32-NEXT: movl {{[0-9]+}}(%esp), %esi |
| ; FAST32-NEXT: movl $4095, %ecx # imm = 0xFFF |
| ; FAST32-NEXT: movl %esp, %edi |
| ; FAST32-NEXT: rep;movsb (%esi), %es:(%edi) |
| ; FAST32-NEXT: calll foo_oddsize |
| ; FAST32-NEXT: addl $4100, %esp # imm = 0x1004 |
| ; FAST32-NEXT: popl %esi |
| ; FAST32-NEXT: popl %edi |
| ; FAST32-NEXT: retl |
| ; |
| ; NOFAST-LABEL: test3: |
| ; NOFAST: # %bb.0: |
| ; NOFAST-NEXT: subq $4104, %rsp # imm = 0x1008 |
| ; NOFAST-NEXT: movq %rdi, %rsi |
| ; NOFAST-NEXT: movl $4095, %ecx # imm = 0xFFF |
| ; NOFAST-NEXT: movq %rsp, %rdi |
| ; NOFAST-NEXT: rep;movsb (%rsi), %es:(%rdi) |
| ; NOFAST-NEXT: callq foo_oddsize |
| ; NOFAST-NEXT: addq $4104, %rsp # imm = 0x1008 |
| ; NOFAST-NEXT: retq |
| ; |
| ; FAST-LABEL: test3: |
| ; FAST: # %bb.0: |
| ; FAST-NEXT: subq $4104, %rsp # imm = 0x1008 |
| ; FAST-NEXT: movq %rdi, %rsi |
| ; FAST-NEXT: movl $4095, %ecx # imm = 0xFFF |
| ; FAST-NEXT: movq %rsp, %rdi |
| ; FAST-NEXT: rep;movsb (%rsi), %es:(%rdi) |
| ; FAST-NEXT: callq foo_oddsize |
| ; FAST-NEXT: addq $4104, %rsp # imm = 0x1008 |
| ; FAST-NEXT: retq |
| call void @foo_oddsize(%struct.large_oddsize* align 8 byval %x) |
| ret void |
| |
| } |