mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-31 20:51:52 +01:00
d654e7d40c
Enable enableMultipleCopyHints() on X86. Original Patch by @jonpa: While enabling the mischeduler for SystemZ, it was discovered that for some reason a test needed one extra seemingly needless COPY (test/CodeGen/SystemZ/call-03.ll). The handling for that is resulted in this patch, which improves the register coalescing by providing not just one copy hint, but a sorted list of copy hints. On SystemZ, this gives ~12500 less register moves on SPEC, as well as marginally less spilling. Instead of improving just the SystemZ backend, the improvement has been implemented in common-code (calculateSpillWeightAndHint(). This gives a lot of test failures, but since this should be a general improvement I hope that the involved targets will help and review the test updates. Differential Revision: https://reviews.llvm.org/D38128 llvm-svn: 342578
29 lines
1.2 KiB
LLVM
29 lines
1.2 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s -fast-isel -mtriple=x86_64-unknown-unknown -mattr=+sse4.2 | FileCheck %s --check-prefixes=CHECK,SSE
|
|
; RUN: llc < %s -fast-isel -mtriple=x86_64-unknown-unknown -mattr=+avx | FileCheck %s --check-prefixes=CHECK,AVX,AVX1
|
|
; RUN: llc < %s -fast-isel -mtriple=x86_64-unknown-unknown -mattr=+avx512f,+avx512bw,+avx512dq,+avx512vl | FileCheck %s --check-prefixes=CHECK,AVX,AVX512
|
|
|
|
; NOTE: This should use IR equivalent to what is generated by clang/test/CodeGen/sse42-builtins.c
|
|
|
|
define i64 @test_mm_crc64_u8(i64 %a0, i8 %a1) nounwind{
|
|
; CHECK-LABEL: test_mm_crc64_u8:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: crc32b %sil, %edi
|
|
; CHECK-NEXT: movl %edi, %eax
|
|
; CHECK-NEXT: retq
|
|
%res = call i64 @llvm.x86.sse42.crc32.64.8(i64 %a0, i8 %a1)
|
|
ret i64 %res
|
|
}
|
|
declare i64 @llvm.x86.sse42.crc32.64.8(i64, i8) nounwind readnone
|
|
|
|
define i64 @test_mm_crc64_u64(i64 %a0, i64 %a1) nounwind{
|
|
; CHECK-LABEL: test_mm_crc64_u64:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: movq %rdi, %rax
|
|
; CHECK-NEXT: crc32q %rsi, %rax
|
|
; CHECK-NEXT: retq
|
|
%res = call i64 @llvm.x86.sse42.crc32.64.64(i64 %a0, i64 %a1)
|
|
ret i64 %res
|
|
}
|
|
declare i64 @llvm.x86.sse42.crc32.64.64(i64, i64) nounwind readnone
|