forked from OSchip/llvm-project
[X86] Enable fast variable per-lane shuffle tuning on all Ryzen targets (PR44795)
rGa3b8695bf592 enabled this for znver3, but AMD SoG, Agner and uops.info all agree that even znver1 has a fast per-lane shuffle op (VPSHUFB), but cross-lane shuffles seem to be slow (PERMPS etc.) Fixes #44140 Differential Revision: https://reviews.llvm.org/D123306
This commit is contained in:
parent
b2a7f1c390
commit
cf3a09369a
|
@ -1193,6 +1193,7 @@ def ProcessorFeatures {
|
|||
TuningFastScalarFSQRT,
|
||||
TuningFastVectorFSQRT,
|
||||
TuningFastScalarShiftMasks,
|
||||
TuningFastVariablePerLaneShuffle,
|
||||
TuningFastMOVBE,
|
||||
TuningSlowSHLD,
|
||||
TuningSBBDepBreaking,
|
||||
|
@ -1208,9 +1209,7 @@ def ProcessorFeatures {
|
|||
FeaturePKU,
|
||||
FeatureVAES,
|
||||
FeatureVPCLMULQDQ];
|
||||
list<SubtargetFeature> ZN3AdditionalTuning =
|
||||
[TuningMacroFusion,
|
||||
TuningFastVariablePerLaneShuffle];
|
||||
list<SubtargetFeature> ZN3AdditionalTuning = [TuningMacroFusion];
|
||||
list<SubtargetFeature> ZN3Tuning =
|
||||
!listconcat(ZN2Tuning, ZN3AdditionalTuning);
|
||||
list<SubtargetFeature> ZN3Features =
|
||||
|
|
|
@ -4,8 +4,8 @@
|
|||
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx2,+fast-variable-perlane-shuffle | FileCheck %s --check-prefixes=FAST
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx512f,+fast-variable-perlane-shuffle | FileCheck %s --check-prefixes=FAST
|
||||
;
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=znver1 | FileCheck %s --check-prefixes=SLOW
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=znver2 | FileCheck %s --check-prefixes=SLOW
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=znver1 | FileCheck %s --check-prefixes=FAST
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=znver2 | FileCheck %s --check-prefixes=FAST
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=znver3 | FileCheck %s --check-prefixes=FAST
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=haswell | FileCheck %s --check-prefixes=FAST
|
||||
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=skx | FileCheck %s --check-prefixes=FAST
|
||||
|
|
Loading…
Reference in New Issue