/external/llvm/lib/Transforms/Vectorize/ |
D | LoopVectorize.cpp | 241 static Type *ToVectorTy(Type *Scalar, unsigned VF) { in ToVectorTy() argument 242 if (Scalar->isVoidTy() || VF == 1) in ToVectorTy() 244 return VectorType::get(Scalar, VF); in ToVectorTy() 295 AC(AC), VF(VecWidth), UF(UnrollFactor), in InnerLoopVectorizer() 379 unsigned VF, PhiVector *PV); 542 unsigned VF; member in __anon63bf7e8f0111::InnerLoopVectorizer 1631 unsigned selectInterleaveCount(bool OptForSize, unsigned VF, 1638 unsigned computeInterleaveCount(bool OptForSize, unsigned VF, 1673 VectorizationCostTy expectedCost(unsigned VF); 1677 VectorizationCostTy getInstructionCost(Instruction *I, unsigned VF); [all …]
|
D | LoadStoreVectorizer.cpp | 684 unsigned VF = VecRegSize / Sz; in vectorizeStoreChain() local 687 if (!isPowerOf2_32(Sz) || VF < 2 || ChainSize < 2) { in vectorizeStoreChain() 735 if (ChainSize > VF) { in vectorizeStoreChain() 738 return vectorizeStoreChain(Chain.slice(0, VF), InstructionsProcessed) | in vectorizeStoreChain() 739 vectorizeStoreChain(Chain.slice(VF), InstructionsProcessed); in vectorizeStoreChain() 839 unsigned VF = VecRegSize / Sz; in vectorizeLoadChain() local 842 if (!isPowerOf2_32(Sz) || VF < 2 || ChainSize < 2) { in vectorizeLoadChain() 889 if (ChainSize > VF) { in vectorizeLoadChain() 892 return vectorizeLoadChain(Chain.slice(0, VF), InstructionsProcessed) | in vectorizeLoadChain() 893 vectorizeLoadChain(Chain.slice(VF), InstructionsProcessed); in vectorizeLoadChain()
|
/external/clang/test/SemaCXX/ |
D | destructor.cpp | 213 struct VF final: VB {}; struct 246 VF vf; use(vf); in nowarnstack() 310 VF* vf = new VF(); in nowarn0() 315 void nowarn0_explicit_dtor(F* f, VB* vb, VD* vd, VF* vf) { in nowarn0_explicit_dtor() 320 vf->~VF(); in nowarn0_explicit_dtor() 367 simple_ptr<VF> vf(new VF()); in nowarn1()
|
/external/llvm/include/llvm/Analysis/ |
D | TargetLibraryInfo.h | 162 bool isFunctionVectorizable(StringRef F, unsigned VF) const { in isFunctionVectorizable() argument 163 return !getVectorizedFunction(F, VF).empty(); in isFunctionVectorizable() 172 StringRef getVectorizedFunction(StringRef F, unsigned VF) const; 176 bool isFunctionScalarizable(StringRef F, unsigned &VF) const { in isFunctionScalarizable() argument 177 return !getScalarizedFunction(F, VF).empty(); in isFunctionScalarizable() 184 StringRef getScalarizedFunction(StringRef F, unsigned &VF) const; 229 bool isFunctionVectorizable(StringRef F, unsigned VF) const { in isFunctionVectorizable() argument 230 return Impl->isFunctionVectorizable(F, VF); in isFunctionVectorizable() 235 StringRef getVectorizedFunction(StringRef F, unsigned VF) const { in getVectorizedFunction() argument 236 return Impl->getVectorizedFunction(F, VF); in getVectorizedFunction()
|
D | TargetTransformInfo.h | 484 unsigned getMaxInterleaveFactor(unsigned VF) const; 692 virtual unsigned getMaxInterleaveFactor(unsigned VF) = 0; 892 unsigned getMaxInterleaveFactor(unsigned VF) override { in getMaxInterleaveFactor() argument 893 return Impl.getMaxInterleaveFactor(VF); in getMaxInterleaveFactor()
|
/external/llvm/test/Transforms/LoopVectorize/X86/ |
D | reg-usage.ll | 11 ; This function has a loop of SAD pattern. Here we check when VF = 16 the 15 ; CHECK: LV(REG): VF = 4 17 ; CHECK: LV(REG): VF = 8 19 ; CHECK: LV(REG): VF = 16 50 ; CHECK: LV(REG): VF = 2
|
D | uint64_to_fp64-cost-model.ll | 8 ; CHECK: cost of 10 for VF 2 For instruction: %conv = uitofp i64 %tmp to double 9 ; CHECK: cost of 20 for VF 4 For instruction: %conv = uitofp i64 %tmp to double
|
D | vector-scalar-select-cost.ll | 26 ; CHECK: cost of 1 for VF 2 {{.*}} select i1 %cond, i32 %6, i32 0 54 ; CHECK: cost of 1 for VF 2 {{.*}} select i1 %8, i32 %6, i32 0
|
D | gcc-examples.ll | 11 ; Select VF = 8; 47 ; Select VF=4 because sext <8 x i1> to <8 x i32> is expensive.
|
D | fp_to_sint8-cost-model.ll | 8 ; CHECK: cost of 7 for VF 8 For instruction: %conv = fptosi float %tmp to i8
|
D | vector_max_bandwidth.ll | 19 ; CHECK: LV: Selecting VF: 32.
|
/external/llvm/test/Transforms/LoopVectorize/AArch64/ |
D | max-vf-for-interleaved.ll | 10 ; vectorization is 16 bytes. Normally, this would lead to a maximum VF of 4. 11 ; However, for interleaved groups, the effective VF is VF * IF, where IF is the 13 ; as 16 / IF bytes, resulting in VF=2. Since IF=2, we should generate <4 x i32>
|
D | interleaved_cost.ll | 18 ; CHECK: LV: Found an estimated cost of 2 for VF 8 For instruction: %tmp = load i8, i8* %arrayidx… 19 ; CHECK: LV: Found an estimated cost of 2 for VF 16 For instruction: %tmp = load i8, i8* %arrayid… 52 ; CHECK: LV: Found an estimated cost of 6 for VF 2 For instruction: %1 = load double, double* %0,… 53 ; CHECK: LV: Found an estimated cost of 0 for VF 2 For instruction: %5 = load double, double* %4,… 54 ; CHECK: LV: Found an estimated cost of 10 for VF 2 For instruction: store double %9, double* %10…
|
/external/clang/test/Layout/ |
D | ms-x86-member-pointers.cpp | 14 struct VF { char a; int (V::*mp)(); }; struct 79 sizeof(VF) +
|
/external/clang/test/CodeGenCXX/ |
D | apple-kext-indirect-call-2.cpp | 15 virtual void VF(); 18 void B::VF() {} in VF() function in B
|
/external/llvm/test/Transforms/LoopVectorize/ARM/ |
D | interleaved_cost.ll | 17 ; CHECK: LV: Found an estimated cost of 2 for VF 8 For instruction: %tmp = load i8, i8* %arrayidx… 18 ; CHECK: LV: Found an estimated cost of 2 for VF 16 For instruction: %tmp = load i8, i8* %arrayid…
|
/external/llvm/lib/Target/PowerPC/ |
D | PPCRegisterInfo.td | 59 // VF - One of the 32 64-bit floating-point subregisters of the vector 61 class VF<bits<5> num, string n> : PPCReg<n> { 67 class VR<VF SubReg, string n> : PPCReg<n> { 121 def VF#Index : VF<Index, "vs" # !add(Index, 32)>; 132 def V#Index : VR<!cast<VF>("VF"#Index), "v"#Index>,
|
D | PPCTargetTransformInfo.h | 75 unsigned getMaxInterleaveFactor(unsigned VF);
|
/external/llvm/lib/Target/X86/ |
D | X86TargetTransformInfo.cpp | 70 unsigned X86TTIImpl::getMaxInterleaveFactor(unsigned VF) { in getMaxInterleaveFactor() argument 74 if (VF == 1) in getMaxInterleaveFactor() 1439 unsigned VF = SrcVTy->getVectorNumElements(); in getGSVectorCost() local 1473 unsigned IndexSize = (VF >= 16) ? getIndexSizeInBits(Ptr, DL) : in getGSVectorCost() 1477 IndexSize), VF); in getGSVectorCost() 1483 Type *SplitSrcTy = VectorType::get(SrcVTy->getScalarType(), VF / SplitFactor); in getGSVectorCost() 1491 return GSOverhead + VF * getMemoryOpCost(Opcode, SrcVTy->getScalarType(), in getGSVectorCost() 1506 unsigned VF = SrcVTy->getVectorNumElements(); in getGSScalarCost() local 1511 VectorType::get(Type::getInt1Ty(SrcVTy->getContext()), VF); in getGSScalarCost() 1517 MaskUnpackCost += VF * (BranchCost + ScalarCompareCost); in getGSScalarCost() [all …]
|
D | X86TargetTransformInfo.h | 64 unsigned getMaxInterleaveFactor(unsigned VF);
|
/external/clang/test/CodeGenOpenCL/ |
D | shifts.cl | 53 //OPT-NEXT: [[VF:%.+]] = add <4 x i32> [[VC]], <i32 2, i32 4, i32 16, i32 8> 57 //OPT-NEXT: ret <4 x i32> [[VF]]
|
/external/llvm/lib/Target/AMDGPU/ |
D | AMDGPUTargetTransformInfo.h | 86 unsigned getMaxInterleaveFactor(unsigned VF);
|
/external/llvm/test/Transforms/LoopVectorize/ |
D | unroll.ll | 1 ; This test makes sure that loop will not be unrolled in vectorization if VF computed
|
/external/llvm/lib/Target/ARM/ |
D | ARMTargetTransformInfo.h | 102 unsigned getMaxInterleaveFactor(unsigned VF) { in getMaxInterleaveFactor() argument
|
/external/llvm/lib/Target/AArch64/ |
D | AArch64TargetTransformInfo.h | 98 unsigned getMaxInterleaveFactor(unsigned VF);
|