llvm.org GIT mirror llvm / 5009e4f
[X86][AVX512] Fixed VPERMILPD/VPERMILPS shuffle comments.
Fixed incorrect operand indices used to access src registers.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@269221 91177308-0d34-0410-b5e6-96231b3b80d8
Simon Pilgrim, 4 years ago
3 changed file(s) with 14 addition(s) and 14 deletion(s). Raw diff Collapse all Expand all
587587 break;
588588
589589 CASE_VPERM(PERMILPS, r)
590 Src1Name = getRegName(MI->getOperand(1).getReg());
590 Src1Name = getRegName(MI->getOperand(NumOperands - 2).getReg());
591591 // FALL THROUGH.
592592 CASE_VPERM(PERMILPS, m)
593593 if (MI->getOperand(NumOperands - 1).isImm())
598598 break;
599599
600600 CASE_VPERM(PERMILPD, r)
601 Src1Name = getRegName(MI->getOperand(1).getReg());
601 Src1Name = getRegName(MI->getOperand(NumOperands - 2).getReg());
602602 // FALL THROUGH.
603603 CASE_VPERM(PERMILPD, m)
604604 if (MI->getOperand(NumOperands - 1).isImm())
59875987 ; CHECK-LABEL: test_int_x86_avx512_mask_vpermil_pd_512:
59885988 ; CHECK: ## BB#0:
59895989 ; CHECK-NEXT: kmovw %edi, %k1
5990 ; CHECK-NEXT: vpermilpd {{.*#+}} zmm1 = zmm1[0,1,3,2,5,4,6,6]
5991 ; CHECK-NEXT: vpermilpd {{.*#+}} zmm2 = k1[0,1,3,2,5,4,6,6]
5990 ; CHECK-NEXT: vpermilpd {{.*#+}} zmm1 = zmm0[0,1,3,2,5,4,6,6]
5991 ; CHECK-NEXT: vpermilpd {{.*#+}} zmm2 = zmm0[0,1,3,2,5,4,6,6]
59925992 ; CHECK-NEXT: vpermilpd {{.*#+}} zmm0 = zmm0[0,1,3,2,5,4,6,6]
59935993 ; CHECK-NEXT: vaddpd %zmm2, %zmm1, %zmm1
59945994 ; CHECK-NEXT: vaddpd %zmm0, %zmm1, %zmm0
60076007 ; CHECK-LABEL: test_int_x86_avx512_mask_vpermil_ps_512:
60086008 ; CHECK: ## BB#0:
60096009 ; CHECK-NEXT: kmovw %edi, %k1
6010 ; CHECK-NEXT: vpermilps {{.*#+}} zmm1 = zmm1[2,1,1,0,6,5,5,4,10,9,9,8,14,13,13,12]
6011 ; CHECK-NEXT: vpermilps {{.*#+}} zmm2 = k1[2,1,1,0,6,5,5,4,10,9,9,8,14,13,13,12]
6010 ; CHECK-NEXT: vpermilps {{.*#+}} zmm1 = zmm0[2,1,1,0,6,5,5,4,10,9,9,8,14,13,13,12]
6011 ; CHECK-NEXT: vpermilps {{.*#+}} zmm2 = zmm0[2,1,1,0,6,5,5,4,10,9,9,8,14,13,13,12]
60126012 ; CHECK-NEXT: vpermilps {{.*#+}} zmm0 = zmm0[2,1,1,0,6,5,5,4,10,9,9,8,14,13,13,12]
60136013 ; CHECK-NEXT: vaddps %zmm2, %zmm1, %zmm1
60146014 ; CHECK-NEXT: vaddps %zmm0, %zmm1, %zmm0
48334833 ; CHECK: ## BB#0:
48344834 ; CHECK-NEXT: kmovw %edi, %k1
48354835 ; CHECK-NEXT: vpermilpd $22, %ymm0, %ymm1 {%k1}
4836 ; CHECK-NEXT: ## ymm1 = ymm1[0,1,3,2]
4836 ; CHECK-NEXT: ## ymm1 = ymm0[0,1,3,2]
48374837 ; CHECK-NEXT: vpermilpd $22, %ymm0, %ymm2 {%k1} {z}
4838 ; CHECK-NEXT: ## ymm2 = k1[0,1,3,2]
4838 ; CHECK-NEXT: ## ymm2 = ymm0[0,1,3,2]
48394839 ; CHECK-NEXT: vpermilpd $22, %ymm0, %ymm0
48404840 ; CHECK-NEXT: ## ymm0 = ymm0[0,1,3,2]
48414841 ; CHECK-NEXT: vaddpd %ymm2, %ymm1, %ymm1
48564856 ; CHECK: ## BB#0:
48574857 ; CHECK-NEXT: kmovw %edi, %k1
48584858 ; CHECK-NEXT: vpermilpd $1, %xmm0, %xmm1 {%k1}
4859 ; CHECK-NEXT: ## xmm1 = xmm1[1,0]
4859 ; CHECK-NEXT: ## xmm1 = xmm0[1,0]
48604860 ; CHECK-NEXT: vpermilpd $1, %xmm0, %xmm2 {%k1} {z}
4861 ; CHECK-NEXT: ## xmm2 = k1[1,0]
4861 ; CHECK-NEXT: ## xmm2 = xmm0[1,0]
48624862 ; CHECK-NEXT: vpermilpd $1, %xmm0, %xmm0
48634863 ; CHECK-NEXT: ## xmm0 = xmm0[1,0]
48644864 ; CHECK-NEXT: vaddpd %xmm2, %xmm1, %xmm1
48794879 ; CHECK: ## BB#0:
48804880 ; CHECK-NEXT: kmovw %edi, %k1
48814881 ; CHECK-NEXT: vpermilps $22, %ymm0, %ymm1 {%k1}
4882 ; CHECK-NEXT: ## ymm1 = ymm1[2,1,1,0,6,5,5,4]
4882 ; CHECK-NEXT: ## ymm1 = ymm0[2,1,1,0,6,5,5,4]
48834883 ; CHECK-NEXT: vpermilps $22, %ymm0, %ymm2 {%k1} {z}
4884 ; CHECK-NEXT: ## ymm2 = k1[2,1,1,0,6,5,5,4]
4884 ; CHECK-NEXT: ## ymm2 = ymm0[2,1,1,0,6,5,5,4]
48854885 ; CHECK-NEXT: vpermilps $22, %ymm0, %ymm0
48864886 ; CHECK-NEXT: ## ymm0 = ymm0[2,1,1,0,6,5,5,4]
48874887 ; CHECK-NEXT: vaddps %ymm2, %ymm1, %ymm1
49024902 ; CHECK: ## BB#0:
49034903 ; CHECK-NEXT: kmovw %edi, %k1
49044904 ; CHECK-NEXT: vpermilps $22, %xmm0, %xmm1 {%k1}
4905 ; CHECK-NEXT: ## xmm1 = xmm1[2,1,1,0]
4905 ; CHECK-NEXT: ## xmm1 = xmm0[2,1,1,0]
49064906 ; CHECK-NEXT: vpermilps $22, %xmm0, %xmm2 {%k1} {z}
4907 ; CHECK-NEXT: ## xmm2 = k1[2,1,1,0]
4907 ; CHECK-NEXT: ## xmm2 = xmm0[2,1,1,0]
49084908 ; CHECK-NEXT: vpermilps $22, %xmm0, %xmm0
49094909 ; CHECK-NEXT: ## xmm0 = xmm0[2,1,1,0]
49104910 ; CHECK-NEXT: vaddps %xmm2, %xmm1, %xmm1