%res = bitcast <8 x i1> %insertvec to i8
ret i8 %res
}
+
+define i8 @v2i64_concat_undef(<2 x i64> %vec) {
+; SSE2-SSSE3-LABEL: v2i64_concat_undef:
+; SSE2-SSSE3: # %bb.0:
+; SSE2-SSSE3-NEXT: pxor %xmm1, %xmm1
+; SSE2-SSSE3-NEXT: pcmpeqd %xmm0, %xmm1
+; SSE2-SSSE3-NEXT: pshufd {{.*#+}} xmm0 = xmm1[1,3,3,2]
+; SSE2-SSSE3-NEXT: pshufd {{.*#+}} xmm1 = xmm1[0,2,2,3]
+; SSE2-SSSE3-NEXT: pand %xmm0, %xmm1
+; SSE2-SSSE3-NEXT: pshuflw {{.*#+}} xmm0 = xmm1[0,2,2,3,4,5,6,7]
+; SSE2-SSSE3-NEXT: psllw $15, %xmm0
+; SSE2-SSSE3-NEXT: packsswb %xmm0, %xmm0
+; SSE2-SSSE3-NEXT: pmovmskb %xmm0, %eax
+; SSE2-SSSE3-NEXT: # kill: def $al killed $al killed $eax
+; SSE2-SSSE3-NEXT: retq
+;
+; AVX12-LABEL: v2i64_concat_undef:
+; AVX12: # %bb.0:
+; AVX12-NEXT: vpxor %xmm1, %xmm1, %xmm1
+; AVX12-NEXT: vpcmpeqq %xmm1, %xmm0, %xmm0
+; AVX12-NEXT: vpackssdw %xmm0, %xmm0, %xmm0
+; AVX12-NEXT: vpackssdw %xmm0, %xmm0, %xmm0
+; AVX12-NEXT: vpsllw $15, %xmm0, %xmm0
+; AVX12-NEXT: vpacksswb %xmm0, %xmm0, %xmm0
+; AVX12-NEXT: vpmovmskb %xmm0, %eax
+; AVX12-NEXT: # kill: def $al killed $al killed $eax
+; AVX12-NEXT: retq
+;
+; AVX512F-LABEL: v2i64_concat_undef:
+; AVX512F: # %bb.0:
+; AVX512F-NEXT: vptestnmq %xmm0, %xmm0, %k0
+; AVX512F-NEXT: kmovw %k0, %eax
+; AVX512F-NEXT: # kill: def $al killed $al killed $eax
+; AVX512F-NEXT: retq
+;
+; AVX512BW-LABEL: v2i64_concat_undef:
+; AVX512BW: # %bb.0:
+; AVX512BW-NEXT: vptestnmq %xmm0, %xmm0, %k0
+; AVX512BW-NEXT: kmovd %k0, %eax
+; AVX512BW-NEXT: # kill: def $al killed $al killed $eax
+; AVX512BW-NEXT: retq
+ %tobool = icmp eq <2 x i64> %vec, zeroinitializer
+ %insertvec = shufflevector <2 x i1> %tobool, <2 x i1> poison, <8 x i32> <i32 0, i32 1, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
+ %res = bitcast <8 x i1> %insertvec to i8
+ ret i8 %res
+}
+
+define i8 @v4f64_concat_undef(<4 x double> %vec) {
+; SSE2-SSSE3-LABEL: v4f64_concat_undef:
+; SSE2-SSSE3: # %bb.0:
+; SSE2-SSSE3-NEXT: xorpd %xmm2, %xmm2
+; SSE2-SSSE3-NEXT: xorpd %xmm3, %xmm3
+; SSE2-SSSE3-NEXT: cmpltpd %xmm1, %xmm3
+; SSE2-SSSE3-NEXT: cmpltpd %xmm0, %xmm2
+; SSE2-SSSE3-NEXT: packssdw %xmm3, %xmm2
+; SSE2-SSSE3-NEXT: movmskps %xmm2, %eax
+; SSE2-SSSE3-NEXT: # kill: def $al killed $al killed $eax
+; SSE2-SSSE3-NEXT: retq
+;
+; AVX12-LABEL: v4f64_concat_undef:
+; AVX12: # %bb.0:
+; AVX12-NEXT: vxorpd %xmm1, %xmm1, %xmm1
+; AVX12-NEXT: vcmpltpd %ymm0, %ymm1, %ymm0
+; AVX12-NEXT: vmovmskpd %ymm0, %eax
+; AVX12-NEXT: # kill: def $al killed $al killed $eax
+; AVX12-NEXT: vzeroupper
+; AVX12-NEXT: retq
+;
+; AVX512F-LABEL: v4f64_concat_undef:
+; AVX512F: # %bb.0:
+; AVX512F-NEXT: vxorpd %xmm1, %xmm1, %xmm1
+; AVX512F-NEXT: vcmpltpd %ymm0, %ymm1, %k0
+; AVX512F-NEXT: kmovw %k0, %eax
+; AVX512F-NEXT: # kill: def $al killed $al killed $eax
+; AVX512F-NEXT: vzeroupper
+; AVX512F-NEXT: retq
+;
+; AVX512BW-LABEL: v4f64_concat_undef:
+; AVX512BW: # %bb.0:
+; AVX512BW-NEXT: vxorpd %xmm1, %xmm1, %xmm1
+; AVX512BW-NEXT: vcmpltpd %ymm0, %ymm1, %k0
+; AVX512BW-NEXT: kmovd %k0, %eax
+; AVX512BW-NEXT: # kill: def $al killed $al killed $eax
+; AVX512BW-NEXT: vzeroupper
+; AVX512BW-NEXT: retq
+ %tobool = fcmp ogt <4 x double> %vec, zeroinitializer
+ %insertvec = shufflevector <4 x i1> %tobool, <4 x i1> poison, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 undef, i32 undef, i32 undef, i32 undef>
+ %res = bitcast <8 x i1> %insertvec to i8
+ ret i8 %res
+}