Skip to content

Commit 7896df2

Browse files
authored
Merge pull request #52 from schweitzpgi/release_70
merge up LLVM changes [Release 70 branch]
2 parents 04a4ab9 + 1b7b2fc commit 7896df2

File tree

7 files changed

+96
-18
lines changed

7 files changed

+96
-18
lines changed

lib/Target/X86/X86DomainReassignment.cpp

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -217,6 +217,27 @@ class InstrCOPYReplacer : public InstrReplacer {
217217
InstrCOPYReplacer(unsigned SrcOpcode, RegDomain DstDomain, unsigned DstOpcode)
218218
: InstrReplacer(SrcOpcode, DstOpcode), DstDomain(DstDomain) {}
219219

220+
bool isLegal(const MachineInstr *MI,
221+
const TargetInstrInfo *TII) const override {
222+
if (!InstrConverterBase::isLegal(MI, TII))
223+
return false;
224+
225+
// Don't allow copies to/flow GR8/GR16 physical registers.
226+
// FIXME: Is there some better way to support this?
227+
unsigned DstReg = MI->getOperand(0).getReg();
228+
if (TargetRegisterInfo::isPhysicalRegister(DstReg) &&
229+
(X86::GR8RegClass.contains(DstReg) ||
230+
X86::GR16RegClass.contains(DstReg)))
231+
return false;
232+
unsigned SrcReg = MI->getOperand(1).getReg();
233+
if (TargetRegisterInfo::isPhysicalRegister(SrcReg) &&
234+
(X86::GR8RegClass.contains(SrcReg) ||
235+
X86::GR16RegClass.contains(SrcReg)))
236+
return false;
237+
238+
return true;
239+
}
240+
220241
double getExtraCost(const MachineInstr *MI,
221242
MachineRegisterInfo *MRI) const override {
222243
assert(MI->getOpcode() == TargetOpcode::COPY && "Expected a COPY");

lib/Target/X86/X86ISelLowering.cpp

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -23312,15 +23312,14 @@ static SDValue LowerScalarVariableShift(SDValue Op, SelectionDAG &DAG,
2331223312
}
2331323313

2331423314
// Check cases (mainly 32-bit) where i64 is expanded into high and low parts.
23315-
if (VT == MVT::v2i64 && Amt.getOpcode() == ISD::BITCAST &&
23315+
if (VT == MVT::v2i64 && Amt.getOpcode() == ISD::BITCAST &&
2331623316
Amt.getOperand(0).getOpcode() == ISD::BUILD_VECTOR) {
2331723317
Amt = Amt.getOperand(0);
23318-
unsigned Ratio = Amt.getSimpleValueType().getVectorNumElements() /
23319-
VT.getVectorNumElements();
23318+
unsigned Ratio = 64 / Amt.getScalarValueSizeInBits();
2332023319
std::vector<SDValue> Vals(Ratio);
2332123320
for (unsigned i = 0; i != Ratio; ++i)
2332223321
Vals[i] = Amt.getOperand(i);
23323-
for (unsigned i = Ratio; i != Amt.getNumOperands(); i += Ratio) {
23322+
for (unsigned i = Ratio, e = Amt.getNumOperands(); i != e; i += Ratio) {
2332423323
for (unsigned j = 0; j != Ratio; ++j)
2332523324
if (Vals[j] != Amt.getOperand(i + j))
2332623325
return SDValue();

lib/Target/X86/X86InstrInfo.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3109,7 +3109,7 @@ void X86InstrInfo::copyPhysReg(MachineBasicBlock &MBB,
31093109

31103110
LLVM_DEBUG(dbgs() << "Cannot copy " << RI.getName(SrcReg) << " to "
31113111
<< RI.getName(DestReg) << '\n');
3112-
llvm_unreachable("Cannot emit physreg copy instruction");
3112+
report_fatal_error("Cannot emit physreg copy instruction");
31133113
}
31143114

31153115
bool X86InstrInfo::isCopyInstr(const MachineInstr &MI,

test/CodeGen/X86/known-signbits-vector.ll

Lines changed: 18 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -381,19 +381,26 @@ define <4 x float> @signbits_ashr_sext_select_shuffle_sitofp(<4 x i64> %a0, <4 x
381381
; X32-NEXT: movl %esp, %ebp
382382
; X32-NEXT: andl $-16, %esp
383383
; X32-NEXT: subl $16, %esp
384+
; X32-NEXT: vmovdqa {{.*#+}} xmm3 = [33,0,63,0]
385+
; X32-NEXT: vmovdqa {{.*#+}} xmm4 = [0,2147483648,0,2147483648]
386+
; X32-NEXT: vpsrlq %xmm3, %xmm4, %xmm5
387+
; X32-NEXT: vpshufd {{.*#+}} xmm6 = xmm3[2,3,0,1]
388+
; X32-NEXT: vpsrlq %xmm6, %xmm4, %xmm4
389+
; X32-NEXT: vpblendw {{.*#+}} xmm4 = xmm5[0,1,2,3],xmm4[4,5,6,7]
390+
; X32-NEXT: vextractf128 $1, %ymm2, %xmm5
391+
; X32-NEXT: vpsrlq %xmm6, %xmm5, %xmm7
392+
; X32-NEXT: vpsrlq %xmm3, %xmm5, %xmm5
393+
; X32-NEXT: vpblendw {{.*#+}} xmm5 = xmm5[0,1,2,3],xmm7[4,5,6,7]
394+
; X32-NEXT: vpsrlq %xmm6, %xmm2, %xmm6
395+
; X32-NEXT: vpsrlq %xmm3, %xmm2, %xmm2
396+
; X32-NEXT: vpblendw {{.*#+}} xmm2 = xmm2[0,1,2,3],xmm6[4,5,6,7]
384397
; X32-NEXT: vpmovsxdq 16(%ebp), %xmm3
398+
; X32-NEXT: vpxor %xmm4, %xmm5, %xmm5
399+
; X32-NEXT: vpsubq %xmm4, %xmm5, %xmm5
400+
; X32-NEXT: vpxor %xmm4, %xmm2, %xmm2
401+
; X32-NEXT: vpsubq %xmm4, %xmm2, %xmm2
385402
; X32-NEXT: vpmovsxdq 8(%ebp), %xmm4
386-
; X32-NEXT: vmovdqa {{.*#+}} xmm5 = [33,0,63,0]
387-
; X32-NEXT: vmovdqa {{.*#+}} xmm6 = [0,2147483648,0,2147483648]
388-
; X32-NEXT: vpsrlq %xmm5, %xmm6, %xmm6
389-
; X32-NEXT: vextractf128 $1, %ymm2, %xmm7
390-
; X32-NEXT: vpsrlq %xmm5, %xmm7, %xmm7
391-
; X32-NEXT: vpxor %xmm6, %xmm7, %xmm7
392-
; X32-NEXT: vpsubq %xmm6, %xmm7, %xmm7
393-
; X32-NEXT: vpsrlq %xmm5, %xmm2, %xmm2
394-
; X32-NEXT: vpxor %xmm6, %xmm2, %xmm2
395-
; X32-NEXT: vpsubq %xmm6, %xmm2, %xmm2
396-
; X32-NEXT: vinsertf128 $1, %xmm7, %ymm2, %ymm2
403+
; X32-NEXT: vinsertf128 $1, %xmm5, %ymm2, %ymm2
397404
; X32-NEXT: vinsertf128 $1, %xmm3, %ymm4, %ymm3
398405
; X32-NEXT: vextractf128 $1, %ymm1, %xmm4
399406
; X32-NEXT: vextractf128 $1, %ymm0, %xmm5

test/CodeGen/X86/pr38803.ll

Lines changed: 48 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,48 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2+
; RUN: llc < %s -mcpu=skylake-avx512 -mtriple=x86_64-unknown-unknown | FileCheck %s
3+
4+
@b = local_unnamed_addr global i32 0, align 4
5+
@c = local_unnamed_addr global i32 0, align 4
6+
@d = local_unnamed_addr global float 0.000000e+00, align 4
7+
8+
define float @_Z3fn2v() {
9+
; CHECK-LABEL: _Z3fn2v:
10+
; CHECK: # %bb.0: # %entry
11+
; CHECK-NEXT: pushq %rax
12+
; CHECK-NEXT: .cfi_def_cfa_offset 16
13+
; CHECK-NEXT: callq _Z1av
14+
; CHECK-NEXT: # kill: def $al killed $al def $eax
15+
; CHECK-NEXT: kmovd %eax, %k1
16+
; CHECK-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero
17+
; CHECK-NEXT: vmovss %xmm0, %xmm0, %xmm0 {%k1} {z}
18+
; CHECK-NEXT: cmpl $0, {{.*}}(%rip)
19+
; CHECK-NEXT: je .LBB0_2
20+
; CHECK-NEXT: # %bb.1: # %if.then
21+
; CHECK-NEXT: vcvtsi2ssl {{.*}}(%rip), %xmm1, %xmm1
22+
; CHECK-NEXT: kmovd %eax, %k1
23+
; CHECK-NEXT: vxorps %xmm2, %xmm2, %xmm2
24+
; CHECK-NEXT: vmovss %xmm2, %xmm0, %xmm1 {%k1}
25+
; CHECK-NEXT: vmovss %xmm1, {{.*}}(%rip)
26+
; CHECK-NEXT: .LBB0_2: # %if.end
27+
; CHECK-NEXT: popq %rax
28+
; CHECK-NEXT: .cfi_def_cfa_offset 8
29+
; CHECK-NEXT: retq
30+
entry:
31+
%call = tail call zeroext i1 @_Z1av()
32+
%cond = select i1 %call, float 7.500000e-01, float 0.000000e+00
33+
%0 = load i32, i32* @c, align 4
34+
%tobool2 = icmp eq i32 %0, 0
35+
br i1 %tobool2, label %if.end, label %if.then
36+
37+
if.then: ; preds = %entry
38+
%1 = load i32, i32* @b, align 4
39+
%2 = sitofp i32 %1 to float
40+
%conv5 = select i1 %call, float 0.000000e+00, float %2
41+
store float %conv5, float* @d, align 4
42+
br label %if.end
43+
44+
if.end: ; preds = %entry, %if.then
45+
ret float %cond
46+
}
47+
48+
declare zeroext i1 @_Z1av()

tools/llvm-xray/xray-account.cpp

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -358,8 +358,11 @@ void LatencyAccountant::exportStats(const XRayFileHeader &Header, F Fn) const {
358358
break;
359359
}
360360

361-
if (AccountTop > 0)
362-
Results.erase(Results.begin() + AccountTop.getValue(), Results.end());
361+
if (AccountTop > 0) {
362+
auto MaxTop =
363+
std::min(AccountTop.getValue(), static_cast<int>(Results.size()));
364+
Results.erase(Results.begin() + MaxTop, Results.end());
365+
}
363366

364367
for (const auto &R : Results)
365368
Fn(std::get<0>(R), std::get<1>(R), std::get<2>(R));

utils/lit/lit/builtin_commands/__init__.py

Whitespace-only changes.

0 commit comments

Comments
 (0)