Add TargetLoweringInfo hook for explicitly setting the ABI calling convention endianness

author Dylan McKay <me@dylanmckay.io>

Tue, 21 May 2019 06:38:02 +0000 (06:38 +0000)

committer Dylan McKay <me@dylanmckay.io>

Tue, 21 May 2019 06:38:02 +0000 (06:38 +0000)
author Dylan McKay <me@dylanmckay.io>
Tue, 21 May 2019 06:38:02 +0000 (06:38 +0000)
committer Dylan McKay <me@dylanmckay.io>
Tue, 21 May 2019 06:38:02 +0000 (06:38 +0000)
diff --git a/include/llvm/CodeGen/TargetLowering.h b/include/llvm/CodeGen/TargetLowering.h

index 51542533bec4dd028e2d6860049759b3a98c39d7..b65612cb25b497de5dc0a374913f9fe513f8c0c1 100644 (file)
--- a/include/llvm/CodeGen/TargetLowering.h
+++ b/include/llvm/CodeGen/TargetLowering.h
@@ -3538,6 +3538,15 @@ public:
      return false;
    }
  
+  /// Returns true if the halves of a function argument that was split into
+  /// smaller types should be ordered as on a little-endian target.
+  /// Defaults to the endianness of \p DL; targets whose calling convention
+  /// orders the halves differently from the data layout can override this.
+  virtual bool
+  shouldSplitFunctionArgumentsAsLittleEndian(const DataLayout &DL) const {
+    return DL.isLittleEndian();
+  }
+
    /// Returns a 0 terminated array of registers that can be safely used as
    /// scratch registers.
    virtual const MCPhysReg *getScratchRegisters(CallingConv::ID CC) const {
diff --git a/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/lib/CodeGen/SelectionDAG/TargetLowering.cpp

index ab6b7a7398e5a53ada09c056f559e952700b62e5..f07180a2faaa60e26127813f21fa9425cde216a5 100644 (file)
--- a/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -5920,7 +5920,7 @@ bool TargetLowering::expandMULO(SDNode *Node, SDValue &Result,
      // being a legal type for the architecture and thus has to be split to
      // two arguments.
      SDValue Ret;
-    if (DAG.getDataLayout().isLittleEndian()) {
+    if (shouldSplitFunctionArgumentsAsLittleEndian(DAG.getDataLayout())) {
        // Halves of WideVT are packed into registers in different order
        // depending on platform endianness. This is usually handled by
        // the C calling convention, but we can't defer to it in
diff --git a/lib/Target/AVR/AVRISelLowering.h b/lib/Target/AVR/AVRISelLowering.h

index 7e4496324a1dfb42e57cbe668a9bd9832fdc7fd9..ed2d0835903c4c5b727275e730e68ad2e25ab763 100644 (file)
--- a/lib/Target/AVR/AVRISelLowering.h
+++ b/lib/Target/AVR/AVRISelLowering.h
@@ -128,6 +128,11 @@ public:
    unsigned getRegisterByName(const char* RegName, EVT VT,
                               SelectionDAG &DAG) const override;
  
+  bool shouldSplitFunctionArgumentsAsLittleEndian(const DataLayout &DL)
+    const override {
+    return false; // Unconditional: the endianness of DL is not consulted.
+  }
+
  private:
    SDValue getAVRCmp(SDValue LHS, SDValue RHS, ISD::CondCode CC, SDValue &AVRcc,
                      SelectionDAG &DAG, SDLoc dl) const;
diff --git a/test/CodeGen/AVR/umul.with.overflow.i16-bug.ll b/test/CodeGen/AVR/umul.with.overflow.i16-bug.ll

new file mode 100644 (file)

index 0000000..4ea8f32
--- /dev/null
+++ b/test/CodeGen/AVR/umul.with.overflow.i16-bug.ll
@@ -0,0 +1,49 @@
+; RUN: llc -O1 < %s -march=avr | FileCheck %s
+
+target datalayout = "e-m:o-i64:64-f80:128-n8:16:32:64-S128"
+target triple = "x86_64-apple-macosx10.9"
+
+%Vs6UInt16 = type <{ i16 }>
+%Sb = type <{ i1 }>
+
+define hidden void @setServoAngle(i16) {
+  ; CHECK-LABEL: entry
+entry:
+  %adjustedAngle = alloca %Vs6UInt16, align 2
+  %1 = bitcast %Vs6UInt16* %adjustedAngle to i8*
+  %adjustedAngle._value = getelementptr inbounds %Vs6UInt16, %Vs6UInt16* %adjustedAngle, i32 0, i32 0
+  store i16 %0, i16* %adjustedAngle._value, align 2
+
+;print(unsignedInt: adjustedAngle &* UInt16(11))
+; breaks here
+  %adjustedAngle._value2 = getelementptr inbounds %Vs6UInt16, %Vs6UInt16* %adjustedAngle, i32 0, i32 0
+  %2 = load i16, i16* %adjustedAngle._value2, align 2
+
+; CHECK: mov r22, r24
+; CHECK: mov r23, r25
+
+; CHECK-DAG: ldi r20, 0
+; CHECK-DAG: ldi r21, 0
+; CHECK-DAG: ldi r18, 11
+; CHECK-DAG: ldi r19, 0
+
+; CHECK: mov r24, r20
+; CHECK: mov r25, r21
+; CHECK: call  __mulsi3
+  %3 = call { i16, i1 } @llvm.umul.with.overflow.i16(i16 %2, i16 11)
+  %4 = extractvalue { i16, i1 } %3, 0
+  %5 = extractvalue { i16, i1 } %3, 1
+
+  ; above code looks fine, how is it lowered?
+  %6 = call i1 @printDefaultParam()
+  call void @print(i16 %4, i1 %6)
+
+; CHECK: ret
+  ret void
+}
+
+declare void @print(i16, i1)
+declare i1 @printDefaultParam()
+
+; Function Attrs: nounwind readnone speculatable
+declare { i16, i1 } @llvm.umul.with.overflow.i16(i16, i16)
author	Dylan McKay <me@dylanmckay.io>
	Tue, 21 May 2019 06:38:02 +0000 (06:38 +0000)
committer	Dylan McKay <me@dylanmckay.io>
	Tue, 21 May 2019 06:38:02 +0000 (06:38 +0000)
include/llvm/CodeGen/TargetLowering.h		patch \| blob \| history
lib/CodeGen/SelectionDAG/TargetLowering.cpp		patch \| blob \| history
lib/Target/AVR/AVRISelLowering.h		patch \| blob \| history
test/CodeGen/AVR/umul.with.overflow.i16-bug.ll	[new file with mode: 0644]	patch \| blob