AMDGPU: Refactor SIMachineFunctionInfo slightly

author Matt Arsenault <Matthew.Arsenault@amd.com>

Tue, 11 Apr 2017 22:29:28 +0000 (22:29 +0000)

committer Matt Arsenault <Matthew.Arsenault@amd.com>

Tue, 11 Apr 2017 22:29:28 +0000 (22:29 +0000)
author Matt Arsenault <Matthew.Arsenault@amd.com>
Tue, 11 Apr 2017 22:29:28 +0000 (22:29 +0000)
committer Matt Arsenault <Matthew.Arsenault@amd.com>
Tue, 11 Apr 2017 22:29:28 +0000 (22:29 +0000)
diff --git a/lib/Target/AMDGPU/SIISelLowering.cpp b/lib/Target/AMDGPU/SIISelLowering.cpp

index 4696f645cf842b2e43197752fe34adc0315fbd3d..eda825d8c6eee356eda7caf88a6e24b1362c037e 100644 (file)
--- a/lib/Target/AMDGPU/SIISelLowering.cpp
+++ b/lib/Target/AMDGPU/SIISelLowering.cpp
@@ -1171,7 +1171,7 @@ SDValue SITargetLowering::LowerFormalArguments(
                   *DAG.getContext());
  
    bool IsShader = AMDGPU::isShader(CallConv);
-  bool IsKernel = !IsShader;
+  bool IsKernel = AMDGPU::isKernel(CallConv);
    bool IsEntryFunc = AMDGPU::isEntryFunctionCC(CallConv);
  
    if (IsShader) {
diff --git a/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp b/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp

index debb42fc0fcfc4f58bbabe95189516e3d5202c97..8e612d2ddfdae85f40b3d73712b79465609a38b7 100644 (file)
--- a/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp
+++ b/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp
@@ -75,34 +75,48 @@ SIMachineFunctionInfo::SIMachineFunctionInfo(const MachineFunction &MF)
      PrivateMemoryInputPtr(false) {
    const SISubtarget &ST = MF.getSubtarget<SISubtarget>();
    const Function *F = MF.getFunction();
+  FlatWorkGroupSizes = ST.getFlatWorkGroupSizes(*F);
+  WavesPerEU = ST.getWavesPerEU(*F);
  
-  PSInputAddr = AMDGPU::getInitialPSInputAddr(*F);
+  // Non-entry functions have no special inputs for now.
+  // TODO: Return early for non-entry CCs.
  
-  const MachineFrameInfo &FrameInfo = MF.getFrameInfo();
+  CallingConv::ID CC = F->getCallingConv();
+  if (CC == CallingConv::AMDGPU_PS)
+    PSInputAddr = AMDGPU::getInitialPSInputAddr(*F);
  
-  if (!AMDGPU::isShader(F->getCallingConv())) {
+  if (AMDGPU::isKernel(CC)) {
      KernargSegmentPtr = true;
      WorkGroupIDX = true;
      WorkItemIDX = true;
    }
  
-  if (F->hasFnAttribute("amdgpu-work-group-id-y") || ST.debuggerEmitPrologue())
+  if (ST.debuggerEmitPrologue()) {
+    // Enable everything.
      WorkGroupIDY = true;
-
-  if (F->hasFnAttribute("amdgpu-work-group-id-z") || ST.debuggerEmitPrologue())
      WorkGroupIDZ = true;
-
-  if (F->hasFnAttribute("amdgpu-work-item-id-y") || ST.debuggerEmitPrologue())
      WorkItemIDY = true;
-
-  if (F->hasFnAttribute("amdgpu-work-item-id-z") || ST.debuggerEmitPrologue())
      WorkItemIDZ = true;
+  } else {
+    if (F->hasFnAttribute("amdgpu-work-group-id-y"))
+      WorkGroupIDY = true;
+
+    if (F->hasFnAttribute("amdgpu-work-group-id-z"))
+      WorkGroupIDZ = true;
+
+    if (F->hasFnAttribute("amdgpu-work-item-id-y"))
+      WorkItemIDY = true;
+
+    if (F->hasFnAttribute("amdgpu-work-item-id-z"))
+      WorkItemIDZ = true;
+  }
  
    // X, XY, and XYZ are the only supported combinations, so make sure Y is
    // enabled if Z is.
    if (WorkItemIDZ)
      WorkItemIDY = true;
  
+  const MachineFrameInfo &FrameInfo = MF.getFrameInfo();
    bool MaySpill = ST.isVGPRSpillingEnabled(*F);
    bool HasStackObjects = FrameInfo.hasStackObjects();
  
@@ -129,12 +143,8 @@ SIMachineFunctionInfo::SIMachineFunctionInfo(const MachineFunction &MF)
    // We don't need to worry about accessing spills with flat instructions.
    // TODO: On VI where we must use flat for global, we should be able to omit
    // this if it is never used for generic access.
-  if (HasStackObjects && ST.getGeneration() >= SISubtarget::SEA_ISLANDS &&
-      ST.isAmdHsaOS())
+  if (HasStackObjects && ST.hasFlatAddressSpace() && ST.isAmdHsaOS())
      FlatScratchInit = true;
-
-  FlatWorkGroupSizes = ST.getFlatWorkGroupSizes(*F);
-  WavesPerEU = ST.getWavesPerEU(*F);
  }
  
  unsigned SIMachineFunctionInfo::addPrivateSegmentBuffer(
diff --git a/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h b/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h

index 4a43ecda1778593b50cb785149340f64100b0c77..d6c836eb748b1521c9edfd24031d76b1c74111e9 100644 (file)
--- a/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h
+++ b/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h
@@ -258,6 +258,18 @@ bool isCompute(CallingConv::ID CC);
  LLVM_READNONE
  bool isEntryFunctionCC(CallingConv::ID CC);
  
+// FIXME: Remove this when calling conventions cleaned up
+LLVM_READNONE
+inline bool isKernel(CallingConv::ID CC) {
+  switch (CC) {
+  case CallingConv::C:
+  case CallingConv::AMDGPU_KERNEL:
+  case CallingConv::SPIR_KERNEL:
+    return true;
+  default:
+    return false;
+  }
+}
  
  bool isSI(const MCSubtargetInfo &STI);
  bool isCI(const MCSubtargetInfo &STI);
diff --git a/test/CodeGen/AMDGPU/calling-conventions.ll b/test/CodeGen/AMDGPU/calling-conventions.ll

index 55c2b503430cc55913b954e2af6a48445a6ee1bb..677147b6f4e53f450733c85e52654181e672c3e9 100644 (file)
--- a/test/CodeGen/AMDGPU/calling-conventions.ll
+++ b/test/CodeGen/AMDGPU/calling-conventions.ll
@@ -12,13 +12,13 @@ entry:
  }
  
  ; FIXME: This is treated like a kernel
-; GCN-LABEL: {{^}}func:
-; GCN: s_endpgm
-define spir_func void @func(i32 addrspace(1)* %out) {
-entry:
-  store i32 0, i32 addrspace(1)* %out
-  ret void
-}
+; XGCN-LABEL: {{^}}func:
+; XGCN: s_endpgm
+; define spir_func void @func(i32 addrspace(1)* %out) {
+; entry:
+;   store i32 0, i32 addrspace(1)* %out
+;   ret void
+; }
  
  ; GCN-LABEL: {{^}}ps_ret_cc_f16:
  ; SI: v_cvt_f16_f32_e32 v0, v0
author	Matt Arsenault <Matthew.Arsenault@amd.com>
	Tue, 11 Apr 2017 22:29:28 +0000 (22:29 +0000)
committer	Matt Arsenault <Matthew.Arsenault@amd.com>
	Tue, 11 Apr 2017 22:29:28 +0000 (22:29 +0000)
lib/Target/AMDGPU/SIISelLowering.cpp		patch \| blob \| history
lib/Target/AMDGPU/SIMachineFunctionInfo.cpp		patch \| blob \| history
lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h		patch \| blob \| history
test/CodeGen/AMDGPU/calling-conventions.ll		patch \| blob \| history