AMD family 17h (znver1) enablement

author Craig Topper <craig.topper@gmail.com>

Tue, 10 Jan 2017 06:01:16 +0000 (06:01 +0000)

committer Craig Topper <craig.topper@gmail.com>

Tue, 10 Jan 2017 06:01:16 +0000 (06:01 +0000)
author Craig Topper <craig.topper@gmail.com>
Tue, 10 Jan 2017 06:01:16 +0000 (06:01 +0000)
committer Craig Topper <craig.topper@gmail.com>
Tue, 10 Jan 2017 06:01:16 +0000 (06:01 +0000)
diff --git a/lib/Support/Host.cpp b/lib/Support/Host.cpp

index 8a09589aa884ae3aacf9fe99eb5d259e0298a4a4..d1b40412a6fc64e73559b509698e48c0e965d671 100644 (file)
--- a/lib/Support/Host.cpp
+++ b/lib/Support/Host.cpp
@@ -111,6 +111,7 @@ enum ProcessorTypes {
    AMDATHLON,
    AMDFAM14H,
    AMDFAM16H,
+  AMDFAM17H,
    CPU_TYPE_MAX
  };
  
@@ -149,6 +150,7 @@ enum ProcessorSubtypes {
    AMD_BTVER2,
    AMDFAM15H_BDVER3,
    AMDFAM15H_BDVER4,
+  AMDFAM17H_ZNVER1,
    CPU_SUBTYPE_MAX
  };
  
@@ -742,6 +744,14 @@ static void getAMDProcessorTypeAndSubtype(unsigned int Family,
      }
      *Subtype = AMD_BTVER2;
      break; // "btver2"
+  case 23:
+    *Type = AMDFAM17H;
+    if (Features & (1 << FEATURE_ADX)) {
+      *Subtype = AMDFAM17H_ZNVER1;
+      break; // "znver1"
+    }
+    *Subtype =  AMD_BTVER1;
+    break;
    default:
      break; // "generic"
    }
@@ -950,6 +960,15 @@ StringRef sys::getHostCPUName() {
        default:
          return "amdfam16";
        }
+    case AMDFAM17H:
+      switch (Subtype) {
+      case AMD_BTVER1:
+        return "btver1";
+      case AMDFAM17H_ZNVER1:
+        return "znver1";
+      default:
+        return "amdfam17";
+      }
      default:
        return "generic";
      }
diff --git a/lib/Target/X86/X86.td b/lib/Target/X86/X86.td

index dc18a59a30bac04ed3afe80ac339c2f7bdbd94ed..f95022077d356d605f6b5fad0c14868a4271cd27 100644 (file)
--- a/lib/Target/X86/X86.td
+++ b/lib/Target/X86/X86.td
@@ -760,6 +760,42 @@ def : Proc<"bdver4", [
    FeatureMWAITX
  ]>;
  
+// TODO: The scheduler model falls back to the BTVER2 model for now.
+// A dedicated znver1 scheduler model still has to be put in place.
+// Zen
+def: ProcessorModel<"znver1", BtVer2Model, [
+  FeatureADX,
+  FeatureAES,
+  FeatureAVX2,
+  FeatureBMI,
+  FeatureBMI2,
+  FeatureCLFLUSHOPT,
+  FeatureCMPXCHG16B,
+  FeatureF16C,
+  FeatureFMA,
+  FeatureFSGSBase,
+  FeatureFXSR,
+  FeatureFastLZCNT,
+  FeatureLAHFSAHF,
+  FeatureLZCNT,
+  FeatureMMX,
+  FeatureMOVBE,
+  FeatureMWAITX,
+  FeaturePCLMUL,
+  FeaturePOPCNT,
+  FeaturePRFCHW,
+  FeatureRDRAND,
+  FeatureRDSEED,
+  FeatureSHA,
+  FeatureSMAP,
+  FeatureSSE4A,
+  FeatureSlowSHLD,
+  FeatureX87,
+  FeatureXSAVE,
+  FeatureXSAVEC,
+  FeatureXSAVEOPT,
+  FeatureXSAVES]>;
+
  def : Proc<"geode",           [FeatureX87, FeatureSlowUAMem16, Feature3DNowA]>;
  
  def : Proc<"winchip-c6",      [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;
diff --git a/test/CodeGen/X86/cpus.ll b/test/CodeGen/X86/cpus.ll

index ee1f7bb5295bea9112d0e07e179adc073dcabf11..20ce932a184b5fe7a765a9eefc47ee88e62d3161 100644 (file)
--- a/test/CodeGen/X86/cpus.ll
+++ b/test/CodeGen/X86/cpus.ll
@@ -33,3 +33,4 @@
  ; RUN: llc < %s -o /dev/null -mtriple=x86_64-unknown-unknown -mcpu=bdver4 2>&1 | FileCheck %s --check-prefix=CHECK-NO-ERROR --allow-empty
  ; RUN: llc < %s -o /dev/null -mtriple=x86_64-unknown-unknown -mcpu=btver1 2>&1 | FileCheck %s --check-prefix=CHECK-NO-ERROR --allow-empty
  ; RUN: llc < %s -o /dev/null -mtriple=x86_64-unknown-unknown -mcpu=btver2 2>&1 | FileCheck %s --check-prefix=CHECK-NO-ERROR --allow-empty
+; RUN: llc < %s -o /dev/null -mtriple=x86_64-unknown-unknown -mcpu=znver1 2>&1 | FileCheck %s --check-prefix=CHECK-NO-ERROR --allow-empty
diff --git a/test/CodeGen/X86/lzcnt-zext-cmp.ll b/test/CodeGen/X86/lzcnt-zext-cmp.ll

index 6f4cb84a2b9cbb75fc5c9949e2b3fe8382e09604..c69dbf573f46d9f4e72f6e8dfcc3ec7f733bd2ce 100644 (file)
--- a/test/CodeGen/X86/lzcnt-zext-cmp.ll
+++ b/test/CodeGen/X86/lzcnt-zext-cmp.ll
@@ -3,6 +3,8 @@
  ; Eg: zext(or(setcc(cmp), setcc(cmp))) -> shr(or(lzcnt, lzcnt))
  ; RUN: llc < %s -mtriple=x86_64-pc-linux -mcpu=btver2 | FileCheck %s
  ; RUN: llc < %s -mtriple=x86_64-pc-linux -mcpu=btver2 -mattr=-fast-lzcnt | FileCheck --check-prefix=NOFASTLZCNT %s
+; RUN: llc < %s -mtriple=x86_64-pc-linux -mcpu=znver1 | FileCheck %s
+; RUN: llc < %s -mtriple=x86_64-pc-linux -mcpu=znver1 -mattr=-fast-lzcnt | FileCheck --check-prefix=NOFASTLZCNT %s
  
  ; Test one 32-bit input, output is 32-bit, no transformations expected.
  define i32 @test_zext_cmp0(i32 %a) {
diff --git a/test/CodeGen/X86/slow-unaligned-mem.ll b/test/CodeGen/X86/slow-unaligned-mem.ll

index 41e9a95bcdd8eb7ad6e4f0f78c54bc9ce4d0d8e3..8251eb324a77287b6123177ecaef5873b3f9f95a 100644 (file)
--- a/test/CodeGen/X86/slow-unaligned-mem.ll
+++ b/test/CodeGen/X86/slow-unaligned-mem.ll
@@ -46,6 +46,7 @@
  ; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=bdver2        2>&1 | FileCheck %s --check-prefix=FAST
  ; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=bdver3        2>&1 | FileCheck %s --check-prefix=FAST
  ; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=bdver4        2>&1 | FileCheck %s --check-prefix=FAST
+; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=znver1        2>&1 | FileCheck %s --check-prefix=FAST
  
  ; Other chips with slow unaligned memory accesses
  
diff --git a/test/CodeGen/X86/x86-64-double-shifts-var.ll b/test/CodeGen/X86/x86-64-double-shifts-var.ll

index 8d2dbbdb5d245b5c7c9d5312b7ffc208e157da4f..c025ee874b2d5e7ab31e59c389b422c53512efb1 100644 (file)
--- a/test/CodeGen/X86/x86-64-double-shifts-var.ll
+++ b/test/CodeGen/X86/x86-64-double-shifts-var.ll
@@ -17,6 +17,7 @@
  ; RUN: llc < %s -march=x86-64 -mcpu=bdver2 | FileCheck %s
  ; RUN: llc < %s -march=x86-64 -mcpu=bdver3 | FileCheck %s
  ; RUN: llc < %s -march=x86-64 -mcpu=bdver4 | FileCheck %s
+; RUN: llc < %s -march=x86-64 -mcpu=znver1 | FileCheck %s
  
  ; Verify that for the X86_64 processors that are known to have poor latency 
  ; double precision shift instructions we do not generate 'shld' or 'shrd'
author	Craig Topper <craig.topper@gmail.com>
	Tue, 10 Jan 2017 06:01:16 +0000 (06:01 +0000)
committer	Craig Topper <craig.topper@gmail.com>
	Tue, 10 Jan 2017 06:01:16 +0000 (06:01 +0000)
lib/Support/Host.cpp		patch \| blob \| history
lib/Target/X86/X86.td		patch \| blob \| history
test/CodeGen/X86/cpus.ll		patch \| blob \| history
test/CodeGen/X86/lzcnt-zext-cmp.ll		patch \| blob \| history
test/CodeGen/X86/slow-unaligned-mem.ll		patch \| blob \| history
test/CodeGen/X86/x86-64-double-shifts-var.ll		patch \| blob \| history