# have different configs, so they should not be placed in the same cluster by
# stabilization.
-# CHECK-UNSTABLE: SQRTSSr
-# CHECK-UNSTABLE: SQRTSSr
+# CHECK-UNSTABLE-NOT: SQRTSSr
---
mode: latency
#ifndef LLVM_TOOLS_LLVM_EXEGESIS_BENCHMARKCODE_H
#define LLVM_TOOLS_LLVM_EXEGESIS_BENCHMARKCODE_H
-#include "RegisterValue.h"
+#include "BenchmarkResult.h"
#include "llvm/MC/MCInst.h"
#include <string>
#include <vector>
// A collection of instructions that are to be assembled, executed and measured.
struct BenchmarkCode {
- // The sequence of instructions that are to be repeated.
- std::vector<llvm::MCInst> Instructions;
-
- // Before the code is executed some instructions are added to setup the
- // registers initial values.
- std::vector<RegisterValue> RegisterInitialValues;
+ InstructionBenchmarkKey Key;
// We also need to provide the registers that are live on entry for the
// assembler to generate proper prologue/epilogue.
#ifndef LLVM_TOOLS_LLVM_EXEGESIS_BENCHMARKRESULT_H
#define LLVM_TOOLS_LLVM_EXEGESIS_BENCHMARKRESULT_H
-#include "BenchmarkCode.h"
#include "LlvmState.h"
+#include "RegisterValue.h"
#include "llvm/ADT/StringMap.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/MC/MCInst.h"
BenchmarkRunner::~BenchmarkRunner() = default;
-
namespace {
class FunctionExecutorImpl : public BenchmarkRunner::FunctionExecutor {
public:
InstrBenchmark.NumRepetitions = NumRepetitions;
InstrBenchmark.Info = BC.Info;
- const std::vector<llvm::MCInst> &Instructions = BC.Instructions;
+ const std::vector<llvm::MCInst> &Instructions = BC.Key.Instructions;
- InstrBenchmark.Key.Instructions = Instructions;
- InstrBenchmark.Key.RegisterInitialValues = BC.RegisterInitialValues;
+ InstrBenchmark.Key = BC.Key;
// Assemble at least kMinInstructionsForSnippet instructions by repeating the
// snippet for debug/analysis. This is so that the user clearly understands
{
llvm::SmallString<0> Buffer;
llvm::raw_svector_ostream OS(Buffer);
- assembleToStream(
- State.getExegesisTarget(), State.createTargetMachine(), BC.LiveIns,
- BC.RegisterInitialValues,
- Repetitor.Repeat(BC.Instructions, kMinInstructionsForSnippet), OS);
+ assembleToStream(State.getExegesisTarget(), State.createTargetMachine(),
+ BC.LiveIns, BC.Key.RegisterInitialValues,
+ Repetitor.Repeat(Instructions, kMinInstructionsForSnippet),
+ OS);
const ExecutableFunction EF(State.createTargetMachine(),
getObjectFromBuffer(OS.str()));
const auto FnBytes = EF.getFunctionBytes();
// Assemble NumRepetitions instructions repetitions of the snippet for
// measurements.
const auto Filler =
- Repetitor.Repeat(BC.Instructions, InstrBenchmark.NumRepetitions);
+ Repetitor.Repeat(Instructions, InstrBenchmark.NumRepetitions);
llvm::object::OwningBinary<llvm::object::ObjectFile> ObjectFile;
if (DumpObjectToDisk) {
llvm::SmallString<0> Buffer;
llvm::raw_svector_ostream OS(Buffer);
assembleToStream(State.getExegesisTarget(), State.createTargetMachine(),
- BC.LiveIns, BC.RegisterInitialValues, Filler, OS);
+ BC.LiveIns, BC.Key.RegisterInitialValues, Filler, OS);
ObjectFile = getObjectFromBuffer(OS.str());
}
// Scale the measurements by instruction.
BM.PerInstructionValue /= InstrBenchmark.NumRepetitions;
// Scale the measurements by snippet.
- BM.PerSnippetValue *= static_cast<double>(BC.Instructions.size()) /
+ BM.PerSnippetValue *= static_cast<double>(Instructions.size()) /
InstrBenchmark.NumRepetitions;
}
return std::move(E);
llvm::raw_fd_ostream OFS(ResultFD, true /*ShouldClose*/);
assembleToStream(State.getExegesisTarget(), State.createTargetMachine(),
- BC.LiveIns, BC.RegisterInitialValues, FillFunction, OFS);
+ BC.LiveIns, BC.Key.RegisterInitialValues, FillFunction, OFS);
return ResultPath.str();
}
// We shall find every opcode with benchmarks not in just one cluster, and move
// *all* the benchmarks of said Opcode into one new unstable cluster per Opcode.
void InstructionBenchmarkClustering::stabilize(unsigned NumOpcodes) {
- // Given an instruction Opcode, in which clusters do benchmarks of this
- // instruction lie? Normally, they all should be in the same cluster.
- std::vector<llvm::SmallSet<ClusterId, 1>> OpcodeToClusterIDs;
- OpcodeToClusterIDs.resize(NumOpcodes);
- // The list of opcodes that have more than one cluster.
- llvm::SetVector<size_t> UnstableOpcodes;
- // Populate OpcodeToClusterIDs and UnstableOpcodes data structures.
+ // Given an instruction Opcode and Config, in which clusters do benchmarks of
+ // this instruction lie? Normally, they all should be in the same cluster.
+ struct OpcodeAndConfig {
+ explicit OpcodeAndConfig(const InstructionBenchmark &IB)
+ : Opcode(IB.keyInstruction().getOpcode()), Config(&IB.Key.Config) {}
+ unsigned Opcode;
+ const std::string *Config;
+
+ auto Tie() const -> auto { return std::tie(Opcode, *Config); }
+
+ bool operator<(const OpcodeAndConfig &O) const { return Tie() < O.Tie(); }
+ bool operator!=(const OpcodeAndConfig &O) const { return Tie() != O.Tie(); }
+ };
+ std::map<OpcodeAndConfig, llvm::SmallSet<ClusterId, 1>>
+ OpcodeConfigToClusterIDs;
+  // Populate the OpcodeConfigToClusterIDs data structure.
assert(ClusterIdForPoint_.size() == Points_.size() && "size mismatch");
for (const auto &Point : zip(Points_, ClusterIdForPoint_)) {
const ClusterId &ClusterIdOfPoint = std::get<1>(Point);
if (!ClusterIdOfPoint.isValid())
continue; // Only process fully valid clusters.
- const unsigned Opcode = std::get<0>(Point).keyInstruction().getOpcode();
- assert(Opcode < NumOpcodes && "NumOpcodes is incorrect (too small)");
+ const OpcodeAndConfig Key(std::get<0>(Point));
llvm::SmallSet<ClusterId, 1> &ClusterIDsOfOpcode =
- OpcodeToClusterIDs[Opcode];
+ OpcodeConfigToClusterIDs[Key];
ClusterIDsOfOpcode.insert(ClusterIdOfPoint);
- // Is there more than one ClusterID for this opcode?.
- if (ClusterIDsOfOpcode.size() < 2)
- continue; // If not, then at this moment this Opcode is stable.
- // Else let's record this unstable opcode for future use.
- UnstableOpcodes.insert(Opcode);
}
- assert(OpcodeToClusterIDs.size() == NumOpcodes && "sanity check");
- // We know with how many [new] clusters we will end up with.
- const auto NewTotalClusterCount = Clusters_.size() + UnstableOpcodes.size();
- Clusters_.reserve(NewTotalClusterCount);
- for (const size_t UnstableOpcode : UnstableOpcodes.getArrayRef()) {
+ for (const auto &OpcodeConfigToClusterID : OpcodeConfigToClusterIDs) {
const llvm::SmallSet<ClusterId, 1> &ClusterIDs =
- OpcodeToClusterIDs[UnstableOpcode];
- assert(ClusterIDs.size() > 1 &&
- "Should only have Opcodes with more than one cluster.");
+ OpcodeConfigToClusterID.second;
+ const OpcodeAndConfig &Key = OpcodeConfigToClusterID.first;
+ // We only care about unstable instructions.
+ if (ClusterIDs.size() < 2)
+ continue;
// Create a new unstable cluster, one per Opcode.
Clusters_.emplace_back(ClusterId::makeValidUnstable(Clusters_.size()));
// and the rest of the points is for the UnstableOpcode.
const auto it = std::stable_partition(
OldCluster.PointIndices.begin(), OldCluster.PointIndices.end(),
- [this, UnstableOpcode](size_t P) {
- return Points_[P].keyInstruction().getOpcode() != UnstableOpcode;
+ [this, &Key](size_t P) {
+ return OpcodeAndConfig(Points_[P]) != Key;
});
assert(std::distance(it, OldCluster.PointIndices.end()) > 0 &&
"Should have found at least one bad point");
"New unstable cluster should end up with no less points than there "
"was clusters");
}
- assert(Clusters_.size() == NewTotalClusterCount && "sanity check");
}
llvm::Expected<InstructionBenchmarkClustering>
CodeTemplate &operator=(const CodeTemplate &) = delete;
ExecutionMode Execution = ExecutionMode::UNKNOWN;
+  // See InstructionBenchmarkKey::Config.
+ std::string Config;
// Some information about how this template has been created.
std::string Info;
// The list of the instructions for this template.
// instructions.
void EmitInstruction(const MCInst &Instruction,
const MCSubtargetInfo &STI) override {
- Result->Instructions.push_back(Instruction);
+ Result->Key.Instructions.push_back(Instruction);
}
// Implementation of the AsmCommentConsumer.
const StringRef HexValue = Parts[1].trim();
RegVal.Value = APInt(
/* each hex digit is 4 bits */ HexValue.size() * 4, HexValue, 16);
- Result->RegisterInitialValues.push_back(std::move(RegVal));
+ Result->Key.RegisterInitialValues.push_back(std::move(RegVal));
return;
}
if (CommentText.consume_front("LIVEIN")) {
BC.Info = CT.Info;
for (InstructionTemplate &IT : CT.Instructions) {
randomizeUnsetVariables(State.getExegesisTarget(), ForbiddenRegs, IT);
- BC.Instructions.push_back(IT.build());
+ BC.Key.Instructions.push_back(IT.build());
}
if (CT.ScratchSpacePointerInReg)
BC.LiveIns.push_back(CT.ScratchSpacePointerInReg);
- BC.RegisterInitialValues =
+ BC.Key.RegisterInitialValues =
computeRegisterInitialValues(CT.Instructions);
+ BC.Key.Config = CT.Config;
Output.push_back(std::move(BC));
}
}
EXPECT_FALSE((bool)Snippets.takeError());
ASSERT_THAT(*Snippets, SizeIs(1));
const auto &Snippet = (*Snippets)[0];
- ASSERT_THAT(Snippet.Instructions, ElementsAre(HasOpcode(X86::INC64r)));
- ASSERT_THAT(Snippet.RegisterInitialValues,
+ ASSERT_THAT(Snippet.Key.Instructions, ElementsAre(HasOpcode(X86::INC64r)));
+ ASSERT_THAT(Snippet.Key.RegisterInitialValues,
ElementsAre(RegisterInitialValueIs(X86::RAX, 15),
RegisterInitialValueIs(X86::SIL, 0)));
ASSERT_THAT(Snippet.LiveIns, ElementsAre(X86::RDI, X86::DL));