
Commit 8404aeb

[Support] On Windows, ensure hardware_concurrency() extends to all CPU sockets and all NUMA groups
The goal of this patch is to maximize CPU utilization on multi-socket or high core count systems, so that parallel computations such as LLD/ThinLTO can use all hardware threads in the system. Before this patch, on Windows, a maximum of 64 hardware threads could be used, in some cases dispatched on only one CPU socket.

== Background ==

Windows doesn't have a flat cpu_set_t like Linux. Instead, it projects hardware CPUs (or NUMA nodes) to applications through a concept of "processor groups". A "processor" is the smallest unit of execution on a CPU: a hyper-thread if SMT is active, a core otherwise. There's a limit of 32 processors on older 32-bit versions of Windows, later raised to 64 processors on 64-bit versions. The limit comes from the affinity mask, which historically has the size of a pointer (sizeof(void*)). Consequently, the concept of "processor groups" was introduced to deal with systems that have more than 64 hyper-threads.

By default, the Windows OS assigns only one "processor group" to each starting application, in a round-robin manner. If the application wants to use more processors, it needs to opt in programmatically, by assigning its threads to other "processor groups". This also means that affinity cannot cross "processor group" boundaries; one can only specify a "preferred" group on start-up, but the application is free to allocate more groups if it wants to.

This creates a peculiar situation where newer CPUs such as the AMD EPYC 7702P (64 cores, 128 hyper-threads) are projected by the OS as two (2) "processor groups", so by default an application can only use half of the cores. The situation will only get worse in the years to come, as dies with more cores appear on the market.

== The problem ==

The heavyweight_hardware_concurrency() API was introduced so that only *one hardware thread per core* was used. Once that API returns, the original intent is lost; only the number of threads is retained. Consider a Windows system with 2 CPU sockets, 18 cores each, each core having 2 hyper-threads, for a total of 72 hyper-threads. Both heavyweight_hardware_concurrency() and hardware_concurrency() currently return 36, because on Windows they are simply wrappers over std::thread::hardware_concurrency() -- which can only return processors from the current "processor group".

== The changes in this patch ==

To solve this, we capture (and retain) the initial intent until the point of use, through a new ThreadPoolStrategy class. The computation of the number of threads to use is deferred as late as possible, to the moment the std::threads are created (ThreadPool in the case of ThinLTO).

With hardware_concurrency(), setting ThreadCount to 0 now means using all available hardware CPU (SMT) threads. Providing a ThreadCount above the maximum number of threads has no effect; the maximum is used instead. heavyweight_hardware_concurrency() is similar, except that only one thread per hardware *core* is used.

When LLVM_ENABLE_THREADS is OFF, the threading APIs always return 1, to ensure any caller loops are exercised at least once.

Differential Revision: https://reviews.llvm.org/D71775
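As a rough sketch of how the new interface is meant to be used (based only on the calls visible in the diffs below; the function name and the lambda body are illustrative):

    #include "llvm/Support/ThreadPool.h"
    #include "llvm/Support/Threading.h"

    void runParallelWork() {
      // ThreadCount = 0 (the default) means "use all hardware SMT threads",
      // spanning every processor group on Windows; a non-zero value caps
      // the pool at min(ThreadCount, maximum).
      llvm::ThreadPool Pool(llvm::hardware_concurrency(/*ThreadCount=*/0));

      // One thread per physical core instead of per hyper-thread.
      unsigned HeavyJobs =
          llvm::heavyweight_hardware_concurrency().compute_thread_count();
      (void)HeavyJobs;

      for (unsigned I = 0; I < Pool.getThreadCount(); ++I)
        Pool.async([I] { /* per-worker job */ });
      Pool.wait();
    }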
Parent: d9049e8

37 files changed: +406 −143 lines

clang-tools-extra/clang-doc/tool/ClangDocMain.cpp

Lines changed: 1 addition & 2 deletions
@@ -268,8 +268,7 @@ int main(int argc, const char **argv) {
   Error = false;
   llvm::sys::Mutex IndexMutex;
   // ExecutorConcurrency is a flag exposed by AllTUsExecution.h
-  llvm::ThreadPool Pool(ExecutorConcurrency == 0 ? llvm::hardware_concurrency()
-                                                 : ExecutorConcurrency);
+  llvm::ThreadPool Pool(llvm::hardware_concurrency(ExecutorConcurrency));
   for (auto &Group : USRToBitcode) {
     Pool.async([&]() {
       std::vector<std::unique_ptr<doc::Info>> Infos;

clang-tools-extra/clangd/TUScheduler.cpp

Lines changed: 1 addition & 7 deletions
@@ -842,13 +842,7 @@ std::string renderTUAction(const TUAction &Action) {
 } // namespace

 unsigned getDefaultAsyncThreadsCount() {
-  unsigned HardwareConcurrency = llvm::heavyweight_hardware_concurrency();
-  // heavyweight_hardware_concurrency may fall back to hardware_concurrency.
-  // C++ standard says that hardware_concurrency() may return 0; fallback to 1
-  // worker thread in that case.
-  if (HardwareConcurrency == 0)
-    return 1;
-  return HardwareConcurrency;
+  return llvm::heavyweight_hardware_concurrency().compute_thread_count();
 }

 FileStatus TUStatus::render(PathRef File) const {
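The manual zero-check removed above is now handled inside the strategy: per the commit message, the threading APIs always report at least 1 thread, even when LLVM_ENABLE_THREADS is OFF. A minimal sketch of that guarantee (the helper name and the assertion are illustrative, not from the patch):

    #include <cassert>
    #include "llvm/Support/Threading.h"

    unsigned defaultWorkerCount() {
      unsigned Workers =
          llvm::heavyweight_hardware_concurrency().compute_thread_count();
      assert(Workers >= 1 && "a strategy never yields zero threads");
      return Workers;
    }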

clang-tools-extra/clangd/index/Background.cpp

Lines changed: 3 additions & 2 deletions
@@ -148,9 +148,10 @@ BackgroundIndex::BackgroundIndex(
       CDB.watch([&](const std::vector<std::string> &ChangedFiles) {
         enqueue(ChangedFiles);
       })) {
-  assert(ThreadPoolSize > 0 && "Thread pool size can't be zero.");
+  assert(Rebuilder.TUsBeforeFirstBuild > 0 &&
+         "Thread pool size can't be zero.");
   assert(this->IndexStorageFactory && "Storage factory can not be null!");
-  for (unsigned I = 0; I < ThreadPoolSize; ++I) {
+  for (unsigned I = 0; I < Rebuilder.TUsBeforeFirstBuild; ++I) {
     ThreadPool.runAsync("background-worker-" + llvm::Twine(I + 1), [this] {
       WithContext Ctx(this->BackgroundContext.clone());
       Queue.work([&] { Rebuilder.idle(); });

clang-tools-extra/clangd/index/Background.h

Lines changed: 1 addition & 1 deletion
@@ -135,7 +135,7 @@ class BackgroundIndex : public SwapIndex {
                   Context BackgroundContext, const FileSystemProvider &,
                   const GlobalCompilationDatabase &CDB,
                   BackgroundIndexStorage::Factory IndexStorageFactory,
-                  size_t ThreadPoolSize = llvm::heavyweight_hardware_concurrency(),
+                  size_t ThreadPoolSize = 0, // 0 = use all hardware threads
                   std::function<void(BackgroundQueue::Stats)> OnProgress = nullptr);
   ~BackgroundIndex(); // Blocks while the current task finishes.

clang-tools-extra/clangd/index/BackgroundRebuild.h

Lines changed: 3 additions & 1 deletion
@@ -49,7 +49,9 @@ class BackgroundIndexRebuilder {
 public:
   BackgroundIndexRebuilder(SwapIndex *Target, FileSymbols *Source,
                            unsigned Threads)
-      : TUsBeforeFirstBuild(Threads), Target(Target), Source(Source) {}
+      : TUsBeforeFirstBuild(llvm::heavyweight_hardware_concurrency(Threads)
+                                .compute_thread_count()),
+        Target(Target), Source(Source) {}

   // Called to indicate a TU has been indexed.
   // May rebuild, if enough TUs have been indexed.

clang/lib/Tooling/AllTUsExecution.cpp

Lines changed: 1 addition & 2 deletions
@@ -114,8 +114,7 @@ llvm::Error AllTUsToolExecutor::execute(
   auto &Action = Actions.front();

   {
-    llvm::ThreadPool Pool(ThreadCount == 0 ? llvm::hardware_concurrency()
-                                           : ThreadCount);
+    llvm::ThreadPool Pool(llvm::hardware_concurrency(ThreadCount));
     for (std::string File : Files) {
       Pool.async(
           [&](std::string Path) {

clang/lib/Tooling/DependencyScanning/DependencyScanningFilesystem.cpp

Lines changed: 2 additions & 1 deletion
@@ -106,7 +106,8 @@ DependencyScanningFilesystemSharedCache::
   // sharding gives a performance edge by reducing the lock contention.
   // FIXME: A better heuristic might also consider the OS to account for
   // the different cost of lock contention on different OSes.
-  NumShards = std::max(2u, llvm::hardware_concurrency() / 4);
+  NumShards =
+      std::max(2u, llvm::hardware_concurrency().compute_thread_count() / 4);
   CacheShards = std::make_unique<CacheShard[]>(NumShards);
 }

clang/tools/clang-scan-deps/ClangScanDeps.cpp

Lines changed: 4 additions & 10 deletions
@@ -485,15 +485,9 @@ int main(int argc, const char **argv) {

   DependencyScanningService Service(ScanMode, Format, ReuseFileManager,
                                     SkipExcludedPPRanges);
-#if LLVM_ENABLE_THREADS
-  unsigned NumWorkers =
-      NumThreads == 0 ? llvm::hardware_concurrency() : NumThreads;
-#else
-  unsigned NumWorkers = 1;
-#endif
-  llvm::ThreadPool Pool(NumWorkers);
+  llvm::ThreadPool Pool(llvm::hardware_concurrency(NumThreads));
   std::vector<std::unique_ptr<DependencyScanningTool>> WorkerTools;
-  for (unsigned I = 0; I < NumWorkers; ++I)
+  for (unsigned I = 0; I < Pool.getThreadCount(); ++I)
     WorkerTools.push_back(std::make_unique<DependencyScanningTool>(Service));

   std::vector<SingleCommandCompilationDatabase> Inputs;
@@ -508,9 +502,9 @@ int main(int argc, const char **argv) {

   if (Verbose) {
     llvm::outs() << "Running clang-scan-deps on " << Inputs.size()
-                 << " files using " << NumWorkers << " workers\n";
+                 << " files using " << Pool.getThreadCount() << " workers\n";
   }
-  for (unsigned I = 0; I < NumWorkers; ++I) {
+  for (unsigned I = 0; I < Pool.getThreadCount(); ++I) {
     Pool.async([I, &Lock, &Index, &Inputs, &HadErrors, &FD, &WorkerTools,
                 &DependencyOS, &Errs]() {
       llvm::StringSet<> AlreadySeenModules;
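With the #if LLVM_ENABLE_THREADS branch gone, the caller sizes its per-worker state from the pool itself. A hedged sketch of the pattern (WorkerState and run are hypothetical stand-ins for DependencyScanningTool and main):

    #include <vector>
    #include "llvm/Support/ThreadPool.h"
    #include "llvm/Support/Threading.h"

    struct WorkerState {}; // hypothetical per-worker data

    void run(unsigned NumThreads) {
      // When threading is disabled, the strategy reports 1 thread, so
      // the loop below still executes at least once.
      llvm::ThreadPool Pool(llvm::hardware_concurrency(NumThreads));
      std::vector<WorkerState> States(Pool.getThreadCount());
      for (unsigned I = 0; I < Pool.getThreadCount(); ++I)
        Pool.async([&States, I] { /* use States[I] */ });
      Pool.wait();
    }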

lld/ELF/SyntheticSections.cpp

Lines changed: 4 additions & 4 deletions
@@ -2747,8 +2747,8 @@ createSymbols(ArrayRef<std::vector<GdbIndexSection::NameAttrEntry>> nameAttrs,
   size_t numShards = 32;
   size_t concurrency = 1;
   if (threadsEnabled)
-    concurrency =
-        std::min<size_t>(PowerOf2Floor(hardware_concurrency()), numShards);
+    concurrency = std::min<size_t>(
+        hardware_concurrency().compute_thread_count(), numShards);

   // A sharded map to uniquify symbols by name.
   std::vector<DenseMap<CachedHashStringRef, size_t>> map(numShards);
@@ -3191,8 +3191,8 @@ void MergeNoTailSection::finalizeContents() {
   // operations in the following tight loop.
   size_t concurrency = 1;
   if (threadsEnabled)
-    concurrency =
-        std::min<size_t>(PowerOf2Floor(hardware_concurrency()), numShards);
+    concurrency = std::min<size_t>(
+        hardware_concurrency().compute_thread_count(), numShards);

   // Add section pieces to the builders.
   parallelForEachN(0, concurrency, [&](size_t threadId) {

llvm/include/llvm/LTO/LTO.h

Lines changed: 2 additions & 1 deletion
@@ -227,7 +227,8 @@ using ThinBackend = std::function<std::unique_ptr<ThinBackendProc>(
     AddStreamFn AddStream, NativeObjectCache Cache)>;

 /// This ThinBackend runs the individual backend jobs in-process.
-ThinBackend createInProcessThinBackend(unsigned ParallelismLevel);
+/// The default value means to use one job per hardware core (not hyper-thread).
+ThinBackend createInProcessThinBackend(unsigned ParallelismLevel = 0);

 /// This ThinBackend writes individual module indexes to files, instead of
 /// running the individual backend jobs. This backend is for distributed builds
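A brief usage sketch for the new default (only the declaration above is from the patch; the surrounding lines are illustrative):

    #include "llvm/LTO/LTO.h"

    // ParallelismLevel = 0, the new default: one backend job per hardware
    // core (not per hyper-thread), across all processor groups.
    llvm::lto::ThinBackend Backend = llvm::lto::createInProcessThinBackend();

    // An explicit cap still works as before, e.g. at most 8 jobs:
    llvm::lto::ThinBackend Capped = llvm::lto::createInProcessThinBackend(8);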
