llvm/openmp/runtime/test/tasking/hidden_helper_task/capacity_mix_threads.cpp

// RUN: %libomp-cxx-compile-and-run

#include <omp.h>

#include <algorithm>
#include <cassert>
#include <chrono>
#include <thread>
#include <vector>

// AIX runs out of resource in 32-bit if 4*omp_get_max_threads() is more
// than 64 threads with the default stack size.
#if defined(_AIX) && !__LP64__
#define MAX_THREADS 64
#endif

void dummy_root() {
  // omp_get_max_threads() will do middle initialization
  int nthreads = omp_get_max_threads();
  std::this_thread::sleep_for(std::chrono::milliseconds(1000));
}

int main(int argc, char *argv[]) {
  int N = std::min(std::max(std::max(32, 4 * omp_get_max_threads()),
                            4 * omp_get_num_procs()),
                   std::numeric_limits<int>::max());

#if defined(_AIX) && !__LP64__
  if (N > MAX_THREADS)
    N = MAX_THREADS;
#endif

  std::vector<int> data(N);

  // Create a new thread to initialize the OpenMP RTL. The new thread will not
  // be taken as the "initial thread".
  std::thread root(dummy_root);

#pragma omp parallel for num_threads(N)
  for (unsigned i = 0; i < N; ++i) {
    data[i] = i;
  }

#pragma omp parallel for num_threads(N + 1)
  for (unsigned i = 0; i < N; ++i) {
    data[i] += i;
  }

  for (unsigned i = 0; i < N; ++i) {
    assert(data[i] == 2 * i);
  }

  root.join();

  return 0;
}