One approach is to do this using nested parallelism:
/*
 * Runs the long loop inside an OpenMP parallel-for region.
 *
 * threads: size of the thread team requested for the loop via the
 *          num_threads clause.
 *
 * NOTE(review): the call sites visible in main() pass two arguments
 * (a data object and a thread count), but this signature accepts only the
 * thread count -- reconcile the two before using this outside a sketch.
 */
void do_long(int threads) {
/* Request a team of `threads` threads to share the loop iterations. */
#pragma omp parallel for num_threads(threads)
/* Loop header and body are elided in this snippet. */
for(...) {
}
}
/*
 * Processes two data sets concurrently using nested parallelism: an outer
 * team of two threads each calls do_long() on one data set, and each call
 * is given half of the overall thread budget for its own inner team.
 *
 * Returns 0.
 */
int main(void) {
    /*
     * Enable nested parallel regions (outer split + inner team).
     * omp_set_nested() is deprecated as of OpenMP 5.0, where nesting is
     * governed solely by the max-active-levels setting; older runtimes still
     * need the explicit nested switch, so keep it as the fallback.
     */
#if defined(_OPENMP) && _OPENMP >= 201811
    omp_set_max_active_levels(2);
#else
    omp_set_nested(1);
#endif

    int threads = 8;
    /* Round up so an odd total is not under-allocated when split in two. */
    int sub_threads = (threads + 1) / 2;

#pragma omp parallel num_threads(2)
    {
        int i = omp_get_thread_num();

        if (i == 0) {
            do_long(data1, sub_threads);
        }
        /*
         * Normally thread 1 handles the second data set. If the runtime did
         * not provide a team of exactly two threads, whichever thread is
         * running also processes it, so the work is never skipped.
         */
        if (i == 1 || omp_get_num_threads() != 2) {
            do_long(data2, sub_threads);
        }
    }
    return 0;
}
source
share