10b57cec5SDimitry Andric /* 20b57cec5SDimitry Andric * kmp_sched.cpp -- static scheduling -- iteration initialization 30b57cec5SDimitry Andric */ 40b57cec5SDimitry Andric 50b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 80b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 90b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 100b57cec5SDimitry Andric // 110b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 120b57cec5SDimitry Andric 130b57cec5SDimitry Andric /* Static scheduling initialization. 140b57cec5SDimitry Andric 150b57cec5SDimitry Andric NOTE: team->t.t_nproc is a constant inside of any dispatch loop, however 160b57cec5SDimitry Andric it may change values between parallel regions. __kmp_max_nth 170b57cec5SDimitry Andric is the largest value __kmp_nth may take, 1 is the smallest. 
*/ 180b57cec5SDimitry Andric 190b57cec5SDimitry Andric #include "kmp.h" 200b57cec5SDimitry Andric #include "kmp_error.h" 210b57cec5SDimitry Andric #include "kmp_i18n.h" 220b57cec5SDimitry Andric #include "kmp_itt.h" 230b57cec5SDimitry Andric #include "kmp_stats.h" 240b57cec5SDimitry Andric #include "kmp_str.h" 250b57cec5SDimitry Andric 260b57cec5SDimitry Andric #if OMPT_SUPPORT 270b57cec5SDimitry Andric #include "ompt-specific.h" 280b57cec5SDimitry Andric #endif 290b57cec5SDimitry Andric 300b57cec5SDimitry Andric #ifdef KMP_DEBUG 310b57cec5SDimitry Andric //------------------------------------------------------------------------- 320b57cec5SDimitry Andric // template for debug prints specification ( d, u, lld, llu ) 330b57cec5SDimitry Andric char const *traits_t<int>::spec = "d"; 340b57cec5SDimitry Andric char const *traits_t<unsigned int>::spec = "u"; 350b57cec5SDimitry Andric char const *traits_t<long long>::spec = "lld"; 360b57cec5SDimitry Andric char const *traits_t<unsigned long long>::spec = "llu"; 370b57cec5SDimitry Andric char const *traits_t<long>::spec = "ld"; 380b57cec5SDimitry Andric //------------------------------------------------------------------------- 390b57cec5SDimitry Andric #endif 400b57cec5SDimitry Andric 410b57cec5SDimitry Andric #if KMP_STATS_ENABLED 420b57cec5SDimitry Andric #define KMP_STATS_LOOP_END(stat) \ 430b57cec5SDimitry Andric { \ 440b57cec5SDimitry Andric kmp_int64 t; \ 450b57cec5SDimitry Andric kmp_int64 u = (kmp_int64)(*pupper); \ 460b57cec5SDimitry Andric kmp_int64 l = (kmp_int64)(*plower); \ 470b57cec5SDimitry Andric kmp_int64 i = (kmp_int64)incr; \ 480b57cec5SDimitry Andric if (i == 1) { \ 490b57cec5SDimitry Andric t = u - l + 1; \ 500b57cec5SDimitry Andric } else if (i == -1) { \ 510b57cec5SDimitry Andric t = l - u + 1; \ 520b57cec5SDimitry Andric } else if (i > 0) { \ 530b57cec5SDimitry Andric t = (u - l) / i + 1; \ 540b57cec5SDimitry Andric } else { \ 550b57cec5SDimitry Andric t = (l - u) / (-i) + 1; \ 560b57cec5SDimitry 
Andric } \ 570b57cec5SDimitry Andric KMP_COUNT_VALUE(stat, t); \ 580b57cec5SDimitry Andric KMP_POP_PARTITIONED_TIMER(); \ 590b57cec5SDimitry Andric } 600b57cec5SDimitry Andric #else 610b57cec5SDimitry Andric #define KMP_STATS_LOOP_END(stat) /* Nothing */ 620b57cec5SDimitry Andric #endif 630b57cec5SDimitry Andric 64e8d8bef9SDimitry Andric static ident_t loc_stub = {0, KMP_IDENT_KMPC, 0, 0, ";unknown;unknown;0;0;;"}; 65e8d8bef9SDimitry Andric static inline void check_loc(ident_t *&loc) { 66e8d8bef9SDimitry Andric if (loc == NULL) 67e8d8bef9SDimitry Andric loc = &loc_stub; // may need to report location info to ittnotify 68e8d8bef9SDimitry Andric } 69e8d8bef9SDimitry Andric 700b57cec5SDimitry Andric template <typename T> 710b57cec5SDimitry Andric static void __kmp_for_static_init(ident_t *loc, kmp_int32 global_tid, 720b57cec5SDimitry Andric kmp_int32 schedtype, kmp_int32 *plastiter, 730b57cec5SDimitry Andric T *plower, T *pupper, 740b57cec5SDimitry Andric typename traits_t<T>::signed_t *pstride, 750b57cec5SDimitry Andric typename traits_t<T>::signed_t incr, 760b57cec5SDimitry Andric typename traits_t<T>::signed_t chunk 770b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 780b57cec5SDimitry Andric , 790b57cec5SDimitry Andric void *codeptr 800b57cec5SDimitry Andric #endif 810b57cec5SDimitry Andric ) { 820b57cec5SDimitry Andric KMP_COUNT_BLOCK(OMP_LOOP_STATIC); 830b57cec5SDimitry Andric KMP_PUSH_PARTITIONED_TIMER(OMP_loop_static); 840b57cec5SDimitry Andric KMP_PUSH_PARTITIONED_TIMER(OMP_loop_static_scheduling); 850b57cec5SDimitry Andric 860b57cec5SDimitry Andric typedef typename traits_t<T>::unsigned_t UT; 870b57cec5SDimitry Andric typedef typename traits_t<T>::signed_t ST; 880b57cec5SDimitry Andric /* this all has to be changed back to TID and such.. 
*/ 890b57cec5SDimitry Andric kmp_int32 gtid = global_tid; 900b57cec5SDimitry Andric kmp_uint32 tid; 910b57cec5SDimitry Andric kmp_uint32 nth; 920b57cec5SDimitry Andric UT trip_count; 930b57cec5SDimitry Andric kmp_team_t *team; 94e8d8bef9SDimitry Andric __kmp_assert_valid_gtid(gtid); 950b57cec5SDimitry Andric kmp_info_t *th = __kmp_threads[gtid]; 960b57cec5SDimitry Andric 970b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 980b57cec5SDimitry Andric ompt_team_info_t *team_info = NULL; 990b57cec5SDimitry Andric ompt_task_info_t *task_info = NULL; 1000b57cec5SDimitry Andric ompt_work_t ompt_work_type = ompt_work_loop; 1010b57cec5SDimitry Andric 1020b57cec5SDimitry Andric static kmp_int8 warn = 0; 1030b57cec5SDimitry Andric 104*81ad6265SDimitry Andric if (ompt_enabled.ompt_callback_work || ompt_enabled.ompt_callback_dispatch) { 1050b57cec5SDimitry Andric // Only fully initialize variables needed by OMPT if OMPT is enabled. 1060b57cec5SDimitry Andric team_info = __ompt_get_teaminfo(0, NULL); 1070b57cec5SDimitry Andric task_info = __ompt_get_task_info_object(0); 1080b57cec5SDimitry Andric // Determine workshare type 1090b57cec5SDimitry Andric if (loc != NULL) { 1100b57cec5SDimitry Andric if ((loc->flags & KMP_IDENT_WORK_LOOP) != 0) { 1110b57cec5SDimitry Andric ompt_work_type = ompt_work_loop; 1120b57cec5SDimitry Andric } else if ((loc->flags & KMP_IDENT_WORK_SECTIONS) != 0) { 1130b57cec5SDimitry Andric ompt_work_type = ompt_work_sections; 1140b57cec5SDimitry Andric } else if ((loc->flags & KMP_IDENT_WORK_DISTRIBUTE) != 0) { 1150b57cec5SDimitry Andric ompt_work_type = ompt_work_distribute; 1160b57cec5SDimitry Andric } else { 1170b57cec5SDimitry Andric kmp_int8 bool_res = 1180b57cec5SDimitry Andric KMP_COMPARE_AND_STORE_ACQ8(&warn, (kmp_int8)0, (kmp_int8)1); 1190b57cec5SDimitry Andric if (bool_res) 1200b57cec5SDimitry Andric KMP_WARNING(OmptOutdatedWorkshare); 1210b57cec5SDimitry Andric } 1220b57cec5SDimitry Andric KMP_DEBUG_ASSERT(ompt_work_type); 
1230b57cec5SDimitry Andric } 1240b57cec5SDimitry Andric } 1250b57cec5SDimitry Andric #endif 1260b57cec5SDimitry Andric 1270b57cec5SDimitry Andric KMP_DEBUG_ASSERT(plastiter && plower && pupper && pstride); 1280b57cec5SDimitry Andric KE_TRACE(10, ("__kmpc_for_static_init called (%d)\n", global_tid)); 1290b57cec5SDimitry Andric #ifdef KMP_DEBUG 1300b57cec5SDimitry Andric { 1310b57cec5SDimitry Andric char *buff; 1320b57cec5SDimitry Andric // create format specifiers before the debug output 1330b57cec5SDimitry Andric buff = __kmp_str_format( 1340b57cec5SDimitry Andric "__kmpc_for_static_init: T#%%d sched=%%d liter=%%d iter=(%%%s," 1350b57cec5SDimitry Andric " %%%s, %%%s) incr=%%%s chunk=%%%s signed?<%s>\n", 1360b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, traits_t<ST>::spec, 1370b57cec5SDimitry Andric traits_t<ST>::spec, traits_t<ST>::spec, traits_t<T>::spec); 1380b57cec5SDimitry Andric KD_TRACE(100, (buff, global_tid, schedtype, *plastiter, *plower, *pupper, 1390b57cec5SDimitry Andric *pstride, incr, chunk)); 1400b57cec5SDimitry Andric __kmp_str_free(&buff); 1410b57cec5SDimitry Andric } 1420b57cec5SDimitry Andric #endif 1430b57cec5SDimitry Andric 1440b57cec5SDimitry Andric if (__kmp_env_consistency_check) { 1450b57cec5SDimitry Andric __kmp_push_workshare(global_tid, ct_pdo, loc); 1460b57cec5SDimitry Andric if (incr == 0) { 1470b57cec5SDimitry Andric __kmp_error_construct(kmp_i18n_msg_CnsLoopIncrZeroProhibited, ct_pdo, 1480b57cec5SDimitry Andric loc); 1490b57cec5SDimitry Andric } 1500b57cec5SDimitry Andric } 1510b57cec5SDimitry Andric /* special handling for zero-trip loops */ 1520b57cec5SDimitry Andric if (incr > 0 ? 
(*pupper < *plower) : (*plower < *pupper)) { 1530b57cec5SDimitry Andric if (plastiter != NULL) 1540b57cec5SDimitry Andric *plastiter = FALSE; 1550b57cec5SDimitry Andric /* leave pupper and plower set to entire iteration space */ 1560b57cec5SDimitry Andric *pstride = incr; /* value should never be used */ 1570b57cec5SDimitry Andric // *plower = *pupper - incr; 1580b57cec5SDimitry Andric // let compiler bypass the illegal loop (like for(i=1;i<10;i--)) 1590b57cec5SDimitry Andric // THE LINE COMMENTED ABOVE CAUSED shape2F/h_tests_1.f TO HAVE A FAILURE 1600b57cec5SDimitry Andric // ON A ZERO-TRIP LOOP (lower=1, upper=0,stride=1) - JPH June 23, 2009. 1610b57cec5SDimitry Andric #ifdef KMP_DEBUG 1620b57cec5SDimitry Andric { 1630b57cec5SDimitry Andric char *buff; 1640b57cec5SDimitry Andric // create format specifiers before the debug output 1650b57cec5SDimitry Andric buff = __kmp_str_format("__kmpc_for_static_init:(ZERO TRIP) liter=%%d " 1660b57cec5SDimitry Andric "lower=%%%s upper=%%%s stride = %%%s " 1670b57cec5SDimitry Andric "signed?<%s>, loc = %%s\n", 1680b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, 1690b57cec5SDimitry Andric traits_t<ST>::spec, traits_t<T>::spec); 170fe6060f1SDimitry Andric check_loc(loc); 1710b57cec5SDimitry Andric KD_TRACE(100, 1720b57cec5SDimitry Andric (buff, *plastiter, *plower, *pupper, *pstride, loc->psource)); 1730b57cec5SDimitry Andric __kmp_str_free(&buff); 1740b57cec5SDimitry Andric } 1750b57cec5SDimitry Andric #endif 1760b57cec5SDimitry Andric KE_TRACE(10, ("__kmpc_for_static_init: T#%d return\n", global_tid)); 1770b57cec5SDimitry Andric 1780b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 1790b57cec5SDimitry Andric if (ompt_enabled.ompt_callback_work) { 1800b57cec5SDimitry Andric ompt_callbacks.ompt_callback(ompt_callback_work)( 1810b57cec5SDimitry Andric ompt_work_type, ompt_scope_begin, &(team_info->parallel_data), 1820b57cec5SDimitry Andric &(task_info->task_data), 0, codeptr); 1830b57cec5SDimitry Andric } 
1840b57cec5SDimitry Andric #endif 1850b57cec5SDimitry Andric KMP_STATS_LOOP_END(OMP_loop_static_iterations); 1860b57cec5SDimitry Andric return; 1870b57cec5SDimitry Andric } 1880b57cec5SDimitry Andric 1890b57cec5SDimitry Andric // Although there are schedule enumerations above kmp_ord_upper which are not 1900b57cec5SDimitry Andric // schedules for "distribute", the only ones which are useful are dynamic, so 1910b57cec5SDimitry Andric // cannot be seen here, since this codepath is only executed for static 1920b57cec5SDimitry Andric // schedules. 1930b57cec5SDimitry Andric if (schedtype > kmp_ord_upper) { 1940b57cec5SDimitry Andric // we are in DISTRIBUTE construct 1950b57cec5SDimitry Andric schedtype += kmp_sch_static - 1960b57cec5SDimitry Andric kmp_distribute_static; // AC: convert to usual schedule type 197*81ad6265SDimitry Andric if (th->th.th_team->t.t_serialized > 1) { 198*81ad6265SDimitry Andric tid = 0; 199*81ad6265SDimitry Andric team = th->th.th_team; 200*81ad6265SDimitry Andric } else { 2010b57cec5SDimitry Andric tid = th->th.th_team->t.t_master_tid; 2020b57cec5SDimitry Andric team = th->th.th_team->t.t_parent; 203*81ad6265SDimitry Andric } 2040b57cec5SDimitry Andric } else { 2050b57cec5SDimitry Andric tid = __kmp_tid_from_gtid(global_tid); 2060b57cec5SDimitry Andric team = th->th.th_team; 2070b57cec5SDimitry Andric } 2080b57cec5SDimitry Andric 2090b57cec5SDimitry Andric /* determine if "for" loop is an active worksharing construct */ 2100b57cec5SDimitry Andric if (team->t.t_serialized) { 2110b57cec5SDimitry Andric /* serialized parallel, each thread executes whole iteration space */ 2120b57cec5SDimitry Andric if (plastiter != NULL) 2130b57cec5SDimitry Andric *plastiter = TRUE; 2140b57cec5SDimitry Andric /* leave pupper and plower set to entire iteration space */ 2150b57cec5SDimitry Andric *pstride = 2160b57cec5SDimitry Andric (incr > 0) ? 
(*pupper - *plower + 1) : (-(*plower - *pupper + 1)); 2170b57cec5SDimitry Andric 2180b57cec5SDimitry Andric #ifdef KMP_DEBUG 2190b57cec5SDimitry Andric { 2200b57cec5SDimitry Andric char *buff; 2210b57cec5SDimitry Andric // create format specifiers before the debug output 2220b57cec5SDimitry Andric buff = __kmp_str_format("__kmpc_for_static_init: (serial) liter=%%d " 2230b57cec5SDimitry Andric "lower=%%%s upper=%%%s stride = %%%s\n", 2240b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, 2250b57cec5SDimitry Andric traits_t<ST>::spec); 2260b57cec5SDimitry Andric KD_TRACE(100, (buff, *plastiter, *plower, *pupper, *pstride)); 2270b57cec5SDimitry Andric __kmp_str_free(&buff); 2280b57cec5SDimitry Andric } 2290b57cec5SDimitry Andric #endif 2300b57cec5SDimitry Andric KE_TRACE(10, ("__kmpc_for_static_init: T#%d return\n", global_tid)); 2310b57cec5SDimitry Andric 2320b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 2330b57cec5SDimitry Andric if (ompt_enabled.ompt_callback_work) { 2340b57cec5SDimitry Andric ompt_callbacks.ompt_callback(ompt_callback_work)( 2350b57cec5SDimitry Andric ompt_work_type, ompt_scope_begin, &(team_info->parallel_data), 2360b57cec5SDimitry Andric &(task_info->task_data), *pstride, codeptr); 2370b57cec5SDimitry Andric } 2380b57cec5SDimitry Andric #endif 2390b57cec5SDimitry Andric KMP_STATS_LOOP_END(OMP_loop_static_iterations); 2400b57cec5SDimitry Andric return; 2410b57cec5SDimitry Andric } 2420b57cec5SDimitry Andric nth = team->t.t_nproc; 2430b57cec5SDimitry Andric if (nth == 1) { 2440b57cec5SDimitry Andric if (plastiter != NULL) 2450b57cec5SDimitry Andric *plastiter = TRUE; 2460b57cec5SDimitry Andric *pstride = 2470b57cec5SDimitry Andric (incr > 0) ? 
(*pupper - *plower + 1) : (-(*plower - *pupper + 1)); 2480b57cec5SDimitry Andric #ifdef KMP_DEBUG 2490b57cec5SDimitry Andric { 2500b57cec5SDimitry Andric char *buff; 2510b57cec5SDimitry Andric // create format specifiers before the debug output 2520b57cec5SDimitry Andric buff = __kmp_str_format("__kmpc_for_static_init: (serial) liter=%%d " 2530b57cec5SDimitry Andric "lower=%%%s upper=%%%s stride = %%%s\n", 2540b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, 2550b57cec5SDimitry Andric traits_t<ST>::spec); 2560b57cec5SDimitry Andric KD_TRACE(100, (buff, *plastiter, *plower, *pupper, *pstride)); 2570b57cec5SDimitry Andric __kmp_str_free(&buff); 2580b57cec5SDimitry Andric } 2590b57cec5SDimitry Andric #endif 2600b57cec5SDimitry Andric KE_TRACE(10, ("__kmpc_for_static_init: T#%d return\n", global_tid)); 2610b57cec5SDimitry Andric 2620b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 2630b57cec5SDimitry Andric if (ompt_enabled.ompt_callback_work) { 2640b57cec5SDimitry Andric ompt_callbacks.ompt_callback(ompt_callback_work)( 2650b57cec5SDimitry Andric ompt_work_type, ompt_scope_begin, &(team_info->parallel_data), 2660b57cec5SDimitry Andric &(task_info->task_data), *pstride, codeptr); 2670b57cec5SDimitry Andric } 2680b57cec5SDimitry Andric #endif 2690b57cec5SDimitry Andric KMP_STATS_LOOP_END(OMP_loop_static_iterations); 2700b57cec5SDimitry Andric return; 2710b57cec5SDimitry Andric } 2720b57cec5SDimitry Andric 2730b57cec5SDimitry Andric /* compute trip count */ 2740b57cec5SDimitry Andric if (incr == 1) { 2750b57cec5SDimitry Andric trip_count = *pupper - *plower + 1; 2760b57cec5SDimitry Andric } else if (incr == -1) { 2770b57cec5SDimitry Andric trip_count = *plower - *pupper + 1; 2780b57cec5SDimitry Andric } else if (incr > 0) { 2790b57cec5SDimitry Andric // upper-lower can exceed the limit of signed type 2800b57cec5SDimitry Andric trip_count = (UT)(*pupper - *plower) / incr + 1; 2810b57cec5SDimitry Andric } else { 2820b57cec5SDimitry Andric trip_count = 
(UT)(*plower - *pupper) / (-incr) + 1; 2830b57cec5SDimitry Andric } 2840b57cec5SDimitry Andric 2850b57cec5SDimitry Andric #if KMP_STATS_ENABLED 2860b57cec5SDimitry Andric if (KMP_MASTER_GTID(gtid)) { 2870b57cec5SDimitry Andric KMP_COUNT_VALUE(OMP_loop_static_total_iterations, trip_count); 2880b57cec5SDimitry Andric } 2890b57cec5SDimitry Andric #endif 2900b57cec5SDimitry Andric 2910b57cec5SDimitry Andric if (__kmp_env_consistency_check) { 2920b57cec5SDimitry Andric /* tripcount overflow? */ 2930b57cec5SDimitry Andric if (trip_count == 0 && *pupper != *plower) { 2940b57cec5SDimitry Andric __kmp_error_construct(kmp_i18n_msg_CnsIterationRangeTooLarge, ct_pdo, 2950b57cec5SDimitry Andric loc); 2960b57cec5SDimitry Andric } 2970b57cec5SDimitry Andric } 2980b57cec5SDimitry Andric 2990b57cec5SDimitry Andric /* compute remaining parameters */ 3000b57cec5SDimitry Andric switch (schedtype) { 3010b57cec5SDimitry Andric case kmp_sch_static: { 3020b57cec5SDimitry Andric if (trip_count < nth) { 3030b57cec5SDimitry Andric KMP_DEBUG_ASSERT( 3040b57cec5SDimitry Andric __kmp_static == kmp_sch_static_greedy || 3050b57cec5SDimitry Andric __kmp_static == 3060b57cec5SDimitry Andric kmp_sch_static_balanced); // Unknown static scheduling type. 3070b57cec5SDimitry Andric if (tid < trip_count) { 3080b57cec5SDimitry Andric *pupper = *plower = *plower + tid * incr; 3090b57cec5SDimitry Andric } else { 310fe6060f1SDimitry Andric // set bounds so non-active threads execute no iterations 311fe6060f1SDimitry Andric *plower = *pupper + (incr > 0 ? 
1 : -1); 3120b57cec5SDimitry Andric } 3130b57cec5SDimitry Andric if (plastiter != NULL) 3140b57cec5SDimitry Andric *plastiter = (tid == trip_count - 1); 3150b57cec5SDimitry Andric } else { 3160b57cec5SDimitry Andric if (__kmp_static == kmp_sch_static_balanced) { 3170b57cec5SDimitry Andric UT small_chunk = trip_count / nth; 3180b57cec5SDimitry Andric UT extras = trip_count % nth; 3190b57cec5SDimitry Andric *plower += incr * (tid * small_chunk + (tid < extras ? tid : extras)); 3200b57cec5SDimitry Andric *pupper = *plower + small_chunk * incr - (tid < extras ? 0 : incr); 3210b57cec5SDimitry Andric if (plastiter != NULL) 3220b57cec5SDimitry Andric *plastiter = (tid == nth - 1); 3230b57cec5SDimitry Andric } else { 3240b57cec5SDimitry Andric T big_chunk_inc_count = 3250b57cec5SDimitry Andric (trip_count / nth + ((trip_count % nth) ? 1 : 0)) * incr; 3260b57cec5SDimitry Andric T old_upper = *pupper; 3270b57cec5SDimitry Andric 3280b57cec5SDimitry Andric KMP_DEBUG_ASSERT(__kmp_static == kmp_sch_static_greedy); 3290b57cec5SDimitry Andric // Unknown static scheduling type. 
3300b57cec5SDimitry Andric 3310b57cec5SDimitry Andric *plower += tid * big_chunk_inc_count; 3320b57cec5SDimitry Andric *pupper = *plower + big_chunk_inc_count - incr; 3330b57cec5SDimitry Andric if (incr > 0) { 3340b57cec5SDimitry Andric if (*pupper < *plower) 3350b57cec5SDimitry Andric *pupper = traits_t<T>::max_value; 3360b57cec5SDimitry Andric if (plastiter != NULL) 3370b57cec5SDimitry Andric *plastiter = *plower <= old_upper && *pupper > old_upper - incr; 3380b57cec5SDimitry Andric if (*pupper > old_upper) 3390b57cec5SDimitry Andric *pupper = old_upper; // tracker C73258 3400b57cec5SDimitry Andric } else { 3410b57cec5SDimitry Andric if (*pupper > *plower) 3420b57cec5SDimitry Andric *pupper = traits_t<T>::min_value; 3430b57cec5SDimitry Andric if (plastiter != NULL) 3440b57cec5SDimitry Andric *plastiter = *plower >= old_upper && *pupper < old_upper - incr; 3450b57cec5SDimitry Andric if (*pupper < old_upper) 3460b57cec5SDimitry Andric *pupper = old_upper; // tracker C73258 3470b57cec5SDimitry Andric } 3480b57cec5SDimitry Andric } 3490b57cec5SDimitry Andric } 3500b57cec5SDimitry Andric *pstride = trip_count; 3510b57cec5SDimitry Andric break; 3520b57cec5SDimitry Andric } 3530b57cec5SDimitry Andric case kmp_sch_static_chunked: { 3540b57cec5SDimitry Andric ST span; 355fe6060f1SDimitry Andric UT nchunks; 356fe6060f1SDimitry Andric if (chunk < 1) 3570b57cec5SDimitry Andric chunk = 1; 358fe6060f1SDimitry Andric else if ((UT)chunk > trip_count) 359fe6060f1SDimitry Andric chunk = trip_count; 360fe6060f1SDimitry Andric nchunks = (trip_count) / (UT)chunk + (trip_count % (UT)chunk ? 
1 : 0); 3610b57cec5SDimitry Andric span = chunk * incr; 362fe6060f1SDimitry Andric if (nchunks < nth) { 363fe6060f1SDimitry Andric *pstride = span * nchunks; 364fe6060f1SDimitry Andric if (tid < nchunks) { 365fe6060f1SDimitry Andric *plower = *plower + (span * tid); 366fe6060f1SDimitry Andric *pupper = *plower + span - incr; 367fe6060f1SDimitry Andric } else { 368fe6060f1SDimitry Andric *plower = *pupper + (incr > 0 ? 1 : -1); 369fe6060f1SDimitry Andric } 370fe6060f1SDimitry Andric } else { 3710b57cec5SDimitry Andric *pstride = span * nth; 3720b57cec5SDimitry Andric *plower = *plower + (span * tid); 3730b57cec5SDimitry Andric *pupper = *plower + span - incr; 374fe6060f1SDimitry Andric } 3750b57cec5SDimitry Andric if (plastiter != NULL) 376fe6060f1SDimitry Andric *plastiter = (tid == (nchunks - 1) % nth); 3770b57cec5SDimitry Andric break; 3780b57cec5SDimitry Andric } 3790b57cec5SDimitry Andric case kmp_sch_static_balanced_chunked: { 3800b57cec5SDimitry Andric T old_upper = *pupper; 3810b57cec5SDimitry Andric // round up to make sure the chunk is enough to cover all iterations 3820b57cec5SDimitry Andric UT span = (trip_count + nth - 1) / nth; 3830b57cec5SDimitry Andric 3840b57cec5SDimitry Andric // perform chunk adjustment 3850b57cec5SDimitry Andric chunk = (span + chunk - 1) & ~(chunk - 1); 3860b57cec5SDimitry Andric 3870b57cec5SDimitry Andric span = chunk * incr; 3880b57cec5SDimitry Andric *plower = *plower + (span * tid); 3890b57cec5SDimitry Andric *pupper = *plower + span - incr; 3900b57cec5SDimitry Andric if (incr > 0) { 3910b57cec5SDimitry Andric if (*pupper > old_upper) 3920b57cec5SDimitry Andric *pupper = old_upper; 3930b57cec5SDimitry Andric } else if (*pupper < old_upper) 3940b57cec5SDimitry Andric *pupper = old_upper; 3950b57cec5SDimitry Andric 3960b57cec5SDimitry Andric if (plastiter != NULL) 3970b57cec5SDimitry Andric *plastiter = (tid == ((trip_count - 1) / (UT)chunk)); 3980b57cec5SDimitry Andric break; 3990b57cec5SDimitry Andric } 4000b57cec5SDimitry 
Andric default: 4010b57cec5SDimitry Andric KMP_ASSERT2(0, "__kmpc_for_static_init: unknown scheduling type"); 4020b57cec5SDimitry Andric break; 4030b57cec5SDimitry Andric } 4040b57cec5SDimitry Andric 4050b57cec5SDimitry Andric #if USE_ITT_BUILD 4060b57cec5SDimitry Andric // Report loop metadata 4070b57cec5SDimitry Andric if (KMP_MASTER_TID(tid) && __itt_metadata_add_ptr && 4080b57cec5SDimitry Andric __kmp_forkjoin_frames_mode == 3 && th->th.th_teams_microtask == NULL && 4090b57cec5SDimitry Andric team->t.t_active_level == 1) { 4100b57cec5SDimitry Andric kmp_uint64 cur_chunk = chunk; 411e8d8bef9SDimitry Andric check_loc(loc); 4120b57cec5SDimitry Andric // Calculate chunk in case it was not specified; it is specified for 4130b57cec5SDimitry Andric // kmp_sch_static_chunked 4140b57cec5SDimitry Andric if (schedtype == kmp_sch_static) { 4150b57cec5SDimitry Andric cur_chunk = trip_count / nth + ((trip_count % nth) ? 1 : 0); 4160b57cec5SDimitry Andric } 4170b57cec5SDimitry Andric // 0 - "static" schedule 4180b57cec5SDimitry Andric __kmp_itt_metadata_loop(loc, 0, trip_count, cur_chunk); 4190b57cec5SDimitry Andric } 4200b57cec5SDimitry Andric #endif 4210b57cec5SDimitry Andric #ifdef KMP_DEBUG 4220b57cec5SDimitry Andric { 4230b57cec5SDimitry Andric char *buff; 4240b57cec5SDimitry Andric // create format specifiers before the debug output 4250b57cec5SDimitry Andric buff = __kmp_str_format("__kmpc_for_static_init: liter=%%d lower=%%%s " 4260b57cec5SDimitry Andric "upper=%%%s stride = %%%s signed?<%s>\n", 4270b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, 4280b57cec5SDimitry Andric traits_t<ST>::spec, traits_t<T>::spec); 4290b57cec5SDimitry Andric KD_TRACE(100, (buff, *plastiter, *plower, *pupper, *pstride)); 4300b57cec5SDimitry Andric __kmp_str_free(&buff); 4310b57cec5SDimitry Andric } 4320b57cec5SDimitry Andric #endif 4330b57cec5SDimitry Andric KE_TRACE(10, ("__kmpc_for_static_init: T#%d return\n", global_tid)); 4340b57cec5SDimitry Andric 4350b57cec5SDimitry 
Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 4360b57cec5SDimitry Andric if (ompt_enabled.ompt_callback_work) { 4370b57cec5SDimitry Andric ompt_callbacks.ompt_callback(ompt_callback_work)( 4380b57cec5SDimitry Andric ompt_work_type, ompt_scope_begin, &(team_info->parallel_data), 4390b57cec5SDimitry Andric &(task_info->task_data), trip_count, codeptr); 4400b57cec5SDimitry Andric } 441*81ad6265SDimitry Andric if (ompt_enabled.ompt_callback_dispatch) { 442*81ad6265SDimitry Andric ompt_dispatch_t dispatch_type; 443*81ad6265SDimitry Andric ompt_data_t instance = ompt_data_none; 444*81ad6265SDimitry Andric ompt_dispatch_chunk_t dispatch_chunk; 445*81ad6265SDimitry Andric if (ompt_work_type == ompt_work_sections) { 446*81ad6265SDimitry Andric dispatch_type = ompt_dispatch_section; 447*81ad6265SDimitry Andric instance.ptr = codeptr; 448*81ad6265SDimitry Andric } else { 449*81ad6265SDimitry Andric OMPT_GET_DISPATCH_CHUNK(dispatch_chunk, *plower, *pupper, incr); 450*81ad6265SDimitry Andric dispatch_type = (ompt_work_type == ompt_work_distribute) 451*81ad6265SDimitry Andric ? 
ompt_dispatch_distribute_chunk 452*81ad6265SDimitry Andric : ompt_dispatch_ws_loop_chunk; 453*81ad6265SDimitry Andric instance.ptr = &dispatch_chunk; 454*81ad6265SDimitry Andric } 455*81ad6265SDimitry Andric ompt_callbacks.ompt_callback(ompt_callback_dispatch)( 456*81ad6265SDimitry Andric &(team_info->parallel_data), &(task_info->task_data), dispatch_type, 457*81ad6265SDimitry Andric instance); 458*81ad6265SDimitry Andric } 4590b57cec5SDimitry Andric #endif 4600b57cec5SDimitry Andric 4610b57cec5SDimitry Andric KMP_STATS_LOOP_END(OMP_loop_static_iterations); 4620b57cec5SDimitry Andric return; 4630b57cec5SDimitry Andric } 4640b57cec5SDimitry Andric 4650b57cec5SDimitry Andric template <typename T> 4660b57cec5SDimitry Andric static void __kmp_dist_for_static_init(ident_t *loc, kmp_int32 gtid, 4670b57cec5SDimitry Andric kmp_int32 schedule, kmp_int32 *plastiter, 4680b57cec5SDimitry Andric T *plower, T *pupper, T *pupperDist, 4690b57cec5SDimitry Andric typename traits_t<T>::signed_t *pstride, 4700b57cec5SDimitry Andric typename traits_t<T>::signed_t incr, 471*81ad6265SDimitry Andric typename traits_t<T>::signed_t chunk 472*81ad6265SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 473*81ad6265SDimitry Andric , 474*81ad6265SDimitry Andric void *codeptr 475*81ad6265SDimitry Andric #endif 476*81ad6265SDimitry Andric ) { 4770b57cec5SDimitry Andric KMP_COUNT_BLOCK(OMP_DISTRIBUTE); 4780b57cec5SDimitry Andric KMP_PUSH_PARTITIONED_TIMER(OMP_distribute); 4790b57cec5SDimitry Andric KMP_PUSH_PARTITIONED_TIMER(OMP_distribute_scheduling); 4800b57cec5SDimitry Andric typedef typename traits_t<T>::unsigned_t UT; 4810b57cec5SDimitry Andric typedef typename traits_t<T>::signed_t ST; 4820b57cec5SDimitry Andric kmp_uint32 tid; 4830b57cec5SDimitry Andric kmp_uint32 nth; 4840b57cec5SDimitry Andric kmp_uint32 team_id; 4850b57cec5SDimitry Andric kmp_uint32 nteams; 4860b57cec5SDimitry Andric UT trip_count; 4870b57cec5SDimitry Andric kmp_team_t *team; 4880b57cec5SDimitry Andric kmp_info_t *th; 
4890b57cec5SDimitry Andric 4900b57cec5SDimitry Andric KMP_DEBUG_ASSERT(plastiter && plower && pupper && pupperDist && pstride); 4910b57cec5SDimitry Andric KE_TRACE(10, ("__kmpc_dist_for_static_init called (%d)\n", gtid)); 492e8d8bef9SDimitry Andric __kmp_assert_valid_gtid(gtid); 4930b57cec5SDimitry Andric #ifdef KMP_DEBUG 4940b57cec5SDimitry Andric { 4950b57cec5SDimitry Andric char *buff; 4960b57cec5SDimitry Andric // create format specifiers before the debug output 4970b57cec5SDimitry Andric buff = __kmp_str_format( 4980b57cec5SDimitry Andric "__kmpc_dist_for_static_init: T#%%d schedLoop=%%d liter=%%d " 4990b57cec5SDimitry Andric "iter=(%%%s, %%%s, %%%s) chunk=%%%s signed?<%s>\n", 5000b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, traits_t<ST>::spec, 5010b57cec5SDimitry Andric traits_t<ST>::spec, traits_t<T>::spec); 5020b57cec5SDimitry Andric KD_TRACE(100, 5030b57cec5SDimitry Andric (buff, gtid, schedule, *plastiter, *plower, *pupper, incr, chunk)); 5040b57cec5SDimitry Andric __kmp_str_free(&buff); 5050b57cec5SDimitry Andric } 5060b57cec5SDimitry Andric #endif 5070b57cec5SDimitry Andric 5080b57cec5SDimitry Andric if (__kmp_env_consistency_check) { 5090b57cec5SDimitry Andric __kmp_push_workshare(gtid, ct_pdo, loc); 5100b57cec5SDimitry Andric if (incr == 0) { 5110b57cec5SDimitry Andric __kmp_error_construct(kmp_i18n_msg_CnsLoopIncrZeroProhibited, ct_pdo, 5120b57cec5SDimitry Andric loc); 5130b57cec5SDimitry Andric } 5140b57cec5SDimitry Andric if (incr > 0 ? (*pupper < *plower) : (*plower < *pupper)) { 5150b57cec5SDimitry Andric // The loop is illegal. 
5160b57cec5SDimitry Andric // Some zero-trip loops maintained by compiler, e.g.: 5170b57cec5SDimitry Andric // for(i=10;i<0;++i) // lower >= upper - run-time check 5180b57cec5SDimitry Andric // for(i=0;i>10;--i) // lower <= upper - run-time check 5190b57cec5SDimitry Andric // for(i=0;i>10;++i) // incr > 0 - compile-time check 5200b57cec5SDimitry Andric // for(i=10;i<0;--i) // incr < 0 - compile-time check 5210b57cec5SDimitry Andric // Compiler does not check the following illegal loops: 5220b57cec5SDimitry Andric // for(i=0;i<10;i+=incr) // where incr<0 5230b57cec5SDimitry Andric // for(i=10;i>0;i-=incr) // where incr<0 5240b57cec5SDimitry Andric __kmp_error_construct(kmp_i18n_msg_CnsLoopIncrIllegal, ct_pdo, loc); 5250b57cec5SDimitry Andric } 5260b57cec5SDimitry Andric } 5270b57cec5SDimitry Andric tid = __kmp_tid_from_gtid(gtid); 5280b57cec5SDimitry Andric th = __kmp_threads[gtid]; 5290b57cec5SDimitry Andric nth = th->th.th_team_nproc; 5300b57cec5SDimitry Andric team = th->th.th_team; 5310b57cec5SDimitry Andric KMP_DEBUG_ASSERT(th->th.th_teams_microtask); // we are in the teams construct 5320b57cec5SDimitry Andric nteams = th->th.th_teams_size.nteams; 5330b57cec5SDimitry Andric team_id = team->t.t_master_tid; 5340b57cec5SDimitry Andric KMP_DEBUG_ASSERT(nteams == (kmp_uint32)team->t.t_parent->t.t_nproc); 5350b57cec5SDimitry Andric 5360b57cec5SDimitry Andric // compute global trip count 5370b57cec5SDimitry Andric if (incr == 1) { 5380b57cec5SDimitry Andric trip_count = *pupper - *plower + 1; 5390b57cec5SDimitry Andric } else if (incr == -1) { 5400b57cec5SDimitry Andric trip_count = *plower - *pupper + 1; 5410b57cec5SDimitry Andric } else if (incr > 0) { 5420b57cec5SDimitry Andric // upper-lower can exceed the limit of signed type 5430b57cec5SDimitry Andric trip_count = (UT)(*pupper - *plower) / incr + 1; 5440b57cec5SDimitry Andric } else { 5450b57cec5SDimitry Andric trip_count = (UT)(*plower - *pupper) / (-incr) + 1; 5460b57cec5SDimitry Andric } 5470b57cec5SDimitry 
Andric 5480b57cec5SDimitry Andric *pstride = *pupper - *plower; // just in case (can be unused) 5490b57cec5SDimitry Andric if (trip_count <= nteams) { 5500b57cec5SDimitry Andric KMP_DEBUG_ASSERT( 5510b57cec5SDimitry Andric __kmp_static == kmp_sch_static_greedy || 5520b57cec5SDimitry Andric __kmp_static == 5530b57cec5SDimitry Andric kmp_sch_static_balanced); // Unknown static scheduling type. 554fe6060f1SDimitry Andric // only primary threads of some teams get single iteration, other threads 555fe6060f1SDimitry Andric // get nothing 5560b57cec5SDimitry Andric if (team_id < trip_count && tid == 0) { 5570b57cec5SDimitry Andric *pupper = *pupperDist = *plower = *plower + team_id * incr; 5580b57cec5SDimitry Andric } else { 5590b57cec5SDimitry Andric *pupperDist = *pupper; 5600b57cec5SDimitry Andric *plower = *pupper + incr; // compiler should skip loop body 5610b57cec5SDimitry Andric } 5620b57cec5SDimitry Andric if (plastiter != NULL) 5630b57cec5SDimitry Andric *plastiter = (tid == 0 && team_id == trip_count - 1); 5640b57cec5SDimitry Andric } else { 5650b57cec5SDimitry Andric // Get the team's chunk first (each team gets at most one chunk) 5660b57cec5SDimitry Andric if (__kmp_static == kmp_sch_static_balanced) { 5670b57cec5SDimitry Andric UT chunkD = trip_count / nteams; 5680b57cec5SDimitry Andric UT extras = trip_count % nteams; 5690b57cec5SDimitry Andric *plower += 5700b57cec5SDimitry Andric incr * (team_id * chunkD + (team_id < extras ? team_id : extras)); 5710b57cec5SDimitry Andric *pupperDist = *plower + chunkD * incr - (team_id < extras ? 0 : incr); 5720b57cec5SDimitry Andric if (plastiter != NULL) 5730b57cec5SDimitry Andric *plastiter = (team_id == nteams - 1); 5740b57cec5SDimitry Andric } else { 5750b57cec5SDimitry Andric T chunk_inc_count = 5760b57cec5SDimitry Andric (trip_count / nteams + ((trip_count % nteams) ? 
1 : 0)) * incr; 5770b57cec5SDimitry Andric T upper = *pupper; 5780b57cec5SDimitry Andric KMP_DEBUG_ASSERT(__kmp_static == kmp_sch_static_greedy); 5790b57cec5SDimitry Andric // Unknown static scheduling type. 5800b57cec5SDimitry Andric *plower += team_id * chunk_inc_count; 5810b57cec5SDimitry Andric *pupperDist = *plower + chunk_inc_count - incr; 5820b57cec5SDimitry Andric // Check/correct bounds if needed 5830b57cec5SDimitry Andric if (incr > 0) { 5840b57cec5SDimitry Andric if (*pupperDist < *plower) 5850b57cec5SDimitry Andric *pupperDist = traits_t<T>::max_value; 5860b57cec5SDimitry Andric if (plastiter != NULL) 5870b57cec5SDimitry Andric *plastiter = *plower <= upper && *pupperDist > upper - incr; 5880b57cec5SDimitry Andric if (*pupperDist > upper) 5890b57cec5SDimitry Andric *pupperDist = upper; // tracker C73258 5900b57cec5SDimitry Andric if (*plower > *pupperDist) { 5910b57cec5SDimitry Andric *pupper = *pupperDist; // no iterations available for the team 5920b57cec5SDimitry Andric goto end; 5930b57cec5SDimitry Andric } 5940b57cec5SDimitry Andric } else { 5950b57cec5SDimitry Andric if (*pupperDist > *plower) 5960b57cec5SDimitry Andric *pupperDist = traits_t<T>::min_value; 5970b57cec5SDimitry Andric if (plastiter != NULL) 5980b57cec5SDimitry Andric *plastiter = *plower >= upper && *pupperDist < upper - incr; 5990b57cec5SDimitry Andric if (*pupperDist < upper) 6000b57cec5SDimitry Andric *pupperDist = upper; // tracker C73258 6010b57cec5SDimitry Andric if (*plower < *pupperDist) { 6020b57cec5SDimitry Andric *pupper = *pupperDist; // no iterations available for the team 6030b57cec5SDimitry Andric goto end; 6040b57cec5SDimitry Andric } 6050b57cec5SDimitry Andric } 6060b57cec5SDimitry Andric } 6070b57cec5SDimitry Andric // Get the parallel loop chunk now (for thread) 6080b57cec5SDimitry Andric // compute trip count for team's chunk 6090b57cec5SDimitry Andric if (incr == 1) { 6100b57cec5SDimitry Andric trip_count = *pupperDist - *plower + 1; 6110b57cec5SDimitry Andric 
} else if (incr == -1) { 6120b57cec5SDimitry Andric trip_count = *plower - *pupperDist + 1; 6130b57cec5SDimitry Andric } else if (incr > 1) { 6140b57cec5SDimitry Andric // upper-lower can exceed the limit of signed type 6150b57cec5SDimitry Andric trip_count = (UT)(*pupperDist - *plower) / incr + 1; 6160b57cec5SDimitry Andric } else { 6170b57cec5SDimitry Andric trip_count = (UT)(*plower - *pupperDist) / (-incr) + 1; 6180b57cec5SDimitry Andric } 6190b57cec5SDimitry Andric KMP_DEBUG_ASSERT(trip_count); 6200b57cec5SDimitry Andric switch (schedule) { 6210b57cec5SDimitry Andric case kmp_sch_static: { 6220b57cec5SDimitry Andric if (trip_count <= nth) { 6230b57cec5SDimitry Andric KMP_DEBUG_ASSERT( 6240b57cec5SDimitry Andric __kmp_static == kmp_sch_static_greedy || 6250b57cec5SDimitry Andric __kmp_static == 6260b57cec5SDimitry Andric kmp_sch_static_balanced); // Unknown static scheduling type. 6270b57cec5SDimitry Andric if (tid < trip_count) 6280b57cec5SDimitry Andric *pupper = *plower = *plower + tid * incr; 6290b57cec5SDimitry Andric else 6300b57cec5SDimitry Andric *plower = *pupper + incr; // no iterations available 6310b57cec5SDimitry Andric if (plastiter != NULL) 6320b57cec5SDimitry Andric if (*plastiter != 0 && !(tid == trip_count - 1)) 6330b57cec5SDimitry Andric *plastiter = 0; 6340b57cec5SDimitry Andric } else { 6350b57cec5SDimitry Andric if (__kmp_static == kmp_sch_static_balanced) { 6360b57cec5SDimitry Andric UT chunkL = trip_count / nth; 6370b57cec5SDimitry Andric UT extras = trip_count % nth; 6380b57cec5SDimitry Andric *plower += incr * (tid * chunkL + (tid < extras ? tid : extras)); 6390b57cec5SDimitry Andric *pupper = *plower + chunkL * incr - (tid < extras ? 
0 : incr); 6400b57cec5SDimitry Andric if (plastiter != NULL) 6410b57cec5SDimitry Andric if (*plastiter != 0 && !(tid == nth - 1)) 6420b57cec5SDimitry Andric *plastiter = 0; 6430b57cec5SDimitry Andric } else { 6440b57cec5SDimitry Andric T chunk_inc_count = 6450b57cec5SDimitry Andric (trip_count / nth + ((trip_count % nth) ? 1 : 0)) * incr; 6460b57cec5SDimitry Andric T upper = *pupperDist; 6470b57cec5SDimitry Andric KMP_DEBUG_ASSERT(__kmp_static == kmp_sch_static_greedy); 6480b57cec5SDimitry Andric // Unknown static scheduling type. 6490b57cec5SDimitry Andric *plower += tid * chunk_inc_count; 6500b57cec5SDimitry Andric *pupper = *plower + chunk_inc_count - incr; 6510b57cec5SDimitry Andric if (incr > 0) { 6520b57cec5SDimitry Andric if (*pupper < *plower) 6530b57cec5SDimitry Andric *pupper = traits_t<T>::max_value; 6540b57cec5SDimitry Andric if (plastiter != NULL) 6550b57cec5SDimitry Andric if (*plastiter != 0 && 6560b57cec5SDimitry Andric !(*plower <= upper && *pupper > upper - incr)) 6570b57cec5SDimitry Andric *plastiter = 0; 6580b57cec5SDimitry Andric if (*pupper > upper) 6590b57cec5SDimitry Andric *pupper = upper; // tracker C73258 6600b57cec5SDimitry Andric } else { 6610b57cec5SDimitry Andric if (*pupper > *plower) 6620b57cec5SDimitry Andric *pupper = traits_t<T>::min_value; 6630b57cec5SDimitry Andric if (plastiter != NULL) 6640b57cec5SDimitry Andric if (*plastiter != 0 && 6650b57cec5SDimitry Andric !(*plower >= upper && *pupper < upper - incr)) 6660b57cec5SDimitry Andric *plastiter = 0; 6670b57cec5SDimitry Andric if (*pupper < upper) 6680b57cec5SDimitry Andric *pupper = upper; // tracker C73258 6690b57cec5SDimitry Andric } 6700b57cec5SDimitry Andric } 6710b57cec5SDimitry Andric } 6720b57cec5SDimitry Andric break; 6730b57cec5SDimitry Andric } 6740b57cec5SDimitry Andric case kmp_sch_static_chunked: { 6750b57cec5SDimitry Andric ST span; 6760b57cec5SDimitry Andric if (chunk < 1) 6770b57cec5SDimitry Andric chunk = 1; 6780b57cec5SDimitry Andric span = chunk * incr; 
6790b57cec5SDimitry Andric *pstride = span * nth; 6800b57cec5SDimitry Andric *plower = *plower + (span * tid); 6810b57cec5SDimitry Andric *pupper = *plower + span - incr; 6820b57cec5SDimitry Andric if (plastiter != NULL) 6830b57cec5SDimitry Andric if (*plastiter != 0 && !(tid == ((trip_count - 1) / (UT)chunk) % nth)) 6840b57cec5SDimitry Andric *plastiter = 0; 6850b57cec5SDimitry Andric break; 6860b57cec5SDimitry Andric } 6870b57cec5SDimitry Andric default: 6880b57cec5SDimitry Andric KMP_ASSERT2(0, 6890b57cec5SDimitry Andric "__kmpc_dist_for_static_init: unknown loop scheduling type"); 6900b57cec5SDimitry Andric break; 6910b57cec5SDimitry Andric } 6920b57cec5SDimitry Andric } 6930b57cec5SDimitry Andric end:; 6940b57cec5SDimitry Andric #ifdef KMP_DEBUG 6950b57cec5SDimitry Andric { 6960b57cec5SDimitry Andric char *buff; 6970b57cec5SDimitry Andric // create format specifiers before the debug output 6980b57cec5SDimitry Andric buff = __kmp_str_format( 6990b57cec5SDimitry Andric "__kmpc_dist_for_static_init: last=%%d lo=%%%s up=%%%s upDist=%%%s " 7000b57cec5SDimitry Andric "stride=%%%s signed?<%s>\n", 7010b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, traits_t<T>::spec, 7020b57cec5SDimitry Andric traits_t<ST>::spec, traits_t<T>::spec); 7030b57cec5SDimitry Andric KD_TRACE(100, (buff, *plastiter, *plower, *pupper, *pupperDist, *pstride)); 7040b57cec5SDimitry Andric __kmp_str_free(&buff); 7050b57cec5SDimitry Andric } 7060b57cec5SDimitry Andric #endif 7070b57cec5SDimitry Andric KE_TRACE(10, ("__kmpc_dist_for_static_init: T#%d return\n", gtid)); 708*81ad6265SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 709*81ad6265SDimitry Andric if (ompt_enabled.ompt_callback_work || ompt_enabled.ompt_callback_dispatch) { 710*81ad6265SDimitry Andric ompt_team_info_t *team_info = __ompt_get_teaminfo(0, NULL); 711*81ad6265SDimitry Andric ompt_task_info_t *task_info = __ompt_get_task_info_object(0); 712*81ad6265SDimitry Andric if (ompt_enabled.ompt_callback_work) { 
713*81ad6265SDimitry Andric ompt_callbacks.ompt_callback(ompt_callback_work)( 714*81ad6265SDimitry Andric ompt_work_distribute, ompt_scope_begin, &(team_info->parallel_data), 715*81ad6265SDimitry Andric &(task_info->task_data), 0, codeptr); 716*81ad6265SDimitry Andric } 717*81ad6265SDimitry Andric if (ompt_enabled.ompt_callback_dispatch) { 718*81ad6265SDimitry Andric ompt_data_t instance = ompt_data_none; 719*81ad6265SDimitry Andric ompt_dispatch_chunk_t dispatch_chunk; 720*81ad6265SDimitry Andric OMPT_GET_DISPATCH_CHUNK(dispatch_chunk, *plower, *pupperDist, incr); 721*81ad6265SDimitry Andric instance.ptr = &dispatch_chunk; 722*81ad6265SDimitry Andric ompt_callbacks.ompt_callback(ompt_callback_dispatch)( 723*81ad6265SDimitry Andric &(team_info->parallel_data), &(task_info->task_data), 724*81ad6265SDimitry Andric ompt_dispatch_distribute_chunk, instance); 725*81ad6265SDimitry Andric } 726*81ad6265SDimitry Andric } 727*81ad6265SDimitry Andric #endif // OMPT_SUPPORT && OMPT_OPTIONAL 7280b57cec5SDimitry Andric KMP_STATS_LOOP_END(OMP_distribute_iterations); 7290b57cec5SDimitry Andric return; 7300b57cec5SDimitry Andric } 7310b57cec5SDimitry Andric 7320b57cec5SDimitry Andric template <typename T> 7330b57cec5SDimitry Andric static void __kmp_team_static_init(ident_t *loc, kmp_int32 gtid, 7340b57cec5SDimitry Andric kmp_int32 *p_last, T *p_lb, T *p_ub, 7350b57cec5SDimitry Andric typename traits_t<T>::signed_t *p_st, 7360b57cec5SDimitry Andric typename traits_t<T>::signed_t incr, 7370b57cec5SDimitry Andric typename traits_t<T>::signed_t chunk) { 7380b57cec5SDimitry Andric // The routine returns the first chunk distributed to the team and 7390b57cec5SDimitry Andric // stride for next chunks calculation. 7400b57cec5SDimitry Andric // Last iteration flag set for the team that will execute 7410b57cec5SDimitry Andric // the last iteration of the loop. 7425ffd83dbSDimitry Andric // The routine is called for dist_schedule(static,chunk) only. 
7430b57cec5SDimitry Andric typedef typename traits_t<T>::unsigned_t UT; 7440b57cec5SDimitry Andric typedef typename traits_t<T>::signed_t ST; 7450b57cec5SDimitry Andric kmp_uint32 team_id; 7460b57cec5SDimitry Andric kmp_uint32 nteams; 7470b57cec5SDimitry Andric UT trip_count; 7480b57cec5SDimitry Andric T lower; 7490b57cec5SDimitry Andric T upper; 7500b57cec5SDimitry Andric ST span; 7510b57cec5SDimitry Andric kmp_team_t *team; 7520b57cec5SDimitry Andric kmp_info_t *th; 7530b57cec5SDimitry Andric 7540b57cec5SDimitry Andric KMP_DEBUG_ASSERT(p_last && p_lb && p_ub && p_st); 7550b57cec5SDimitry Andric KE_TRACE(10, ("__kmp_team_static_init called (%d)\n", gtid)); 756e8d8bef9SDimitry Andric __kmp_assert_valid_gtid(gtid); 7570b57cec5SDimitry Andric #ifdef KMP_DEBUG 7580b57cec5SDimitry Andric { 7590b57cec5SDimitry Andric char *buff; 7600b57cec5SDimitry Andric // create format specifiers before the debug output 7610b57cec5SDimitry Andric buff = __kmp_str_format("__kmp_team_static_init enter: T#%%d liter=%%d " 7620b57cec5SDimitry Andric "iter=(%%%s, %%%s, %%%s) chunk %%%s; signed?<%s>\n", 7630b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, 7640b57cec5SDimitry Andric traits_t<ST>::spec, traits_t<ST>::spec, 7650b57cec5SDimitry Andric traits_t<T>::spec); 7660b57cec5SDimitry Andric KD_TRACE(100, (buff, gtid, *p_last, *p_lb, *p_ub, *p_st, chunk)); 7670b57cec5SDimitry Andric __kmp_str_free(&buff); 7680b57cec5SDimitry Andric } 7690b57cec5SDimitry Andric #endif 7700b57cec5SDimitry Andric 7710b57cec5SDimitry Andric lower = *p_lb; 7720b57cec5SDimitry Andric upper = *p_ub; 7730b57cec5SDimitry Andric if (__kmp_env_consistency_check) { 7740b57cec5SDimitry Andric if (incr == 0) { 7750b57cec5SDimitry Andric __kmp_error_construct(kmp_i18n_msg_CnsLoopIncrZeroProhibited, ct_pdo, 7760b57cec5SDimitry Andric loc); 7770b57cec5SDimitry Andric } 7780b57cec5SDimitry Andric if (incr > 0 ? (upper < lower) : (lower < upper)) { 7790b57cec5SDimitry Andric // The loop is illegal. 
7800b57cec5SDimitry Andric // Some zero-trip loops maintained by compiler, e.g.: 7810b57cec5SDimitry Andric // for(i=10;i<0;++i) // lower >= upper - run-time check 7820b57cec5SDimitry Andric // for(i=0;i>10;--i) // lower <= upper - run-time check 7830b57cec5SDimitry Andric // for(i=0;i>10;++i) // incr > 0 - compile-time check 7840b57cec5SDimitry Andric // for(i=10;i<0;--i) // incr < 0 - compile-time check 7850b57cec5SDimitry Andric // Compiler does not check the following illegal loops: 7860b57cec5SDimitry Andric // for(i=0;i<10;i+=incr) // where incr<0 7870b57cec5SDimitry Andric // for(i=10;i>0;i-=incr) // where incr<0 7880b57cec5SDimitry Andric __kmp_error_construct(kmp_i18n_msg_CnsLoopIncrIllegal, ct_pdo, loc); 7890b57cec5SDimitry Andric } 7900b57cec5SDimitry Andric } 7910b57cec5SDimitry Andric th = __kmp_threads[gtid]; 7920b57cec5SDimitry Andric team = th->th.th_team; 7930b57cec5SDimitry Andric KMP_DEBUG_ASSERT(th->th.th_teams_microtask); // we are in the teams construct 7940b57cec5SDimitry Andric nteams = th->th.th_teams_size.nteams; 7950b57cec5SDimitry Andric team_id = team->t.t_master_tid; 7960b57cec5SDimitry Andric KMP_DEBUG_ASSERT(nteams == (kmp_uint32)team->t.t_parent->t.t_nproc); 7970b57cec5SDimitry Andric 7980b57cec5SDimitry Andric // compute trip count 7990b57cec5SDimitry Andric if (incr == 1) { 8000b57cec5SDimitry Andric trip_count = upper - lower + 1; 8010b57cec5SDimitry Andric } else if (incr == -1) { 8020b57cec5SDimitry Andric trip_count = lower - upper + 1; 8030b57cec5SDimitry Andric } else if (incr > 0) { 8040b57cec5SDimitry Andric // upper-lower can exceed the limit of signed type 8050b57cec5SDimitry Andric trip_count = (UT)(upper - lower) / incr + 1; 8060b57cec5SDimitry Andric } else { 8070b57cec5SDimitry Andric trip_count = (UT)(lower - upper) / (-incr) + 1; 8080b57cec5SDimitry Andric } 8090b57cec5SDimitry Andric if (chunk < 1) 8100b57cec5SDimitry Andric chunk = 1; 8110b57cec5SDimitry Andric span = chunk * incr; 8120b57cec5SDimitry Andric 
*p_st = span * nteams; 8130b57cec5SDimitry Andric *p_lb = lower + (span * team_id); 8140b57cec5SDimitry Andric *p_ub = *p_lb + span - incr; 8150b57cec5SDimitry Andric if (p_last != NULL) 8160b57cec5SDimitry Andric *p_last = (team_id == ((trip_count - 1) / (UT)chunk) % nteams); 8170b57cec5SDimitry Andric // Correct upper bound if needed 8180b57cec5SDimitry Andric if (incr > 0) { 8190b57cec5SDimitry Andric if (*p_ub < *p_lb) // overflow? 8200b57cec5SDimitry Andric *p_ub = traits_t<T>::max_value; 8210b57cec5SDimitry Andric if (*p_ub > upper) 8220b57cec5SDimitry Andric *p_ub = upper; // tracker C73258 8230b57cec5SDimitry Andric } else { // incr < 0 8240b57cec5SDimitry Andric if (*p_ub > *p_lb) 8250b57cec5SDimitry Andric *p_ub = traits_t<T>::min_value; 8260b57cec5SDimitry Andric if (*p_ub < upper) 8270b57cec5SDimitry Andric *p_ub = upper; // tracker C73258 8280b57cec5SDimitry Andric } 8290b57cec5SDimitry Andric #ifdef KMP_DEBUG 8300b57cec5SDimitry Andric { 8310b57cec5SDimitry Andric char *buff; 8320b57cec5SDimitry Andric // create format specifiers before the debug output 8330b57cec5SDimitry Andric buff = 8340b57cec5SDimitry Andric __kmp_str_format("__kmp_team_static_init exit: T#%%d team%%u liter=%%d " 8350b57cec5SDimitry Andric "iter=(%%%s, %%%s, %%%s) chunk %%%s\n", 8360b57cec5SDimitry Andric traits_t<T>::spec, traits_t<T>::spec, 8370b57cec5SDimitry Andric traits_t<ST>::spec, traits_t<ST>::spec); 8380b57cec5SDimitry Andric KD_TRACE(100, (buff, gtid, team_id, *p_last, *p_lb, *p_ub, *p_st, chunk)); 8390b57cec5SDimitry Andric __kmp_str_free(&buff); 8400b57cec5SDimitry Andric } 8410b57cec5SDimitry Andric #endif 8420b57cec5SDimitry Andric } 8430b57cec5SDimitry Andric 8440b57cec5SDimitry Andric //------------------------------------------------------------------------------ 8450b57cec5SDimitry Andric extern "C" { 8460b57cec5SDimitry Andric /*! 
8470b57cec5SDimitry Andric @ingroup WORK_SHARING 8480b57cec5SDimitry Andric @param loc Source code location 8490b57cec5SDimitry Andric @param gtid Global thread id of this thread 8500b57cec5SDimitry Andric @param schedtype Scheduling type 8510b57cec5SDimitry Andric @param plastiter Pointer to the "last iteration" flag 8520b57cec5SDimitry Andric @param plower Pointer to the lower bound 8530b57cec5SDimitry Andric @param pupper Pointer to the upper bound 8540b57cec5SDimitry Andric @param pstride Pointer to the stride 8550b57cec5SDimitry Andric @param incr Loop increment 8560b57cec5SDimitry Andric @param chunk The chunk size 8570b57cec5SDimitry Andric 8580b57cec5SDimitry Andric Each of the four functions here are identical apart from the argument types. 8590b57cec5SDimitry Andric 8600b57cec5SDimitry Andric The functions compute the upper and lower bounds and stride to be used for the 8610b57cec5SDimitry Andric set of iterations to be executed by the current thread from the statically 8620b57cec5SDimitry Andric scheduled loop that is described by the initial values of the bounds, stride, 8630b57cec5SDimitry Andric increment and chunk size. 8640b57cec5SDimitry Andric 8650b57cec5SDimitry Andric @{ 8660b57cec5SDimitry Andric */ 8670b57cec5SDimitry Andric void __kmpc_for_static_init_4(ident_t *loc, kmp_int32 gtid, kmp_int32 schedtype, 8680b57cec5SDimitry Andric kmp_int32 *plastiter, kmp_int32 *plower, 8690b57cec5SDimitry Andric kmp_int32 *pupper, kmp_int32 *pstride, 8700b57cec5SDimitry Andric kmp_int32 incr, kmp_int32 chunk) { 8710b57cec5SDimitry Andric __kmp_for_static_init<kmp_int32>(loc, gtid, schedtype, plastiter, plower, 8720b57cec5SDimitry Andric pupper, pstride, incr, chunk 8730b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 8740b57cec5SDimitry Andric , 8750b57cec5SDimitry Andric OMPT_GET_RETURN_ADDRESS(0) 8760b57cec5SDimitry Andric #endif 8770b57cec5SDimitry Andric ); 8780b57cec5SDimitry Andric } 8790b57cec5SDimitry Andric 8800b57cec5SDimitry Andric /*! 
8810b57cec5SDimitry Andric See @ref __kmpc_for_static_init_4 8820b57cec5SDimitry Andric */ 8830b57cec5SDimitry Andric void __kmpc_for_static_init_4u(ident_t *loc, kmp_int32 gtid, 8840b57cec5SDimitry Andric kmp_int32 schedtype, kmp_int32 *plastiter, 8850b57cec5SDimitry Andric kmp_uint32 *plower, kmp_uint32 *pupper, 8860b57cec5SDimitry Andric kmp_int32 *pstride, kmp_int32 incr, 8870b57cec5SDimitry Andric kmp_int32 chunk) { 8880b57cec5SDimitry Andric __kmp_for_static_init<kmp_uint32>(loc, gtid, schedtype, plastiter, plower, 8890b57cec5SDimitry Andric pupper, pstride, incr, chunk 8900b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 8910b57cec5SDimitry Andric , 8920b57cec5SDimitry Andric OMPT_GET_RETURN_ADDRESS(0) 8930b57cec5SDimitry Andric #endif 8940b57cec5SDimitry Andric ); 8950b57cec5SDimitry Andric } 8960b57cec5SDimitry Andric 8970b57cec5SDimitry Andric /*! 8980b57cec5SDimitry Andric See @ref __kmpc_for_static_init_4 8990b57cec5SDimitry Andric */ 9000b57cec5SDimitry Andric void __kmpc_for_static_init_8(ident_t *loc, kmp_int32 gtid, kmp_int32 schedtype, 9010b57cec5SDimitry Andric kmp_int32 *plastiter, kmp_int64 *plower, 9020b57cec5SDimitry Andric kmp_int64 *pupper, kmp_int64 *pstride, 9030b57cec5SDimitry Andric kmp_int64 incr, kmp_int64 chunk) { 9040b57cec5SDimitry Andric __kmp_for_static_init<kmp_int64>(loc, gtid, schedtype, plastiter, plower, 9050b57cec5SDimitry Andric pupper, pstride, incr, chunk 9060b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 9070b57cec5SDimitry Andric , 9080b57cec5SDimitry Andric OMPT_GET_RETURN_ADDRESS(0) 9090b57cec5SDimitry Andric #endif 9100b57cec5SDimitry Andric ); 9110b57cec5SDimitry Andric } 9120b57cec5SDimitry Andric 9130b57cec5SDimitry Andric /*! 
9140b57cec5SDimitry Andric See @ref __kmpc_for_static_init_4 9150b57cec5SDimitry Andric */ 9160b57cec5SDimitry Andric void __kmpc_for_static_init_8u(ident_t *loc, kmp_int32 gtid, 9170b57cec5SDimitry Andric kmp_int32 schedtype, kmp_int32 *plastiter, 9180b57cec5SDimitry Andric kmp_uint64 *plower, kmp_uint64 *pupper, 9190b57cec5SDimitry Andric kmp_int64 *pstride, kmp_int64 incr, 9200b57cec5SDimitry Andric kmp_int64 chunk) { 9210b57cec5SDimitry Andric __kmp_for_static_init<kmp_uint64>(loc, gtid, schedtype, plastiter, plower, 9220b57cec5SDimitry Andric pupper, pstride, incr, chunk 9230b57cec5SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 9240b57cec5SDimitry Andric , 9250b57cec5SDimitry Andric OMPT_GET_RETURN_ADDRESS(0) 9260b57cec5SDimitry Andric #endif 9270b57cec5SDimitry Andric ); 9280b57cec5SDimitry Andric } 9290b57cec5SDimitry Andric /*! 9300b57cec5SDimitry Andric @} 9310b57cec5SDimitry Andric */ 9320b57cec5SDimitry Andric 933*81ad6265SDimitry Andric #if OMPT_SUPPORT && OMPT_OPTIONAL 934*81ad6265SDimitry Andric #define OMPT_CODEPTR_ARG , OMPT_GET_RETURN_ADDRESS(0) 935*81ad6265SDimitry Andric #else 936*81ad6265SDimitry Andric #define OMPT_CODEPTR_ARG 937*81ad6265SDimitry Andric #endif 938*81ad6265SDimitry Andric 9390b57cec5SDimitry Andric /*! 
@ingroup WORK_SHARING
@param    loc       Source code location
@param    gtid      Global thread id of this thread
@param    schedule  Scheduling type for the parallel loop
@param    plastiter Pointer to the "last iteration" flag
@param    plower    Pointer to the lower bound
@param    pupper    Pointer to the upper bound of loop chunk
@param    pupperD   Pointer to the upper bound of dist_chunk
@param    pstride   Pointer to the stride for parallel loop
@param    incr      Loop increment
@param    chunk     The chunk size for the parallel loop

Each of the four functions here is identical apart from the argument types.

The functions compute the upper and lower bounds and strides to be used for the
set of iterations to be executed by the current thread from the statically
scheduled loop that is described by the initial values of the bounds, strides,
increment and chunks for parallel loop and distribute constructs.
9580b57cec5SDimitry Andric 9590b57cec5SDimitry Andric @{ 9600b57cec5SDimitry Andric */ 9610b57cec5SDimitry Andric void __kmpc_dist_for_static_init_4(ident_t *loc, kmp_int32 gtid, 9620b57cec5SDimitry Andric kmp_int32 schedule, kmp_int32 *plastiter, 9630b57cec5SDimitry Andric kmp_int32 *plower, kmp_int32 *pupper, 9640b57cec5SDimitry Andric kmp_int32 *pupperD, kmp_int32 *pstride, 9650b57cec5SDimitry Andric kmp_int32 incr, kmp_int32 chunk) { 9660b57cec5SDimitry Andric __kmp_dist_for_static_init<kmp_int32>(loc, gtid, schedule, plastiter, plower, 967*81ad6265SDimitry Andric pupper, pupperD, pstride, incr, 968*81ad6265SDimitry Andric chunk OMPT_CODEPTR_ARG); 9690b57cec5SDimitry Andric } 9700b57cec5SDimitry Andric 9710b57cec5SDimitry Andric /*! 9720b57cec5SDimitry Andric See @ref __kmpc_dist_for_static_init_4 9730b57cec5SDimitry Andric */ 9740b57cec5SDimitry Andric void __kmpc_dist_for_static_init_4u(ident_t *loc, kmp_int32 gtid, 9750b57cec5SDimitry Andric kmp_int32 schedule, kmp_int32 *plastiter, 9760b57cec5SDimitry Andric kmp_uint32 *plower, kmp_uint32 *pupper, 9770b57cec5SDimitry Andric kmp_uint32 *pupperD, kmp_int32 *pstride, 9780b57cec5SDimitry Andric kmp_int32 incr, kmp_int32 chunk) { 9790b57cec5SDimitry Andric __kmp_dist_for_static_init<kmp_uint32>(loc, gtid, schedule, plastiter, plower, 980*81ad6265SDimitry Andric pupper, pupperD, pstride, incr, 981*81ad6265SDimitry Andric chunk OMPT_CODEPTR_ARG); 9820b57cec5SDimitry Andric } 9830b57cec5SDimitry Andric 9840b57cec5SDimitry Andric /*! 
9850b57cec5SDimitry Andric See @ref __kmpc_dist_for_static_init_4 9860b57cec5SDimitry Andric */ 9870b57cec5SDimitry Andric void __kmpc_dist_for_static_init_8(ident_t *loc, kmp_int32 gtid, 9880b57cec5SDimitry Andric kmp_int32 schedule, kmp_int32 *plastiter, 9890b57cec5SDimitry Andric kmp_int64 *plower, kmp_int64 *pupper, 9900b57cec5SDimitry Andric kmp_int64 *pupperD, kmp_int64 *pstride, 9910b57cec5SDimitry Andric kmp_int64 incr, kmp_int64 chunk) { 9920b57cec5SDimitry Andric __kmp_dist_for_static_init<kmp_int64>(loc, gtid, schedule, plastiter, plower, 993*81ad6265SDimitry Andric pupper, pupperD, pstride, incr, 994*81ad6265SDimitry Andric chunk OMPT_CODEPTR_ARG); 9950b57cec5SDimitry Andric } 9960b57cec5SDimitry Andric 9970b57cec5SDimitry Andric /*! 9980b57cec5SDimitry Andric See @ref __kmpc_dist_for_static_init_4 9990b57cec5SDimitry Andric */ 10000b57cec5SDimitry Andric void __kmpc_dist_for_static_init_8u(ident_t *loc, kmp_int32 gtid, 10010b57cec5SDimitry Andric kmp_int32 schedule, kmp_int32 *plastiter, 10020b57cec5SDimitry Andric kmp_uint64 *plower, kmp_uint64 *pupper, 10030b57cec5SDimitry Andric kmp_uint64 *pupperD, kmp_int64 *pstride, 10040b57cec5SDimitry Andric kmp_int64 incr, kmp_int64 chunk) { 10050b57cec5SDimitry Andric __kmp_dist_for_static_init<kmp_uint64>(loc, gtid, schedule, plastiter, plower, 1006*81ad6265SDimitry Andric pupper, pupperD, pstride, incr, 1007*81ad6265SDimitry Andric chunk OMPT_CODEPTR_ARG); 10080b57cec5SDimitry Andric } 10090b57cec5SDimitry Andric /*! 
@}
*/

//------------------------------------------------------------------------------
// Auxiliary routines for Distribute Parallel Loop construct implementation
//    Transfer call to template< type T >
//    __kmp_team_static_init( ident_t *loc, int gtid,
//        int *p_last, T *lb, T *ub, ST *st, ST incr, ST chunk )

/*!
@ingroup WORK_SHARING
@{
@param loc Source location
@param gtid Global thread id
@param p_last pointer to last iteration flag
@param p_lb  pointer to Lower bound
@param p_ub  pointer to Upper bound
@param p_st  pointer to the stride used to calculate the team's next chunks
@param incr  Loop increment
@param chunk The chunk size to block with

The functions compute the upper and lower bounds and stride to be used for the
set of iterations to be executed by the current team from the statically
scheduled loop that is described by the initial values of the bounds, stride,
increment and chunk for the distribute construct as part of composite distribute
parallel loop construct. These functions are all identical apart from the types
of the arguments.
10370b57cec5SDimitry Andric */ 10380b57cec5SDimitry Andric 10390b57cec5SDimitry Andric void __kmpc_team_static_init_4(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, 10400b57cec5SDimitry Andric kmp_int32 *p_lb, kmp_int32 *p_ub, 10410b57cec5SDimitry Andric kmp_int32 *p_st, kmp_int32 incr, 10420b57cec5SDimitry Andric kmp_int32 chunk) { 10430b57cec5SDimitry Andric KMP_DEBUG_ASSERT(__kmp_init_serial); 10440b57cec5SDimitry Andric __kmp_team_static_init<kmp_int32>(loc, gtid, p_last, p_lb, p_ub, p_st, incr, 10450b57cec5SDimitry Andric chunk); 10460b57cec5SDimitry Andric } 10470b57cec5SDimitry Andric 10480b57cec5SDimitry Andric /*! 10490b57cec5SDimitry Andric See @ref __kmpc_team_static_init_4 10500b57cec5SDimitry Andric */ 10510b57cec5SDimitry Andric void __kmpc_team_static_init_4u(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, 10520b57cec5SDimitry Andric kmp_uint32 *p_lb, kmp_uint32 *p_ub, 10530b57cec5SDimitry Andric kmp_int32 *p_st, kmp_int32 incr, 10540b57cec5SDimitry Andric kmp_int32 chunk) { 10550b57cec5SDimitry Andric KMP_DEBUG_ASSERT(__kmp_init_serial); 10560b57cec5SDimitry Andric __kmp_team_static_init<kmp_uint32>(loc, gtid, p_last, p_lb, p_ub, p_st, incr, 10570b57cec5SDimitry Andric chunk); 10580b57cec5SDimitry Andric } 10590b57cec5SDimitry Andric 10600b57cec5SDimitry Andric /*! 10610b57cec5SDimitry Andric See @ref __kmpc_team_static_init_4 10620b57cec5SDimitry Andric */ 10630b57cec5SDimitry Andric void __kmpc_team_static_init_8(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, 10640b57cec5SDimitry Andric kmp_int64 *p_lb, kmp_int64 *p_ub, 10650b57cec5SDimitry Andric kmp_int64 *p_st, kmp_int64 incr, 10660b57cec5SDimitry Andric kmp_int64 chunk) { 10670b57cec5SDimitry Andric KMP_DEBUG_ASSERT(__kmp_init_serial); 10680b57cec5SDimitry Andric __kmp_team_static_init<kmp_int64>(loc, gtid, p_last, p_lb, p_ub, p_st, incr, 10690b57cec5SDimitry Andric chunk); 10700b57cec5SDimitry Andric } 10710b57cec5SDimitry Andric 10720b57cec5SDimitry Andric /*! 
10730b57cec5SDimitry Andric See @ref __kmpc_team_static_init_4 10740b57cec5SDimitry Andric */ 10750b57cec5SDimitry Andric void __kmpc_team_static_init_8u(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, 10760b57cec5SDimitry Andric kmp_uint64 *p_lb, kmp_uint64 *p_ub, 10770b57cec5SDimitry Andric kmp_int64 *p_st, kmp_int64 incr, 10780b57cec5SDimitry Andric kmp_int64 chunk) { 10790b57cec5SDimitry Andric KMP_DEBUG_ASSERT(__kmp_init_serial); 10800b57cec5SDimitry Andric __kmp_team_static_init<kmp_uint64>(loc, gtid, p_last, p_lb, p_ub, p_st, incr, 10810b57cec5SDimitry Andric chunk); 10820b57cec5SDimitry Andric } 10830b57cec5SDimitry Andric /*! 10840b57cec5SDimitry Andric @} 10850b57cec5SDimitry Andric */ 10860b57cec5SDimitry Andric 10870b57cec5SDimitry Andric } // extern "C" 1088