10b57cec5SDimitry Andric /* 20b57cec5SDimitry Andric * kmp_taskdeps.h 30b57cec5SDimitry Andric */ 40b57cec5SDimitry Andric 50b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 80b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 90b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 100b57cec5SDimitry Andric // 110b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 120b57cec5SDimitry Andric 130b57cec5SDimitry Andric #ifndef KMP_TASKDEPS_H 140b57cec5SDimitry Andric #define KMP_TASKDEPS_H 150b57cec5SDimitry Andric 160b57cec5SDimitry Andric #include "kmp.h" 170b57cec5SDimitry Andric 180b57cec5SDimitry Andric #define KMP_ACQUIRE_DEPNODE(gtid, n) __kmp_acquire_lock(&(n)->dn.lock, (gtid)) 190b57cec5SDimitry Andric #define KMP_RELEASE_DEPNODE(gtid, n) __kmp_release_lock(&(n)->dn.lock, (gtid)) 200b57cec5SDimitry Andric 210b57cec5SDimitry Andric static inline void __kmp_node_deref(kmp_info_t *thread, kmp_depnode_t *node) { 220b57cec5SDimitry Andric if (!node) 230b57cec5SDimitry Andric return; 240b57cec5SDimitry Andric 250b57cec5SDimitry Andric kmp_int32 n = KMP_ATOMIC_DEC(&node->dn.nrefs) - 1; 266e75b2fbSDimitry Andric KMP_DEBUG_ASSERT(n >= 0); 270b57cec5SDimitry Andric if (n == 0) { 28*81ad6265SDimitry Andric #if USE_ITT_BUILD && USE_ITT_NOTIFY 29*81ad6265SDimitry Andric __itt_sync_destroy(node); 30*81ad6265SDimitry Andric #endif 310b57cec5SDimitry Andric KMP_ASSERT(node->dn.nrefs == 0); 320b57cec5SDimitry Andric #if USE_FAST_MEMORY 330b57cec5SDimitry Andric __kmp_fast_free(thread, node); 340b57cec5SDimitry Andric #else 350b57cec5SDimitry Andric __kmp_thread_free(thread, node); 360b57cec5SDimitry Andric #endif 370b57cec5SDimitry Andric } 380b57cec5SDimitry Andric } 390b57cec5SDimitry Andric 400b57cec5SDimitry Andric static inline void __kmp_depnode_list_free(kmp_info_t *thread, 410b57cec5SDimitry Andric kmp_depnode_list *list) { 420b57cec5SDimitry Andric kmp_depnode_list *next; 430b57cec5SDimitry Andric 440b57cec5SDimitry Andric for (; list; list = next) { 450b57cec5SDimitry Andric next = list->next; 460b57cec5SDimitry Andric 470b57cec5SDimitry Andric __kmp_node_deref(thread, list->node); 480b57cec5SDimitry Andric #if USE_FAST_MEMORY 490b57cec5SDimitry Andric __kmp_fast_free(thread, list); 500b57cec5SDimitry Andric #else 510b57cec5SDimitry Andric __kmp_thread_free(thread, list); 520b57cec5SDimitry Andric #endif 530b57cec5SDimitry Andric } 540b57cec5SDimitry Andric } 550b57cec5SDimitry Andric 560b57cec5SDimitry Andric static inline void __kmp_dephash_free_entries(kmp_info_t *thread, 570b57cec5SDimitry Andric kmp_dephash_t *h) { 580b57cec5SDimitry Andric for (size_t i = 0; i < h->size; i++) { 590b57cec5SDimitry Andric if (h->buckets[i]) { 600b57cec5SDimitry Andric kmp_dephash_entry_t *next; 610b57cec5SDimitry Andric for (kmp_dephash_entry_t *entry = h->buckets[i]; entry; entry = next) { 620b57cec5SDimitry Andric next = entry->next_in_bucket; 63fe6060f1SDimitry Andric __kmp_depnode_list_free(thread, entry->last_set); 64fe6060f1SDimitry Andric __kmp_depnode_list_free(thread, entry->prev_set); 650b57cec5SDimitry Andric __kmp_node_deref(thread, entry->last_out); 660b57cec5SDimitry Andric if (entry->mtx_lock) { 670b57cec5SDimitry Andric __kmp_destroy_lock(entry->mtx_lock); 680b57cec5SDimitry Andric __kmp_free(entry->mtx_lock); 690b57cec5SDimitry Andric } 700b57cec5SDimitry Andric #if USE_FAST_MEMORY 710b57cec5SDimitry Andric __kmp_fast_free(thread, entry); 720b57cec5SDimitry Andric #else 730b57cec5SDimitry Andric __kmp_thread_free(thread, entry); 740b57cec5SDimitry Andric #endif 750b57cec5SDimitry Andric } 760b57cec5SDimitry Andric h->buckets[i] = 0; 770b57cec5SDimitry Andric } 780b57cec5SDimitry Andric } 79349cc55cSDimitry Andric __kmp_node_deref(thread, h->last_all); 80349cc55cSDimitry Andric h->last_all = NULL; 810b57cec5SDimitry Andric } 820b57cec5SDimitry Andric 830b57cec5SDimitry Andric static inline void __kmp_dephash_free(kmp_info_t *thread, kmp_dephash_t *h) { 840b57cec5SDimitry Andric __kmp_dephash_free_entries(thread, h); 850b57cec5SDimitry Andric #if USE_FAST_MEMORY 860b57cec5SDimitry Andric __kmp_fast_free(thread, h); 870b57cec5SDimitry Andric #else 880b57cec5SDimitry Andric __kmp_thread_free(thread, h); 890b57cec5SDimitry Andric #endif 900b57cec5SDimitry Andric } 910b57cec5SDimitry Andric 92fe6060f1SDimitry Andric extern void __kmpc_give_task(kmp_task_t *ptask, kmp_int32 start); 93fe6060f1SDimitry Andric 940b57cec5SDimitry Andric static inline void __kmp_release_deps(kmp_int32 gtid, kmp_taskdata_t *task) { 950b57cec5SDimitry Andric kmp_info_t *thread = __kmp_threads[gtid]; 960b57cec5SDimitry Andric kmp_depnode_t *node = task->td_depnode; 970b57cec5SDimitry Andric 98e8d8bef9SDimitry Andric // Check mutexinoutset dependencies, release locks 99e8d8bef9SDimitry Andric if (UNLIKELY(node && (node->dn.mtx_num_locks < 0))) { 100e8d8bef9SDimitry Andric // negative num_locks means all locks were acquired 101e8d8bef9SDimitry Andric node->dn.mtx_num_locks = -node->dn.mtx_num_locks; 102e8d8bef9SDimitry Andric for (int i = node->dn.mtx_num_locks - 1; i >= 0; --i) { 103e8d8bef9SDimitry Andric KMP_DEBUG_ASSERT(node->dn.mtx_locks[i] != NULL); 104e8d8bef9SDimitry Andric __kmp_release_lock(node->dn.mtx_locks[i], gtid); 105e8d8bef9SDimitry Andric } 106e8d8bef9SDimitry Andric } 107e8d8bef9SDimitry Andric 1080b57cec5SDimitry Andric if (task->td_dephash) { 1090b57cec5SDimitry Andric KA_TRACE( 1100b57cec5SDimitry Andric 40, ("__kmp_release_deps: T#%d freeing dependencies hash of task %p.\n", 1110b57cec5SDimitry Andric gtid, task)); 1120b57cec5SDimitry Andric __kmp_dephash_free(thread, task->td_dephash); 1130b57cec5SDimitry Andric task->td_dephash = NULL; 1140b57cec5SDimitry Andric } 1150b57cec5SDimitry Andric 1160b57cec5SDimitry Andric if (!node) 1170b57cec5SDimitry Andric return; 1180b57cec5SDimitry Andric 1190b57cec5SDimitry Andric KA_TRACE(20, ("__kmp_release_deps: T#%d notifying successors of task %p.\n", 1200b57cec5SDimitry Andric gtid, task)); 1210b57cec5SDimitry Andric 1220b57cec5SDimitry Andric KMP_ACQUIRE_DEPNODE(gtid, node); 1230b57cec5SDimitry Andric node->dn.task = 1240b57cec5SDimitry Andric NULL; // mark this task as finished, so no new dependencies are generated 1250b57cec5SDimitry Andric KMP_RELEASE_DEPNODE(gtid, node); 1260b57cec5SDimitry Andric 1270b57cec5SDimitry Andric kmp_depnode_list_t *next; 128e8d8bef9SDimitry Andric kmp_taskdata_t *next_taskdata; 1290b57cec5SDimitry Andric for (kmp_depnode_list_t *p = node->dn.successors; p; p = next) { 1300b57cec5SDimitry Andric kmp_depnode_t *successor = p->node; 131*81ad6265SDimitry Andric #if USE_ITT_BUILD && USE_ITT_NOTIFY 132*81ad6265SDimitry Andric __itt_sync_releasing(successor); 133*81ad6265SDimitry Andric #endif 1340b57cec5SDimitry Andric kmp_int32 npredecessors = KMP_ATOMIC_DEC(&successor->dn.npredecessors) - 1; 1350b57cec5SDimitry Andric 1360b57cec5SDimitry Andric // successor task can be NULL for wait_depends or because deps are still 1370b57cec5SDimitry Andric // being processed 1380b57cec5SDimitry Andric if (npredecessors == 0) { 139*81ad6265SDimitry Andric #if USE_ITT_BUILD && USE_ITT_NOTIFY 140*81ad6265SDimitry Andric __itt_sync_acquired(successor); 141*81ad6265SDimitry Andric #endif 1420b57cec5SDimitry Andric KMP_MB(); 1430b57cec5SDimitry Andric if (successor->dn.task) { 1440b57cec5SDimitry Andric KA_TRACE(20, ("__kmp_release_deps: T#%d successor %p of %p scheduled " 1450b57cec5SDimitry Andric "for execution.\n", 1460b57cec5SDimitry Andric gtid, successor->dn.task, task)); 147e8d8bef9SDimitry Andric // If a regular task depending on a hidden helper task, when the 148e8d8bef9SDimitry Andric // hidden helper task is done, the regular task should be executed by 149e8d8bef9SDimitry Andric // its encountering team. 150e8d8bef9SDimitry Andric if (KMP_HIDDEN_HELPER_THREAD(gtid)) { 151e8d8bef9SDimitry Andric // Hidden helper thread can only execute hidden helper tasks 152e8d8bef9SDimitry Andric KMP_ASSERT(task->td_flags.hidden_helper); 153e8d8bef9SDimitry Andric next_taskdata = KMP_TASK_TO_TASKDATA(successor->dn.task); 154e8d8bef9SDimitry Andric // If the dependent task is a regular task, we need to push to its 155e8d8bef9SDimitry Andric // encountering thread's queue; otherwise, it can be pushed to its own 156e8d8bef9SDimitry Andric // queue. 157e8d8bef9SDimitry Andric if (!next_taskdata->td_flags.hidden_helper) { 158349cc55cSDimitry Andric kmp_int32 encountering_gtid = 159349cc55cSDimitry Andric next_taskdata->td_alloc_thread->th.th_info.ds.ds_gtid; 160349cc55cSDimitry Andric kmp_int32 encountering_tid = __kmp_tid_from_gtid(encountering_gtid); 161349cc55cSDimitry Andric __kmpc_give_task(successor->dn.task, encountering_tid); 162e8d8bef9SDimitry Andric } else { 1630b57cec5SDimitry Andric __kmp_omp_task(gtid, successor->dn.task, false); 1640b57cec5SDimitry Andric } 165e8d8bef9SDimitry Andric } else { 166e8d8bef9SDimitry Andric __kmp_omp_task(gtid, successor->dn.task, false); 167e8d8bef9SDimitry Andric } 168e8d8bef9SDimitry Andric } 1690b57cec5SDimitry Andric } 1700b57cec5SDimitry Andric 1710b57cec5SDimitry Andric next = p->next; 1720b57cec5SDimitry Andric __kmp_node_deref(thread, p->node); 1730b57cec5SDimitry Andric #if USE_FAST_MEMORY 1740b57cec5SDimitry Andric __kmp_fast_free(thread, p); 1750b57cec5SDimitry Andric #else 1760b57cec5SDimitry Andric __kmp_thread_free(thread, p); 1770b57cec5SDimitry Andric #endif 1780b57cec5SDimitry Andric } 1790b57cec5SDimitry Andric 1800b57cec5SDimitry Andric __kmp_node_deref(thread, node); 1810b57cec5SDimitry Andric 1820b57cec5SDimitry Andric KA_TRACE( 1830b57cec5SDimitry Andric 20, 1840b57cec5SDimitry Andric ("__kmp_release_deps: T#%d all successors of %p notified of completion\n", 1850b57cec5SDimitry Andric gtid, task)); 1860b57cec5SDimitry Andric } 1870b57cec5SDimitry Andric 1880b57cec5SDimitry Andric #endif // KMP_TASKDEPS_H 189