/*
 * Copyright 2011-2015 Samy Al Bahra.
 * Copyright 2011 David Joseph.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <ck_barrier.h>
#include <ck_cc.h>
#include <ck_pr.h>
#include <ck_spinlock.h>

/*
 * Singly-linked FIFO of combining groups, used for the level-order scan
 * performed when a new group is linked into the tree. The groups carry
 * the link themselves (their next member), so the queue only tracks both
 * ends of the list.
 */
struct ck_barrier_combining_queue {
	/* Next group to be dequeued; NULL when the queue is empty. */
	struct ck_barrier_combining_group *head;
	/* Most recently enqueued group; only meaningful while head != NULL. */
	struct ck_barrier_combining_group *tail;
};

38*d8f1ed8dSOlivier Houchard static struct ck_barrier_combining_group *
ck_barrier_combining_queue_dequeue(struct ck_barrier_combining_queue * queue)391fb62fb0SOlivier Houchard ck_barrier_combining_queue_dequeue(struct ck_barrier_combining_queue *queue)
401fb62fb0SOlivier Houchard {
411fb62fb0SOlivier Houchard struct ck_barrier_combining_group *front = NULL;
421fb62fb0SOlivier Houchard
431fb62fb0SOlivier Houchard if (queue->head != NULL) {
441fb62fb0SOlivier Houchard front = queue->head;
451fb62fb0SOlivier Houchard queue->head = queue->head->next;
461fb62fb0SOlivier Houchard }
471fb62fb0SOlivier Houchard
481fb62fb0SOlivier Houchard return front;
491fb62fb0SOlivier Houchard }
501fb62fb0SOlivier Houchard
51*d8f1ed8dSOlivier Houchard static void
ck_barrier_combining_insert(struct ck_barrier_combining_group * parent,struct ck_barrier_combining_group * tnode,struct ck_barrier_combining_group ** child)521fb62fb0SOlivier Houchard ck_barrier_combining_insert(struct ck_barrier_combining_group *parent,
531fb62fb0SOlivier Houchard struct ck_barrier_combining_group *tnode,
541fb62fb0SOlivier Houchard struct ck_barrier_combining_group **child)
551fb62fb0SOlivier Houchard {
561fb62fb0SOlivier Houchard
571fb62fb0SOlivier Houchard *child = tnode;
581fb62fb0SOlivier Houchard tnode->parent = parent;
591fb62fb0SOlivier Houchard
601fb62fb0SOlivier Houchard /*
611fb62fb0SOlivier Houchard * After inserting, we must increment the parent group's count for
621fb62fb0SOlivier Houchard * number of threads expected to reach it; otherwise, the
631fb62fb0SOlivier Houchard * barrier may end prematurely.
641fb62fb0SOlivier Houchard */
651fb62fb0SOlivier Houchard parent->k++;
661fb62fb0SOlivier Houchard return;
671fb62fb0SOlivier Houchard }
681fb62fb0SOlivier Houchard
/*
 * This implementation of software combining tree barriers
 * uses level-order traversal to insert new thread groups
 * into the barrier's tree. We use a queue to implement this
 * traversal.
 */
75*d8f1ed8dSOlivier Houchard static void
ck_barrier_combining_queue_enqueue(struct ck_barrier_combining_queue * queue,struct ck_barrier_combining_group * node_value)761fb62fb0SOlivier Houchard ck_barrier_combining_queue_enqueue(struct ck_barrier_combining_queue *queue,
771fb62fb0SOlivier Houchard struct ck_barrier_combining_group *node_value)
781fb62fb0SOlivier Houchard {
791fb62fb0SOlivier Houchard
801fb62fb0SOlivier Houchard node_value->next = NULL;
811fb62fb0SOlivier Houchard if (queue->head == NULL) {
821fb62fb0SOlivier Houchard queue->head = queue->tail = node_value;
831fb62fb0SOlivier Houchard return;
841fb62fb0SOlivier Houchard }
851fb62fb0SOlivier Houchard
861fb62fb0SOlivier Houchard queue->tail->next = node_value;
871fb62fb0SOlivier Houchard queue->tail = node_value;
881fb62fb0SOlivier Houchard
891fb62fb0SOlivier Houchard return;
901fb62fb0SOlivier Houchard }
911fb62fb0SOlivier Houchard
921fb62fb0SOlivier Houchard
931fb62fb0SOlivier Houchard void
ck_barrier_combining_group_init(struct ck_barrier_combining * root,struct ck_barrier_combining_group * tnode,unsigned int nthr)941fb62fb0SOlivier Houchard ck_barrier_combining_group_init(struct ck_barrier_combining *root,
951fb62fb0SOlivier Houchard struct ck_barrier_combining_group *tnode,
961fb62fb0SOlivier Houchard unsigned int nthr)
971fb62fb0SOlivier Houchard {
981fb62fb0SOlivier Houchard struct ck_barrier_combining_group *node;
991fb62fb0SOlivier Houchard struct ck_barrier_combining_queue queue;
1001fb62fb0SOlivier Houchard
1011fb62fb0SOlivier Houchard queue.head = queue.tail = NULL;
1021fb62fb0SOlivier Houchard
1031fb62fb0SOlivier Houchard tnode->k = nthr;
1041fb62fb0SOlivier Houchard tnode->count = 0;
1051fb62fb0SOlivier Houchard tnode->sense = 0;
1061fb62fb0SOlivier Houchard tnode->left = tnode->right = NULL;
1071fb62fb0SOlivier Houchard
1081fb62fb0SOlivier Houchard /*
1091fb62fb0SOlivier Houchard * Finds the first available node for linkage into the combining
1101fb62fb0SOlivier Houchard * tree. The use of a spinlock is excusable as this is a one-time
1111fb62fb0SOlivier Houchard * initialization cost.
1121fb62fb0SOlivier Houchard */
1131fb62fb0SOlivier Houchard ck_spinlock_fas_lock(&root->mutex);
1141fb62fb0SOlivier Houchard ck_barrier_combining_queue_enqueue(&queue, root->root);
1151fb62fb0SOlivier Houchard while (queue.head != NULL) {
1161fb62fb0SOlivier Houchard node = ck_barrier_combining_queue_dequeue(&queue);
1171fb62fb0SOlivier Houchard
1181fb62fb0SOlivier Houchard /* If the left child is free, link the group there. */
1191fb62fb0SOlivier Houchard if (node->left == NULL) {
1201fb62fb0SOlivier Houchard ck_barrier_combining_insert(node, tnode, &node->left);
1211fb62fb0SOlivier Houchard goto leave;
1221fb62fb0SOlivier Houchard }
1231fb62fb0SOlivier Houchard
1241fb62fb0SOlivier Houchard /* If the right child is free, link the group there. */
1251fb62fb0SOlivier Houchard if (node->right == NULL) {
1261fb62fb0SOlivier Houchard ck_barrier_combining_insert(node, tnode, &node->right);
1271fb62fb0SOlivier Houchard goto leave;
1281fb62fb0SOlivier Houchard }
1291fb62fb0SOlivier Houchard
1301fb62fb0SOlivier Houchard /*
1311fb62fb0SOlivier Houchard * If unsuccessful, try inserting as a child of the children of the
1321fb62fb0SOlivier Houchard * current node.
1331fb62fb0SOlivier Houchard */
1341fb62fb0SOlivier Houchard ck_barrier_combining_queue_enqueue(&queue, node->left);
1351fb62fb0SOlivier Houchard ck_barrier_combining_queue_enqueue(&queue, node->right);
1361fb62fb0SOlivier Houchard }
1371fb62fb0SOlivier Houchard
1381fb62fb0SOlivier Houchard leave:
1391fb62fb0SOlivier Houchard ck_spinlock_fas_unlock(&root->mutex);
1401fb62fb0SOlivier Houchard return;
1411fb62fb0SOlivier Houchard }
1421fb62fb0SOlivier Houchard
1431fb62fb0SOlivier Houchard void
ck_barrier_combining_init(struct ck_barrier_combining * root,struct ck_barrier_combining_group * init_root)1441fb62fb0SOlivier Houchard ck_barrier_combining_init(struct ck_barrier_combining *root,
1451fb62fb0SOlivier Houchard struct ck_barrier_combining_group *init_root)
1461fb62fb0SOlivier Houchard {
1471fb62fb0SOlivier Houchard
1481fb62fb0SOlivier Houchard init_root->k = 0;
1491fb62fb0SOlivier Houchard init_root->count = 0;
1501fb62fb0SOlivier Houchard init_root->sense = 0;
1511fb62fb0SOlivier Houchard init_root->parent = init_root->left = init_root->right = NULL;
1521fb62fb0SOlivier Houchard ck_spinlock_fas_init(&root->mutex);
1531fb62fb0SOlivier Houchard root->root = init_root;
1541fb62fb0SOlivier Houchard return;
1551fb62fb0SOlivier Houchard }
1561fb62fb0SOlivier Houchard
1571fb62fb0SOlivier Houchard static void
ck_barrier_combining_aux(struct ck_barrier_combining * barrier,struct ck_barrier_combining_group * tnode,unsigned int sense)1581fb62fb0SOlivier Houchard ck_barrier_combining_aux(struct ck_barrier_combining *barrier,
1591fb62fb0SOlivier Houchard struct ck_barrier_combining_group *tnode,
1601fb62fb0SOlivier Houchard unsigned int sense)
1611fb62fb0SOlivier Houchard {
1621fb62fb0SOlivier Houchard
1631fb62fb0SOlivier Houchard /*
1641fb62fb0SOlivier Houchard * If this is the last thread in the group, it moves on to the parent group.
1651fb62fb0SOlivier Houchard * Otherwise, it spins on this group's sense.
1661fb62fb0SOlivier Houchard */
1671fb62fb0SOlivier Houchard if (ck_pr_faa_uint(&tnode->count, 1) == tnode->k - 1) {
1681fb62fb0SOlivier Houchard /*
1691fb62fb0SOlivier Houchard * If we are and will be the last thread entering the barrier for the
1701fb62fb0SOlivier Houchard * current group then signal the parent group if one exists.
1711fb62fb0SOlivier Houchard */
1721fb62fb0SOlivier Houchard if (tnode->parent != NULL)
1731fb62fb0SOlivier Houchard ck_barrier_combining_aux(barrier, tnode->parent, sense);
1741fb62fb0SOlivier Houchard
1751fb62fb0SOlivier Houchard /*
1761fb62fb0SOlivier Houchard * Once the thread returns from its parent(s), it reinitializes the group's
1771fb62fb0SOlivier Houchard * arrival count and signals other threads to continue by flipping the group
1781fb62fb0SOlivier Houchard * sense. Order of these operations is not important since we assume a static
1791fb62fb0SOlivier Houchard * number of threads are members of a barrier for the lifetime of the barrier.
1801fb62fb0SOlivier Houchard * Since count is explicitly reinitialized, it is guaranteed that at any point
1811fb62fb0SOlivier Houchard * tnode->count is equivalent to tnode->k if and only if that many threads
1821fb62fb0SOlivier Houchard * are at the barrier.
1831fb62fb0SOlivier Houchard */
1841fb62fb0SOlivier Houchard ck_pr_store_uint(&tnode->count, 0);
1851fb62fb0SOlivier Houchard ck_pr_fence_store();
1861fb62fb0SOlivier Houchard ck_pr_store_uint(&tnode->sense, ~tnode->sense);
1871fb62fb0SOlivier Houchard } else {
1881fb62fb0SOlivier Houchard while (sense != ck_pr_load_uint(&tnode->sense))
1891fb62fb0SOlivier Houchard ck_pr_stall();
1901fb62fb0SOlivier Houchard }
191*d8f1ed8dSOlivier Houchard ck_pr_fence_memory();
1921fb62fb0SOlivier Houchard
1931fb62fb0SOlivier Houchard return;
1941fb62fb0SOlivier Houchard }
1951fb62fb0SOlivier Houchard
1961fb62fb0SOlivier Houchard void
ck_barrier_combining(struct ck_barrier_combining * barrier,struct ck_barrier_combining_group * tnode,struct ck_barrier_combining_state * state)1971fb62fb0SOlivier Houchard ck_barrier_combining(struct ck_barrier_combining *barrier,
1981fb62fb0SOlivier Houchard struct ck_barrier_combining_group *tnode,
1991fb62fb0SOlivier Houchard struct ck_barrier_combining_state *state)
2001fb62fb0SOlivier Houchard {
2011fb62fb0SOlivier Houchard
2021fb62fb0SOlivier Houchard ck_barrier_combining_aux(barrier, tnode, state->sense);
2031fb62fb0SOlivier Houchard
2041fb62fb0SOlivier Houchard /* Reverse the execution context's sense for the next barrier. */
2051fb62fb0SOlivier Houchard state->sense = ~state->sense;
2061fb62fb0SOlivier Houchard return;
2071fb62fb0SOlivier Houchard }
208