/******************************************************************************* * This file is part of SWIFT. * Copyright (c) 2012 Pedro Gonnet (pedro.gonnet@durham.ac.uk) * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as published * by the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU Lesser General Public License * along with this program. If not, see . * ******************************************************************************/ /* Config parameters. */ #include /* Some standard headers. */ #include #include #include /* MPI headers. */ #ifdef WITH_MPI #include #endif /* This object's header. */ #include "queue.h" /* Local headers. */ #include "atomic.h" #include "error.h" #include "memswap.h" /** * @brief Push the task at the given index up the heap until it is either at the * top or smaller than its parent. * * @param q The task #queue. * @param ind The index of the task to be sifted-down in the queue. * * @return The new index of the entry. */ int queue_bubble_up(struct queue *q, int ind) { /* Set some pointers we will use often. */ struct queue_entry *entries = q->entries; const float w = entries[ind].weight; /* While we are not yet at the top of the heap... */ while (ind > 0) { /* Check if the parent is larger and bail if not.. */ const int parent = (ind - 1) / 2; if (w < entries[parent].weight) break; /* Parent is not larger, so swap. */ memswap(&entries[ind], &entries[parent], sizeof(struct queue_entry)); ind = parent; } return ind; } /** * @brief Push the task at the given index down the heap until both its children * have a smaller weight. * * @param q The task #queue. * @param ind The index of the task to be sifted-down in the queue. * * @return The new index of the entry. */ int queue_sift_down(struct queue *q, int ind) { /* Set some pointers we will use often. */ struct queue_entry *entries = q->entries; const int qcount = q->count; const float w = entries[ind].weight; /* While we still have at least one child... */ while (1) { /* Check if we still have children. */ int child = 2 * ind + 1; if (child >= qcount) break; /* Which of both children is the largest? */ if (child + 1 < qcount && entries[child + 1].weight > entries[child].weight) child += 1; /* Do we want to swap with the largest child? */ if (entries[child].weight > w) { memswap(&entries[ind], &entries[child], sizeof(struct queue_entry)); ind = child; } else break; } return ind; } /** * @brief Enqueue all tasks in the incoming DEQ. * * @param q The #queue, assumed to be locked. */ void queue_get_incoming(struct queue *q) { struct queue_entry *entries = q->entries; /* Loop over the incoming DEQ. */ while (1) { /* Is there a next element? */ const int ind = q->first_incoming % queue_incoming_size; if (q->tid_incoming[ind] < 0) break; /* Get the next offset off the DEQ. */ const int offset = atomic_swap(&q->tid_incoming[ind], -1); atomic_inc(&q->first_incoming); /* Does the queue need to be grown? */ if (q->count == q->size) { struct queue_entry *temp; q->size *= queue_sizegrow; if ((temp = (struct queue_entry *)malloc(sizeof(struct queue_entry) * q->size)) == NULL) error("Failed to allocate new indices."); memcpy(temp, entries, sizeof(struct queue_entry) * q->count); free(entries); q->entries = entries = temp; } /* Drop the task at the end of the queue. */ entries[q->count].tid = offset; entries[q->count].weight = q->tasks[offset].weight; q->count += 1; atomic_dec(&q->count_incoming); /* Re-heap by bubbling up the new (last) element. */ queue_bubble_up(q, q->count - 1); #ifdef SWIFT_DEBUG_CHECK /* Check the queue's consistency. */ for (int k = 1; k < q->count; k++) if (entries[(k - 1) / 2].weight < entries[k].weight) error("Queue heap is disordered."); #endif } } /** * @brief Insert a used tasks into the given queue. * * @param q The #queue. * @param t The #task. */ void queue_insert(struct queue *q, struct task *t) { /* Get an index in the DEQ. */ const int ind = atomic_inc(&q->last_incoming) % queue_incoming_size; /* Spin until the new offset can be stored. */ while (atomic_cas(&q->tid_incoming[ind], -1, t - q->tasks) != -1) { /* Try to get the queue lock, non-blocking, ensures that at least somebody is working on this queue. */ if (lock_trylock(&q->lock) == 0) { /* Clean up the incoming DEQ. */ queue_get_incoming(q); /* Release the queue lock. */ if (lock_unlock(&q->lock) != 0) { error("Unlocking the qlock failed.\n"); } } } /* Increase the incoming count. */ atomic_inc(&q->count_incoming); } /** * @brief Initialize the given queue. * * @param q The #queue. * @param tasks List of tasks to which the queue indices refer to. */ void queue_init(struct queue *q, struct task *tasks) { /* Allocate the task list if needed. */ q->size = queue_sizeinit; if ((q->entries = (struct queue_entry *)malloc(sizeof(struct queue_entry) * q->size)) == NULL) error("Failed to allocate queue entries."); /* Set the tasks pointer. */ q->tasks = tasks; /* Init counters. */ q->count = 0; /* Init the queue lock. */ if (lock_init(&q->lock) != 0) error("Failed to init queue lock."); /* Init the incoming DEQ. */ if ((q->tid_incoming = (int *)malloc(sizeof(int) * queue_incoming_size)) == NULL) error("Failed to allocate queue incoming buffer."); for (int k = 0; k < queue_incoming_size; k++) { q->tid_incoming[k] = -1; } q->first_incoming = 0; q->last_incoming = 0; q->count_incoming = 0; } /** * @brief Get a task free of dependencies and conflicts. * * @param q The task #queue. * @param prev The previous #task extracted from this #queue. * @param blocking Block until access to the queue is granted. */ struct task *queue_gettask(struct queue *q, const struct task *prev, int blocking) { swift_lock_type *qlock = &q->lock; struct task *res = NULL; /* Grab the task lock. */ if (blocking) { if (lock_lock(qlock) != 0) error("Locking the qlock failed.\n"); } else { if (lock_trylock(qlock) != 0) return NULL; } /* Fill any tasks from the incoming DEQ. */ queue_get_incoming(q); /* If there are no tasks, leave immediately. */ if (q->count == 0) { lock_unlock_blind(qlock); return NULL; } /* Set some pointers we will use often. */ struct queue_entry *entries = q->entries; struct task *qtasks = q->tasks; const int old_qcount = q->count; /* Loop over the queue entries. */ int ind; for (ind = 0; ind < old_qcount; ind++) { /* Try to lock the next task. */ if (task_lock(&qtasks[entries[ind].tid])) break; /* Should we de-prioritize this task? */ // MATTHIEU: We now have more than 64 tasks so the bit-wise // operation here is problematic. // However, the mask was such that this condition is always true anyway. if (1 /* (1ULL << qtasks[entries[ind].tid].type) & */ /* queue_lock_fail_reweight_mask */) { /* Scale the task's weight. */ entries[ind].weight *= queue_lock_fail_reweight_factor; /* Send it down the binary heap. */ if (queue_sift_down(q, ind) != ind) ind -= 1; } } /* Did we get a task? */ if (ind < old_qcount) { /* Another one bites the dust. */ const int qcount = q->count -= 1; /* Get a pointer on the task that we want to return. */ res = &qtasks[entries[ind].tid]; /* Swap this task with the last task and re-heap. */ if (ind < qcount) { entries[ind] = entries[qcount]; ind = queue_bubble_up(q, ind); ind = queue_sift_down(q, ind); } } else res = NULL; #ifdef SWIFT_DEBUG_CHECKS /* Check the queue's consistency. */ for (int k = 1; k < q->count; k++) if (entries[(k - 1) / 2].weight < entries[k].weight) error("Queue heap is disordered."); #endif /* Release the task lock. */ if (lock_unlock(qlock) != 0) error("Unlocking the qlock failed.\n"); /* Take the money and run. */ return res; } void queue_clean(struct queue *q) { free(q->entries); free(q->tid_incoming); } /** * @brief Dump a formatted list of tasks in the queue to the given file stream. * * @param nodeID the node id of this rank. * @param index a number for this queue, added to the output. * @param file the FILE stream, should opened for write. * @param q The task #queue. */ void queue_dump(int nodeID, int index, FILE *file, struct queue *q) { swift_lock_type *qlock = &q->lock; /* Grab the queue lock. */ if (lock_lock(qlock) != 0) error("Locking the qlock failed.\n"); /* Fill any tasks from the incoming DEQ. */ queue_get_incoming(q); /* Loop over the queue entries. */ for (int k = 0; k < q->count; k++) { struct task *t = &q->tasks[q->entries[k].tid]; fprintf(file, "%d %d %d %s %s %.2f\n", nodeID, index, k, taskID_names[t->type], subtaskID_names[t->subtype], t->weight); } /* Release the task lock. */ if (lock_unlock(qlock) != 0) error("Unlocking the qlock failed.\n"); }