The ROme OpTimistic Simulator 2.0.0
A General-Purpose Multithreaded Parallel/Distributed Simulation Platform
binding.c
#include <stdbool.h>
#include <string.h>
#include <stdlib.h>

#include <arch/atomic.h>
#include <core/core.h>
#include <core/timer.h>
#include <datatypes/list.h>
#include <scheduler/binding.h>
#include <scheduler/process.h>
#include <scheduler/scheduler.h>
#include <statistics/statistics.h>
#include <gvt/gvt.h>

#include <arch/thread.h>

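/// Wall-clock seconds between two successive LP rebindings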
#define REBIND_INTERVAL 10.0

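/// Couples an LP id with the workload factor estimated for that LP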
struct lp_cost_id {
    double workload_factor;
    unsigned int id;
};

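/// Per-LP workload estimates, posted by worker threads and consumed by the knapsack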
struct lp_cost_id *lp_cost;

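/// A guard to know whether this is the first invocation or not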
static __thread bool first_lp_binding = true;

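/// The new LP-to-thread binding computed by the master thread, picked up by all workers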
static unsigned int *new_LPS_binding;
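/// Timer used to trigger a rebinding every REBIND_INTERVAL seconds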
static timer rebinding_timer;

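/*
 * Phase counters implementing the rebinding handshake: the master thread
 * advances the global counters, and each worker thread compares them
 * against its thread-local copies to detect that a new phase has started.
 */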
#ifdef HAVE_LP_REBINDING
static int binding_acquire_phase = 0;
static __thread int local_binding_acquire_phase = 0;

static int binding_phase = 0;
static __thread int local_binding_phase = 0;
#endif

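/// Counts the worker threads that still have to post their local workload reduction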
static atomic_t worker_thread_reduction;

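/**
 * Performs a deterministic block binding of LPs to worker threads: the
 * first block_leftover threads receive ceil(n_prc / n_cores) consecutive
 * LPs each, the remaining threads floor(n_prc / n_cores).
 *
 * Example: with n_prc = 10 and n_cores = 4, threads 0 and 1 are bound to
 * 3 LPs each, threads 2 and 3 to 2 LPs each.
 */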
static inline void LPs_block_binding(void)
{
    unsigned int i, j;
    unsigned int buf1;
    unsigned int offset;
    unsigned int block_leftover;
    struct lp_struct *lp;

    buf1 = (n_prc / n_cores);
    block_leftover = n_prc - buf1 * n_cores;

    if (block_leftover > 0) {
        buf1++;
    }

    n_prc_per_thread = 0;
    i = 0;
    offset = 0;

    while (i < n_prc) {
        j = 0;
        while (j < buf1) {
            if (offset == local_tid) {
                lp = lps_blocks[i];
                LPS_bound_set(n_prc_per_thread++, lp);
                lp->worker_thread = local_tid;
            }
            i++;
            j++;
        }
        offset++;
        block_leftover--;
        if (block_leftover == 0) {
            buf1--;
        }
    }
}

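/**
 * qsort() comparator ordering lp_cost entries by decreasing
 * workload_factor, so that the heaviest LPs are assigned first.
 */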
static int compare_lp_cost(const void *a, const void *b)
{
    const struct lp_cost_id *A = (const struct lp_cost_id *)a;
    const struct lp_cost_id *B = (const struct lp_cost_id *)b;

    // Compare explicitly rather than returning B - A: the implicit
    // double-to-int conversion would truncate any difference in (-1, 1)
    // to zero, making unequal workloads compare as equal.
    return (B->workload_factor > A->workload_factor)
        - (B->workload_factor < A->workload_factor);
}

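/**
 * Master-thread-only greedy approximation of the knapsack problem: the
 * reference per-thread load is the total workload divided by n_cores,
 * each thread is seeded with one of the heaviest LPs, and every remaining
 * LP goes to the first thread whose load stays within the reference
 * value. LPs that fit nowhere are spread round-robin.
 */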
static inline void LP_knapsack(void)
{
    register unsigned int i, j;
    double reference_knapsack = 0;
    bool assigned;
    double assignments[n_cores];

    if (!master_thread())
        return;

    // Estimate the reference knapsack
    for (i = 0; i < n_prc; i++) {
        reference_knapsack += lp_cost[i].workload_factor;
    }
    reference_knapsack /= n_cores;

    // Sort the expected times
    qsort(lp_cost, n_prc, sizeof(struct lp_cost_id), compare_lp_cost);

    // At least one LP per thread
    bzero(assignments, sizeof(double) * n_cores);
    j = 0;
    for (i = 0; i < n_cores; i++) {
        assignments[j] += lp_cost[i].workload_factor;
        new_LPS_binding[i] = j;
        j++;
    }

    // Very suboptimal approximation of knapsack
    for (; i < n_prc; i++) {
        assigned = false;

        for (j = 0; j < n_cores; j++) {
            // Simulate assignment
            if (assignments[j] + lp_cost[i].workload_factor <= reference_knapsack) {
                assignments[j] += lp_cost[i].workload_factor;
                new_LPS_binding[i] = j;
                assigned = true;
                break;
            }
        }

        if (assigned == false)
            break;
    }

    // Check for leftovers
    if (i < n_prc) {
        j = 0;
        for (; i < n_prc; i++) {
            new_LPS_binding[i] = j;
            j = (j + 1) % n_cores;
        }
    }
}

#ifdef HAVE_LP_REBINDING

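/**
 * Estimates the workload factor of every LP bound to this thread as the
 * number of queued events times the average event execution time, divided
 * by the timestamp span of the input queue.
 */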
static void post_local_reduction(void)
{
    unsigned int i = 0;
    msg_t *first_evt, *last_evt;

    foreach_bound_lp(lp) {
        first_evt = list_head(lp->queue_in);
        last_evt = list_tail(lp->queue_in);

        lp_cost[lp->lid.to_int].id = i++;	// TODO: do we really need this?
        lp_cost[lp->lid.to_int].workload_factor = list_sizeof(lp->queue_in);
        lp_cost[lp->lid.to_int].workload_factor *= statistics_get_lp_data(lp, STAT_GET_EVENT_TIME_LP);
        lp_cost[lp->lid.to_int].workload_factor /= (last_evt->timestamp - first_evt->timestamp);
    }
}

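/**
 * Makes the binding computed by LP_knapsack() effective for this thread,
 * rebuilding its bound-LP array and taking ownership of newly acquired LPs.
 */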
static void install_binding(void)
{
    unsigned int i = 0;

    n_prc_per_thread = 0;

    foreach_lp(lp) {
        if (new_LPS_binding[i++] == local_tid) {
            LPS_bound_set(n_prc_per_thread++, lp);

            if (local_tid != lp->worker_thread) {
                lp->worker_thread = local_tid;
            }
        }
    }
}

#endif

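/**
 * Periodically reassesses the LP-to-thread binding. On the very first
 * invocation every thread installs the static block binding; afterwards,
 * every REBIND_INTERVAL seconds the master thread opens a new binding
 * phase, each worker posts its local workload estimates, the master
 * solves the knapsack, and all threads install the new binding.
 */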
void rebind_LPs(void)
{
    if (unlikely(first_lp_binding)) {
        first_lp_binding = false;

        initialize_binding_blocks();

        // Set up the initial deterministic block binding
        LPs_block_binding();

        timer_start(rebinding_timer);

        if (master_thread()) {
            new_LPS_binding = rsalloc(sizeof(int) * n_prc);
            lp_cost = rsalloc(sizeof(struct lp_cost_id) * n_prc);

            atomic_set(&worker_thread_reduction, n_cores);
        }

        return;
    }
#ifdef HAVE_LP_REBINDING
    if (master_thread()) {
        if (unlikely(timer_value_seconds(rebinding_timer) >= REBIND_INTERVAL)) {
            timer_restart(rebinding_timer);
            binding_phase++;
        }

        if (atomic_read(&worker_thread_reduction) == 0) {
            LP_knapsack();

            binding_acquire_phase++;
        }
    }

    if (local_binding_phase < binding_phase) {
        local_binding_phase = binding_phase;
        post_local_reduction();
        atomic_dec(&worker_thread_reduction);
    }

    if (local_binding_acquire_phase < binding_acquire_phase) {
        local_binding_acquire_phase = binding_acquire_phase;

        install_binding();

#ifdef HAVE_PREEMPTION
        reset_min_in_transit(local_tid);
#endif

        // Only the last thread through the barrier rearms the
        // reduction counter for the next rebinding round
        if (thread_barrier(&all_thread_barrier)) {
            atomic_set(&worker_thread_reduction, n_cores);
        }
    }
#endif
}