multiqueue_priority_scheduler.hpp

/src/graphlab/schedulers/multiqueue_priority_scheduler.hpp

https://github.com/ekoontz/graphlab
C++ Header | 247 lines | 156 code | 60 blank | 31 comment | 19 complexity | e6af1ea8e6ec75eaa3221fc04469d46e MD5 | raw file

/**
 * \author jegonzal
 *
 * This class defines a multiqueue version of the priority scheduler.
 **/
#ifndef GRAPHLAB_MULTIQUEUE_PRIORITY_SCHEDULER_HPP
#define GRAPHLAB_MULTIQUEUE_PRIORITY_SCHEDULER_HPP

#include <queue>
#include <cmath>
#include <cassert>

#include <graphlab/util/mutable_queue.hpp>
#include <graphlab/graph/graph.hpp>
#include <graphlab/scope/iscope.hpp>
#include <graphlab/tasks/update_task.hpp>
#include <graphlab/schedulers/ischeduler.hpp>
#include <graphlab/parallel/pthread_tools.hpp>
#include <graphlab/schedulers/support/direct_callback.hpp>
#include <graphlab/schedulers/support/binary_vertex_task_set.hpp>

#include <graphlab/util/task_count_termination.hpp>



#include <graphlab/macros_def.hpp>
namespace graphlab {

 
  /**
   * Priority scheduler that spreads update tasks over several
   * independently locked priority queues instead of a single shared one.
   *
   * The constructor creates queues_per_cpu queues for every cpu.  A cpu
   * asking for work first looks at its "own" queues (indices
   * [cpuid * queues_per_cpu, (cpuid + 1) * queues_per_cpu)) and only then
   * scans the remaining queues.  New tasks are placed using the "power of
   * two choices" heuristic: two queues are picked at random and the task
   * goes to the one that currently reports the smaller size.
   *
   * Duplicate tasks are filtered through binary_vertex_tasks and
   * termination is tracked by a task_count_termination object.
   */
  template<typename Graph>
  class multiqueue_priority_scheduler : 
    public ischeduler<Graph> {
  
  public:
    typedef Graph graph_type;
    typedef ischeduler<Graph> base;

    typedef typename base::iengine_type iengine_type;
    typedef typename base::update_task_type     update_task_type;
    typedef typename base::update_function_type update_function_type;
    typedef typename base::callback_type        callback_type;
    typedef typename base::monitor_type         monitor_type;

    /// A single priority queue of tasks keyed by a double priority
    typedef mutable_queue<update_task_type, double> taskqueue_type;

  private:
    using base::monitor;

  public:

    /**
     * Build the scheduler.
     *
     * \param engine engine handed to the per-cpu callbacks
     * \param g      graph whose vertex count sizes the pruning task set
     * \param ncpus  number of cpus that will request tasks; must be > 0
     */
    multiqueue_priority_scheduler(iengine_type* engine,
                                  Graph& g, 
                                  size_t ncpus) : 
      callbacks(ncpus, direct_callback<Graph>(this, engine)), 
      binary_vertex_tasks(g.num_vertices()) {
      // With zero cpus there would be zero queues and add_task would
      // divide by zero when picking a queue.
      assert(ncpus > 0);

      numvertices = g.num_vertices();
        
      /* How many queues per cpu. More queues, less contention */
      queues_per_cpu = 2;
      num_queues = queues_per_cpu * ncpus;
       
      /* Each cpu keeps record of the own-queue offset it last 
         used to keep balance */
      lastqueue.resize(ncpus, 0);
       
      task_queues.resize(num_queues);
      queue_locks.resize(num_queues);
    }

  
    ~multiqueue_priority_scheduler() {}

    /** Return the callback that was pre-created for the given cpu. */
    callback_type& get_callback(size_t cpuid) {
      return callbacks[cpuid];
    }


    /**
     * Get the next task for the given cpu.
     *
     * \param cpuid    index of the requesting cpu
     * \param ret_task filled with the popped task when NEWTASK is returned
     * \return COMPLETE if the terminator reports finish, WAITING if every
     *         queue was found empty, NEWTASK otherwise
     */
    sched_status::status_enum get_next_task(size_t cpuid,
                                            update_task_type &ret_task) {
      if (terminator.finish()) {
        return sched_status::COMPLETE;
      }
      bool found = false;
      /* First check my own queues, starting with the one after the queue
         that served the previous request so that the own queues are
         drained in rotation. */
      const size_t firstown = cpuid * queues_per_cpu;
      for(size_t ownq_i = 0; ownq_i < queues_per_cpu; ++ownq_i) {
        const size_t ownoffset = 
          (ownq_i + lastqueue[cpuid] + 1) % queues_per_cpu;
        const size_t queueidx = firstown + ownoffset;
        taskqueue_type& queue = task_queues[queueidx];
        queue_locks[queueidx].lock();
        if (!queue.empty()) {
          ret_task = queue.pop().first;
          found = true;
          // Remember the offset of the queue actually used (not the loop
          // counter), otherwise the rotation never advances.
          lastqueue[cpuid] = ownoffset;
        }
        queue_locks[queueidx].unlock();
        if (found) break;
      }
  
      /* My queues were empty - scan all queues, starting with the one
         right after my own block and wrapping around, so that my own
         queues are looked at once more at the very end. */
      if (!found) {
        for(size_t roundrobin = 0; roundrobin < num_queues; ++roundrobin) {
          const size_t queueidx = 
            (firstown + queues_per_cpu + roundrobin) % num_queues;
          taskqueue_type& queue = task_queues[queueidx];
          queue_locks[queueidx].lock();
          if (!queue.empty()) {
            ret_task = queue.pop().first;
            found = true;
          }
          queue_locks[queueidx].unlock();
          if (found)  break;
        }
      }
 
      if(!found) {
        return sched_status::WAITING;
      }
      
      // The task is leaving the queues, so drop it from the pruning set.
      binary_vertex_tasks.remove(ret_task);
      
      if (monitor != NULL) 
        monitor->scheduler_task_scheduled(ret_task, 0.0);
      return sched_status::NEWTASK;
    } // end of get_next_task


    /**
     * Add a task with the given priority.
     *
     * If binary_vertex_tasks.add(task) returns false the task is not
     * queued and is reported to the monitor as pruned.
     */
    void add_task(update_task_type task, double priority) {
      if (binary_vertex_tasks.add(task)) {
        terminator.new_job();

        /* Choose two random queues and use the one which has smaller
           size */
        // M.D. Mitzenmacher The Power of Two Choices in Randomized
        // Load Balancing (1991)
        // http://www.eecs.harvard.edu/~michaelm/postscripts/mythesis.pdf

        // One random draw is split into two queue indices.
        const size_t nsquared = num_queues * num_queues;
        size_t prod = size_t(random::rand01() * num_queues * num_queues);
        // Guard against rand01() returning exactly 1.0 (its range is not
        // visible here), which would make r1 == num_queues.
        if (prod >= nsquared) prod = nsquared - 1;
        const size_t r1 = prod / num_queues;
        const size_t r2 = prod % num_queues;

        // The sizes are read without holding the queue locks; they only
        // steer the choice of queue.
        const size_t qidx = 
          (task_queues[r1].size() < task_queues[r2].size()) ? r1 : r2;
        
        queue_locks[qidx].lock();
        task_queues[qidx].push(task, priority);
        queue_locks[qidx].unlock();
    
        if (monitor != NULL) 
          monitor->scheduler_task_added(task, priority);
      } else {
        if (monitor != NULL) 
          monitor->scheduler_task_pruned(task);
      }
  
    }

    /** Add one task (func, priority) for every vertex in the list. */
    void add_tasks(const std::vector<vertex_id_t> &vertices,
                   update_function_type func,
                   double priority) {
      foreach(vertex_id_t vertex, vertices) {
        add_task(update_task_type(vertex, func), priority);
      }
    }


    /** Add one task (func, priority) for every vertex id in [0, numvertices). */
    void add_task_to_all(update_function_type func, double priority)  {
      for (vertex_id_t vertex = 0; vertex < numvertices; ++vertex){
        add_task(update_task_type(vertex, func), priority);
      }
    }

  
    /** Intentionally empty: this scheduler ignores the notification. */
    void update_state(size_t cpuid,
                      const std::vector<vertex_id_t> &updated_vertices,
                      const std::vector<edge_id_t>& updatededges) {}

    /** Intentionally empty: this scheduler ignores the notification. */
    void scoped_modifications(size_t cpuid, vertex_id_t rootvertex,
                              const std::vector<edge_id_t>& updatededges){}

    /** Tell the terminator that one previously added job has completed. */
    void completed_task(size_t cpuid, const update_task_type &task) {
      terminator.completed_job();
    }


    /** Forward an abort request to the terminator. */
    void abort() { terminator.abort(); }
  
    /** Forward a restart request to the terminator. */
    void restart() { terminator.restart(); }
  
    /** Return what the pruning task set reports for the given task. */
    bool is_task_scheduled(update_task_type task)  {
      return binary_vertex_tasks.get(task);
    }


    /** Print the size of every queue and the terminator state to stdout. */
    void print() {
      std::cout << "SSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSS" << std::endl;
      std::cout << "Printing task queue sizes: " << std::endl;
      for(size_t i = 0; i < task_queues.size(); ++i) {
        std::cout << task_queues[i].size() << std::endl;
      }
      std::cout << "Is the terminator reporting finished: "
                << terminator.finish() << std::endl;
      std::cout << "SSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSSS" << std::endl;
        
    }

  private:
    size_t numvertices; /// Remember the number of vertices in the graph
  
    size_t num_queues;      /// Total number of queues (queues_per_cpu * ncpus)
    size_t queues_per_cpu;  /// Number of queues owned by each cpu
  
    std::vector<taskqueue_type> task_queues; /// The actual task queues
    std::vector<mutex> queue_locks;          /// queue_locks[i] guards task_queues[i]
    /// Per cpu: offset (within its own queues) of the queue last served
    std::vector<size_t> lastqueue;

    /// The callbacks pre-created for each cpuid
    std::vector<direct_callback<Graph> > callbacks; 

    // Task set for task pruning
    binary_vertex_task_set<Graph> binary_vertex_tasks;

  
    /// Counts added / completed jobs to decide when scheduling is finished
    task_count_termination terminator;
  }; 


} // end of namespace graphlab
#include <graphlab/macros_undef.hpp>

#endif