GraphLab: Distributed Graph-Parallel API 2.1
fifo_scheduler.hpp
/**
 * Copyright (c) 2009 Carnegie Mellon University.
 * All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an "AS
 * IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
 * express or implied. See the License for the specific language
 * governing permissions and limitations under the License.
 *
 * For more about this software visit:
 *
 * http://www.graphlab.ml.cmu.edu
 *
 */


#ifndef GRAPHLAB_FIFO_SCHEDULER_HPP
#define GRAPHLAB_FIFO_SCHEDULER_HPP

#include <algorithm>
#include <deque>   // std::deque, used for queue_type below
#include <limits>  // std::numeric_limits, used for the min_priority default
#include <queue>

#include <graphlab/graph/graph_basic_types.hpp>
#include <graphlab/parallel/pthread_tools.hpp>
#include <graphlab/parallel/atomic.hpp>

#include <graphlab/util/random.hpp>
#include <graphlab/scheduler/ischeduler.hpp>
#include <graphlab/parallel/atomic_add_vector2.hpp>

#include <graphlab/scheduler/get_message_priority.hpp>
#include <graphlab/options/graphlab_options.hpp>

#include <graphlab/macros_def.hpp>
namespace graphlab {

  /**
   * \ingroup group_schedulers
   *
   * This class defines a multiple-queue approximate FIFO scheduler.
   * The scheduler maintains multi * ncpus FIFO queues. A newly
   * scheduled vertex is pushed onto the shorter of two randomly
   * chosen queues (the "power of two choices" rule). When dequeuing,
   * each thread first drains its own block of multi queues and, once
   * those are empty, scans the queues of the other threads for work.
   */
  template<typename Message>
  class fifo_scheduler : public ischeduler<Message> {

  public:

    typedef Message message_type;

    typedef std::deque<lvid_type> queue_type;

  private:

    /* Per-vertex message store: add() merges a new message into any
       message already pending for the vertex, and test_and_get()
       atomically claims a pending message. */
    atomic_add_vector2<message_type> messages;
    std::vector<queue_type> queues;
    std::vector<spinlock>   locks;
    size_t multi;                       // number of queues per thread
    std::vector<size_t> current_queue;  // per-thread queue cursor

    double min_priority;

  public:

    fifo_scheduler(size_t num_vertices,
                   const graphlab_options& opts) :
      messages(num_vertices), multi(3),
      current_queue(opts.get_ncpus()),
      min_priority(-std::numeric_limits<double>::max()) {
      set_options(opts);
    }
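
    /* Minimal usage sketch, assuming a message type with the merge and
       priority() behavior the scheduler expects (vid, cpuid, num_vertices,
       and my_message are illustrative placeholders; in practice the engine
       drives these calls):

         graphlab::graphlab_options opts;
         fifo_scheduler<my_message> sched(num_vertices, opts);
         sched.start();
         sched.schedule(vid, my_message());    // producer side

         lvid_type v; my_message m;            // consumer side, thread cpuid
         while (sched.get_next(cpuid, v, m) == sched_status::NEW_TASK) {
           // ... apply m to vertex v, possibly schedule() neighbors ...
         }
    */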

    void set_options(const graphlab_options& opts) {
      size_t new_ncpus = opts.get_ncpus();
      // check whether ncpus changed
      if (new_ncpus != current_queue.size()) {
        logstream(LOG_INFO) << "Changing ncpus from " << current_queue.size()
                            << " to " << new_ncpus << std::endl;
        ASSERT_GE(new_ncpus, 1);
        current_queue.resize(new_ncpus);
      }

      std::vector<std::string> keys = opts.get_scheduler_args().get_option_keys();
      foreach(std::string opt, keys) {
        if (opt == "multi") {
          opts.get_scheduler_args().get_option("multi", multi);
        } else if (opt == "min_priority") {
          opts.get_scheduler_args().get_option("min_priority", min_priority);
        } else {
          logstream(LOG_FATAL) << "Unexpected Scheduler Option: " << opt << std::endl;
        }
      }

      const size_t nqueues = std::max(multi * current_queue.size(), size_t(1));
      // The number of queues changed: rebuild the queue array and
      // redistribute every queued vertex round-robin over the new queues.
      if (nqueues != queues.size()) {
        std::vector<queue_type> old_queues;
        std::swap(old_queues, queues);
        queues.resize(nqueues);
        locks.resize(nqueues);

        size_t idx = 0;
        for (size_t i = 0; i < old_queues.size(); ++i) {
          while (!old_queues[i].empty()) {
            queues[idx].push_back(old_queues[i].front());
            old_queues[i].pop_front();
            // wrap the cursor so it never indexes past the new queue array
            idx = (idx + 1) % nqueues;
          }
        }
      }
    }
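
    // Example: ncpus = 4 and multi = 3 yield 12 queues; the
    // max(..., size_t(1)) clamp above guarantees at least one queue
    // even if multi is set to 0.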

    void start() { }

    void schedule(const lvid_type vid,
                  const message_type& msg) {
      // If this is a new message for the vertex, enqueue it; the
      // min_priority threshold is enforced later, in get_next().
      if (messages.add(vid, msg)) {
        /* Pick the destination queue by the "power of two choices" rule:
           derive two queue indices from a single uniform draw over
           [0, n*n - 1] and push the task onto the shorter of the two
           queues. */
        // M. D. Mitzenmacher, The Power of Two Choices in Randomized
        // Load Balancing, PhD thesis (1996).
        // http://www.eecs.harvard.edu/~michaelm/postscripts/mythesis.
        size_t idx = 0;
        if (queues.size() > 1) {
          const uint32_t prod =
            random::fast_uniform(uint32_t(0),
                                 uint32_t(queues.size() * queues.size() - 1));
          const uint32_t r1 = prod / queues.size();
          const uint32_t r2 = prod % queues.size();
          idx = (queues[r1].size() < queues[r2].size()) ? r1 : r2;
        }
        locks[idx].lock(); queues[idx].push_back(vid); locks[idx].unlock();
      }
    } // end of schedule
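
    /* Illustration of the two-choice draw above: with 6 queues, a draw
       of prod = 23 gives r1 = 23 / 6 = 3 and r2 = 23 % 6 = 5, and the
       task goes to the shorter of queues 3 and 5. Balancing by the
       shorter of two random queues keeps queue lengths far more even
       than a single random choice would. */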

    /* Requeue a vertex from an execution thread. The message is assumed
       to have been deposited separately (see place() below), so only the
       queue insertion is performed, again by the two-choice rule. */
    void schedule_from_execution_thread(const size_t cpuid,
                                        const lvid_type vid) {
      size_t idx = 0;
      if (queues.size() > 1) {
        const uint32_t prod =
          random::fast_uniform(uint32_t(0),
                               uint32_t(queues.size() * queues.size() - 1));
        const uint32_t r1 = prod / queues.size();
        const uint32_t r2 = prod % queues.size();
        idx = (queues[r1].size() < queues[r2].size()) ? r1 : r2;
      }
      locks[idx].lock(); queues[idx].push_back(vid); locks[idx].unlock();
    }

    void schedule_all(const message_type& msg,
                      const std::string& order) {
      if (order == "shuffle") {
        // add the vertices in random order
        std::vector<lvid_type> permutation =
          random::permutation<lvid_type>(messages.size());
        foreach(lvid_type vid, permutation) {
          if (messages.add(vid, msg)) {
            const size_t idx = vid % queues.size();
            locks[idx].lock(); queues[idx].push_back(vid); locks[idx].unlock();
          }
        }
      } else {
        // add the vertices sequentially
        for (lvid_type vid = 0; vid < messages.size(); ++vid) {
          if (messages.add(vid, msg)) {
            const size_t idx = vid % queues.size();
            locks[idx].lock(); queues[idx].push_back(vid); locks[idx].unlock();
          }
        }
      }
    } // end of schedule_all
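
    /* Here placement is deterministic rather than two-choice: vid modulo
       the queue count spreads a whole-graph signal evenly across the
       queues, e.g. with 12 queues vertex 30 lands in queue 6. */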

    /* Called by the engine when the update on vid has completed; the
       FIFO scheduler needs no completion bookkeeping. */
    void completed(const size_t cpuid,
                   const lvid_type vid,
                   const message_type& msg) { }


    /** Get the next element in the queue */
    sched_status::status_enum get_next(const size_t cpuid,
                                       lvid_type& ret_vid,
                                       message_type& ret_msg) {
      while (1) {
        /* Phase 1: check this thread's own block of queues for a task */
        for (size_t i = 0; i < multi; ++i) {
          const size_t idx = (++current_queue[cpuid] % multi) + cpuid * multi;
          locks[idx].lock();
          if (!queues[idx].empty()) {
            ret_vid = queues[idx].front();
            queues[idx].pop_front();
            locks[idx].unlock();
            const bool get_success = messages.test_and_get(ret_vid, ret_msg);
            // managed to retrieve a task
            if (get_success) {
              // if it is above the priority threshold, everything is good
              if (scheduler_impl::get_message_priority(ret_msg) >= min_priority) {
                return sched_status::NEW_TASK;
              } else {
                // it is below the threshold: put it back. If merging it back
                // pushes the combined priority over the threshold, requeue it
                message_type combined_message;
                messages.add(ret_vid, ret_msg, combined_message);
                double ret_priority = scheduler_impl::get_message_priority(combined_message);
                if (ret_priority >= min_priority) {
                  locks[idx].lock();
                  queues[idx].push_back(ret_vid);
                  locks[idx].unlock();
                }
              }
            }
            else continue;
          }
          else {
            locks[idx].unlock();
          }
        }
        /* Phase 2: steal from every queue */
        for (size_t i = 0; i < queues.size(); ++i) {
          const size_t idx = ++current_queue[cpuid] % queues.size();
          if (!queues[idx].empty()) { // unlocked pretest; re-checked under the lock
            locks[idx].lock();
            if (!queues[idx].empty()) {
              ret_vid = queues[idx].front();
              queues[idx].pop_front();
              locks[idx].unlock();
              const bool get_success = messages.test_and_get(ret_vid, ret_msg);
              if (get_success) {
                // if it is above the priority threshold, everything is good
                if (scheduler_impl::get_message_priority(ret_msg) >= min_priority) {
                  return sched_status::NEW_TASK;
                } else {
                  // below the threshold: merge it back, and requeue the vertex
                  // if the combined message now clears the threshold
                  message_type combined_message;
                  messages.add(ret_vid, ret_msg, combined_message);
                  double ret_priority = scheduler_impl::get_message_priority(combined_message);
                  if (ret_priority >= min_priority) {
                    locks[idx].lock();
                    queues[idx].push_back(ret_vid);
                    locks[idx].unlock();
                  }
                }
              }
            }
            else {
              locks[idx].unlock();
            }
          }
        }
        break;
      }
      return sched_status::EMPTY;
    } // end of get_next_task
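
    /* Worked example of the min_priority gate above (illustrative
       numbers, assuming a message type whose merge accumulates
       priority): with min_priority = 1.0, a claimed message of
       priority 0.4 is not returned; it is merged back into the store.
       If a 0.7-priority message for the same vertex arrives, the
       combined priority 1.1 clears the threshold and the vertex is
       requeued. */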


    /** Get the pending message for a specific vertex, bypassing the queues */
    sched_status::status_enum
    get_specific(lvid_type vid,
                 message_type& ret_msg) {
      bool get_success = messages.test_and_get(vid, ret_msg);
      if (get_success) return sched_status::NEW_TASK;
      else return sched_status::EMPTY;
    }

    /* Deposit a message for vid without enqueueing it in any FIFO. */
    void place(lvid_type vid,
               const message_type& msg) {
      messages.add(vid, msg);
    }
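
    /* Sketch pairing place() with get_specific(): an engine can hand a
       particular vertex its pending message without touching the FIFO
       queues (vid and msg are placeholders):

         sched.place(vid, msg);   // park the message; no queue entry
         message_type m;
         if (sched.get_specific(vid, m) == sched_status::NEW_TASK) {
           // m now holds the (possibly merged) message pending for vid
         }
    */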


    /* Number of times two messages were merged in the message store. */
    size_t num_joins() const {
      return messages.num_joins();
    }

    static void print_options_help(std::ostream& out) {
      out << "\t multi = [number of queues per thread. Default = 3]\n"
          << "\t min_priority = [double, minimum priority required to\n"
          << "\t                 receive a message. Default = -inf]\n";
    }


  }; // end of fifo_scheduler


} // end of namespace graphlab
#include <graphlab/macros_undef.hpp>

#endif