src/mpmc_queue.hpp - cassandra-cpp-driver - Git at Google

 /*
   Licensed to the Apache Software Foundation (ASF) under one
   or more contributor license agreements.  See the NOTICE file
   distributed with this work for additional information
   regarding copyright ownership.  The ASF licenses this file
   to you under the Apache License, Version 2.0 (the
   "License"); you may not use this file except in compliance
   with the License.  You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
 */

 /*
   Implementation of Dmitry Vyukov's MPMC algorithm
   http://www.1024cores.net/home/lock-free-algorithms/queues/bounded-mpmc-queue
 */

 #ifndef DATASTAX_INTERNAL_MPMC_QUEUE
 #define DATASTAX_INTERNAL_MPMC_QUEUE

 #include "allocated.hpp"
 #include "atomic.hpp"
 #include "driver_config.hpp"
 #include "macros.hpp"
 #include "scoped_ptr.hpp"
 #include "utils.hpp"

 #include <assert.h>

 namespace datastax { namespace internal { namespace core {

 template <typename T>
 class MPMCQueue : public Allocated {
 public:
   typedef T EntryType;

   MPMCQueue(size_t size)
       : size_(next_pow_2(size))
       , mask_(size_ - 1)
       , buffer_(new Node[size_])
       , tail_(0)
       , head_(0) {
     // populate the sequence initial values
     for (size_t i = 0; i < size_; ++i) {
       buffer_[i].seq.store(i, MEMORY_ORDER_RELAXED);
     }
   }

   bool enqueue(const T& data) {
     // head_seq_ only wraps at MAX(head_seq_) instead we use a mask to
     // convert the sequence to an array index this is why the ring
     // buffer must be a size which is a power of 2. this also allows
     // the sequence to double as a ticket/lock.
     size_t pos = tail_.load(MEMORY_ORDER_RELAXED);
     Node* node;

     for (;;) {
       node = &buffer_[pos & mask_];
       size_t node_seq = node->seq.load(MEMORY_ORDER_ACQUIRE);
       intptr_t dif = (intptr_t)node_seq - (intptr_t)pos;

       // if seq and head_seq are the same then it means this slot is empty
       if (dif == 0) {
         // claim our spot by moving head if head isn't the same as we
         // last checked then that means someone beat us to the punch
         // weak compare is faster, but can return spurious results
         // which in this instance is OK, because it's in the loop
         if (tail_.compare_exchange_weak(pos, pos + 1, MEMORY_ORDER_RELAXED)) {
           break;
         }
       } else if (dif < 0) {
         // if seq is less than head seq then it means this slot is
         // full and therefore the buffer is full
         return false;
       } else {
         // under normal circumstances this branch should never be taken
         pos = tail_.load(MEMORY_ORDER_RELAXED);
       }
     }

     // set the data
     node->data = data;
     // increment the sequence so that the tail knows it's accessible
     node->seq.store(pos + 1, MEMORY_ORDER_RELEASE);
     return true;
   }

   bool dequeue(T& data) {
     size_t pos = head_.load(MEMORY_ORDER_RELAXED);
     Node* node;

     for (;;) {
       node = &buffer_[pos & mask_];
       size_t node_seq = node->seq.load(MEMORY_ORDER_ACQUIRE);
       intptr_t dif = (intptr_t)node_seq - (intptr_t)(pos + 1);

       // if seq and head_seq are the same then it means this slot is empty
       if (dif == 0) {
         // claim our spot by moving head if head isn't the same as we
         // last checked then that means someone beat us to the punch
         // weak compare is faster, but can return spurious results
         // which in this instance is OK, because it's in the loop
         if (head_.compare_exchange_weak(pos, pos + 1, MEMORY_ORDER_RELAXED)) {
           break;
         }
       } else if (dif < 0) {
         // if seq is less than head seq then it means this slot is
         // full and therefore the buffer is full
         return false;
       } else {
         // under normal circumstances this branch should never be taken
         pos = head_.load(MEMORY_ORDER_RELAXED);
       }
     }

     // set the output
     data = node->data;
     // set the sequence to what the head sequence should be next
     // time around
     node->seq.store(pos + mask_ + 1, MEMORY_ORDER_RELEASE);
     return true;
   }

   bool is_empty() const {
     size_t pos = head_.load(MEMORY_ORDER_RELAXED);
     const Node* node = &buffer_[pos & mask_];
     size_t node_seq = node->seq.load(MEMORY_ORDER_ACQUIRE);
     return (intptr_t)node_seq - (intptr_t)(pos + 1) < 0;
   }

   static void memory_fence() {
 #if defined(HAVE_BOOST_ATOMIC) || defined(HAVE_STD_ATOMIC)
     atomic_thread_fence(MEMORY_ORDER_SEQ_CST);
 #endif
   }

 private:
   struct Node : public Allocated {
     Atomic<size_t> seq;
     T data;
   };

   // it's either 32 or 64 so 64 is good enough
   typedef char CachePad[64];

   CachePad pad0_;
   const size_t size_;
   const size_t mask_;
   ScopedArray<Node> buffer_;
   CachePad pad1_;
   Atomic<size_t> tail_;
   CachePad pad2_;
   Atomic<size_t> head_;
   CachePad pad3_;

   DISALLOW_COPY_AND_ASSIGN(MPMCQueue);
 };

 }}} // namespace datastax::internal::core

 #endif
	/*
	Licensed to the Apache Software Foundation (ASF) under one
	or more contributor license agreements. See the NOTICE file
	distributed with this work for additional information
	regarding copyright ownership. The ASF licenses this file
	to you under the Apache License, Version 2.0 (the
	"License"); you may not use this file except in compliance
	with the License. You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

	Unless required by applicable law or agreed to in writing, software
	distributed under the License is distributed on an "AS IS" BASIS,
	WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	See the License for the specific language governing permissions and
	limitations under the License.
	*/

	/*
	Implementation of Dmitry Vyukov's MPMC algorithm
	http://www.1024cores.net/home/lock-free-algorithms/queues/bounded-mpmc-queue
	*/

	#ifndef DATASTAX_INTERNAL_MPMC_QUEUE
	#define DATASTAX_INTERNAL_MPMC_QUEUE

	#include "allocated.hpp"
	#include "atomic.hpp"
	#include "driver_config.hpp"
	#include "macros.hpp"
	#include "scoped_ptr.hpp"
	#include "utils.hpp"

	#include <assert.h>

	namespace datastax { namespace internal { namespace core {

	template <typename T>
	class MPMCQueue : public Allocated {
	public:
	typedef T EntryType;

	MPMCQueue(size_t size)
	: size_(next_pow_2(size))
	, mask_(size_ - 1)
	, buffer_(new Node[size_])
	, tail_(0)
	, head_(0) {
	// populate the sequence initial values
	for (size_t i = 0; i < size_; ++i) {
	buffer_[i].seq.store(i, MEMORY_ORDER_RELAXED);
	}
	}

	bool enqueue(const T& data) {
	// head_seq_ only wraps at MAX(head_seq_) instead we use a mask to
	// convert the sequence to an array index this is why the ring
	// buffer must be a size which is a power of 2. this also allows
	// the sequence to double as a ticket/lock.
	size_t pos = tail_.load(MEMORY_ORDER_RELAXED);
	Node* node;

	for (;;) {
	node = &buffer_[pos & mask_];
	size_t node_seq = node->seq.load(MEMORY_ORDER_ACQUIRE);
	intptr_t dif = (intptr_t)node_seq - (intptr_t)pos;

	// if seq and head_seq are the same then it means this slot is empty
	if (dif == 0) {
	// claim our spot by moving head if head isn't the same as we
	// last checked then that means someone beat us to the punch
	// weak compare is faster, but can return spurious results
	// which in this instance is OK, because it's in the loop
	if (tail_.compare_exchange_weak(pos, pos + 1, MEMORY_ORDER_RELAXED)) {
	break;
	}
	} else if (dif < 0) {
	// if seq is less than head seq then it means this slot is
	// full and therefore the buffer is full
	return false;
	} else {
	// under normal circumstances this branch should never be taken
	pos = tail_.load(MEMORY_ORDER_RELAXED);
	}
	}

	// set the data
	node->data = data;
	// increment the sequence so that the tail knows it's accessible
	node->seq.store(pos + 1, MEMORY_ORDER_RELEASE);
	return true;
	}

	bool dequeue(T& data) {
	size_t pos = head_.load(MEMORY_ORDER_RELAXED);
	Node* node;

	for (;;) {
	node = &buffer_[pos & mask_];
	size_t node_seq = node->seq.load(MEMORY_ORDER_ACQUIRE);
	intptr_t dif = (intptr_t)node_seq - (intptr_t)(pos + 1);

	// if seq and head_seq are the same then it means this slot is empty
	if (dif == 0) {
	// claim our spot by moving head if head isn't the same as we
	// last checked then that means someone beat us to the punch
	// weak compare is faster, but can return spurious results
	// which in this instance is OK, because it's in the loop
	if (head_.compare_exchange_weak(pos, pos + 1, MEMORY_ORDER_RELAXED)) {
	break;
	}
	} else if (dif < 0) {
	// if seq is less than head seq then it means this slot is
	// full and therefore the buffer is full
	return false;
	} else {
	// under normal circumstances this branch should never be taken
	pos = head_.load(MEMORY_ORDER_RELAXED);
	}
	}

	// set the output
	data = node->data;
	// set the sequence to what the head sequence should be next
	// time around
	node->seq.store(pos + mask_ + 1, MEMORY_ORDER_RELEASE);
	return true;
	}

	bool is_empty() const {
	size_t pos = head_.load(MEMORY_ORDER_RELAXED);
	const Node* node = &buffer_[pos & mask_];
	size_t node_seq = node->seq.load(MEMORY_ORDER_ACQUIRE);
	return (intptr_t)node_seq - (intptr_t)(pos + 1) < 0;
	}

	static void memory_fence() {
	#if defined(HAVE_BOOST_ATOMIC) \|\| defined(HAVE_STD_ATOMIC)
	atomic_thread_fence(MEMORY_ORDER_SEQ_CST);
	#endif
	}

	private:
	struct Node : public Allocated {
	Atomic<size_t> seq;
	T data;
	};

	// it's either 32 or 64 so 64 is good enough
	typedef char CachePad[64];

	CachePad pad0_;
	const size_t size_;
	const size_t mask_;
	ScopedArray<Node> buffer_;
	CachePad pad1_;
	Atomic<size_t> tail_;
	CachePad pad2_;
	Atomic<size_t> head_;
	CachePad pad3_;

	DISALLOW_COPY_AND_ASSIGN(MPMCQueue);
	};

	}}} // namespace datastax::internal::core

	#endif