Uses different pass count for different parallel queue test cases
[libcds.git] / cds / container / weak_ringbuffer.h
index 17b249b0a6c2f6d13149dfc54a519b6061129bf5..0198c0327de928875f71aed9ff2313b85f9c272d 100644 (file)
@@ -96,7 +96,7 @@ namespace cds { namespace container {
             - \p opt::memory_model - C++ memory ordering model. Can be \p opt::v::relaxed_ordering (relaxed memory model, the default)
                 or \p opt::v::sequential_consistent (sequentially consisnent memory model).
 
-            Example: declare \p %WeakRingBuffer with static iternal buffer of size 1024:
+            Example: declare \p %WeakRingBuffer with static iternal buffer for 1024 objects:
             \code
             typedef cds::container::WeakRingBuffer< Foo,
                 typename cds::container::weak_ringbuffer::make_traits<
@@ -126,6 +126,13 @@ namespace cds { namespace container {
 
         Ring buffer is a bounded queue. Additionally, \p %WeakRingBuffer supports batch operations -
         you can push/pop an array of elements.
+
+        There are a specialization \ref cds_nonintrusive_WeakRingBuffer_void "WeakRingBuffer<void, Traits>"
+        that is not a queue but a "memory pool" between producer and consumer threads.
+        \p WeakRingBuffer<void> supports variable-sized data.
+
+        @warning: \p %WeakRingBuffer is developed for 64-bit architecture.
+        32-bit platform must provide support for 64-bit atomics.
     */
     template <typename T, typename Traits = weak_ringbuffer::traits>
     class WeakRingBuffer: public cds::bounded_container
@@ -150,6 +157,7 @@ namespace cds { namespace container {
     private:
         //@cond
         typedef typename traits::buffer::template rebind< value_type >::other buffer;
+        typedef uint64_t    counter_type;
         //@endcond
 
     public:
@@ -174,8 +182,8 @@ namespace cds { namespace container {
         ~WeakRingBuffer()
         {
             value_cleaner cleaner;
-            size_t back = back_.load( memory_model::memory_order_relaxed );
-            for ( size_t front = front_.load( memory_model::memory_order_relaxed ); front != back; ++front )
+            counter_type back = back_.load( memory_model::memory_order_relaxed );
+            for ( counter_type front = front_.load( memory_model::memory_order_relaxed ); front != back; ++front )
                 cleaner( buffer_[ buffer_.mod( front ) ] );
         }
 
@@ -193,7 +201,7 @@ namespace cds { namespace container {
             \code
             cds::container::WeakRingBuffer<std::string> ringbuf;
             char const* arr[10];
-            ringbuf.push( arr, 10, 
+            ringbuf.push( arr, 10,
                 []( std::string& element, char const* src ) {
                     new( &element ) std::string( src );
                 });
@@ -208,21 +216,21 @@ namespace cds { namespace container {
                 });
             \endcode
 
-            Returns \p true if success or \p false if not enought sufficient space in the ring
+            Returns \p true if success or \p false if not enough space in the ring
         */
         template <typename Q, typename CopyFunc>
         bool push( Q* arr, size_t count, CopyFunc copy )
         {
-            assert( count < capacity() );
-            size_t back = back_.load( memory_model::memory_order_relaxed );
+            assert( count < capacity());
+            counter_type back = back_.load( memory_model::memory_order_relaxed );
 
-            assert( back - pfront_ <= capacity() );
+            assert( static_cast<size_t>( back - pfront_ ) <= capacity());
 
-            if ( pfront_ + capacity() - back < count ) {
+            if ( static_cast<size_t>( pfront_ + capacity() - back ) < count ) {
                 pfront_ = front_.load( memory_model::memory_order_acquire );
 
-                if ( pfront_ + capacity() - back < count ) {
-                    // not enought space
+                if ( static_cast<size_t>( pfront_ + capacity() - back ) < count ) {
+                    // not enough space
                     return false;
                 }
             }
@@ -246,7 +254,7 @@ namespace cds { namespace container {
             The function is available only if <tt>std::is_constructible<value_type, Q>::value</tt>
             is \p true.
 
-            Returns \p true if success or \p false if not enought sufficient space in the ring
+            Returns \p true if success or \p false if not enough space in the ring
         */
         template <typename Q>
         typename std::enable_if< std::is_constructible<value_type, Q>::value, bool>::type
@@ -266,15 +274,15 @@ namespace cds { namespace container {
         typename std::enable_if< std::is_constructible<value_type, Args...>::value, bool>::type
         emplace( Args&&... args )
         {
-            size_t back = back_.load( memory_model::memory_order_relaxed );
+            counter_type back = back_.load( memory_model::memory_order_relaxed );
 
-            assert( back - pfront_ <= capacity() );
+            assert( static_cast<size_t>( back - pfront_ ) <= capacity());
 
             if ( pfront_ + capacity() - back < 1 ) {
                 pfront_ = front_.load( memory_model::memory_order_acquire );
 
                 if ( pfront_ + capacity() - back < 1 ) {
-                    // not enought space
+                    // not enough space
                     return false;
                 }
             }
@@ -299,15 +307,15 @@ namespace cds { namespace container {
         template <typename Func>
         bool enqueue_with( Func f )
         {
-            size_t back = back_.load( memory_model::memory_order_relaxed );
+            counter_type back = back_.load( memory_model::memory_order_relaxed );
 
-            assert( back - pfront_ <= capacity() );
+            assert( static_cast<size_t>( back - pfront_ ) <= capacity());
 
             if ( pfront_ + capacity() - back < 1 ) {
                 pfront_ = front_.load( memory_model::memory_order_acquire );
 
                 if ( pfront_ + capacity() - back < 1 ) {
-                    // not enought space
+                    // not enough space
                     return false;
                 }
             }
@@ -364,19 +372,19 @@ namespace cds { namespace container {
             void copy_func( Q& dest, value_type& elemen );
             \endcode
 
-            Returns \p true if success or \p false if not enought sufficient space in the ring
+            Returns \p true if success or \p false if not enough space in the ring
         */
         template <typename Q, typename CopyFunc>
         bool pop( Q* arr, size_t count, CopyFunc copy )
         {
-            assert( count < capacity() );
+            assert( count < capacity());
 
-            size_t front = front_.load( memory_model::memory_order_relaxed );
-            assert( cback_ - front < capacity() );
+            counter_type front = front_.load( memory_model::memory_order_relaxed );
+            assert( static_cast<size_t>( cback_ - front ) < capacity());
 
-            if ( cback_ - front < count ) {
+            if ( static_cast<size_t>( cback_ - front ) < count ) {
                 cback_ = back_.load( memory_model::memory_order_acquire );
-                if ( cback_ - front < count )
+                if ( static_cast<size_t>( cback_ - front ) < count )
                     return false;
             }
 
@@ -402,7 +410,7 @@ namespace cds { namespace container {
             The function is available only if <tt>std::is_assignable<Q&, value_type const&>::value</tt>
             is \p true.
 
-            Returns \p true if success or \p false if not enought sufficient space in the ring
+            Returns \p true if success or \p false if not enough space in the ring
         */
         template <typename Q>
         typename std::enable_if< std::is_assignable<Q&, value_type const&>::value, bool>::type
@@ -449,8 +457,8 @@ namespace cds { namespace container {
         template <typename Func>
         bool dequeue_with( Func f )
         {
-            size_t front = front_.load( memory_model::memory_order_relaxed );
-            assert( cback_ - front < capacity() );
+            counter_type front = front_.load( memory_model::memory_order_relaxed );
+            assert( static_cast<size_t>( cback_ - front ) < capacity());
 
             if ( cback_ - front < 1 ) {
                 cback_ = back_.load( memory_model::memory_order_acquire );
@@ -482,8 +490,8 @@ namespace cds { namespace container {
         */
         value_type* front()
         {
-            size_t front = front_.load( memory_model::memory_order_relaxed );
-            assert( cback_ - front < capacity() );
+            counter_type front = front_.load( memory_model::memory_order_relaxed );
+            assert( static_cast<size_t>( cback_ - front ) < capacity());
 
             if ( cback_ - front < 1 ) {
                 cback_ = back_.load( memory_model::memory_order_acquire );
@@ -501,8 +509,8 @@ namespace cds { namespace container {
         */
         bool pop_front()
         {
-            size_t front = front_.load( memory_model::memory_order_relaxed );
-            assert( cback_ - front <= capacity() );
+            counter_type front = front_.load( memory_model::memory_order_relaxed );
+            assert( static_cast<size_t>( cback_ - front ) <= capacity());
 
             if ( cback_ - front < 1 ) {
                 cback_ = back_.load( memory_model::memory_order_acquire );
@@ -517,13 +525,411 @@ namespace cds { namespace container {
             return true;
         }
 
-        /// Clears the ring buffer
+        /// Clears the ring buffer (only consumer can call this function!)
         void clear()
         {
             value_type v;
-            while ( pop( v ) );
+            while ( pop( v ));
+        }
+
+        /// Checks if the ring-buffer is empty
+        bool empty() const
+        {
+            return front_.load( memory_model::memory_order_relaxed ) == back_.load( memory_model::memory_order_relaxed );
+        }
+
+        /// Checks if the ring-buffer is full
+        bool full() const
+        {
+            return back_.load( memory_model::memory_order_relaxed ) - front_.load( memory_model::memory_order_relaxed ) >= capacity();
+        }
+
+        /// Returns the current size of ring buffer
+        size_t size() const
+        {
+            return static_cast<size_t>( back_.load( memory_model::memory_order_relaxed ) - front_.load( memory_model::memory_order_relaxed ));
+        }
+
+        /// Returns capacity of the ring buffer
+        size_t capacity() const
+        {
+            return buffer_.capacity();
+        }
+
+    private:
+        //@cond
+        atomics::atomic<counter_type>   front_;
+        typename opt::details::apply_padding< atomics::atomic<counter_type>, traits::padding >::padding_type pad1_;
+        atomics::atomic<counter_type>   back_;
+        typename opt::details::apply_padding< atomics::atomic<counter_type>, traits::padding >::padding_type pad2_;
+        counter_type                    pfront_;
+        typename opt::details::apply_padding< counter_type, traits::padding >::padding_type pad3_;
+        counter_type                    cback_;
+        typename opt::details::apply_padding< counter_type, traits::padding >::padding_type pad4_;
+
+        buffer                      buffer_;
+        //@endcond
+    };
+
+
+    /// Single-producer single-consumer ring buffer for untyped variable-sized data
+    /** @ingroup cds_nonintrusive_queue
+        @anchor cds_nonintrusive_WeakRingBuffer_void
+
+        This SPSC ring-buffer is intended for data of variable size. The producer
+        allocates a buffer from ring, you fill it with data and pushes them back to ring.
+        The consumer thread reads data from front-end and then pops them:
+        \code
+        // allocates 1M ring buffer
+        WeakRingBuffer<void>    theRing( 1024 * 1024 );
+
+        void producer_thread()
+        {
+            // Get data of size N bytes
+            size_t size;
+            void*  data;
+
+            while ( true ) {
+                // Get external data
+                std::tie( data, size ) = get_data();
+
+                if ( data == nullptr )
+                    break;
+
+                // Allocates a buffer from the ring
+                void* buf = theRing.back( size );
+                if ( !buf ) {
+                    std::cout << "The ring is full" << std::endl;
+                    break;
+                }
+
+                memcpy( buf, data, size );
+
+                // Push data into the ring
+                theRing.push_back();
+            }
+        }
+
+        void consumer_thread()
+        {
+            while ( true ) {
+                auto buf = theRing.front();
+
+                if ( buf.first == nullptr ) {
+                    std::cout << "The ring is empty" << std::endl;
+                    break;
+                }
+
+                // Process data
+                process_data( buf.first, buf.second );
+
+                // Free buffer
+                theRing.pop_front();
+            }
+        }
+        \endcode
+
+        @warning: \p %WeakRingBuffer is developed for 64-bit architecture.
+        32-bit platform must provide support for 64-bit atomics.
+    */
+#ifdef CDS_DOXYGEN_INVOKED
+    template <typename Traits = weak_ringbuffer::traits>
+#else
+    template <typename Traits>
+#endif
+    class WeakRingBuffer<void, Traits>: public cds::bounded_container
+    {
+    public:
+        typedef Traits      traits;         ///< Ring buffer traits
+        typedef typename    traits::memory_model  memory_model;  ///< Memory ordering. See \p cds::opt::memory_model option
+
+    private:
+        //@cond
+        typedef typename traits::buffer::template rebind< uint8_t >::other buffer;
+        typedef uint64_t    counter_type;
+        //@endcond
+
+    public:
+        /// Creates the ring buffer of \p capacity bytes
+        /**
+            For \p cds::opt::v::uninitialized_static_buffer the \p nCapacity parameter is ignored.
+
+            If the buffer capacity is a power of two, lightweight binary arithmetics is used
+            instead of modulo arithmetics.
+        */
+        WeakRingBuffer( size_t capacity = 0 )
+            : front_( 0 )
+            , pfront_( 0 )
+            , cback_( 0 )
+            , buffer_( capacity )
+        {
+            back_.store( 0, memory_model::memory_order_release );
+        }
+
+        /// [producer] Reserve \p size bytes
+        /**
+            The function returns a pointer to reserved buffer of \p size bytes.
+            If no enough space in the ring buffer the function returns \p nullptr.
+
+            After successful \p %back() you should fill the buffer provided and call \p push_back():
+            \code
+            // allocates 1M ring buffer
+            WeakRingBuffer<void>    theRing( 1024 * 1024 );
+
+            void producer_thread()
+            {
+                // Get data of size N bytes
+                size_t size;1
+                void*  data;
+
+                while ( true ) {
+                    // Get external data
+                    std::tie( data, size ) = get_data();
+
+                    if ( data == nullptr )
+                        break;
+
+                    // Allocates a buffer from the ring
+                    void* buf = theRing.back( size );
+                    if ( !buf ) {
+                        std::cout << "The ring is full" << std::endl;
+                        break;
+                    }
+
+                    memcpy( buf, data, size );
+
+                    // Push data into the ring
+                    theRing.push_back();
+                }
+            }
+            \endcode
+        */
+        void* back( size_t size )
+        {
+            assert( size > 0 );
+
+            // Any data is rounded to 8-byte boundary
+            size_t real_size = calc_real_size( size );
+
+            // check if we can reserve read_size bytes
+            assert( real_size < capacity());
+            counter_type back = back_.load( memory_model::memory_order_relaxed );
+
+            assert( static_cast<size_t>( back - pfront_ ) <= capacity());
+
+            if ( static_cast<size_t>( pfront_ + capacity() - back ) < real_size ) {
+                pfront_ = front_.load( memory_model::memory_order_acquire );
+
+                if ( static_cast<size_t>( pfront_ + capacity() - back ) < real_size ) {
+                    // not enough space
+                    return nullptr;
+                }
+            }
+
+            uint8_t* reserved = buffer_.buffer() + buffer_.mod( back );
+
+            // Check if the buffer free space is enough for storing real_size bytes
+            size_t tail_size = capacity() - static_cast<size_t>( buffer_.mod( back ));
+            if ( tail_size < real_size ) {
+                // make unused tail
+                assert( tail_size >= sizeof( size_t ));
+                assert( !is_tail( tail_size ));
+
+                *reinterpret_cast<size_t*>( reserved ) = make_tail( tail_size - sizeof(size_t));
+                back += tail_size;
+
+                // We must be in beginning of buffer
+                assert( buffer_.mod( back ) == 0 );
+
+                if ( static_cast<size_t>( pfront_ + capacity() - back ) < real_size ) {
+                    pfront_ = front_.load( memory_model::memory_order_acquire );
+
+                    if ( static_cast<size_t>( pfront_ + capacity() - back ) < real_size ) {
+                        // not enough space
+                        return nullptr;
+                    }
+                }
+
+                back_.store( back, memory_model::memory_order_release );
+                reserved = buffer_.buffer();
+            }
+
+            // reserve and store size
+            *reinterpret_cast<size_t*>( reserved ) = size;
+
+            return reinterpret_cast<void*>( reserved + sizeof( size_t ));
+        }
+
+        /// [producer] Push reserved bytes into ring
+        /**
+            The function pushes reserved buffer into the ring. Afte this call,
+            the buffer becomes visible by a consumer:
+            \code
+            // allocates 1M ring buffer
+            WeakRingBuffer<void>    theRing( 1024 * 1024 );
+
+            void producer_thread()
+            {
+                // Get data of size N bytes
+                size_t size;1
+                void*  data;
+
+                while ( true ) {
+                    // Get external data
+                    std::tie( data, size ) = get_data();
+
+                    if ( data == nullptr )
+                        break;
+
+                    // Allocates a buffer from the ring
+                    void* buf = theRing.back( size );
+                    if ( !buf ) {
+                        std::cout << "The ring is full" << std::endl;
+                        break;
+                    }
+
+                    memcpy( buf, data, size );
+
+                    // Push data into the ring
+                    theRing.push_back();
+                }
+            }
+            \endcode
+        */
+        void push_back()
+        {
+            counter_type back = back_.load( memory_model::memory_order_relaxed );
+            uint8_t* reserved = buffer_.buffer() + buffer_.mod( back );
+
+            size_t real_size = calc_real_size( *reinterpret_cast<size_t*>( reserved ));
+            assert( real_size < capacity());
+
+            back_.store( back + real_size, memory_model::memory_order_release );
+        }
+
+        /// [producer] Push \p data of \p size bytes into ring
+        /**
+            This function invokes \p back( size ), \p memcpy( buf, data, size )
+            and \p push_back() in one call.
+        */
+        bool push_back( void const* data, size_t size )
+        {
+            void* buf = back( size );
+            if ( buf ) {
+                memcpy( buf, data, size );
+                push_back();
+                return true;
+            }
+            return false;
+        }
+
+        /// [consumer] Get top data from the ring
+        /**
+            If the ring is empty, the function returns \p nullptr in \p std:pair::first.
+        */
+        std::pair<void*, size_t> front()
+        {
+            counter_type front = front_.load( memory_model::memory_order_relaxed );
+            assert( static_cast<size_t>( cback_ - front ) < capacity());
+
+            if ( cback_ - front < sizeof( size_t )) {
+                cback_ = back_.load( memory_model::memory_order_acquire );
+                if ( cback_ - front < sizeof( size_t ))
+                    return std::make_pair( nullptr, 0u );
+            }
+
+            uint8_t * buf = buffer_.buffer() + buffer_.mod( front );
+
+            // check alignment
+            assert( ( reinterpret_cast<uintptr_t>( buf ) & ( sizeof( uintptr_t ) - 1 )) == 0 );
+
+            size_t size = *reinterpret_cast<size_t*>( buf );
+            if ( is_tail( size )) {
+                // unused tail, skip
+                CDS_VERIFY( pop_front());
+
+                front = front_.load( memory_model::memory_order_relaxed );
+                buf = buffer_.buffer() + buffer_.mod( front );
+                size = *reinterpret_cast<size_t*>( buf );
+
+                assert( !is_tail( size ));
+                assert( buf == buffer_.buffer());
+            }
+
+#ifdef _DEBUG
+            size_t real_size = calc_real_size( size );
+            if ( static_cast<size_t>( cback_ - front ) < real_size ) {
+                cback_ = back_.load( memory_model::memory_order_acquire );
+                assert( static_cast<size_t>( cback_ - front ) >= real_size );
+            }
+#endif
+
+            return std::make_pair( reinterpret_cast<void*>( buf + sizeof( size_t )), size );
+        }
+
+        /// [consumer] Pops top data
+        /**
+            Typical consumer workloop:
+            \code
+            // allocates 1M ring buffer
+            WeakRingBuffer<void>    theRing( 1024 * 1024 );
+
+            void consumer_thread()
+            {
+                while ( true ) {
+                    auto buf = theRing.front();
+
+                    if ( buf.first == nullptr ) {
+                        std::cout << "The ring is empty" << std::endl;
+                        break;
+                    }
+
+                    // Process data
+                    process_data( buf.first, buf.second );
+
+                    // Free buffer
+                    theRing.pop_front();
+                }
+            }
+            \endcode
+        */
+        bool pop_front()
+        {
+            counter_type front = front_.load( memory_model::memory_order_relaxed );
+            assert( static_cast<size_t>( cback_ - front ) <= capacity());
+
+            if ( cback_ - front < sizeof(size_t)) {
+                cback_ = back_.load( memory_model::memory_order_acquire );
+                if ( cback_ - front < sizeof( size_t ))
+                    return false;
+            }
+
+            uint8_t * buf = buffer_.buffer() + buffer_.mod( front );
+
+            // check alignment
+            assert( ( reinterpret_cast<uintptr_t>( buf ) & ( sizeof( uintptr_t ) - 1 )) == 0 );
+
+            size_t size = *reinterpret_cast<size_t*>( buf );
+            size_t real_size = calc_real_size( untail( size ));
+
+#ifdef _DEBUG
+            if ( static_cast<size_t>( cback_ - front ) < real_size ) {
+                cback_ = back_.load( memory_model::memory_order_acquire );
+                assert( static_cast<size_t>( cback_ - front ) >= real_size );
+            }
+#endif
+
+            front_.store( front + real_size, memory_model::memory_order_release );
+            return true;
+
         }
 
+        /// [consumer] Clears the ring buffer
+        void clear()
+        {
+            for ( auto el = front(); el.first; el = front())
+                pop_front();
+        }
 
         /// Checks if the ring-buffer is empty
         bool empty() const
@@ -540,7 +946,7 @@ namespace cds { namespace container {
         /// Returns the current size of ring buffer
         size_t size() const
         {
-            return back_.load( memory_model::memory_order_relaxed ) - front_.load( memory_model::memory_order_relaxed );
+            return static_cast<size_t>( back_.load( memory_model::memory_order_relaxed ) - front_.load( memory_model::memory_order_relaxed ));
         }
 
         /// Returns capacity of the ring buffer
@@ -551,14 +957,42 @@ namespace cds { namespace container {
 
     private:
         //@cond
-        atomics::atomic<size_t>     front_;
-        typename opt::details::apply_padding< atomics::atomic<size_t>, traits::padding >::padding_type pad1_;
-        atomics::atomic<size_t>     back_;
-        typename opt::details::apply_padding< atomics::atomic<size_t>, traits::padding >::padding_type pad2_;
-        size_t                      pfront_;
-        typename opt::details::apply_padding< size_t, traits::padding >::padding_type pad3_;
-        size_t                      cback_;
-        typename opt::details::apply_padding< size_t, traits::padding >::padding_type pad4_;
+        static size_t calc_real_size( size_t size )
+        {
+            size_t real_size =  (( size + sizeof( uintptr_t ) - 1 ) & ~( sizeof( uintptr_t ) - 1 )) + sizeof( size_t );
+
+            assert( real_size > size );
+            assert( real_size - size >= sizeof( size_t ));
+
+            return real_size;
+        }
+
+        static bool is_tail( size_t size )
+        {
+            return ( size & ( size_t( 1 ) << ( sizeof( size_t ) * 8 - 1 ))) != 0;
+        }
+
+        static size_t make_tail( size_t size )
+        {
+            return size | ( size_t( 1 ) << ( sizeof( size_t ) * 8 - 1 ));
+        }
+
+        static size_t untail( size_t size )
+        {
+            return size & (( size_t( 1 ) << ( sizeof( size_t ) * 8 - 1 )) - 1);
+        }
+        //@endcond
+
+    private:
+        //@cond
+        atomics::atomic<counter_type>     front_;
+        typename opt::details::apply_padding< atomics::atomic<counter_type>, traits::padding >::padding_type pad1_;
+        atomics::atomic<counter_type>     back_;
+        typename opt::details::apply_padding< atomics::atomic<counter_type>, traits::padding >::padding_type pad2_;
+        counter_type                      pfront_;
+        typename opt::details::apply_padding< counter_type, traits::padding >::padding_type pad3_;
+        counter_type                      cback_;
+        typename opt::details::apply_padding< counter_type, traits::padding >::padding_type pad4_;
 
         buffer                      buffer_;
         //@endcond