/*
- * Copyright 2016 Facebook, Inc.
+ * Copyright 2017 Facebook, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* limitations under the License.
*/
-/*************************************************
-
-IF YOU HAVE TO ASK, NO, YOU DO NOT WANT A SPINLOCK.
-
-Yes, even if a microbench shows that a spinlock is faster, you still probably
-don't want one.
-
-Spinlocks in general are a big problem on systems for which you cannot disable
-preemption, like normal user-space code running on POXIX and Windows
-platforms. If the thread holding a spinlock is preempted, another thread
-trying to acquire the lock and pounding the lock variable
-has no idea that it's spinning in vain. Some spinlock implementations use
-sched_yield or similar to try to make this problem less severe --- we don't
-use the rest of our timeslice to pointlessly read a variable ---
-but the overall result is still poor, especially if the thread locking the lock
-sleeps (which any thread can do on a demand-paging system), then we'll
-sched_yield over and over again, still pointlessly, pounding on the lock.
-
-You really want a plain old mutex. Regular mutexes will spin for a little while,
-then go to sleep. While sleeping, threads use no CPU resources and do
-not cause scheduler contention.
-
-There are exceptions to the above warning. If you have to ask, no, your
-code doesn't qualify.
-
-
-STOP USING SPINLOCKS IN ORDINARY CODE.
-
-
-**************************************************/
-
/*
+ * N.B. You most likely do _not_ want to use RWSpinLock or any other
+ * kind of spinlock. Use SharedMutex instead.
+ *
+ * In short, spinlocks have serious problems on preemptive
+ * multi-tasking operating systems, and fast mutexes like SharedMutex
+ * are almost certainly the better choice: letting the OS scheduler
+ * put a thread to sleep is better for system responsiveness and
+ * throughput than wasting a timeslice repeatedly polling a lock whose
+ * holder has been preempted or is blocked, and userspace code cannot
+ * prevent that from happening.
+ *
+ * Spinlocks in an operating system kernel make much more sense than
+ * they do in userspace.
+ *
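+ * As a minimal sketch of the preferred alternative (assuming
+ * <folly/SharedMutex.h>; the std lock adapters work because
+ * SharedMutex models the standard shared-mutex interface):
+ *
+ *   folly::SharedMutex mutex;
+ *
+ *   void reader() {
+ *     std::shared_lock<folly::SharedMutex> guard(mutex); // shared
+ *     // ... read the protected state ...
+ *   }
+ *
+ *   void writer() {
+ *     std::unique_lock<folly::SharedMutex> guard(mutex); // exclusive
+ *     // ... mutate the protected state ...
+ *   }
+ *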
+ * -------------------------------------------------------------------
+ *
* Two Read-Write spin lock implementations.
*
* Ref: http://locklessinc.com/articles/locks
* are very compact (4/8 bytes), so are suitable for per-instance
* based locking, particularly when contention is not expected.
*
- * In most cases, RWSpinLock is a reasonable choice. It has minimal
- * overhead, and comparable contention performance when the number of
- * competing threads is less than or equal to the number of logical
- * CPUs. Even as the number of threads gets larger, RWSpinLock can
- * still be very competitive in READ, although it is slower on WRITE,
- * and also inherently unfair to writers.
+ * For a spinlock, RWSpinLock is a reasonable choice. (See the note
+ * above for why a spin lock is frequently a bad idea in general.)
+ * RWSpinLock has minimal overhead, and comparable contention
+ * performance when the number of competing threads is less than or
+ * equal to the number of logical CPUs. Even as the number of
+ * threads gets larger, RWSpinLock can still be very competitive in
+ * READ, although it is slower on WRITE, and also inherently unfair
+ * to writers.
*
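+ * A minimal usage sketch with the RAII holders defined later in this
+ * header:
+ *
+ *   folly::RWSpinLock lock;
+ *
+ *   {
+ *     folly::RWSpinLock::ReadHolder guard(&lock); // shared
+ *     // ... read ...
+ *   }
+ *   {
+ *     folly::RWSpinLock::WriteHolder guard(&lock); // exclusive
+ *     // ... write ...
+ *   }
+ *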
* RWTicketSpinLock shows more balanced READ/WRITE performance. If
* your application really needs a lot more threads, and a
* @author Xin Liu <xliux@fb.com>
*/
-#ifndef FOLLY_RWSPINLOCK_H_
-#define FOLLY_RWSPINLOCK_H_
+#pragma once
/*
========================================================================
*/
#include <folly/Portability.h>
+#include <folly/portability/Asm.h>
-#if defined(__GNUC__) && \
- (defined(__i386) || FOLLY_X64 || \
- defined(ARCH_K8))
-# define RW_SPINLOCK_USE_X86_INTRINSIC_
-# include <x86intrin.h>
+#if defined(__GNUC__) && (defined(__i386) || FOLLY_X64 || defined(ARCH_K8))
+#define RW_SPINLOCK_USE_X86_INTRINSIC_
+#include <x86intrin.h>
#elif defined(_MSC_VER) && defined(FOLLY_X64)
-# define RW_SPINLOCK_USE_X86_INTRINSIC_
+#define RW_SPINLOCK_USE_X86_INTRINSIC_
#else
-# undef RW_SPINLOCK_USE_X86_INTRINSIC_
+#undef RW_SPINLOCK_USE_X86_INTRINSIC_
#endif
// iOS doesn't define _mm_cvtsi64_si128 and friends
-#if (FOLLY_SSE >= 2) && !TARGET_OS_IPHONE
+#if (FOLLY_SSE >= 2) && !FOLLY_MOBILE && FOLLY_X64
#define RW_SPINLOCK_USE_SSE_INSTRUCTIONS_
#else
#undef RW_SPINLOCK_USE_SSE_INSTRUCTIONS_
#endif
+#include <algorithm>
#include <atomic>
+#include <cstdint>
#include <string>
-#include <algorithm>
+#include <thread>
-#include <sched.h>
#include <glog/logging.h>
#include <folly/Likely.h>
// Lockable Concept
void lock() {
- int count = 0;
+ uint_fast32_t count = 0;
while (!LIKELY(try_lock())) {
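+ // If the lock holder has been preempted, further spinning only burns
+ // our timeslice, so yield after ~1000 failed attempts.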
- if (++count > 1000) sched_yield();
+ if (++count > 1000) {
+ std::this_thread::yield();
+ }
}
}
// SharedLockable Concept
void lock_shared() {
- int count = 0;
+ uint_fast32_t count = 0;
while (!LIKELY(try_lock_shared())) {
- if (++count > 1000) sched_yield();
+ if (++count > 1000) {
+ std::this_thread::yield();
+ }
}
}
// UpgradeLockable Concept
void lock_upgrade() {
- int count = 0;
+ uint_fast32_t count = 0;
while (!try_lock_upgrade()) {
- if (++count > 1000) sched_yield();
+ if (++count > 1000) {
+ std::this_thread::yield();
+ }
}
}
void unlock_upgrade_and_lock() {
- int64_t count = 0;
+ uint_fast32_t count = 0;
while (!try_unlock_upgrade_and_lock()) {
- if (++count > 1000) sched_yield();
+ if (++count > 1000) {
+ std::this_thread::yield();
+ }
}
}
class ReadHolder {
public:
- explicit ReadHolder(RWSpinLock* lock = nullptr) : lock_(lock) {
- if (lock_) lock_->lock_shared();
+ explicit ReadHolder(RWSpinLock* lock) : lock_(lock) {
+ if (lock_) {
+ lock_->lock_shared();
+ }
}
explicit ReadHolder(RWSpinLock& lock) : lock_(&lock) {
// down-grade
explicit ReadHolder(UpgradedHolder&& upgraded) : lock_(upgraded.lock_) {
upgraded.lock_ = nullptr;
- if (lock_) lock_->unlock_upgrade_and_lock_shared();
+ if (lock_) {
+ lock_->unlock_upgrade_and_lock_shared();
+ }
}
explicit ReadHolder(WriteHolder&& writer) : lock_(writer.lock_) {
writer.lock_ = nullptr;
- if (lock_) lock_->unlock_and_lock_shared();
+ if (lock_) {
+ lock_->unlock_and_lock_shared();
+ }
}
ReadHolder& operator=(ReadHolder&& other) {
ReadHolder(const ReadHolder& other) = delete;
ReadHolder& operator=(const ReadHolder& other) = delete;
- ~ReadHolder() { if (lock_) lock_->unlock_shared(); }
+ ~ReadHolder() {
+ if (lock_) {
+ lock_->unlock_shared();
+ }
+ }
void reset(RWSpinLock* lock = nullptr) {
- if (lock == lock_) return;
- if (lock_) lock_->unlock_shared();
+ if (lock == lock_) {
+ return;
+ }
+ if (lock_) {
+ lock_->unlock_shared();
+ }
lock_ = lock;
- if (lock_) lock_->lock_shared();
+ if (lock_) {
+ lock_->lock_shared();
+ }
}
void swap(ReadHolder* other) {
class UpgradedHolder {
public:
- explicit UpgradedHolder(RWSpinLock* lock = nullptr) : lock_(lock) {
- if (lock_) lock_->lock_upgrade();
+ explicit UpgradedHolder(RWSpinLock* lock) : lock_(lock) {
+ if (lock_) {
+ lock_->lock_upgrade();
+ }
}
explicit UpgradedHolder(RWSpinLock& lock) : lock_(&lock) {
explicit UpgradedHolder(WriteHolder&& writer) {
lock_ = writer.lock_;
writer.lock_ = nullptr;
- if (lock_) lock_->unlock_and_lock_upgrade();
+ if (lock_) {
+ lock_->unlock_and_lock_upgrade();
+ }
}
UpgradedHolder(UpgradedHolder&& other) noexcept : lock_(other.lock_) {
UpgradedHolder(const UpgradedHolder& other) = delete;
UpgradedHolder& operator =(const UpgradedHolder& other) = delete;
- ~UpgradedHolder() { if (lock_) lock_->unlock_upgrade(); }
+ ~UpgradedHolder() {
+ if (lock_) {
+ lock_->unlock_upgrade();
+ }
+ }
void reset(RWSpinLock* lock = nullptr) {
- if (lock == lock_) return;
- if (lock_) lock_->unlock_upgrade();
+ if (lock == lock_) {
+ return;
+ }
+ if (lock_) {
+ lock_->unlock_upgrade();
+ }
lock_ = lock;
- if (lock_) lock_->lock_upgrade();
+ if (lock_) {
+ lock_->lock_upgrade();
+ }
}
void swap(UpgradedHolder* other) {
class WriteHolder {
public:
- explicit WriteHolder(RWSpinLock* lock = nullptr) : lock_(lock) {
- if (lock_) lock_->lock();
+ explicit WriteHolder(RWSpinLock* lock) : lock_(lock) {
+ if (lock_) {
+ lock_->lock();
+ }
}
explicit WriteHolder(RWSpinLock& lock) : lock_(&lock) {
explicit WriteHolder(UpgradedHolder&& upgraded) {
lock_ = upgraded.lock_;
upgraded.lock_ = nullptr;
- if (lock_) lock_->unlock_upgrade_and_lock();
+ if (lock_) {
+ lock_->unlock_upgrade_and_lock();
+ }
}
WriteHolder(WriteHolder&& other) noexcept : lock_(other.lock_) {
WriteHolder(const WriteHolder& other) = delete;
WriteHolder& operator =(const WriteHolder& other) = delete;
- ~WriteHolder () { if (lock_) lock_->unlock(); }
+ ~WriteHolder() {
+ if (lock_) {
+ lock_->unlock();
+ }
+ }
void reset(RWSpinLock* lock = nullptr) {
- if (lock == lock_) return;
- if (lock_) lock_->unlock();
+ if (lock == lock_) {
+ return;
+ }
+ if (lock_) {
+ lock_->unlock();
+ }
lock_ = lock;
- if (lock_) lock_->lock();
+ if (lock_) {
+ lock_->lock();
+ }
}
void swap(WriteHolder* other) {
RWSpinLock* lock_;
};
- // Synchronized<> adaptors
- friend void acquireRead(RWSpinLock& l) { return l.lock_shared(); }
- friend void acquireReadWrite(RWSpinLock& l) { return l.lock(); }
- friend void releaseRead(RWSpinLock& l) { return l.unlock_shared(); }
- friend void releaseReadWrite(RWSpinLock& l) { return l.unlock(); }
-
private:
std::atomic<int32_t> bits_;
};
#ifdef RW_SPINLOCK_USE_SSE_INSTRUCTIONS_
static __m128i make128(const uint16_t v[4]) {
- return _mm_set_epi16(0, 0, 0, 0, v[3], v[2], v[1], v[0]);
+ return _mm_set_epi16(0, 0, 0, 0,
+ short(v[3]), short(v[2]), short(v[1]), short(v[0]));
}
static inline __m128i fromInteger(uint64_t from) {
- return _mm_cvtsi64_si128(from);
+ return _mm_cvtsi64_si128(int64_t(from));
}
static inline uint64_t toInteger(__m128i in) {
- return _mm_cvtsi128_si64(in);
+ return uint64_t(_mm_cvtsi128_si64(in));
}
static inline uint64_t addParallel(__m128i in, __m128i kDelta) {
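+ // A single vector add bumps the packed 16-bit ticket fields at once.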
return toInteger(_mm_add_epi16(in, kDelta));
#ifdef RW_SPINLOCK_USE_SSE_INSTRUCTIONS_
static __m128i make128(const uint8_t v[4]) {
- return _mm_set_epi8(0, 0, 0, 0, 0, 0, 0, 0,
- 0, 0, 0, 0, v[3], v[2], v[1], v[0]);
+ return _mm_set_epi8(
+ 0, 0, 0, 0,
+ 0, 0, 0, 0,
+ 0, 0, 0, 0,
+ char(v[3]), char(v[2]), char(v[1]), char(v[0]));
}
static inline __m128i fromInteger(uint32_t from) {
- return _mm_cvtsi32_si128(from);
+ return _mm_cvtsi32_si128(int32_t(from));
}
static inline uint32_t toInteger(__m128i in) {
- return _mm_cvtsi128_si32(in);
+ return uint32_t(_mm_cvtsi128_si32(in));
}
static inline uint32_t addParallel(__m128i in, __m128i kDelta) {
return toInteger(_mm_add_epi8(in, kDelta));
}
#endif
};
-} // detail
+} // namespace detail
-
-template<size_t kBitWidth, bool kFavorWriter=false>
+template <size_t kBitWidth, bool kFavorWriter = false>
class RWTicketSpinLockT {
typedef detail::RWTicketIntTrait<kBitWidth> IntTraitType;
typedef typename detail::RWTicketIntTrait<kBitWidth>::FullInt FullInt;
} ticket;
private: // Some x64-specific utilities for atomic access to ticket.
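+ // On x86, aligned loads already have acquire semantics and aligned
+ // stores already have release semantics; asm_volatile_memory() is
+ // only a compiler barrier against compile-time reordering.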
- template<class T> static T load_acquire(T* addr) {
+ template <class T> static T load_acquire(T* addr) {
T t = *addr; // acquire barrier
asm_volatile_memory();
return t;
}
- template<class T>
+ template <class T>
static void store_release(T* addr, T v) {
asm_volatile_memory();
*addr = v; // release barrier
bool try_lock() {
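+ // Ticket protocol: 'users' is the next ticket to hand out and 'write'
+ // is the ticket now being served; a writer may enter only when no
+ // earlier ticket holder is still inside the lock.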
RWTicket t;
FullInt old = t.whole = load_acquire(&ticket.whole);
- if (t.users != t.write) return false;
+ if (t.users != t.write) {
+ return false;
+ }
++t.users;
return __sync_bool_compare_and_swap(&ticket.whole, old, t.whole);
}
* turns.
*/
void writeLockAggressive() {
- // sched_yield() is needed here to avoid a pathology if the number
+ // std::this_thread::yield() is needed here to avoid a pathology if the number
// of threads attempting concurrent writes is >= the number of real
// cores allocated to this process. This is less likely than the
// corresponding situation in lock_shared(), but we still want to
// avoid it
- int count = 0;
+ uint_fast32_t count = 0;
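+ // Take the next ticket, then spin until the completion counter
+ // ('write') reaches it.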
QuarterInt val = __sync_fetch_and_add(&ticket.users, 1);
while (val != load_acquire(&ticket.write)) {
asm_volatile_pause();
- if (UNLIKELY(++count > 1000)) sched_yield();
+ if (UNLIKELY(++count > 1000)) {
+ std::this_thread::yield();
+ }
}
}
// there are a lot of competing readers. The aggressive spinning
// can help to avoid starving writers.
//
- // We don't worry about sched_yield() here because the caller
+ // We don't worry about std::this_thread::yield() here because the caller
// has already explicitly abandoned fairness.
while (!try_lock()) {}
}
}
void lock_shared() {
- // sched_yield() is important here because we can't grab the
+ // std::this_thread::yield() is important here because we can't grab the
// shared lock if there is a pending writeLockAggressive, so we
// need to let threads that already have a shared lock complete
- int count = 0;
+ uint_fast32_t count = 0;
while (!LIKELY(try_lock_shared())) {
asm_volatile_pause();
- if (UNLIKELY((++count & 1023) == 0)) sched_yield();
+ if (UNLIKELY((++count & 1023) == 0)) {
+ std::this_thread::yield();
+ }
}
}
}
void unlock_shared() {
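+ // Each reader advances the completion counter on release, which
+ // eventually lets a queued writer's ticket come up.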
- QuarterInt val = __sync_fetch_and_add(&ticket.write, 1);
+ __sync_fetch_and_add(&ticket.write, 1);
}
class WriteHolder;
ReadHolder(ReadHolder const&) = delete;
ReadHolder& operator=(ReadHolder const&) = delete;
- explicit ReadHolder(RWSpinLock *lock = nullptr) :
- lock_(lock) {
- if (lock_) lock_->lock_shared();
+ explicit ReadHolder(RWSpinLock* lock) : lock_(lock) {
+ if (lock_) {
+ lock_->lock_shared();
+ }
}
explicit ReadHolder(RWSpinLock &lock) : lock_ (&lock) {
- if (lock_) lock_->lock_shared();
+ if (lock_) {
+ lock_->lock_shared();
+ }
}
// atomically unlock the write-lock from writer and acquire the read-lock
}
~ReadHolder() {
- if (lock_) lock_->unlock_shared();
+ if (lock_) {
+ lock_->unlock_shared();
+ }
}
void reset(RWSpinLock *lock = nullptr) {
- if (lock_) lock_->unlock_shared();
+ if (lock_) {
+ lock_->unlock_shared();
+ }
lock_ = lock;
- if (lock_) lock_->lock_shared();
+ if (lock_) {
+ lock_->lock_shared();
+ }
}
void swap(ReadHolder *other) {
WriteHolder(WriteHolder const&) = delete;
WriteHolder& operator=(WriteHolder const&) = delete;
- explicit WriteHolder(RWSpinLock *lock = nullptr) : lock_(lock) {
- if (lock_) lock_->lock();
+ explicit WriteHolder(RWSpinLock* lock) : lock_(lock) {
+ if (lock_) {
+ lock_->lock();
+ }
}
explicit WriteHolder(RWSpinLock &lock) : lock_ (&lock) {
- if (lock_) lock_->lock();
+ if (lock_) {
+ lock_->lock();
+ }
}
~WriteHolder() {
- if (lock_) lock_->unlock();
+ if (lock_) {
+ lock_->unlock();
+ }
}
void reset(RWSpinLock *lock = nullptr) {
- if (lock == lock_) return;
- if (lock_) lock_->unlock();
+ if (lock == lock_) {
+ return;
+ }
+ if (lock_) {
+ lock_->unlock();
+ }
lock_ = lock;
- if (lock_) lock_->lock();
+ if (lock_) {
+ lock_->lock();
+ }
}
void swap(WriteHolder *other) {
friend class ReadHolder;
RWSpinLock *lock_;
};
-
- // Synchronized<> adaptors.
- friend void acquireRead(RWTicketSpinLockT& mutex) {
- mutex.lock_shared();
- }
- friend void acquireReadWrite(RWTicketSpinLockT& mutex) {
- mutex.lock();
- }
- friend void releaseRead(RWTicketSpinLockT& mutex) {
- mutex.unlock_shared();
- }
- friend void releaseReadWrite(RWTicketSpinLockT& mutex) {
- mutex.unlock();
- }
};
typedef RWTicketSpinLockT<32> RWTicketSpinLock32;
#endif // RW_SPINLOCK_USE_X86_INTRINSIC_
-} // namespace folly
+} // namespace folly
#ifdef RW_SPINLOCK_USE_X86_INTRINSIC_
#undef RW_SPINLOCK_USE_X86_INTRINSIC_
#endif
-
-#endif // FOLLY_RWSPINLOCK_H_