(wangle) fix race in Core::detachOne()

author Hans Fugal <fugalh@fb.com>

Mon, 27 Oct 2014 15:53:23 +0000 (08:53 -0700)

committer dcsommer <dcsommer@fb.com>

Wed, 29 Oct 2014 23:05:33 +0000 (16:05 -0700)
author Hans Fugal <fugalh@fb.com>
Mon, 27 Oct 2014 15:53:23 +0000 (08:53 -0700)
committer dcsommer <dcsommer@fb.com>
Wed, 29 Oct 2014 23:05:33 +0000 (16:05 -0700)
diff --git a/folly/wangle/detail/Core.h b/folly/wangle/detail/Core.h

index 9b9295d89688b2d2e2ecd4b2c64600f85c432116..f3aa6d24416d247d00e5bd6c1f7bd8ce067973dd 100644 (file)
--- a/folly/wangle/detail/Core.h
+++ b/folly/wangle/detail/Core.h
@@ -205,9 +205,10 @@ class Core : protected FSM<State> {
    }
  
    void detachOne() {
-    ++detached_;
-    assert(detached_ == 1 || detached_ == 2);
-    if (detached_ == 2) {
+    auto d = ++detached_;
+    assert(d >= 1);
+    assert(d <= 2);
+    if (d == 2) {
        // we should have already executed the callback with the value
        assert(calledBack_);
        delete this;
diff --git a/folly/wangle/detail/FSM.h b/folly/wangle/detail/FSM.h

index 95a0bcdef92f0757f02637d1906405026e5467b4..be4eb8aefb66ba2219b5304d1e62e11572c8b416 100644 (file)
--- a/folly/wangle/detail/FSM.h
+++ b/folly/wangle/detail/FSM.h
@@ -48,13 +48,14 @@ public:
    }
  
    /// Atomically do a state transition with accompanying action.
+  /// The action will see the old state.
    /// @returns true on success, false and action unexecuted otherwise
    template <class F>
    bool updateState(Enum A, Enum B, F const& action) {
      std::lock_guard<Mutex> lock(mutex_);
      if (state_ != A) return false;
-    state_ = B;
      action();
+    state_ = B;
      return true;
    }
  
@@ -82,6 +83,9 @@ public:
    ///       }
    ///       /* do unprotected stuff */
    ///       return; // or otherwise break out of the loop
+  ///
+  /// The protected action will see the old state, and the unprotected action
+  /// will see the new state.
    template <class F1, class F2>
    bool updateState(Enum A, Enum B,
                     F1 const& protectedAction, F2 const& unprotectedAction) {
diff --git a/folly/wangle/test/FSM.cpp b/folly/wangle/test/FSM.cpp

index 1ce78c2ee7779279c0fd8c957378f2431ac811ea..80ee53649d10bd702504d9ff9cc5ec535d10fdd6 100644 (file)
--- a/folly/wangle/test/FSM.cpp
+++ b/folly/wangle/test/FSM.cpp
@@ -108,8 +108,8 @@ TEST(FSM, noActionOnBadUpdate) {
    EXPECT_EQ(0, count);
  }
  
-TEST(FSM, stateTransitionBeforeAction) {
+TEST(FSM, stateTransitionAfterAction) {
    FSM<State> fsm(State::A);
    fsm.updateState(State::A, State::B,
-                  [&]{ EXPECT_EQ(State::B, fsm.getState()); });
+                  [&]{ EXPECT_EQ(State::A, fsm.getState()); });
  }
diff --git a/folly/wangle/test/FutureTest.cpp b/folly/wangle/test/FutureTest.cpp

index 877efcfb3c8c3cb0182c2341613a12738b1d97d2..0feaa50fb38fe1ab245e9e1b56009bb82a2eaa7d 100644 (file)
--- a/folly/wangle/test/FutureTest.cpp
+++ b/folly/wangle/test/FutureTest.cpp
@@ -23,6 +23,7 @@
  #include <thread>
  #include <type_traits>
  #include <unistd.h>
+#include <folly/Memory.h>
  #include <folly/wangle/Executor.h>
  #include <folly/wangle/Future.h>
  #include <folly/wangle/ManualExecutor.h>
@@ -670,7 +671,6 @@ TEST(Future, waitWithSemaphore) {
          });
        flag = true;
        result.store(waitWithSemaphore(std::move(n)).value());
-      LOG(INFO) << result;
      },
      std::move(f)
      );
@@ -847,3 +847,26 @@ TEST(Future, getFuture_after_setException) {
    p.fulfil([]() -> void { throw std::logic_error("foo"); });
    EXPECT_THROW(p.getFuture().value(), std::logic_error);
  }
+
+TEST(Future, detachRace) {
+  // Task #5438209
+  // This test is designed to detect a race that was in Core::detachOne()
+  // where detached_ was incremented and then tested, and that
+  // allowed a race where both Promise and Future would think they were the
+  // second and both try to delete. This showed up at scale but was very
+  // difficult to reliably repro in a test. As it is, this only fails about
+  // once in every 1,000 executions. Doing this 1,000 times is going to make a
+  // slow test so I won't do that but if it ever fails, take it seriously, and
+  // run the test binary with "--gtest_repeat=10000 --gtest_filter=*detachRace"
+  // (Don't forget to enable ASAN)
+  auto p = folly::make_unique<Promise<bool>>();
+  auto f = folly::make_unique<Future<bool>>(p->getFuture());
+  folly::Baton<> baton;
+  std::thread t1([&]{
+    baton.post();
+    p.reset();
+  });
+  baton.wait();
+  f.reset();
+  t1.join();
+}
author	Hans Fugal <fugalh@fb.com>
	Mon, 27 Oct 2014 15:53:23 +0000 (08:53 -0700)
committer	dcsommer <dcsommer@fb.com>
	Wed, 29 Oct 2014 23:05:33 +0000 (16:05 -0700)
folly/wangle/detail/Core.h		patch \| blob \| history
folly/wangle/detail/FSM.h		patch \| blob \| history
folly/wangle/test/FSM.cpp		patch \| blob \| history
folly/wangle/test/FutureTest.cpp		patch \| blob \| history