Fix deadlock danger when atomic ops are done under spinlock.

author Andres Freund <andres@anarazel.de>

Mon, 8 Jun 2020 23:50:37 +0000 (16:50 -0700)

committer Andres Freund <andres@anarazel.de>

Thu, 18 Jun 2020 21:12:24 +0000 (14:12 -0700)
author Andres Freund <andres@anarazel.de>
Mon, 8 Jun 2020 23:50:37 +0000 (16:50 -0700)
committer Andres Freund <andres@anarazel.de>
Thu, 18 Jun 2020 21:12:24 +0000 (14:12 -0700)
diff --git a/src/backend/storage/lmgr/spin.c b/src/backend/storage/lmgr/spin.c

index 9b73e7e1851b26f424559ea535802d8242e3a929..27734395852f6a99005d33963c6ad96ee18cf25e 100644 (file)
--- a/src/backend/storage/lmgr/spin.c
+++ b/src/backend/storage/lmgr/spin.c
@@ -27,8 +27,24 @@
  
  
  #ifndef HAVE_SPINLOCKS
+
+/*
+ * No TAS, so spinlocks are implemented as PGSemaphores.
+ */
+
+#ifndef HAVE_ATOMICS
+#define NUM_EMULATION_SEMAPHORES (NUM_SPINLOCK_SEMAPHORES + NUM_ATOMICS_SEMAPHORES)
+#else
+#define NUM_EMULATION_SEMAPHORES (NUM_SPINLOCK_SEMAPHORES)
+#endif /* HAVE_ATOMICS */
+
  PGSemaphore SpinlockSemaArray;
-#endif
+
+#else                          /* HAVE_SPINLOCKS */
+
+#define NUM_EMULATION_SEMAPHORES 0
+
+#endif                         /* HAVE_SPINLOCKS */
  
  /*
   * Report the amount of shared memory needed to store semaphores for spinlock
@@ -37,34 +53,19 @@ PGSemaphore SpinlockSemaArray;
  Size
  SpinlockSemaSize(void)
  {
-   return SpinlockSemas() * sizeof(PGSemaphoreData);
+   return NUM_EMULATION_SEMAPHORES * sizeof(PGSemaphoreData);
  }
  
-#ifdef HAVE_SPINLOCKS
-
  /*
   * Report number of semaphores needed to support spinlocks.
   */
  int
  SpinlockSemas(void)
  {
-   return 0;
+   return NUM_EMULATION_SEMAPHORES;
  }
-#else                          /* !HAVE_SPINLOCKS */
  
-/*
- * No TAS, so spinlocks are implemented as PGSemaphores.
- */
-
-
-/*
- * Report number of semaphores needed to support spinlocks.
- */
-int
-SpinlockSemas(void)
-{
-   return NUM_SPINLOCK_SEMAPHORES + NUM_ATOMICS_SEMAPHORES;
-}
+#ifndef HAVE_SPINLOCKS
  
  /*
   * Initialize semaphores.
@@ -83,23 +84,59 @@ SpinlockSemaInit(PGSemaphore spinsemas)
  /*
   * s_lock.h hardware-spinlock emulation using semaphores
   *
- * We map all spinlocks onto a set of NUM_SPINLOCK_SEMAPHORES semaphores.
- * It's okay to map multiple spinlocks onto one semaphore because no process
- * should ever hold more than one at a time.  We just need enough semaphores
- * so that we aren't adding too much extra contention from that.
+ * We map all spinlocks onto NUM_EMULATION_SEMAPHORES semaphores.  It's okay to
+ * map multiple spinlocks onto one semaphore because no process should ever
+ * hold more than one at a time.  We just need enough semaphores so that we
+ * aren't adding too much extra contention from that.
+ *
+ * There is one exception to the restriction of only holding one spinlock at a
+ * time, which is that it's ok if emulated atomic operations are nested inside
+ * spinlocks. To avoid the danger of spinlocks and atomics using the same sema,
+ * we make sure "normal" spinlocks and atomics backed by spinlocks use
+ * distinct semaphores (see the nested argument to s_init_lock_sema).
   *
   * slock_t is just an int for this implementation; it holds the spinlock
- * number from 1..NUM_SPINLOCK_SEMAPHORES.  We intentionally ensure that 0
+ * number from 1..NUM_EMULATION_SEMAPHORES.  We intentionally ensure that 0
   * is not a valid value, so that testing with this code can help find
   * failures to initialize spinlocks.
   */
  
+static inline void
+s_check_valid(int lockndx)
+{
+   if (lockndx <= 0 || lockndx > NUM_EMULATION_SEMAPHORES)
+       elog(ERROR, "invalid spinlock number: %d", lockndx);
+}
+
  void
  s_init_lock_sema(volatile slock_t *lock, bool nested)
  {
     static uint32 counter = 0;
-
-   *lock = ((++counter) % NUM_SPINLOCK_SEMAPHORES) + 1;
+   uint32      offset;
+   uint32      sema_total;
+   uint32      idx;
+
+   if (nested)
+   {
+       /*
+        * To allow nesting atomics inside spinlocked sections, use a
+        * separate range of semaphores. See comment above.
+        */
+       offset = 1 + NUM_SPINLOCK_SEMAPHORES;
+       sema_total = NUM_ATOMICS_SEMAPHORES;
+   }
+   else
+   {
+       offset = 1;
+       sema_total = NUM_SPINLOCK_SEMAPHORES;
+   }
+
+   idx = (counter++ % sema_total) + offset;
+
+   /* double check we did things correctly */
+   s_check_valid(idx);
+
+   *lock = idx;
  }
  
  void
@@ -107,8 +144,8 @@ s_unlock_sema(volatile slock_t *lock)
  {
     int         lockndx = *lock;
  
-   if (lockndx <= 0 || lockndx > NUM_SPINLOCK_SEMAPHORES)
-       elog(ERROR, "invalid spinlock number: %d", lockndx);
+   s_check_valid(lockndx);
+
     PGSemaphoreUnlock(&SpinlockSemaArray[lockndx - 1]);
  }
  
@@ -125,8 +162,8 @@ tas_sema(volatile slock_t *lock)
  {
     int         lockndx = *lock;
  
-   if (lockndx <= 0 || lockndx > NUM_SPINLOCK_SEMAPHORES)
-       elog(ERROR, "invalid spinlock number: %d", lockndx);
+   s_check_valid(lockndx);
+
     /* Note that TAS macros return 0 if *success* */
     return !PGSemaphoreTryLock(&SpinlockSemaArray[lockndx - 1]);
  }
diff --git a/src/test/regress/regress.c b/src/test/regress/regress.c

index 370d39e9fc2bf89185b5ea554082f7289ac434e8..ddfde1f291656c537e6d7f9099f4d0e3b689b73d 100644 (file)
--- a/src/test/regress/regress.c
+++ b/src/test/regress/regress.c
@@ -1159,6 +1159,51 @@ test_spinlock(void)
  #endif
  }
  
+/*
+ * Verify that performing atomic ops inside a spinlock isn't a
+ * problem. Realistically that's only going to be a problem when both
+ * --disable-spinlocks and --disable-atomics are used, but it's cheap enough
+ * to just always test.
+ *
+ * The test works by holding a spinlock while manipulating more than
+ * NUM_SPINLOCK_SEMAPHORES atomics, which is enough that we'd conflict if
+ * there were an overlap between a spinlock and an atomic.
+ *
+ * NUM_TEST_ATOMICS doesn't really need to be more than
+ * NUM_SPINLOCK_SEMAPHORES, but it seems better to test a bit more
+ * extensively.
+ */
+static void
+test_atomic_spin_nest(void)
+{
+   slock_t lock;
+#define NUM_TEST_ATOMICS (NUM_SPINLOCK_SEMAPHORES + NUM_ATOMICS_SEMAPHORES + 27)
+   pg_atomic_uint32 atomics32[NUM_TEST_ATOMICS];
+
+   SpinLockInit(&lock);
+
+   for (int i = 0; i < NUM_TEST_ATOMICS; i++)
+   {
+       pg_atomic_init_u32(&atomics32[i], 0);
+   }
+
+   /* just so it's not all zeroes */
+   for (int i = 0; i < NUM_TEST_ATOMICS; i++)
+   {
+       EXPECT_EQ_U32(pg_atomic_fetch_add_u32(&atomics32[i], i), 0);
+   }
+
+   /* test whether we can do atomic op with lock held */
+   SpinLockAcquire(&lock);
+   for (int i = 0; i < NUM_TEST_ATOMICS; i++)
+   {
+       EXPECT_EQ_U32(pg_atomic_fetch_sub_u32(&atomics32[i], i), i);
+       EXPECT_EQ_U32(pg_atomic_read_u32(&atomics32[i]), 0);
+   }
+   SpinLockRelease(&lock);
+}
+#undef NUM_TEST_ATOMICS
+
  PG_FUNCTION_INFO_V1(test_atomic_ops);
  Datum
  test_atomic_ops(PG_FUNCTION_ARGS)
@@ -1177,5 +1222,7 @@ test_atomic_ops(PG_FUNCTION_ARGS)
      */
     test_spinlock();
  
+   test_atomic_spin_nest();
+
     PG_RETURN_BOOL(true);
  }
author	Andres Freund <andres@anarazel.de>
	Mon, 8 Jun 2020 23:50:37 +0000 (16:50 -0700)
committer	Andres Freund <andres@anarazel.de>
	Thu, 18 Jun 2020 21:12:24 +0000 (14:12 -0700)
src/backend/storage/lmgr/spin.c		patch \| blob \| blame \| history
src/test/regress/regress.c		patch \| blob \| blame \| history