/* GNU Objective C Runtime @synchronized implementation
   Copyright (C) 2010-2022 Free Software Foundation, Inc.
   Contributed by Nicola Pero <nicola.pero (at) meta-innovation.com>

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under the
terms of the GNU General Public License as published by the Free Software
Foundation; either version 3, or (at your option) any later version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more
details.

Under Section 7 of GPL version 3, you are granted additional
permissions described in the GCC Runtime Library Exception, version
3.1, as published by the Free Software Foundation.

You should have received a copy of the GNU General Public License and
a copy of the GCC Runtime Library Exception along with this program;
see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
<http://www.gnu.org/licenses/>.  */

/* This file implements objc_sync_enter() and objc_sync_exit(), the
   two functions required to support @synchronized().

   objc_sync_enter(object) needs to get a recursive lock associated
   with 'object', and lock it.

   objc_sync_exit(object) needs to get the recursive lock associated
   with 'object', and unlock it.  */
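
/* Illustrative sketch only: the compiler expands a @synchronized()
   statement into calls to these two functions.  Conceptually (the
   emitted code also wraps the body in exception-handling constructs
   so that the lock is released if an exception is thrown), the
   expansion is roughly

     @synchronized (obj)           objc_sync_enter (obj);
       {                    --->   ... body ...
         ... body ...              objc_sync_exit (obj);
       }

   so every entry into the region calls objc_sync_enter() and every
   exit, normal or exceptional, calls objc_sync_exit().  */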

/* To avoid the overhead of continuously allocating and deallocating
   locks, we implement a pool of locks.  When a lock is needed for an
   object, we get a lock from the pool and associate it with the
   object.

   The lock pool needs to be protected by its own lock (the
   "protection" lock), which has to be locked and then unlocked each
   time objc_sync_enter() and objc_sync_exit() are called.  To reduce
   the contention on the protection lock, instead of a single pool
   with a single (global) protection lock we use a number of smaller
   pools, each with its own pool protection lock.  To decide which
   lock pool to use for each object, we compute a hash from the
   object pointer.

   The implementation of each lock pool uses a linked list of all the
   locks in the pool (both unlocked and locked); this works on the
   assumption that the number of locks concurrently required is very
   low.  In practice, it seems that you rarely see more than a few
   locks ever concurrently required.

   A standard case is a thread acquiring a lock recursively, over and
   over again: for example when most methods of a class are protected
   by @synchronized(self) but they also call each other.  We use
   thread-local storage to implement a cache and optimize this case.
   The cache stores locks that the thread successfully acquired,
   allowing objc_sync_enter() and objc_sync_exit() to locate a lock
   which is already held by the current thread without having to use
   any protection lock or synchronization mechanism.  It can thus
   detect recursive locks/unlocks, and transform them into no-ops
   that require no actual locking or synchronization mechanisms at
   all.  */

/* You can disable the thread-local cache (most likely to benchmark
   the code with and without it) by compiling with
   -DSYNC_CACHE_DISABLE, or by uncommenting the following line.  */
/* #define SYNC_CACHE_DISABLE */

/* If thread-local storage is not available, automatically disable the
   cache.  */
#ifndef HAVE_TLS
# define SYNC_CACHE_DISABLE
#endif

#include "objc-private/common.h"
#include "objc/objc-sync.h"         /* For objc_sync_enter(), objc_sync_exit() */
#include "objc/runtime.h"           /* For objc_malloc() */
#include "objc/thr.h"               /* For objc_mutex_lock() and similar */
#include "objc-private/objc-sync.h" /* For __objc_sync_init() */

/* We have 32 pools of locks, each of them protected by its own
   protection lock.  It's tempting to increase this number to reduce
   contention, but in our tests 32 is high enough.  */
#define SYNC_NUMBER_OF_POOLS 32

/* Given an object, this determines which pool contains the
   associated lock.  */
#define SYNC_OBJECT_HASH(OBJECT) ((((size_t)OBJECT >> 8) ^ (size_t)OBJECT) & (SYNC_NUMBER_OF_POOLS - 1))
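
/* Worked example (illustrative only): for an object at address
   0x1000, ((0x1000 >> 8) ^ 0x1000) gives 0x1010, and 0x1010 & 31 is
   0x10, so the object maps to pool 16.  XOR-ing in the bits shifted
   down by 8 helps spread objects across pools even though the low
   bits of heap pointers tend to look alike because of allocation
   alignment.  */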

/* The locks protecting each pool.  */
static objc_mutex_t sync_pool_protection_locks[SYNC_NUMBER_OF_POOLS];

/* The data structure (linked list) holding the locks.  */
typedef struct lock_node
{
  /* Pointer to the next entry on the list.  NULL indicates the end
     of the list.  You need to hold the appropriate
     sync_pool_protection_locks[N] to read or write this variable.  */
  struct lock_node *next;

  /* The (recursive) lock.  Allocated when the node is created; after
     that it is always non-NULL and never changes.  */
  objc_mutex_t lock;

  /* How many times objc_mutex_lock() has been called on the lock (it
     is 0 when the lock is unused).  Used to track when the lock is
     no longer associated with an object and can be reused for
     another object.  It records "real" locks, potentially (but not
     necessarily) by multiple threads.  You need to hold the
     appropriate sync_pool_protection_locks[N] to read or write this
     variable.  */
  unsigned int usage_count;

  /* The object that the lock is associated with.  This variable can
     only be written when holding the sync_pool_protection_locks[N]
     and when node->usage_count == 0, i.e., when the lock is not
     being used.  You can read this variable either when you hold the
     sync_pool_protection_locks[N] or when you hold node->lock,
     because in that case you know that node->usage_count can't get
     to zero until you release the lock.  It is valid to have
     usage_count == 0 and object != nil; in that case, the lock is
     not currently being used, but is still currently associated with
     the object.  */
  id object;

  /* This is a counter reserved for use by the thread currently
     holding the lock.  So, you need to hold node->lock to read or
     write this variable.  It is normally 0, and if the cache is not
     being used, it is kept at 0 (even if recursive locks are being
     done; in that case, no difference is made between recursive and
     non-recursive locks: they all increase usage_count, and call
     objc_mutex_lock()).  When the cache is being used, a thread may
     be able to find a lock that it already holds using the cache; in
     that case, to perform additional locks/unlocks it can
     increase/decrease the recursive_usage_count (which does not
     require any synchronization with other threads, since it's
     protected by node->lock itself) instead of the usage_count
     (which requires locking the pool protection lock).  And it can
     skip the call to objc_mutex_lock/unlock too.  */
  unsigned int recursive_usage_count;
} *lock_node_ptr;


/* The pools of locks.  Each of them is a linked list of lock_nodes.
   In the list we keep both unlocked and locked nodes.  */
static lock_node_ptr sync_pool_array[SYNC_NUMBER_OF_POOLS];

#ifndef SYNC_CACHE_DISABLE
/* We store a cache of locks acquired by each thread in thread-local
   storage.  */
static __thread lock_node_ptr *lock_cache = NULL;

/* This is a conservative implementation that uses a static array of
   fixed size as the cache.  Because the cache is an array that we
   scan linearly, the bigger it is, the slower it gets.  This does
   not matter much at small sizes (eg, the overhead of checking 8
   cache slots instead of 4 is very small compared to the other
   overheads involved, such as function calls and lock/unlock
   operations), but at large sizes it becomes important, as there is
   obviously a size over which using the cache backfires: the lookup
   is so slow that the cache slows down the software instead of
   speeding it up.  In practice, it seems that most threads use a
   small number of concurrent locks, so we have a conservative
   implementation with a fixed-size cache of 8 locks, which gives
   very predictable behaviour.  If a thread locks lots of different
   locks, only the first 8 get the speed benefits of the cache, but
   the cache remains always small, fast and predictable.

   SYNC_CACHE_SIZE is the size of the lock cache for each thread.  */
#define SYNC_CACHE_SIZE 8
#endif /* SYNC_CACHE_DISABLE */
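
/* For illustration only (this helper is hypothetical and not part of
   the runtime): traversing a pool's list requires holding that
   pool's protection lock, as documented for the 'next' field above.
   A sketch of a helper counting the nodes in pool N would be

     static int
     sync_pool_length (int n)
     {
       int count = 0;
       lock_node_ptr node;

       objc_mutex_lock (sync_pool_protection_locks[n]);
       for (node = sync_pool_array[n]; node != NULL; node = node->next)
         count++;
       objc_mutex_unlock (sync_pool_protection_locks[n]);

       return count;
     }  */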

/* Called at startup by init.c.  */
void
__objc_sync_init (void)
{
  int i;

  for (i = 0; i < SYNC_NUMBER_OF_POOLS; i++)
    {
      lock_node_ptr new_node;

      /* Create a protection lock for each pool.  */
      sync_pool_protection_locks[i] = objc_mutex_allocate ();

      /* Preallocate a lock per pool.  */
      new_node = objc_malloc (sizeof (struct lock_node));
      new_node->lock = objc_mutex_allocate ();
      new_node->object = nil;
      new_node->usage_count = 0;
      new_node->recursive_usage_count = 0;
      new_node->next = NULL;

      sync_pool_array[i] = new_node;
    }
}

int
objc_sync_enter (id object)
{
#ifndef SYNC_CACHE_DISABLE
  int free_cache_slot;
#endif
  int hash;
  lock_node_ptr node;
  lock_node_ptr unused_node;

  if (object == nil)
    return OBJC_SYNC_SUCCESS;

#ifndef SYNC_CACHE_DISABLE
  if (lock_cache == NULL)
    {
      /* Note that this calloc happens only once per thread, the very
         first time a thread does an objc_sync_enter().  */
      lock_cache = objc_calloc (SYNC_CACHE_SIZE, sizeof (lock_node_ptr));
    }

  /* Check the cache to see if we have a record of having already
     locked the lock corresponding to this object.  While doing so,
     keep track of the first free cache slot in case we need it
     later.  */
  node = NULL;
  free_cache_slot = -1;

  {
    int i;
    for (i = 0; i < SYNC_CACHE_SIZE; i++)
      {
        lock_node_ptr locked_node = lock_cache[i];

        if (locked_node == NULL)
          {
            if (free_cache_slot == -1)
              free_cache_slot = i;
          }
        else if (locked_node->object == object)
          {
            node = locked_node;
            break;
          }
      }
  }

  if (node != NULL)
    {
      /* We found the lock.  Increase recursive_usage_count, which is
         protected by node->lock, which we already hold.  */
      node->recursive_usage_count++;

      /* There is no need to actually lock anything, since we already
         hold the lock.  Correspondingly, objc_sync_exit() will just
         decrease recursive_usage_count and do nothing to unlock.  */
      return OBJC_SYNC_SUCCESS;
    }
#endif /* SYNC_CACHE_DISABLE */

  /* The following is the standard lookup of the lock in the lock
     pool.  It requires the pool protection lock.  */
  hash = SYNC_OBJECT_HASH(object);

  /* Search for an existing lock for 'object'.  While searching, make
     note of any unused lock if we find any.  */
  unused_node = NULL;

  objc_mutex_lock (sync_pool_protection_locks[hash]);

  node = sync_pool_array[hash];

  while (node != NULL)
    {
      if (node->object == object)
        {
          /* We found the lock.  */
          node->usage_count++;
          objc_mutex_unlock (sync_pool_protection_locks[hash]);

#ifndef SYNC_CACHE_DISABLE
          /* Put it in the cache.  */
          if (free_cache_slot != -1)
            lock_cache[free_cache_slot] = node;
#endif

          /* Lock it.  */
          objc_mutex_lock (node->lock);

          return OBJC_SYNC_SUCCESS;
        }

      if (unused_node == NULL && node->usage_count == 0)
        {
          /* We found the first unused node.  Record it.  */
          unused_node = node;
        }

      node = node->next;
    }

  /* An existing lock for 'object' could not be found.  */
  if (unused_node != NULL)
    {
      /* But we found an unused lock; use it.  */
      unused_node->object = object;
      unused_node->usage_count = 1;
      unused_node->recursive_usage_count = 0;
      objc_mutex_unlock (sync_pool_protection_locks[hash]);

#ifndef SYNC_CACHE_DISABLE
      if (free_cache_slot != -1)
        lock_cache[free_cache_slot] = unused_node;
#endif

      objc_mutex_lock (unused_node->lock);

      return OBJC_SYNC_SUCCESS;
    }
  else
    {
      /* There are no unused nodes; allocate a new node.  */
      lock_node_ptr new_node;

      /* Create the node.  */
      new_node = objc_malloc (sizeof (struct lock_node));
      new_node->lock = objc_mutex_allocate ();
      new_node->object = object;
      new_node->usage_count = 1;
      new_node->recursive_usage_count = 0;

      /* Attach it at the beginning of the pool.  */
      new_node->next = sync_pool_array[hash];
      sync_pool_array[hash] = new_node;
      objc_mutex_unlock (sync_pool_protection_locks[hash]);

#ifndef SYNC_CACHE_DISABLE
      if (free_cache_slot != -1)
        lock_cache[free_cache_slot] = new_node;
#endif

      objc_mutex_lock (new_node->lock);

      return OBJC_SYNC_SUCCESS;
    }
}

int
objc_sync_exit (id object)
{
  int hash;
  lock_node_ptr node;

  if (object == nil)
    return OBJC_SYNC_SUCCESS;

#ifndef SYNC_CACHE_DISABLE
  if (lock_cache != NULL)
    {
      int i;

      /* Find the lock in the cache.  */
      node = NULL;
      for (i = 0; i < SYNC_CACHE_SIZE; i++)
        {
          lock_node_ptr locked_node = lock_cache[i];

          if (locked_node != NULL && locked_node->object == object)
            {
              node = locked_node;
              break;
            }
        }
      /* Note that, if a node was found in the cache, the variable i
         now holds the index where it was found, which will be used
         to remove it from the cache.  */
      if (node != NULL)
        {
          if (node->recursive_usage_count > 0)
            {
              node->recursive_usage_count--;
              return OBJC_SYNC_SUCCESS;
            }
          else
            {
              /* We need to do a real unlock.  */
              hash = SYNC_OBJECT_HASH(object);

              /* TODO: If we had atomic increase/decrease operations
                 with memory barriers, we could avoid the lock
                 here!  */
              objc_mutex_lock (sync_pool_protection_locks[hash]);
              node->usage_count--;
              /* Normally, we do not reset object to nil here.  We
                 leave the lock associated with that object, at zero
                 usage count.  This makes it slightly more efficient
                 to provide a lock for that object if (as is likely)
                 it is requested again.  If the object is
                 deallocated, we don't care.  It will never match a
                 new lock that is requested, and the node will be
                 reused at some point.

                 But, if garbage collection is enabled, leaving a
                 pointer to the object in memory might prevent the
                 object from being released.  In that case, we remove
                 it (TODO: maybe we should avoid using the garbage
                 collector at all?  Nothing is ever deallocated in
                 this file).  */
#if OBJC_WITH_GC
              node->object = nil;
#endif
              objc_mutex_unlock (sync_pool_protection_locks[hash]);

              /* PS: Between objc_mutex_unlock
                 (sync_pool_protection_locks[hash]) and
                 objc_mutex_unlock (node->lock), the pool is
                 unlocked, so other threads may reuse this same lock
                 for another object (!).  This is not a problem, but
                 it is curious.  */
              objc_mutex_unlock (node->lock);

              /* Remove the node from the cache.  */
              lock_cache[i] = NULL;

              return OBJC_SYNC_SUCCESS;
            }
        }
    }
#endif

  /* The cache either wasn't there, or didn't work (eg, we overflowed
     it at some point and stopped recording new locks in the cache).
     Proceed with a full search of the lock pool.  */
  hash = SYNC_OBJECT_HASH(object);

  objc_mutex_lock (sync_pool_protection_locks[hash]);

  /* Search for an existing lock for 'object'.  */
  node = sync_pool_array[hash];

  while (node != NULL)
    {
      if (node->object == object)
        {
          /* We found the lock.  */
          node->usage_count--;
          objc_mutex_unlock (sync_pool_protection_locks[hash]);

          objc_mutex_unlock (node->lock);

          /* No need to remove the node from the cache, since it
             wasn't found in the cache when we looked for it!  */
          return OBJC_SYNC_SUCCESS;
        }

      node = node->next;
    }

  objc_mutex_unlock (sync_pool_protection_locks[hash]);

  /* A lock for 'object' to unlock could not be found (!!).  */
  return OBJC_SYNC_NOT_OWNING_THREAD_ERROR;
}
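
/* Usage sketch (illustrative only): a thread acquiring the same lock
   recursively, as in nested @synchronized (obj) regions, performs

     objc_sync_enter (obj);   // real lock: usage_count becomes 1
     objc_sync_enter (obj);   // cache hit: recursive_usage_count++
     objc_sync_exit (obj);    // cache hit: recursive_usage_count--
     objc_sync_exit (obj);    // real unlock: usage_count back to 0

   Assuming the cache is enabled and the lock was recorded in it,
   only the outermost pair takes the pool protection lock and calls
   objc_mutex_lock()/objc_mutex_unlock(); the inner pair is the no-op
   fast path described at the top of this file.  */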