//===-- tsan_clock.cpp ----------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file is a part of ThreadSanitizer (TSan), a race detector.
//
//===----------------------------------------------------------------------===//
#include "tsan_clock.h"
#include "tsan_rtl.h"
#include "sanitizer_common/sanitizer_placement_new.h"

// SyncClock and ThreadClock implement vector clocks for sync variables
// (mutexes, atomic variables, file descriptors, etc) and threads, respectively.
// ThreadClock contains a fixed-size vector clock for the maximum number of
// threads. SyncClock contains a growable vector clock for the currently
// necessary number of threads.
// Together they implement a very simple model of operations, namely:
//
//   void ThreadClock::acquire(const SyncClock *src) {
//     for (int i = 0; i < kMaxThreads; i++)
//       clock[i] = max(clock[i], src->clock[i]);
//   }
//
//   void ThreadClock::release(SyncClock *dst) const {
//     for (int i = 0; i < kMaxThreads; i++)
//       dst->clock[i] = max(dst->clock[i], clock[i]);
//   }
//
//   void ThreadClock::releaseStoreAcquire(SyncClock *sc) {
//     for (int i = 0; i < kMaxThreads; i++) {
//       tmp = clock[i];
//       clock[i] = max(clock[i], sc->clock[i]);
//       sc->clock[i] = tmp;
//     }
//   }
//
//   void ThreadClock::ReleaseStore(SyncClock *dst) const {
//     for (int i = 0; i < kMaxThreads; i++)
//       dst->clock[i] = clock[i];
//   }
//
//   void ThreadClock::acq_rel(SyncClock *dst) {
//     acquire(dst);
//     release(dst);
//   }
//
// Conformance to this model is extensively verified in tsan_clock_test.cpp.
// However, the implementation is significantly more complex. The added
// complexity allows us to implement important classes of use cases in O(1)
// instead of O(N).
//
// The use cases are:
// 1. Singleton/once atomic that has a single release-store operation followed
//    by zillions of acquire-loads (the acquire-load is O(1)).
// 2. Thread-local mutex (both lock and unlock can be O(1)).
// 3. Leaf mutex (unlock is O(1)).
// 4. A mutex shared by 2 threads (both lock and unlock can be O(1)).
// 5. An atomic with a single writer (writes can be O(1)).
// The implementation dynamically adapts to the workload. So if an atomic is
// in a read-only phase, these reads will be O(1); if it later switches to a
// read/write phase, the implementation will correctly handle that by
// switching to O(N).
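//
// As an illustrative sketch (user code, not code from this file), use case 1
// corresponds to the following pattern:
//
//   std::atomic<T*> once_ptr;
//   // Writer thread, executed once:
//   once_ptr.store(p, std::memory_order_release);     // one O(N) release-store
//   // Reader threads, executed many times:
//   T *p = once_ptr.load(std::memory_order_acquire);  // amortized O(1)
//
// After a reader's first (O(N)) acquire, the SyncClock remembers that fact in
// the reader's "acquired" flag, so subsequent acquires only need to check
// that flag and the two dirty elements.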
//
// Thread-safety note: all const operations on SyncClock's are conducted under
// a shared lock; all non-const operations on SyncClock's are conducted under
// an exclusive lock; ThreadClock's are private to respective threads and so
// do not need any protection.
//
// Description of SyncClock state:
// clk_ - variable size vector clock, low kClkBits hold timestamp,
//   the remaining bits hold "acquired" flag (the actual value is thread's
//   reused counter);
//   if acquired == thr->reused_, then the respective thread has already
//   acquired this clock (except possibly for dirty elements).
// dirty_ - holds up to two indices in the vector clock that other threads
//   need to acquire regardless of "acquired" flag value;
// release_store_tid_ - denotes that the clock state is a result of
//   release-store operation by the thread with release_store_tid_ index.
// release_store_reused_ - reuse count of release_store_tid_.

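// For illustration (the values are made up), after thread 1 takes an O(1)
// release fast path, a SyncClock can look like:
//
//   clk_   = { 10, 20, 30 }                          // clk_[1] is stale
//   dirty_ = { {tid=1, epoch=25}, {tid=kInvalidTid} }
//
// The effective epoch of thread 1 is max(clk_[1], 25) == 25: acquire()
// always merges the dirty elements, and FlushDirty() folds them back into
// clk_ before any O(N) rewrite of the clock.
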
namespace __tsan {

static atomic_uint32_t *ref_ptr(ClockBlock *cb) {
  return reinterpret_cast<atomic_uint32_t *>(&cb->table[ClockBlock::kRefIdx]);
}

// Drop reference to the first level block idx.
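// The reference count is dropped with a CAS loop; the thread that observes
// the last reference (ref == 1) breaks out of the loop and frees the first
// level block together with the `blocks` second level blocks it owns.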
static void UnrefClockBlock(ClockCache *c, u32 idx, uptr blocks) {
  ClockBlock *cb = ctx->clock_alloc.Map(idx);
  atomic_uint32_t *ref = ref_ptr(cb);
  u32 v = atomic_load(ref, memory_order_acquire);
  for (;;) {
    CHECK_GT(v, 0);
    if (v == 1)
      break;
    if (atomic_compare_exchange_strong(ref, &v, v - 1, memory_order_acq_rel))
      return;
  }
  // First level block owns second level blocks, so free them as well.
  for (uptr i = 0; i < blocks; i++)
    ctx->clock_alloc.Free(c, cb->table[ClockBlock::kBlockIdx - i]);
  ctx->clock_alloc.Free(c, idx);
}

ThreadClock::ThreadClock(unsigned tid, unsigned reused)
    : tid_(tid)
    , reused_(reused + 1)  // 0 has special meaning
    , last_acquire_()
    , global_acquire_()
    , cached_idx_()
    , cached_size_()
    , cached_blocks_() {
  CHECK_LT(tid, kMaxTidInClock);
  CHECK_EQ(reused_, ((u64)reused_ << kClkBits) >> kClkBits);
  nclk_ = tid_ + 1;
  internal_memset(clk_, 0, sizeof(clk_));
}

void ThreadClock::ResetCached(ClockCache *c) {
  if (cached_idx_) {
    UnrefClockBlock(c, cached_idx_, cached_blocks_);
    cached_idx_ = 0;
    cached_size_ = 0;
    cached_blocks_ = 0;
  }
}

void ThreadClock::acquire(ClockCache *c, SyncClock *src) {
  DCHECK_LE(nclk_, kMaxTid);
  DCHECK_LE(src->size_, kMaxTid);

  // Check if it's empty -> no need to do anything.
  const uptr nclk = src->size_;
  if (nclk == 0)
    return;

  bool acquired = false;
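  // First merge the dirty elements: they must be acquired even if this
  // thread's "acquired" flag in src is already up to date.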
  for (unsigned i = 0; i < kDirtyTids; i++) {
    SyncClock::Dirty dirty = src->dirty_[i];
    unsigned tid = dirty.tid();
    if (tid != kInvalidTid) {
      if (clk_[tid] < dirty.epoch) {
        clk_[tid] = dirty.epoch;
        acquired = true;
      }
    }
  }

  // Check if we've already acquired src after the last release operation on src.
  if (tid_ >= nclk || src->elem(tid_).reused != reused_) {
    // O(N) acquire.
    nclk_ = max(nclk_, nclk);
    u64 *dst_pos = &clk_[0];
    for (ClockElem &src_elem : *src) {
      u64 epoch = src_elem.epoch;
      if (*dst_pos < epoch) {
        *dst_pos = epoch;
        acquired = true;
      }
      dst_pos++;
    }

    // Remember that this thread has acquired this clock.
    if (nclk > tid_)
      src->elem(tid_).reused = reused_;
  }

  if (acquired) {
    last_acquire_ = clk_[tid_];
    ResetCached(c);
  }
}

void ThreadClock::releaseStoreAcquire(ClockCache *c, SyncClock *sc) {
  DCHECK_LE(nclk_, kMaxTid);
  DCHECK_LE(sc->size_, kMaxTid);

  if (sc->size_ == 0) {
    // ReleaseStore will correctly set release_store_tid_,
    // which can be important for future operations.
    ReleaseStore(c, sc);
    return;
  }

  nclk_ = max(nclk_, (uptr) sc->size_);

  // Check if we need to resize sc.
  if (sc->size_ < nclk_)
    sc->Resize(c, nclk_);

  bool acquired = false;

  sc->Unshare(c);
  // Update sc->clk_.
  sc->FlushDirty();
  uptr i = 0;
  for (ClockElem &ce : *sc) {
    u64 tmp = clk_[i];
    if (clk_[i] < ce.epoch) {
      clk_[i] = ce.epoch;
      acquired = true;
    }
    ce.epoch = tmp;
    ce.reused = 0;
    i++;
  }
  sc->release_store_tid_ = kInvalidTid;
  sc->release_store_reused_ = 0;

  if (acquired) {
    last_acquire_ = clk_[tid_];
    ResetCached(c);
  }
}

void ThreadClock::release(ClockCache *c, SyncClock *dst) {
  DCHECK_LE(nclk_, kMaxTid);
  DCHECK_LE(dst->size_, kMaxTid);

  if (dst->size_ == 0) {
    // ReleaseStore will correctly set release_store_tid_,
    // which can be important for future operations.
    ReleaseStore(c, dst);
    return;
  }

  // Check if we need to resize dst.
  if (dst->size_ < nclk_)
    dst->Resize(c, nclk_);

  // Check whether we have acquired anything from other threads
  // since the last release on dst. If we have not, we only need to
  // update dst->elem(tid_).
  if (!HasAcquiredAfterRelease(dst)) {
    UpdateCurrentThread(c, dst);
    if (dst->release_store_tid_ != tid_ ||
        dst->release_store_reused_ != reused_)
      dst->release_store_tid_ = kInvalidTid;
    return;
  }

  // O(N) release.
  dst->Unshare(c);
  // First, remember whether we've acquired dst.
  bool acquired = IsAlreadyAcquired(dst);
  // Update dst->clk_.
  dst->FlushDirty();
  uptr i = 0;
  for (ClockElem &ce : *dst) {
    ce.epoch = max(ce.epoch, clk_[i]);
    ce.reused = 0;
    i++;
  }
  // Note: the loop above also cleared the 'acquired' flag in all elements.
  dst->release_store_tid_ = kInvalidTid;
  dst->release_store_reused_ = 0;
  // If we've acquired dst, remember this fact,
  // so that we don't need to acquire it on next acquire.
  if (acquired)
    dst->elem(tid_).reused = reused_;
}

void ThreadClock::ReleaseStore(ClockCache *c, SyncClock *dst) {
  DCHECK_LE(nclk_, kMaxTid);
  DCHECK_LE(dst->size_, kMaxTid);

  if (dst->size_ == 0 && cached_idx_ != 0) {
    // Reuse the cached clock.
    // Note: we could reuse/cache the cached clock in more cases:
    // we could update the existing clock and cache it, or replace it with the
    // currently cached clock and release the old one. And for a shared
    // existing clock, we could replace it with the currently cached;
    // or unshare, update and cache. But, for simplicity, we currently reuse
    // cached clock only when the target clock is empty.
    dst->tab_ = ctx->clock_alloc.Map(cached_idx_);
    dst->tab_idx_ = cached_idx_;
    dst->size_ = cached_size_;
    dst->blocks_ = cached_blocks_;
    CHECK_EQ(dst->dirty_[0].tid(), kInvalidTid);
    // The cached clock is shared (immutable),
    // so this is where we store the current clock.
    dst->dirty_[0].set_tid(tid_);
    dst->dirty_[0].epoch = clk_[tid_];
    dst->release_store_tid_ = tid_;
    dst->release_store_reused_ = reused_;
    // Remember that we don't need to acquire it in future.
    dst->elem(tid_).reused = reused_;
    // Grab a reference.
    atomic_fetch_add(ref_ptr(dst->tab_), 1, memory_order_relaxed);
    return;
  }

  // Check if we need to resize dst.
  if (dst->size_ < nclk_)
    dst->Resize(c, nclk_);

  if (dst->release_store_tid_ == tid_ &&
      dst->release_store_reused_ == reused_ &&
      !HasAcquiredAfterRelease(dst)) {
    UpdateCurrentThread(c, dst);
    return;
  }

  // O(N) release-store.
  dst->Unshare(c);
  // Note: dst can be larger than this ThreadClock.
  // This is fine since clk_ beyond size is all zeros.
  uptr i = 0;
  for (ClockElem &ce : *dst) {
    ce.epoch = clk_[i];
    ce.reused = 0;
    i++;
  }
  for (uptr i = 0; i < kDirtyTids; i++) dst->dirty_[i].set_tid(kInvalidTid);
  dst->release_store_tid_ = tid_;
  dst->release_store_reused_ = reused_;
  // Remember that we don't need to acquire it in future.
  dst->elem(tid_).reused = reused_;

  // If the resulting clock is cachable, cache it for future release operations.
  // The clock is always cachable if we released to an empty sync object.
  if (cached_idx_ == 0 && dst->Cachable()) {
    // Grab a reference to the ClockBlock.
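    // If the block is not shared (ref == 1), a plain relaxed store is enough
    // and avoids the more expensive atomic RMW.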
    atomic_uint32_t *ref = ref_ptr(dst->tab_);
    if (atomic_load(ref, memory_order_acquire) == 1)
      atomic_store_relaxed(ref, 2);
    else
      atomic_fetch_add(ref_ptr(dst->tab_), 1, memory_order_relaxed);
    cached_idx_ = dst->tab_idx_;
    cached_size_ = dst->size_;
    cached_blocks_ = dst->blocks_;
  }
}

void ThreadClock::acq_rel(ClockCache *c, SyncClock *dst) {
  acquire(c, dst);
  ReleaseStore(c, dst);
}

// Updates only the single element related to the current thread in dst->clk_.
void ThreadClock::UpdateCurrentThread(ClockCache *c, SyncClock *dst) const {
  // Update the thread's time, but preserve the 'acquired' flag.
  for (unsigned i = 0; i < kDirtyTids; i++) {
    SyncClock::Dirty *dirty = &dst->dirty_[i];
    const unsigned tid = dirty->tid();
    if (tid == tid_ || tid == kInvalidTid) {
      dirty->set_tid(tid_);
      dirty->epoch = clk_[tid_];
      return;
    }
  }
  // Reset all 'acquired' flags, O(N).
  // We are going to touch dst elements, so we need to unshare it.
  dst->Unshare(c);
  dst->elem(tid_).epoch = clk_[tid_];
  for (uptr i = 0; i < dst->size_; i++)
    dst->elem(i).reused = 0;
  dst->FlushDirty();
}

// Checks whether the current thread has already acquired src.
bool ThreadClock::IsAlreadyAcquired(const SyncClock *src) const {
  if (src->elem(tid_).reused != reused_)
    return false;
  for (unsigned i = 0; i < kDirtyTids; i++) {
    SyncClock::Dirty dirty = src->dirty_[i];
    if (dirty.tid() != kInvalidTid) {
      if (clk_[dirty.tid()] < dirty.epoch)
        return false;
    }
  }
  return true;
}

// Checks whether the current thread has acquired anything
// from other clocks after releasing to dst (directly or indirectly).
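// dst->elem(tid_).epoch records this thread's own epoch as of its last
// release to dst; if the epoch of the last acquire (last_acquire_ or the
// global one) is at least that, something was acquired in between.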
bool ThreadClock::HasAcquiredAfterRelease(const SyncClock *dst) const {
  const u64 my_epoch = dst->elem(tid_).epoch;
  return my_epoch <= last_acquire_ ||
      my_epoch <= atomic_load_relaxed(&global_acquire_);
}

// Sets a single element in the vector clock.
// This function is called only from weird places like AcquireGlobal.
void ThreadClock::set(ClockCache *c, unsigned tid, u64 v) {
  DCHECK_LT(tid, kMaxTid);
  DCHECK_GE(v, clk_[tid]);
  clk_[tid] = v;
  if (nclk_ <= tid)
    nclk_ = tid + 1;
  last_acquire_ = clk_[tid_];
  ResetCached(c);
}

void ThreadClock::DebugDump(int(*printf)(const char *s, ...)) {
  printf("clock=[");
  for (uptr i = 0; i < nclk_; i++)
    printf("%s%llu", i == 0 ? "" : ",", clk_[i]);
  printf("] tid=%u/%u last_acq=%llu", tid_, reused_, last_acquire_);
}

SyncClock::SyncClock() {
  ResetImpl();
}

SyncClock::~SyncClock() {
  // Reset must be called before dtor.
  CHECK_EQ(size_, 0);
  CHECK_EQ(blocks_, 0);
  CHECK_EQ(tab_, 0);
  CHECK_EQ(tab_idx_, 0);
}

void SyncClock::Reset(ClockCache *c) {
  if (size_)
    UnrefClockBlock(c, tab_idx_, blocks_);
  ResetImpl();
}

void SyncClock::ResetImpl() {
  tab_ = 0;
  tab_idx_ = 0;
  size_ = 0;
  blocks_ = 0;
  release_store_tid_ = kInvalidTid;
  release_store_reused_ = 0;
  for (uptr i = 0; i < kDirtyTids; i++) dirty_[i].set_tid(kInvalidTid);
}

void SyncClock::Resize(ClockCache *c, uptr nclk) {
  Unshare(c);
  if (nclk <= capacity()) {
    // Memory is already allocated, just increase the size.
    size_ = nclk;
    return;
  }
  if (size_ == 0) {
    // Grow from 0 to one-level table.
    CHECK_EQ(size_, 0);
    CHECK_EQ(blocks_, 0);
    CHECK_EQ(tab_, 0);
    CHECK_EQ(tab_idx_, 0);
    tab_idx_ = ctx->clock_alloc.Alloc(c);
    tab_ = ctx->clock_alloc.Map(tab_idx_);
    internal_memset(tab_, 0, sizeof(*tab_));
    atomic_store_relaxed(ref_ptr(tab_), 1);
    size_ = 1;
  } else if (size_ > blocks_ * ClockBlock::kClockCount) {
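    // The first level block still holds clock elements directly; evacuate
    // them into a fresh second level block so that the first level block can
    // hold block indices (and the ref counter) instead.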
    u32 idx = ctx->clock_alloc.Alloc(c);
    ClockBlock *new_cb = ctx->clock_alloc.Map(idx);
    uptr top = size_ - blocks_ * ClockBlock::kClockCount;
    CHECK_LT(top, ClockBlock::kClockCount);
    const uptr move = top * sizeof(tab_->clock[0]);
    internal_memcpy(&new_cb->clock[0], tab_->clock, move);
    internal_memset(&new_cb->clock[top], 0, sizeof(*new_cb) - move);
    internal_memset(tab_->clock, 0, move);
    append_block(idx);
  }
  // At this point we have the first level table allocated and all clock
  // elements are evacuated from it to a second level block.
  // Add second level tables as necessary.
  while (nclk > capacity()) {
    u32 idx = ctx->clock_alloc.Alloc(c);
    ClockBlock *cb = ctx->clock_alloc.Map(idx);
    internal_memset(cb, 0, sizeof(*cb));
    append_block(idx);
  }
  size_ = nclk;
}

// Flushes all dirty elements into the main clock array.
void SyncClock::FlushDirty() {
  for (unsigned i = 0; i < kDirtyTids; i++) {
    Dirty *dirty = &dirty_[i];
    if (dirty->tid() != kInvalidTid) {
      CHECK_LT(dirty->tid(), size_);
      elem(dirty->tid()).epoch = dirty->epoch;
      dirty->set_tid(kInvalidTid);
    }
  }
}

bool SyncClock::IsShared() const {
  if (size_ == 0)
    return false;
  atomic_uint32_t *ref = ref_ptr(tab_);
  u32 v = atomic_load(ref, memory_order_acquire);
  CHECK_GT(v, 0);
  return v > 1;
}

// Unshares the current clock if it's shared.
// Shared clocks are immutable, so they need to be unshared before any updates.
// Note: this does not apply to dirty entries as they are not shared.
void SyncClock::Unshare(ClockCache *c) {
  if (!IsShared())
    return;
  // First, copy current state into old.
  SyncClock old;
  old.tab_ = tab_;
  old.tab_idx_ = tab_idx_;
  old.size_ = size_;
  old.blocks_ = blocks_;
  old.release_store_tid_ = release_store_tid_;
  old.release_store_reused_ = release_store_reused_;
  for (unsigned i = 0; i < kDirtyTids; i++)
    old.dirty_[i] = dirty_[i];
  // Then, clear current object.
  ResetImpl();
  // Allocate brand new clock in the current object.
  Resize(c, old.size_);
  // Now copy state back into this object.
  Iter old_iter(&old);
  for (ClockElem &ce : *this) {
    ce = *old_iter;
    ++old_iter;
  }
  release_store_tid_ = old.release_store_tid_;
  release_store_reused_ = old.release_store_reused_;
  for (unsigned i = 0; i < kDirtyTids; i++)
    dirty_[i] = old.dirty_[i];
  // Drop reference to old and delete if necessary.
  old.Reset(c);
}

// Can we cache this clock for future release operations?
ALWAYS_INLINE bool SyncClock::Cachable() const {
  if (size_ == 0)
    return false;
  for (unsigned i = 0; i < kDirtyTids; i++) {
    if (dirty_[i].tid() != kInvalidTid)
      return false;
  }
  return atomic_load_relaxed(ref_ptr(tab_)) == 1;
}

// elem linearizes the two-level structure into a linear array.
// Note: this is used only for one-time accesses; vector operations use
// the iterator as it is much faster.
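// For illustration, assuming ClockBlock::kClockCount == 64: with blocks_ == 2,
// tid 70 maps to second level block 70/64 == 1 at offset 70%64 == 6; with
// blocks_ == 1 that same tid has block == blocks_, so the element lives in
// the first level block's own clock array.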
ALWAYS_INLINE ClockElem &SyncClock::elem(unsigned tid) const {
  DCHECK_LT(tid, size_);
  const uptr block = tid / ClockBlock::kClockCount;
  DCHECK_LE(block, blocks_);
  tid %= ClockBlock::kClockCount;
  if (block == blocks_)
    return tab_->clock[tid];
  u32 idx = get_block(block);
  ClockBlock *cb = ctx->clock_alloc.Map(idx);
  return cb->clock[tid];
}

ALWAYS_INLINE uptr SyncClock::capacity() const {
  if (size_ == 0)
    return 0;
  uptr ratio = sizeof(ClockBlock::clock[0]) / sizeof(ClockBlock::table[0]);
  // How many clock elements we can fit into the first level block.
  // +1 for ref counter.
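  // For illustration, assuming 8-byte clock elements and 4-byte table entries
  // (so ratio == 2) with kClockCount == 64: blocks_ == 0 leaves room for
  // 64 - 1 == 63 elements in the first level block; blocks_ == 1 gives
  // 64 + 63 == 127, because the single block index rounds up into the same
  // ratio-sized slot as the ref counter.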
  uptr top = ClockBlock::kClockCount - RoundUpTo(blocks_ + 1, ratio) / ratio;
  return blocks_ * ClockBlock::kClockCount + top;
}

ALWAYS_INLINE u32 SyncClock::get_block(uptr bi) const {
  DCHECK(size_);
  DCHECK_LT(bi, blocks_);
  return tab_->table[ClockBlock::kBlockIdx - bi];
}

ALWAYS_INLINE void SyncClock::append_block(u32 idx) {
  uptr bi = blocks_++;
  CHECK_EQ(get_block(bi), 0);
  tab_->table[ClockBlock::kBlockIdx - bi] = idx;
}

// Used only by tests.
u64 SyncClock::get(unsigned tid) const {
  for (unsigned i = 0; i < kDirtyTids; i++) {
    Dirty dirty = dirty_[i];
    if (dirty.tid() == tid)
      return dirty.epoch;
  }
  return elem(tid).epoch;
}

// Used only by the Iter test.
u64 SyncClock::get_clean(unsigned tid) const {
  return elem(tid).epoch;
}

void SyncClock::DebugDump(int(*printf)(const char *s, ...)) {
  printf("clock=[");
  for (uptr i = 0; i < size_; i++)
    printf("%s%llu", i == 0 ? "" : ",", elem(i).epoch);
  printf("] reused=[");
  for (uptr i = 0; i < size_; i++)
    printf("%s%llu", i == 0 ? "" : ",", elem(i).reused);
  printf("] release_store_tid=%d/%d dirty_tids=%d[%llu]/%d[%llu]",
         release_store_tid_, release_store_reused_, dirty_[0].tid(),
         dirty_[0].epoch, dirty_[1].tid(), dirty_[1].epoch);
}

void SyncClock::Iter::Next() {
  // Finished with the current block, move on to the next one.
  block_++;
  if (block_ < parent_->blocks_) {
    // Iterate over the next second level block.
    u32 idx = parent_->get_block(block_);
    ClockBlock *cb = ctx->clock_alloc.Map(idx);
    pos_ = &cb->clock[0];
    end_ = pos_ + min(parent_->size_ - block_ * ClockBlock::kClockCount,
        ClockBlock::kClockCount);
    return;
  }
  if (block_ == parent_->blocks_ &&
      parent_->size_ > parent_->blocks_ * ClockBlock::kClockCount) {
    // Iterate over elements in the first level block.
    pos_ = &parent_->tab_->clock[0];
    end_ = pos_ + min(parent_->size_ - block_ * ClockBlock::kClockCount,
        ClockBlock::kClockCount);
    return;
  }
  parent_ = nullptr;  // denotes end
}
}  // namespace __tsan