1 /* 2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 3 * 4 * This code is free software; you can redistribute it and/or modify it 5 * under the terms of the GNU General Public License version 2 only, as 6 * published by the Free Software Foundation. Oracle designates this 7 * particular file as subject to the "Classpath" exception as provided 8 * by Oracle in the LICENSE file that accompanied this code. 9 * 10 * This code is distributed in the hope that it will be useful, but WITHOUT 11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 13 * version 2 for more details (a copy is included in the LICENSE file that 14 * accompanied this code). 15 * 16 * You should have received a copy of the GNU General Public License version 17 * 2 along with this work; if not, write to the Free Software Foundation, 18 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 19 * 20 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 21 * or visit www.oracle.com if you need additional information or have any 22 * questions. 23 */ 24 25 /* 26 * This file is available under and governed by the GNU General Public 27 * License version 2 only, as published by the Free Software Foundation. 28 * However, the following notice accompanied the original version of this 29 * file: 30 * 31 * Written by Doug Lea with assistance from members of JCP JSR-166 32 * Expert Group and released to the public domain, as explained at 33 * http://creativecommons.org/publicdomain/zero/1.0/ 34 */ 35 36 package java.util.concurrent.atomic; 37 38 import java.lang.invoke.MethodHandles; 39 import java.lang.invoke.VarHandle; 40 import java.util.Arrays; 41 import java.util.concurrent.ThreadLocalRandom; 42 import java.util.function.DoubleBinaryOperator; 43 import java.util.function.LongBinaryOperator; 44 45 /** 46 * A package-local class holding common representation and mechanics 47 * for classes supporting dynamic striping on 64bit values. The class 48 * extends Number so that concrete subclasses must publicly do so. 49 */ 50 @SuppressWarnings({"removal","serial"}) 51 abstract class Striped64 extends Number { 52 /* 53 * This class maintains a lazily-initialized table of atomically 54 * updated variables, plus an extra "base" field. The table size 55 * is a power of two. Indexing uses masked per-thread hash codes. 56 * Nearly all declarations in this class are package-private, 57 * accessed directly by subclasses. 58 * 59 * Table entries are of class Cell; a variant of AtomicLong padded 60 * (via @Contended) to reduce cache contention. Padding is 61 * overkill for most Atomics because they are usually irregularly 62 * scattered in memory and thus don't interfere much with each 63 * other. But Atomic objects residing in arrays will tend to be 64 * placed adjacent to each other, and so will most often share 65 * cache lines (with a huge negative performance impact) without 66 * this precaution. 67 * 68 * In part because Cells are relatively large, we avoid creating 69 * them until they are needed. When there is no contention, all 70 * updates are made to the base field. Upon first contention (a 71 * failed CAS on base update), the table is initialized to size 2. 72 * The table size is doubled upon further contention until 73 * reaching the nearest power of two greater than or equal to the 74 * number of CPUS. Table slots remain empty (null) until they are 75 * needed. 76 * 77 * A single spinlock ("cellsBusy") is used for initializing and 78 * resizing the table, as well as populating slots with new Cells. 79 * There is no need for a blocking lock; when the lock is not 80 * available, threads try other slots (or the base). During these 81 * retries, there is increased contention and reduced locality, 82 * which is still better than alternatives. 83 * 84 * The Thread probe fields maintained via ThreadLocalRandom serve 85 * as per-thread hash codes. We let them remain uninitialized as 86 * zero (if they come in this way) until they contend at slot 87 * 0. They are then initialized to values that typically do not 88 * often conflict with others. Contention and/or table collisions 89 * are indicated by failed CASes when performing an update 90 * operation. Upon a collision, if the table size is less than 91 * the capacity, it is doubled in size unless some other thread 92 * holds the lock. If a hashed slot is empty, and lock is 93 * available, a new Cell is created. Otherwise, if the slot 94 * exists, a CAS is tried. Retries proceed by "double hashing", 95 * using a secondary hash (Marsaglia XorShift) to try to find a 96 * free slot. 97 * 98 * The table size is capped because, when there are more threads 99 * than CPUs, supposing that each thread were bound to a CPU, 100 * there would exist a perfect hash function mapping threads to 101 * slots that eliminates collisions. When we reach capacity, we 102 * search for this mapping by randomly varying the hash codes of 103 * colliding threads. Because search is random, and collisions 104 * only become known via CAS failures, convergence can be slow, 105 * and because threads are typically not bound to CPUS forever, 106 * may not occur at all. However, despite these limitations, 107 * observed contention rates are typically low in these cases. 108 * 109 * It is possible for a Cell to become unused when threads that 110 * once hashed to it terminate, as well as in the case where 111 * doubling the table causes no thread to hash to it under 112 * expanded mask. We do not try to detect or remove such cells, 113 * under the assumption that for long-running instances, observed 114 * contention levels will recur, so the cells will eventually be 115 * needed again; and for short-lived ones, it does not matter. 116 */ 117 118 /** 119 * Padded variant of AtomicLong supporting only raw accesses plus CAS. 120 * 121 * JVM intrinsics note: It would be possible to use a release-only 122 * form of CAS here, if it were provided. 123 */ 124 @jdk.internal.vm.annotation.Contended 125 static final class Cell { 126 volatile long value; Cell(long x)127 Cell(long x) { value = x; } cas(long cmp, long val)128 final boolean cas(long cmp, long val) { 129 return VALUE.weakCompareAndSetRelease(this, cmp, val); 130 } reset()131 final void reset() { 132 VALUE.setVolatile(this, 0L); 133 } reset(long identity)134 final void reset(long identity) { 135 VALUE.setVolatile(this, identity); 136 } getAndSet(long val)137 final long getAndSet(long val) { 138 return (long)VALUE.getAndSet(this, val); 139 } 140 141 // VarHandle mechanics 142 private static final VarHandle VALUE; 143 static { 144 try { 145 MethodHandles.Lookup l = MethodHandles.lookup(); 146 VALUE = l.findVarHandle(Cell.class, "value", long.class); 147 } catch (ReflectiveOperationException e) { 148 throw new ExceptionInInitializerError(e); 149 } 150 } 151 } 152 153 /** Number of CPUS, to place bound on table size */ 154 static final int NCPU = Runtime.getRuntime().availableProcessors(); 155 156 /** 157 * Table of cells. When non-null, size is a power of 2. 158 */ 159 transient volatile Cell[] cells; 160 161 /** 162 * Base value, used mainly when there is no contention, but also as 163 * a fallback during table initialization races. Updated via CAS. 164 */ 165 transient volatile long base; 166 167 /** 168 * Spinlock (locked via CAS) used when resizing and/or creating Cells. 169 */ 170 transient volatile int cellsBusy; 171 172 /** 173 * Package-private default constructor. 174 */ Striped64()175 Striped64() { 176 } 177 178 /** 179 * CASes the base field. 180 */ casBase(long cmp, long val)181 final boolean casBase(long cmp, long val) { 182 return BASE.weakCompareAndSetRelease(this, cmp, val); 183 } 184 getAndSetBase(long val)185 final long getAndSetBase(long val) { 186 return (long)BASE.getAndSet(this, val); 187 } 188 189 /** 190 * CASes the cellsBusy field from 0 to 1 to acquire lock. 191 */ casCellsBusy()192 final boolean casCellsBusy() { 193 return CELLSBUSY.compareAndSet(this, 0, 1); 194 } 195 196 /** 197 * Returns the probe value for the current thread. 198 * Duplicated from ThreadLocalRandom because of packaging restrictions. 199 */ getProbe()200 static final int getProbe() { 201 return (int) THREAD_PROBE.get(Thread.currentThread()); 202 } 203 204 /** 205 * Pseudo-randomly advances and records the given probe value for the 206 * given thread. 207 * Duplicated from ThreadLocalRandom because of packaging restrictions. 208 */ advanceProbe(int probe)209 static final int advanceProbe(int probe) { 210 probe ^= probe << 13; // xorshift 211 probe ^= probe >>> 17; 212 probe ^= probe << 5; 213 THREAD_PROBE.set(Thread.currentThread(), probe); 214 return probe; 215 } 216 217 /** 218 * Handles cases of updates involving initialization, resizing, 219 * creating new Cells, and/or contention. See above for 220 * explanation. This method suffers the usual non-modularity 221 * problems of optimistic retry code, relying on rechecked sets of 222 * reads. 223 * 224 * @param x the value 225 * @param fn the update function, or null for add (this convention 226 * avoids the need for an extra field or function in LongAdder). 227 * @param wasUncontended false if CAS failed before call 228 * @param index thread index from getProbe 229 */ longAccumulate(long x, LongBinaryOperator fn, boolean wasUncontended, int index)230 final void longAccumulate(long x, LongBinaryOperator fn, 231 boolean wasUncontended, int index) { 232 if (index == 0) { 233 ThreadLocalRandom.current(); // force initialization 234 index = getProbe(); 235 wasUncontended = true; 236 } 237 for (boolean collide = false;;) { // True if last slot nonempty 238 Cell[] cs; Cell c; int n; long v; 239 if ((cs = cells) != null && (n = cs.length) > 0) { 240 if ((c = cs[(n - 1) & index]) == null) { 241 if (cellsBusy == 0) { // Try to attach new Cell 242 Cell r = new Cell(x); // Optimistically create 243 if (cellsBusy == 0 && casCellsBusy()) { 244 try { // Recheck under lock 245 Cell[] rs; int m, j; 246 if ((rs = cells) != null && 247 (m = rs.length) > 0 && 248 rs[j = (m - 1) & index] == null) { 249 rs[j] = r; 250 break; 251 } 252 } finally { 253 cellsBusy = 0; 254 } 255 continue; // Slot is now non-empty 256 } 257 } 258 collide = false; 259 } 260 else if (!wasUncontended) // CAS already known to fail 261 wasUncontended = true; // Continue after rehash 262 else if (c.cas(v = c.value, 263 (fn == null) ? v + x : fn.applyAsLong(v, x))) 264 break; 265 else if (n >= NCPU || cells != cs) 266 collide = false; // At max size or stale 267 else if (!collide) 268 collide = true; 269 else if (cellsBusy == 0 && casCellsBusy()) { 270 try { 271 if (cells == cs) // Expand table unless stale 272 cells = Arrays.copyOf(cs, n << 1); 273 } finally { 274 cellsBusy = 0; 275 } 276 collide = false; 277 continue; // Retry with expanded table 278 } 279 index = advanceProbe(index); 280 } 281 else if (cellsBusy == 0 && cells == cs && casCellsBusy()) { 282 try { // Initialize table 283 if (cells == cs) { 284 Cell[] rs = new Cell[2]; 285 rs[index & 1] = new Cell(x); 286 cells = rs; 287 break; 288 } 289 } finally { 290 cellsBusy = 0; 291 } 292 } 293 // Fall back on using base 294 else if (casBase(v = base, 295 (fn == null) ? v + x : fn.applyAsLong(v, x))) 296 break; 297 } 298 } 299 apply(DoubleBinaryOperator fn, long v, double x)300 private static long apply(DoubleBinaryOperator fn, long v, double x) { 301 double d = Double.longBitsToDouble(v); 302 d = (fn == null) ? d + x : fn.applyAsDouble(d, x); 303 return Double.doubleToRawLongBits(d); 304 } 305 306 /** 307 * Same as longAccumulate, but injecting long/double conversions 308 * in too many places to sensibly merge with long version, given 309 * the low-overhead requirements of this class. So must instead be 310 * maintained by copy/paste/adapt. 311 */ doubleAccumulate(double x, DoubleBinaryOperator fn, boolean wasUncontended, int index)312 final void doubleAccumulate(double x, DoubleBinaryOperator fn, 313 boolean wasUncontended, int index) { 314 if (index == 0) { 315 ThreadLocalRandom.current(); // force initialization 316 index = getProbe(); 317 wasUncontended = true; 318 } 319 for (boolean collide = false;;) { // True if last slot nonempty 320 Cell[] cs; Cell c; int n; long v; 321 if ((cs = cells) != null && (n = cs.length) > 0) { 322 if ((c = cs[(n - 1) & index]) == null) { 323 if (cellsBusy == 0) { // Try to attach new Cell 324 Cell r = new Cell(Double.doubleToRawLongBits(x)); 325 if (cellsBusy == 0 && casCellsBusy()) { 326 try { // Recheck under lock 327 Cell[] rs; int m, j; 328 if ((rs = cells) != null && 329 (m = rs.length) > 0 && 330 rs[j = (m - 1) & index] == null) { 331 rs[j] = r; 332 break; 333 } 334 } finally { 335 cellsBusy = 0; 336 } 337 continue; // Slot is now non-empty 338 } 339 } 340 collide = false; 341 } 342 else if (!wasUncontended) // CAS already known to fail 343 wasUncontended = true; // Continue after rehash 344 else if (c.cas(v = c.value, apply(fn, v, x))) 345 break; 346 else if (n >= NCPU || cells != cs) 347 collide = false; // At max size or stale 348 else if (!collide) 349 collide = true; 350 else if (cellsBusy == 0 && casCellsBusy()) { 351 try { 352 if (cells == cs) // Expand table unless stale 353 cells = Arrays.copyOf(cs, n << 1); 354 } finally { 355 cellsBusy = 0; 356 } 357 collide = false; 358 continue; // Retry with expanded table 359 } 360 index = advanceProbe(index); 361 } 362 else if (cellsBusy == 0 && cells == cs && casCellsBusy()) { 363 try { // Initialize table 364 if (cells == cs) { 365 Cell[] rs = new Cell[2]; 366 rs[index & 1] = new Cell(Double.doubleToRawLongBits(x)); 367 cells = rs; 368 break; 369 } 370 } finally { 371 cellsBusy = 0; 372 } 373 } 374 // Fall back on using base 375 else if (casBase(v = base, apply(fn, v, x))) 376 break; 377 } 378 } 379 380 // VarHandle mechanics 381 private static final VarHandle BASE; 382 private static final VarHandle CELLSBUSY; 383 private static final VarHandle THREAD_PROBE; 384 static { 385 try { 386 MethodHandles.Lookup l = MethodHandles.lookup(); 387 BASE = l.findVarHandle(Striped64.class, 388 "base", long.class); 389 CELLSBUSY = l.findVarHandle(Striped64.class, 390 "cellsBusy", int.class); 391 l = java.security.AccessController.doPrivileged( 392 new java.security.PrivilegedAction<>() { 393 public MethodHandles.Lookup run() { 394 try { 395 return MethodHandles.privateLookupIn(Thread.class, MethodHandles.lookup()); 396 } catch (ReflectiveOperationException e) { 397 throw new ExceptionInInitializerError(e); 398 } 399 }}); 400 THREAD_PROBE = l.findVarHandle(Thread.class, 401 "threadLocalRandomProbe", int.class); 402 } catch (ReflectiveOperationException e) { 403 throw new ExceptionInInitializerError(e); 404 } 405 } 406 407 } 408