ViewVC Help
View File | Revision Log | Show Annotations | Download File | Root Listing
root/jsr166/jsr166/src/main/java/util/concurrent/ForkJoinPool.java
Revision: 1.38
Committed: Tue Sep 14 03:48:40 2010 UTC (13 years, 8 months ago) by jsr166
Branch: MAIN
Changes since 1.37: +0 -1 lines
Log Message:
fix imports

File Contents

# Content
1 /*
2 * Written by Doug Lea with assistance from members of JCP JSR-166
3 * Expert Group and released to the public domain, as explained at
4 * http://creativecommons.org/licenses/publicdomain
5 */
6
7 package java.util.concurrent;
8
9 import java.util.ArrayList;
10 import java.util.Arrays;
11 import java.util.Collection;
12 import java.util.Collections;
13 import java.util.List;
14 import java.util.concurrent.AbstractExecutorService;
15 import java.util.concurrent.Callable;
16 import java.util.concurrent.ExecutorService;
17 import java.util.concurrent.Future;
18 import java.util.concurrent.RejectedExecutionException;
19 import java.util.concurrent.RunnableFuture;
20 import java.util.concurrent.TimeUnit;
21 import java.util.concurrent.TimeoutException;
22 import java.util.concurrent.atomic.AtomicInteger;
23 import java.util.concurrent.locks.LockSupport;
24 import java.util.concurrent.locks.ReentrantLock;
25
26 /**
27 * An {@link ExecutorService} for running {@link ForkJoinTask}s.
28 * A {@code ForkJoinPool} provides the entry point for submissions
29 * from non-{@code ForkJoinTask} clients, as well as management and
30 * monitoring operations.
31 *
32 * <p>A {@code ForkJoinPool} differs from other kinds of {@link
33 * ExecutorService} mainly by virtue of employing
34 * <em>work-stealing</em>: all threads in the pool attempt to find and
35 * execute subtasks created by other active tasks (eventually blocking
36 * waiting for work if none exist). This enables efficient processing
37 * when most tasks spawn other subtasks (as do most {@code
38 * ForkJoinTask}s). When setting <em>asyncMode</em> to true in
39 * constructors, {@code ForkJoinPool}s may also be appropriate for use
40 * with event-style tasks that are never joined.
41 *
42 * <p>A {@code ForkJoinPool} is constructed with a given target
43 * parallelism level; by default, equal to the number of available
44 * processors. The pool attempts to maintain enough active (or
45 * available) threads by dynamically adding, suspending, or resuming
46 * internal worker threads, even if some tasks are stalled waiting to
47 * join others. However, no such adjustments are guaranteed in the
48 * face of blocked IO or other unmanaged synchronization. The nested
49 * {@link ManagedBlocker} interface enables extension of the kinds of
50 * synchronization accommodated.
51 *
52 * <p>In addition to execution and lifecycle control methods, this
53 * class provides status check methods (for example
54 * {@link #getStealCount}) that are intended to aid in developing,
55 * tuning, and monitoring fork/join applications. Also, method
56 * {@link #toString} returns indications of pool state in a
57 * convenient form for informal monitoring.
58 *
59 * <p> As is the case with other ExecutorServices, there are three
60 * main task execution methods summarized in the following
61 * table. These are designed to be used by clients not already engaged
62 * in fork/join computations in the current pool. The main forms of
63 * these methods accept instances of {@code ForkJoinTask}, but
64 * overloaded forms also allow mixed execution of plain {@code
65 * Runnable}- or {@code Callable}- based activities as well. However,
66 * tasks that are already executing in a pool should normally
67 * <em>NOT</em> use these pool execution methods, but instead use the
68 * within-computation forms listed in the table.
69 *
70 * <table BORDER CELLPADDING=3 CELLSPACING=1>
71 * <tr>
72 * <td></td>
73 * <td ALIGN=CENTER> <b>Call from non-fork/join clients</b></td>
74 * <td ALIGN=CENTER> <b>Call from within fork/join computations</b></td>
75 * </tr>
76 * <tr>
77 * <td> <b>Arrange async execution</td>
78 * <td> {@link #execute(ForkJoinTask)}</td>
79 * <td> {@link ForkJoinTask#fork}</td>
80 * </tr>
81 * <tr>
82 * <td> <b>Await and obtain result</td>
83 * <td> {@link #invoke(ForkJoinTask)}</td>
84 * <td> {@link ForkJoinTask#invoke}</td>
85 * </tr>
86 * <tr>
87 * <td> <b>Arrange exec and obtain Future</td>
88 * <td> {@link #submit(ForkJoinTask)}</td>
89 * <td> {@link ForkJoinTask#fork} (ForkJoinTasks <em>are</em> Futures)</td>
90 * </tr>
91 * </table>
92 *
93 * <p><b>Sample Usage.</b> Normally a single {@code ForkJoinPool} is
94 * used for all parallel task execution in a program or subsystem.
95 * Otherwise, use would not usually outweigh the construction and
96 * bookkeeping overhead of creating a large set of threads. For
97 * example, a common pool could be used for the {@code SortTasks}
98 * illustrated in {@link RecursiveAction}. Because {@code
99 * ForkJoinPool} uses threads in {@linkplain java.lang.Thread#isDaemon
100 * daemon} mode, there is typically no need to explicitly {@link
101 * #shutdown} such a pool upon program exit.
102 *
103 * <pre>
104 * static final ForkJoinPool mainPool = new ForkJoinPool();
105 * ...
106 * public void sort(long[] array) {
107 * mainPool.invoke(new SortTask(array, 0, array.length));
108 * }
109 * </pre>
110 *
111 * <p><b>Implementation notes</b>: This implementation restricts the
112 * maximum number of running threads to 32767. Attempts to create
113 * pools with greater than the maximum number result in
114 * {@code IllegalArgumentException}.
115 *
116 * <p>This implementation rejects submitted tasks (that is, by throwing
117 * {@link RejectedExecutionException}) only when the pool is shut down
118 * or internal resources have been exhausted.
119 *
120 * @since 1.7
121 * @author Doug Lea
122 */
123 public class ForkJoinPool extends AbstractExecutorService {
124
125 /*
126 * Implementation Overview
127 *
128 * This class provides the central bookkeeping and control for a
129 * set of worker threads: Submissions from non-FJ threads enter
130 * into a submission queue. Workers take these tasks and typically
131 * split them into subtasks that may be stolen by other workers.
132 * The main work-stealing mechanics implemented in class
133 * ForkJoinWorkerThread give first priority to processing tasks
134 * from their own queues (LIFO or FIFO, depending on mode), then
135 * to randomized FIFO steals of tasks in other worker queues, and
136 * lastly to new submissions. These mechanics do not consider
137 * affinities, loads, cache localities, etc, so rarely provide the
138 * best possible performance on a given machine, but portably
139 * provide good throughput by averaging over these factors.
140 * (Further, even if we did try to use such information, we do not
141 * usually have a basis for exploiting it. For example, some sets
142 * of tasks profit from cache affinities, but others are harmed by
143 * cache pollution effects.)
144 *
145 * Beyond work-stealing support and essential bookkeeping, the
146 * main responsibility of this framework is to take actions when
147 * one worker is waiting to join a task stolen (or always held by)
148 * another. Because we are multiplexing many tasks on to a pool
149 * of workers, we can't just let them block (as in Thread.join).
150 * We also cannot just reassign the joiner's run-time stack with
151 * another and replace it later, which would be a form of
152 * "continuation", that even if possible is not necessarily a good
153 * idea. Given that the creation costs of most threads on most
154 * systems mainly surrounds setting up runtime stacks, thread
155 * creation and switching is usually not much more expensive than
156 * stack creation and switching, and is more flexible). Instead we
157 * combine two tactics:
158 *
159 * Helping: Arranging for the joiner to execute some task that it
160 * would be running if the steal had not occurred. Method
161 * ForkJoinWorkerThread.helpJoinTask tracks joining->stealing
162 * links to try to find such a task.
163 *
164 * Compensating: Unless there are already enough live threads,
165 * method helpMaintainParallelism() may create or
166 * re-activate a spare thread to compensate for blocked
167 * joiners until they unblock.
168 *
169 * It is impossible to keep exactly the target (parallelism)
170 * number of threads running at any given time. Determining
171 * existence of conservatively safe helping targets, the
172 * availability of already-created spares, and the apparent need
173 * to create new spares are all racy and require heuristic
174 * guidance, so we rely on multiple retries of each. Compensation
175 * occurs in slow-motion. It is triggered only upon timeouts of
176 * Object.wait used for joins. This reduces poor decisions that
177 * would otherwise be made when threads are waiting for others
178 * that are stalled because of unrelated activities such as
179 * garbage collection.
180 *
181 * The ManagedBlocker extension API can't use helping so relies
182 * only on compensation in method awaitBlocker.
183 *
184 * The main throughput advantages of work-stealing stem from
185 * decentralized control -- workers mostly steal tasks from each
186 * other. We do not want to negate this by creating bottlenecks
187 * implementing other management responsibilities. So we use a
188 * collection of techniques that avoid, reduce, or cope well with
189 * contention. These entail several instances of bit-packing into
190 * CASable fields to maintain only the minimally required
191 * atomicity. To enable such packing, we restrict maximum
192 * parallelism to (1<<15)-1 (enabling twice this (to accommodate
193 * unbalanced increments and decrements) to fit into a 16 bit
194 * field, which is far in excess of normal operating range. Even
195 * though updates to some of these bookkeeping fields do sometimes
196 * contend with each other, they don't normally cache-contend with
197 * updates to others enough to warrant memory padding or
198 * isolation. So they are all held as fields of ForkJoinPool
199 * objects. The main capabilities are as follows:
200 *
201 * 1. Creating and removing workers. Workers are recorded in the
202 * "workers" array. This is an array as opposed to some other data
203 * structure to support index-based random steals by workers.
204 * Updates to the array recording new workers and unrecording
205 * terminated ones are protected from each other by a lock
206 * (workerLock) but the array is otherwise concurrently readable,
207 * and accessed directly by workers. To simplify index-based
208 * operations, the array size is always a power of two, and all
209 * readers must tolerate null slots. Currently, all worker thread
210 * creation is on-demand, triggered by task submissions,
211 * replacement of terminated workers, and/or compensation for
212 * blocked workers. However, all other support code is set up to
213 * work with other policies.
214 *
215 * To ensure that we do not hold on to worker references that
216 * would prevent GC, ALL accesses to workers are via indices into
217 * the workers array (which is one source of some of the unusual
218 * code constructions here). In essence, the workers array serves
219 * as a WeakReference mechanism. Thus for example the event queue
220 * stores worker indices, not worker references. Access to the
221 * workers in associated methods (for example releaseEventWaiters)
222 * must both index-check and null-check the IDs. All such accesses
223 * ignore bad IDs by returning out early from what they are doing,
224 * since this can only be associated with shutdown, in which case
225 * it is OK to give up. On termination, we just clobber these
226 * data structures without trying to use them.
227 *
228 * 2. Bookkeeping for dynamically adding and removing workers. We
229 * aim to approximately maintain the given level of parallelism.
230 * When some workers are known to be blocked (on joins or via
231 * ManagedBlocker), we may create or resume others to take their
232 * place until they unblock (see below). Implementing this
233 * requires counts of the number of "running" threads (i.e., those
234 * that are neither blocked nor artificially suspended) as well as
235 * the total number. These two values are packed into one field,
236 * "workerCounts" because we need accurate snapshots when deciding
237 * to create, resume or suspend. Note however that the
238 * correspondence of these counts to reality is not guaranteed. In
239 * particular updates for unblocked threads may lag until they
240 * actually wake up.
241 *
242 * 3. Maintaining global run state. The run state of the pool
243 * consists of a runLevel (SHUTDOWN, TERMINATING, etc) similar to
244 * those in other Executor implementations, as well as a count of
245 * "active" workers -- those that are, or soon will be, or
246 * recently were executing tasks. The runLevel and active count
247 * are packed together in order to correctly trigger shutdown and
248 * termination. Without care, active counts can be subject to very
249 * high contention. We substantially reduce this contention by
250 * relaxing update rules. A worker must claim active status
251 * prospectively, by activating if it sees that a submitted or
252 * stealable task exists (it may find after activating that the
253 * task no longer exists). It stays active while processing this
254 * task (if it exists) and any other local subtasks it produces,
255 * until it cannot find any other tasks. It then tries
256 * inactivating (see method preStep), but upon update contention
257 * instead scans for more tasks, later retrying inactivation if it
258 * doesn't find any.
259 *
260 * 4. Managing idle workers waiting for tasks. We cannot let
261 * workers spin indefinitely scanning for tasks when none are
262 * available. On the other hand, we must quickly prod them into
263 * action when new tasks are submitted or generated. We
264 * park/unpark these idle workers using an event-count scheme.
265 * Field eventCount is incremented upon events that may enable
266 * workers that previously could not find a task to now find one:
267 * Submission of a new task to the pool, or another worker pushing
268 * a task onto a previously empty queue. (We also use this
269 * mechanism for configuration and termination actions that
270 * require wakeups of idle workers). Each worker maintains its
271 * last known event count, and blocks when a scan for work did not
272 * find a task AND its lastEventCount matches the current
273 * eventCount. Waiting idle workers are recorded in a variant of
274 * Treiber stack headed by field eventWaiters which, when nonzero,
275 * encodes the thread index and count awaited for by the worker
276 * thread most recently calling eventSync. This thread in turn has
277 * a record (field nextEventWaiter) for the next waiting worker.
278 * In addition to allowing simpler decisions about need for
279 * wakeup, the event count bits in eventWaiters serve the role of
280 * tags to avoid ABA errors in Treiber stacks. Upon any wakeup,
281 * released threads also try to release at most two others. The
282 * net effect is a tree-like diffusion of signals, where released
283 * threads (and possibly others) help with unparks. To further
284 * reduce contention effects a bit, failed CASes to increment
285 * field eventCount are tolerated without retries in signalWork.
286 * Conceptually they are merged into the same event, which is OK
287 * when their only purpose is to enable workers to scan for work.
288 *
289 * 5. Managing suspension of extra workers. When a worker notices
290 * (usually upon timeout of a wait()) that there are too few
291 * running threads, we may create a new thread to maintain
292 * parallelism level, or at least avoid starvation. Usually, extra
293 * threads are needed for only very short periods, yet join
294 * dependencies are such that we sometimes need them in
295 * bursts. Rather than create new threads each time this happens,
296 * we suspend no-longer-needed extra ones as "spares". For most
297 * purposes, we don't distinguish "extra" spare threads from
298 * normal "core" threads: On each call to preStep (the only point
299 * at which we can do this) a worker checks to see if there are
300 * now too many running workers, and if so, suspends itself.
301 * Method helpMaintainParallelism looks for suspended threads to
302 * resume before considering creating a new replacement. The
303 * spares themselves are encoded on another variant of a Treiber
304 * Stack, headed at field "spareWaiters". Note that the use of
305 * spares is intrinsically racy. One thread may become a spare at
306 * about the same time as another is needlessly being created. We
307 * counteract this and related slop in part by requiring resumed
308 * spares to immediately recheck (in preStep) to see whether they
309 * should re-suspend.
310 *
311 * 6. Killing off unneeded workers. A timeout mechanism is used to
312 * shed unused workers: The oldest (first) event queue waiter uses
313 * a timed rather than hard wait. When this wait times out without
314 * a normal wakeup, it tries to shutdown any one (for convenience
315 * the newest) other spare or event waiter via
316 * tryShutdownUnusedWorker. This eventually reduces the number of
317 * worker threads to a minimum of one after a long enough period
318 * without use.
319 *
320 * 7. Deciding when to create new workers. The main dynamic
321 * control in this class is deciding when to create extra threads
322 * in method helpMaintainParallelism. We would like to keep
323 * exactly #parallelism threads running, which is an impossible
324 * task. We always need to create one when the number of running
325 * threads would become zero and all workers are busy. Beyond
326 * this, we must rely on heuristics that work well in the
327 * presence of transient phenomena such as GC stalls, dynamic
328 * compilation, and wake-up lags. These transients are extremely
329 * common -- we are normally trying to fully saturate the CPUs on
330 * a machine, so almost any activity other than running tasks
331 * impedes accuracy. Our main defense is to allow parallelism to
332 * lapse for a while during joins, and use a timeout to see if,
333 * after the resulting settling, there is still a need for
334 * additional workers. This also better copes with the fact that
335 * some of the methods in this class tend to never become compiled
336 * (but are interpreted), so some components of the entire set of
337 * controls might execute 100 times faster than others. And
338 * similarly for cases where the apparent lack of work is just due
339 * to GC stalls and other transient system activity.
340 *
341 * Beware that there is a lot of representation-level coupling
342 * among classes ForkJoinPool, ForkJoinWorkerThread, and
343 * ForkJoinTask. For example, direct access to "workers" array by
344 * workers, and direct access to ForkJoinTask.status by both
345 * ForkJoinPool and ForkJoinWorkerThread. There is little point
346 * trying to reduce this, since any associated future changes in
347 * representations will need to be accompanied by algorithmic
348 * changes anyway.
349 *
350 * Style notes: There are lots of inline assignments (of form
351 * "while ((local = field) != 0)") which are usually the simplest
352 * way to ensure the required read orderings (which are sometimes
353 * critical). Also several occurrences of the unusual "do {}
354 * while (!cas...)" which is the simplest way to force an update of
355 * a CAS'ed variable. There are also other coding oddities that
356 * help some methods perform reasonably even when interpreted (not
357 * compiled), at the expense of some messy constructions that
358 * reduce byte code counts.
359 *
360 * The order of declarations in this file is: (1) statics (2)
361 * fields (along with constants used when unpacking some of them)
362 * (3) internal control methods (4) callbacks and other support
363 * for ForkJoinTask and ForkJoinWorkerThread classes, (5) exported
364 * methods (plus a few little helpers).
365 */
366
367 /**
368 * Factory for creating new {@link ForkJoinWorkerThread}s.
369 * A {@code ForkJoinWorkerThreadFactory} must be defined and used
370 * for {@code ForkJoinWorkerThread} subclasses that extend base
371 * functionality or initialize threads with different contexts.
372 */
373 public static interface ForkJoinWorkerThreadFactory {
374 /**
375 * Returns a new worker thread operating in the given pool.
376 *
377 * @param pool the pool this thread works in
378 * @throws NullPointerException if the pool is null
379 */
380 public ForkJoinWorkerThread newThread(ForkJoinPool pool);
381 }
382
383 /**
384 * Default ForkJoinWorkerThreadFactory implementation; creates a
385 * new ForkJoinWorkerThread.
386 */
387 static class DefaultForkJoinWorkerThreadFactory
388 implements ForkJoinWorkerThreadFactory {
389 public ForkJoinWorkerThread newThread(ForkJoinPool pool) {
390 return new ForkJoinWorkerThread(pool);
391 }
392 }
393
394 /**
395 * Creates a new ForkJoinWorkerThread. This factory is used unless
396 * overridden in ForkJoinPool constructors.
397 */
398 public static final ForkJoinWorkerThreadFactory
399 defaultForkJoinWorkerThreadFactory =
400 new DefaultForkJoinWorkerThreadFactory();
401
402 /**
403 * Permission required for callers of methods that may start or
404 * kill threads.
405 */
406 private static final RuntimePermission modifyThreadPermission =
407 new RuntimePermission("modifyThread");
408
409 /**
410 * If there is a security manager, makes sure caller has
411 * permission to modify threads.
412 */
413 private static void checkPermission() {
414 SecurityManager security = System.getSecurityManager();
415 if (security != null)
416 security.checkPermission(modifyThreadPermission);
417 }
418
419 /**
420 * Generator for assigning sequence numbers as pool names.
421 */
422 private static final AtomicInteger poolNumberGenerator =
423 new AtomicInteger();
424
425 /**
426 * The time to block in a join (see awaitJoin) before checking if
427 * a new worker should be (re)started to maintain parallelism
428 * level. The value should be short enough to maintain global
429 * responsiveness and progress but long enough to avoid
430 * counterproductive firings during GC stalls or unrelated system
431 * activity, and to not bog down systems with continual re-firings
432 * on GCs or legitimately long waits.
433 */
434 private static final long JOIN_TIMEOUT_MILLIS = 250L; // 4 per second
435
436 /**
437 * The wakeup interval (in nanoseconds) for the oldest worker
438 * waiting for an event to invoke tryShutdownUnusedWorker to
439 * shrink the number of workers. The exact value does not matter
440 * too much. It must be short enough to release resources during
441 * sustained periods of idleness, but not so short that threads
442 * are continually re-created.
443 */
444 private static final long SHRINK_RATE_NANOS =
445 30L * 1000L * 1000L * 1000L; // 2 per minute
446
447 /**
448 * Absolute bound for parallelism level. Twice this number plus
449 * one (i.e., 0xfff) must fit into a 16bit field to enable
450 * word-packing for some counts and indices.
451 */
452 private static final int MAX_WORKERS = 0x7fff;
453
454 /**
455 * Array holding all worker threads in the pool. Array size must
456 * be a power of two. Updates and replacements are protected by
457 * workerLock, but the array is always kept in a consistent enough
458 * state to be randomly accessed without locking by workers
459 * performing work-stealing, as well as other traversal-based
460 * methods in this class. All readers must tolerate that some
461 * array slots may be null.
462 */
463 volatile ForkJoinWorkerThread[] workers;
464
465 /**
466 * Queue for external submissions.
467 */
468 private final LinkedTransferQueue<ForkJoinTask<?>> submissionQueue;
469
470 /**
471 * Lock protecting updates to workers array.
472 */
473 private final ReentrantLock workerLock;
474
475 /**
476 * Latch released upon termination.
477 */
478 private final Phaser termination;
479
480 /**
481 * Creation factory for worker threads.
482 */
483 private final ForkJoinWorkerThreadFactory factory;
484
485 /**
486 * Sum of per-thread steal counts, updated only when threads are
487 * idle or terminating.
488 */
489 private volatile long stealCount;
490
491 /**
492 * Encoded record of top of Treiber stack of threads waiting for
493 * events. The top 32 bits contain the count being waited for. The
494 * bottom 16 bits contains one plus the pool index of waiting
495 * worker thread. (Bits 16-31 are unused.)
496 */
497 private volatile long eventWaiters;
498
499 private static final int EVENT_COUNT_SHIFT = 32;
500 private static final long WAITER_ID_MASK = (1L << 16) - 1L;
501
502 /**
503 * A counter for events that may wake up worker threads:
504 * - Submission of a new task to the pool
505 * - A worker pushing a task on an empty queue
506 * - termination
507 */
508 private volatile int eventCount;
509
510 /**
511 * Encoded record of top of Treiber stack of spare threads waiting
512 * for resumption. The top 16 bits contain an arbitrary count to
513 * avoid ABA effects. The bottom 16bits contains one plus the pool
514 * index of waiting worker thread.
515 */
516 private volatile int spareWaiters;
517
518 private static final int SPARE_COUNT_SHIFT = 16;
519 private static final int SPARE_ID_MASK = (1 << 16) - 1;
520
521 /**
522 * Lifecycle control. The low word contains the number of workers
523 * that are (probably) executing tasks. This value is atomically
524 * incremented before a worker gets a task to run, and decremented
525 * when a worker has no tasks and cannot find any. Bits 16-18
526 * contain runLevel value. When all are zero, the pool is
527 * running. Level transitions are monotonic (running -> shutdown
528 * -> terminating -> terminated) so each transition adds a bit.
529 * These are bundled together to ensure consistent read for
530 * termination checks (i.e., that runLevel is at least SHUTDOWN
531 * and active threads is zero).
532 *
533 * Notes: Most direct CASes are dependent on these bitfield
534 * positions. Also, this field is non-private to enable direct
535 * performance-sensitive CASes in ForkJoinWorkerThread.
536 */
537 volatile int runState;
538
539 // Note: The order among run level values matters.
540 private static final int RUNLEVEL_SHIFT = 16;
541 private static final int SHUTDOWN = 1 << RUNLEVEL_SHIFT;
542 private static final int TERMINATING = 1 << (RUNLEVEL_SHIFT + 1);
543 private static final int TERMINATED = 1 << (RUNLEVEL_SHIFT + 2);
544 private static final int ACTIVE_COUNT_MASK = (1 << RUNLEVEL_SHIFT) - 1;
545
546 /**
547 * Holds number of total (i.e., created and not yet terminated)
548 * and running (i.e., not blocked on joins or other managed sync)
549 * threads, packed together to ensure consistent snapshot when
550 * making decisions about creating and suspending spare
551 * threads. Updated only by CAS. Note that adding a new worker
552 * requires incrementing both counts, since workers start off in
553 * running state.
554 */
555 private volatile int workerCounts;
556
557 private static final int TOTAL_COUNT_SHIFT = 16;
558 private static final int RUNNING_COUNT_MASK = (1 << TOTAL_COUNT_SHIFT) - 1;
559 private static final int ONE_RUNNING = 1;
560 private static final int ONE_TOTAL = 1 << TOTAL_COUNT_SHIFT;
561
562 /**
563 * The target parallelism level.
564 * Accessed directly by ForkJoinWorkerThreads.
565 */
566 final int parallelism;
567
568 /**
569 * True if use local fifo, not default lifo, for local polling
570 * Read by, and replicated by ForkJoinWorkerThreads
571 */
572 final boolean locallyFifo;
573
574 /**
575 * The uncaught exception handler used when any worker abruptly
576 * terminates.
577 */
578 private final Thread.UncaughtExceptionHandler ueh;
579
580 /**
581 * Pool number, just for assigning useful names to worker threads
582 */
583 private final int poolNumber;
584
585 // Utilities for CASing fields. Note that most of these
586 // are usually manually inlined by callers
587
588 /**
589 * Increments running count part of workerCounts
590 */
591 final void incrementRunningCount() {
592 int c;
593 do {} while (!UNSAFE.compareAndSwapInt(this, workerCountsOffset,
594 c = workerCounts,
595 c + ONE_RUNNING));
596 }
597
598 /**
599 * Tries to decrement running count unless already zero
600 */
601 final boolean tryDecrementRunningCount() {
602 int wc = workerCounts;
603 if ((wc & RUNNING_COUNT_MASK) == 0)
604 return false;
605 return UNSAFE.compareAndSwapInt(this, workerCountsOffset,
606 wc, wc - ONE_RUNNING);
607 }
608
609 /**
610 * Forces decrement of encoded workerCounts, awaiting nonzero if
611 * (rarely) necessary when other count updates lag.
612 *
613 * @param dr -- either zero or ONE_RUNNING
614 * @param dt -- either zero or ONE_TOTAL
615 */
616 private void decrementWorkerCounts(int dr, int dt) {
617 for (;;) {
618 int wc = workerCounts;
619 if ((wc & RUNNING_COUNT_MASK) - dr < 0 ||
620 (wc >>> TOTAL_COUNT_SHIFT) - dt < 0) {
621 if ((runState & TERMINATED) != 0)
622 return; // lagging termination on a backout
623 Thread.yield();
624 }
625 if (UNSAFE.compareAndSwapInt(this, workerCountsOffset,
626 wc, wc - (dr + dt)))
627 return;
628 }
629 }
630
631 /**
632 * Tries decrementing active count; fails on contention.
633 * Called when workers cannot find tasks to run.
634 */
635 final boolean tryDecrementActiveCount() {
636 int c;
637 return UNSAFE.compareAndSwapInt(this, runStateOffset,
638 c = runState, c - 1);
639 }
640
641 /**
642 * Advances to at least the given level. Returns true if not
643 * already in at least the given level.
644 */
645 private boolean advanceRunLevel(int level) {
646 for (;;) {
647 int s = runState;
648 if ((s & level) != 0)
649 return false;
650 if (UNSAFE.compareAndSwapInt(this, runStateOffset, s, s | level))
651 return true;
652 }
653 }
654
655 // workers array maintenance
656
657 /**
658 * Records and returns a workers array index for new worker.
659 */
660 private int recordWorker(ForkJoinWorkerThread w) {
661 // Try using slot totalCount-1. If not available, scan and/or resize
662 int k = (workerCounts >>> TOTAL_COUNT_SHIFT) - 1;
663 final ReentrantLock lock = this.workerLock;
664 lock.lock();
665 try {
666 ForkJoinWorkerThread[] ws = workers;
667 int n = ws.length;
668 if (k < 0 || k >= n || ws[k] != null) {
669 for (k = 0; k < n && ws[k] != null; ++k)
670 ;
671 if (k == n)
672 ws = Arrays.copyOf(ws, n << 1);
673 }
674 ws[k] = w;
675 workers = ws; // volatile array write ensures slot visibility
676 } finally {
677 lock.unlock();
678 }
679 return k;
680 }
681
682 /**
683 * Nulls out record of worker in workers array.
684 */
685 private void forgetWorker(ForkJoinWorkerThread w) {
686 int idx = w.poolIndex;
687 // Locking helps method recordWorker avoid unnecessary expansion
688 final ReentrantLock lock = this.workerLock;
689 lock.lock();
690 try {
691 ForkJoinWorkerThread[] ws = workers;
692 if (idx >= 0 && idx < ws.length && ws[idx] == w) // verify
693 ws[idx] = null;
694 } finally {
695 lock.unlock();
696 }
697 }
698
699 /**
700 * Final callback from terminating worker. Removes record of
701 * worker from array, and adjusts counts. If pool is shutting
702 * down, tries to complete termination.
703 *
704 * @param w the worker
705 */
706 final void workerTerminated(ForkJoinWorkerThread w) {
707 forgetWorker(w);
708 decrementWorkerCounts(w.isTrimmed()? 0 : ONE_RUNNING, ONE_TOTAL);
709 while (w.stealCount != 0) // collect final count
710 tryAccumulateStealCount(w);
711 tryTerminate(false);
712 }
713
714 // Waiting for and signalling events
715
716 /**
717 * Releases workers blocked on a count not equal to current count.
718 * Normally called after precheck that eventWaiters isn't zero to
719 * avoid wasted array checks. Gives up upon a change in count or
720 * upon releasing two workers, letting others take over.
721 */
722 private void releaseEventWaiters() {
723 ForkJoinWorkerThread[] ws = workers;
724 int n = ws.length;
725 long h = eventWaiters;
726 int ec = eventCount;
727 boolean releasedOne = false;
728 ForkJoinWorkerThread w; int id;
729 while ((id = ((int)(h & WAITER_ID_MASK)) - 1) >= 0 &&
730 (int)(h >>> EVENT_COUNT_SHIFT) != ec &&
731 id < n && (w = ws[id]) != null) {
732 if (UNSAFE.compareAndSwapLong(this, eventWaitersOffset,
733 h, w.nextWaiter)) {
734 LockSupport.unpark(w);
735 if (releasedOne) // exit on second release
736 break;
737 releasedOne = true;
738 }
739 if (eventCount != ec)
740 break;
741 h = eventWaiters;
742 }
743 }
744
745 /**
746 * Tries to advance eventCount and releases waiters. Called only
747 * from workers.
748 */
749 final void signalWork() {
750 int c; // try to increment event count -- CAS failure OK
751 UNSAFE.compareAndSwapInt(this, eventCountOffset, c = eventCount, c+1);
752 if (eventWaiters != 0L)
753 releaseEventWaiters();
754 }
755
756 /**
757 * Adds the given worker to event queue and blocks until
758 * terminating or event count advances from the given value
759 *
760 * @param w the calling worker thread
761 * @param ec the count
762 */
763 private void eventSync(ForkJoinWorkerThread w, int ec) {
764 long nh = (((long)ec) << EVENT_COUNT_SHIFT) | ((long)(w.poolIndex+1));
765 long h;
766 while ((runState < SHUTDOWN || !tryTerminate(false)) &&
767 (((int)((h = eventWaiters) & WAITER_ID_MASK)) == 0 ||
768 (int)(h >>> EVENT_COUNT_SHIFT) == ec) &&
769 eventCount == ec) {
770 if (UNSAFE.compareAndSwapLong(this, eventWaitersOffset,
771 w.nextWaiter = h, nh)) {
772 awaitEvent(w, ec);
773 break;
774 }
775 }
776 }
777
778 /**
779 * Blocks the given worker (that has already been entered as an
780 * event waiter) until terminating or event count advances from
781 * the given value. The oldest (first) waiter uses a timed wait to
782 * occasionally one-by-one shrink the number of workers (to a
783 * minimum of one) if the pool has not been used for extended
784 * periods.
785 *
786 * @param w the calling worker thread
787 * @param ec the count
788 */
789 private void awaitEvent(ForkJoinWorkerThread w, int ec) {
790 while (eventCount == ec) {
791 if (tryAccumulateStealCount(w)) { // transfer while idle
792 boolean untimed = (w.nextWaiter != 0L ||
793 (workerCounts & RUNNING_COUNT_MASK) <= 1);
794 long startTime = untimed? 0 : System.nanoTime();
795 Thread.interrupted(); // clear/ignore interrupt
796 if (eventCount != ec || w.runState != 0 ||
797 runState >= TERMINATING) // recheck after clear
798 break;
799 if (untimed)
800 LockSupport.park(w);
801 else {
802 LockSupport.parkNanos(w, SHRINK_RATE_NANOS);
803 if (eventCount != ec || w.runState != 0 ||
804 runState >= TERMINATING)
805 break;
806 if (System.nanoTime() - startTime >= SHRINK_RATE_NANOS)
807 tryShutdownUnusedWorker(ec);
808 }
809 }
810 }
811 }
812
813 // Maintaining parallelism
814
815 /**
816 * Pushes worker onto the spare stack.
817 */
818 final void pushSpare(ForkJoinWorkerThread w) {
819 int ns = (++w.spareCount << SPARE_COUNT_SHIFT) | (w.poolIndex + 1);
820 do {} while (!UNSAFE.compareAndSwapInt(this, spareWaitersOffset,
821 w.nextSpare = spareWaiters,ns));
822 }
823
824 /**
825 * Tries (once) to resume a spare if the number of running
826 * threads is less than target.
827 */
828 private void tryResumeSpare() {
829 int sw, id;
830 ForkJoinWorkerThread[] ws = workers;
831 int n = ws.length;
832 ForkJoinWorkerThread w;
833 if ((sw = spareWaiters) != 0 &&
834 (id = (sw & SPARE_ID_MASK) - 1) >= 0 &&
835 id < n && (w = ws[id]) != null &&
836 (workerCounts & RUNNING_COUNT_MASK) < parallelism &&
837 spareWaiters == sw &&
838 UNSAFE.compareAndSwapInt(this, spareWaitersOffset,
839 sw, w.nextSpare)) {
840 int c; // increment running count before resume
841 do {} while (!UNSAFE.compareAndSwapInt
842 (this, workerCountsOffset,
843 c = workerCounts, c + ONE_RUNNING));
844 if (w.tryUnsuspend())
845 LockSupport.unpark(w);
846 else // back out if w was shutdown
847 decrementWorkerCounts(ONE_RUNNING, 0);
848 }
849 }
850
851 /**
852 * Tries to increase the number of running workers if below target
853 * parallelism: If a spare exists tries to resume it via
854 * tryResumeSpare. Otherwise, if not enough total workers or all
855 * existing workers are busy, adds a new worker. In all cases also
856 * helps wake up releasable workers waiting for work.
857 */
858 private void helpMaintainParallelism() {
859 int pc = parallelism;
860 int wc, rs, tc;
861 while (((wc = workerCounts) & RUNNING_COUNT_MASK) < pc &&
862 (rs = runState) < TERMINATING) {
863 if (spareWaiters != 0)
864 tryResumeSpare();
865 else if ((tc = wc >>> TOTAL_COUNT_SHIFT) >= MAX_WORKERS ||
866 (tc >= pc && (rs & ACTIVE_COUNT_MASK) != tc))
867 break; // enough total
868 else if (runState == rs && workerCounts == wc &&
869 UNSAFE.compareAndSwapInt(this, workerCountsOffset, wc,
870 wc + (ONE_RUNNING|ONE_TOTAL))) {
871 ForkJoinWorkerThread w = null;
872 try {
873 w = factory.newThread(this);
874 } finally { // adjust on null or exceptional factory return
875 if (w == null) {
876 decrementWorkerCounts(ONE_RUNNING, ONE_TOTAL);
877 tryTerminate(false); // handle failure during shutdown
878 }
879 }
880 if (w == null)
881 break;
882 w.start(recordWorker(w), ueh);
883 if ((workerCounts >>> TOTAL_COUNT_SHIFT) >= pc) {
884 int c; // advance event count
885 UNSAFE.compareAndSwapInt(this, eventCountOffset,
886 c = eventCount, c+1);
887 break; // add at most one unless total below target
888 }
889 }
890 }
891 if (eventWaiters != 0L)
892 releaseEventWaiters();
893 }
894
895 /**
896 * Callback from the oldest waiter in awaitEvent waking up after a
897 * period of non-use. If all workers are idle, tries (once) to
898 * shutdown an event waiter or a spare, if one exists. Note that
899 * we don't need CAS or locks here because the method is called
900 * only from one thread occasionally waking (and even misfires are
901 * OK). Note that until the shutdown worker fully terminates,
902 * workerCounts will overestimate total count, which is tolerable.
903 *
904 * @param ec the event count waited on by caller (to abort
905 * attempt if count has since changed).
906 */
907 private void tryShutdownUnusedWorker(int ec) {
908 if (runState == 0 && eventCount == ec) { // only trigger if all idle
909 ForkJoinWorkerThread[] ws = workers;
910 int n = ws.length;
911 ForkJoinWorkerThread w = null;
912 boolean shutdown = false;
913 int sw;
914 long h;
915 if ((sw = spareWaiters) != 0) { // prefer killing spares
916 int id = (sw & SPARE_ID_MASK) - 1;
917 if (id >= 0 && id < n && (w = ws[id]) != null &&
918 UNSAFE.compareAndSwapInt(this, spareWaitersOffset,
919 sw, w.nextSpare))
920 shutdown = true;
921 }
922 else if ((h = eventWaiters) != 0L) {
923 long nh;
924 int id = ((int)(h & WAITER_ID_MASK)) - 1;
925 if (id >= 0 && id < n && (w = ws[id]) != null &&
926 (nh = w.nextWaiter) != 0L && // keep at least one worker
927 UNSAFE.compareAndSwapLong(this, eventWaitersOffset, h, nh))
928 shutdown = true;
929 }
930 if (w != null && shutdown) {
931 w.shutdown();
932 LockSupport.unpark(w);
933 }
934 }
935 releaseEventWaiters(); // in case of interference
936 }
937
938 /**
939 * Callback from workers invoked upon each top-level action (i.e.,
940 * stealing a task or taking a submission and running it).
941 * Performs one or more of the following:
942 *
943 * 1. If the worker is active and either did not run a task
944 * or there are too many workers, try to set its active status
945 * to inactive and update activeCount. On contention, we may
946 * try again in this or a subsequent call.
947 *
948 * 2. If not enough total workers, help create some.
949 *
950 * 3. If there are too many running workers, suspend this worker
951 * (first forcing inactive if necessary). If it is not needed,
952 * it may be shutdown while suspended (via
953 * tryShutdownUnusedWorker). Otherwise, upon resume it
954 * rechecks running thread count and need for event sync.
955 *
956 * 4. If worker did not run a task, await the next task event via
957 * eventSync if necessary (first forcing inactivation), upon
958 * which the worker may be shutdown via
959 * tryShutdownUnusedWorker. Otherwise, help release any
960 * existing event waiters that are now releasable,
961 *
962 * @param w the worker
963 * @param ran true if worker ran a task since last call to this method
964 */
965 final void preStep(ForkJoinWorkerThread w, boolean ran) {
966 int wec = w.lastEventCount;
967 boolean active = w.active;
968 boolean inactivate = false;
969 int pc = parallelism;
970 int rs;
971 while (w.runState == 0 && (rs = runState) < TERMINATING) {
972 if ((inactivate || (active && (rs & ACTIVE_COUNT_MASK) >= pc)) &&
973 UNSAFE.compareAndSwapInt(this, runStateOffset, rs, rs - 1))
974 inactivate = active = w.active = false;
975 int wc = workerCounts;
976 if ((wc & RUNNING_COUNT_MASK) > pc) {
977 if (!(inactivate |= active) && // must inactivate to suspend
978 workerCounts == wc && // try to suspend as spare
979 UNSAFE.compareAndSwapInt(this, workerCountsOffset,
980 wc, wc - ONE_RUNNING))
981 w.suspendAsSpare();
982 }
983 else if ((wc >>> TOTAL_COUNT_SHIFT) < pc)
984 helpMaintainParallelism(); // not enough workers
985 else if (!ran) {
986 long h = eventWaiters;
987 int ec = eventCount;
988 if (h != 0L && (int)(h >>> EVENT_COUNT_SHIFT) != ec)
989 releaseEventWaiters(); // release others before waiting
990 else if (ec != wec) {
991 w.lastEventCount = ec; // no need to wait
992 break;
993 }
994 else if (!(inactivate |= active))
995 eventSync(w, wec); // must inactivate before sync
996 }
997 else
998 break;
999 }
1000 }
1001
1002 /**
1003 * Helps and/or blocks awaiting join of the given task.
1004 * See above for explanation.
1005 *
1006 * @param joinMe the task to join
1007 * @param worker the current worker thread
1008 */
1009 final void awaitJoin(ForkJoinTask<?> joinMe, ForkJoinWorkerThread worker) {
1010 int retries = 2 + (parallelism >> 2); // #helpJoins before blocking
1011 while (joinMe.status >= 0) {
1012 int wc;
1013 worker.helpJoinTask(joinMe);
1014 if (joinMe.status < 0)
1015 break;
1016 else if (retries > 0)
1017 --retries;
1018 else if (((wc = workerCounts) & RUNNING_COUNT_MASK) != 0 &&
1019 UNSAFE.compareAndSwapInt(this, workerCountsOffset,
1020 wc, wc - ONE_RUNNING)) {
1021 int stat, c; long h;
1022 while ((stat = joinMe.status) >= 0 &&
1023 (h = eventWaiters) != 0L && // help release others
1024 (int)(h >>> EVENT_COUNT_SHIFT) != eventCount)
1025 releaseEventWaiters();
1026 if (stat >= 0 &&
1027 ((workerCounts & RUNNING_COUNT_MASK) == 0 ||
1028 (stat =
1029 joinMe.internalAwaitDone(JOIN_TIMEOUT_MILLIS)) >= 0))
1030 helpMaintainParallelism(); // timeout or no running workers
1031 do {} while (!UNSAFE.compareAndSwapInt
1032 (this, workerCountsOffset,
1033 c = workerCounts, c + ONE_RUNNING));
1034 if (stat < 0)
1035 break; // else restart
1036 }
1037 }
1038 }
1039
1040 /**
1041 * Same idea as awaitJoin, but no helping, retries, or timeouts.
1042 */
1043 final void awaitBlocker(ManagedBlocker blocker)
1044 throws InterruptedException {
1045 while (!blocker.isReleasable()) {
1046 int wc = workerCounts;
1047 if ((wc & RUNNING_COUNT_MASK) != 0 &&
1048 UNSAFE.compareAndSwapInt(this, workerCountsOffset,
1049 wc, wc - ONE_RUNNING)) {
1050 try {
1051 while (!blocker.isReleasable()) {
1052 long h = eventWaiters;
1053 if (h != 0L &&
1054 (int)(h >>> EVENT_COUNT_SHIFT) != eventCount)
1055 releaseEventWaiters();
1056 else if ((workerCounts & RUNNING_COUNT_MASK) == 0 &&
1057 runState < TERMINATING)
1058 helpMaintainParallelism();
1059 else if (blocker.block())
1060 break;
1061 }
1062 } finally {
1063 int c;
1064 do {} while (!UNSAFE.compareAndSwapInt
1065 (this, workerCountsOffset,
1066 c = workerCounts, c + ONE_RUNNING));
1067 }
1068 break;
1069 }
1070 }
1071 }
1072
1073 /**
1074 * Possibly initiates and/or completes termination.
1075 *
1076 * @param now if true, unconditionally terminate, else only
1077 * if shutdown and empty queue and no active workers
1078 * @return true if now terminating or terminated
1079 */
1080 private boolean tryTerminate(boolean now) {
1081 if (now)
1082 advanceRunLevel(SHUTDOWN); // ensure at least SHUTDOWN
1083 else if (runState < SHUTDOWN ||
1084 !submissionQueue.isEmpty() ||
1085 (runState & ACTIVE_COUNT_MASK) != 0)
1086 return false;
1087
1088 if (advanceRunLevel(TERMINATING))
1089 startTerminating();
1090
1091 // Finish now if all threads terminated; else in some subsequent call
1092 if ((workerCounts >>> TOTAL_COUNT_SHIFT) == 0) {
1093 advanceRunLevel(TERMINATED);
1094 termination.arrive();
1095 }
1096 return true;
1097 }
1098
1099 /**
1100 * Actions on transition to TERMINATING
1101 *
1102 * Runs up to four passes through workers: (0) shutting down each
1103 * (without waking up if parked) to quickly spread notifications
1104 * without unnecessary bouncing around event queues etc (1) wake
1105 * up and help cancel tasks (2) interrupt (3) mop up races with
1106 * interrupted workers
1107 */
1108 private void startTerminating() {
1109 cancelSubmissions();
1110 for (int passes = 0; passes < 4 && workerCounts != 0; ++passes) {
1111 int c; // advance event count
1112 UNSAFE.compareAndSwapInt(this, eventCountOffset,
1113 c = eventCount, c+1);
1114 eventWaiters = 0L; // clobber lists
1115 spareWaiters = 0;
1116 for (ForkJoinWorkerThread w : workers) {
1117 if (w != null) {
1118 w.shutdown();
1119 if (passes > 0 && !w.isTerminated()) {
1120 w.cancelTasks();
1121 LockSupport.unpark(w);
1122 if (passes > 1) {
1123 try {
1124 w.interrupt();
1125 } catch (SecurityException ignore) {
1126 }
1127 }
1128 }
1129 }
1130 }
1131 }
1132 }
1133
1134 /**
1135 * Clears out and cancels submissions, ignoring exceptions.
1136 */
1137 private void cancelSubmissions() {
1138 ForkJoinTask<?> task;
1139 while ((task = submissionQueue.poll()) != null) {
1140 try {
1141 task.cancel(false);
1142 } catch (Throwable ignore) {
1143 }
1144 }
1145 }
1146
1147 // misc support for ForkJoinWorkerThread
1148
1149 /**
1150 * Returns pool number.
1151 */
1152 final int getPoolNumber() {
1153 return poolNumber;
1154 }
1155
1156 /**
1157 * Tries to accumulate steal count from a worker, clearing
1158 * the worker's value if successful.
1159 *
1160 * @return true if worker steal count now zero
1161 */
1162 final boolean tryAccumulateStealCount(ForkJoinWorkerThread w) {
1163 int sc = w.stealCount;
1164 long c = stealCount;
1165 // CAS even if zero, for fence effects
1166 if (UNSAFE.compareAndSwapLong(this, stealCountOffset, c, c + sc)) {
1167 if (sc != 0)
1168 w.stealCount = 0;
1169 return true;
1170 }
1171 return sc == 0;
1172 }
1173
1174 /**
1175 * Returns the approximate (non-atomic) number of idle threads per
1176 * active thread.
1177 */
1178 final int idlePerActive() {
1179 int pc = parallelism; // use parallelism, not rc
1180 int ac = runState; // no mask -- artificially boosts during shutdown
1181 // Use exact results for small values, saturate past 4
1182 return ((pc <= ac) ? 0 :
1183 (pc >>> 1 <= ac) ? 1 :
1184 (pc >>> 2 <= ac) ? 3 :
1185 pc >>> 3);
1186 }
1187
1188 // Public and protected methods
1189
1190 // Constructors
1191
1192 /**
1193 * Creates a {@code ForkJoinPool} with parallelism equal to {@link
1194 * java.lang.Runtime#availableProcessors}, using the {@linkplain
1195 * #defaultForkJoinWorkerThreadFactory default thread factory},
1196 * no UncaughtExceptionHandler, and non-async LIFO processing mode.
1197 *
1198 * @throws SecurityException if a security manager exists and
1199 * the caller is not permitted to modify threads
1200 * because it does not hold {@link
1201 * java.lang.RuntimePermission}{@code ("modifyThread")}
1202 */
1203 public ForkJoinPool() {
1204 this(Runtime.getRuntime().availableProcessors(),
1205 defaultForkJoinWorkerThreadFactory, null, false);
1206 }
1207
1208 /**
1209 * Creates a {@code ForkJoinPool} with the indicated parallelism
1210 * level, the {@linkplain
1211 * #defaultForkJoinWorkerThreadFactory default thread factory},
1212 * no UncaughtExceptionHandler, and non-async LIFO processing mode.
1213 *
1214 * @param parallelism the parallelism level
1215 * @throws IllegalArgumentException if parallelism less than or
1216 * equal to zero, or greater than implementation limit
1217 * @throws SecurityException if a security manager exists and
1218 * the caller is not permitted to modify threads
1219 * because it does not hold {@link
1220 * java.lang.RuntimePermission}{@code ("modifyThread")}
1221 */
1222 public ForkJoinPool(int parallelism) {
1223 this(parallelism, defaultForkJoinWorkerThreadFactory, null, false);
1224 }
1225
1226 /**
1227 * Creates a {@code ForkJoinPool} with the given parameters.
1228 *
1229 * @param parallelism the parallelism level. For default value,
1230 * use {@link java.lang.Runtime#availableProcessors}.
1231 * @param factory the factory for creating new threads. For default value,
1232 * use {@link #defaultForkJoinWorkerThreadFactory}.
1233 * @param handler the handler for internal worker threads that
1234 * terminate due to unrecoverable errors encountered while executing
1235 * tasks. For default value, use {@code null}.
1236 * @param asyncMode if true,
1237 * establishes local first-in-first-out scheduling mode for forked
1238 * tasks that are never joined. This mode may be more appropriate
1239 * than default locally stack-based mode in applications in which
1240 * worker threads only process event-style asynchronous tasks.
1241 * For default value, use {@code false}.
1242 * @throws IllegalArgumentException if parallelism less than or
1243 * equal to zero, or greater than implementation limit
1244 * @throws NullPointerException if the factory is null
1245 * @throws SecurityException if a security manager exists and
1246 * the caller is not permitted to modify threads
1247 * because it does not hold {@link
1248 * java.lang.RuntimePermission}{@code ("modifyThread")}
1249 */
1250 public ForkJoinPool(int parallelism,
1251 ForkJoinWorkerThreadFactory factory,
1252 Thread.UncaughtExceptionHandler handler,
1253 boolean asyncMode) {
1254 checkPermission();
1255 if (factory == null)
1256 throw new NullPointerException();
1257 if (parallelism <= 0 || parallelism > MAX_WORKERS)
1258 throw new IllegalArgumentException();
1259 this.parallelism = parallelism;
1260 this.factory = factory;
1261 this.ueh = handler;
1262 this.locallyFifo = asyncMode;
1263 int arraySize = initialArraySizeFor(parallelism);
1264 this.workers = new ForkJoinWorkerThread[arraySize];
1265 this.submissionQueue = new LinkedTransferQueue<ForkJoinTask<?>>();
1266 this.workerLock = new ReentrantLock();
1267 this.termination = new Phaser(1);
1268 this.poolNumber = poolNumberGenerator.incrementAndGet();
1269 }
1270
1271 /**
1272 * Returns initial power of two size for workers array.
1273 * @param pc the initial parallelism level
1274 */
1275 private static int initialArraySizeFor(int pc) {
1276 // If possible, initially allocate enough space for one spare
1277 int size = pc < MAX_WORKERS ? pc + 1 : MAX_WORKERS;
1278 // See Hackers Delight, sec 3.2. We know MAX_WORKERS < (1 >>> 16)
1279 size |= size >>> 1;
1280 size |= size >>> 2;
1281 size |= size >>> 4;
1282 size |= size >>> 8;
1283 return size + 1;
1284 }
1285
1286 // Execution methods
1287
1288 /**
1289 * Common code for execute, invoke and submit
1290 */
1291 private <T> void doSubmit(ForkJoinTask<T> task) {
1292 if (task == null)
1293 throw new NullPointerException();
1294 if (runState >= SHUTDOWN)
1295 throw new RejectedExecutionException();
1296 submissionQueue.offer(task);
1297 int c; // try to increment event count -- CAS failure OK
1298 UNSAFE.compareAndSwapInt(this, eventCountOffset, c = eventCount, c+1);
1299 helpMaintainParallelism(); // create, start, or resume some workers
1300 }
1301
1302 /**
1303 * Performs the given task, returning its result upon completion.
1304 *
1305 * @param task the task
1306 * @return the task's result
1307 * @throws NullPointerException if the task is null
1308 * @throws RejectedExecutionException if the task cannot be
1309 * scheduled for execution
1310 */
1311 public <T> T invoke(ForkJoinTask<T> task) {
1312 doSubmit(task);
1313 return task.join();
1314 }
1315
1316 /**
1317 * Arranges for (asynchronous) execution of the given task.
1318 *
1319 * @param task the task
1320 * @throws NullPointerException if the task is null
1321 * @throws RejectedExecutionException if the task cannot be
1322 * scheduled for execution
1323 */
1324 public void execute(ForkJoinTask<?> task) {
1325 doSubmit(task);
1326 }
1327
1328 // AbstractExecutorService methods
1329
1330 /**
1331 * @throws NullPointerException if the task is null
1332 * @throws RejectedExecutionException if the task cannot be
1333 * scheduled for execution
1334 */
1335 public void execute(Runnable task) {
1336 ForkJoinTask<?> job;
1337 if (task instanceof ForkJoinTask<?>) // avoid re-wrap
1338 job = (ForkJoinTask<?>) task;
1339 else
1340 job = ForkJoinTask.adapt(task, null);
1341 doSubmit(job);
1342 }
1343
1344 /**
1345 * Submits a ForkJoinTask for execution.
1346 *
1347 * @param task the task to submit
1348 * @return the task
1349 * @throws NullPointerException if the task is null
1350 * @throws RejectedExecutionException if the task cannot be
1351 * scheduled for execution
1352 */
1353 public <T> ForkJoinTask<T> submit(ForkJoinTask<T> task) {
1354 doSubmit(task);
1355 return task;
1356 }
1357
1358 /**
1359 * @throws NullPointerException if the task is null
1360 * @throws RejectedExecutionException if the task cannot be
1361 * scheduled for execution
1362 */
1363 public <T> ForkJoinTask<T> submit(Callable<T> task) {
1364 ForkJoinTask<T> job = ForkJoinTask.adapt(task);
1365 doSubmit(job);
1366 return job;
1367 }
1368
1369 /**
1370 * @throws NullPointerException if the task is null
1371 * @throws RejectedExecutionException if the task cannot be
1372 * scheduled for execution
1373 */
1374 public <T> ForkJoinTask<T> submit(Runnable task, T result) {
1375 ForkJoinTask<T> job = ForkJoinTask.adapt(task, result);
1376 doSubmit(job);
1377 return job;
1378 }
1379
1380 /**
1381 * @throws NullPointerException if the task is null
1382 * @throws RejectedExecutionException if the task cannot be
1383 * scheduled for execution
1384 */
1385 public ForkJoinTask<?> submit(Runnable task) {
1386 ForkJoinTask<?> job;
1387 if (task instanceof ForkJoinTask<?>) // avoid re-wrap
1388 job = (ForkJoinTask<?>) task;
1389 else
1390 job = ForkJoinTask.adapt(task, null);
1391 doSubmit(job);
1392 return job;
1393 }
1394
1395 /**
1396 * @throws NullPointerException {@inheritDoc}
1397 * @throws RejectedExecutionException {@inheritDoc}
1398 */
1399 public <T> List<Future<T>> invokeAll(Collection<? extends Callable<T>> tasks) {
1400 ArrayList<ForkJoinTask<T>> forkJoinTasks =
1401 new ArrayList<ForkJoinTask<T>>(tasks.size());
1402 for (Callable<T> task : tasks)
1403 forkJoinTasks.add(ForkJoinTask.adapt(task));
1404 invoke(new InvokeAll<T>(forkJoinTasks));
1405
1406 @SuppressWarnings({"unchecked", "rawtypes"})
1407 List<Future<T>> futures = (List<Future<T>>) (List) forkJoinTasks;
1408 return futures;
1409 }
1410
1411 static final class InvokeAll<T> extends RecursiveAction {
1412 final ArrayList<ForkJoinTask<T>> tasks;
1413 InvokeAll(ArrayList<ForkJoinTask<T>> tasks) { this.tasks = tasks; }
1414 public void compute() {
1415 try { invokeAll(tasks); }
1416 catch (Exception ignore) {}
1417 }
1418 private static final long serialVersionUID = -7914297376763021607L;
1419 }
1420
1421 /**
1422 * Returns the factory used for constructing new workers.
1423 *
1424 * @return the factory used for constructing new workers
1425 */
1426 public ForkJoinWorkerThreadFactory getFactory() {
1427 return factory;
1428 }
1429
1430 /**
1431 * Returns the handler for internal worker threads that terminate
1432 * due to unrecoverable errors encountered while executing tasks.
1433 *
1434 * @return the handler, or {@code null} if none
1435 */
1436 public Thread.UncaughtExceptionHandler getUncaughtExceptionHandler() {
1437 return ueh;
1438 }
1439
1440 /**
1441 * Returns the targeted parallelism level of this pool.
1442 *
1443 * @return the targeted parallelism level of this pool
1444 */
1445 public int getParallelism() {
1446 return parallelism;
1447 }
1448
1449 /**
1450 * Returns the number of worker threads that have started but not
1451 * yet terminated. The result returned by this method may differ
1452 * from {@link #getParallelism} when threads are created to
1453 * maintain parallelism when others are cooperatively blocked.
1454 *
1455 * @return the number of worker threads
1456 */
1457 public int getPoolSize() {
1458 return workerCounts >>> TOTAL_COUNT_SHIFT;
1459 }
1460
1461 /**
1462 * Returns {@code true} if this pool uses local first-in-first-out
1463 * scheduling mode for forked tasks that are never joined.
1464 *
1465 * @return {@code true} if this pool uses async mode
1466 */
1467 public boolean getAsyncMode() {
1468 return locallyFifo;
1469 }
1470
1471 /**
1472 * Returns an estimate of the number of worker threads that are
1473 * not blocked waiting to join tasks or for other managed
1474 * synchronization. This method may overestimate the
1475 * number of running threads.
1476 *
1477 * @return the number of worker threads
1478 */
1479 public int getRunningThreadCount() {
1480 return workerCounts & RUNNING_COUNT_MASK;
1481 }
1482
1483 /**
1484 * Returns an estimate of the number of threads that are currently
1485 * stealing or executing tasks. This method may overestimate the
1486 * number of active threads.
1487 *
1488 * @return the number of active threads
1489 */
1490 public int getActiveThreadCount() {
1491 return runState & ACTIVE_COUNT_MASK;
1492 }
1493
1494 /**
1495 * Returns {@code true} if all worker threads are currently idle.
1496 * An idle worker is one that cannot obtain a task to execute
1497 * because none are available to steal from other threads, and
1498 * there are no pending submissions to the pool. This method is
1499 * conservative; it might not return {@code true} immediately upon
1500 * idleness of all threads, but will eventually become true if
1501 * threads remain inactive.
1502 *
1503 * @return {@code true} if all threads are currently idle
1504 */
1505 public boolean isQuiescent() {
1506 return (runState & ACTIVE_COUNT_MASK) == 0;
1507 }
1508
1509 /**
1510 * Returns an estimate of the total number of tasks stolen from
1511 * one thread's work queue by another. The reported value
1512 * underestimates the actual total number of steals when the pool
1513 * is not quiescent. This value may be useful for monitoring and
1514 * tuning fork/join programs: in general, steal counts should be
1515 * high enough to keep threads busy, but low enough to avoid
1516 * overhead and contention across threads.
1517 *
1518 * @return the number of steals
1519 */
1520 public long getStealCount() {
1521 return stealCount;
1522 }
1523
1524 /**
1525 * Returns an estimate of the total number of tasks currently held
1526 * in queues by worker threads (but not including tasks submitted
1527 * to the pool that have not begun executing). This value is only
1528 * an approximation, obtained by iterating across all threads in
1529 * the pool. This method may be useful for tuning task
1530 * granularities.
1531 *
1532 * @return the number of queued tasks
1533 */
1534 public long getQueuedTaskCount() {
1535 long count = 0;
1536 for (ForkJoinWorkerThread w : workers)
1537 if (w != null)
1538 count += w.getQueueSize();
1539 return count;
1540 }
1541
1542 /**
1543 * Returns an estimate of the number of tasks submitted to this
1544 * pool that have not yet begun executing. This method takes time
1545 * proportional to the number of submissions.
1546 *
1547 * @return the number of queued submissions
1548 */
1549 public int getQueuedSubmissionCount() {
1550 return submissionQueue.size();
1551 }
1552
1553 /**
1554 * Returns {@code true} if there are any tasks submitted to this
1555 * pool that have not yet begun executing.
1556 *
1557 * @return {@code true} if there are any queued submissions
1558 */
1559 public boolean hasQueuedSubmissions() {
1560 return !submissionQueue.isEmpty();
1561 }
1562
1563 /**
1564 * Removes and returns the next unexecuted submission if one is
1565 * available. This method may be useful in extensions to this
1566 * class that re-assign work in systems with multiple pools.
1567 *
1568 * @return the next submission, or {@code null} if none
1569 */
1570 protected ForkJoinTask<?> pollSubmission() {
1571 return submissionQueue.poll();
1572 }
1573
1574 /**
1575 * Removes all available unexecuted submitted and forked tasks
1576 * from scheduling queues and adds them to the given collection,
1577 * without altering their execution status. These may include
1578 * artificially generated or wrapped tasks. This method is
1579 * designed to be invoked only when the pool is known to be
1580 * quiescent. Invocations at other times may not remove all
1581 * tasks. A failure encountered while attempting to add elements
1582 * to collection {@code c} may result in elements being in
1583 * neither, either or both collections when the associated
1584 * exception is thrown. The behavior of this operation is
1585 * undefined if the specified collection is modified while the
1586 * operation is in progress.
1587 *
1588 * @param c the collection to transfer elements into
1589 * @return the number of elements transferred
1590 */
1591 protected int drainTasksTo(Collection<? super ForkJoinTask<?>> c) {
1592 int count = submissionQueue.drainTo(c);
1593 for (ForkJoinWorkerThread w : workers)
1594 if (w != null)
1595 count += w.drainTasksTo(c);
1596 return count;
1597 }
1598
1599 /**
1600 * Returns a string identifying this pool, as well as its state,
1601 * including indications of run state, parallelism level, and
1602 * worker and task counts.
1603 *
1604 * @return a string identifying this pool, as well as its state
1605 */
1606 public String toString() {
1607 long st = getStealCount();
1608 long qt = getQueuedTaskCount();
1609 long qs = getQueuedSubmissionCount();
1610 int wc = workerCounts;
1611 int tc = wc >>> TOTAL_COUNT_SHIFT;
1612 int rc = wc & RUNNING_COUNT_MASK;
1613 int pc = parallelism;
1614 int rs = runState;
1615 int ac = rs & ACTIVE_COUNT_MASK;
1616 return super.toString() +
1617 "[" + runLevelToString(rs) +
1618 ", parallelism = " + pc +
1619 ", size = " + tc +
1620 ", active = " + ac +
1621 ", running = " + rc +
1622 ", steals = " + st +
1623 ", tasks = " + qt +
1624 ", submissions = " + qs +
1625 "]";
1626 }
1627
1628 private static String runLevelToString(int s) {
1629 return ((s & TERMINATED) != 0 ? "Terminated" :
1630 ((s & TERMINATING) != 0 ? "Terminating" :
1631 ((s & SHUTDOWN) != 0 ? "Shutting down" :
1632 "Running")));
1633 }
1634
1635 /**
1636 * Initiates an orderly shutdown in which previously submitted
1637 * tasks are executed, but no new tasks will be accepted.
1638 * Invocation has no additional effect if already shut down.
1639 * Tasks that are in the process of being submitted concurrently
1640 * during the course of this method may or may not be rejected.
1641 *
1642 * @throws SecurityException if a security manager exists and
1643 * the caller is not permitted to modify threads
1644 * because it does not hold {@link
1645 * java.lang.RuntimePermission}{@code ("modifyThread")}
1646 */
1647 public void shutdown() {
1648 checkPermission();
1649 advanceRunLevel(SHUTDOWN);
1650 tryTerminate(false);
1651 }
1652
1653 /**
1654 * Attempts to cancel and/or stop all tasks, and reject all
1655 * subsequently submitted tasks. Tasks that are in the process of
1656 * being submitted or executed concurrently during the course of
1657 * this method may or may not be rejected. This method cancels
1658 * both existing and unexecuted tasks, in order to permit
1659 * termination in the presence of task dependencies. So the method
1660 * always returns an empty list (unlike the case for some other
1661 * Executors).
1662 *
1663 * @return an empty list
1664 * @throws SecurityException if a security manager exists and
1665 * the caller is not permitted to modify threads
1666 * because it does not hold {@link
1667 * java.lang.RuntimePermission}{@code ("modifyThread")}
1668 */
1669 public List<Runnable> shutdownNow() {
1670 checkPermission();
1671 tryTerminate(true);
1672 return Collections.emptyList();
1673 }
1674
1675 /**
1676 * Returns {@code true} if all tasks have completed following shut down.
1677 *
1678 * @return {@code true} if all tasks have completed following shut down
1679 */
1680 public boolean isTerminated() {
1681 return runState >= TERMINATED;
1682 }
1683
1684 /**
1685 * Returns {@code true} if the process of termination has
1686 * commenced but not yet completed. This method may be useful for
1687 * debugging. A return of {@code true} reported a sufficient
1688 * period after shutdown may indicate that submitted tasks have
1689 * ignored or suppressed interruption, causing this executor not
1690 * to properly terminate.
1691 *
1692 * @return {@code true} if terminating but not yet terminated
1693 */
1694 public boolean isTerminating() {
1695 return (runState & (TERMINATING|TERMINATED)) == TERMINATING;
1696 }
1697
1698 /**
1699 * Returns {@code true} if this pool has been shut down.
1700 *
1701 * @return {@code true} if this pool has been shut down
1702 */
1703 public boolean isShutdown() {
1704 return runState >= SHUTDOWN;
1705 }
1706
1707 /**
1708 * Blocks until all tasks have completed execution after a shutdown
1709 * request, or the timeout occurs, or the current thread is
1710 * interrupted, whichever happens first.
1711 *
1712 * @param timeout the maximum time to wait
1713 * @param unit the time unit of the timeout argument
1714 * @return {@code true} if this executor terminated and
1715 * {@code false} if the timeout elapsed before termination
1716 * @throws InterruptedException if interrupted while waiting
1717 */
1718 public boolean awaitTermination(long timeout, TimeUnit unit)
1719 throws InterruptedException {
1720 try {
1721 return termination.awaitAdvanceInterruptibly(0, timeout, unit) > 0;
1722 } catch (TimeoutException ex) {
1723 return false;
1724 }
1725 }
1726
1727 /**
1728 * Interface for extending managed parallelism for tasks running
1729 * in {@link ForkJoinPool}s.
1730 *
1731 * <p>A {@code ManagedBlocker} provides two methods. Method
1732 * {@code isReleasable} must return {@code true} if blocking is
1733 * not necessary. Method {@code block} blocks the current thread
1734 * if necessary (perhaps internally invoking {@code isReleasable}
1735 * before actually blocking). The unusual methods in this API
1736 * accommodate synchronizers that may, but don't usually, block
1737 * for long periods. Similarly, they allow more efficient internal
1738 * handling of cases in which additional workers may be, but
1739 * usually are not, needed to ensure sufficient parallelism.
1740 * Toward this end, implementations of method {@code isReleasable}
1741 * must be amenable to repeated invocation.
1742 *
1743 * <p>For example, here is a ManagedBlocker based on a
1744 * ReentrantLock:
1745 * <pre> {@code
1746 * class ManagedLocker implements ManagedBlocker {
1747 * final ReentrantLock lock;
1748 * boolean hasLock = false;
1749 * ManagedLocker(ReentrantLock lock) { this.lock = lock; }
1750 * public boolean block() {
1751 * if (!hasLock)
1752 * lock.lock();
1753 * return true;
1754 * }
1755 * public boolean isReleasable() {
1756 * return hasLock || (hasLock = lock.tryLock());
1757 * }
1758 * }}</pre>
1759 *
1760 * <p>Here is a class that possibly blocks waiting for an
1761 * item on a given queue:
1762 * <pre> {@code
1763 * class QueueTaker<E> implements ManagedBlocker {
1764 * final BlockingQueue<E> queue;
1765 * volatile E item = null;
1766 * QueueTaker(BlockingQueue<E> q) { this.queue = q; }
1767 * public boolean block() throws InterruptedException {
1768 * if (item == null)
1769 * item = queue.take();
1770 * return true;
1771 * }
1772 * public boolean isReleasable() {
1773 * return item != null || (item = queue.poll()) != null;
1774 * }
1775 * public E getItem() { // call after pool.managedBlock completes
1776 * return item;
1777 * }
1778 * }}</pre>
1779 */
1780 public static interface ManagedBlocker {
1781 /**
1782 * Possibly blocks the current thread, for example waiting for
1783 * a lock or condition.
1784 *
1785 * @return {@code true} if no additional blocking is necessary
1786 * (i.e., if isReleasable would return true)
1787 * @throws InterruptedException if interrupted while waiting
1788 * (the method is not required to do so, but is allowed to)
1789 */
1790 boolean block() throws InterruptedException;
1791
1792 /**
1793 * Returns {@code true} if blocking is unnecessary.
1794 */
1795 boolean isReleasable();
1796 }
1797
1798 /**
1799 * Blocks in accord with the given blocker. If the current thread
1800 * is a {@link ForkJoinWorkerThread}, this method possibly
1801 * arranges for a spare thread to be activated if necessary to
1802 * ensure sufficient parallelism while the current thread is blocked.
1803 *
1804 * <p>If the caller is not a {@link ForkJoinTask}, this method is
1805 * behaviorally equivalent to
1806 * <pre> {@code
1807 * while (!blocker.isReleasable())
1808 * if (blocker.block())
1809 * return;
1810 * }</pre>
1811 *
1812 * If the caller is a {@code ForkJoinTask}, then the pool may
1813 * first be expanded to ensure parallelism, and later adjusted.
1814 *
1815 * @param blocker the blocker
1816 * @throws InterruptedException if blocker.block did so
1817 */
1818 public static void managedBlock(ManagedBlocker blocker)
1819 throws InterruptedException {
1820 Thread t = Thread.currentThread();
1821 if (t instanceof ForkJoinWorkerThread) {
1822 ForkJoinWorkerThread w = (ForkJoinWorkerThread) t;
1823 w.pool.awaitBlocker(blocker);
1824 }
1825 else {
1826 do {} while (!blocker.isReleasable() && !blocker.block());
1827 }
1828 }
1829
1830 // AbstractExecutorService overrides. These rely on undocumented
1831 // fact that ForkJoinTask.adapt returns ForkJoinTasks that also
1832 // implement RunnableFuture.
1833
1834 protected <T> RunnableFuture<T> newTaskFor(Runnable runnable, T value) {
1835 return (RunnableFuture<T>) ForkJoinTask.adapt(runnable, value);
1836 }
1837
1838 protected <T> RunnableFuture<T> newTaskFor(Callable<T> callable) {
1839 return (RunnableFuture<T>) ForkJoinTask.adapt(callable);
1840 }
1841
1842 // Unsafe mechanics
1843
1844 private static final sun.misc.Unsafe UNSAFE = sun.misc.Unsafe.getUnsafe();
1845 private static final long workerCountsOffset =
1846 objectFieldOffset("workerCounts", ForkJoinPool.class);
1847 private static final long runStateOffset =
1848 objectFieldOffset("runState", ForkJoinPool.class);
1849 private static final long eventCountOffset =
1850 objectFieldOffset("eventCount", ForkJoinPool.class);
1851 private static final long eventWaitersOffset =
1852 objectFieldOffset("eventWaiters", ForkJoinPool.class);
1853 private static final long stealCountOffset =
1854 objectFieldOffset("stealCount", ForkJoinPool.class);
1855 private static final long spareWaitersOffset =
1856 objectFieldOffset("spareWaiters", ForkJoinPool.class);
1857
1858 private static long objectFieldOffset(String field, Class<?> klazz) {
1859 try {
1860 return UNSAFE.objectFieldOffset(klazz.getDeclaredField(field));
1861 } catch (NoSuchFieldException e) {
1862 // Convert Exception to corresponding Error
1863 NoSuchFieldError error = new NoSuchFieldError(field);
1864 error.initCause(e);
1865 throw error;
1866 }
1867 }
1868 }