2010-09-18 19:35:02 -03:00
|
|
|
# Copyright 2009 Brian Quinlan. All Rights Reserved.
|
|
|
|
# Licensed to PSF under a Contributor Agreement.
|
|
|
|
|
|
|
|
"""Implements ThreadPoolExecutor."""
|
|
|
|
|
|
|
|
__author__ = 'Brian Quinlan (brian@sweetapp.com)'
|
|
|
|
|
|
|
|
import atexit
|
|
|
|
from concurrent.futures import _base
|
2017-06-22 03:41:13 -03:00
|
|
|
import itertools
|
2010-09-18 19:35:02 -03:00
|
|
|
import queue
|
|
|
|
import threading
|
|
|
|
import weakref
|
2014-09-02 14:39:18 -03:00
|
|
|
import os
|
2010-09-18 19:35:02 -03:00
|
|
|
|
|
|
|
# Workers are created as daemon threads. This is done to allow the interpreter
|
|
|
|
# to exit when there are still idle threads in a ThreadPoolExecutor's thread
|
|
|
|
# pool (i.e. shutdown() was not called). However, allowing workers to die with
|
|
|
|
# the interpreter has two undesirable properties:
|
2016-08-30 14:47:49 -03:00
|
|
|
# - The workers would still be running during interpreter shutdown,
|
2010-09-18 19:35:02 -03:00
|
|
|
# meaning that they would fail in unpredictable ways.
|
|
|
|
# - The workers could be killed while evaluating a work item, which could
|
|
|
|
# be bad if the callable being evaluated has external side-effects e.g.
|
|
|
|
# writing to a file.
|
|
|
|
#
|
|
|
|
# To work around this problem, an exit handler is installed which tells the
|
|
|
|
# workers to exit when their work queues are empty and then waits until the
|
|
|
|
# threads finish.
|
|
|
|
|
2011-03-26 15:29:44 -03:00
|
|
|
# Maps each worker thread to the work queue it reads from.  Entries are added
# when a worker is started and are read by the exit handler; the thread keys
# are held weakly.
_threads_queues = weakref.WeakKeyDictionary()
|
2010-09-18 19:35:02 -03:00
|
|
|
# Set to True by the exit handler; workers and submit() check it to detect
# that the interpreter is shutting down.
_shutdown = False
|
2019-06-28 15:54:52 -03:00
|
|
|
# Lock that ensures that new workers are not created while the interpreter is
|
|
|
|
# shutting down. Must be held while mutating _threads_queues and _shutdown.
|
|
|
|
_global_shutdown_lock = threading.Lock()
|
2010-09-18 19:35:02 -03:00
|
|
|
|
|
|
|
def _python_exit():
    """Exit handler: flag interpreter shutdown, then wake and join workers.

    The global flag is flipped while holding the global shutdown lock.  A
    snapshot of the registered (thread, queue) pairs is then taken, a None
    sentinel is pushed onto every queue, and finally every thread is joined.
    """
    global _shutdown
    with _global_shutdown_lock:
        _shutdown = True

    # Snapshot first: the registry holds its thread keys weakly, so iterate
    # over a list that keeps strong references for the duration.
    registered = list(_threads_queues.items())
    for _, pending in registered:
        pending.put(None)
    for thread, _ in registered:
        thread.join()
|
2010-09-18 19:35:02 -03:00
|
|
|
|
|
|
|
# Run _python_exit() at interpreter exit so worker threads are woken and
# joined before the interpreter goes away.
atexit.register(_python_exit)
|
|
|
|
|
2017-11-04 07:05:49 -03:00
|
|
|
|
2010-09-18 19:35:02 -03:00
|
|
|
class _WorkItem:
    """Pairs a future with the call whose outcome the future will carry."""

    def __init__(self, future, fn, args, kwargs):
        self.future, self.fn = future, fn
        self.args, self.kwargs = args, kwargs

    def run(self):
        """Invoke the stored call and publish its outcome on the future.

        Nothing is executed when the future reports that it must not run
        (set_running_or_notify_cancel() returned a false value).  Any
        exception raised by the call, including BaseException subclasses,
        is stored on the future instead of propagating.
        """
        if self.future.set_running_or_notify_cancel():
            try:
                outcome = self.fn(*self.args, **self.kwargs)
            except BaseException as exc:
                self.future.set_exception(exc)
                # Break a reference cycle with the exception 'exc'
                self = None
            else:
                self.future.set_result(outcome)
|
|
|
|
|
2017-11-04 07:05:49 -03:00
|
|
|
|
|
|
|
def _worker(executor_reference, work_queue, initializer, initargs):
    """Body of a pool thread: run the initializer, then serve the queue.

    Args:
        executor_reference: Callable returning the owning executor, or None
            once the executor is gone.
        work_queue: Queue yielding work items, or None as a wake-up sentinel.
        initializer: Optional callable invoked once before serving work.
        initargs: Arguments unpacked into the initializer call.
    """
    if initializer is not None:
        try:
            initializer(*initargs)
        except BaseException:
            _base.LOGGER.critical('Exception in initializer:', exc_info=True)
            owner = executor_reference()
            if owner is not None:
                owner._initializer_failed()
            return

    try:
        while True:
            task = work_queue.get(block=True)

            if task is None:
                # Woken by a sentinel.  Exit if:
                #   - The interpreter is shutting down OR
                #   - The executor that owns the worker has been collected OR
                #   - The executor that owns the worker has been shutdown.
                owner = executor_reference()
                if _shutdown or owner is None or owner._shutdown:
                    # Flag the executor as shutting down as early as possible
                    # if it is not gc-ed yet.
                    if owner is not None:
                        owner._shutdown = True
                    # Pass the sentinel on so the other workers wake up too.
                    work_queue.put(None)
                    return
                del owner
                continue

            task.run()
            # Delete references to object. See issue16284
            del task

            # Attempt to increment the idle count.
            owner = executor_reference()
            if owner is not None:
                owner._idle_semaphore.release()
            del owner
    except BaseException:
        _base.LOGGER.critical('Exception in worker', exc_info=True)
|
|
|
|
|
2017-11-04 07:05:49 -03:00
|
|
|
|
|
|
|
class BrokenThreadPool(_base.BrokenExecutor):
    """Error for a pool whose worker-thread initializer failed.

    Raised when a worker thread in a ThreadPoolExecutor failed initializing.
    """
|
|
|
|
|
|
|
|
|
2010-09-18 19:35:02 -03:00
|
|
|
class ThreadPoolExecutor(_base.Executor):
    """Executor that runs submitted callables on a pool of worker threads."""

    # Source of unique numbers for default thread name prefixes, used when
    # thread_name_prefix is not supplied.
    _counter = itertools.count().__next__

    def __init__(self, max_workers=None, thread_name_prefix='',
                 initializer=None, initargs=()):
        """Set up a new, empty ThreadPoolExecutor.

        Args:
            max_workers: Upper bound on the number of worker threads used to
                execute the submitted calls.  Defaults to
                min(32, cpu_count + 4) when omitted.
            thread_name_prefix: Optional prefix for the names of the worker
                threads.
            initializer: Optional callable run at the start of each worker
                thread.
            initargs: Tuple of arguments passed to the initializer.

        Raises:
            ValueError: If max_workers is not greater than 0.
            TypeError: If initializer is given but is not callable.
        """
        if max_workers is None:
            # The pool serves both CPU bound tasks that release the GIL and
            # I/O bound tasks, so allow a few more threads than cores, capped
            # at 32 to avoid surprising resource use on many-core machines.
            core_count = os.cpu_count() or 1
            max_workers = min(32, core_count + 4)
        if max_workers <= 0:
            raise ValueError("max_workers must be greater than 0")

        if not (initializer is None or callable(initializer)):
            raise TypeError("initializer must be a callable")

        if not thread_name_prefix:
            thread_name_prefix = "ThreadPoolExecutor-%d" % self._counter()

        self._max_workers = max_workers
        self._initializer = initializer
        self._initargs = initargs
        self._thread_name_prefix = thread_name_prefix
        self._work_queue = queue.SimpleQueue()
        self._idle_semaphore = threading.Semaphore(0)
        self._threads = set()
        self._broken = False
        self._shutdown = False
        self._shutdown_lock = threading.Lock()

    def submit(self, fn, /, *args, **kwargs):
        with self._shutdown_lock, _global_shutdown_lock:
            # Refuse new work once the pool is broken or anything is
            # shutting down.
            if self._broken:
                raise BrokenThreadPool(self._broken)
            if self._shutdown:
                raise RuntimeError('cannot schedule new futures after shutdown')
            if _shutdown:
                raise RuntimeError('cannot schedule new futures after '
                                   'interpreter shutdown')

            future = _base.Future()
            item = _WorkItem(future, fn, args, kwargs)

            # Queue the item first, then make sure a thread can pick it up.
            self._work_queue.put(item)
            self._adjust_thread_count()
            return future
    submit.__doc__ = _base.Executor.submit.__doc__

    def _adjust_thread_count(self):
        """Start one more worker unless an idle one exists or the cap is hit."""
        # If idle threads are available, don't spin up new threads.
        if self._idle_semaphore.acquire(timeout=0):
            return

        pool_size = len(self._threads)
        if not (pool_size < self._max_workers):
            return

        # When the executor gets lost, the weakref callback will wake up
        # the worker threads.
        def weakref_cb(_, q=self._work_queue):
            q.put(None)

        worker_args = (weakref.ref(self, weakref_cb),
                       self._work_queue,
                       self._initializer,
                       self._initargs)
        worker_name = '%s_%d' % (self._thread_name_prefix or self, pool_size)
        worker = threading.Thread(name=worker_name, target=_worker,
                                  args=worker_args, daemon=True)
        worker.start()
        self._threads.add(worker)
        _threads_queues[worker] = self._work_queue

    def _initializer_failed(self):
        """Mark the pool broken and fail every work item still queued."""
        with self._shutdown_lock:
            self._broken = ('A thread initializer failed, the thread pool '
                            'is not usable anymore')
            # Drain the work queue and mark pending futures as failed.
            backlog = self._work_queue
            while True:
                try:
                    pending = backlog.get_nowait()
                except queue.Empty:
                    break
                if pending is None:
                    # Wake-up sentinel, not a work item.
                    continue
                pending.future.set_exception(BrokenThreadPool(self._broken))

    def shutdown(self, wait=True):
        with self._shutdown_lock:
            self._shutdown = True
            # Wake a worker blocked on the queue so it can notice the flag.
            self._work_queue.put(None)
        if not wait:
            return
        for worker in self._threads:
            worker.join()
    shutdown.__doc__ = _base.Executor.shutdown.__doc__
|